You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@ctakes.apache.org by se...@apache.org on 2019/06/03 20:03:13 UTC
svn commit: r1860575 -
/ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java
Author: seanfinan
Date: Mon Jun 3 20:03:13 2019
New Revision: 1860575
URL: http://svn.apache.org/viewvc?rev=1860575&view=rev
Log:
Allow tabs or spaces between consecutive end-of-line characters when detecting a paragraph separation. Useful for notes with indentation.
Modified:
ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java
Modified: ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java
URL: http://svn.apache.org/viewvc/ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java?rev=1860575&r1=1860574&r2=1860575&view=diff
==============================================================================
--- ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java (original)
+++ ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java Mon Jun 3 20:03:13 2019
@@ -49,7 +49,8 @@ final public class ParagraphAnnotator ex
)
private String _paragraphTypesPath;
- static private final String DEFAULT_PARAGRAPH = "Default Paragraph||(?:(?:\\r?\\n){2,})";
+ // Allows spaces or tabs within the double-eol paragraph separator.
+ static private final String DEFAULT_PARAGRAPH = "Default Paragraph||(?:(?:[\\t ]*\\r?\\n){2,})";
/**
* Holder for section type as defined in the user's specification bsv file