You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@ctakes.apache.org by se...@apache.org on 2019/06/03 20:03:13 UTC

svn commit: r1860575 - /ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java

Author: seanfinan
Date: Mon Jun  3 20:03:13 2019
New Revision: 1860575

URL: http://svn.apache.org/viewvc?rev=1860575&view=rev
Log:
Allow tabs or spaces between eol characters when detecting paragraph separation.  Useful for notes with indentation.

Modified:
    ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java

Modified: ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java
URL: http://svn.apache.org/viewvc/ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java?rev=1860575&r1=1860574&r2=1860575&view=diff
==============================================================================
--- ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java (original)
+++ ctakes/trunk/ctakes-core/src/main/java/org/apache/ctakes/core/ae/ParagraphAnnotator.java Mon Jun  3 20:03:13 2019
@@ -49,7 +49,8 @@ final public class ParagraphAnnotator ex
    )
    private String _paragraphTypesPath;
 
-   static private final String DEFAULT_PARAGRAPH = "Default Paragraph||(?:(?:\\r?\\n){2,})";
+   // Paragraph separator: two or more eols, each optionally preceded by spaces or tabs.
+   static private final String DEFAULT_PARAGRAPH = "Default Paragraph||(?:(?:[\\t ]*\\r?\\n){2,})";
 
    /**
     * Holder for section type as defined in the user's specification bsv file