You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@ctakes.apache.org by dl...@apache.org on 2015/09/09 23:12:16 UTC

svn commit: r1702112 - in /ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes: bootstrap/NarrativeContainers.java index/SearchUtility.java pipelines/BasicPipeline.java

Author: dligach
Date: Wed Sep  9 21:12:16 2015
New Revision: 1702112

URL: http://svn.apache.org/r1702112
Log:
Now looking for events only within sentence boundaries: the nearest event mention must begin inside the sentence that contains the anchor word.

Modified:
    ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/bootstrap/NarrativeContainers.java
    ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/index/SearchUtility.java
    ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/pipelines/BasicPipeline.java

Modified: ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/bootstrap/NarrativeContainers.java
URL: http://svn.apache.org/viewvc/ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/bootstrap/NarrativeContainers.java?rev=1702112&r1=1702111&r2=1702112&view=diff
==============================================================================
--- ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/bootstrap/NarrativeContainers.java (original)
+++ ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/bootstrap/NarrativeContainers.java Wed Sep  9 21:12:16 2015
@@ -69,13 +69,15 @@ public class NarrativeContainers {
     
     @Override
     public void process(JCas jCas) throws AnalysisEngineProcessException {
-
+      
       for(Sentence sentence : JCasUtil.select(jCas, Sentence.class)) {
         for(WordToken word : JCasUtil.selectCovered(jCas, WordToken.class, sentence)) {
           if(word.getCoveredText().equals(anchor)) {
-            EventMention nearestEvent = getNearestEventMention(jCas, word);
+            EventMention nearestEvent = getNearestEventMention(jCas, word, sentence);
             if(nearestEvent != null) {
+              System.out.println(sentence.getCoveredText());
               System.out.println(nearestEvent.getCoveredText());
+              System.out.println();
             }
           } 
         }
@@ -86,7 +88,7 @@ public class NarrativeContainers {
      * Find nearest event mention on the right of a word token. 
      * Must be within allowable distance. Return null if none found.
      */
-    private static EventMention getNearestEventMention(JCas jCas, WordToken word) {
+    private static EventMention getNearestEventMention(JCas jCas, WordToken word, Sentence sentence) {
 
       List<EventMention> eventMentions = JCasUtil.selectFollowing(jCas, EventMention.class, word, 1);
       if(eventMentions.size() < 1) {
@@ -94,6 +96,9 @@ public class NarrativeContainers {
       }
 
       EventMention nearestEventMention = eventMentions.get(0);
+      if((nearestEventMention.getBegin() < sentence.getBegin()) || (nearestEventMention.getBegin() > sentence.getEnd())) {
+        return null;
+      }
       int distance = JCasUtil.selectBetween(jCas, WordToken.class, word, nearestEventMention).size();
       if(distance > maxDistance) {
         return null;

Modified: ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/index/SearchUtility.java
URL: http://svn.apache.org/viewvc/ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/index/SearchUtility.java?rev=1702112&r1=1702111&r2=1702112&view=diff
==============================================================================
--- ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/index/SearchUtility.java (original)
+++ ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/index/SearchUtility.java Wed Sep  9 21:12:16 2015
@@ -17,7 +17,7 @@ import org.apache.lucene.store.FSDirecto
 
 public class SearchUtility {
   
-  public static final boolean printEntireDocument = false;
+  public static final boolean printEntireDocument = true;
   public static final int contextWindowInCharacters = 30;
   
   public static void main(String[] args) throws IOException {

Modified: ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/pipelines/BasicPipeline.java
URL: http://svn.apache.org/viewvc/ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/pipelines/BasicPipeline.java?rev=1702112&r1=1702111&r2=1702112&view=diff
==============================================================================
--- ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/pipelines/BasicPipeline.java (original)
+++ ctakes/sandbox/ctakes-wsd/src/main/java/org/apache/ctakes/pipelines/BasicPipeline.java Wed Sep  9 21:12:16 2015
@@ -58,8 +58,8 @@ import com.google.common.io.CharStreams;
 
 public class BasicPipeline {
 
-  public static File inputDirectory = new File("/Users/dima/Boston/Data/DeepPhe/Text/");
-  public static String outputDirectory = "/Users/dima/Boston/Data/DeepPhe/Xmi/";
+  public static File inputDirectory = new File("/Users/dima/Boston/Out/Text/");
+  public static String outputDirectory = "/Users/dima/Boston/Out/Xmi/";
 
   public static void main(String[] args) throws Exception {