You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@ctakes.apache.org by cl...@apache.org on 2014/04/22 17:15:28 UTC

svn commit: r1589163 - in /ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature: CheckSpecialWordRelationExtractor.java NearbyVerbTenseRelationExtractor.java SectionHeaderRelationExtractor.java

Author: clin
Date: Tue Apr 22 15:15:27 2014
New Revision: 1589163

URL: http://svn.apache.org/r1589163
Log:
added three more feature extractors for event-time relation discovery.

Added:
    ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/CheckSpecialWordRelationExtractor.java   (with props)
    ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/NearbyVerbTenseRelationExtractor.java   (with props)
    ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/SectionHeaderRelationExtractor.java   (with props)

Added: ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/CheckSpecialWordRelationExtractor.java
URL: http://svn.apache.org/viewvc/ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/CheckSpecialWordRelationExtractor.java?rev=1589163&view=auto
==============================================================================
--- ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/CheckSpecialWordRelationExtractor.java (added)
+++ ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/CheckSpecialWordRelationExtractor.java Tue Apr 22 15:15:27 2014
@@ -0,0 +1,64 @@
+package org.apache.ctakes.temporal.ae.feature;
+
+import java.util.ArrayList;
+import java.util.Arrays;
+import java.util.Collection;
+import java.util.List;
+import java.util.Map;
+
+import org.apache.ctakes.relationextractor.ae.features.RelationFeaturesExtractor;
+import org.apache.ctakes.typesystem.type.syntax.WordToken;
+import org.apache.ctakes.typesystem.type.textsem.EventMention;
+import org.apache.ctakes.typesystem.type.textsem.IdentifiedAnnotation;
+import org.apache.ctakes.typesystem.type.textspan.Sentence;
+import org.apache.uima.analysis_engine.AnalysisEngineProcessException;
+import org.apache.uima.jcas.JCas;
+import org.cleartk.classifier.Feature;
+import org.uimafit.util.JCasUtil;
+
+public class CheckSpecialWordRelationExtractor implements RelationFeaturesExtractor{
+	
+	final static List<String> specialWd = Arrays.asList("before","prior","previous","previously","ago","soon","earlier","early","after","later","subsequent","follow","following","followed","post","since","back","start","started","by","past","starting");
+
+	@Override
+	public List<Feature> extract(JCas jcas, IdentifiedAnnotation arg1,
+			IdentifiedAnnotation arg2) throws AnalysisEngineProcessException {
+		List<Feature> feats = new ArrayList<Feature>();
+
+		//find event
+		EventMention event = null;
+		if(arg1 instanceof EventMention){
+			event = (EventMention) arg1;
+		}else if(arg1 instanceof EventMention){
+			event = (EventMention) arg2;
+		}else{
+			return feats;
+		}
+
+		//1 get covering sentence:
+		Map<EventMention, Collection<Sentence>> coveringMap =
+				JCasUtil.indexCovering(jcas, EventMention.class, Sentence.class);
+		Collection<Sentence> sentList = coveringMap.get(event);
+
+		//2 get Verb Tense
+		if (sentList != null && !sentList.isEmpty()){
+			for(Sentence sent : sentList) {
+				for ( WordToken wt : JCasUtil.selectCovered(jcas, WordToken.class, sent)) {
+					if (wt != null){
+						String wdtext = wt.getCoveredText().toLowerCase();
+						if (specialWd.contains(wdtext)){
+							Feature feature = new Feature("SpecialWd", wdtext);
+							feats.add(feature);
+						}
+					}
+				}
+				
+				//logger.info("found nearby verb's pos tag: "+ verbTP);
+			}
+
+		}
+		return feats;
+	}
+
+
+}

Propchange: ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/CheckSpecialWordRelationExtractor.java
------------------------------------------------------------------------------
    svn:mime-type = text/plain

Added: ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/NearbyVerbTenseRelationExtractor.java
URL: http://svn.apache.org/viewvc/ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/NearbyVerbTenseRelationExtractor.java?rev=1589163&view=auto
==============================================================================
--- ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/NearbyVerbTenseRelationExtractor.java (added)
+++ ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/NearbyVerbTenseRelationExtractor.java Tue Apr 22 15:15:27 2014
@@ -0,0 +1,62 @@
+package org.apache.ctakes.temporal.ae.feature;
+
+import java.util.ArrayList;
+import java.util.Collection;
+import java.util.List;
+import java.util.Map;
+
+import org.apache.ctakes.relationextractor.ae.features.RelationFeaturesExtractor;
+import org.apache.ctakes.typesystem.type.syntax.WordToken;
+import org.apache.ctakes.typesystem.type.textsem.EventMention;
+import org.apache.ctakes.typesystem.type.textsem.IdentifiedAnnotation;
+import org.apache.ctakes.typesystem.type.textspan.Sentence;
+import org.apache.uima.analysis_engine.AnalysisEngineProcessException;
+import org.apache.uima.jcas.JCas;
+import org.cleartk.classifier.Feature;
+import org.uimafit.util.JCasUtil;
+
+public class NearbyVerbTenseRelationExtractor implements RelationFeaturesExtractor{
+
+	@Override
+	public List<Feature> extract(JCas jcas, IdentifiedAnnotation arg1,
+			IdentifiedAnnotation arg2) throws AnalysisEngineProcessException {
+		List<Feature> feats = new ArrayList<Feature>();
+
+		//find event
+		EventMention event = null;
+		if(arg1 instanceof EventMention){
+			event = (EventMention) arg1;
+		}else if(arg1 instanceof EventMention){
+			event = (EventMention) arg2;
+		}else{
+			return feats;
+		}
+
+		//1 get covering sentence:
+		Map<EventMention, Collection<Sentence>> coveringMap =
+				JCasUtil.indexCovering(jcas, EventMention.class, Sentence.class);
+		Collection<Sentence> sentList = coveringMap.get(event);
+
+		//2 get Verb Tense
+		if (sentList != null && !sentList.isEmpty()){
+			for(Sentence sent : sentList) {
+				String verbTP ="";
+				for ( WordToken wt : JCasUtil.selectCovered(jcas, WordToken.class, sent)) {
+					if (wt != null){
+						String pos = wt.getPartOfSpeech();
+						if (pos.startsWith("VB")){
+							verbTP = verbTP + "_" + pos;
+						}
+					}
+				}
+				Feature feature = new Feature("VerbTenseFeature", verbTP);
+				feats.add(feature);
+				//logger.info("found nearby verb's pos tag: "+ verbTP);
+			}
+
+		}
+		return feats;
+	}
+
+
+}

Propchange: ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/NearbyVerbTenseRelationExtractor.java
------------------------------------------------------------------------------
    svn:mime-type = text/plain

Added: ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/SectionHeaderRelationExtractor.java
URL: http://svn.apache.org/viewvc/ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/SectionHeaderRelationExtractor.java?rev=1589163&view=auto
==============================================================================
--- ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/SectionHeaderRelationExtractor.java (added)
+++ ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/SectionHeaderRelationExtractor.java Tue Apr 22 15:15:27 2014
@@ -0,0 +1,52 @@
+package org.apache.ctakes.temporal.ae.feature;
+
+import java.util.ArrayList;
+import java.util.Collection;
+import java.util.List;
+import java.util.Map;
+
+import org.apache.ctakes.relationextractor.ae.features.RelationFeaturesExtractor;
+import org.apache.ctakes.typesystem.type.textsem.EventMention;
+import org.apache.ctakes.typesystem.type.textsem.IdentifiedAnnotation;
+import org.apache.ctakes.typesystem.type.textspan.Segment;
+import org.apache.uima.analysis_engine.AnalysisEngineProcessException;
+import org.apache.uima.jcas.JCas;
+import org.cleartk.classifier.Feature;
+import org.uimafit.util.JCasUtil;
+
+public class SectionHeaderRelationExtractor implements RelationFeaturesExtractor{
+
+	@Override
+	public List<Feature> extract(JCas jcas, IdentifiedAnnotation arg1,
+			IdentifiedAnnotation arg2) throws AnalysisEngineProcessException {
+		List<Feature> feats = new ArrayList<Feature>();
+
+		//find event
+		EventMention event = null;
+		if(arg1 instanceof EventMention){
+			event = (EventMention) arg1;
+		}else if(arg1 instanceof EventMention){
+			event = (EventMention) arg2;
+		}else{
+			return feats;
+		}
+
+		//get covering segment set:
+		Map<EventMention, Collection<Segment>> coveringMap =
+				JCasUtil.indexCovering(jcas, EventMention.class, Segment.class);
+		Collection<Segment> segList = coveringMap.get(event);
+
+		//get segment id
+		if (segList != null && !segList.isEmpty()){
+			for(Segment seg : segList) {
+				String segname = seg.getId();
+				Feature feature = new Feature("SegmentID", segname);
+				feats.add(feature);
+			}
+
+		}
+		return feats;
+	}
+
+
+}

Propchange: ctakes/trunk/ctakes-temporal/src/main/java/org/apache/ctakes/temporal/ae/feature/SectionHeaderRelationExtractor.java
------------------------------------------------------------------------------
    svn:mime-type = text/plain