You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@ctakes.apache.org by se...@apache.org on 2014/11/04 19:03:26 UTC

svn commit: r1636667 - /ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml

Author: seanfinan
Date: Tue Nov  4 18:03:26 2014
New Revision: 1636667

URL: http://svn.apache.org/r1636667
Log:
Swapped out the current dictionary-lookup for dictionary-lookup-fast.
Commented out the LookupWindow* entries, as dictionary-lookup-fast uses Sentence as its lookup window by default.

Modified:
    ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml

Modified: ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml
URL: http://svn.apache.org/viewvc/ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml?rev=1636667&r1=1636666&r2=1636667&view=diff
==============================================================================
--- ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml (original)
+++ ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml Tue Nov  4 18:03:26 2014
@@ -33,7 +33,7 @@
       <import location="../../../ctakes-context-tokenizer/desc/analysis_engine/ContextDependentTokenizerAnnotator.xml"/>
     </delegateAnalysisEngine>
     <delegateAnalysisEngine key="DictionaryLookupAnnotatorDB">
-      <import location="../../../ctakes-dictionary-lookup/desc/analysis_engine/DictionaryLookupAnnotatorUMLS.xml"/>
+       <import location="../../../ctakes-dictionary-lookup-fast/desc/analysis_engine/UmlsLookupAnnotator.xml"/>
     </delegateAnalysisEngine>
     <delegateAnalysisEngine key="StatusAnnotator">
       <import location="../../../ctakes-ne-contexts/desc/StatusAnnotator.xml"/>
@@ -47,9 +47,24 @@
     <delegateAnalysisEngine key="SentenceDetectorAnnotator">
       <import location="../../../ctakes-core/desc/analysis_engine/SentenceDetectorAnnotator.xml"/>
     </delegateAnalysisEngine>
-    <delegateAnalysisEngine key="LookupWindowAnnotator">
-      <import location="LookupWindowAnnotator.xml"/>
-    </delegateAnalysisEngine>
+     <!-- By default, the dictionary lookup window is Sentence.
+          The change was made in 3.2.1 because experiments showed that many terms were missed when relying upon the
+          accuracy of LookupWindowAnnotator to correctly identify all present full noun phrases.
+          Instead, reliance is now upon the fact that most terms in the dictionary itself are (or fit in) noun phrases.
+          To revert to LookupWindowAnnotation:
+            1.  Uncomment the following lines to load the LookupWindowAnnotator.
+            2.  Uncomment the LookupWindowAnnotator line in <fixedFlow>.
+            3.  Uncomment the LookupWindowAnnotation line in <capability> <outputs> <type>.
+            4.  In ctakes-dictionary-lookup-fast/desc/analysis_engine/UmlsLookupAnnotator.xml,
+                switch the value of the <nameValuePair> windowAnnotations;
+                the LookupWindowAnnotation value is still there, just commented out.
+            5.  Also uncomment <capability> <inputs> <type> ... LookupWindowAnnotation in UmlsLookupAnnotator.xml.
+          The AdjustNounPhrase* annotators have been left in the flow in case another module needs them.
+          I leave it to somebody with more applicable knowledge to remove them from the flow.
+     -->
+    <!--<delegateAnalysisEngine key="LookupWindowAnnotator">-->
+      <!--<import location="LookupWindowAnnotator.xml"/>-->
+    <!--</delegateAnalysisEngine>-->
     <delegateAnalysisEngine key="AdjustNounPhraseToIncludeFollowingNP">
       <import location="../../../ctakes-chunker/desc/AdjustNounPhraseToIncludeFollowingNP.xml"/>
     </delegateAnalysisEngine>
@@ -128,7 +143,7 @@ and requires an UMLS license.  Please up
         <node>Chunker</node>
         <node>AdjustNounPhraseToIncludeFollowingNP</node>
         <node>AdjustNounPhraseToIncludeFollowingPPNP</node>
-        <node>LookupWindowAnnotator</node>
+        <!--<node>LookupWindowAnnotator</node>-->
         <node>DictionaryLookupAnnotatorDB</node>
         <node>DependencyParser</node>
 		<node>SemanticRoleLabeler</node>        
@@ -182,7 +197,7 @@ and requires an UMLS license.  Please up
           <type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.NumToken</type>
           <type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.</type>
           <type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.textsem.MeasurementAnnotation</type>
-          <type allAnnotatorFeatures="true">edu.mayo.bmi.uima.lookup.type.LookupWindowAnnotation</type>
+          <!--<type allAnnotatorFeatures="true">edu.mayo.bmi.uima.lookup.type.LookupWindowAnnotation</type>-->
           <type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.Lemma</type>
           <type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.LST</type>
           <type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.INTJ</type>