You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@ctakes.apache.org by se...@apache.org on 2014/11/04 19:03:26 UTC
svn commit: r1636667 -
/ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml
Author: seanfinan
Date: Tue Nov 4 18:03:26 2014
New Revision: 1636667
URL: http://svn.apache.org/r1636667
Log:
Swapped out current dictionary-lookup for dictionary-lookup-fast.
commented out LookupWindow** as the dictionary-lookup-fast uses Sentence by default.
Modified:
ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml
Modified: ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml
URL: http://svn.apache.org/viewvc/ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml?rev=1636667&r1=1636666&r2=1636667&view=diff
==============================================================================
--- ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml (original)
+++ ctakes/trunk/ctakes-clinical-pipeline/desc/analysis_engine/AggregatePlaintextUMLSProcessor.xml Tue Nov 4 18:03:26 2014
@@ -33,7 +33,7 @@
<import location="../../../ctakes-context-tokenizer/desc/analysis_engine/ContextDependentTokenizerAnnotator.xml"/>
</delegateAnalysisEngine>
<delegateAnalysisEngine key="DictionaryLookupAnnotatorDB">
- <import location="../../../ctakes-dictionary-lookup/desc/analysis_engine/DictionaryLookupAnnotatorUMLS.xml"/>
+ <import location="../../../ctakes-dictionary-lookup-fast/desc/analysis_engine/UmlsLookupAnnotator.xml"/>
</delegateAnalysisEngine>
<delegateAnalysisEngine key="StatusAnnotator">
<import location="../../../ctakes-ne-contexts/desc/StatusAnnotator.xml"/>
@@ -47,9 +47,24 @@
<delegateAnalysisEngine key="SentenceDetectorAnnotator">
<import location="../../../ctakes-core/desc/analysis_engine/SentenceDetectorAnnotator.xml"/>
</delegateAnalysisEngine>
- <delegateAnalysisEngine key="LookupWindowAnnotator">
- <import location="LookupWindowAnnotator.xml"/>
- </delegateAnalysisEngine>
+ <!-- By default, the dictionary lookup window is Sentence.
+ The change was made in 3.2.1 because experiments showed that many terms were missed when relying upon the
+ accuracy of LookupWindowAnnotator to correctly identify all present full noun phrases.
+ Instead, reliance is now upon the fact that most terms in the dictionary itself are (or fit in) noun phrases.
+ To revert to LookupWindowAnnotation:
+ 1. uncomment the following lines to load the LookupWindowAnnotator,
+ 2. uncomment the LookupWindowAnnotator line in <fixedFlow>,
+ 3. uncomment the LookupWindowAnnotation line in <capability> <outputs> <type>,
+ 4. in ctakes-dictionary-lookup-fast .. /desc/analysis_engine/UmlsLookupAnnotator.xml
+ switch the value for <nameValuePair> windowAnnotations.
+ LookupWindowAnnotation is still there, just commented out.
+ 5. also uncomment <capability> <inputs> <type> ... LookupWindowAnnotation in UmlsLookupAnnotator.xml
+ The AdjustNounPhrase*** annotators have been left in case another module needs them.
+ I leave it to somebody with more applicable knowledge to remove them from the flow.
+ -->
+ <!--<delegateAnalysisEngine key="LookupWindowAnnotator">-->
+ <!--<import location="LookupWindowAnnotator.xml"/>-->
+ <!--</delegateAnalysisEngine>-->
<delegateAnalysisEngine key="AdjustNounPhraseToIncludeFollowingNP">
<import location="../../../ctakes-chunker/desc/AdjustNounPhraseToIncludeFollowingNP.xml"/>
</delegateAnalysisEngine>
@@ -128,7 +143,7 @@ and requires an UMLS license. Please up
<node>Chunker</node>
<node>AdjustNounPhraseToIncludeFollowingNP</node>
<node>AdjustNounPhraseToIncludeFollowingPPNP</node>
- <node>LookupWindowAnnotator</node>
+ <!--<node>LookupWindowAnnotator</node>-->
<node>DictionaryLookupAnnotatorDB</node>
<node>DependencyParser</node>
<node>SemanticRoleLabeler</node>
@@ -182,7 +197,7 @@ and requires an UMLS license. Please up
<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.NumToken</type>
<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.</type>
<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.textsem.MeasurementAnnotation</type>
- <type allAnnotatorFeatures="true">edu.mayo.bmi.uima.lookup.type.LookupWindowAnnotation</type>
+ <!--<type allAnnotatorFeatures="true">edu.mayo.bmi.uima.lookup.type.LookupWindowAnnotation</type>-->
<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.Lemma</type>
<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.LST</type>
<type allAnnotatorFeatures="true">org.apache.ctakes.typesystem.type.syntax.INTJ</type>