You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@uima.apache.org by cw...@apache.org on 2018/05/01 17:27:36 UTC

svn commit: r1830695 - in /uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources: GovernmentOfficialRecognizer_RegEx_TAE.xml SimpleNameRecognizer_RegEx_TAE.xml TestAAE.xml

Author: cwiklik
Date: Tue May  1 17:27:36 2018
New Revision: 1830695

URL: http://svn.apache.org/viewvc?rev=1830695&view=rev
Log:
UIMA-5756 Added example AE descriptors

Added:
    uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/GovernmentOfficialRecognizer_RegEx_TAE.xml
    uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/SimpleNameRecognizer_RegEx_TAE.xml
    uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/TestAAE.xml

Added: uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/GovernmentOfficialRecognizer_RegEx_TAE.xml
URL: http://svn.apache.org/viewvc/uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/GovernmentOfficialRecognizer_RegEx_TAE.xml?rev=1830695&view=auto
==============================================================================
--- uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/GovernmentOfficialRecognizer_RegEx_TAE.xml (added)
+++ uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/GovernmentOfficialRecognizer_RegEx_TAE.xml Tue May  1 17:27:36 2018
@@ -0,0 +1,141 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+	<!--
+	 ***************************************************************
+	 * Licensed to the Apache Software Foundation (ASF) under one
+	 * or more contributor license agreements.  See the NOTICE file
+	 * distributed with this work for additional information
+	 * regarding copyright ownership.  The ASF licenses this file
+	 * to you under the Apache License, Version 2.0 (the
+	 * "License"); you may not use this file except in compliance
+	 * with the License.  You may obtain a copy of the License at
+         *
+	 *   http://www.apache.org/licenses/LICENSE-2.0
+	 * 
+	 * Unless required by applicable law or agreed to in writing,
+	 * software distributed under the License is distributed on an
+	 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+	 * KIND, either express or implied.  See the License for the
+	 * specific language governing permissions and limitations
+	 * under the License.
+	 ***************************************************************
+   -->
+<!-- Primitive AE descriptor (RegExAnnotator): searches inside example.Name annotations using the patterns from the PatternFile resource (GovernmentTitlePatterns.dat); since AnnotateEntireContainingAnnotation is true, a match annotates the whole containing span. Declared output type: example.GovernmentOfficial. -->
+<analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
+  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
+  <primitive>true</primitive>
+  <annotatorImplementationName>org.apache.uima.examples.cas.RegExAnnotator</annotatorImplementationName>
+  <analysisEngineMetaData>
+    <name>Government Title Recognizer using Regular Expressions</name>
+    <description>Detects Government Titles using regular expressions.</description>
+    <configurationParameters>
+      <configurationParameter>
+        <name>Patterns</name>
+        <description>Regular expression patterns to match.  The language is that supported by Java 1.4.</description>
+        <type>String</type>
+        <multiValued>true</multiValued>
+        <mandatory>false</mandatory>
+      </configurationParameter>
+      <configurationParameter>
+        <name>TypeNames</name>
+        <description>Names of CAS Types to create for the patterns found.  The indexes of this array
+correspond to the indexes of the Patterns or PatternFiles arrays.  If a match is found for
+Patterns[i], it will result in an annotation of type
+TypeNames[i].</description>
+        <type>String</type>
+        <multiValued>true</multiValued>
+        <mandatory>false</mandatory>
+      </configurationParameter>
+      <configurationParameter>
+        <name>ContainingAnnotationTypes</name>
+        <description>Names of CAS Input Types within which annotations should be created.</description>
+        <type>String</type>
+        <multiValued>true</multiValued>
+        <mandatory>false</mandatory>
+      </configurationParameter>
+      <configurationParameter>
+        <name>AnnotateEntireContainingAnnotation</name>
+        <description>When the ContainingAnnotationTypes parameter is specified, a value of true for this
+	parameter will cause the entire containing annotation to be used as the span of the new
+	annotation, rather than just the span of the regular expression match.  This can be used
+	to "classify" previously created annotations according to whether or not they contain
+	text matching a regular expression.</description>
+        <type>Boolean</type>
+        <multiValued>false</multiValued>
+        <mandatory>false</mandatory>
+      </configurationParameter>
+    </configurationParameters>
+    <configurationParameterSettings>
+      <nameValuePair>
+        <name>ContainingAnnotationTypes</name>
+        <value>
+          <array>
+            <string>example.Name</string>
+          </array>
+        </value>
+      </nameValuePair>
+      <nameValuePair>
+        <name>AnnotateEntireContainingAnnotation</name>
+        <value>
+          <boolean>true</boolean>
+        </value>
+      </nameValuePair>
+    </configurationParameterSettings>
+    <typeSystemDescription>
+      <types>
+        <typeDescription>
+          <name>example.Name</name>
+          <description>A proper name.</description>
+          <supertypeName>uima.tcas.Annotation</supertypeName>
+        </typeDescription>
+        <typeDescription>
+          <name>example.GovernmentOfficial</name>
+          <description>A government official.</description>
+          <supertypeName>uima.tcas.Annotation</supertypeName>
+        </typeDescription>
+      </types>
+    </typeSystemDescription>
+    <capabilities>
+      <capability>
+        <inputs>
+          <type>example.Name</type>
+        </inputs>
+        <outputs>
+          <type>example.GovernmentOfficial</type>
+        </outputs>
+        <languagesSupported>
+          <language>en</language>
+        </languagesSupported>
+      </capability>
+    </capabilities>
+    <operationalProperties>
+      <modifiesCas>true</modifiesCas>
+      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
+      <outputsNewCASes>false</outputsNewCASes>
+    </operationalProperties>
+  </analysisEngineMetaData>
+  <externalResourceDependencies>
+    <externalResourceDependency>
+      <key>PatternFile</key>
+      <description>An optional external file containing regular expressions to match. File format is as follows: - Lines starting with # or whitespace are ignored - Lines starting with % indicate an annotation type. - All other lines are regular expressions. The language is that supported by Java 1.4. If a regular expression is matched, it will be annotated with the last annotation type declared (the nearest preceding line starting with %).</description>
+      <optional>true</optional>
+    </externalResourceDependency>
+  </externalResourceDependencies>
+  <resourceManagerConfiguration>
+    <externalResources>
+      <externalResource>
+        <name>GovernmentTitlePatterns</name>
+        <description>File containing Regular Expressions for the CAS type example.GovernmentOfficial.</description>
+        <fileResourceSpecifier>
+          <fileUrl>file:GovernmentTitlePatterns.dat</fileUrl>
+        </fileResourceSpecifier>
+      </externalResource>
+    </externalResources>
+    <externalResourceBindings>
+      <externalResourceBinding>
+        <key>PatternFile</key>
+        <resourceName>GovernmentTitlePatterns</resourceName>
+      </externalResourceBinding>
+    </externalResourceBindings>
+  </resourceManagerConfiguration>
+</analysisEngineDescription>

Added: uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/SimpleNameRecognizer_RegEx_TAE.xml
URL: http://svn.apache.org/viewvc/uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/SimpleNameRecognizer_RegEx_TAE.xml?rev=1830695&view=auto
==============================================================================
--- uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/SimpleNameRecognizer_RegEx_TAE.xml (added)
+++ uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/SimpleNameRecognizer_RegEx_TAE.xml Tue May  1 17:27:36 2018
@@ -0,0 +1,110 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+	<!--
+	 ***************************************************************
+	 * Licensed to the Apache Software Foundation (ASF) under one
+	 * or more contributor license agreements.  See the NOTICE file
+	 * distributed with this work for additional information
+	 * regarding copyright ownership.  The ASF licenses this file
+	 * to you under the Apache License, Version 2.0 (the
+	 * "License"); you may not use this file except in compliance
+	 * with the License.  You may obtain a copy of the License at
+         *
+	 *   http://www.apache.org/licenses/LICENSE-2.0
+	 * 
+	 * Unless required by applicable law or agreed to in writing,
+	 * software distributed under the License is distributed on an
+	 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+	 * KIND, either express or implied.  See the License for the
+	 * specific language governing permissions and limitations
+	 * under the License.
+	 ***************************************************************
+   -->
+<!-- Primitive AE descriptor (RegExAnnotator): annotates text matching the single configured pattern (two or more words that each start with an upper-case letter, e.g. "John Q. Public") as example.Name. -->
+<analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
+  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
+  <primitive>true</primitive>
+  <annotatorImplementationName>org.apache.uima.examples.cas.RegExAnnotator</annotatorImplementationName>
+  <analysisEngineMetaData>
+    <name>Simple Name Recognizer using Regular Expressions</name>
+    <description>Detects Names using a simple regular expression.</description>
+    <configurationParameters>
+      <configurationParameter>
+        <name>Patterns</name>
+        <description>Regular expression patterns to match.  The language is that supported by Java 1.4.</description>
+        <type>String</type>
+        <multiValued>true</multiValued>
+        <mandatory>false</mandatory>
+      </configurationParameter>
+      <configurationParameter>
+        <name>TypeNames</name>
+        <description>Names of CAS Types to create for the patterns found.  The indexes of this array
+correspond to the indexes of the Patterns or PatternFiles arrays.  If a match is found for
+Patterns[i], it will result in an annotation of type
+TypeNames[i].</description>
+        <type>String</type>
+        <multiValued>true</multiValued>
+        <mandatory>false</mandatory>
+      </configurationParameter>
+      <configurationParameter>
+        <name>ContainingAnnotationTypes</name>
+        <description>Names of CAS Input Types within which annotations should be created.</description>
+        <type>String</type>
+        <multiValued>true</multiValued>
+        <mandatory>false</mandatory>
+      </configurationParameter>
+      <configurationParameter>
+        <name>AnnotateEntireContainingAnnotation</name>
+        <description>When the ContainingAnnotationTypes parameter is specified, a value of true for this
+	parameter will cause the entire containing annotation to be used as the span of the new
+	annotation, rather than just the span of the regular expression match.  This can be used
+	to "classify" previously created annotations according to whether or not they contain
+	text matching a regular expression.</description>
+        <type>Boolean</type>
+        <multiValued>false</multiValued>
+        <mandatory>false</mandatory>
+      </configurationParameter>
+    </configurationParameters>
+    <configurationParameterSettings>
+      <nameValuePair>
+        <name>Patterns</name>
+        <value>
+          <array>
+            <string>\p{Upper}\w*(\.?\s\p{Upper}\w*)+</string>
+          </array>
+        </value>
+      </nameValuePair>
+      <nameValuePair>
+        <name>TypeNames</name>
+        <value>
+          <array>
+            <string>example.Name</string>
+          </array>
+        </value>
+      </nameValuePair>
+    </configurationParameterSettings>
+    <typeSystemDescription>
+      <types>
+        <typeDescription>
+          <name>example.Name</name>
+          <description>A proper name.</description>
+          <supertypeName>uima.tcas.Annotation</supertypeName>
+        </typeDescription>
+      </types>
+    </typeSystemDescription>
+    <capabilities>
+      <capability>
+        <inputs/>
+        <outputs>
+          <type>example.Name</type>
+        </outputs>
+        <languagesSupported/>
+      </capability>
+    </capabilities>
+    <operationalProperties>
+      <modifiesCas>true</modifiesCas>
+      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
+      <outputsNewCASes>false</outputsNewCASes>
+    </operationalProperties>
+  </analysisEngineMetaData>
+</analysisEngineDescription>

Added: uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/TestAAE.xml
URL: http://svn.apache.org/viewvc/uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/TestAAE.xml?rev=1830695&view=auto
==============================================================================
--- uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/TestAAE.xml (added)
+++ uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/TestAAE.xml Tue May  1 17:27:36 2018
@@ -0,0 +1,75 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+        <!--                                                                                                                                                                                 
+         ***************************************************************                                                                                                                     
+         * Licensed to the Apache Software Foundation (ASF) under one                                                                                                                        
+         * or more contributor license agreements.  See the NOTICE file                                                                                                                      
+         * distributed with this work for additional information                                                                                                                             
+         * regarding copyright ownership.  The ASF licenses this file                                                                                                                        
+         * to you under the Apache License, Version 2.0 (the                                                                                                                                 
+         * "License"); you may not use this file except in compliance                                                                                                                        
+         * with the License.  You may obtain a copy of the License at                                                                                                                        
+         *                                                                                                                                                                                   
+         *   http://www.apache.org/licenses/LICENSE-2.0                                                                                                                                      
+         *                                                                                                                                                                                   
+         * Unless required by applicable law or agreed to in writing,                                                                                                                        
+         * software distributed under the License is distributed on an                                                                                                                       
+         * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY                                                                                                                            
+         * KIND, either express or implied.  See the License for the                                                                                                                         
+         * specific language governing permissions and limitations                                                                                                                           
+         * under the License.                                                                                                                                                                
+         ***************************************************************                                                                                                                     
+   -->
+<!-- Aggregate AE descriptor: runs NameRecognizer (SimpleNameRecognizer_RegEx_TAE.xml) and then GovernmentOfficialRecognizer (GovernmentOfficialRecognizer_RegEx_TAE.xml) in a fixed flow. -->
+<analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
+  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
+  <primitive>false</primitive>
+  <delegateAnalysisEngineSpecifiers>
+    <delegateAnalysisEngine key="GovernmentOfficialRecognizer">
+      <import location="GovernmentOfficialRecognizer_RegEx_TAE.xml"/>
+    </delegateAnalysisEngine>
+    <delegateAnalysisEngine key="NameRecognizer">
+      <import location="SimpleNameRecognizer_RegEx_TAE.xml"/>
+    </delegateAnalysisEngine>
+  </delegateAnalysisEngineSpecifiers>
+  <analysisEngineMetaData>
+    <name>Aggregate TAE - Name Recognizer and Government Official Recognizer</name>
+    <description>Detects Names and Government Officials</description>
+    <version></version>
+    <vendor></vendor>
+    <configurationParameters/>
+    <configurationParameterSettings/>
+    <flowConstraints>
+      <fixedFlow>
+        <node>NameRecognizer</node>
+        <node>GovernmentOfficialRecognizer</node>
+      </fixedFlow>
+    </flowConstraints>
+    <capabilities>
+      <capability>
+        <inputs/>
+        <outputs>
+          <type>example.GovernmentOfficial</type>
+        </outputs>
+        <languagesSupported>
+          <language>en</language>
+        </languagesSupported>
+      </capability>
+      <capability>
+        <inputs/>
+        <outputs>
+          <type>example.Name</type>
+        </outputs>
+        <languagesSupported>
+          <language>x-unspecified</language>
+        </languagesSupported>
+      </capability>
+    </capabilities>
+
+    <operationalProperties>
+      <modifiesCas>true</modifiesCas>
+      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
+      <outputsNewCASes>false</outputsNewCASes>
+    </operationalProperties>
+  </analysisEngineMetaData>
+</analysisEngineDescription>
\ No newline at end of file