You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@uima.apache.org by cw...@apache.org on 2018/05/01 17:27:36 UTC
svn commit: r1830695 - in
/uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources:
GovernmentOfficialRecognizer_RegEx_TAE.xml
SimpleNameRecognizer_RegEx_TAE.xml TestAAE.xml
Author: cwiklik
Date: Tue May 1 17:27:36 2018
New Revision: 1830695
URL: http://svn.apache.org/viewvc?rev=1830695&view=rev
Log:
UIMA-5756 Added example AE descriptors
Added:
uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/GovernmentOfficialRecognizer_RegEx_TAE.xml
uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/SimpleNameRecognizer_RegEx_TAE.xml
uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/TestAAE.xml
Added: uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/GovernmentOfficialRecognizer_RegEx_TAE.xml
URL: http://svn.apache.org/viewvc/uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/GovernmentOfficialRecognizer_RegEx_TAE.xml?rev=1830695&view=auto
==============================================================================
--- uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/GovernmentOfficialRecognizer_RegEx_TAE.xml (added)
+++ uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/GovernmentOfficialRecognizer_RegEx_TAE.xml Tue May 1 17:27:36 2018
@@ -0,0 +1,141 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+ <!--
+ ***************************************************************
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ ***************************************************************
+ -->
+
+<analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
+ <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
+ <primitive>true</primitive>
+ <annotatorImplementationName>org.apache.uima.examples.cas.RegExAnnotator</annotatorImplementationName>
+ <analysisEngineMetaData>
+ <name>Government Title Recognizer using Regular Expressions</name>
+ <description>Detects Government Titles using regular expressions.</description>
+ <configurationParameters>
+ <configurationParameter>
+ <name>Patterns</name>
+ <description>Regular expression patterns to match. The language is that supported by Java 1.4.</description>
+ <type>String</type>
+ <multiValued>true</multiValued>
+ <mandatory>false</mandatory>
+ </configurationParameter>
+ <configurationParameter>
+ <name>TypeNames</name>
+ <description>Names of CAS Types to create for the patterns found. The indexes of this array
+correspond to the indexes of the Patterns or PatternFiles arrays. If a match is found for
+Patterns[i], it will result in an annotation of type
+TypeNames[i].</description>
+ <type>String</type>
+ <multiValued>true</multiValued>
+ <mandatory>false</mandatory>
+ </configurationParameter>
+ <configurationParameter>
+ <name>ContainingAnnotationTypes</name>
+ <description>Names of CAS Input Types within which annotations should be created.</description>
+ <type>String</type>
+ <multiValued>true</multiValued>
+ <mandatory>false</mandatory>
+ </configurationParameter>
+ <configurationParameter>
+ <name>AnnotateEntireContainingAnnotation</name>
+ <description>When the ContainingAnnotationTypes parameter is specified, a value of true for this
+ parameter will cause the entire containing annotation to be used as the span of the new
+ annotation, rather than just the span of the regular expression match. This can be used
+ to "classify" previously created annotations according to whether or not they contain
+ text matching a regular expression.</description>
+ <type>Boolean</type>
+ <multiValued>false</multiValued>
+ <mandatory>false</mandatory>
+ </configurationParameter>
+ </configurationParameters>
+ <configurationParameterSettings>
+ <nameValuePair>
+ <name>ContainingAnnotationTypes</name>
+ <value>
+ <array>
+ <string>example.Name</string>
+ </array>
+ </value>
+ </nameValuePair>
+ <nameValuePair>
+ <name>AnnotateEntireContainingAnnotation</name>
+ <value>
+ <boolean>true</boolean>
+ </value>
+ </nameValuePair>
+ </configurationParameterSettings>
+ <typeSystemDescription>
+ <types>
+ <typeDescription>
+ <name>example.Name</name>
+ <description>A proper name.</description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ </typeDescription>
+ <typeDescription>
+ <name>example.GovernmentOfficial</name>
+ <description>A government official.</description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ </typeDescription>
+ </types>
+ </typeSystemDescription>
+ <capabilities>
+ <capability>
+ <inputs>
+ <type>example.Name</type>
+ </inputs>
+ <outputs>
+ <type>example.GovernmentOfficial</type>
+ </outputs>
+ <languagesSupported>
+ <language>en</language>
+ </languagesSupported>
+ </capability>
+ </capabilities>
+ <operationalProperties>
+ <modifiesCas>true</modifiesCas>
+ <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
+ <outputsNewCASes>false</outputsNewCASes>
+ </operationalProperties>
+ </analysisEngineMetaData>
+ <externalResourceDependencies>
+ <externalResourceDependency>
+ <key>PatternFile</key>
+ <description>An optional external file containing regular expressions to match. File format is as follows: - Lines starting with # or whitespace are ignored - Lines starting with % indicate an annotation type. - All other lines are regular expressions. The language is that supported by Java 1.4. If a regular expression is matched, it will be annotated with the last annotation type declared (the nearest preceding line starting with %).</description>
+ <optional>true</optional>
+ </externalResourceDependency>
+ </externalResourceDependencies>
+ <resourceManagerConfiguration>
+ <externalResources>
+ <externalResource>
+ <name>GovernmentTitlePatterns</name>
+ <description>File containing Regular Expressions for the CAS type example.GovernmentOfficial.</description>
+ <fileResourceSpecifier>
+ <fileUrl>file:GovernmentTitlePatterns.dat</fileUrl>
+ </fileResourceSpecifier>
+ </externalResource>
+ </externalResources>
+ <externalResourceBindings>
+ <externalResourceBinding>
+ <key>PatternFile</key>
+ <resourceName>GovernmentTitlePatterns</resourceName>
+ </externalResourceBinding>
+ </externalResourceBindings>
+ </resourceManagerConfiguration>
+</analysisEngineDescription>
Added: uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/SimpleNameRecognizer_RegEx_TAE.xml
URL: http://svn.apache.org/viewvc/uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/SimpleNameRecognizer_RegEx_TAE.xml?rev=1830695&view=auto
==============================================================================
--- uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/SimpleNameRecognizer_RegEx_TAE.xml (added)
+++ uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/SimpleNameRecognizer_RegEx_TAE.xml Tue May 1 17:27:36 2018
@@ -0,0 +1,110 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+ <!--
+ ***************************************************************
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ ***************************************************************
+ -->
+
+<analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
+ <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
+ <primitive>true</primitive>
+ <annotatorImplementationName>org.apache.uima.examples.cas.RegExAnnotator</annotatorImplementationName>
+ <analysisEngineMetaData>
+ <name>Simple Name Recognizer using Regular Expressions</name>
+ <description>Detects Names using a simple regular expression.</description>
+ <configurationParameters>
+ <configurationParameter>
+ <name>Patterns</name>
+ <description>Regular expression patterns to match. The language is that supported by Java 1.4.</description>
+ <type>String</type>
+ <multiValued>true</multiValued>
+ <mandatory>false</mandatory>
+ </configurationParameter>
+ <configurationParameter>
+ <name>TypeNames</name>
+ <description>Names of CAS Types to create for the patterns found. The indexes of this array
+correspond to the indexes of the Patterns or PatternFiles arrays. If a match is found for
+Patterns[i], it will result in an annotation of type
+TypeNames[i].</description>
+ <type>String</type>
+ <multiValued>true</multiValued>
+ <mandatory>false</mandatory>
+ </configurationParameter>
+ <configurationParameter>
+ <name>ContainingAnnotationTypes</name>
+ <description>Names of CAS Input Types within which annotations should be created.</description>
+ <type>String</type>
+ <multiValued>true</multiValued>
+ <mandatory>false</mandatory>
+ </configurationParameter>
+ <configurationParameter>
+ <name>AnnotateEntireContainingAnnotation</name>
+ <description>When the ContainingAnnotationTypes parameter is specified, a value of true for this
+ parameter will cause the entire containing annotation to be used as the span of the new
+ annotation, rather than just the span of the regular expression match. This can be used
+ to "classify" previously created annotations according to whether or not they contain
+ text matching a regular expression.</description>
+ <type>Boolean</type>
+ <multiValued>false</multiValued>
+ <mandatory>false</mandatory>
+ </configurationParameter>
+ </configurationParameters>
+ <configurationParameterSettings>
+ <nameValuePair>
+ <name>Patterns</name>
+ <value>
+ <array>
+ <string>\p{Upper}\w*(\.?\s\p{Upper}\w*)+</string>
+ </array>
+ </value>
+ </nameValuePair>
+ <nameValuePair>
+ <name>TypeNames</name>
+ <value>
+ <array>
+ <string>example.Name</string>
+ </array>
+ </value>
+ </nameValuePair>
+ </configurationParameterSettings>
+ <typeSystemDescription>
+ <types>
+ <typeDescription>
+ <name>example.Name</name>
+ <description>A proper name.</description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ </typeDescription>
+ </types>
+ </typeSystemDescription>
+ <capabilities>
+ <capability>
+ <inputs/>
+ <outputs>
+ <type>example.Name</type>
+ </outputs>
+ <languagesSupported/>
+ </capability>
+ </capabilities>
+ <operationalProperties>
+ <modifiesCas>true</modifiesCas>
+ <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
+ <outputsNewCASes>false</outputsNewCASes>
+ </operationalProperties>
+ </analysisEngineMetaData>
+</analysisEngineDescription>
Added: uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/TestAAE.xml
URL: http://svn.apache.org/viewvc/uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/TestAAE.xml?rev=1830695&view=auto
==============================================================================
--- uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/TestAAE.xml (added)
+++ uima/uima-ducc/trunk/uima-ducc-pullservice/src/test/resources/TestAAE.xml Tue May 1 17:27:36 2018
@@ -0,0 +1,75 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+ <!--
+ ***************************************************************
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ ***************************************************************
+ -->
+
+<analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
+ <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
+ <primitive>false</primitive>
+ <delegateAnalysisEngineSpecifiers>
+ <delegateAnalysisEngine key="GovernmentOfficialRecognizer">
+ <import location="GovernmentOfficialRecognizer_RegEx_TAE.xml"/>
+ </delegateAnalysisEngine>
+ <delegateAnalysisEngine key="NameRecognizer">
+ <import location="SimpleNameRecognizer_RegEx_TAE.xml"/>
+ </delegateAnalysisEngine>
+ </delegateAnalysisEngineSpecifiers>
+ <analysisEngineMetaData>
+ <name>Aggregate TAE - Name Recognizer and Government Official Recognizer</name>
+ <description>Detects Names and Government Officials</description>
+ <version></version>
+ <vendor></vendor>
+ <configurationParameters/>
+ <configurationParameterSettings/>
+ <flowConstraints>
+ <fixedFlow>
+ <node>NameRecognizer</node>
+ <node>GovernmentOfficialRecognizer</node>
+ </fixedFlow>
+ </flowConstraints>
+ <capabilities>
+ <capability>
+ <inputs/>
+ <outputs>
+ <type>example.GovernmentOfficial</type>
+ </outputs>
+ <languagesSupported>
+ <language>en</language>
+ </languagesSupported>
+ </capability>
+ <capability>
+ <inputs/>
+ <outputs>
+ <type>example.Name</type>
+ </outputs>
+ <languagesSupported>
+ <language>x-unspecified</language>
+ </languagesSupported>
+ </capability>
+ </capabilities>
+
+<operationalProperties>
+ <modifiesCas>true</modifiesCas>
+ <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
+ <outputsNewCASes>false</outputsNewCASes>
+ </operationalProperties>
+ </analysisEngineMetaData>
+</analysisEngineDescription>
\ No newline at end of file