You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@uima.apache.org by ea...@apache.org on 2007/02/03 17:47:15 UTC

svn commit: r503239 - in /incubator/uima/uimacpp/trunk/examples/descriptors: ./ DaveDetector.xml SimpleTextSegmenter.xml SofaDataAnnotator.xml SofaExampleAnnotator.xml XCasWriterCasConsumer.xml

Author: eae
Date: Sat Feb  3 08:47:14 2007
New Revision: 503239

URL: http://svn.apache.org/viewvc?view=rev&rev=503239
Log:
Initial entry

Added:
    incubator/uima/uimacpp/trunk/examples/descriptors/
    incubator/uima/uimacpp/trunk/examples/descriptors/DaveDetector.xml
    incubator/uima/uimacpp/trunk/examples/descriptors/SimpleTextSegmenter.xml
    incubator/uima/uimacpp/trunk/examples/descriptors/SofaDataAnnotator.xml
    incubator/uima/uimacpp/trunk/examples/descriptors/SofaExampleAnnotator.xml
    incubator/uima/uimacpp/trunk/examples/descriptors/XCasWriterCasConsumer.xml

Added: incubator/uima/uimacpp/trunk/examples/descriptors/DaveDetector.xml
URL: http://svn.apache.org/viewvc/incubator/uima/uimacpp/trunk/examples/descriptors/DaveDetector.xml?view=auto&rev=503239
==============================================================================
--- incubator/uima/uimacpp/trunk/examples/descriptors/DaveDetector.xml (added)
+++ incubator/uima/uimacpp/trunk/examples/descriptors/DaveDetector.xml Sat Feb  3 08:47:14 2007
@@ -0,0 +1,61 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<taeDescription xmlns="http://uima.apache.org/resourceSpecifier">
+  <frameworkImplementation>org.apache.uima.cpp</frameworkImplementation>
+  <primitive>true</primitive>
+  <annotatorImplementationName>DaveDetector</annotatorImplementationName>
+
+  <!-- Descriptive metadata, parameters, type system and capabilities of the engine. -->
+  <analysisEngineMetaData>
+    <name>Dave Detector</name>
+    <description>Detects Daves in text, and annotates them.</description>
+    <version>1.0</version>
+    <vendor>IBM</vendor>
+
+    <!-- Declared configuration parameters: one mandatory, single-valued string. -->
+    <configurationParameters>
+      <configurationParameter>
+        <name>DaveString</name>
+        <description>simple string for finding a Dave</description>
+        <type>String</type>
+        <multiValued>false</multiValued>
+        <mandatory>true</mandatory>
+      </configurationParameter>
+    </configurationParameters>
+
+    <!-- Value assigned to DaveString by this descriptor. -->
+    <configurationParameterSettings>
+      <nameValuePair>
+        <name>DaveString</name>
+        <value>
+          <string>Dave</string>
+        </value>
+      </nameValuePair>
+    </configurationParameterSettings>
+
+    <!-- Type system: a single annotation subtype that declares no features of its own. -->
+    <typeSystemDescription>
+      <types>
+        <typeDescription>
+          <name>org.apache.uima.examples.David</name>
+          <description/>
+          <supertypeName>uima.tcas.Annotation</supertypeName>
+          <features/>
+        </typeDescription>
+      </types>
+    </typeSystemDescription>
+
+    <!-- Capabilities: empty input list, the David type as output, language left unspecified. -->
+    <capabilities>
+      <capability>
+        <inputs/>
+        <outputs>
+          <type allAnnotatorFeatures="true">org.apache.uima.examples.David</type>
+        </outputs>
+        <languagesSupported>
+          <language>x-unspecified</language>
+        </languagesSupported>
+      </capability>
+    </capabilities>
+  </analysisEngineMetaData>
+</taeDescription>
+

Added: incubator/uima/uimacpp/trunk/examples/descriptors/SimpleTextSegmenter.xml
URL: http://svn.apache.org/viewvc/incubator/uima/uimacpp/trunk/examples/descriptors/SimpleTextSegmenter.xml?view=auto&rev=503239
==============================================================================
--- incubator/uima/uimacpp/trunk/examples/descriptors/SimpleTextSegmenter.xml (added)
+++ incubator/uima/uimacpp/trunk/examples/descriptors/SimpleTextSegmenter.xml Sat Feb  3 08:47:14 2007
@@ -0,0 +1,54 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!-- For testing only. -->
+<analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
+  <frameworkImplementation>org.apache.uima.cpp</frameworkImplementation>
+  <primitive>true</primitive>
+  <annotatorImplementationName>SimpleTextSegmenter</annotatorImplementationName>
+
+  <analysisEngineMetaData>
+    <name>Simple Text Segmenter</name>
+    <description>Splits a text document into pieces. The point at which the text is split is determined by SegmentDelimiter configuration parameter which defaults to new line ('\n')</description>
+    <version>1.0</version>
+    <vendor>IBM</vendor>
+
+    <!-- One optional, single-valued string parameter; the settings below assign it the value ".". -->
+    <configurationParameters>
+      <configurationParameter>
+        <name>SegmentDelimiter</name>
+        <description>segment delimiter</description>
+        <type>String</type>
+        <multiValued>false</multiValued>
+        <mandatory>false</mandatory>
+      </configurationParameter>
+    </configurationParameters>
+    <configurationParameterSettings>
+      <nameValuePair>
+        <name>SegmentDelimiter</name>
+        <value>
+          <string>.</string>
+        </value>
+      </nameValuePair>
+    </configurationParameterSettings>
+
+    <!-- The type system is imported by name instead of being declared inline. -->
+    <typeSystemDescription>
+      <imports>
+        <import name="org.apache.uima.examples.SourceDocumentInformation"/>
+      </imports>
+    </typeSystemDescription>
+
+    <!-- A single capability with an empty output list. -->
+    <capabilities>
+      <capability>
+        <outputs/>
+      </capability>
+    </capabilities>
+
+    <!-- Operational flags: input CAS not modified, multiple deployment allowed, new CASes output. -->
+    <operationalProperties>
+      <modifiesCas>false</modifiesCas>
+      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
+      <outputsNewCASes>true</outputsNewCASes>
+    </operationalProperties>
+  </analysisEngineMetaData>
+</analysisEngineDescription>

Added: incubator/uima/uimacpp/trunk/examples/descriptors/SofaDataAnnotator.xml
URL: http://svn.apache.org/viewvc/incubator/uima/uimacpp/trunk/examples/descriptors/SofaDataAnnotator.xml?view=auto&rev=503239
==============================================================================
--- incubator/uima/uimacpp/trunk/examples/descriptors/SofaDataAnnotator.xml (added)
+++ incubator/uima/uimacpp/trunk/examples/descriptors/SofaDataAnnotator.xml Sat Feb  3 08:47:14 2007
@@ -0,0 +1,17 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<taeDescription xmlns="http://uima.apache.org/resourceSpecifier">
+  <frameworkImplementation>org.apache.uima.cpp</frameworkImplementation>
+  <primitive>true</primitive>
+  <annotatorImplementationName>SofaDataAnnotator</annotatorImplementationName>
+  <!-- Only descriptive metadata is given: no parameters, types or capabilities are declared. -->
+  <!-- NOTE(review): SofaExampleAnnotator.xml carries the same display name; confirm that is intended. -->
+  <analysisEngineMetaData>
+    <name>Sofa Test Annotator</name>
+    <description>Tokenizes sofa data on whitespace.</description>
+    <version>1.0</version>
+    <vendor>IBM</vendor>
+  </analysisEngineMetaData>
+</taeDescription>
+
+
+

Added: incubator/uima/uimacpp/trunk/examples/descriptors/SofaExampleAnnotator.xml
URL: http://svn.apache.org/viewvc/incubator/uima/uimacpp/trunk/examples/descriptors/SofaExampleAnnotator.xml?view=auto&rev=503239
==============================================================================
--- incubator/uima/uimacpp/trunk/examples/descriptors/SofaExampleAnnotator.xml (added)
+++ incubator/uima/uimacpp/trunk/examples/descriptors/SofaExampleAnnotator.xml Sat Feb  3 08:47:14 2007
@@ -0,0 +1,56 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<taeDescription xmlns="http://uima.apache.org/resourceSpecifier">
+  <frameworkImplementation>org.apache.uima.cpp</frameworkImplementation>
+  <primitive>true</primitive>
+  <annotatorImplementationName>SofaExampleAnnotator</annotatorImplementationName>
+
+  <analysisEngineMetaData>
+    <name>Sofa Test Annotator</name>
+    <description>Looks for an English Sofa and creates a German one.</description>
+    <version>1.0</version>
+    <vendor>IBM</vendor>
+
+    <!-- No configuration parameters are declared, and no values are set. -->
+    <configurationParameters/>
+    <configurationParameterSettings/>
+
+    <!-- Type system: one annotation subtype whose single feature refers to another annotation. -->
+    <typeSystemDescription>
+      <types>
+        <typeDescription>
+          <name>sofa.test.CrossAnnotation</name>
+          <description/>
+          <supertypeName>uima.tcas.Annotation</supertypeName>
+          <features>
+            <featureDescription>
+              <name>otherAnnotation</name>
+              <description/>
+              <rangeTypeName>uima.tcas.Annotation</rangeTypeName>
+            </featureDescription>
+          </features>
+        </typeDescription>
+      </types>
+    </typeSystemDescription>
+
+    <!-- No index definitions are declared in this descriptor. -->
+
+    <!-- Capabilities: CrossAnnotation output, EnglishDocument sofa in, GermanDocument sofa out. -->
+    <capabilities>
+      <capability>
+        <inputs/>
+        <outputs>
+          <type allAnnotatorFeatures="true">sofa.test.CrossAnnotation</type>
+        </outputs>
+        <inputSofas>
+          <sofaName>EnglishDocument</sofaName>
+        </inputSofas>
+        <outputSofas>
+          <sofaName>GermanDocument</sofaName>
+        </outputSofas>
+        <languagesSupported>
+          <language>x-unspecified</language>
+        </languagesSupported>
+      </capability>
+    </capabilities>
+  </analysisEngineMetaData>
+</taeDescription>

Added: incubator/uima/uimacpp/trunk/examples/descriptors/XCasWriterCasConsumer.xml
URL: http://svn.apache.org/viewvc/incubator/uima/uimacpp/trunk/examples/descriptors/XCasWriterCasConsumer.xml?view=auto&rev=503239
==============================================================================
--- incubator/uima/uimacpp/trunk/examples/descriptors/XCasWriterCasConsumer.xml (added)
+++ incubator/uima/uimacpp/trunk/examples/descriptors/XCasWriterCasConsumer.xml Sat Feb  3 08:47:14 2007
@@ -0,0 +1,76 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<!-- A simple CAS consumer that writes a stand-off XML (XCAS) representation of the CAS to the filesystem. -->
+
+<casConsumerDescription xmlns="http://uima.apache.org/resourceSpecifier"
+                        xmlns:xi="http://www.w3.org/2001/XInclude">
+  <frameworkImplementation>org.apache.uima.cpp</frameworkImplementation>
+  <implementationName>XCasWriterCasConsumer</implementationName>
+
+  <processingResourceMetaData>
+    <name>XCAS Writer CAS Consumer</name>
+    <description>Writes the CAS to a stand-off XML format (XCAS)</description>
+    <version>1.0</version>
+    <vendor>IBM</vendor>
+
+    <!-- One optional, single-valued string parameter naming the output directory. -->
+    <configurationParameters>
+      <configurationParameter>
+        <name>OutputDirectory</name>
+        <description>The directory where xcas files are to be created.  The directory will be created if it does not exist.</description>
+        <type>String</type>
+        <multiValued>false</multiValued>
+        <mandatory>false</mandatory>
+      </configurationParameter>
+    </configurationParameters>
+
+    <!-- Sample OutputDirectory setting, left commented out: this descriptor assigns no value itself. -->
+    <!--
+    <configurationParameterSettings>
+      <nameValuePair>
+        <name>OutputDirectory</name>
+        <value>
+          <string>xcasOutputDirectory</string>
+        </value>
+      </nameValuePair>
+    </configurationParameterSettings>
+    -->
+
+    <!-- Type system: SourceDocumentInformation is declared inline with its three features. -->
+    <typeSystemDescription>
+      <types>
+        <typeDescription>
+          <name>org.apache.uima.examples.SourceDocumentInformation</name>
+          <description>Stores detailed information about the original source document from which the current CAS was initialized. All information (like size) refers to the source document and not to the document in the CAS which may be converted and filtered by a CAS Initializer. For example this information will be written to the Semantic Search index so that the original document contents can be retrieved by queries.</description>
+          <supertypeName>uima.tcas.Annotation</supertypeName>
+          <features>
+            <featureDescription>
+              <name>uri</name>
+              <description>URI of document. (For example, file:///MyDirectory/myFile.txt for a simple file or http://www.research.ibm.com/UIMA/relatedprojects.htm for content from a web source.)</description>
+              <rangeTypeName>uima.cas.String</rangeTypeName>
+            </featureDescription>
+            <featureDescription>
+              <name>offsetInSource</name>
+              <description>Byte offset of the start of document content within original source file or other input source. Only used if the CAS document was retrieved from a source where one physical source file contained several conceptual documents. Zero otherwise.</description>
+              <rangeTypeName>uima.cas.Integer</rangeTypeName>
+            </featureDescription>
+            <featureDescription>
+              <name>documentSize</name>
+              <description>Size of original document in bytes before processing by CAS Initializer. Either absolute file size or size within file or other source.</description>
+              <rangeTypeName>uima.cas.Integer</rangeTypeName>
+            </featureDescription>
+          </features>
+        </typeDescription>
+      </types>
+    </typeSystemDescription>
+
+    <!-- Capabilities: SourceDocumentInformation is the only declared input type. -->
+    <capabilities>
+      <capability>
+        <inputs>
+          <type allAnnotatorFeatures="true">org.apache.uima.examples.SourceDocumentInformation</type>
+        </inputs>
+      </capability>
+    </capabilities>
+  </processingResourceMetaData>
+</casConsumerDescription>