You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@uima.apache.org by bu...@apache.org on 2010/12/18 23:21:27 UTC
svn commit: r1050726 [2/2] - in /uima/sandbox/trunk/GaleMultiModalExample:
./ desc/ desc/typesystem/
Added: uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTTSTypes.xml
URL: http://svn.apache.org/viewvc/uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTTSTypes.xml?rev=1050726&view=auto
==============================================================================
--- uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTTSTypes.xml (added)
+++ uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTTSTypes.xml Sat Dec 18 22:21:26 2010
@@ -0,0 +1,53 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+ <!--
+ ***************************************************************
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ ***************************************************************
+ -->
+
+<typeSystemDescription xmlns="http://uima.apache.org/resourceSpecifier">
+ <name>TTS</name>
+ <description>Component of GALE Type System: TTS.</description>
+ <version>1.4</version>
+ <types>
+ <typeDescription>
+ <name>org.gale.AudioData</name>
+ <description>Audio data</description>
+ <supertypeName>uima.cas.TOP</supertypeName>
+ <features>
+ <featureDescription>
+ <name>buffer</name>
+ <description>An array of bytes holding the audio.</description>
+ <rangeTypeName>uima.cas.ByteArray</rangeTypeName>
+ </featureDescription>
+ <featureDescription>
+ <name>mimeType</name>
+ <description>Mimetype of audio</description>
+ <rangeTypeName>uima.cas.String</rangeTypeName>
+ </featureDescription>
+ <featureDescription>
+ <name>componentId</name>
+ <description> ID of the component creating this entry
+ </description>
+ <rangeTypeName>uima.cas.String</rangeTypeName>
+ </featureDescription>
+ </features>
+ </typeDescription>
+ </types>
+</typeSystemDescription>
Propchange: uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTTSTypes.xml
------------------------------------------------------------------------------
svn:eol-style = native
Added: uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTokenTypePriorities.xml
URL: http://svn.apache.org/viewvc/uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTokenTypePriorities.xml?rev=1050726&view=auto
==============================================================================
--- uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTokenTypePriorities.xml (added)
+++ uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTokenTypePriorities.xml Sat Dec 18 22:21:26 2010
@@ -0,0 +1,36 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+ <!--
+ ***************************************************************
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ ***************************************************************
+ -->
+
+<typePriorities xmlns="http://uima.apache.org/resourceSpecifier">
+ <name>GaleTokenTypePriorities</name>
+ <description>Component of GALE Type System: priorities for text-token types.</description>
+ <version>1.4</version>
+ <priorityLists>
+ <priorityList>
+ <type>org.gale.Paragraph</type>
+ <type>org.gale.Sentence</type>
+ <type>org.gale.NonWhiteSpaceToken</type>
+ <type>org.gale.SubWordUnit</type>
+ </priorityList>
+ </priorityLists>
+</typePriorities>
Propchange: uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTokenTypePriorities.xml
------------------------------------------------------------------------------
svn:eol-style = native
Added: uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTokenTypes.xml
URL: http://svn.apache.org/viewvc/uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTokenTypes.xml?rev=1050726&view=auto
==============================================================================
--- uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTokenTypes.xml (added)
+++ uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTokenTypes.xml Sat Dec 18 22:21:26 2010
@@ -0,0 +1,210 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+ <!--
+ ***************************************************************
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ ***************************************************************
+ -->
+
+<typeSystemDescription xmlns="http://uima.apache.org/resourceSpecifier">
+ <name>GTS</name>
+ <description>Component of GALE Type System: types for text tokens.</description>
+ <version>1.4</version>
+ <types>
+
+ <!-- ================================================================
+ Token
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.Token</name>
+ <description>Tokenizer output - these should be non-overlapping.
+ Frequently the set of Tokens will cover the entire document, but this
+ is not required. The type hierarchy derived from Token is used purely
+ for constructing specific iterators, not for data inheritance.
+ </description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ </typeDescription>
+
+
+ <!-- ================================================================
+ WhiteSpaceToken
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.WhiteSpaceToken</name>
+ <description>A span of characters that meet the
+ Unicode definition of whitespace.
+ </description>
+ <supertypeName>org.gale.Token</supertypeName>
+ </typeDescription>
+
+ <!-- ================================================================
+ NonWhiteSpaceToken
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.NonWhiteSpaceToken</name>
+ <description>A span of characters that meet the Unicode
+ definition of non-whitespace.
+ </description>
+ <supertypeName>org.gale.Token</supertypeName>
+ </typeDescription>
+
+ <!-- ================================================================
+ PunctuationToken
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.PunctuationToken</name>
+ <description>A span of characters (often just one character) that meet the Unicode definition
+ of punctuation.
+ </description>
+ <supertypeName>org.gale.NonWhiteSpaceToken</supertypeName>
+ </typeDescription>
+
+
+ <!-- ================================================================
+ WordToken
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.WordToken</name>
+ <description>A basic unanalyzed word
+ </description>
+ <supertypeName>org.gale.NonWhiteSpaceToken</supertypeName>
+ </typeDescription>
+
+
+ <!-- ================================================================
+ Sentence
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.Sentence</name>
+ <description>A Sentence is not derived from Token, but covers one
+ or more Tokens (It should not cross brackets with a Token.) Sentences
+ are non-overlapping. Sentences are not required to collectively
+ cover the entire document text, but often do.
+ </description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ </typeDescription>
+
+ <!-- ================================================================
+ Paragraph
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.Paragraph</name>
+ <description>A Paragraph is not derived from Sentence, but covers one
+ or more Sentences (It should not cross brackets with a Sentence.) Paragraphs
+ are non-overlapping. Paragraphs are not required to collectively
+ cover the entire document text, but often do.
+ </description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ </typeDescription>
+
+
+
+ <!-- ================================================================
+ SubWordUnit
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.SubWordUnit</name>
+ <description>Subword units represent morphemes or stems. If the analysis is
+ produced on the same sofa as the input text, then begin and end should come from the
+ token that is analyzed. So a 1-character prefix in a WordToken from 0 to 3
+ should go from 0 to 1.
+ </description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ <features>
+ <featureDescription>
+ <name>index</name>
+ <description>Used to represent the position in a sequence of
+ morphemes derived from a WordToken. The first
+ SubWordUnit is numbered 0, and following units increment from there.
+ </description>
+ <rangeTypeName>uima.cas.Integer</rangeTypeName>
+ </featureDescription>
+
+ <featureDescription>
+ <name>affixType</name>
+ <description>This enum can be one of prefix, suffix, or stem.
+ (Should infix be another valid value?)
+ </description>
+ <rangeTypeName>uima.cas.String</rangeTypeName>
+ </featureDescription>
+
+ <featureDescription>
+ <name>token</name>
+ <description>The WordToken that was analyzed to produce the subword unit
+ </description>
+ <rangeTypeName>org.gale.WordToken</rangeTypeName>
+ </featureDescription>
+
+ <featureDescription>
+ <name>value</name>
+ <description>The value of the subword unit produced by the analysis, for example
+ if "running" is stemmed to "run" then value = "run"
+ </description>
+ <rangeTypeName>uima.cas.String</rangeTypeName>
+ </featureDescription>
+ </features>
+ </typeDescription>
+
+
+ <!-- ================================================================
+ TextLanguageID
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.TextLanguageID</name>
+ <description> Value containing automatically identified language of
+ a span in the document. Since documents may be multilingual,
+ there may be multiple TextLanguageID annotations in a view. Also,
+ there may be more than one annotation covering the same text if
+ an automatic language detection engine is unsure of its output.
+ </description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ <features>
+ <featureDescription>
+ <name>language</name>
+ <description>The language, as a lowercase ISO 639 two-letter code.
+ (Should the optional extension (en_us) be here or in a separate field?)
+ </description>
+ <rangeTypeName>uima.cas.String</rangeTypeName>
+ </featureDescription>
+
+ <featureDescription>
+ <name>confidence</name>
+ <description>Value representing the "score" of the language
+ identification, such as the probability that the span is actually
+ in this language. If multiple LanguageIDs are annotated, the
+ primary sorting key will be by score, with largest score first
+ (top-n lists).
+ </description>
+ <rangeTypeName>uima.cas.Float</rangeTypeName>
+ </featureDescription>
+ </features>
+ </typeDescription>
+
+
+
+ </types>
+</typeSystemDescription>
Propchange: uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleTokenTypes.xml
------------------------------------------------------------------------------
svn:eol-style = native
Added: uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleXrefTypes.xml
URL: http://svn.apache.org/viewvc/uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleXrefTypes.xml?rev=1050726&view=auto
==============================================================================
--- uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleXrefTypes.xml (added)
+++ uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleXrefTypes.xml Sat Dec 18 22:21:26 2010
@@ -0,0 +1,173 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+ <!--
+ ***************************************************************
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied. See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ ***************************************************************
+ -->
+
+<typeSystemDescription xmlns="http://uima.apache.org/resourceSpecifier">
+ <name>GTS</name>
+ <description>Component of GALE Type System: types for cross-referencing among sofas.</description>
+ <version>1.4</version>
+ <imports>
+ <import location="GaleSpeechTypes.xml"/>
+ <import location="GaleMTTypes.xml"/>
+ <import location="GaleEntityTypes.xml"/>
+ </imports>
+ <types>
+
+ <!-- ================================================================
+ AudioXref
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.AudioXref</name>
+ <description>Cross-reference from a text annotation back to the corresponding AudioSpan.
+ </description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ <features>
+ <featureDescription>
+ <name>span</name>
+ <description>Reference to an AudioSpan on the Audio Sofa</description>
+ <rangeTypeName>org.gale.AudioSpan</rangeTypeName>
+ </featureDescription>
+ </features>
+ </typeDescription>
+
+ <!-- ================================================================
+ TranslateXref
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.TranslateXref</name>
+ <description>Cross-reference from an annotation on target text back to the corresponding source.
+ Aligns a pair of phrases in the source and target texts such
+ that all word-word alignments are within the phrases.
+ Usually the smallest pairings with all internal alignments, but
+ could be larger, i.e. sentence-to-sentence.
+ </description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ <features>
+ <featureDescription>
+ <name>source</name>
+ <description>Reference to an Annotation on the source language Sofa</description>
+ <rangeTypeName>uima.tcas.Annotation</rangeTypeName>
+ </featureDescription>
+ </features>
+ </typeDescription>
+
+ <!-- ================================================================
+ TranslationResultXref
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.TranslationResultXref</name>
+ <description>Cross-reference from an annotation on target
+ text back to the corresponding TranslationResult.
+ Aligns a span of target text to the TranslationResult
+ on the source-language sofa that provided it.
+ </description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ <features>
+ <featureDescription>
+ <name>source</name>
+ <description>Reference to a TranslationResult on the source language Sofa</description>
+ <rangeTypeName>org.gale.TranslationResult</rangeTypeName>
+ </featureDescription>
+ </features>
+ </typeDescription>
+
+ <!-- ================================================================
+ EntityMentionXref
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.EntityMentionXref</name>
+ <description>Cross-reference from an EntityMention on target text
+ back to the corresponding EntityMention on the source-language
+ sofa. Mentions are expected to be a single span of text in both
+ the source and target sofas.
+ </description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ <features>
+ <featureDescription>
+ <name>source</name>
+ <description>Reference to a Mention on the source language Sofa</description>
+ <rangeTypeName>org.gale.EntityMention</rangeTypeName>
+ </featureDescription>
+ <featureDescription>
+ <name>target</name>
+ <description>Reference to an EntityMention on the target language Sofa</description>
+ <rangeTypeName>org.gale.EntityMention</rangeTypeName>
+ </featureDescription>
+ </features>
+ </typeDescription>
+
+ <!-- ================================================================
+ EventMentionXref
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.EventMentionXref</name>
+ <description>Cross-reference from an EventMention on
+ target text back to the corresponding EventMention on the
+ source-language sofa.
+ </description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ <features>
+ <featureDescription>
+ <name>source</name>
+ <description>Reference to a Mention on the source language Sofa</description>
+ <rangeTypeName>org.gale.EventMention</rangeTypeName>
+ </featureDescription>
+ <featureDescription>
+ <name>target</name>
+ <description>Reference to a Mention on the target language Sofa</description>
+ <rangeTypeName>org.gale.EventMention</rangeTypeName>
+ </featureDescription>
+ </features>
+ </typeDescription>
+
+ <!-- ================================================================
+ RelationMentionXref
+ ================================================================ -->
+
+ <typeDescription>
+ <name>org.gale.RelationMentionXref</name>
+ <description>Cross-reference from a RelationMention on
+ target text back to the corresponding RelationMention on
+ the source-language sofa.
+ </description>
+ <supertypeName>uima.tcas.Annotation</supertypeName>
+ <features>
+ <featureDescription>
+ <name>source</name>
+ <description>Reference to a Mention on the source-language Sofa</description>
+ <rangeTypeName>org.gale.RelationMention</rangeTypeName>
+ </featureDescription>
+ <featureDescription>
+ <name>target</name>
+ <description>Reference to a RelationMention on the target-language Sofa</description>
+ <rangeTypeName>org.gale.RelationMention</rangeTypeName>
+ </featureDescription>
+ </features>
+ </typeDescription>
+
+ </types>
+</typeSystemDescription>
Propchange: uima/sandbox/trunk/GaleMultiModalExample/desc/typesystem/GaleXrefTypes.xml
------------------------------------------------------------------------------
svn:eol-style = native