You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@opennlp.apache.org by jo...@apache.org on 2012/03/05 18:43:42 UTC
svn commit: r1297142 - /opennlp/sandbox/corpus-server-connector/desc/CSQueueCollectionReader.xml
Author: joern
Date: Mon Mar 5 17:43:42 2012
New Revision: 1297142
URL: http://svn.apache.org/viewvc?rev=1297142&view=rev
Log:
OPENNLP-460 Updated to fit implementation.
Modified:
opennlp/sandbox/corpus-server-connector/desc/CSQueueCollectionReader.xml
Modified: opennlp/sandbox/corpus-server-connector/desc/CSQueueCollectionReader.xml
URL: http://svn.apache.org/viewvc/opennlp/sandbox/corpus-server-connector/desc/CSQueueCollectionReader.xml?rev=1297142&r1=1297141&r2=1297142&view=diff
==============================================================================
--- opennlp/sandbox/corpus-server-connector/desc/CSQueueCollectionReader.xml (original)
+++ opennlp/sandbox/corpus-server-connector/desc/CSQueueCollectionReader.xml Mon Mar 5 17:43:42 2012
@@ -9,7 +9,7 @@
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
- *
+ *
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
@@ -31,15 +31,29 @@
<vendor>The Apache Software Foundation</vendor>
<configurationParameters>
<configurationParameter>
- <name>CorpusAddress</name>
- <description>Directory containing input files</description>
+ <name>ServerAddress</name>
+ <description>The location of the server.</description>
<type>String</type>
<multiValued>false</multiValued>
<mandatory>true</mandatory>
</configurationParameter>
<configurationParameter>
- <name>QueueAddress</name>
- <description>Directory containing input files</description>
+ <name>CorpusName</name>
+ <description>The id of the corpus which should be processed.</description>
+ <type>String</type>
+ <multiValued>false</multiValued>
+ <mandatory>true</mandatory>
+ </configurationParameter>
+ <configurationParameter>
+ <name>SearchQuery</name>
+ <description>The query to populate the queue.</description>
+ <type>String</type>
+ <multiValued>false</multiValued>
+ <mandatory>true</mandatory>
+ </configurationParameter>
+ <configurationParameter>
+ <name>QueueName</name>
+ <description>Name of the queue to create with the search query.</description>
<type>String</type>
<multiValued>false</multiValued>
<mandatory>true</mandatory>
@@ -47,24 +61,35 @@
</configurationParameters>
<configurationParameterSettings>
<nameValuePair>
- <name>CorpusAddress</name>
+ <name>ServerAddress</name>
<value>
- <string>http://localhost:8080/corpus-server/rest/corpora/wikinews</string>
+ <string>http://localhost:8080/corpus-server/rest</string>
+ </value>
+ </nameValuePair>
+ <nameValuePair>
+ <name>CorpusName</name>
+ <value>
+ <string>wikinews</string>
+ </value>
+ </nameValuePair>
+ <nameValuePair>
+ <name>SearchQuery</name>
+ <value>
+ <string>status-token:true</string>
+ </value>
+ </nameValuePair>
+ <nameValuePair>
+ <name>QueueName</name>
+ <value>
+ <string>EnglishTokenizerTraining</string>
</value>
</nameValuePair>
- <nameValuePair>
- <name>QueueAddress</name>
- <value>
- <string>http://localhost:8080/corpus-server/rest/queues/WikinewsNerPersonTrainingTask</string>
- </value>
- </nameValuePair>
</configurationParameterSettings>
-
- <!-- Type System of CASes returned by this Collection Reader -->
- <!-- TODO: Can TS be imported via http?! Otherwise it must be downloaded by the user! -->
+
+ <!-- Type System must be compatible with the one used for the corpus. -->
<typeSystemDescription>
<imports>
- <import name="org.apache.uima.examples.SourceDocumentInformation"/>
+ <import location="TypeSystem.xml"/>
</imports>
</typeSystemDescription>