You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@stanbol.apache.org by rw...@apache.org on 2011/09/22 08:51:36 UTC
svn commit: r1173968 [2/5] - in /incubator/stanbol/trunk:
commons/installer/bundleprovider/src/main/java/org/apache/stanbol/commons/installer/provider/bundle/impl/
commons/jsonld/ commons/opennlp/
commons/opennlp/src/main/java/org/apache/stanbol/common...
Added: incubator/stanbol/trunk/data/opennlp/lang/de/download_models.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/de/download_models.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/de/download_models.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/lang/de/download_models.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,36 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project name="OpenNLP Model Download Helper" default="download" basedir=".">
+ <description>
+ Contains only a single target that is used by the Maven Ant
+ Plugin to download OpenNLP Models from the Web
+ </description>
+
+ <target name="download">
+ <copy todir="${target.directory}" flatten="true">
+ <resources>
+ <url url="${model.url}/de-token.bin"/>
+ <url url="${model.url}/de-sent.bin"/>
+ <url url="${model.url}/de-pos-perceptron.bin"/>
+ <!-- No chunker model for German, so this download stays disabled:
+ <url url="${model.url}/de-chunker.bin"/>
+ -->
+ </resources>
+ </copy>
+ </target>
+</project>
\ No newline at end of file
Propchange: incubator/stanbol/trunk/data/opennlp/lang/de/download_models.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Added: incubator/stanbol/trunk/data/opennlp/lang/de/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/de/pom.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/de/pom.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/lang/de/pom.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,122 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+ xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
+
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.parent</artifactId>
+ <version>0.9.0-incubating-SNAPSHOT</version>
+ <relativePath>../../../parent</relativePath>
+ </parent>
+
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.opennlp.lang.de</artifactId>
+ <version>1.0.0-incubating</version>
+ <packaging>bundle</packaging>
+
+ <name>Apache Stanbol Data: OpenNLP Models for German</name>
+ <description>
+ Bundle containing all necessary/available models for parsing German language texts. This does not include models for named entity recognition (NER).
+ </description>
+ <inceptionYear>2011</inceptionYear>
+
+ <scm>
+ <connection>
+ scm:svn:http://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/lang/de
+ </connection>
+ <developerConnection>
+ scm:svn:https://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/lang/de
+ </developerConnection>
+ <url>http://incubator.apache.org/stanbol/</url>
+ </scm>
+ <properties>
+ <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
+ <!-- Define the resource path (opennlp.model.path) and the download home URL (opennlp.model.home) of the OpenNLP models -->
+ <opennlp.model.path>org/apache/stanbol/data/opennlp</opennlp.model.path>
+ <opennlp.model.home>http://dev.iks-project.eu/downloads/opennlp/models-1.5/</opennlp.model.home>
+ </properties>
+
+ <build>
+ <plugins>
+ <plugin>
+ <groupId>org.apache.felix</groupId>
+ <artifactId>maven-bundle-plugin</artifactId>
+ <configuration>
+ <instructions>
+ <_versionpolicy>$${version;===;${@}}</_versionpolicy>
+
+ <!--
+ Extension used to provide files in that directory to the
+ DataFileProvider
+ -->
+ <Data-Files>${opennlp.model.path}</Data-Files>
+ <!--
+ Use a priority lower than 0 to allow providers without a
+ defined ranking to override this default data.
+ -->
+ <Data-Files-Priority>
+ -100
+ </Data-Files-Priority>
+ </instructions>
+ </configuration>
+ </plugin>
+ <plugin>
+ <!--
+ Ant is used to download the models from the location
+ configured by the opennlp.model.home property.
+ -->
+ <groupId>org.apache.maven.plugins</groupId>
+ <artifactId>maven-antrun-plugin</artifactId>
+ <executions>
+ <execution>
+ <id>compile</id>
+ <phase>compile</phase>
+ <configuration>
+ <!--
+ TODO: I would like to add an "unless" constraint to the
+ target that prevents execution if Maven operates in offline
+ mode. However, I was not able to find out how to obtain this
+ information. ${settings.offline} (as noted by several
+ resources) does not work.
+ Until this is fixed, builds will fail if no internet connection
+ is available!
+ -->
+ <target>
+ <property name="target.directory" value="${project.basedir}/src/main/resources/${opennlp.model.path}"/>
+ <property name="model.url" value="${opennlp.model.home}"/>
+
+ <echo message="copy OpenNLP models"/>
+ <echo message=" FROM ${model.url} "/>
+ <echo message=" TO ${target.directory}"/>
+
+ <ant antfile="${basedir}/download_models.xml">
+ <target name="download"/>
+ </ant>
+ </target>
+ </configuration>
+ <goals>
+ <goal>run</goal>
+ </goals>
+ </execution>
+ </executions>
+ </plugin>
+ </plugins>
+ </build>
+</project>
Propchange: incubator/stanbol/trunk/data/opennlp/lang/de/pom.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Propchange: incubator/stanbol/trunk/data/opennlp/lang/de/src/main/resources/org/apache/stanbol/data/opennlp/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,5 @@
+de-sent.bin
+
+de-pos-perceptron.bin
+
+de-token.bin
Propchange: incubator/stanbol/trunk/data/opennlp/lang/de/target/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,15 @@
+maven-shared-archive-resources
+
+org.apache.stanbol.data.opennlp.lang.de-1.0.0-incubating-sources.jar
+
+.plxarc
+
+test-classes
+
+antrun
+
+org.apache.stanbol.data.opennlp.lang.de-1.0.0-incubating.jar
+
+surefire
+
+classes
Modified: incubator/stanbol/trunk/data/opennlp/lang/en/download_models.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/en/download_models.xml?rev=1173968&r1=1173967&r2=1173968&view=diff
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/en/download_models.xml (original)
+++ incubator/stanbol/trunk/data/opennlp/lang/en/download_models.xml Thu Sep 22 06:51:30 2011
@@ -24,6 +24,7 @@
<target name="download">
<copy todir="${target.directory}" flatten="true">
<resources>
+ <url url="${model.url}/en-token.bin"/>
<url url="${model.url}/en-sent.bin"/>
<url url="${model.url}/en-pos-perceptron.bin"/>
<url url="${model.url}/en-chunker.bin"/>
Added: incubator/stanbol/trunk/data/opennlp/lang/nl/README.md
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/nl/README.md?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/nl/README.md (added)
+++ incubator/stanbol/trunk/data/opennlp/lang/nl/README.md Thu Sep 22 06:51:30 2011
@@ -0,0 +1,21 @@
+# Data files Bundles for OpenNLP
+
+This source repository only holds the pom.xml file and folder structure of this bundle.
+
+To avoid loading the Subversion repository with large binary files, this artifact has to be built and deployed manually; the build retrieves the precomputed models from other sites.
+
+
+## Downloading the OpenNLP statistical model
+
+The OpenNLP models are downloaded from
+
+ http://opennlp.sourceforge.net/models-1.5
+
+The download URL actually used is defined by the 'opennlp.model.home' property in the 'pom.xml'.
+The list of downloaded files is defined within the 'download_models.xml'.
+
+## NOTE
+
+Using this bundle is only an alternative to manually copying the required OpenNLP models to '{stanbol-installation}/sling/datafiles'.
+
+In addition, model files in that folder take precedence over models provided by this bundle.
Added: incubator/stanbol/trunk/data/opennlp/lang/nl/download_models.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/nl/download_models.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/nl/download_models.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/lang/nl/download_models.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,36 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project name="OpenNLP Model Download Helper" default="download" basedir=".">
+ <description>
+ Contains only a single target that is used by the Maven Ant
+ Plugin to download OpenNLP Models from the Web
+ </description>
+
+ <target name="download">
+ <copy todir="${target.directory}" flatten="true">
+ <resources>
+ <url url="${model.url}/nl-token.bin"/>
+ <url url="${model.url}/nl-sent.bin"/>
+ <url url="${model.url}/nl-pos-perceptron.bin"/>
+ <!-- No chunker model for nl (Dutch), so this download stays disabled:
+ <url url="${model.url}/nl-chunker.bin"/>
+ -->
+ </resources>
+ </copy>
+ </target>
+</project>
\ No newline at end of file
Propchange: incubator/stanbol/trunk/data/opennlp/lang/nl/download_models.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Added: incubator/stanbol/trunk/data/opennlp/lang/nl/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/nl/pom.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/nl/pom.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/lang/nl/pom.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,122 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+ xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
+
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.parent</artifactId>
+ <version>0.9.0-incubating-SNAPSHOT</version>
+ <relativePath>../../../parent</relativePath>
+ </parent>
+
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.opennlp.lang.nl</artifactId>
+ <version>1.0.0-incubating</version>
+ <packaging>bundle</packaging>
+
+ <name>Apache Stanbol Data: OpenNLP Models for Dutch</name>
+ <description>
+ Bundle containing all necessary/available models for parsing Dutch language texts. This does not include models for named entity recognition (NER).
+ </description>
+ <inceptionYear>2011</inceptionYear>
+
+ <scm>
+ <connection>
+ scm:svn:http://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/lang/nl
+ </connection>
+ <developerConnection>
+ scm:svn:https://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/lang/nl
+ </developerConnection>
+ <url>http://incubator.apache.org/stanbol/</url>
+ </scm>
+ <properties>
+ <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
+ <!-- Define the resource path (opennlp.model.path) and the download home URL (opennlp.model.home) of the OpenNLP models -->
+ <opennlp.model.path>org/apache/stanbol/data/opennlp</opennlp.model.path>
+ <opennlp.model.home>http://dev.iks-project.eu/downloads/opennlp/models-1.5/</opennlp.model.home>
+ </properties>
+
+ <build>
+ <plugins>
+ <plugin>
+ <groupId>org.apache.felix</groupId>
+ <artifactId>maven-bundle-plugin</artifactId>
+ <configuration>
+ <instructions>
+ <_versionpolicy>$${version;===;${@}}</_versionpolicy>
+
+ <!--
+ Extension used to provide files in that directory to the
+ DataFileProvider
+ -->
+ <Data-Files>${opennlp.model.path}</Data-Files>
+ <!--
+ Use a priority lower than 0 to allow providers without a
+ defined ranking to override this default data.
+ -->
+ <Data-Files-Priority>
+ -100
+ </Data-Files-Priority>
+ </instructions>
+ </configuration>
+ </plugin>
+ <plugin>
+ <!--
+ Ant is used to download the models from the location
+ configured by the opennlp.model.home property.
+ -->
+ <groupId>org.apache.maven.plugins</groupId>
+ <artifactId>maven-antrun-plugin</artifactId>
+ <executions>
+ <execution>
+ <id>compile</id>
+ <phase>compile</phase>
+ <configuration>
+ <!--
+ TODO: I would like to add an "unless" constraint to the
+ target that prevents execution if Maven operates in offline
+ mode. However, I was not able to find out how to obtain this
+ information. ${settings.offline} (as noted by several
+ resources) does not work.
+ Until this is fixed, builds will fail if no internet connection
+ is available!
+ -->
+ <target>
+ <property name="target.directory" value="${project.basedir}/src/main/resources/${opennlp.model.path}"/>
+ <property name="model.url" value="${opennlp.model.home}"/>
+
+ <echo message="copy OpenNLP models"/>
+ <echo message=" FROM ${model.url} "/>
+ <echo message=" TO ${target.directory}"/>
+
+ <ant antfile="${basedir}/download_models.xml">
+ <target name="download"/>
+ </ant>
+ </target>
+ </configuration>
+ <goals>
+ <goal>run</goal>
+ </goals>
+ </execution>
+ </executions>
+ </plugin>
+ </plugins>
+ </build>
+</project>
Propchange: incubator/stanbol/trunk/data/opennlp/lang/nl/pom.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Propchange: incubator/stanbol/trunk/data/opennlp/lang/nl/src/main/resources/org/apache/stanbol/data/opennlp/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,5 @@
+nl-token.bin
+
+nl-pos-perceptron.bin
+
+nl-sent.bin
Propchange: incubator/stanbol/trunk/data/opennlp/lang/nl/target/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,15 @@
+test-classes
+
+org.apache.stanbol.data.opennlp.lang.nl-1.0.0-incubating.jar
+
+antrun
+
+classes
+
+.plxarc
+
+surefire
+
+maven-shared-archive-resources
+
+org.apache.stanbol.data.opennlp.lang.nl-1.0.0-incubating-sources.jar
Added: incubator/stanbol/trunk/data/opennlp/lang/pt/README.md
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/pt/README.md?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/pt/README.md (added)
+++ incubator/stanbol/trunk/data/opennlp/lang/pt/README.md Thu Sep 22 06:51:30 2011
@@ -0,0 +1,21 @@
+# Data files Bundles for OpenNLP
+
+This source repository only holds the pom.xml file and folder structure of this bundle.
+
+To avoid loading the Subversion repository with large binary files, this artifact has to be built and deployed manually; the build retrieves the precomputed models from other sites.
+
+
+## Downloading the OpenNLP statistical model
+
+The OpenNLP models are downloaded from
+
+ http://opennlp.sourceforge.net/models-1.5
+
+The download URL actually used is defined by the 'opennlp.model.home' property in the 'pom.xml'.
+The list of downloaded files is defined within the 'download_models.xml'.
+
+## NOTE
+
+Using this bundle is only an alternative to manually copying the required OpenNLP models to '{stanbol-installation}/sling/datafiles'.
+
+In addition, model files in that folder take precedence over models provided by this bundle.
Added: incubator/stanbol/trunk/data/opennlp/lang/pt/download_models.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/pt/download_models.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/pt/download_models.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/lang/pt/download_models.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,36 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project name="OpenNLP Model Download Helper" default="download" basedir=".">
+ <description>
+ Contains only a single target that is used by the Maven Ant
+ Plugin to download OpenNLP Models from the Web
+ </description>
+
+ <target name="download">
+ <copy todir="${target.directory}" flatten="true">
+ <resources>
+ <url url="${model.url}/pt-token.bin"/>
+ <url url="${model.url}/pt-sent.bin"/>
+ <url url="${model.url}/pt-pos-perceptron.bin"/>
+ <!-- No chunker model for pt (Portuguese), so this download stays disabled:
+ <url url="${model.url}/pt-chunker.bin"/>
+ -->
+ </resources>
+ </copy>
+ </target>
+</project>
\ No newline at end of file
Propchange: incubator/stanbol/trunk/data/opennlp/lang/pt/download_models.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Added: incubator/stanbol/trunk/data/opennlp/lang/pt/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/pt/pom.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/pt/pom.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/lang/pt/pom.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,122 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+ xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
+
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.parent</artifactId>
+ <version>0.9.0-incubating-SNAPSHOT</version>
+ <relativePath>../../../parent</relativePath>
+ </parent>
+
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.opennlp.lang.pt</artifactId>
+ <version>1.0.0-incubating</version>
+ <packaging>bundle</packaging>
+
+ <name>Apache Stanbol Data: OpenNLP Models for Portuguese</name>
+ <description>
+ Bundle containing all necessary/available models for parsing Portuguese language texts. This does not include models for named entity recognition (NER).
+ </description>
+ <inceptionYear>2011</inceptionYear>
+
+ <scm>
+ <connection>
+ scm:svn:http://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/lang/pt
+ </connection>
+ <developerConnection>
+ scm:svn:https://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/lang/pt
+ </developerConnection>
+ <url>http://incubator.apache.org/stanbol/</url>
+ </scm>
+ <properties>
+ <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
+ <!-- Define the resource path (opennlp.model.path) and the download home URL (opennlp.model.home) of the OpenNLP models -->
+ <opennlp.model.path>org/apache/stanbol/data/opennlp</opennlp.model.path>
+ <opennlp.model.home>http://dev.iks-project.eu/downloads/opennlp/models-1.5/</opennlp.model.home>
+ </properties>
+
+ <build>
+ <plugins>
+ <plugin>
+ <groupId>org.apache.felix</groupId>
+ <artifactId>maven-bundle-plugin</artifactId>
+ <configuration>
+ <instructions>
+ <_versionpolicy>$${version;===;${@}}</_versionpolicy>
+
+ <!--
+ Extension used to provide files in that directory to the
+ DataFileProvider
+ -->
+ <Data-Files>${opennlp.model.path}</Data-Files>
+ <!--
+ Use a priority lower than 0 to allow providers without a
+ defined ranking to override this default data.
+ -->
+ <Data-Files-Priority>
+ -100
+ </Data-Files-Priority>
+ </instructions>
+ </configuration>
+ </plugin>
+ <plugin>
+ <!--
+ Ant is used to download the models from the location
+ configured by the opennlp.model.home property.
+ -->
+ <groupId>org.apache.maven.plugins</groupId>
+ <artifactId>maven-antrun-plugin</artifactId>
+ <executions>
+ <execution>
+ <id>compile</id>
+ <phase>compile</phase>
+ <configuration>
+ <!--
+ TODO: I would like to add an "unless" constraint to the
+ target that prevents execution if Maven operates in offline
+ mode. However, I was not able to find out how to obtain this
+ information. ${settings.offline} (as noted by several
+ resources) does not work.
+ Until this is fixed, builds will fail if no internet connection
+ is available!
+ -->
+ <target>
+ <property name="target.directory" value="${project.basedir}/src/main/resources/${opennlp.model.path}"/>
+ <property name="model.url" value="${opennlp.model.home}"/>
+
+ <echo message="copy OpenNLP models"/>
+ <echo message=" FROM ${model.url} "/>
+ <echo message=" TO ${target.directory}"/>
+
+ <ant antfile="${basedir}/download_models.xml">
+ <target name="download"/>
+ </ant>
+ </target>
+ </configuration>
+ <goals>
+ <goal>run</goal>
+ </goals>
+ </execution>
+ </executions>
+ </plugin>
+ </plugins>
+ </build>
+</project>
Propchange: incubator/stanbol/trunk/data/opennlp/lang/pt/pom.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Propchange: incubator/stanbol/trunk/data/opennlp/lang/pt/src/main/resources/org/apache/stanbol/data/opennlp/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,5 @@
+pt-token.bin
+
+pt-pos-perceptron.bin
+
+pt-sent.bin
Propchange: incubator/stanbol/trunk/data/opennlp/lang/pt/target/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,15 @@
+antrun
+
+classes
+
+surefire
+
+org.apache.stanbol.data.opennlp.lang.pt-1.0.0-incubating-sources.jar
+
+maven-shared-archive-resources
+
+test-classes
+
+.plxarc
+
+org.apache.stanbol.data.opennlp.lang.pt-1.0.0-incubating.jar
Added: incubator/stanbol/trunk/data/opennlp/lang/se/README.md
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/se/README.md?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/se/README.md (added)
+++ incubator/stanbol/trunk/data/opennlp/lang/se/README.md Thu Sep 22 06:51:30 2011
@@ -0,0 +1,21 @@
+# Data files Bundles for OpenNLP
+
+This source repository only holds the pom.xml file and folder structure of this bundle.
+
+To avoid loading the Subversion repository with large binary files, this artifact has to be built and deployed manually; the build retrieves the precomputed models from other sites.
+
+
+## Downloading the OpenNLP statistical model
+
+The OpenNLP models are downloaded from
+
+ http://opennlp.sourceforge.net/models-1.5
+
+This URL is defined as a property in the 'pom.xml'.
+The list of downloaded files is defined within the 'download_models.xml'.
+
+## NOTE
+
+Using this bundle is only an alternative to manually copying the required OpenNLP models to '{stanbol-installation}/sling/datafiles'.
+
+In addition, model files in that folder take precedence over models provided by this bundle.
Added: incubator/stanbol/trunk/data/opennlp/lang/se/download_models.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/se/download_models.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/se/download_models.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/lang/se/download_models.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,36 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project name="OpenNLP Model Download Helper" default="download" basedir=".">
+ <description>
+ Contains only a single target that is used by the Maven Ant
+ Plugin to download OpenNLP Models from the Web
+ </description>
+
+ <target name="download">
+ <copy todir="${target.directory}" flatten="true">
+ <resources>
+ <url url="${model.url}/se-token.bin"/>
+ <url url="${model.url}/se-sent.bin"/>
+ <url url="${model.url}/se-pos-perceptron.bin"/>
+ <!-- No chunker model for se (Swedish), so this download stays disabled:
+ <url url="${model.url}/se-chunker.bin"/>
+ -->
+ </resources>
+ </copy>
+ </target>
+</project>
\ No newline at end of file
Propchange: incubator/stanbol/trunk/data/opennlp/lang/se/download_models.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Added: incubator/stanbol/trunk/data/opennlp/lang/se/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/lang/se/pom.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/lang/se/pom.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/lang/se/pom.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,122 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+ xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
+
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.parent</artifactId>
+ <version>0.9.0-incubating-SNAPSHOT</version>
+ <relativePath>../../../parent</relativePath>
+ </parent>
+
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.opennlp.lang.se</artifactId>
+ <version>1.0.0-incubating</version>
+ <packaging>bundle</packaging>
+
+ <name>Apache Stanbol Data: OpenNLP Models for Swedish</name>
+ <description>
+ Bundle containing all necessary/available models for parsing Swedish language texts. This does not include models for named entity recognition (NER).
+ </description>
+ <inceptionYear>2011</inceptionYear>
+
+ <scm>
+ <connection>
+ scm:svn:http://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/lang/se
+ </connection>
+ <developerConnection>
+ scm:svn:https://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/lang/se
+ </developerConnection>
+ <url>http://incubator.apache.org/stanbol/</url>
+ </scm>
+ <properties>
+ <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
+ <!-- Path (below src/main/resources) the OpenNLP models are copied to, and base URL they are downloaded from. No trailing '/': download_models.xml appends '/' plus the file name. -->
+ <opennlp.model.path>org/apache/stanbol/data/opennlp</opennlp.model.path>
+ <opennlp.model.home>http://dev.iks-project.eu/downloads/opennlp/models-1.5</opennlp.model.home>
+ </properties>
+
+ <build>
+ <plugins>
+ <plugin>
+ <groupId>org.apache.felix</groupId>
+ <artifactId>maven-bundle-plugin</artifactId>
+ <configuration>
+ <instructions>
+ <_versionpolicy>$${version;===;${@}}</_versionpolicy>
+
+ <!--
+ Extension used to provide files in that directory to the
+ DataFileProvider
+ -->
+ <Data-Files>${opennlp.model.path}</Data-Files>
+ <!--
+ Use a priority lower than 0 to allow providers without a
+ defined ranking to override this default data.
+ -->
+ <Data-Files-Priority>
+ -100
+ </Data-Files-Priority>
+ </instructions>
+ </configuration>
+ </plugin>
+ <plugin>
+ <!--
+ Ant is used to download the models from the URL defined by
+ the opennlp.model.home property (see download_models.xml).
+ -->
+ <groupId>org.apache.maven.plugins</groupId>
+ <artifactId>maven-antrun-plugin</artifactId>
+ <executions>
+ <execution>
+ <id>compile</id>
+ <phase>compile</phase>
+ <configuration>
+ <!--
+ TODO: I would like to add an "unless" constraint to the
+ target that prevents execution if Maven operates in offline
+ mode. However I was not able to find out how to obtain this
+ information. ${settings.offline} (as noted by several
+ resources) does not work.
+ Until this is fixed, builds will fail if no internet connection
+ is available!
+ -->
+ <target>
+ <property name="target.directory" value="${project.basedir}/src/main/resources/${opennlp.model.path}"/>
+ <property name="model.url" value="${opennlp.model.home}"/>
+
+ <echo message="copy OpenNLP models"/>
+ <echo message=" FROM ${model.url} "/>
+ <echo message=" TO ${target.directory}"/>
+
+ <ant antfile="${basedir}/download_models.xml">
+ <target name="download"/>
+ </ant>
+ </target>
+ </configuration>
+ <goals>
+ <goal>run</goal>
+ </goals>
+ </execution>
+ </executions>
+ </plugin>
+ </plugins>
+ </build>
+</project>
Propchange: incubator/stanbol/trunk/data/opennlp/lang/se/pom.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Propchange: incubator/stanbol/trunk/data/opennlp/lang/se/src/main/resources/org/apache/stanbol/data/opennlp/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,5 @@
+se-pos-perceptron.bin
+
+se-token.bin
+
+se-sent.bin
Propchange: incubator/stanbol/trunk/data/opennlp/lang/se/target/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,15 @@
+maven-shared-archive-resources
+
+org.apache.stanbol.data.opennlp.lang.se-1.0.0-incubating.jar
+
+test-classes
+
+surefire
+
+.plxarc
+
+classes
+
+org.apache.stanbol.data.opennlp.lang.se-1.0.0-incubating-sources.jar
+
+antrun
Added: incubator/stanbol/trunk/data/opennlp/ner/es/README.md
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/ner/es/README.md?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/ner/es/README.md (added)
+++ incubator/stanbol/trunk/data/opennlp/ner/es/README.md Thu Sep 22 06:51:30 2011
@@ -0,0 +1,21 @@
+# Data files Bundles for OpenNLP
+
+This source repository only holds the pom.xml file and folder structure of this bundle.
+
+To avoid loading the subversion repository with large binary files, this artifact has to be built and deployed manually to retrieve precomputed models from other sites.
+
+
+## Downloading the OpenNLP statistical model
+
+The OpenNLP models are downloaded from
+
+ http://dev.iks-project.eu/downloads/opennlp/models-1.5
+
+This URL is defined as the 'opennlp.model.home' property in the 'pom.xml'.
+The list of downloaded files is defined within the 'download_models.xml'.
+
+## NOTE
+
+Using this bundle is only an alternative to manually copying the required OpenNLP models to the '{stanbol-installation}/sling/datafiles' folder.
+
+In addition, model files in this folder take precedence over models provided by this bundle.
Added: incubator/stanbol/trunk/data/opennlp/ner/es/download_models.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/ner/es/download_models.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/ner/es/download_models.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/ner/es/download_models.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,33 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project name="OpenNLP Model Download Helper" default="download" basedir=".">
+ <description>
+ Contains only a single target that is used by the Maven Ant
+ Plugin to download OpenNLP Models from the Web
+ </description>
+
+ <target name="download">
+ <copy todir="${target.directory}" flatten="true">
+ <resources>
+ <url url="${model.url}/es-ner-person.bin"/>
+ <url url="${model.url}/es-ner-location.bin"/>
+ <url url="${model.url}/es-ner-organization.bin"/>
+ </resources>
+ </copy>
+ </target>
+</project>
\ No newline at end of file
Propchange: incubator/stanbol/trunk/data/opennlp/ner/es/download_models.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Added: incubator/stanbol/trunk/data/opennlp/ner/es/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/ner/es/pom.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/ner/es/pom.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/ner/es/pom.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,123 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+ xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
+
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.parent</artifactId>
+ <version>0.9.0-incubating-SNAPSHOT</version>
+ <relativePath>../../../parent</relativePath>
+ </parent>
+
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.opennlp.ner.es</artifactId>
+ <version>1.0.0-incubating</version>
+ <packaging>bundle</packaging>
+
+ <name>Apache Stanbol Data: OpenNLP NER Models for Spanish</name>
+ <description>
+ Bundle containing the NER models for finding Persons, Organizations
+ and Places for Spanish language texts.
+ </description>
+ <inceptionYear>2011</inceptionYear>
+
+ <scm>
+ <connection>
+ scm:svn:http://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/ner/es
+ </connection>
+ <developerConnection>
+ scm:svn:https://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/ner/es
+ </developerConnection>
+ <url>http://incubator.apache.org/stanbol/</url>
+ </scm>
+ <properties>
+ <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
+ <!-- Path (below src/main/resources) the OpenNLP models are copied to, and base URL they are downloaded from. No trailing '/': download_models.xml appends '/' plus the file name. -->
+ <opennlp.model.path>org/apache/stanbol/data/opennlp</opennlp.model.path>
+ <opennlp.model.home>http://dev.iks-project.eu/downloads/opennlp/models-1.5</opennlp.model.home>
+ </properties>
+
+ <build>
+ <plugins>
+ <plugin>
+ <groupId>org.apache.felix</groupId>
+ <artifactId>maven-bundle-plugin</artifactId>
+ <configuration>
+ <instructions>
+ <_versionpolicy>$${version;===;${@}}</_versionpolicy>
+
+ <!--
+ Extension used to provide files in that directory to the
+ DataFileProvider
+ -->
+ <Data-Files>${opennlp.model.path}</Data-Files>
+ <!--
+ Use a priority lower than 0 to allow providers without a
+ defined ranking to override this default data.
+ -->
+ <Data-Files-Priority>
+ -100
+ </Data-Files-Priority>
+ </instructions>
+ </configuration>
+ </plugin>
+ <plugin>
+ <!--
+ Ant is used to download the models from the URL defined by
+ the opennlp.model.home property (see download_models.xml).
+ -->
+ <groupId>org.apache.maven.plugins</groupId>
+ <artifactId>maven-antrun-plugin</artifactId>
+ <executions>
+ <execution>
+ <id>compile</id>
+ <phase>compile</phase>
+ <configuration>
+ <!--
+ TODO: I would like to add an "unless" constraint to the
+ target that prevents execution if Maven operates in offline
+ mode. However I was not able to find out how to obtain this
+ information. ${settings.offline} (as noted by several
+ resources) does not work.
+ Until this is fixed, builds will fail if no internet connection
+ is available!
+ -->
+ <target>
+ <property name="target.directory" value="${project.basedir}/src/main/resources/${opennlp.model.path}"/>
+ <property name="model.url" value="${opennlp.model.home}"/>
+
+ <echo message="copy OpenNLP models"/>
+ <echo message=" FROM ${model.url} "/>
+ <echo message=" TO ${target.directory}"/>
+
+ <ant antfile="${basedir}/download_models.xml">
+ <target name="download"/>
+ </ant>
+ </target>
+ </configuration>
+ <goals>
+ <goal>run</goal>
+ </goals>
+ </execution>
+ </executions>
+ </plugin>
+ </plugins>
+ </build>
+</project>
Propchange: incubator/stanbol/trunk/data/opennlp/ner/es/pom.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Propchange: incubator/stanbol/trunk/data/opennlp/ner/es/src/main/resources/org/apache/stanbol/data/opennlp/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,5 @@
+es-ner-person.bin
+
+es-ner-organization.bin
+
+es-ner-location.bin
Propchange: incubator/stanbol/trunk/data/opennlp/ner/es/target/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,15 @@
+surefire
+
+antrun
+
+classes
+
+maven-shared-archive-resources
+
+test-classes
+
+org.apache.stanbol.data.opennlp.ner.es-1.0.0-incubating.jar
+
+org.apache.stanbol.data.opennlp.ner.es-1.0.0-incubating-sources.jar
+
+.plxarc
Added: incubator/stanbol/trunk/data/opennlp/ner/nl/README.md
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/ner/nl/README.md?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/ner/nl/README.md (added)
+++ incubator/stanbol/trunk/data/opennlp/ner/nl/README.md Thu Sep 22 06:51:30 2011
@@ -0,0 +1,21 @@
+# Data files Bundles for OpenNLP
+
+This source repository only holds the pom.xml file and folder structure of this bundle.
+
+To avoid loading the subversion repository with large binary files, this artifact has to be built and deployed manually to retrieve precomputed models from other sites.
+
+
+## Downloading the OpenNLP statistical model
+
+The OpenNLP models are downloaded from
+
+ http://dev.iks-project.eu/downloads/opennlp/models-1.5
+
+This URL is defined as the 'opennlp.model.home' property in the 'pom.xml'.
+The list of downloaded files is defined within the 'download_models.xml'.
+
+## NOTE
+
+Using this bundle is only an alternative to manually copying the required OpenNLP models to the '{stanbol-installation}/sling/datafiles' folder.
+
+In addition, model files in this folder take precedence over models provided by this bundle.
Added: incubator/stanbol/trunk/data/opennlp/ner/nl/download_models.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/ner/nl/download_models.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/ner/nl/download_models.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/ner/nl/download_models.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,33 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project name="OpenNLP Model Download Helper" default="download" basedir=".">
+ <description>
+ Contains only a single target that is used by the Maven Ant
+ Plugin to download OpenNLP Models from the Web
+ </description>
+
+ <target name="download">
+ <copy todir="${target.directory}" flatten="true">
+ <resources>
+ <url url="${model.url}/nl-ner-person.bin"/>
+ <url url="${model.url}/nl-ner-location.bin"/>
+ <url url="${model.url}/nl-ner-organization.bin"/>
+ </resources>
+ </copy>
+ </target>
+</project>
\ No newline at end of file
Propchange: incubator/stanbol/trunk/data/opennlp/ner/nl/download_models.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Added: incubator/stanbol/trunk/data/opennlp/ner/nl/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/opennlp/ner/nl/pom.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/data/opennlp/ner/nl/pom.xml (added)
+++ incubator/stanbol/trunk/data/opennlp/ner/nl/pom.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,123 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+ xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
+
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.parent</artifactId>
+ <version>0.9.0-incubating-SNAPSHOT</version>
+ <relativePath>../../../parent</relativePath>
+ </parent>
+
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.opennlp.ner.nl</artifactId>
+ <version>1.0.0-incubating</version>
+ <packaging>bundle</packaging>
+
+ <name>Apache Stanbol Data: OpenNLP NER Models for Dutch</name>
+ <description>
+ Bundle containing the NER models for finding Persons, Organizations
+ and Places for Dutch language texts.
+ </description>
+ <inceptionYear>2011</inceptionYear>
+
+ <scm>
+ <connection>
+ scm:svn:http://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/ner/nl
+ </connection>
+ <developerConnection>
+ scm:svn:https://svn.apache.org/repos/asf/incubator/stanbol/trunk/data/opennlp/ner/nl
+ </developerConnection>
+ <url>http://incubator.apache.org/stanbol/</url>
+ </scm>
+ <properties>
+ <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
+ <!-- Path (below src/main/resources) the OpenNLP models are copied to, and base URL they are downloaded from. No trailing '/': download_models.xml appends '/' plus the file name. -->
+ <opennlp.model.path>org/apache/stanbol/data/opennlp</opennlp.model.path>
+ <opennlp.model.home>http://dev.iks-project.eu/downloads/opennlp/models-1.5</opennlp.model.home>
+ </properties>
+
+ <build>
+ <plugins>
+ <plugin>
+ <groupId>org.apache.felix</groupId>
+ <artifactId>maven-bundle-plugin</artifactId>
+ <configuration>
+ <instructions>
+ <_versionpolicy>$${version;===;${@}}</_versionpolicy>
+
+ <!--
+ Extension used to provide files in that directory to the
+ DataFileProvider
+ -->
+ <Data-Files>${opennlp.model.path}</Data-Files>
+ <!--
+ Use a priority lower than 0 to allow providers without a
+ defined ranking to override this default data.
+ -->
+ <Data-Files-Priority>
+ -100
+ </Data-Files-Priority>
+ </instructions>
+ </configuration>
+ </plugin>
+ <plugin>
+ <!--
+ Ant is used to download the models from the URL defined by
+ the opennlp.model.home property (see download_models.xml).
+ -->
+ <groupId>org.apache.maven.plugins</groupId>
+ <artifactId>maven-antrun-plugin</artifactId>
+ <executions>
+ <execution>
+ <id>compile</id>
+ <phase>compile</phase>
+ <configuration>
+ <!--
+ TODO: I would like to add an "unless" constraint to the
+ target that prevents execution if Maven operates in offline
+ mode. However I was not able to find out how to obtain this
+ information. ${settings.offline} (as noted by several
+ resources) does not work.
+ Until this is fixed, builds will fail if no internet connection
+ is available!
+ -->
+ <target>
+ <property name="target.directory" value="${project.basedir}/src/main/resources/${opennlp.model.path}"/>
+ <property name="model.url" value="${opennlp.model.home}"/>
+
+ <echo message="copy OpenNLP models"/>
+ <echo message=" FROM ${model.url} "/>
+ <echo message=" TO ${target.directory}"/>
+
+ <ant antfile="${basedir}/download_models.xml">
+ <target name="download"/>
+ </ant>
+ </target>
+ </configuration>
+ <goals>
+ <goal>run</goal>
+ </goals>
+ </execution>
+ </executions>
+ </plugin>
+ </plugins>
+ </build>
+</project>
Propchange: incubator/stanbol/trunk/data/opennlp/ner/nl/pom.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain
Propchange: incubator/stanbol/trunk/data/opennlp/ner/nl/src/main/resources/org/apache/stanbol/data/opennlp/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,5 @@
+nl-ner-location.bin
+
+nl-ner-person.bin
+
+nl-ner-organization.bin
Propchange: incubator/stanbol/trunk/data/opennlp/ner/nl/target/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,15 @@
+org.apache.stanbol.data.opennlp.ner.nl-1.0.0-incubating.jar
+
+classes
+
+org.apache.stanbol.data.opennlp.ner.nl-1.0.0-incubating-sources.jar
+
+maven-shared-archive-resources
+
+surefire
+
+test-classes
+
+antrun
+
+.plxarc
Propchange: incubator/stanbol/trunk/data/parent/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1 @@
+target
Modified: incubator/stanbol/trunk/data/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/pom.xml?rev=1173968&r1=1173967&r2=1173968&view=diff
==============================================================================
--- incubator/stanbol/trunk/data/pom.xml (original)
+++ incubator/stanbol/trunk/data/pom.xml Thu Sep 22 06:51:30 2011
@@ -15,22 +15,16 @@
See the License for the specific language governing permissions and
limitations under the License.
-->
-<project>
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+ xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
<modelVersion>4.0.0</modelVersion>
- <parent>
- <groupId>org.apache.stanbol</groupId>
- <artifactId>org.apache.stanbol.data.parent</artifactId>
- <version>0.9.0-incubating-SNAPSHOT</version>
- <relativePath>parent</relativePath>
- </parent>
-
<groupId>org.apache.stanbol</groupId>
<artifactId>org.apache.stanbol.data.reactor</artifactId>
<version>0.9.0-incubating-SNAPSHOT</version>
<packaging>pom</packaging>
- <name>Apache Stanbol Data Reactor</name>
+ <name>Apache Stanbol Data reactor</name>
<scm>
<connection>
scm:svn:http://svn.apache.org/repos/asf/incubator/stanbol/trunk/data
@@ -40,11 +34,13 @@
</developerConnection>
<url>http://incubator.apache.org/stanbol/</url>
</scm>
-
+ <modules>
+ <module>parent</module>
+ </modules>
<profiles>
<profile>
<!--
- Provile that includes all the data modules used as default data
+ Profile that includes all the data modules used as default data
within the Stanbol Launchers.
This profile is activated by default because this bundles are
@@ -78,5 +74,25 @@
<module>sites/dbpediacached</module>
</modules>
</profile>
+ <profile>
+ <!--
+ Profile including all OpenNLP language and NER modules
+ -->
+ <id>opennlp</id>
+ <activation>
+ <activeByDefault>false</activeByDefault>
+ </activation>
+ <modules>
+ <module>opennlp/lang/da</module>
+ <module>opennlp/lang/de</module>
+ <module>opennlp/lang/en</module>
+ <module>opennlp/lang/nl</module>
+ <module>opennlp/lang/pt</module>
+ <module>opennlp/lang/se</module>
+ <module>opennlp/ner/en</module>
+ <module>opennlp/ner/es</module>
+ <module>opennlp/ner/nl</module>
+ </modules>
+ </profile>
</profiles>
</project>
Modified: incubator/stanbol/trunk/data/sites/dbpediadefault/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/sites/dbpediadefault/pom.xml?rev=1173968&r1=1173967&r2=1173968&view=diff
==============================================================================
--- incubator/stanbol/trunk/data/sites/dbpediadefault/pom.xml (original)
+++ incubator/stanbol/trunk/data/sites/dbpediadefault/pom.xml Thu Sep 22 06:51:30 2011
@@ -29,7 +29,7 @@
<groupId>org.apache.stanbol</groupId>
<artifactId>org.apache.stanbol.data.sites.dbpedia.default</artifactId>
- <version>1.0.1-incubating</version>
+ <version>1.0.2-incubating</version>
<packaging>bundle</packaging>
<name>Apache Stanbol Data: DBpedia.org defaultdata version</name>
Modified: incubator/stanbol/trunk/data/sites/geonames/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/data/sites/geonames/pom.xml?rev=1173968&r1=1173967&r2=1173968&view=diff
==============================================================================
--- incubator/stanbol/trunk/data/sites/geonames/pom.xml (original)
+++ incubator/stanbol/trunk/data/sites/geonames/pom.xml Thu Sep 22 06:51:30 2011
@@ -76,7 +76,7 @@
</Install-Path>
<_versionpolicy>$${version;===;${@}}</_versionpolicy>
<Export-Package>
- org.apache.stanbol.data.site.geonames.*;version="${pom.version}"
+ org.apache.stanbol.data.site.geonames.*;version="${project.version}"
</Export-Package>
</instructions>
</configuration>
Modified: incubator/stanbol/trunk/enhancer/clerezza/clerezza-sparql/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/enhancer/clerezza/clerezza-sparql/pom.xml?rev=1173968&r1=1173967&r2=1173968&view=diff
==============================================================================
--- incubator/stanbol/trunk/enhancer/clerezza/clerezza-sparql/pom.xml (original)
+++ incubator/stanbol/trunk/enhancer/clerezza/clerezza-sparql/pom.xml Thu Sep 22 06:51:30 2011
@@ -53,7 +53,7 @@
<configuration>
<instructions>
<Private-Package>
- org.apache.stanbol.enhancer.clerezza.sparql.*;version=${pom.version}
+ org.apache.stanbol.enhancer.clerezza.sparql.*;version=${project.version}
</Private-Package>
</instructions>
</configuration>
Modified: incubator/stanbol/trunk/enhancer/clerezza/org.apache.stanbol.enhancer.clerezza/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/enhancer/clerezza/org.apache.stanbol.enhancer.clerezza/pom.xml?rev=1173968&r1=1173967&r2=1173968&view=diff
==============================================================================
--- incubator/stanbol/trunk/enhancer/clerezza/org.apache.stanbol.enhancer.clerezza/pom.xml (original)
+++ incubator/stanbol/trunk/enhancer/clerezza/org.apache.stanbol.enhancer.clerezza/pom.xml Thu Sep 22 06:51:30 2011
@@ -50,7 +50,7 @@
<configuration>
<instructions>
<Export-Package>
- org.apache.stanbol.enhancer.bundle;version=${pom.version}
+ org.apache.stanbol.enhancer.bundle;version=${project.version}
</Export-Package>
</instructions>
</configuration>
Modified: incubator/stanbol/trunk/enhancer/engines/autotagging/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/enhancer/engines/autotagging/pom.xml?rev=1173968&r1=1173967&r2=1173968&view=diff
==============================================================================
--- incubator/stanbol/trunk/enhancer/engines/autotagging/pom.xml (original)
+++ incubator/stanbol/trunk/enhancer/engines/autotagging/pom.xml Thu Sep 22 06:51:30 2011
@@ -58,15 +58,15 @@
<configuration>
<instructions>
<Export-Package>
- org.apache.stanbol.enhancer.engines.autotagging;version=${pom.version},
- org.apache.stanbol.autotagging;version="${pom.version}",
+ org.apache.stanbol.enhancer.engines.autotagging;version=${project.version},
+ org.apache.stanbol.autotagging;version="${project.version}",
org.apache.lucene.*,
opennlp.english.namefind,
opennlp.english.sentdetect,
dbpedia
</Export-Package>
<Private-Package>
- org.apache.stanbol.enhancer.engines.autotagging.impl.*
+ org.apache.stanbol.enhancer.engines.autotagging.impl.*;version=${project.version}
</Private-Package>
<!-- TODO those should be bundles! -->
<Embed-Dependency>
Propchange: incubator/stanbol/trunk/enhancer/engines/entitydisambiguation/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1 @@
+target
Modified: incubator/stanbol/trunk/enhancer/engines/entitytagging/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/enhancer/engines/entitytagging/pom.xml?rev=1173968&r1=1173967&r2=1173968&view=diff
==============================================================================
--- incubator/stanbol/trunk/enhancer/engines/entitytagging/pom.xml (original)
+++ incubator/stanbol/trunk/enhancer/engines/entitytagging/pom.xml Thu Sep 22 06:51:30 2011
@@ -60,7 +60,7 @@
<configuration>
<instructions>
<Export-Package>
- org.apache.stanbol.enhancer.engines.entitytagging;version=${pom.version}
+ org.apache.stanbol.enhancer.engines.entitytagging;version=${project.version}
</Export-Package>
<Private-Package>
org.apache.stanbol.enhancer.engines.entitytagging.impl.*
Modified: incubator/stanbol/trunk/enhancer/engines/geonames/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/enhancer/engines/geonames/pom.xml?rev=1173968&r1=1173967&r2=1173968&view=diff
==============================================================================
--- incubator/stanbol/trunk/enhancer/engines/geonames/pom.xml (original)
+++ incubator/stanbol/trunk/enhancer/engines/geonames/pom.xml Thu Sep 22 06:51:30 2011
@@ -58,10 +58,10 @@
<configuration>
<instructions>
<Export-Package>
- org.apache.stanbol.enhancer.engines.geonames;version=${pom.version},
+ org.apache.stanbol.enhancer.engines.geonames;version=${project.version}
</Export-Package>
<Private-Package>
- org.apache.stanbol.enhancer.engines.geonames.impl.*,
+ org.apache.stanbol.enhancer.engines.geonames.impl.*;version=${project.version}
</Private-Package>
</instructions>
</configuration>
Propchange: incubator/stanbol/trunk/enhancer/engines/keywordextraction/
------------------------------------------------------------------------------
--- svn:ignore (added)
+++ svn:ignore Thu Sep 22 06:51:30 2011
@@ -0,0 +1,7 @@
+target
+
+.settings
+
+.project
+
+.classpath
Added: incubator/stanbol/trunk/enhancer/engines/keywordextraction/pom.xml
URL: http://svn.apache.org/viewvc/incubator/stanbol/trunk/enhancer/engines/keywordextraction/pom.xml?rev=1173968&view=auto
==============================================================================
--- incubator/stanbol/trunk/enhancer/engines/keywordextraction/pom.xml (added)
+++ incubator/stanbol/trunk/enhancer/engines/keywordextraction/pom.xml Thu Sep 22 06:51:30 2011
@@ -0,0 +1,155 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+ xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
+
+ <modelVersion>4.0.0</modelVersion>
+
+ <parent>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.enhancer.parent</artifactId>
+ <version>0.9.0-incubating-SNAPSHOT</version>
+ <relativePath>../../parent</relativePath>
+ </parent>
+
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.enhancer.engine.keywordextraction</artifactId>
+ <packaging>bundle</packaging>
+
+ <name>Apache Stanbol Enhancer Enhancement Engine and utilities for extracting keywords from parsed text.</name>
+ <description>
+ Implementation of Utilities and an Engine to extract keywords defined in
+ a controlled vocabulary from a parsed text.
+ This also provides default implementation to use OpenNLP to parse the
+ text and the Entityhub to search for Entities.
+ </description>
+
+ <inceptionYear>2011</inceptionYear>
+
+ <scm>
+ <connection>
+ scm:svn:http://svn.apache.org/repos/asf/incubator/stanbol/trunk/enhancer/engines/keywordextraction/
+ </connection>
+ <developerConnection>
+ scm:svn:https://svn.apache.org/repos/asf/incubator/stanbol/trunk/enhancer/engines/keywordextraction/
+ </developerConnection>
+ <url>http://incubator.apache.org/stanbol/</url>
+ </scm>
+
+ <build>
+ <plugins>
+ <plugin>
+ <groupId>org.apache.felix</groupId>
+ <artifactId>maven-bundle-plugin</artifactId>
+ <extensions>true</extensions>
+ <configuration>
+ <instructions> <!-- exported packages carry the bundle version; the list must not end with a comma, and Private-Package takes bare package names -->
+ <Export-Package>
+ org.apache.stanbol.enhancer.engines.keywordextraction.linking;version=${project.version},
+ org.apache.stanbol.enhancer.engines.keywordextraction.linking.impl;version=${project.version},
+ org.apache.stanbol.enhancer.engines.keywordextraction.engine;version=${project.version}
+ </Export-Package>
+ <Private-Package>
+ org.apache.stanbol.enhancer.engines.keywordextraction.impl
+ </Private-Package>
+ </instructions>
+ </configuration>
+ </plugin>
+ <plugin>
+ <groupId>org.apache.felix</groupId>
+ <artifactId>maven-scr-plugin</artifactId>
+ </plugin>
+ </plugins>
+ </build>
+
+ <dependencies>
+ <dependency>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.enhancer.servicesapi</artifactId>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.commons.stanboltools.offline</artifactId>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.entityhub.servicesapi</artifactId>
+ <scope>compile</scope>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.entityhub.model.clerezza</artifactId>
+ <scope>compile</scope>
+ </dependency>
+ <!-- Stanbol Commons OpenNLP module -->
+ <dependency>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.commons.opennlp</artifactId>
+ </dependency>
+ <!-- Apache Commons utility libraries -->
+ <dependency>
+ <groupId>commons-io</groupId>
+ <artifactId>commons-io</artifactId>
+ </dependency>
+ <dependency>
+ <groupId>commons-lang</groupId>
+ <artifactId>commons-lang</artifactId>
+ </dependency>
+ <!-- Felix SCR annotations, Clerezza RDF core and the SLF4J API -->
+ <dependency>
+ <groupId>org.apache.felix</groupId>
+ <artifactId>org.apache.felix.scr.annotations</artifactId>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.clerezza</groupId>
+ <artifactId>rdf.core</artifactId>
+ </dependency>
+ <dependency>
+ <groupId>org.slf4j</groupId>
+ <artifactId>slf4j-api</artifactId>
+ </dependency>
+
+ <!-- Testing: every dependency below is declared with test scope -->
+ <dependency>
+ <groupId>junit</groupId>
+ <artifactId>junit</artifactId>
+ <scope>test</scope>
+ </dependency>
+ <dependency>
+ <groupId>org.slf4j</groupId>
+ <artifactId>slf4j-simple</artifactId>
+ <scope>test</scope>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.commons.stanboltools.datafileprovider</artifactId>
+ <scope>test</scope>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.entityhub.core</artifactId>
+ <scope>test</scope>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.stanbol</groupId>
+ <artifactId>org.apache.stanbol.data.opennlp.lang.en</artifactId>
+ <scope>test</scope>
+ </dependency>
+ </dependencies>
+
+</project>
Propchange: incubator/stanbol/trunk/enhancer/engines/keywordextraction/pom.xml
------------------------------------------------------------------------------
svn:mime-type = text/plain