You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@stanbol.apache.org by rw...@apache.org on 2013/10/09 15:11:40 UTC

svn commit: r1530593 - in /stanbol/trunk/entityhub/indexing: dbpedia/src/main/resources/indexing/config/ freebase/src/main/resources/ freebase/src/main/resources/indexing/config/ genericrdf/src/main/resources/indexing/config/ geonames/src/main/resource...

Author: rwesten
Date: Wed Oct  9 13:11:40 2013
New Revision: 1530593

URL: http://svn.apache.org/r1530593
Log:
STANBOL-1167: added FST model builder to default configs

Added:
    stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/fst.config
    stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/fst.config
    stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/fst.config
    stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/fst.config
Modified:
    stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/indexing.properties
    stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/indexing.properties
    stanbol/trunk/entityhub/indexing/freebase/src/main/resources/log4j.properties
    stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/indexing.properties
    stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/indexing.properties

Added: stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/fst.config
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/fst.config?rev=1530593&view=auto
==============================================================================
--- stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/fst.config (added)
+++ stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/fst.config Wed Oct  9 13:11:40 2013
@@ -0,0 +1,18 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+#Syntax
+#index={indexField};[store={storeField}]
+index=rdfs:label
\ No newline at end of file

Modified: stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/indexing.properties
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/indexing.properties?rev=1530593&r1=1530592&r2=1530593&view=diff
==============================================================================
--- stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/indexing.properties (original)
+++ stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/indexing.properties Wed Oct  9 13:11:40 2013
@@ -47,8 +47,10 @@ entityProcessor=org.apache.stanbol.entit
 fieldConfiguration=mappings.txt
 
 # Finally we need a destination to store the data
-# Note also the configured fieldboosts.properties
-indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,solrConf,boosts:fieldboosts
+# Note also 
+# * the configured fieldboosts.properties
+# * the configured fst.config
+indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,solrConf,boosts:fieldboosts,fstConf:fst.config
 
 
 # Additional Properties directly added to the configuration of the

Added: stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/fst.config
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/fst.config?rev=1530593&view=auto
==============================================================================
--- stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/fst.config (added)
+++ stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/fst.config Wed Oct  9 13:11:40 2013
@@ -0,0 +1,18 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+#Syntax
+#index={indexField};[store={storeField}]
+index=rdfs:label
\ No newline at end of file

Modified: stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/indexing.properties
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/indexing.properties?rev=1530593&r1=1530592&r2=1530593&view=diff
==============================================================================
--- stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/indexing.properties (original)
+++ stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/indexing.properties Wed Oct  9 13:11:40 2013
@@ -52,7 +52,7 @@ fieldConfiguration=mappings.txt
 
 # Finally we need a destination to store the data
 # Note also the configured fieldboosts.properties
-indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,solrConf,boosts:fieldboosts
+indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,solrConf,boosts:fieldboosts,fstConf:fst.config
 
 
 # Additional Properties directly added to the configuration of the

Modified: stanbol/trunk/entityhub/indexing/freebase/src/main/resources/log4j.properties
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/freebase/src/main/resources/log4j.properties?rev=1530593&r1=1530592&r2=1530593&view=diff
==============================================================================
--- stanbol/trunk/entityhub/indexing/freebase/src/main/resources/log4j.properties (original)
+++ stanbol/trunk/entityhub/indexing/freebase/src/main/resources/log4j.properties Wed Oct  9 13:11:40 2013
@@ -24,4 +24,6 @@ log4j.appender.A1.layout.ConversionPatte
 # however log also INFO messages of the indexing components
 log4j.logger.org.apache.stanbol.entityhub.indexing=INFO
 # for loggings during importing RDF data
-log4j.logger.com.hp.hpl.jena=INFO
\ No newline at end of file
+log4j.logger.com.hp.hpl.jena=INFO
+# do not show warnings for building FST models
+log4j.logger.org.opensextant.solrtexttagger=ERROR
\ No newline at end of file

Added: stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/fst.config
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/fst.config?rev=1530593&view=auto
==============================================================================
--- stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/fst.config (added)
+++ stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/fst.config Wed Oct  9 13:11:40 2013
@@ -0,0 +1,18 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+#Syntax
+#index={indexField};[store={storeField}]
+index=rdfs:label
\ No newline at end of file

Modified: stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/indexing.properties
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/indexing.properties?rev=1530593&r1=1530592&r2=1530593&view=diff
==============================================================================
--- stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/indexing.properties (original)
+++ stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/indexing.properties Wed Oct  9 13:11:40 2013
@@ -233,7 +233,8 @@ fieldConfiguration=mappings.txt
 # A SolrYard is used as destination for indexing
 # To boost some fields (typically labels) one can use the fieldboosts.properties
 # A default field boost configuration is provided.
-indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,boosts:fieldboosts
+# A default fst.config is also provided (see STANBOL-1167)
+indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,boosts:fieldboosts,fstConf:fst.config
 
 
 # ------------

Added: stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/fst.config
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/fst.config?rev=1530593&view=auto
==============================================================================
--- stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/fst.config (added)
+++ stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/fst.config Wed Oct  9 13:11:40 2013
@@ -0,0 +1,26 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+#Syntax
+#index={indexField};[store={storeField}]
+
+#Names to build FST models for
+index=rdfs:label
+index=geonames:name
+index=geonames:officialName
+
+#Other names 
+#index=geonames:alternateName
+#index=geonames:shortName

Modified: stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/indexing.properties
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/indexing.properties?rev=1530593&r1=1530592&r2=1530593&view=diff
==============================================================================
--- stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/indexing.properties (original)
+++ stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/indexing.properties Wed Oct  9 13:11:40 2013
@@ -107,7 +107,7 @@ fieldConfiguration=mappings.txt
 # A SolrYard is used as destination for indexing
 # To boost some fields (typically labels) one can use the fieldboosts.properties
 # A default field boost configuration is provided.
-indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,boosts:fieldboosts
+indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,boosts:fieldboosts,fstConf:fst.config
 
 
 # ------------