You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@stanbol.apache.org by rw...@apache.org on 2013/10/09 15:11:40 UTC
svn commit: r1530593 - in /stanbol/trunk/entityhub/indexing:
dbpedia/src/main/resources/indexing/config/ freebase/src/main/resources/
freebase/src/main/resources/indexing/config/
genericrdf/src/main/resources/indexing/config/ geonames/src/main/resource...
Author: rwesten
Date: Wed Oct 9 13:11:40 2013
New Revision: 1530593
URL: http://svn.apache.org/r1530593
Log:
STANBOL-1167: added FST model builder to default configs
Added:
stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/fst.config
stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/fst.config
stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/fst.config
stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/fst.config
Modified:
stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/indexing.properties
stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/indexing.properties
stanbol/trunk/entityhub/indexing/freebase/src/main/resources/log4j.properties
stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/indexing.properties
stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/indexing.properties
Added: stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/fst.config
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/fst.config?rev=1530593&view=auto
==============================================================================
--- stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/fst.config (added)
+++ stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/fst.config Wed Oct 9 13:11:40 2013
@@ -0,0 +1,18 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+#Syntax
+#index={indexField};[store={storeField}]
+index=rdfs:label
\ No newline at end of file
Modified: stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/indexing.properties
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/indexing.properties?rev=1530593&r1=1530592&r2=1530593&view=diff
==============================================================================
--- stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/indexing.properties (original)
+++ stanbol/trunk/entityhub/indexing/dbpedia/src/main/resources/indexing/config/indexing.properties Wed Oct 9 13:11:40 2013
@@ -47,8 +47,10 @@ entityProcessor=org.apache.stanbol.entit
fieldConfiguration=mappings.txt
# Finally we need a destination to store the data
-# Note also the configured fieldboosts.properties
-indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,solrConf,boosts:fieldboosts
+# Note also
+# * the configured fieldboosts.properties
+# * the configured fst.config
+indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,solrConf,boosts:fieldboosts,fstConf:fst.config
# Additional Properties directly added to the configuration of the
Added: stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/fst.config
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/fst.config?rev=1530593&view=auto
==============================================================================
--- stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/fst.config (added)
+++ stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/fst.config Wed Oct 9 13:11:40 2013
@@ -0,0 +1,18 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+#Syntax
+#index={indexField};[store={storeField}]
+index=rdfs:label
\ No newline at end of file
Modified: stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/indexing.properties
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/indexing.properties?rev=1530593&r1=1530592&r2=1530593&view=diff
==============================================================================
--- stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/indexing.properties (original)
+++ stanbol/trunk/entityhub/indexing/freebase/src/main/resources/indexing/config/indexing.properties Wed Oct 9 13:11:40 2013
@@ -52,7 +52,7 @@ fieldConfiguration=mappings.txt
# Finally we need a destination to store the data
# Note also the configured fieldboosts.properties
-indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,solrConf,boosts:fieldboosts
+indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,solrConf,boosts:fieldboosts,fstConf:fst.config
# Additional Properties directly added to the configuration of the
Modified: stanbol/trunk/entityhub/indexing/freebase/src/main/resources/log4j.properties
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/freebase/src/main/resources/log4j.properties?rev=1530593&r1=1530592&r2=1530593&view=diff
==============================================================================
--- stanbol/trunk/entityhub/indexing/freebase/src/main/resources/log4j.properties (original)
+++ stanbol/trunk/entityhub/indexing/freebase/src/main/resources/log4j.properties Wed Oct 9 13:11:40 2013
@@ -24,4 +24,6 @@ log4j.appender.A1.layout.ConversionPatte
# however log also INFO messages of the indexing components
log4j.logger.org.apache.stanbol.entityhub.indexing=INFO
# for loggings during importing RDF data
-log4j.logger.com.hp.hpl.jena=INFO
\ No newline at end of file
+log4j.logger.com.hp.hpl.jena=INFO
+# do not show warnings for building FST models
+log4j.logger.org.opensextant.solrtexttagger=ERROR
\ No newline at end of file
Added: stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/fst.config
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/fst.config?rev=1530593&view=auto
==============================================================================
--- stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/fst.config (added)
+++ stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/fst.config Wed Oct 9 13:11:40 2013
@@ -0,0 +1,18 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+#Syntax
+#index={indexField};[store={storeField}]
+index=rdfs:label
\ No newline at end of file
Modified: stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/indexing.properties
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/indexing.properties?rev=1530593&r1=1530592&r2=1530593&view=diff
==============================================================================
--- stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/indexing.properties (original)
+++ stanbol/trunk/entityhub/indexing/genericrdf/src/main/resources/indexing/config/indexing.properties Wed Oct 9 13:11:40 2013
@@ -233,7 +233,8 @@ fieldConfiguration=mappings.txt
# A SolrYard is used as destination for indexing
# To boost some fields (typically labels) one can use the fieldboosts.properties
# A default field boost configuration is provided.
-indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,boosts:fieldboosts
+# A default fst.config is also provided (see STANBOL-1167)
+indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,boosts:fieldboosts,fstConf:fst.config
# ------------
Added: stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/fst.config
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/fst.config?rev=1530593&view=auto
==============================================================================
--- stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/fst.config (added)
+++ stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/fst.config Wed Oct 9 13:11:40 2013
@@ -0,0 +1,26 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+#Syntax
+#index={indexField};[store={storeField}]
+
+#Names to build FST models for
+index=rdfs:label
+index=geonames:name
+index=geonames:officialName
+
+#Other names
+#index=geonames:alternateName
+#index=geonames:shortName
Modified: stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/indexing.properties
URL: http://svn.apache.org/viewvc/stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/indexing.properties?rev=1530593&r1=1530592&r2=1530593&view=diff
==============================================================================
--- stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/indexing.properties (original)
+++ stanbol/trunk/entityhub/indexing/geonames/src/main/resources/indexing/config/indexing.properties Wed Oct 9 13:11:40 2013
@@ -107,7 +107,7 @@ fieldConfiguration=mappings.txt
# A SolrYard is used as destination for indexing
# To boost some fields (typically labels) one can use the fieldboosts.properties
# A default field boost configuration is provided.
-indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,boosts:fieldboosts
+indexingDestination=org.apache.stanbol.entityhub.indexing.destination.solryard.SolrYardIndexingDestination,boosts:fieldboosts,fstConf:fst.config
# ------------