You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@lucene.apache.org by rm...@apache.org on 2012/02/08 17:31:06 UTC
svn commit: r1241962 - in /lucene/dev/branches/branch_3x: ./
lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/ar/
lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/el/
lucene/contrib/analyzers/common/src/r...
Author: rmuir
Date: Wed Feb 8 16:31:06 2012
New Revision: 1241962
URL: http://svn.apache.org/viewvc?rev=1241962&view=rev
Log:
SOLR-3056: document expectations in these files
Modified:
lucene/dev/branches/branch_3x/ (props changed)
lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/ar/stopwords.txt
lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/el/stopwords.txt
lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/fa/stopwords.txt
lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/hi/stopwords.txt
lucene/dev/branches/branch_3x/solr/ (props changed)
lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_ar.txt
lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_el.txt
lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_fa.txt
lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_hi.txt
Modified: lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/ar/stopwords.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/ar/stopwords.txt?rev=1241962&r1=1241961&r2=1241962&view=diff
==============================================================================
--- lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/ar/stopwords.txt (original)
+++ lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/ar/stopwords.txt Wed Feb 8 16:31:06 2012
@@ -2,6 +2,8 @@
# See http://members.unine.ch/jacques.savoy/clef/index.html.
# Also see http://www.opensource.org/licenses/bsd-license.html
# Cleaned on October 11, 2009 (not normalized, so use before normalization)
+# This means that when modifying this list, you might need to add some
+# redundant entries, for example containing forms with both أ and ا
من
ومن
منها
Modified: lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/el/stopwords.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/el/stopwords.txt?rev=1241962&r1=1241961&r2=1241962&view=diff
==============================================================================
--- lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/el/stopwords.txt (original)
+++ lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/el/stopwords.txt Wed Feb 8 16:31:06 2012
@@ -1,4 +1,6 @@
# Lucene Greek Stopwords list
+# Note: by default this file is used after GreekLowerCaseFilter,
+# so when modifying this file use 'σ' instead of 'ς'
ο
η
το
Modified: lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/fa/stopwords.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/fa/stopwords.txt?rev=1241962&r1=1241961&r2=1241962&view=diff
==============================================================================
--- lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/fa/stopwords.txt (original)
+++ lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/fa/stopwords.txt Wed Feb 8 16:31:06 2012
@@ -1,6 +1,8 @@
# This file was created by Jacques Savoy and is distributed under the BSD license.
# See http://members.unine.ch/jacques.savoy/clef/index.html.
# Also see http://www.opensource.org/licenses/bsd-license.html
+# Note: by default this file is used after normalization, so when adding entries
+# to this file, use the arabic 'ي' instead of 'ی'
انان
نداشته
سراسر
Modified: lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/hi/stopwords.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/hi/stopwords.txt?rev=1241962&r1=1241961&r2=1241962&view=diff
==============================================================================
--- lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/hi/stopwords.txt (original)
+++ lucene/dev/branches/branch_3x/lucene/contrib/analyzers/common/src/resources/org/apache/lucene/analysis/hi/stopwords.txt Wed Feb 8 16:31:06 2012
@@ -1,6 +1,10 @@
# Also see http://www.opensource.org/licenses/bsd-license.html
# See http://members.unine.ch/jacques.savoy/clef/index.html.
# This file was created by Jacques Savoy and is distributed under the BSD license.
+# Note: by default this file also contains forms normalized by HindiNormalizer
+# for spelling variation (see section below), such that it can be used whether or
+# not you enable that feature. When adding additional entries to this list,
+# please add the normalized form as well.
अंदर
अत
अपना
Modified: lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_ar.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_ar.txt?rev=1241962&r1=1241961&r2=1241962&view=diff
==============================================================================
--- lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_ar.txt (original)
+++ lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_ar.txt Wed Feb 8 16:31:06 2012
@@ -2,6 +2,8 @@
# See http://members.unine.ch/jacques.savoy/clef/index.html.
# Also see http://www.opensource.org/licenses/bsd-license.html
# Cleaned on October 11, 2009 (not normalized, so use before normalization)
+# This means that when modifying this list, you might need to add some
+# redundant entries, for example containing forms with both أ and ا
من
ومن
منها
Modified: lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_el.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_el.txt?rev=1241962&r1=1241961&r2=1241962&view=diff
==============================================================================
--- lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_el.txt (original)
+++ lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_el.txt Wed Feb 8 16:31:06 2012
@@ -1,4 +1,6 @@
# Lucene Greek Stopwords list
+# Note: by default this file is used after GreekLowerCaseFilter,
+# so when modifying this file use 'σ' instead of 'ς'
ο
η
το
Modified: lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_fa.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_fa.txt?rev=1241962&r1=1241961&r2=1241962&view=diff
==============================================================================
--- lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_fa.txt (original)
+++ lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_fa.txt Wed Feb 8 16:31:06 2012
@@ -1,6 +1,8 @@
# This file was created by Jacques Savoy and is distributed under the BSD license.
# See http://members.unine.ch/jacques.savoy/clef/index.html.
# Also see http://www.opensource.org/licenses/bsd-license.html
+# Note: by default this file is used after normalization, so when adding entries
+# to this file, use the arabic 'ي' instead of 'ی'
انان
نداشته
سراسر
Modified: lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_hi.txt
URL: http://svn.apache.org/viewvc/lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_hi.txt?rev=1241962&r1=1241961&r2=1241962&view=diff
==============================================================================
--- lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_hi.txt (original)
+++ lucene/dev/branches/branch_3x/solr/example/solr/conf/lang/stopwords_hi.txt Wed Feb 8 16:31:06 2012
@@ -1,6 +1,10 @@
# Also see http://www.opensource.org/licenses/bsd-license.html
# See http://members.unine.ch/jacques.savoy/clef/index.html.
# This file was created by Jacques Savoy and is distributed under the BSD license.
+# Note: by default this file also contains forms normalized by HindiNormalizer
+# for spelling variation (see section below), such that it can be used whether or
+# not you enable that feature. When adding additional entries to this list,
+# please add the normalized form as well.
अंदर
अत
अपना