You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@lucene.apache.org by rm...@apache.org on 2010/07/14 14:10:37 UTC
svn commit: r964019 [3/4] - in /lucene/dev/trunk: lucene/contrib/
modules/analysis/
modules/analysis/common/src/java/org/apache/lucene/analysis/ar/
modules/analysis/common/src/java/org/apache/lucene/analysis/bg/
modules/analysis/common/src/java/org/apa...
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/TestFrenchLightStemFilter.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/TestFrenchLightStemFilter.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/TestFrenchLightStemFilter.java (added)
+++ lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/TestFrenchLightStemFilter.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,162 @@
+package org.apache.lucene.analysis.fr;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.IOException;
+import java.io.Reader;
+
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.BaseTokenStreamTestCase;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+import org.apache.lucene.analysis.util.ReusableAnalyzerBase;
+
+import static org.apache.lucene.analysis.util.VocabularyAssert.*;
+
+/**
+ * Simple tests for {@link FrenchLightStemFilter}
+ */
+public class TestFrenchLightStemFilter extends BaseTokenStreamTestCase {
+  private Analyzer analyzer = new ReusableAnalyzerBase() {
+    @Override
+    protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
+      Tokenizer tokenizer = new WhitespaceTokenizer(TEST_VERSION_CURRENT, reader);
+      FrenchLightStemFilter stemmer = new FrenchLightStemFilter(tokenizer);
+      return new TokenStreamComponents(tokenizer, stemmer);
+    }
+  };
+
+  /** Checks single-word stems, using example words from the paper. */
+  public void testExamples() throws IOException {
+    checkOneTerm(analyzer, "chevaux", "cheval");
+    checkOneTerm(analyzer, "cheval", "cheval");
+
+    checkOneTerm(analyzer, "hiboux", "hibou");
+    checkOneTerm(analyzer, "hibou", "hibou");
+
+    checkOneTerm(analyzer, "chantés", "chant");
+    checkOneTerm(analyzer, "chanter", "chant");
+    checkOneTerm(analyzer, "chante", "chant");
+    checkOneTerm(analyzer, "chant", "chant");
+
+    checkOneTerm(analyzer, "baronnes", "baron");
+    checkOneTerm(analyzer, "barons", "baron");
+    checkOneTerm(analyzer, "baron", "baron");
+
+    checkOneTerm(analyzer, "peaux", "peau");
+    checkOneTerm(analyzer, "peau", "peau");
+
+    checkOneTerm(analyzer, "anneaux", "aneau");
+    checkOneTerm(analyzer, "anneau", "aneau");
+
+    checkOneTerm(analyzer, "neveux", "neveu");
+    checkOneTerm(analyzer, "neveu", "neveu");
+
+    checkOneTerm(analyzer, "affreux", "afreu");
+    checkOneTerm(analyzer, "affreuse", "afreu");
+
+    checkOneTerm(analyzer, "investissement", "investi");
+    checkOneTerm(analyzer, "investir", "investi");
+
+    checkOneTerm(analyzer, "assourdissant", "asourdi");
+    checkOneTerm(analyzer, "assourdir", "asourdi");
+
+    checkOneTerm(analyzer, "pratiquement", "pratiqu");
+    checkOneTerm(analyzer, "pratique", "pratiqu");
+
+    checkOneTerm(analyzer, "administrativement", "administratif");
+    checkOneTerm(analyzer, "administratif", "administratif");
+
+    checkOneTerm(analyzer, "justificatrice", "justifi");
+    checkOneTerm(analyzer, "justificateur", "justifi");
+    checkOneTerm(analyzer, "justifier", "justifi");
+
+    checkOneTerm(analyzer, "educatrice", "eduqu");
+    checkOneTerm(analyzer, "eduquer", "eduqu");
+
+    checkOneTerm(analyzer, "communicateur", "comuniqu");
+    checkOneTerm(analyzer, "communiquer", "comuniqu");
+
+    checkOneTerm(analyzer, "accompagnatrice", "acompagn");
+    checkOneTerm(analyzer, "accompagnateur", "acompagn");
+
+    checkOneTerm(analyzer, "administrateur", "administr");
+    checkOneTerm(analyzer, "administrer", "administr");
+
+    checkOneTerm(analyzer, "productrice", "product");
+    checkOneTerm(analyzer, "producteur", "product");
+
+    checkOneTerm(analyzer, "acheteuse", "achet");
+    checkOneTerm(analyzer, "acheteur", "achet");
+
+    checkOneTerm(analyzer, "planteur", "plant");
+    checkOneTerm(analyzer, "plante", "plant");
+
+    checkOneTerm(analyzer, "poreuse", "poreu");
+    checkOneTerm(analyzer, "poreux", "poreu");
+
+    checkOneTerm(analyzer, "plieuse", "plieu");
+
+    checkOneTerm(analyzer, "bijoutière", "bijouti");
+    checkOneTerm(analyzer, "bijoutier", "bijouti");
+
+    checkOneTerm(analyzer, "caissière", "caisi");
+    checkOneTerm(analyzer, "caissier", "caisi");
+
+    checkOneTerm(analyzer, "abrasive", "abrasif");
+    checkOneTerm(analyzer, "abrasif", "abrasif");
+
+    checkOneTerm(analyzer, "folle", "fou");
+    checkOneTerm(analyzer, "fou", "fou");
+
+    checkOneTerm(analyzer, "personnelle", "person");
+    checkOneTerm(analyzer, "personne", "person");
+
+    // Disabled, known algorithm bug: too short length.
+    //checkOneTerm(analyzer, "personnel", "person");
+
+    checkOneTerm(analyzer, "complète", "complet");
+    checkOneTerm(analyzer, "complet", "complet");
+
+    checkOneTerm(analyzer, "aromatique", "aromat");
+
+    checkOneTerm(analyzer, "faiblesse", "faibl");
+    checkOneTerm(analyzer, "faible", "faibl");
+
+    checkOneTerm(analyzer, "patinage", "patin");
+    checkOneTerm(analyzer, "patin", "patin");
+
+    checkOneTerm(analyzer, "sonorisation", "sono");
+
+    checkOneTerm(analyzer, "ritualisation", "rituel");
+    checkOneTerm(analyzer, "rituel", "rituel");
+
+    // Disabled, known algorithm bug: masked by rules above.
+    //checkOneTerm(analyzer, "colonisateur", "colon");
+
+    checkOneTerm(analyzer, "nomination", "nomin");
+
+    checkOneTerm(analyzer, "disposition", "dispos");
+    checkOneTerm(analyzer, "dispose", "dispos");
+  }
+
+  /** Checks the analyzer against the reference impl's vocabulary (frlight.txt in frlighttestdata.zip). */
+  public void testVocabulary() throws IOException {
+    assertVocabulary(analyzer, getDataFile("frlighttestdata.zip"), "frlight.txt");
+  }
+}
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/TestFrenchLightStemFilter.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/TestFrenchMinimalStemFilter.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/TestFrenchMinimalStemFilter.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/TestFrenchMinimalStemFilter.java (added)
+++ lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/TestFrenchMinimalStemFilter.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,62 @@
+package org.apache.lucene.analysis.fr;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.IOException;
+import java.io.Reader;
+
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.BaseTokenStreamTestCase;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+import org.apache.lucene.analysis.util.ReusableAnalyzerBase;
+
+import static org.apache.lucene.analysis.util.VocabularyAssert.*;
+
+/**
+ * Simple tests for {@link FrenchMinimalStemFilter}
+ */
+public class TestFrenchMinimalStemFilter extends BaseTokenStreamTestCase {
+  private Analyzer analyzer = new ReusableAnalyzerBase() {
+    @Override
+    protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
+      Tokenizer tokenizer = new WhitespaceTokenizer(TEST_VERSION_CURRENT, reader);
+      FrenchMinimalStemFilter stemmer = new FrenchMinimalStemFilter(tokenizer);
+      return new TokenStreamComponents(tokenizer, stemmer);
+    }
+  };
+
+  /** Checks single-word stems, using example words from the paper. */
+  public void testExamples() throws IOException {
+    checkOneTerm(analyzer, "chevaux", "cheval");
+    checkOneTerm(analyzer, "hiboux", "hibou");
+
+    checkOneTerm(analyzer, "chantés", "chant");
+    checkOneTerm(analyzer, "chanter", "chant");
+    checkOneTerm(analyzer, "chante", "chant");
+
+    checkOneTerm(analyzer, "baronnes", "baron");
+    checkOneTerm(analyzer, "barons", "baron");
+    checkOneTerm(analyzer, "baron", "baron");
+  }
+
+  /** Checks the analyzer against the reference impl's vocabulary (frminimal.txt in frminimaltestdata.zip). */
+  public void testVocabulary() throws IOException {
+    assertVocabulary(analyzer, getDataFile("frminimaltestdata.zip"), "frminimal.txt");
+  }
+}
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/TestFrenchMinimalStemFilter.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/frlighttestdata.zip
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/frlighttestdata.zip?rev=964019&view=auto
==============================================================================
Binary file - no diff available.
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/frlighttestdata.zip
------------------------------------------------------------------------------
svn:mime-type = application/octet-stream
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/frminimaltestdata.zip
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/frminimaltestdata.zip?rev=964019&view=auto
==============================================================================
Binary file - no diff available.
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/fr/frminimaltestdata.zip
------------------------------------------------------------------------------
svn:mime-type = application/octet-stream
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/hu/TestHungarianLightStemFilter.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/hu/TestHungarianLightStemFilter.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/hu/TestHungarianLightStemFilter.java (added)
+++ lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/hu/TestHungarianLightStemFilter.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,48 @@
+package org.apache.lucene.analysis.hu;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.IOException;
+import java.io.Reader;
+
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.BaseTokenStreamTestCase;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+import org.apache.lucene.analysis.util.ReusableAnalyzerBase;
+
+import static org.apache.lucene.analysis.util.VocabularyAssert.*;
+
+/**
+ * Simple tests for {@link HungarianLightStemFilter}
+ */
+public class TestHungarianLightStemFilter extends BaseTokenStreamTestCase {
+  private Analyzer analyzer = new ReusableAnalyzerBase() {
+    @Override
+    protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
+      Tokenizer tokenizer = new WhitespaceTokenizer(TEST_VERSION_CURRENT, reader);
+      HungarianLightStemFilter stemmer = new HungarianLightStemFilter(tokenizer);
+      return new TokenStreamComponents(tokenizer, stemmer);
+    }
+  };
+
+  /** Checks the analyzer against the reference impl's vocabulary (hulight.txt in hulighttestdata.zip). */
+  public void testVocabulary() throws IOException {
+    assertVocabulary(analyzer, getDataFile("hulighttestdata.zip"), "hulight.txt");
+  }
+}
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/hu/TestHungarianLightStemFilter.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/hu/hulighttestdata.zip
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/hu/hulighttestdata.zip?rev=964019&view=auto
==============================================================================
Binary file - no diff available.
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/hu/hulighttestdata.zip
------------------------------------------------------------------------------
svn:mime-type = application/octet-stream
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/it/TestItalianLightStemFilter.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/it/TestItalianLightStemFilter.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/it/TestItalianLightStemFilter.java (added)
+++ lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/it/TestItalianLightStemFilter.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,48 @@
+package org.apache.lucene.analysis.it;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.IOException;
+import java.io.Reader;
+
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.BaseTokenStreamTestCase;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+import org.apache.lucene.analysis.util.ReusableAnalyzerBase;
+
+import static org.apache.lucene.analysis.util.VocabularyAssert.*;
+
+/**
+ * Simple tests for {@link ItalianLightStemFilter}
+ */
+public class TestItalianLightStemFilter extends BaseTokenStreamTestCase {
+  private Analyzer analyzer = new ReusableAnalyzerBase() {
+    @Override
+    protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
+      Tokenizer tokenizer = new WhitespaceTokenizer(TEST_VERSION_CURRENT, reader);
+      ItalianLightStemFilter stemmer = new ItalianLightStemFilter(tokenizer);
+      return new TokenStreamComponents(tokenizer, stemmer);
+    }
+  };
+
+  /** Checks the analyzer against the reference impl's vocabulary (itlight.txt in itlighttestdata.zip). */
+  public void testVocabulary() throws IOException {
+    assertVocabulary(analyzer, getDataFile("itlighttestdata.zip"), "itlight.txt");
+  }
+}
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/it/TestItalianLightStemFilter.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/it/itlighttestdata.zip
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/it/itlighttestdata.zip?rev=964019&view=auto
==============================================================================
Binary file - no diff available.
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/it/itlighttestdata.zip
------------------------------------------------------------------------------
svn:mime-type = application/octet-stream
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/TestPortugueseLightStemFilter.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/TestPortugueseLightStemFilter.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/TestPortugueseLightStemFilter.java (added)
+++ lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/TestPortugueseLightStemFilter.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,95 @@
+package org.apache.lucene.analysis.pt;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.IOException;
+import java.io.Reader;
+
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.BaseTokenStreamTestCase;
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.core.LowerCaseFilter;
+import org.apache.lucene.analysis.standard.StandardTokenizer;
+import org.apache.lucene.analysis.util.ReusableAnalyzerBase;
+
+import static org.apache.lucene.analysis.util.VocabularyAssert.*;
+
+/**
+ * Simple tests for {@link PortugueseLightStemFilter}
+ */
+public class TestPortugueseLightStemFilter extends BaseTokenStreamTestCase {
+  private final Analyzer analyzer = new ReusableAnalyzerBase() {
+    @Override
+    protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
+      // Chain under test: StandardTokenizer -> LowerCaseFilter -> PortugueseLightStemFilter.
+      Tokenizer source = new StandardTokenizer(TEST_VERSION_CURRENT, reader);
+      TokenStream result = new LowerCaseFilter(TEST_VERSION_CURRENT, source);
+      return new TokenStreamComponents(source, new PortugueseLightStemFilter(result));
+    }
+  };
+
+  /**
+   * Analyzes the sample sentence from the paper "Assessing the impact of stemming
+   * accuracy on information retrieval" and checks the resulting tokens.
+   */
+  public void testExamples() throws IOException {
+    assertAnalyzesTo(
+        analyzer,
+        "O debate político, pelo menos o que vem a público, parece, de modo nada "
+        + "surpreendente, restrito a temas menores. Mas há, evidentemente, "
+        + "grandes questões em jogo nas eleições que se aproximam.",
+        new String[] {
+          "o", "debat", "politic", "pelo", "meno", "o", "que", "vem", "a",
+          "public", "parec", "de", "modo", "nada", "surpreendent", "restrit",
+          "a", "tema", "menor", "mas", "há", "evident", "grand", "questa",
+          "em", "jogo", "nas", "eleica", "que", "se", "aproximam"
+        });
+  }
+
+  /**
+   * Checks single-word stems, using examples from the C implementation.
+   */
+  public void testMoreExamples() throws IOException {
+    checkOneTerm(analyzer, "doutores", "doutor");
+    checkOneTerm(analyzer, "doutor", "doutor");
+
+    checkOneTerm(analyzer, "homens", "homem");
+    checkOneTerm(analyzer, "homem", "homem");
+
+    checkOneTerm(analyzer, "papéis", "papel");
+    checkOneTerm(analyzer, "papel", "papel");
+
+    checkOneTerm(analyzer, "normais", "normal");
+    checkOneTerm(analyzer, "normal", "normal");
+
+    checkOneTerm(analyzer, "lencóis", "lencol");
+    checkOneTerm(analyzer, "lencol", "lencol");
+
+    checkOneTerm(analyzer, "barris", "barril");
+    checkOneTerm(analyzer, "barril", "barril");
+
+    checkOneTerm(analyzer, "botões", "bota");
+    checkOneTerm(analyzer, "botão", "bota");
+  }
+
+  /** Checks the analyzer against the reference impl's vocabulary (ptlight.txt in ptlighttestdata.zip). */
+  public void testVocabulary() throws IOException {
+    assertVocabulary(analyzer, getDataFile("ptlighttestdata.zip"), "ptlight.txt");
+  }
+}
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/TestPortugueseLightStemFilter.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/TestPortugueseMinimalStemFilter.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/TestPortugueseMinimalStemFilter.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/TestPortugueseMinimalStemFilter.java (added)
+++ lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/TestPortugueseMinimalStemFilter.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,69 @@
+package org.apache.lucene.analysis.pt;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.IOException;
+import java.io.Reader;
+
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.BaseTokenStreamTestCase;
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.core.LowerCaseFilter;
+import org.apache.lucene.analysis.standard.StandardTokenizer;
+import org.apache.lucene.analysis.util.ReusableAnalyzerBase;
+
+import static org.apache.lucene.analysis.util.VocabularyAssert.*;
+
+/**
+ * Simple tests for {@link PortugueseMinimalStemFilter}
+ */
+public class TestPortugueseMinimalStemFilter extends BaseTokenStreamTestCase {
+  private final Analyzer analyzer = new ReusableAnalyzerBase() {
+    @Override
+    protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
+      // Chain under test: StandardTokenizer -> LowerCaseFilter -> PortugueseMinimalStemFilter.
+      Tokenizer source = new StandardTokenizer(TEST_VERSION_CURRENT, reader);
+      TokenStream result = new LowerCaseFilter(TEST_VERSION_CURRENT, source);
+      return new TokenStreamComponents(source, new PortugueseMinimalStemFilter(result));
+    }
+  };
+
+  /**
+   * Analyzes the sample sentence from the paper "Assessing the impact of stemming
+   * accuracy on information retrieval" and checks the resulting tokens.
+   */
+  public void testExamples() throws IOException {
+    assertAnalyzesTo(
+        analyzer,
+        "O debate político, pelo menos o que vem a público, parece, de modo nada "
+        + "surpreendente, restrito a temas menores. Mas há, evidentemente, "
+        + "grandes questões em jogo nas eleições que se aproximam.",
+        new String[] {
+          "o", "debate", "político", "pelo", "menos", "o", "que", "vem", "a",
+          "público", "parece", "de", "modo", "nada", "surpreendente", "restrito",
+          "a", "tema", "menor", "mas", "há", "evidentemente", "grande", "questão",
+          "em", "jogo", "na", "eleição", "que", "se", "aproximam"
+        });
+  }
+
+  /** Checks the analyzer against the reference impl's vocabulary (ptminimal.txt in ptminimaltestdata.zip). */
+  public void testVocabulary() throws IOException {
+    assertVocabulary(analyzer, getDataFile("ptminimaltestdata.zip"), "ptminimal.txt");
+  }
+}
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/TestPortugueseMinimalStemFilter.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/ptlighttestdata.zip
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/ptlighttestdata.zip?rev=964019&view=auto
==============================================================================
Binary file - no diff available.
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/ptlighttestdata.zip
------------------------------------------------------------------------------
svn:mime-type = application/octet-stream
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/ptminimaltestdata.zip
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/ptminimaltestdata.zip?rev=964019&view=auto
==============================================================================
Binary file - no diff available.
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/pt/ptminimaltestdata.zip
------------------------------------------------------------------------------
svn:mime-type = application/octet-stream
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/TestRussianLightStemFilter.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/TestRussianLightStemFilter.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/TestRussianLightStemFilter.java (added)
+++ lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/TestRussianLightStemFilter.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,48 @@
+package org.apache.lucene.analysis.ru;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.IOException;
+import java.io.Reader;
+
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.BaseTokenStreamTestCase;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+import org.apache.lucene.analysis.util.ReusableAnalyzerBase;
+
+import static org.apache.lucene.analysis.util.VocabularyAssert.*;
+
+/**
+ * Simple tests for {@link RussianLightStemFilter}
+ */
+public class TestRussianLightStemFilter extends BaseTokenStreamTestCase {
+  private Analyzer analyzer = new ReusableAnalyzerBase() {
+    @Override
+    protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
+      Tokenizer tokenizer = new WhitespaceTokenizer(TEST_VERSION_CURRENT, reader);
+      RussianLightStemFilter stemmer = new RussianLightStemFilter(tokenizer);
+      return new TokenStreamComponents(tokenizer, stemmer);
+    }
+  };
+
+  /** Checks the analyzer against the reference impl's vocabulary (rulight.txt in rulighttestdata.zip). */
+  public void testVocabulary() throws IOException {
+    assertVocabulary(analyzer, getDataFile("rulighttestdata.zip"), "rulight.txt");
+  }
+}
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/TestRussianLightStemFilter.java
------------------------------------------------------------------------------
svn:eol-style = native
Modified: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/TestRussianStem.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/TestRussianStem.java?rev=964019&r1=964018&r2=964019&view=diff
==============================================================================
--- lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/TestRussianStem.java (original)
+++ lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/TestRussianStem.java Wed Jul 14 12:10:34 2010
@@ -17,71 +17,35 @@ package org.apache.lucene.analysis.ru;
* limitations under the License.
*/
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.core.KeywordTokenizer;
+import org.apache.lucene.analysis.util.ReusableAnalyzerBase;
import org.apache.lucene.util.LuceneTestCase;
-import java.io.BufferedReader;
-import java.io.File;
-import java.io.InputStreamReader;
-import java.io.FileInputStream;
-import java.util.ArrayList;
+import java.io.IOException;
+import java.io.InputStream;
+import java.io.Reader;
+
+import static org.apache.lucene.analysis.util.VocabularyAssert.*;
/**
* @deprecated Remove this test class (and its datafiles!) in Lucene 4.0
*/
@Deprecated
-public class TestRussianStem extends LuceneTestCase
-{
- private ArrayList<String> words = new ArrayList<String>();
- private ArrayList<String> stems = new ArrayList<String>();
-
- public TestRussianStem(String name)
- {
- super(name);
- }
-
- /**
- * @see TestCase#setUp()
- */
- @Override
- protected void setUp() throws Exception {
- super.setUp();
- //System.out.println(new java.util.Date());
- String str;
-
- // open and read words into an array list
- BufferedReader inWords =
- new BufferedReader(
- new InputStreamReader(
- getClass().getResourceAsStream("wordsUTF8.txt"),
- "UTF-8"));
- while ((str = inWords.readLine()) != null)
- {
- words.add(str);
- }
- inWords.close();
-
- // open and read stems into an array list
- BufferedReader inStems =
- new BufferedReader(
- new InputStreamReader(
- getClass().getResourceAsStream("stemsUTF8.txt"),
- "UTF-8"));
- while ((str = inStems.readLine()) != null)
- {
- stems.add(str);
- }
- inStems.close();
- }
-
- public void testStem()
- {
- for (int i = 0; i < words.size(); i++)
- {
- //if ( (i % 100) == 0 ) System.err.println(i);
- String realStem =
- RussianStemmer.stemWord(
- words.get(i));
- assertEquals("unicode", stems.get(i), realStem);
- }
- }
-
+public class TestRussianStem extends LuceneTestCase {
+  /**
+   * Stems every line of wordsUTF8.txt with {@link RussianStemFilter} and
+   * compares it with the line at the same position in stemsUTF8.txt.
+   *
+   * @throws IOException if one of the resource files cannot be read
+   */
+  public void testStem() throws IOException {
+    Analyzer a = new ReusableAnalyzerBase() {
+      @Override
+      protected TokenStreamComponents createComponents(String fieldName,
+          Reader reader) {
+        // KeywordTokenizer: each input line is handed to the stemmer as one token.
+        Tokenizer t = new KeywordTokenizer(reader);
+        return new TokenStreamComponents(t, new RussianStemFilter(t));
+      }
+    };
+    // getResourceAsStream returns null for a missing resource; fail with a
+    // readable message instead of a NullPointerException further down.
+    InputStream voc = getClass().getResourceAsStream("wordsUTF8.txt");
+    assertNotNull("missing test resource: wordsUTF8.txt", voc);
+    try {
+      InputStream out = getClass().getResourceAsStream("stemsUTF8.txt");
+      assertNotNull("missing test resource: stemsUTF8.txt", out);
+      try {
+        assertVocabulary(a, voc, out);
+      } finally {
+        // Close even when a stem mismatch aborts the comparison.
+        out.close();
+      }
+    } finally {
+      voc.close();
+    }
+  }
}
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/rulighttestdata.zip
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/rulighttestdata.zip?rev=964019&view=auto
==============================================================================
Binary file - no diff available.
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/ru/rulighttestdata.zip
------------------------------------------------------------------------------
svn:mime-type = application/octet-stream
Modified: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/snowball/TestSnowballVocab.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/snowball/TestSnowballVocab.java?rev=964019&r1=964018&r2=964019&view=diff
==============================================================================
--- lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/snowball/TestSnowballVocab.java (original)
+++ lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/snowball/TestSnowballVocab.java Wed Jul 14 12:10:34 2010
@@ -17,38 +17,21 @@ package org.apache.lucene.analysis.snowb
* limitations under the License.
*/
-import java.io.BufferedReader;
import java.io.IOException;
-import java.io.InputStream;
-import java.io.InputStreamReader;
-import java.io.StringReader;
-import java.util.zip.ZipFile;
+import java.io.Reader;
-import org.apache.lucene.analysis.BaseTokenStreamTestCase;
-import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.Tokenizer;
import org.apache.lucene.analysis.core.KeywordTokenizer;
+import org.apache.lucene.analysis.util.ReusableAnalyzerBase;
+import org.apache.lucene.util.LuceneTestCase;
+
+import static org.apache.lucene.analysis.util.VocabularyAssert.*;
/**
* Test the snowball filters against the snowball data tests
*/
-public class TestSnowballVocab extends BaseTokenStreamTestCase {
- private Tokenizer tokenizer = new KeywordTokenizer(new StringReader(""));
- ZipFile zipFile = null;
-
- @Override
- protected void setUp() throws Exception {
- super.setUp();
- this.zipFile = new ZipFile(getDataFile("TestSnowballVocabData.zip"));
- }
-
- @Override
- protected void tearDown() throws Exception {
- this.zipFile.close();
- this.zipFile = null;
- super.tearDown();
- }
-
+public class TestSnowballVocab extends LuceneTestCase {
/**
* Run all languages against their snowball vocabulary tests.
*/
@@ -82,25 +65,20 @@ public class TestSnowballVocab extends B
* For the supplied language, run the stemmer against all strings in voc.txt
* The output should be the same as the string in output.txt
*/
- private void assertCorrectOutput(String snowballLanguage, String dataDirectory)
+ private void assertCorrectOutput(final String snowballLanguage, String dataDirectory)
throws IOException {
if (VERBOSE) System.out.println("checking snowball language: " + snowballLanguage);
- TokenStream filter = new SnowballFilter(tokenizer, snowballLanguage);
- InputStream voc = zipFile.getInputStream(zipFile.getEntry(dataDirectory + "/voc.txt"));
- InputStream out = zipFile.getInputStream(zipFile.getEntry(dataDirectory + "/output.txt"));
- BufferedReader vocReader = new BufferedReader(new InputStreamReader(
- voc, "UTF-8"));
- BufferedReader outputReader = new BufferedReader(new InputStreamReader(
- out, "UTF-8"));
- String inputWord = null;
- while ((inputWord = vocReader.readLine()) != null) {
- String expectedWord = outputReader.readLine();
- assertNotNull(expectedWord);
- tokenizer.reset(new StringReader(inputWord));
- filter.reset();
- assertTokenStreamContents(filter, new String[] {expectedWord});
- }
- vocReader.close();
- outputReader.close();
+
+ Analyzer a = new ReusableAnalyzerBase() {
+ @Override
+ protected TokenStreamComponents createComponents(String fieldName,
+ Reader reader) {
+ Tokenizer t = new KeywordTokenizer(reader);
+ return new TokenStreamComponents(t, new SnowballFilter(t, snowballLanguage));
+ }
+ };
+
+ assertVocabulary(a, getDataFile("TestSnowballVocabData.zip"),
+ dataDirectory + "/voc.txt", dataDirectory + "/output.txt");
}
}
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/sv/TestSwedishLightStemFilter.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/sv/TestSwedishLightStemFilter.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/sv/TestSwedishLightStemFilter.java (added)
+++ lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/sv/TestSwedishLightStemFilter.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,48 @@
+package org.apache.lucene.analysis.sv;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.IOException;
+import java.io.Reader;
+
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.BaseTokenStreamTestCase;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+import org.apache.lucene.analysis.util.ReusableAnalyzerBase;
+
+import static org.apache.lucene.analysis.util.VocabularyAssert.*;
+
+/**
+ * Vocabulary-driven tests for {@link SwedishLightStemFilter}.
+ */
+public class TestSwedishLightStemFilter extends BaseTokenStreamTestCase {
+  /** Whitespace-tokenizes the input and runs every token through the Swedish light stemmer. */
+  private Analyzer analyzer = new ReusableAnalyzerBase() {
+    @Override
+    protected TokenStreamComponents createComponents(String fieldName,
+        Reader reader) {
+      final Tokenizer tokenizer = new WhitespaceTokenizer(TEST_VERSION_CURRENT, reader);
+      final SwedishLightStemFilter stemmer = new SwedishLightStemFilter(tokenizer);
+      return new TokenStreamComponents(tokenizer, stemmer);
+    }
+  };
+
+  /**
+   * Runs the analyzer over the vocabulary file svlight.txt, stored inside
+   * svlighttestdata.zip, which comes from the reference implementation.
+   */
+  public void testVocabulary() throws IOException {
+    assertVocabulary(
+        analyzer,
+        getDataFile("svlighttestdata.zip"),
+        "svlight.txt");
+  }
+}
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/sv/TestSwedishLightStemFilter.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/sv/svlighttestdata.zip
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/sv/svlighttestdata.zip?rev=964019&view=auto
==============================================================================
Binary file - no diff available.
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/sv/svlighttestdata.zip
------------------------------------------------------------------------------
svn:mime-type = application/octet-stream
Added: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/util/VocabularyAssert.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/util/VocabularyAssert.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/util/VocabularyAssert.java (added)
+++ lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/util/VocabularyAssert.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,83 @@
+package org.apache.lucene.analysis.util;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.BufferedReader;
+import java.io.File;
+import java.io.IOException;
+import java.io.InputStream;
+import java.io.InputStreamReader;
+import java.util.zip.ZipFile;
+
+import org.apache.lucene.analysis.Analyzer;
+import org.apache.lucene.analysis.BaseTokenStreamTestCase;
+import org.junit.Assert;
+
+/**
+ * Utility class for doing vocabulary-based stemming tests.
+ * <p>
+ * Every overload feeds input words through the supplied {@link Analyzer} and
+ * checks each one against its expected output with
+ * {@link BaseTokenStreamTestCase#checkOneTermReuse}. All data is read as UTF-8.
+ */
+public class VocabularyAssert {
+  /**
+   * Run a vocabulary test against two data files.
+   * <p>
+   * Line <i>n</i> of <code>voc</code> is the input word and line <i>n</i> of
+   * <code>out</code> is its expected output. Neither stream is closed here;
+   * that remains the caller's responsibility.
+   *
+   * @param a analyzer under test
+   * @param voc stream of input words, one per line
+   * @param out stream of expected outputs, one per line
+   * @throws IOException if either stream cannot be read
+   */
+  public static void assertVocabulary(Analyzer a, InputStream voc, InputStream out)
+      throws IOException {
+    BufferedReader vocReader = new BufferedReader(
+        new InputStreamReader(voc, "UTF-8"));
+    BufferedReader outputReader = new BufferedReader(
+        new InputStreamReader(out, "UTF-8"));
+    String inputWord = null;
+    while ((inputWord = vocReader.readLine()) != null) {
+      String expectedWord = outputReader.readLine();
+      // The output file ran out before the vocabulary did.
+      Assert.assertNotNull("no expected output for input word: " + inputWord,
+          expectedWord);
+      BaseTokenStreamTestCase.checkOneTermReuse(a, inputWord, expectedWord);
+    }
+  }
+
+  /**
+   * Run a vocabulary test against one file: tab separated.
+   * <p>
+   * Each data line holds the input word, a tab, and the expected output.
+   * Lines starting with <code>#</code> and blank lines are skipped. The
+   * stream is not closed here; that remains the caller's responsibility.
+   *
+   * @param a analyzer under test
+   * @param vocOut stream of tab-separated word/output pairs
+   * @throws IOException if the stream cannot be read
+   */
+  public static void assertVocabulary(Analyzer a, InputStream vocOut)
+      throws IOException {
+    BufferedReader vocReader = new BufferedReader(
+        new InputStreamReader(vocOut, "UTF-8"));
+    String inputLine = null;
+    while ((inputLine = vocReader.readLine()) != null) {
+      if (inputLine.startsWith("#") || inputLine.trim().length() == 0)
+        continue; /* comment */
+      String words[] = inputLine.split("\t");
+      // Report a malformed line as a test failure that names the line,
+      // rather than as an ArrayIndexOutOfBoundsException on words[1].
+      Assert.assertTrue("malformed vocabulary line (expected word<TAB>output): "
+          + inputLine, words.length >= 2);
+      BaseTokenStreamTestCase.checkOneTermReuse(a, words[0], words[1]);
+    }
+  }
+
+  /**
+   * Run a vocabulary test against two data files inside a zip file.
+   *
+   * @param a analyzer under test
+   * @param zipFile zip archive containing both entries
+   * @param voc name of the entry holding the input words
+   * @param out name of the entry holding the expected outputs
+   * @throws IOException if the archive or one of its entries cannot be read
+   */
+  public static void assertVocabulary(Analyzer a, File zipFile, String voc, String out)
+      throws IOException {
+    ZipFile zip = new ZipFile(zipFile);
+    try {
+      InputStream v = openEntry(zip, voc);
+      InputStream o = openEntry(zip, out);
+      assertVocabulary(a, v, o);
+    } finally {
+      // Runs even when an assertion fails; closing the ZipFile also closes
+      // every stream obtained from getInputStream.
+      zip.close();
+    }
+  }
+
+  /**
+   * Run a vocabulary test against a tab-separated data file inside a zip file.
+   *
+   * @param a analyzer under test
+   * @param zipFile zip archive containing the entry
+   * @param vocOut name of the entry holding tab-separated word/output pairs
+   * @throws IOException if the archive or the entry cannot be read
+   */
+  public static void assertVocabulary(Analyzer a, File zipFile, String vocOut)
+      throws IOException {
+    ZipFile zip = new ZipFile(zipFile);
+    try {
+      InputStream vo = openEntry(zip, vocOut);
+      assertVocabulary(a, vo);
+    } finally {
+      // Runs even when an assertion fails; closing the ZipFile also closes
+      // every stream obtained from getInputStream.
+      zip.close();
+    }
+  }
+
+  /** Opens the named zip entry, failing the test with a clear message if it is absent. */
+  private static InputStream openEntry(ZipFile zip, String name) throws IOException {
+    // getEntry returns null for an unknown name; passing that null on to
+    // getInputStream would only produce a NullPointerException with no message.
+    java.util.zip.ZipEntry entry = zip.getEntry(name);
+    Assert.assertNotNull("missing entry '" + name + "' in " + zip.getName(), entry);
+    return zip.getInputStream(entry);
+  }
+}
Propchange: lucene/dev/trunk/modules/analysis/common/src/test/org/apache/lucene/analysis/util/VocabularyAssert.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/EnglishMinimalStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/EnglishMinimalStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/EnglishMinimalStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/EnglishMinimalStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.en.EnglishMinimalStemFilter;
+
+/**
+ * Factory for {@link EnglishMinimalStemFilter}.
+ */
+public class EnglishMinimalStemFilterFactory extends BaseTokenFilterFactory {
+  /** Wraps <code>input</code> in a new {@link EnglishMinimalStemFilter}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new EnglishMinimalStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/EnglishMinimalStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FinnishLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FinnishLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FinnishLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FinnishLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.fi.FinnishLightStemFilter;
+
+/**
+ * Factory for {@link FinnishLightStemFilter}.
+ */
+public class FinnishLightStemFilterFactory extends BaseTokenFilterFactory {
+  /** Wraps <code>input</code> in a new {@link FinnishLightStemFilter}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new FinnishLightStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FinnishLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FrenchLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FrenchLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FrenchLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FrenchLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.fr.FrenchLightStemFilter;
+
+/**
+ * Factory for {@link FrenchLightStemFilter}.
+ */
+public class FrenchLightStemFilterFactory extends BaseTokenFilterFactory {
+  /** Wraps <code>input</code> in a new {@link FrenchLightStemFilter}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new FrenchLightStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FrenchLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FrenchMinimalStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FrenchMinimalStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FrenchMinimalStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FrenchMinimalStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.fr.FrenchMinimalStemFilter;
+
+/**
+ * Factory for {@link FrenchMinimalStemFilter}.
+ */
+public class FrenchMinimalStemFilterFactory extends BaseTokenFilterFactory {
+  /** Wraps <code>input</code> in a new {@link FrenchMinimalStemFilter}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new FrenchMinimalStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/FrenchMinimalStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/GermanLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/GermanLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/GermanLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/GermanLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.de.GermanLightStemFilter;
+
+/**
+ * Factory for {@link GermanLightStemFilter}.
+ */
+public class GermanLightStemFilterFactory extends BaseTokenFilterFactory {
+  /** Wraps <code>input</code> in a new {@link GermanLightStemFilter}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new GermanLightStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/GermanLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/GermanMinimalStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/GermanMinimalStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/GermanMinimalStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/GermanMinimalStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.de.GermanMinimalStemFilter;
+
+/**
+ * Factory for {@link GermanMinimalStemFilter}.
+ */
+public class GermanMinimalStemFilterFactory extends BaseTokenFilterFactory {
+  /** Wraps <code>input</code> in a new {@link GermanMinimalStemFilter}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new GermanMinimalStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/GermanMinimalStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/HungarianLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/HungarianLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/HungarianLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/HungarianLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.hu.HungarianLightStemFilter;
+
+/**
+ * Factory for {@link HungarianLightStemFilter}.
+ */
+public class HungarianLightStemFilterFactory extends BaseTokenFilterFactory {
+  /** Wraps <code>input</code> in a new {@link HungarianLightStemFilter}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new HungarianLightStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/HungarianLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/ItalianLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/ItalianLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/ItalianLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/ItalianLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.it.ItalianLightStemFilter;
+
+/**
+ * Factory for {@link ItalianLightStemFilter}.
+ */
+public class ItalianLightStemFilterFactory extends BaseTokenFilterFactory {
+  /** Wraps <code>input</code> in a new {@link ItalianLightStemFilter}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new ItalianLightStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/ItalianLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/PortugueseLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/PortugueseLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/PortugueseLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/PortugueseLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.pt.PortugueseLightStemFilter;
+
+/**
+ * Factory for {@link PortugueseLightStemFilter}.
+ */
+public class PortugueseLightStemFilterFactory extends BaseTokenFilterFactory {
+  /** Wraps <code>input</code> in a new {@link PortugueseLightStemFilter}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new PortugueseLightStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/PortugueseLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/PortugueseMinimalStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/PortugueseMinimalStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/PortugueseMinimalStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/PortugueseMinimalStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.pt.PortugueseMinimalStemFilter;
+
+/**
+ * Token filter factory that wraps an incoming stream in a
+ * {@link PortugueseMinimalStemFilter}.
+ */
+public class PortugueseMinimalStemFilterFactory extends BaseTokenFilterFactory {
+  /** Returns a new {@link PortugueseMinimalStemFilter} reading from {@code input}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new PortugueseMinimalStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/PortugueseMinimalStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/RussianLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/RussianLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/RussianLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/RussianLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.ru.RussianLightStemFilter;
+
+/**
+ * Token filter factory that wraps an incoming stream in a
+ * {@link RussianLightStemFilter}.
+ */
+public class RussianLightStemFilterFactory extends BaseTokenFilterFactory {
+  /** Returns a new {@link RussianLightStemFilter} reading from {@code input}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new RussianLightStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/RussianLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/SpanishLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/SpanishLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/SpanishLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/SpanishLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.es.SpanishLightStemFilter;
+
+/**
+ * Token filter factory that wraps an incoming stream in a
+ * {@link SpanishLightStemFilter}.
+ */
+public class SpanishLightStemFilterFactory extends BaseTokenFilterFactory {
+  /** Returns a new {@link SpanishLightStemFilter} reading from {@code input}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new SpanishLightStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/SpanishLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/SwedishLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/SwedishLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/SwedishLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/SwedishLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.sv.SwedishLightStemFilter;
+
+/**
+ * Token filter factory that wraps an incoming stream in a
+ * {@link SwedishLightStemFilter}.
+ */
+public class SwedishLightStemFilterFactory extends BaseTokenFilterFactory {
+  /** Returns a new {@link SwedishLightStemFilter} reading from {@code input}. */
+  public TokenStream create(TokenStream input) {
+    final TokenStream stemmed = new SwedishLightStemFilter(input);
+    return stemmed;
+  }
+}
Propchange: lucene/dev/trunk/solr/src/java/org/apache/solr/analysis/SwedishLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestEnglishMinimalStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestEnglishMinimalStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestEnglishMinimalStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestEnglishMinimalStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,36 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+
+/**
+ * Checks that the filter built by {@link EnglishMinimalStemFilterFactory}
+ * produces the expected token for a whitespace-tokenized input.
+ */
+public class TestEnglishMinimalStemFilterFactory extends BaseTokenTestCase {
+  /** Runs "bricks" through the factory's filter and expects the single token "brick". */
+  public void testStemming() throws Exception {
+    final String[] expected = { "brick" };
+    Reader input = new StringReader("bricks");
+    WhitespaceTokenizer tokenizer = new WhitespaceTokenizer(DEFAULT_VERSION, input);
+    TokenStream stemmed = new EnglishMinimalStemFilterFactory().create(tokenizer);
+    assertTokenStreamContents(stemmed, expected);
+  }
+}
Propchange: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestEnglishMinimalStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFinnishLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFinnishLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFinnishLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFinnishLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,36 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+
+/**
+ * Checks that the filter built by {@link FinnishLightStemFilterFactory}
+ * produces the expected token for a whitespace-tokenized input.
+ */
+public class TestFinnishLightStemFilterFactory extends BaseTokenTestCase {
+  /** Runs "aseistettujen" through the factory's filter and expects the single token "aseistet". */
+  public void testStemming() throws Exception {
+    final String[] expected = { "aseistet" };
+    Reader input = new StringReader("aseistettujen");
+    WhitespaceTokenizer tokenizer = new WhitespaceTokenizer(DEFAULT_VERSION, input);
+    TokenStream stemmed = new FinnishLightStemFilterFactory().create(tokenizer);
+    assertTokenStreamContents(stemmed, expected);
+  }
+}
Propchange: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFinnishLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFrenchLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFrenchLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFrenchLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFrenchLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,36 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+
+/**
+ * Checks that the filter built by {@link FrenchLightStemFilterFactory}
+ * produces the expected token for a whitespace-tokenized input.
+ */
+public class TestFrenchLightStemFilterFactory extends BaseTokenTestCase {
+  /** Runs "administrativement" through the factory's filter and expects "administratif". */
+  public void testStemming() throws Exception {
+    final String[] expected = { "administratif" };
+    Reader input = new StringReader("administrativement");
+    WhitespaceTokenizer tokenizer = new WhitespaceTokenizer(DEFAULT_VERSION, input);
+    TokenStream stemmed = new FrenchLightStemFilterFactory().create(tokenizer);
+    assertTokenStreamContents(stemmed, expected);
+  }
+}
Propchange: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFrenchLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFrenchMinimalStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFrenchMinimalStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFrenchMinimalStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFrenchMinimalStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,36 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+
+/**
+ * Checks that the filter built by {@link FrenchMinimalStemFilterFactory}
+ * produces the expected token for a whitespace-tokenized input.
+ */
+public class TestFrenchMinimalStemFilterFactory extends BaseTokenTestCase {
+  /** Runs "chevaux" through the factory's filter and expects the single token "cheval". */
+  public void testStemming() throws Exception {
+    final String[] expected = { "cheval" };
+    Reader input = new StringReader("chevaux");
+    WhitespaceTokenizer tokenizer = new WhitespaceTokenizer(DEFAULT_VERSION, input);
+    TokenStream stemmed = new FrenchMinimalStemFilterFactory().create(tokenizer);
+    assertTokenStreamContents(stemmed, expected);
+  }
+}
Propchange: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestFrenchMinimalStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestGermanLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestGermanLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestGermanLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestGermanLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,36 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+
+/**
+ * Checks that the filter built by {@link GermanLightStemFilterFactory}
+ * produces the expected token for a whitespace-tokenized input.
+ */
+public class TestGermanLightStemFilterFactory extends BaseTokenTestCase {
+  /** Runs "häuser" through the factory's filter and expects the single token "haus". */
+  public void testStemming() throws Exception {
+    final String[] expected = { "haus" };
+    Reader input = new StringReader("häuser");
+    WhitespaceTokenizer tokenizer = new WhitespaceTokenizer(DEFAULT_VERSION, input);
+    TokenStream stemmed = new GermanLightStemFilterFactory().create(tokenizer);
+    assertTokenStreamContents(stemmed, expected);
+  }
+}
Propchange: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestGermanLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestGermanMinimalStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestGermanMinimalStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestGermanMinimalStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestGermanMinimalStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,36 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+
+/**
+ * Checks that the filter built by {@link GermanMinimalStemFilterFactory}
+ * produces the expected token for a whitespace-tokenized input.
+ */
+public class TestGermanMinimalStemFilterFactory extends BaseTokenTestCase {
+  /** Runs "bilder" through the factory's filter and expects the single token "bild". */
+  public void testStemming() throws Exception {
+    final String[] expected = { "bild" };
+    Reader input = new StringReader("bilder");
+    WhitespaceTokenizer tokenizer = new WhitespaceTokenizer(DEFAULT_VERSION, input);
+    TokenStream stemmed = new GermanMinimalStemFilterFactory().create(tokenizer);
+    assertTokenStreamContents(stemmed, expected);
+  }
+}
Propchange: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestGermanMinimalStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestHungarianLightStemFilterFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestHungarianLightStemFilterFactory.java?rev=964019&view=auto
==============================================================================
--- lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestHungarianLightStemFilterFactory.java (added)
+++ lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestHungarianLightStemFilterFactory.java Wed Jul 14 12:10:34 2010
@@ -0,0 +1,36 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.core.WhitespaceTokenizer;
+
+/**
+ * Checks that the filter built by {@link HungarianLightStemFilterFactory}
+ * produces the expected token for a whitespace-tokenized input.
+ */
+public class TestHungarianLightStemFilterFactory extends BaseTokenTestCase {
+  /** Runs "házakat" through the factory's filter and expects the single token "haz". */
+  public void testStemming() throws Exception {
+    final String[] expected = { "haz" };
+    Reader input = new StringReader("házakat");
+    WhitespaceTokenizer tokenizer = new WhitespaceTokenizer(DEFAULT_VERSION, input);
+    TokenStream stemmed = new HungarianLightStemFilterFactory().create(tokenizer);
+    assertTokenStreamContents(stemmed, expected);
+  }
+}
Propchange: lucene/dev/trunk/solr/src/test/org/apache/solr/analysis/TestHungarianLightStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native