You are viewing a plain text version of this content. The canonical link for it is here.
Posted to dev@lucene.apache.org by go...@apache.org on 2003/10/25 13:23:49 UTC
cvs commit: jakarta-lucene/src/test/org/apache/lucene/analysis/ru TestRussianStem.java
goller 2003/10/25 04:23:49
Modified: src/test/org/apache/lucene/analysis/ru TestRussianStem.java
Log:
modify to use VM property for base data directory, so IDEs can run tests without Ant,
simply copied Eriks modification from TestRussianAnalyzer
Revision Changes Path
1.4 +141 -138 jakarta-lucene/src/test/org/apache/lucene/analysis/ru/TestRussianStem.java
Index: TestRussianStem.java
===================================================================
RCS file: /home/cvs/jakarta-lucene/src/test/org/apache/lucene/analysis/ru/TestRussianStem.java,v
retrieving revision 1.3
retrieving revision 1.4
diff -u -r1.3 -r1.4
--- TestRussianStem.java 29 Jan 2003 17:43:13 -0000 1.3
+++ TestRussianStem.java 25 Oct 2003 11:23:49 -0000 1.4
@@ -1,138 +1,141 @@
-package org.apache.lucene.analysis.ru;
-
-/* ====================================================================
- * The Apache Software License, Version 1.1
- *
- * Copyright (c) 2001 The Apache Software Foundation. All rights
- * reserved.
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions and the following disclaimer in
- * the documentation and/or other materials provided with the
- * distribution.
- *
- * 3. The end-user documentation included with the redistribution,
- * if any, must include the following acknowledgment:
- * "This product includes software developed by the
- * Apache Software Foundation (http://www.apache.org/)."
- * Alternately, this acknowledgment may appear in the software itself,
- * if and wherever such third-party acknowledgments normally appear.
- *
- * 4. The names "Apache" and "Apache Software Foundation" and
- * "Apache Lucene" must not be used to endorse or promote products
- * derived from this software without prior written permission. For
- * written permission, please contact apache@apache.org.
- *
- * 5. Products derived from this software may not be called "Apache",
- * "Apache Lucene", nor may "Apache" appear in their name, without
- * prior written permission of the Apache Software Foundation.
- *
- * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
- * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
- * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
- * DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
- * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
- * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
- * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
- * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
- * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
- * SUCH DAMAGE.
- * ====================================================================
- *
- * This software consists of voluntary contributions made by many
- * individuals on behalf of the Apache Software Foundation. For more
- * information on the Apache Software Foundation, please see
- * <http://www.apache.org/>.
- */
-
-import junit.framework.TestCase;
-
-import java.io.BufferedReader;
-import java.io.InputStreamReader;
-import java.io.FileInputStream;
-import java.util.ArrayList;
-
-public class TestRussianStem extends TestCase
-{
- private ArrayList words = new ArrayList();
- private ArrayList stems = new ArrayList();
-
- public TestRussianStem(String name)
- {
- super(name);
- }
-
- /**
- * @see TestCase#setUp()
- */
- protected void setUp() throws Exception
- {
- super.setUp();
- //System.out.println(new java.util.Date());
- String str;
-
- // open and read words into an array list
- BufferedReader inWords =
- new BufferedReader(
- new InputStreamReader(
- new FileInputStream("src/test/org/apache/lucene/analysis/ru/wordsUnicode.txt"),
- "Unicode"));
- while ((str = inWords.readLine()) != null)
- {
- words.add(str);
- }
- inWords.close();
-
- // open and read stems into an array list
- BufferedReader inStems =
- new BufferedReader(
- new InputStreamReader(
- new FileInputStream("src/test/org/apache/lucene/analysis/ru/stemsUnicode.txt"),
- "Unicode"));
- while ((str = inStems.readLine()) != null)
- {
- stems.add(str);
- }
- inStems.close();
- }
-
- /**
- * @see TestCase#tearDown()
- */
- protected void tearDown() throws Exception
- {
- super.tearDown();
- }
-
- public void testStem()
- {
- for (int i = 0; i < words.size(); i++)
- {
- //if ( (i % 100) == 0 ) System.err.println(i);
- String realStem =
- RussianStemmer.stem(
- (String) words.get(i),
- RussianCharsets.UnicodeRussian);
- assertEquals("unicode", stems.get(i), realStem);
- }
- }
-
- private String printChars(String output)
- {
- StringBuffer s = new StringBuffer();
- for (int i = 0; i < output.length(); i++)
- {
- s.append(output.charAt(i));
- }
- return s.toString();
- }
-}
+package org.apache.lucene.analysis.ru;
+
+/* ====================================================================
+ * The Apache Software License, Version 1.1
+ *
+ * Copyright (c) 2001 The Apache Software Foundation. All rights
+ * reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ *
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in
+ * the documentation and/or other materials provided with the
+ * distribution.
+ *
+ * 3. The end-user documentation included with the redistribution,
+ * if any, must include the following acknowledgment:
+ * "This product includes software developed by the
+ * Apache Software Foundation (http://www.apache.org/)."
+ * Alternately, this acknowledgment may appear in the software itself,
+ * if and wherever such third-party acknowledgments normally appear.
+ *
+ * 4. The names "Apache" and "Apache Software Foundation" and
+ * "Apache Lucene" must not be used to endorse or promote products
+ * derived from this software without prior written permission. For
+ * written permission, please contact apache@apache.org.
+ *
+ * 5. Products derived from this software may not be called "Apache",
+ * "Apache Lucene", nor may "Apache" appear in their name, without
+ * prior written permission of the Apache Software Foundation.
+ *
+ * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
+ * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
+ * DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
+ * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
+ * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
+ * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
+ * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
+ * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
+ * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
+ * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+ * SUCH DAMAGE.
+ * ====================================================================
+ *
+ * This software consists of voluntary contributions made by many
+ * individuals on behalf of the Apache Software Foundation. For more
+ * information on the Apache Software Foundation, please see
+ * <http://www.apache.org/>.
+ */
+
+import junit.framework.TestCase;
+
+import java.io.BufferedReader;
+import java.io.File;
+import java.io.InputStreamReader;
+import java.io.FileInputStream;
+import java.util.ArrayList;
+
+public class TestRussianStem extends TestCase
+{
+ private ArrayList words = new ArrayList();
+ private ArrayList stems = new ArrayList();
+
+ public TestRussianStem(String name)
+ {
+ super(name);
+ }
+
+ /**
+ * @see TestCase#setUp()
+ */
+ protected void setUp() throws Exception
+ {
+ super.setUp();
+ //System.out.println(new java.util.Date());
+ String str;
+
+ File dataDir = new File(System.getProperty("dataDir"));
+
+ // open and read words into an array list
+ BufferedReader inWords =
+ new BufferedReader(
+ new InputStreamReader(
+ new FileInputStream(new File(dataDir, "/org/apache/lucene/analysis/ru/wordsUnicode.txt")),
+ "Unicode"));
+ while ((str = inWords.readLine()) != null)
+ {
+ words.add(str);
+ }
+ inWords.close();
+
+ // open and read stems into an array list
+ BufferedReader inStems =
+ new BufferedReader(
+ new InputStreamReader(
+ new FileInputStream(new File(dataDir, "/org/apache/lucene/analysis/ru/stemsUnicode.txt")),
+ "Unicode"));
+ while ((str = inStems.readLine()) != null)
+ {
+ stems.add(str);
+ }
+ inStems.close();
+ }
+
+ /**
+ * @see TestCase#tearDown()
+ */
+ protected void tearDown() throws Exception
+ {
+ super.tearDown();
+ }
+
+ public void testStem()
+ {
+ for (int i = 0; i < words.size(); i++)
+ {
+ //if ( (i % 100) == 0 ) System.err.println(i);
+ String realStem =
+ RussianStemmer.stem(
+ (String) words.get(i),
+ RussianCharsets.UnicodeRussian);
+ assertEquals("unicode", stems.get(i), realStem);
+ }
+ }
+
+ private String printChars(String output)
+ {
+ StringBuffer s = new StringBuffer();
+ for (int i = 0; i < output.length(); i++)
+ {
+ s.append(output.charAt(i));
+ }
+ return s.toString();
+ }
+}
---------------------------------------------------------------------
To unsubscribe, e-mail: lucene-dev-unsubscribe@jakarta.apache.org
For additional commands, e-mail: lucene-dev-help@jakarta.apache.org