You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@lucene.apache.org by ch...@apache.org on 2012/04/27 07:18:40 UTC
svn commit: r1331220 [2/2] - in /lucene/dev/trunk:
lucene/core/src/java/org/apache/lucene/util/
lucene/core/src/test/org/apache/lucene/util/ solr/
solr/contrib/analysis-extras/src/test/org/apache/solr/analysis/
solr/core/src/java/org/apache/solr/analys...
Modified: lucene/dev/trunk/solr/core/src/test/org/apache/solr/analysis/TestUAX29URLEmailTokenizerFactory.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/core/src/test/org/apache/solr/analysis/TestUAX29URLEmailTokenizerFactory.java?rev=1331220&r1=1331219&r2=1331220&view=diff
==============================================================================
--- lucene/dev/trunk/solr/core/src/test/org/apache/solr/analysis/TestUAX29URLEmailTokenizerFactory.java (original)
+++ lucene/dev/trunk/solr/core/src/test/org/apache/solr/analysis/TestUAX29URLEmailTokenizerFactory.java Fri Apr 27 05:18:38 2012
@@ -24,6 +24,7 @@ import java.util.HashMap;
import java.util.Map;
import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.util.Version;
/**
* A few tests based on org.apache.lucene.analysis.TestUAX29URLEmailTokenizer
@@ -34,7 +35,8 @@ public class TestUAX29URLEmailTokenizerF
public void testUAX29URLEmailTokenizer() throws Exception {
Reader reader = new StringReader("Wha\u0301t's this thing do?");
UAX29URLEmailTokenizerFactory factory = new UAX29URLEmailTokenizerFactory();
- factory.init(DEFAULT_VERSION_PARAM);
+ factory.setLuceneMatchVersion(DEFAULT_VERSION);
+ factory.init(EMPTY_PARAMS);
Tokenizer stream = factory.create(reader);
assertTokenStreamContents(stream,
new String[] {"Wha\u0301t's", "this", "thing", "do" });
@@ -43,7 +45,8 @@ public class TestUAX29URLEmailTokenizerF
public void testArabic() throws Exception {
Reader reader = new StringReader("اÙÙÙÙÙ
اÙÙثائÙ٠اÙØ£Ù٠ع٠ÙÙÙÙبÙدÙا ÙسÙ
Ù \"اÙØÙÙÙØ© باÙأرÙاÙ
: Ùصة ÙÙÙÙبÙدÙا\" (باÙØ¥ÙجÙÙزÙØ©: Truth in Numbers: The Wikipedia Story)Ø Ø³ÙتÙ
إطÙاÙÙ ÙÙ 2008.");
UAX29URLEmailTokenizerFactory factory = new UAX29URLEmailTokenizerFactory();
- factory.init(DEFAULT_VERSION_PARAM);
+ factory.setLuceneMatchVersion(DEFAULT_VERSION);
+ factory.init(EMPTY_PARAMS);
Tokenizer stream = factory.create(reader);
assertTokenStreamContents(stream,
new String[] {"اÙÙÙÙÙ
", "اÙÙثائÙÙ", "اÙØ£ÙÙ", "عÙ", "ÙÙÙÙبÙدÙا", "ÙسÙ
Ù", "اÙØÙÙÙØ©", "باÙأرÙاÙ
", "Ùصة", "ÙÙÙÙبÙدÙا",
@@ -53,7 +56,8 @@ public class TestUAX29URLEmailTokenizerF
public void testChinese() throws Exception {
Reader reader = new StringReader("ææ¯ä¸å½äººã ï¼ï¼ï¼ï¼ ï¼´ï½
ï½ï½ï½ ");
UAX29URLEmailTokenizerFactory factory = new UAX29URLEmailTokenizerFactory();
- factory.init(DEFAULT_VERSION_PARAM);
+ factory.setLuceneMatchVersion(DEFAULT_VERSION);
+ factory.init(EMPTY_PARAMS);
Tokenizer stream = factory.create(reader);
assertTokenStreamContents(stream,
new String[] {"æ", "æ¯", "ä¸", "å½", "人", "ï¼ï¼ï¼ï¼", "ï¼´ï½
ï½ï½ï½"});
@@ -62,7 +66,8 @@ public class TestUAX29URLEmailTokenizerF
public void testKorean() throws Exception {
Reader reader = new StringReader("ìë
íì¸ì íê¸ì
ëë¤");
UAX29URLEmailTokenizerFactory factory = new UAX29URLEmailTokenizerFactory();
- factory.init(DEFAULT_VERSION_PARAM);
+ factory.setLuceneMatchVersion(DEFAULT_VERSION);
+ factory.init(EMPTY_PARAMS);
Tokenizer stream = factory.create(reader);
assertTokenStreamContents(stream,
new String[] {"ìë
íì¸ì", "íê¸ì
ëë¤"});
@@ -71,7 +76,8 @@ public class TestUAX29URLEmailTokenizerF
public void testHyphen() throws Exception {
Reader reader = new StringReader("some-dashed-phrase");
UAX29URLEmailTokenizerFactory factory = new UAX29URLEmailTokenizerFactory();
- factory.init(DEFAULT_VERSION_PARAM);
+ factory.setLuceneMatchVersion(DEFAULT_VERSION);
+ factory.init(EMPTY_PARAMS);
Tokenizer stream = factory.create(reader);
assertTokenStreamContents(stream,
new String[] {"some", "dashed", "phrase"});
@@ -95,7 +101,8 @@ public class TestUAX29URLEmailTokenizerF
+ "http://[a42:a7b6::]/qSmxSUU4z/%52qVl4\n";
Reader reader = new StringReader(textWithURLs);
UAX29URLEmailTokenizerFactory factory = new UAX29URLEmailTokenizerFactory();
- factory.init(DEFAULT_VERSION_PARAM);
+ factory.setLuceneMatchVersion(DEFAULT_VERSION);
+ factory.init(EMPTY_PARAMS);
Tokenizer stream = factory.create(reader);
assertTokenStreamContents(stream,
new String[] {
@@ -135,7 +142,8 @@ public class TestUAX29URLEmailTokenizerF
+ "lv'p@tqk.vj5s0tgl.0dlu7su3iyiaz.dqso.494.3hb76.XN--MGBAAM7A8H\n";
Reader reader = new StringReader(textWithEmails);
UAX29URLEmailTokenizerFactory factory = new UAX29URLEmailTokenizerFactory();
- factory.init(DEFAULT_VERSION_PARAM);
+ factory.setLuceneMatchVersion(DEFAULT_VERSION);
+ factory.init(EMPTY_PARAMS);
Tokenizer stream = factory.create(reader);
assertTokenStreamContents(stream,
new String[] {
@@ -166,9 +174,9 @@ public class TestUAX29URLEmailTokenizerF
String content = "one two three " + longWord + " four five six";
Reader reader = new StringReader(content);
Map<String,String> args = new HashMap<String,String>();
- args.put("luceneMatchVersion", DEFAULT_VERSION_PARAM.get("luceneMatchVersion"));
args.put("maxTokenLength", "1000");
UAX29URLEmailTokenizerFactory factory = new UAX29URLEmailTokenizerFactory();
+ factory.setLuceneMatchVersion(DEFAULT_VERSION);
factory.init(args);
Tokenizer stream = factory.create(reader);
assertTokenStreamContents(stream,
@@ -180,14 +188,16 @@ public class TestUAX29URLEmailTokenizerF
public void testMatchVersion() throws Exception {
Reader reader = new StringReader("ãã");
UAX29URLEmailTokenizerFactory factory = new UAX29URLEmailTokenizerFactory();
- factory.init(DEFAULT_VERSION_PARAM);
+ factory.setLuceneMatchVersion(DEFAULT_VERSION);
+ factory.init(EMPTY_PARAMS);
Tokenizer stream = factory.create(reader);
assertTokenStreamContents(stream,
new String[] {"ãã"});
reader = new StringReader("ãã");
factory = new UAX29URLEmailTokenizerFactory();
- factory.init(Collections.singletonMap("luceneMatchVersion", "3.1"));
+ factory.setLuceneMatchVersion(Version.LUCENE_31);
+ factory.init(EMPTY_PARAMS);
stream = factory.create(reader);
assertTokenStreamContents(stream,
new String[] {"ã"}); // old broken behavior
Modified: lucene/dev/trunk/solr/test-framework/src/java/org/apache/solr/analysis/BaseTokenTestCase.java
URL: http://svn.apache.org/viewvc/lucene/dev/trunk/solr/test-framework/src/java/org/apache/solr/analysis/BaseTokenTestCase.java?rev=1331220&r1=1331219&r2=1331220&view=diff
==============================================================================
--- lucene/dev/trunk/solr/test-framework/src/java/org/apache/solr/analysis/BaseTokenTestCase.java (original)
+++ lucene/dev/trunk/solr/test-framework/src/java/org/apache/solr/analysis/BaseTokenTestCase.java Fri Apr 27 05:18:38 2012
@@ -27,12 +27,19 @@ import org.apache.solr.core.Config;
/**
* General token testing helper functions
*/
-public abstract class BaseTokenTestCase extends BaseTokenStreamTestCase
-{
- /** a map containing the default test version param for easy testing */
- protected static final Map<String,String> DEFAULT_VERSION_PARAM =
- Collections.singletonMap("luceneMatchVersion", System.getProperty("tests.luceneMatchVersion", "LUCENE_CURRENT"));
+public abstract class BaseTokenTestCase extends BaseTokenStreamTestCase{
+
+ protected static final Map<String, String> EMPTY_PARAMS = Collections.emptyMap();
/** The default test version for easy testing */
- public static final Version DEFAULT_VERSION = Config.parseLuceneVersionString(DEFAULT_VERSION_PARAM.get("luceneMatchVersion"));
+ public static final Version DEFAULT_VERSION;
+
+ static {
+ String rawVersion = System.getProperty("tests.luceneMatchVersion", "LUCENE_CURRENT");
+ try {
+ DEFAULT_VERSION = Version.parseLeniently(rawVersion);
+ } catch (IllegalArgumentException iae) {
+ throw new RuntimeException("Test Lucene Match Version [" + rawVersion + "] is invalid", iae);
+ }
+ }
}