You are viewing a plain text version of this content. The canonical link for it is here.
Posted to java-commits@lucene.apache.org by yo...@apache.org on 2009/02/25 21:44:05 UTC

svn commit: r747915 - in /lucene/java/trunk: ./ contrib/analyzers/src/java/org/apache/lucene/analysis/reverse/ contrib/analyzers/src/test/org/apache/lucene/analysis/reverse/

Author: yonik
Date: Wed Feb 25 20:44:05 2009
New Revision: 747915

URL: http://svn.apache.org/viewvc?rev=747915&view=rev
Log:
LUCENE-1398: Add ReverseStringFilter to contrib/analyzers

Added:
    lucene/java/trunk/contrib/analyzers/src/java/org/apache/lucene/analysis/reverse/
    lucene/java/trunk/contrib/analyzers/src/java/org/apache/lucene/analysis/reverse/ReverseStringFilter.java   (with props)
    lucene/java/trunk/contrib/analyzers/src/test/org/apache/lucene/analysis/reverse/
    lucene/java/trunk/contrib/analyzers/src/test/org/apache/lucene/analysis/reverse/TestReverseStringFilter.java   (with props)
Modified:
    lucene/java/trunk/CHANGES.txt

Modified: lucene/java/trunk/CHANGES.txt
URL: http://svn.apache.org/viewvc/lucene/java/trunk/CHANGES.txt?rev=747915&r1=747914&r2=747915&view=diff
==============================================================================
--- lucene/java/trunk/CHANGES.txt (original)
+++ lucene/java/trunk/CHANGES.txt Wed Feb 25 20:44:05 2009
@@ -159,6 +159,9 @@
     bitset.  Instead, match() is called on demand per docID.  (John
     Wang via Mike McCandless)
 
+15. LUCENE-1398: Add ReverseStringFilter to contrib/analyzers, a filter
+    to reverse the characters in each token.  (Koji Sekiguchi via yonik)
+
 Optimizations
 
  1. LUCENE-1427: Fixed QueryWrapperFilter to not waste time computing

Added: lucene/java/trunk/contrib/analyzers/src/java/org/apache/lucene/analysis/reverse/ReverseStringFilter.java
URL: http://svn.apache.org/viewvc/lucene/java/trunk/contrib/analyzers/src/java/org/apache/lucene/analysis/reverse/ReverseStringFilter.java?rev=747915&view=auto
==============================================================================
--- lucene/java/trunk/contrib/analyzers/src/java/org/apache/lucene/analysis/reverse/ReverseStringFilter.java (added)
+++ lucene/java/trunk/contrib/analyzers/src/java/org/apache/lucene/analysis/reverse/ReverseStringFilter.java Wed Feb 25 20:44:05 2009
@@ -0,0 +1,68 @@
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.lucene.analysis.reverse;
+
+import org.apache.lucene.analysis.TokenFilter;
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.Token;
+
+import java.io.IOException;
+
+/**
+ * Reverse token string e.g. "country" => "yrtnuoc".
+ *
+ * @version $Id$
+ */
+public final class ReverseStringFilter extends TokenFilter {
+
+  public ReverseStringFilter(TokenStream in) {
+    super(in);
+  }
+
+  public final Token next(Token in) throws IOException {
+    assert in != null;
+    Token token=input.next(in);
+    if( token == null ) return null;
+    reverse( token.termBuffer(), token.termLength() );
+    return token;
+  }
+
+  public static String reverse( final String input ){
+    char[] charInput = input.toCharArray();
+    reverse( charInput );
+    return new String( charInput );
+  }
+  
+  public static void reverse( char[] buffer ){
+    reverse( buffer, buffer.length );
+  }
+  
+  public static void reverse( char[] buffer, int len ){
+    reverse( buffer, 0, len );
+  }
+  
+  public static void reverse( char[] buffer, int start, int len ){
+    if( len <= 1 ) return;
+    int num = len>>1;
+    for( int i = start; i < ( start + num ); i++ ){
+      char c = buffer[i];
+      buffer[i] = buffer[start * 2 + len - i - 1];
+      buffer[start * 2 + len - i - 1] = c;
+    }
+  }
+}

Propchange: lucene/java/trunk/contrib/analyzers/src/java/org/apache/lucene/analysis/reverse/ReverseStringFilter.java
------------------------------------------------------------------------------
    svn:eol-style = native

Propchange: lucene/java/trunk/contrib/analyzers/src/java/org/apache/lucene/analysis/reverse/ReverseStringFilter.java
------------------------------------------------------------------------------
    svn:keywords = Date Author Id Revision HeadURL

Added: lucene/java/trunk/contrib/analyzers/src/test/org/apache/lucene/analysis/reverse/TestReverseStringFilter.java
URL: http://svn.apache.org/viewvc/lucene/java/trunk/contrib/analyzers/src/test/org/apache/lucene/analysis/reverse/TestReverseStringFilter.java?rev=747915&view=auto
==============================================================================
--- lucene/java/trunk/contrib/analyzers/src/test/org/apache/lucene/analysis/reverse/TestReverseStringFilter.java (added)
+++ lucene/java/trunk/contrib/analyzers/src/test/org/apache/lucene/analysis/reverse/TestReverseStringFilter.java Wed Feb 25 20:44:05 2009
@@ -0,0 +1,52 @@
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.lucene.analysis.reverse;
+
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.Token;
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.WhitespaceTokenizer;
+import org.apache.lucene.util.LuceneTestCase;
+
+public class TestReverseStringFilter extends LuceneTestCase {
+  public void testFilter() throws Exception {
+    TokenStream stream = new WhitespaceTokenizer(
+        new StringReader("Do have a nice day"));     // 1-4 length string
+    ReverseStringFilter filter = new ReverseStringFilter(stream);
+    final Token reusableToken = new Token();
+    assertEquals("oD", filter.next(reusableToken).term());
+    assertEquals("evah", filter.next(reusableToken).term());
+    assertEquals("a", filter.next(reusableToken).term());
+    assertEquals("ecin", filter.next(reusableToken).term());
+    assertEquals("yad", filter.next(reusableToken).term());
+    assertNull(filter.next(reusableToken));
+  }
+
+  public void testReverseString() throws Exception {
+    assertEquals( "A", ReverseStringFilter.reverse( "A" ) );
+    assertEquals( "BA", ReverseStringFilter.reverse( "AB" ) );
+    assertEquals( "CBA", ReverseStringFilter.reverse( "ABC" ) );
+  }
+  
+  public void testReverseChar() throws Exception {
+    char[] buffer = { 'A', 'B', 'C', 'D', 'E', 'F' };
+    ReverseStringFilter.reverse( buffer, 2, 3 );
+    assertEquals( "ABEDCF", new String( buffer ) );
+  }
+}

Propchange: lucene/java/trunk/contrib/analyzers/src/test/org/apache/lucene/analysis/reverse/TestReverseStringFilter.java
------------------------------------------------------------------------------
    svn:eol-style = native

Propchange: lucene/java/trunk/contrib/analyzers/src/test/org/apache/lucene/analysis/reverse/TestReverseStringFilter.java
------------------------------------------------------------------------------
    svn:keywords = Date Author Id Revision HeadURL