You are viewing a plain text version of this content. The canonical link for it is here.
Posted to oak-commits@jackrabbit.apache.org by th...@apache.org on 2018/04/26 08:31:39 UTC

svn commit: r1830173 - in /jackrabbit/oak/branches/1.8: ./ oak-core/src/main/java/org/apache/jackrabbit/oak/query/ oak-core/src/test/java/org/apache/jackrabbit/oak/query/ oak-jcr/ oak-jcr/src/test/java/org/apache/jackrabbit/oak/jcr/query/

Author: thomasm
Date: Thu Apr 26 08:31:39 2018
New Revision: 1830173

URL: http://svn.apache.org/viewvc?rev=1830173&view=rev
Log:
OAK-7437 SimpleExcerptProvider highlighting should be case insensitive

Modified:
    jackrabbit/oak/branches/1.8/   (props changed)
    jackrabbit/oak/branches/1.8/oak-core/src/main/java/org/apache/jackrabbit/oak/query/SimpleExcerptProvider.java
    jackrabbit/oak/branches/1.8/oak-core/src/test/java/org/apache/jackrabbit/oak/query/SimpleExcerptProviderTest.java
    jackrabbit/oak/branches/1.8/oak-jcr/   (props changed)
    jackrabbit/oak/branches/1.8/oak-jcr/src/test/java/org/apache/jackrabbit/oak/jcr/query/QueryFulltextTest.java

Propchange: jackrabbit/oak/branches/1.8/
------------------------------------------------------------------------------
--- svn:mergeinfo (original)
+++ svn:mergeinfo Thu Apr 26 08:31:39 2018
@@ -1,3 +1,3 @@
 /jackrabbit/oak/branches/1.0:1665962
-/jackrabbit/oak/trunk
+/jackrabbit/oak/trunk:1820660-1820661,1820729,1820734,1820859,1820861,1820878,1820888,1820947,1821130,1821140-1821141,1821240,1821249,1821258,1821325,1821358,1821361-1821362,1821370,1821375,1821393,1821477,1821487,1821516,1821665,1821668,1821681,1822121,1822201,1822207,1822723,1822808,1822850,1822934,1823135,1823163,1823169,1824196,1824198,1824962,1825362,1825381,1825442,1825448,1825466,1825470,1825475,1825523,1825525,1825619-1825621,1825651,1825654,1825992,1826079,1826090,1826096,1826237,1826338,1826516,1826532,1826640,1826932,1826957,1827472,1827486,1827977,1829987,1830019,1830160
 /jackrabbit/trunk:1345480

Modified: jackrabbit/oak/branches/1.8/oak-core/src/main/java/org/apache/jackrabbit/oak/query/SimpleExcerptProvider.java
URL: http://svn.apache.org/viewvc/jackrabbit/oak/branches/1.8/oak-core/src/main/java/org/apache/jackrabbit/oak/query/SimpleExcerptProvider.java?rev=1830173&r1=1830172&r2=1830173&view=diff
==============================================================================
--- jackrabbit/oak/branches/1.8/oak-core/src/main/java/org/apache/jackrabbit/oak/query/SimpleExcerptProvider.java (original)
+++ jackrabbit/oak/branches/1.8/oak-core/src/main/java/org/apache/jackrabbit/oak/query/SimpleExcerptProvider.java Thu Apr 26 08:31:39 2018
@@ -19,9 +19,12 @@ package org.apache.jackrabbit.oak.query;
 import java.util.BitSet;
 import java.util.HashSet;
 import java.util.Set;
+import java.util.regex.Matcher;
+import java.util.regex.Pattern;
 
 import com.google.common.base.Splitter;
 import com.google.common.collect.ImmutableSet;
+
 import org.apache.jackrabbit.oak.api.PropertyState;
 import org.apache.jackrabbit.oak.api.PropertyValue;
 import org.apache.jackrabbit.oak.api.Tree;
@@ -45,6 +48,8 @@ class SimpleExcerptProvider {
     static final String REP_EXCERPT_FN = "rep:excerpt(.)";
     static final String EXCERPT_END = "</span></div>";
     static final String EXCERPT_BEGIN = "<div><span>";
+    
+    private static final boolean CASE_SENSITIVE_HIGHLIGHT = Boolean.getBoolean("oak.query.caseSensitiveHighlight");
 
     private static int maxFragmentSize = 150;
 
@@ -234,7 +239,7 @@ class SimpleExcerptProvider {
         }
         int index = 0;
         while (index < text.length()) {
-            index = text.indexOf(token, index);
+            index = indexOfSearchText(text, token, index);
             if (index < 0) {
                 break;
             }
@@ -267,6 +272,26 @@ class SimpleExcerptProvider {
             }
         }
     }
+    
+    private static int indexOfSearchText(String text, String searchStr, int fromIndex) {
+        // Exact-case search only when CASE_SENSITIVE_HIGHLIGHT is set; else ignore case.
+        return CASE_SENSITIVE_HIGHLIGHT
+                ? text.indexOf(searchStr, fromIndex)
+                : indexOfIgnoreCase(text, searchStr, fromIndex);
+    }
+    
+    public static int indexOfIgnoreCase(String str, String searchStr, int startPos) {
+        // Scan with String.regionMatches(ignoreCase = true) instead of compiling a
+        // regex per call; this also folds non-ASCII letters and tolerates an
+        // out-of-range startPos (negative is treated as 0, too large yields -1).
+        int lastStart = str.length() - searchStr.length();
+        for (int i = Math.max(startPos, 0); i <= lastStart; i++) {
+            if (str.regionMatches(true, i, searchStr, 0, searchStr.length())) {
+                return i;
+            }
+        }
+        return -1;
+    }
 
     static boolean isDelimeter(int codePoint) {
         return !isLetterOrDigit(codePoint);

Modified: jackrabbit/oak/branches/1.8/oak-core/src/test/java/org/apache/jackrabbit/oak/query/SimpleExcerptProviderTest.java
URL: http://svn.apache.org/viewvc/jackrabbit/oak/branches/1.8/oak-core/src/test/java/org/apache/jackrabbit/oak/query/SimpleExcerptProviderTest.java?rev=1830173&r1=1830172&r2=1830173&view=diff
==============================================================================
--- jackrabbit/oak/branches/1.8/oak-core/src/test/java/org/apache/jackrabbit/oak/query/SimpleExcerptProviderTest.java (original)
+++ jackrabbit/oak/branches/1.8/oak-core/src/test/java/org/apache/jackrabbit/oak/query/SimpleExcerptProviderTest.java Thu Apr 26 08:31:39 2018
@@ -32,6 +32,18 @@ import org.junit.Test;
 public class SimpleExcerptProviderTest {
 
     @Test
+    public void caseInsensitiveTest() throws Exception {
+        // Highlighting is case insensitive by default; enabling this would make the test fail:
+        // static {
+        //     System.setProperty("oak.query.caseSensitiveHighlight", "true");
+        // }
+        assertEquals("<div><span><strong>fox</strong> is jumping and dancing foxtrot</span></div>",
+                highlight(sb("fox is jumping and dancing foxtrot"), of("Fox")));
+        assertEquals("<div><span>fox is <strong>jumping</strong></span></div>",
+                highlight(sb("fox is jumping"), of("jUmP*")));
+    }
+
+    @Test
     public void simpleTest() throws Exception {
         assertEquals("<div><span><strong>fox</strong> is jumping</span></div>",
                 highlight(sb("fox is jumping"), of("fox")));

Propchange: jackrabbit/oak/branches/1.8/oak-jcr/
------------------------------------------------------------------------------
--- svn:mergeinfo (added)
+++ svn:mergeinfo Thu Apr 26 08:31:39 2018
@@ -0,0 +1,3 @@
+/jackrabbit/oak/branches/1.0/oak-jcr:1665962
+/jackrabbit/oak/trunk/oak-jcr
+/jackrabbit/trunk/oak-jcr:1345480

Modified: jackrabbit/oak/branches/1.8/oak-jcr/src/test/java/org/apache/jackrabbit/oak/jcr/query/QueryFulltextTest.java
URL: http://svn.apache.org/viewvc/jackrabbit/oak/branches/1.8/oak-jcr/src/test/java/org/apache/jackrabbit/oak/jcr/query/QueryFulltextTest.java?rev=1830173&r1=1830172&r2=1830173&view=diff
==============================================================================
--- jackrabbit/oak/branches/1.8/oak-jcr/src/test/java/org/apache/jackrabbit/oak/jcr/query/QueryFulltextTest.java (original)
+++ jackrabbit/oak/branches/1.8/oak-jcr/src/test/java/org/apache/jackrabbit/oak/jcr/query/QueryFulltextTest.java Thu Apr 26 08:31:39 2018
@@ -42,7 +42,7 @@ public class QueryFulltextTest extends A
     public QueryFulltextTest(NodeStoreFixture fixture) {
         super(fixture);
     }
-    
+
     @Test
     public void excerpt() throws Exception {
         Session session = getAdminSession();
@@ -60,9 +60,9 @@ public class QueryFulltextTest extends A
         RowIterator it;
         Row row;
         String s;
-        
+
         String xpath = "//*[jcr:contains(., 'hello')]/rep:excerpt(.) order by @jcr:path";
-        
+
         q = qm.createQuery(xpath, "xpath");
         it = q.execute().getRows();
         row = it.nextRow();
@@ -73,10 +73,9 @@ public class QueryFulltextTest extends A
         row = it.nextRow();
         path = row.getPath();
         s = row.getValue("rep:excerpt(.)").getString();
-        // TODO is this expected?
-        assertTrue(path + ":" + s + " (3)", s.indexOf("Hello World") >= 0);
+        assertTrue(path + ":" + s + " (3)", s.indexOf("<strong>Hello</strong> World") >= 0);
         assertTrue(path + ":" + s + " (4)", s.indexOf("Description") >= 0);
-        
+
         xpath = "//*[jcr:contains(., 'hello')]/rep:excerpt(.) order by @jcr:path";
 
         q = qm.createQuery(xpath, "xpath");
@@ -89,11 +88,10 @@ public class QueryFulltextTest extends A
         row = it.nextRow();
         path = row.getPath();
         s = row.getValue("rep:excerpt(text)").getString();
-        // TODO is this expected?
-        assertTrue(path + ":" + s + " (7)", s.indexOf("Hello World") >= 0);
+        assertTrue(path + ":" + s + " (7)", s.indexOf("<strong>Hello</strong> World") >= 0);
         assertTrue(path + ":" + s + " (8)", s.indexOf("Description") < 0);
     }
-    
+
     @Test
     public void fulltextOrWithinText() throws Exception {
         Session session = getAdminSession();
@@ -106,18 +104,18 @@ public class QueryFulltextTest extends A
         Node n3 = testRootNode.addNode("node3");
         n3.setProperty("text", "hello hallo");
         session.save();
-       
-        String sql2 = "select [jcr:path] as [path] from [nt:base] " + 
+
+        String sql2 = "select [jcr:path] as [path] from [nt:base] " +
                 "where contains([text], 'hello OR hallo') order by [jcr:path]";
-        
+
         Query q;
-        
+
         q = qm.createQuery("explain " + sql2, Query.JCR_SQL2);
 
-        assertEquals("[nt:base] as [nt:base] /* traverse \"*\" " + 
+        assertEquals("[nt:base] as [nt:base] /* traverse \"*\" " +
                 "where contains([nt:base].[text], 'hello OR hallo') */",
                 getResult(q.execute(), "plan"));
-        
+
         // verify the result
         // uppercase "OR" mean logical "or"
         q = qm.createQuery(sql2, Query.JCR_SQL2);
@@ -125,14 +123,14 @@ public class QueryFulltextTest extends A
                 getResult(q.execute(), "path"));
 
         // lowercase "or" mean search for the term "or"
-        sql2 = "select [jcr:path] as [path] from [nt:base] " + 
+        sql2 = "select [jcr:path] as [path] from [nt:base] " +
                 "where contains([text], 'hello or hallo') order by [jcr:path]";
         q = qm.createQuery(sql2, Query.JCR_SQL2);
-        assertEquals("", 
+        assertEquals("",
                 getResult(q.execute(), "path"));
 
     }
-    
+
     static String getResult(QueryResult result, String propertyName) throws RepositoryException {
         StringBuilder buff = new StringBuilder();
         RowIterator it = result.getRows();
@@ -144,5 +142,5 @@ public class QueryFulltextTest extends A
         }
         return buff.toString();
     }
-    
+
 }