You are viewing a plain text version of this content. The canonical link for it is here.

Posted to commits@jena.apache.org by os...@apache.org on 2015/12/16 10:53:56 UTC

[1/2] jena git commit: add failing unit test for JENA-1093

Repository: jena
Updated Branches:
  refs/heads/master b6192a9e1 -> 67f9905de


add failing unit test for JENA-1093


Project: http://git-wip-us.apache.org/repos/asf/jena/repo
Commit: http://git-wip-us.apache.org/repos/asf/jena/commit/4bf7319c
Tree: http://git-wip-us.apache.org/repos/asf/jena/tree/4bf7319c
Diff: http://git-wip-us.apache.org/repos/asf/jena/diff/4bf7319c

Branch: refs/heads/master
Commit: 4bf7319c31cb3c65c0ab18e67477d4d24ad5c8ed
Parents: b6192a9
Author: Osma Suominen <os...@apache.org>
Authored: Tue Dec 15 16:52:08 2015 +0200
Committer: Osma Suominen <os...@apache.org>
Committed: Tue Dec 15 16:52:08 2015 +0200

----------------------------------------------------------------------
 .../TestDatasetWithLuceneStoredLiterals.java    | 58 ++++++++++++++++++++
 1 file changed, 58 insertions(+)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/jena/blob/4bf7319c/jena-text/src/test/java/org/apache/jena/query/text/TestDatasetWithLuceneStoredLiterals.java
----------------------------------------------------------------------
diff --git a/jena-text/src/test/java/org/apache/jena/query/text/TestDatasetWithLuceneStoredLiterals.java b/jena-text/src/test/java/org/apache/jena/query/text/TestDatasetWithLuceneStoredLiterals.java
index b55bbd7..659a0dd 100644
--- a/jena-text/src/test/java/org/apache/jena/query/text/TestDatasetWithLuceneStoredLiterals.java
+++ b/jena-text/src/test/java/org/apache/jena/query/text/TestDatasetWithLuceneStoredLiterals.java
@@ -27,12 +27,15 @@ import java.io.StringReader ;
 import java.util.Arrays ;
 import java.util.HashMap ;
 import java.util.HashSet ;
+import java.util.LinkedList ;
+import java.util.List ;
 import java.util.Map ;
 import java.util.Set ;
 
 import org.apache.jena.assembler.Assembler ;
 import org.apache.jena.atlas.lib.StrUtils ;
 import org.apache.jena.datatypes.xsd.XSDDatatype ;
+import org.apache.jena.graph.Node ;
 import org.apache.jena.graph.NodeFactory ;
 import org.apache.jena.query.Dataset ;
 import org.apache.jena.query.Query ;
@@ -147,6 +150,35 @@ public class TestDatasetWithLuceneStoredLiterals extends AbstractTestDatasetWith
         return literals;
     }
 
+    protected List<Node> doTestSearchWithLiteralsMultiple(String turtle, String queryString, String expectedEntityURI) {
+        List<Node> literals = new LinkedList<>();
+        Model model = dataset.getDefaultModel();
+        Reader reader = new StringReader(turtle);
+        dataset.begin(ReadWrite.WRITE);
+        model.read(reader, "", "TURTLE");
+        dataset.commit();
+
+        Query query = QueryFactory.create(queryString) ;
+        dataset.begin(ReadWrite.READ);
+        try(QueryExecution qexec = QueryExecutionFactory.create(query, dataset)) {
+            ResultSet results = qexec.execSelect() ;
+            int count;
+            for (count=0; results.hasNext(); count++) {
+                QuerySolution soln = results.nextSolution();
+                String entityURI = soln.getResource("s").getURI();
+                assertEquals(expectedEntityURI, entityURI);
+                Literal literal = soln.getLiteral("literal");
+                assertNotNull(literal);
+                literals.add(literal.asNode());
+            }
+        }
+        finally {
+            dataset.end() ;
+        }
+        return literals;
+    }
+
+
     @Test
     public void testLiteralValue() {
         // test basic capturing of the literal value in a variable
@@ -245,4 +277,30 @@ public class TestDatasetWithLuceneStoredLiterals extends AbstractTestDatasetWith
         assertEquals(NodeFactory.createLiteral("true", XSDDatatype.XSDboolean), value.asNode());
     }
 
+    @Test
+    public void testLiteralValueMultiple() {
+        // test capturing of multiple matching literal values in a variable
+        final String testName = "testLiteralValueMultiple";
+        final String turtle = StrUtils.strjoinNL(
+                TURTLE_PROLOG,
+                "<" + RESOURCE_BASE + testName + ">",
+                "  rdfs:comment 'a nontext comment', 'another nontext comment'",
+                "."
+                );
+        String queryString = StrUtils.strjoinNL(
+                QUERY_PROLOG,
+                "SELECT ?s ?literal",
+                "WHERE {",
+                "    (?s ?score ?literal) text:query (rdfs:comment 'nontext') .",
+                "}"
+                );
+
+        String expectedURI = RESOURCE_BASE + testName;
+        List<Node> literals = doTestSearchWithLiteralsMultiple(turtle, queryString, expectedURI);
+
+        assertEquals(2, literals.size());
+        assertTrue(literals.contains(NodeFactory.createLiteral("a nontext comment")));
+        assertTrue(literals.contains(NodeFactory.createLiteral("another nontext comment")));
+    }
+
 }

[2/2] jena git commit: Revert TextQueryPF changes in "JENA-999 - Fix performance of jena-text when subject variable is bound" This reverts part of commit d6adcc17712a3b44cfe6d4264f75fb44ddcc7f67.

Posted by os...@apache.org.

Revert TextQueryPF changes in "JENA-999 - Fix performance of jena-text when subject variable is bound"
This reverts part of commit d6adcc17712a3b44cfe6d4264f75fb44ddcc7f67.


Project: http://git-wip-us.apache.org/repos/asf/jena/repo
Commit: http://git-wip-us.apache.org/repos/asf/jena/commit/67f9905d
Tree: http://git-wip-us.apache.org/repos/asf/jena/tree/67f9905d
Diff: http://git-wip-us.apache.org/repos/asf/jena/diff/67f9905d

Branch: refs/heads/master
Commit: 67f9905def78a37de08aa7522bbbb9c72344cfb8
Parents: 4bf7319
Author: Osma Suominen <os...@apache.org>
Authored: Tue Dec 15 17:42:37 2015 +0200
Committer: Osma Suominen <os...@apache.org>
Committed: Wed Dec 16 09:17:02 2015 +0200

----------------------------------------------------------------------
 .../org/apache/jena/query/text/TextQueryPF.java | 914 ++++++++-----------
 1 file changed, 388 insertions(+), 526 deletions(-)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/jena/blob/67f9905d/jena-text/src/main/java/org/apache/jena/query/text/TextQueryPF.java
----------------------------------------------------------------------
diff --git a/jena-text/src/main/java/org/apache/jena/query/text/TextQueryPF.java b/jena-text/src/main/java/org/apache/jena/query/text/TextQueryPF.java
index ab297e0..e0a8a37 100644
--- a/jena-text/src/main/java/org/apache/jena/query/text/TextQueryPF.java
+++ b/jena-text/src/main/java/org/apache/jena/query/text/TextQueryPF.java
@@ -1,526 +1,388 @@
-/*
- * Licensed to the Apache Software Foundation (ASF) under one
- * or more contributor license agreements.  See the NOTICE file
- * distributed with this work for additional information
- * regarding copyright ownership.  The ASF licenses this file
- * to you under the Apache License, Version 2.0 (the
- * "License"); you may not use this file except in compliance
- * with the License.  You may obtain a copy of the License at
- *
- *     http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-package org.apache.jena.query.text;
-
-import java.util.Collection ;
-import java.util.Iterator ;
-import java.util.LinkedHashMap ;
-import java.util.List ;
-import java.util.Map ;
-import java.util.function.Function ;
-
-import org.apache.jena.atlas.io.IndentedWriter ;
-import org.apache.jena.atlas.iterator.Iter ;
-import org.apache.jena.datatypes.RDFDatatype ;
-import org.apache.jena.datatypes.xsd.XSDDatatype ;
-import org.apache.jena.graph.Node ;
-import org.apache.jena.query.QueryBuildException ;
-import org.apache.jena.query.QueryExecException ;
-import org.apache.jena.sparql.core.DatasetGraph ;
-import org.apache.jena.sparql.core.GraphView ;
-import org.apache.jena.sparql.core.Quad ;
-import org.apache.jena.sparql.core.Substitute ;
-import org.apache.jena.sparql.core.Var ;
-import org.apache.jena.sparql.engine.ExecutionContext ;
-import org.apache.jena.sparql.engine.QueryIterator ;
-import org.apache.jena.sparql.engine.binding.Binding ;
-import org.apache.jena.sparql.engine.binding.BindingFactory ;
-import org.apache.jena.sparql.engine.binding.BindingMap ;
-import org.apache.jena.sparql.engine.iterator.QueryIterPlainWrapper ;
-import org.apache.jena.sparql.engine.iterator.QueryIterRepeatApply ;
-import org.apache.jena.sparql.engine.iterator.QueryIterSlice ;
-import org.apache.jena.sparql.mgt.Explain ;
-import org.apache.jena.sparql.pfunction.PropFuncArg ;
-import org.apache.jena.sparql.pfunction.PropFuncArgType ;
-import org.apache.jena.sparql.pfunction.PropertyFunction ;
-import org.apache.jena.sparql.serializer.SerializationContext ;
-import org.apache.jena.sparql.util.Context ;
-import org.apache.jena.sparql.util.FmtUtils ;
-import org.apache.jena.sparql.util.IterLib ;
-import org.apache.jena.sparql.util.NodeFactoryExtra ;
-import org.apache.jena.sparql.util.Symbol ;
-import org.apache.lucene.queryparser.flexible.standard.QueryParserUtil ;
-import org.slf4j.Logger ;
-import org.slf4j.LoggerFactory ;
-
-/**
- * Property function that performs a text query against a {@link TextIndex}.
- */
-public class TextQueryPF implements PropertyFunction
-{
-    private static Logger log = LoggerFactory.getLogger(TextQueryPF.class) ;
-    /*
-     * (?uri ?score) :queryPF (property? "string" limit? score?) 
-     */
-
-    private TextIndex     textIndex        = null ;
-    private boolean       warningIssued    = false ;
-    private String        langArg          = null ;
-
-    public TextQueryPF() { }
-
-
-    @Override
-    public void build(PropFuncArg argSubject, Node predicate, PropFuncArg argObject, ExecutionContext execCxt) {
-        if ( PropFuncArgType.PF_ARG_EITHER.equals(PropFuncArgType.PF_ARG_SINGLE) )
-            if ( argSubject.isList() )
-                throw new QueryBuildException("List arguments (subject) to "+predicate.getURI()) ;
-        
-        if ( PropFuncArgType.PF_ARG_EITHER.equals(PropFuncArgType.PF_ARG_LIST) && ! argSubject.isList() )
-                throw new QueryBuildException("Single argument, list expected (subject) to "+predicate.getURI()) ;
-
-        if ( PropFuncArgType.PF_ARG_EITHER.equals(PropFuncArgType.PF_ARG_SINGLE) && argObject.isList() )
-        {
-            if ( ! argObject.isNode() )
-                // But allow rdf:nil.
-                throw new QueryBuildException("List arguments (object) to "+predicate.getURI()) ;
-        }
-        
-        if ( PropFuncArgType.PF_ARG_EITHER.equals(PropFuncArgType.PF_ARG_LIST) )
-            if ( ! argObject.isList() )
-                throw new QueryBuildException("Single argument, list expected (object) to "+predicate.getURI()) ;        
-        
-        DatasetGraph dsg = execCxt.getDataset() ;
-        textIndex = chooseTextIndex(dsg) ;
-
-        if (argSubject.isList()) {
-            int size = argSubject.getArgListSize();
-            if (size != 2 && size != 3) {
-                throw new QueryBuildException("Subject has "+argSubject.getArgList().size()+" elements, not 2 or 3: "+argSubject);
-            }
-        }
-
-        if (argObject.isList()) {
-            List<Node> list = argObject.getArgList() ;
-
-            if (list.size() == 0)
-                throw new QueryBuildException("Zero-length argument list") ;
-
-            if (list.size() > 4)
-                throw new QueryBuildException("Too many arguments in list : " + list) ;
-            
-            
-            //extract of extra lang arg if present and if is usable.
-            //arg is removed from the list to avoid conflict with order and args length
-            langArg = extractArg("lang", list);
-
-            if (langArg != null && textIndex.getDocDef().getLangField() == null)
-                log.warn("lang argument is ignored if langField not set in the index configuration");
-            
-        }
-    }
-    
-    private static TextIndex chooseTextIndex(DatasetGraph dsg) {
-        
-        Context c = dsg.getContext() ; 
-        
-        Object obj = dsg.getContext().get(TextQuery.textIndex) ;
-
-        if (obj != null) {
-            try {
-                return (TextIndex)obj ;
-            } catch (ClassCastException ex) {
-                log.warn("Context setting '" + TextQuery.textIndex + "'is not a TextIndex") ;
-            }
-        }
-
-        if (dsg instanceof DatasetGraphText) {
-            DatasetGraphText x = (DatasetGraphText)dsg ;
-            return x.getTextIndex() ;
-        }
-        log.warn("Failed to find the text index : tried context and as a text-enabled dataset") ;
-        return null ;
-    }
-
-    private String extractArg(String prefix, List<Node> objArgs) {
-        String value = null;
-        int pos = 0;
-        for (Node node : objArgs) {
-            if (node.isLiteral()) {
-                String arg = node.getLiteral().toString();
-                if (arg.startsWith(prefix + ":")) {
-                    value = arg.split(":")[1];
-                    break;
-                }
-            }
-            pos++;
-        }
-        if (value != null)
-            objArgs.remove(pos);
-
-        return value;
-    }
-
-    @Override
-    public QueryIterator exec(QueryIterator input, PropFuncArg argSubject, Node predicate, PropFuncArg argObject, ExecutionContext execCxt) {
-        if (textIndex == null) {
-            if (!warningIssued) {
-                log.warn("No text index - no text search performed") ;
-                warningIssued = true ;
-            }
-            // Not a text dataset - no-op
-            return input ;
-        }
-        
-        // If the search term is already bound (i.e. it is not dynamically specified by the input QueryIterator), then we can issue the query once and cache the result
-        Map<String,TextHit> textResults = null;
-        StrMatch match = objectToStruct(argObject, execCxt, false);
-        if (null != match) {
-            List<TextHit> hits = query(match.getProperty(), match.getQueryString(), match.getLimit(), execCxt);
-            textResults = new LinkedHashMap<String,TextHit>();
-            for (TextHit hit : hits) {
-                textResults.putIfAbsent(hit.getNode().getURI(), hit);
-            }
-        }
-        
-        return new RepeatApplyIteratorTextQuery(input, argSubject, predicate, argObject, execCxt, textResults) ;
-    }
-    
-    
-    private QueryIterator exec(Binding binding, PropFuncArg argSubject, Node predicate, PropFuncArg argObject, ExecutionContext execCxt, Map<String,TextHit> textResults) {
-        DatasetGraph dsg = execCxt.getDataset() ;
-
-        argSubject = Substitute.substitute(argSubject, binding) ;
-        argObject = Substitute.substitute(argObject, binding) ;
-        
-        Node s = null;
-        Node score = null;
-        Node literal = null;
-
-        if (argSubject.isList()) {
-            // Length checked in build()
-            s = argSubject.getArg(0);
-            score = argSubject.getArg(1);
-            
-            if (!score.isVariable())
-                throw new QueryExecException("Hit score is not a variable: "+argSubject) ;
-
-            if (argSubject.getArgListSize() > 2) {
-                literal = argSubject.getArg(2);
-                if (!literal.isVariable())
-                    throw new QueryExecException("Hit literal is not a variable: "+argSubject) ;
-            }
-        }
-        else {
-            s = argSubject.getArg() ;
-        }
-
-        if (s.isLiteral())
-            // Does not match
-            return IterLib.noResults(execCxt) ;
-        
-        StrMatch match = objectToStruct(argObject, execCxt, true) ;
-        if (match == null) {
-            // can't match
-            return IterLib.noResults(execCxt) ;
-        }
-
-        // ----
-        
-        QueryIterator qIter = (Var.isVar(s)) 
-            ? variableSubject(binding, s, score, literal, match, execCxt, textResults)
-            : concreteSubject(binding, s, score, literal, match, execCxt, textResults) ;
-        if (match.getLimit() >= 0)
-            qIter = new QueryIterSlice(qIter, 0, match.getLimit(), execCxt) ;
-        return qIter ;
-    }
-    
-    private QueryIterator variableSubject(Binding binding, Node s, Node score, Node literal, StrMatch match, ExecutionContext execCxt, Map<String,TextHit> textResults) {
-        Var sVar = Var.alloc(s) ;
-        Var scoreVar = (score==null) ? null : Var.alloc(score) ;
-        Var literalVar = (literal==null) ? null : Var.alloc(literal) ;
-        Collection<TextHit> r = (null != textResults) ? textResults.values() : query(match.getProperty(), match.getQueryString(), match.getLimit(), execCxt) ;
-        Function<TextHit,Binding> converter = new TextHitConverter(binding, sVar, scoreVar, literalVar);
-        Iterator<Binding> bIter = Iter.map(r.iterator(), converter);
-        QueryIterator qIter = new QueryIterPlainWrapper(bIter, execCxt);
-        return qIter ;
-    }
-    
-    private static final Symbol cacheSymbol = Symbol.create("TextQueryPF.cache");
-    
-    private QueryIterator concreteSubject(Binding binding, Node s, Node score, Node literal, StrMatch match, ExecutionContext execCxt, Map<String,TextHit> textResults) {
-        if (!s.isURI()) {
-            log.warn("Subject not a URI: " + s) ;
-            return IterLib.noResults(execCxt) ;
-        }
-        
-        final Var scoreVar = (score==null) ? null : Var.alloc(score) ;
-        final Var literalVar = (literal==null) ? null : Var.alloc(literal) ;
-        
-        if (null != textResults) {
-            // The fast path!  The search term was static, so we already have the results, and can do a hash-join
-            TextHit hit = textResults.get(s.getURI());
-            if (null != hit) {
-                // found the node among the hits
-                if (literalVar == null) {
-                    return (scoreVar == null) ?
-                        IterLib.result(binding, execCxt) :
-                        IterLib.oneResult(binding, scoreVar, NodeFactoryExtra.floatToNode(hit.getScore()), execCxt);
-                }
-                BindingMap bmap = BindingFactory.create(binding);
-                if (scoreVar != null) {
-                    bmap.add(scoreVar, NodeFactoryExtra.floatToNode(hit.getScore()));
-                }
-                bmap.add(literalVar, hit.getLiteral());
-                return IterLib.result(bmap, execCxt) ;
-            }
-        }
-        else {
-            // The slow path!  Since the search term is dynamic, we have to issue a query every iteration
-            if (scoreVar == null)
-            {
-                // If the score var is null, then we can at least do an index join with our query by adding the subject as a parameter to the query
-                String queryString = textIndex.getDocDef().getEntityField() + ":" + QueryParserUtil.escape(s.getURI()) + " AND (" + match.getQueryString() + ")" ;
-                List<TextHit> x = query(match.getProperty(), queryString, -1, execCxt) ;
-                
-                if ( x == null || x.size() == 0 ) // null return value - empty result
-                    return IterLib.noResults(execCxt) ;
-                
-                // Just use the first hit
-                TextHit hit = x.get(0) ;
-                return (literalVar == null) ?
-                    IterLib.result(binding, execCxt) :
-                    IterLib.oneResult(binding, literalVar, hit.getLiteral(), execCxt) ;
-            }
-            else
-            {
-                // If the score var is specified, then we have to issue the query and then perform an inefficient local join so that the score remains accurate
-                List<TextHit> x = query(match.getProperty(), match.getQueryString(), -1, execCxt) ;
-                
-                if ( x == null ) { // null return value - empty result
-                    return IterLib.noResults(execCxt) ;
-                }
-                
-                for (TextHit hit : x ) {
-                    if (hit.getNode().equals(s)) {
-                        // found the node among the hits
-                        if (literalVar == null) {
-                            return IterLib.oneResult(binding, scoreVar, NodeFactoryExtra.floatToNode(hit.getScore()), execCxt);
-                        }
-                        else {
-                            BindingMap bmap = BindingFactory.create(binding);
-                            bmap.add(scoreVar, NodeFactoryExtra.floatToNode(hit.getScore()));
-                            bmap.add(literalVar, hit.getLiteral());
-                            return IterLib.result(bmap, execCxt) ;
-                        }
-                    }
-                }
-            }
-        }
-        
-        // node was not among the hits - empty result
-        return IterLib.noResults(execCxt) ;
-    }
-
-    private List<TextHit> query(Node property, String queryString, int limit, ExecutionContext execCxt) {
-        Explain.explain(execCxt.getContext(), "Text query: "+queryString) ;
-        if ( log.isDebugEnabled())
-            log.debug("Text query: {} ({})", queryString,limit) ;
-        return textIndex.query(property, queryString, limit) ;
-    }
-    
-    /**
-     * Builds up the query string by appending on additional restrictions, such as graph or language tags.
-     */
-    private String buildQueryString(String queryString, ExecutionContext execCxt) {
-        // use the graph information in the text index if possible
-        if (textIndex.getDocDef().getGraphField() != null
-            && execCxt.getActiveGraph() instanceof GraphView) {
-            GraphView activeGraph = (GraphView)execCxt.getActiveGraph() ;
-            if (!Quad.isUnionGraph(activeGraph.getGraphName())) {
-                String uri = 
-                    activeGraph.getGraphName() != null 
-                    ? TextQueryFuncs.graphNodeToString(activeGraph.getGraphName())
-                    : Quad.defaultGraphNodeGenerated.getURI() ;
-                String escaped = QueryParserUtil.escape(uri) ;
-                String qs2 = textIndex.getDocDef().getGraphField() + ":" + escaped ;
-                queryString = "(" + queryString + ") AND " + qs2 ;
-            }
-        }
-
-        //for language-based search extension
-        if (textIndex.getDocDef().getLangField() != null) {
-            String field = textIndex.getDocDef().getLangField();
-            if (langArg != null) {
-                String qs2 = !"none".equals(langArg)?
-                        field + ":" + langArg : "-" + field + ":*";
-                queryString = "(" + queryString + ") AND " + qs2;
-            }
-        }
-        
-        return queryString;
-    }
-    
-    /** Deconstruct the node or list object argument and make a StrMatch 
-     * The 'executionTime' flag indciates whether this is for a build time
-     * static check, or for runtime execution.
-     */
-    private StrMatch objectToStruct(PropFuncArg argObject, ExecutionContext execCxt, boolean executionTime) {
-        EntityDefinition docDef = textIndex.getDocDef() ;
-        if (argObject.isNode()) {
-            Node o = argObject.getArg() ;
-            if (!o.isLiteral()) {
-                if ( executionTime )
-                    log.warn("Object to text query is not a literal") ;
-                return null ;
-            }
-
-            RDFDatatype dt = o.getLiteralDatatype() ;
-            if (dt != null && dt != XSDDatatype.XSDstring) {
-                log.warn("Object to text query is not a string") ;
-                return null ;
-            }
-
-            String qs = o.getLiteralLexicalForm() ;
-            qs = buildQueryString(qs, execCxt) ;
-            return new StrMatch(null, qs, -1, 0) ;
-        }
-
-        List<Node> list = argObject.getArgList() ;
-        if (list.size() == 0 || list.size() > 3)
-            throw new TextIndexException("Change in object list size") ;
-
-        Node predicate = null ;
-        String field = null ;       // Do not prepend the field name - rely on default field
-        int idx = 0 ;
-        Node x = list.get(0) ;
-        // Property?
-        if (x.isURI()) {
-            predicate = x ;
-            idx++ ;
-            if (idx >= list.size())
-                throw new TextIndexException("Property specificed but no query string : " + list) ;
-            x = list.get(idx) ;
-            field = docDef.getField(predicate) ;
-            if (field == null) {
-                log.warn("Predicate not indexed: " + predicate) ;
-                return null ;
-            }
-        }
-
-        // String!
-        if (!x.isLiteral()) {
-            if ( executionTime )
-                log.warn("Text query string is not a literal " + list) ;
-            return null ;
-        }
-        
-        if (x.getLiteralDatatype() != null && !x.getLiteralDatatype().equals(XSDDatatype.XSDstring)) {
-            log.warn("Text query is not a string " + list) ;
-            return null ;
-        }
-        String queryString = x.getLiteralLexicalForm() ;
-        idx++ ;
-
-        int limit = -1 ;
-        float score = 0 ;
-
-        if (idx < list.size()) {
-            // Limit?
-            x = list.get(idx) ;
-            idx++ ;
-            if ( ! x.isLiteral() ) {
-                if ( executionTime )
-                    log.warn("Text query limit is not an integer " + x) ;
-                return null ;
-            }
-            
-            int v = NodeFactoryExtra.nodeToInt(x) ;
-            limit = (v < 0) ? -1 : v ;
-        }
-
-        String qs = queryString ;
-        if (field != null) {
-            qs = field + ":" + qs ;
-        }
-        
-        qs = buildQueryString(qs, execCxt) ;
-
-        return new StrMatch(predicate, qs, limit, score) ;
-    }
-    
-    class RepeatApplyIteratorTextQuery extends QueryIterRepeatApply
-    {
-        private final PropFuncArg argSubject ; 
-        private final Node predicate ;
-        private final PropFuncArg argObject ;
-        private Map<String,TextHit> textResults ;
-        
-        public RepeatApplyIteratorTextQuery(QueryIterator input, PropFuncArg argSubject, Node predicate, PropFuncArg argObject, ExecutionContext execCxt, Map<String,TextHit> textResults)
-        { 
-            super(input, execCxt) ;
-            this.argSubject = argSubject ;
-            this.predicate = predicate ;
-            this.argObject = argObject ;
-            this.textResults = textResults ;
-        }
-
-        @Override
-        protected QueryIterator nextStage(Binding binding)
-        {
-            QueryIterator iter = exec(binding, argSubject, predicate, argObject, getExecContext(), textResults) ;
-            if ( iter == null ) 
-                iter = IterLib.noResults(getExecContext()) ;
-            return iter ;
-        }
-        
-        @Override
-        protected void details(IndentedWriter out, SerializationContext sCxt)
-        {
-            out.print("PropertyFunction ["+FmtUtils.stringForNode(predicate, sCxt)+"]") ;
-            out.print("[") ;
-            argSubject.output(out, sCxt) ;
-            out.print("][") ;
-            argObject.output(out, sCxt) ;
-            out.print("]") ;
-            out.println() ;
-        }
-    }
-
-    static class StrMatch {
-        private final Node   property ;
-        private final String queryString ;
-        private final int    limit ;
-        private final float  scoreLimit ;
-
-        public StrMatch(Node property, String queryString, int limit, float scoreLimit) {
-            super() ;
-            this.property = property ;
-            this.queryString = queryString ;
-            this.limit = limit ;
-            this.scoreLimit = scoreLimit ;
-        }
-
-        public Node getProperty() {
-            return property ;
-        }
-
-        public String getQueryString() {
-            return queryString ;
-        }
-
-        public int getLimit() {
-            return limit ;
-        }
-
-        public float getScoreLimit() {
-            return scoreLimit ;
-        }
-    }
-}
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.jena.query.text ;
+
+import java.util.Iterator ;
+import java.util.List ;
+import java.util.function.Function ;
+
+import org.apache.jena.atlas.iterator.Iter ;
+import org.apache.jena.atlas.logging.Log ;
+import org.apache.jena.datatypes.RDFDatatype ;
+import org.apache.jena.datatypes.xsd.XSDDatatype ;
+import org.apache.jena.graph.Node ;
+import org.apache.jena.query.QueryBuildException ;
+import org.apache.jena.query.QueryExecException ;
+import org.apache.jena.sparql.core.* ;
+import org.apache.jena.sparql.engine.ExecutionContext ;
+import org.apache.jena.sparql.engine.QueryIterator ;
+import org.apache.jena.sparql.engine.binding.Binding ;
+import org.apache.jena.sparql.engine.binding.BindingFactory ;
+import org.apache.jena.sparql.engine.binding.BindingMap ;
+import org.apache.jena.sparql.engine.iterator.QueryIterPlainWrapper ;
+import org.apache.jena.sparql.engine.iterator.QueryIterSlice ;
+import org.apache.jena.sparql.mgt.Explain ;
+import org.apache.jena.sparql.pfunction.PropFuncArg ;
+import org.apache.jena.sparql.pfunction.PropertyFunctionBase ;
+import org.apache.jena.sparql.util.Context ;
+import org.apache.jena.sparql.util.IterLib ;
+import org.apache.jena.sparql.util.NodeFactoryExtra ;
+import org.apache.lucene.queryparser.classic.QueryParserBase ;
+import org.slf4j.Logger ;
+import org.slf4j.LoggerFactory ;
+
+/** property function that accesses a Solr server */
+public class TextQueryPF extends PropertyFunctionBase {
+    private static Logger log = LoggerFactory.getLogger(TextQueryPF.class) ;
+    /*
+     * (?uri ?score) :queryPF (property? "string" limit? score?) 
+     */
+
+    private TextIndex     textIndex        = null ;
+    private boolean       warningIssued = false ;
+
+    public TextQueryPF() {}
+
+    private String langArg = null;
+
+    @Override
+    public void build(PropFuncArg argSubject, Node predicate, PropFuncArg argObject, ExecutionContext execCxt) {
+        super.build(argSubject, predicate, argObject, execCxt) ;
+        DatasetGraph dsg = execCxt.getDataset() ;
+        textIndex = chooseTextIndex(dsg) ;
+
+        if (argSubject.isList()) {
+            int size = argSubject.getArgListSize();
+            if (size != 2 && size != 3) {
+                throw new QueryBuildException("Subject has "+argSubject.getArgList().size()+" elements, not 2 or 3: "+argSubject);
+            }
+        }
+
+        if (argObject.isList()) {
+            List<Node> list = argObject.getArgList() ;
+
+            if (list.size() == 0)
+                throw new QueryBuildException("Zero-length argument list") ;
+
+            if (list.size() > 4)
+                throw new QueryBuildException("Too many arguments in list : " + list) ;
+            
+            
+            //extract of extra lang arg if present and if is usable.
+            //arg is removed from the list to avoid conflict with order and args length
+            langArg = extractArg("lang", list);
+
+            if (langArg != null && textIndex.getDocDef().getLangField() == null)
+                log.warn("lang argument is ignored if langField not set in the index configuration");
+            
+        }
+    }
+
+    private static TextIndex chooseTextIndex(DatasetGraph dsg) {
+        
+        Context c = dsg.getContext() ; 
+        
+        Object obj = dsg.getContext().get(TextQuery.textIndex) ;
+
+        if (obj != null) {
+            try {
+                return (TextIndex)obj ;
+            } catch (ClassCastException ex) {
+                Log.warn(TextQueryPF.class, "Context setting '" + TextQuery.textIndex + "'is not a TextIndex") ;
+            }
+        }
+
+        if (dsg instanceof DatasetGraphText) {
+            DatasetGraphText x = (DatasetGraphText)dsg ;
+            return x.getTextIndex() ;
+        }
+        Log.warn(TextQueryPF.class, "Failed to find the text index : tried context and as a text-enabled dataset") ;
+        return null ;
+    }
+
+    private String extractArg(String prefix, List<Node> objArgs) {
+        String value = null;
+        int pos = 0;
+        for (Node node : objArgs) {
+            if (node.isLiteral()) {
+                String arg = node.getLiteral().toString();
+                if (arg.startsWith(prefix + ":")) {
+                    value = arg.split(":")[1];
+                    break;
+                }
+            }
+            pos++;
+        }
+        if (value != null)
+            objArgs.remove(pos);
+
+        return value;
+    }
+
+    @Override
+    public QueryIterator exec(Binding binding, PropFuncArg argSubject, Node predicate, PropFuncArg argObject,
+                              ExecutionContext execCxt) {
+        if (textIndex == null) {
+            if (!warningIssued) {
+                Log.warn(getClass(), "No text index - no text search performed") ;
+                warningIssued = true ;
+            }
+            // Not a text dataset - no-op
+            return IterLib.result(binding, execCxt) ;
+        }
+
+        DatasetGraph dsg = execCxt.getDataset() ;
+
+        argSubject = Substitute.substitute(argSubject, binding) ;
+        argObject = Substitute.substitute(argObject, binding) ;
+        
+        Node s = null;
+        Node score = null;
+        Node literal = null;
+
+        if (argSubject.isList()) {
+            // Length checked in build()
+            s = argSubject.getArg(0);
+            score = argSubject.getArg(1);
+            
+            if (!score.isVariable())
+                throw new QueryExecException("Hit score is not a variable: "+argSubject) ;
+
+            if (argSubject.getArgListSize() > 2) {
+                literal = argSubject.getArg(2);
+                if (!literal.isVariable())
+                    throw new QueryExecException("Hit literal is not a variable: "+argSubject) ;
+            }
+        } else {
+            s = argSubject.getArg() ;
+        }
+
+        if (s.isLiteral())
+            // Does not match
+            return IterLib.noResults(execCxt) ;
+
+        StrMatch match = objectToStruct(argObject, true) ;
+        if (match == null) {
+            // can't match
+            return IterLib.noResults(execCxt) ;
+        }
+
+        // ----
+
+        QueryIterator qIter = (Var.isVar(s)) 
+            ? variableSubject(binding, s, score, literal, match, execCxt)
+            : concreteSubject(binding, s, score, literal, match, execCxt) ;
+        if (match.getLimit() >= 0)
+            qIter = new QueryIterSlice(qIter, 0, match.getLimit(), execCxt) ;
+        return qIter ;
+    }
+
+    private QueryIterator variableSubject(Binding binding, Node s, Node score, Node literal, StrMatch match, ExecutionContext execCxt) {
+        Var sVar = Var.alloc(s) ;
+        Var scoreVar = (score==null) ? null : Var.alloc(score) ;
+        Var literalVar = (literal==null) ? null : Var.alloc(literal) ;
+        List<TextHit> r = query(match.getProperty(), match.getQueryString(), match.getLimit(), execCxt) ;
+        Function<TextHit,Binding> converter = new TextHitConverter(binding, sVar, scoreVar, literalVar);
+        Iterator<Binding> bIter = Iter.map(r.iterator(), converter);
+        QueryIterator qIter = new QueryIterPlainWrapper(bIter, execCxt);
+        return qIter ;
+    }
+
+    private QueryIterator concreteSubject(Binding binding, Node s, Node score, Node literal, StrMatch match, ExecutionContext execCxt) {
+        if (!s.isURI()) {
+            log.warn("Subject not a URI: " + s) ;
+            return IterLib.noResults(execCxt) ;
+        }
+
+        Var scoreVar = (score==null) ? null : Var.alloc(score) ;
+        Var literalVar = (literal==null) ? null : Var.alloc(literal) ;
+        String qs = match.getQueryString() ;
+        List<TextHit> x = query(match.getProperty(), match.getQueryString(), -1, execCxt) ;
+        
+        if ( x == null ) // null return value - empty result
+            return IterLib.noResults(execCxt) ;
+        
+        for (TextHit hit : x ) {
+            if (hit.getNode().equals(s)) {
+                // found the node among the hits
+                if (literalVar == null) {
+                    return (scoreVar == null) ?
+                        IterLib.result(binding, execCxt) :
+                        IterLib.oneResult(binding, scoreVar, NodeFactoryExtra.floatToNode(hit.getScore()), execCxt);
+                }
+                BindingMap bmap = BindingFactory.create(binding);
+                if (scoreVar != null) {
+                    bmap.add(scoreVar, NodeFactoryExtra.floatToNode(hit.getScore()));
+                }
+                bmap.add(literalVar, hit.getLiteral());
+                return IterLib.result(bmap, execCxt) ;
+            }
+        }
+
+        // node was not among the hits - empty result
+        return IterLib.noResults(execCxt) ;
+    }
+
+    private List<TextHit> query(Node property, String queryString, int limit, ExecutionContext execCxt) {
+        // use the graph information in the text index if possible
+        if (textIndex.getDocDef().getGraphField() != null
+            && execCxt.getActiveGraph() instanceof GraphView) {
+            GraphView activeGraph = (GraphView)execCxt.getActiveGraph() ;
+            if (!Quad.isUnionGraph(activeGraph.getGraphName())) {
+                String uri = 
+                    activeGraph.getGraphName() != null 
+                    ? TextQueryFuncs.graphNodeToString(activeGraph.getGraphName())
+                    : Quad.defaultGraphNodeGenerated.getURI() ;
+                String escaped = QueryParserBase.escape(uri) ;
+                String qs2 = textIndex.getDocDef().getGraphField() + ":" + escaped ;
+                queryString = "(" + queryString + ") AND " + qs2 ;
+            }
+        }
+
+        //for language-based search extension
+        if (textIndex.getDocDef().getLangField() != null) {
+            String field = textIndex.getDocDef().getLangField();
+            if (langArg != null) {
+                String qs2 = !"none".equals(langArg)?
+                        field + ":" + langArg : "-" + field + ":*";
+                queryString = "(" + queryString + ") AND " + qs2;
+            }
+        }
+
+        Explain.explain(execCxt.getContext(), "Text query: "+queryString) ;
+        if ( log.isDebugEnabled())
+            log.debug("Text query: {} ({})", queryString,limit) ;
+        return textIndex.query(property, queryString, limit) ;
+    }
+    
+    /** Deconstruct the node or list object argument and make a StrMatch 
+     * The 'executionTime' flag indciates whether this is for a build time
+     * static check, or for runtime execution.
+     */
+    private StrMatch objectToStruct(PropFuncArg argObject, boolean executionTime) {
+        EntityDefinition docDef = textIndex.getDocDef() ;
+        if (argObject.isNode()) {
+            Node o = argObject.getArg() ;
+            if (!o.isLiteral()) {
+                if ( executionTime )
+                    log.warn("Object to text query is not a literal") ;
+                return null ;
+            }
+
+            RDFDatatype dt = o.getLiteralDatatype() ;
+            if (dt != null && dt != XSDDatatype.XSDstring) {
+                log.warn("Object to text query is not a string") ;
+                return null ;
+            }
+
+            String qs = o.getLiteralLexicalForm() ;
+            return new StrMatch(null, qs, -1, 0) ;
+        }
+
+        List<Node> list = argObject.getArgList() ;
+        if (list.size() == 0 || list.size() > 3)
+            throw new TextIndexException("Change in object list size") ;
+
+        Node predicate = null ;
+        String field = null ;       // Do not prepend the field name - rely on default field
+        int idx = 0 ;
+        Node x = list.get(0) ;
+        // Property?
+        if (x.isURI()) {
+            predicate = x ;
+            idx++ ;
+            if (idx >= list.size())
+                throw new TextIndexException("Property specificed but no query string : " + list) ;
+            x = list.get(idx) ;
+            field = docDef.getField(predicate) ;
+            if (field == null) {
+                log.warn("Predicate not indexed: " + predicate) ;
+                return null ;
+            }
+        }
+
+        // String!
+        if (!x.isLiteral()) {
+            if ( executionTime )
+                log.warn("Text query string is not a literal " + list) ;
+            return null ;
+        }
+        
+        if (x.getLiteralDatatype() != null && !x.getLiteralDatatype().equals(XSDDatatype.XSDstring)) {
+            log.warn("Text query is not a string " + list) ;
+            return null ;
+        }
+        String queryString = x.getLiteralLexicalForm() ;
+        idx++ ;
+
+        int limit = -1 ;
+        float score = 0 ;
+
+        if (idx < list.size()) {
+            // Limit?
+            x = list.get(idx) ;
+            idx++ ;
+            if ( ! x.isLiteral() ) {
+                if ( executionTime )
+                    log.warn("Text query limit is not an integer " + x) ;
+                return null ;
+            }
+            
+            int v = NodeFactoryExtra.nodeToInt(x) ;
+            limit = (v < 0) ? -1 : v ;
+        }
+
+        String qs = queryString ;
+        if (field != null)
+            qs = field + ":" + qs ;
+
+        return new StrMatch(predicate, qs, limit, score) ;
+    }
+
+    class StrMatch {
+        private final Node   property ;
+        private final String queryString ;
+        private final int    limit ;
+        private final float  scoreLimit ;
+
+        public StrMatch(Node property, String queryString, int limit, float scoreLimit) {
+            super() ;
+            this.property = property ;
+            this.queryString = queryString ;
+            this.limit = limit ;
+            this.scoreLimit = scoreLimit ;
+        }
+
+        public Node getProperty() {
+            return property ;
+        }
+
+        public String getQueryString() {
+            return queryString ;
+        }
+
+        public int getLimit() {
+            return limit ;
+        }
+
+        public float getScoreLimit() {
+            return scoreLimit ;
+        }
+    }
+}