You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by jn...@apache.org on 2011/03/09 10:04:34 UTC

svn commit: r1079705 - /tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java

Author: jnioche
Date: Wed Mar  9 09:04:34 2011
New Revision: 1079705

URL: http://svn.apache.org/viewvc?rev=1079705&view=rev
Log:
TIKA-611: setSortByPosition reverted to PDFTextStripper's default value (false) so that columns are kept separate

Modified:
    tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java

Modified: tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java
URL: http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java?rev=1079705&r1=1079704&r2=1079705&view=diff
==============================================================================
--- tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java (original)
+++ tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java Wed Mar  9 09:04:34 2011
@@ -79,7 +79,7 @@ class PDF2XHTML extends PDFTextStripper 
             throws IOException {
         this.handler = new XHTMLContentHandler(handler, metadata);
         setForceParsing(true);
-        setSortByPosition(true);
+        setSortByPosition(false);
     }
 
     @Override