You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by ma...@apache.org on 2015/02/06 20:42:48 UTC

svn commit: r1657933 - in /tika/trunk: CHANGES.txt tika-parsers/src/main/java/org/apache/tika/parser/pkg/RarParser.java

Author: mattmann
Date: Fri Feb  6 19:42:48 2015
New Revision: 1657933

URL: http://svn.apache.org/r1657933
Log:
Patch for TIKA-936: fix RarParser handling of Chinese characters in entry names. Contributed by kongxianghe1234 <ko...@gmail.com>. This closes #27.

Modified:
    tika/trunk/CHANGES.txt
    tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pkg/RarParser.java

Modified: tika/trunk/CHANGES.txt
URL: http://svn.apache.org/viewvc/tika/trunk/CHANGES.txt?rev=1657933&r1=1657932&r2=1657933&view=diff
==============================================================================
--- tika/trunk/CHANGES.txt (original)
+++ tika/trunk/CHANGES.txt Fri Feb  6 19:42:48 2015
@@ -1,5 +1,9 @@
 Release 1.8 - Current Development
 
+  * The RAR parser was updated to handle Chinese characters by
+    using each entry's Unicode file name (getFileNameW), falling
+    back to getFileNameString when it is empty. (TIKA-936)
+
   * Fix out of memory error in surefire plugin. (TIKA-1537)
 
   * Build a parser to extract data from GRIB formats (TIKA-1423).

Modified: tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pkg/RarParser.java
URL: http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pkg/RarParser.java?rev=1657933&r1=1657932&r2=1657933&view=diff
==============================================================================
--- tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pkg/RarParser.java (original)
+++ tika/trunk/tika-parsers/src/main/java/org/apache/tika/parser/pkg/RarParser.java Fri Feb  6 19:42:48 2015
@@ -86,7 +86,7 @@ public class RarParser extends AbstractP
                         subFile = rar.getInputStream(header);
 
                         Metadata entrydata = PackageParser.handleEntryMetadata(
-                                header.getFileNameString(),
+                                "".equals(header.getFileNameW())?header.getFileNameString():header.getFileNameW(),
                                 header.getCTime(), header.getMTime(),
                                 header.getFullUnpackSize(),
                                 xhtml
@@ -114,4 +114,4 @@ public class RarParser extends AbstractP
 
         xhtml.endDocument();
     }
-}
\ No newline at end of file
+}