You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by ta...@apache.org on 2016/11/10 13:32:03 UTC

tika git commit: TIKA-2174/TIKA-2175 -- clean up

Repository: tika
Updated Branches:
  refs/heads/master 98de28828 -> b97045aea


TIKA-2174/TIKA-2175 -- clean up


Project: http://git-wip-us.apache.org/repos/asf/tika/repo
Commit: http://git-wip-us.apache.org/repos/asf/tika/commit/b97045ae
Tree: http://git-wip-us.apache.org/repos/asf/tika/tree/b97045ae
Diff: http://git-wip-us.apache.org/repos/asf/tika/diff/b97045ae

Branch: refs/heads/master
Commit: b97045aea303bac75bd3c937cde6b42c7a3b3c48
Parents: 98de288
Author: tballison <ta...@mitre.org>
Authored: Thu Nov 10 08:31:51 2016 -0500
Committer: tballison <ta...@mitre.org>
Committed: Thu Nov 10 08:31:51 2016 -0500

----------------------------------------------------------------------
 .../src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java        | 2 +-
 .../java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java    | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/tika/blob/b97045ae/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java
----------------------------------------------------------------------
diff --git a/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java b/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java
index d89dce4..ddbd148 100644
--- a/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java
+++ b/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java
@@ -246,7 +246,7 @@ class PDF2XHTML extends AbstractPDF2XHTML {
                             writeToBuffer(image, extension, buffer);
                         } catch (IOException e) {
                             EmbeddedDocumentUtil.recordException(e, metadata);
-                            return;
+                            continue;
                         }
                         embeddedDocumentExtractor.parseEmbedded(
                                 new ByteArrayInputStream(buffer.toByteArray()),

http://git-wip-us.apache.org/repos/asf/tika/blob/b97045ae/tika-parsers/src/test/java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java
----------------------------------------------------------------------
diff --git a/tika-parsers/src/test/java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java b/tika-parsers/src/test/java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java
index 7607427..956a71b 100644
--- a/tika-parsers/src/test/java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java
+++ b/tika-parsers/src/test/java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java
@@ -91,7 +91,7 @@ public class TesseractOCRParserTest extends TikaTest {
         // Assuming that Tesseract is on the path, we should find 5 Parsers that support PNG.
         assumeTrue(canRun());
 
-        assertEquals(7, parser.getSupportedTypes(parseContext).size());
+        assertEquals(8, parser.getSupportedTypes(parseContext).size());
         assertTrue(parser.getSupportedTypes(parseContext).contains(png));
 
         // DefaultParser will now select the TesseractOCRParser.