You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by ta...@apache.org on 2016/11/10 13:32:03 UTC
tika git commit: TIKA-2174/TIKA-2175 -- clean up
Repository: tika
Updated Branches:
refs/heads/master 98de28828 -> b97045aea
TIKA-2174/TIKA-2175 -- clean up
Project: http://git-wip-us.apache.org/repos/asf/tika/repo
Commit: http://git-wip-us.apache.org/repos/asf/tika/commit/b97045ae
Tree: http://git-wip-us.apache.org/repos/asf/tika/tree/b97045ae
Diff: http://git-wip-us.apache.org/repos/asf/tika/diff/b97045ae
Branch: refs/heads/master
Commit: b97045aea303bac75bd3c937cde6b42c7a3b3c48
Parents: 98de288
Author: tballison <ta...@mitre.org>
Authored: Thu Nov 10 08:31:51 2016 -0500
Committer: tballison <ta...@mitre.org>
Committed: Thu Nov 10 08:31:51 2016 -0500
----------------------------------------------------------------------
.../src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java | 2 +-
.../java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java | 2 +-
2 files changed, 2 insertions(+), 2 deletions(-)
----------------------------------------------------------------------
http://git-wip-us.apache.org/repos/asf/tika/blob/b97045ae/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java
----------------------------------------------------------------------
diff --git a/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java b/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java
index d89dce4..ddbd148 100644
--- a/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java
+++ b/tika-parsers/src/main/java/org/apache/tika/parser/pdf/PDF2XHTML.java
@@ -246,7 +246,7 @@ class PDF2XHTML extends AbstractPDF2XHTML {
writeToBuffer(image, extension, buffer);
} catch (IOException e) {
EmbeddedDocumentUtil.recordException(e, metadata);
- return;
+ continue;
}
embeddedDocumentExtractor.parseEmbedded(
new ByteArrayInputStream(buffer.toByteArray()),
http://git-wip-us.apache.org/repos/asf/tika/blob/b97045ae/tika-parsers/src/test/java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java
----------------------------------------------------------------------
diff --git a/tika-parsers/src/test/java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java b/tika-parsers/src/test/java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java
index 7607427..956a71b 100644
--- a/tika-parsers/src/test/java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java
+++ b/tika-parsers/src/test/java/org/apache/tika/parser/ocr/TesseractOCRParserTest.java
@@ -91,7 +91,7 @@ public class TesseractOCRParserTest extends TikaTest {
// Assuming that Tesseract is on the path, the parser's supported types should include PNG.
assumeTrue(canRun());
- assertEquals(7, parser.getSupportedTypes(parseContext).size());
+ assertEquals(8, parser.getSupportedTypes(parseContext).size());
assertTrue(parser.getSupportedTypes(parseContext).contains(png));
// DefaultParser will now select the TesseractOCRParser.