You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by mi...@apache.org on 2011/10/03 14:36:04 UTC

svn commit: r1178389 - in /tika/trunk/tika-parsers/src/test: java/org/apache/tika/TestParsers.java java/org/apache/tika/parser/pdf/PDFParserTest.java resources/test-documents/testAnnotations.pdf resources/test-documents/testComment2.pdf

Author: mikemccand
Date: Mon Oct  3 12:36:03 2011
New Revision: 1178389

URL: http://svn.apache.org/viewvc?rev=1178389&view=rev
Log:
TIKA-738: move (ignored) test case to PDFParserTest

Added:
    tika/trunk/tika-parsers/src/test/resources/test-documents/testAnnotations.pdf
      - copied unchanged from r1178250, tika/trunk/tika-parsers/src/test/resources/test-documents/testComment2.pdf
Removed:
    tika/trunk/tika-parsers/src/test/resources/test-documents/testComment2.pdf
Modified:
    tika/trunk/tika-parsers/src/test/java/org/apache/tika/TestParsers.java
    tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java

Modified: tika/trunk/tika-parsers/src/test/java/org/apache/tika/TestParsers.java
URL: http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/test/java/org/apache/tika/TestParsers.java?rev=1178389&r1=1178388&r2=1178389&view=diff
==============================================================================
--- tika/trunk/tika-parsers/src/test/java/org/apache/tika/TestParsers.java (original)
+++ tika/trunk/tika-parsers/src/test/java/org/apache/tika/TestParsers.java Mon Oct  3 12:36:03 2011
@@ -191,10 +191,6 @@ public class TestParsers extends TikaTes
         final String[] extensions = new String[] {"ppt", "pptx", "doc", "docx", "pdf", "rtf"};
         for(String extension : extensions) {
             verifyComment(extension, "testComment");
-            // TIKA-717: re-enable once we fix this:
-            //if (extension.equals("pdf")) {
-            //verifyComment(extension, "testComment2");
-            //}
         }
     }
 }

Modified: tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
URL: http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java?rev=1178389&r1=1178388&r2=1178389&view=diff
==============================================================================
--- tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java (original)
+++ tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java Mon Oct  3 12:36:03 2011
@@ -212,4 +212,22 @@ public class PDFParserTest extends TikaT
         // chars, so we cannot test this here:
         //assertContains("\uD800\uDF32\uD800\uDF3f\uD800\uDF44\uD800\uDF39\uD800\uDF43\uD800\uDF3A", content);
     }
+
+    // TIKA-738: re-enable this
+    public void IGNOREtestAnnotations() throws Exception {
+        Parser parser = new AutoDetectParser(); // Should auto-detect!
+        ContentHandler handler = new BodyContentHandler();
+        Metadata metadata = new Metadata();
+        ParseContext context = new ParseContext();
+        InputStream stream = getResourceAsStream("/test-documents/testAnnotations.pdf");
+        try {
+            parser.parse(stream, handler, metadata, context);
+        } finally {
+            stream.close();
+        }
+        String content = handler.toString();
+        content = content.replaceAll("[\\s\u00a0]+"," ");
+        assertContains("Here is some text", content);
+        assertContains("Here is a comment", content);
+    }
 }