You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by mi...@apache.org on 2011/11/06 12:14:35 UTC

svn commit: r1198336 - in /tika/trunk/tika-parsers/src/test: java/org/apache/tika/parser/microsoft/ooxml/OOXMLParserTest.java resources/test-documents/testWordArt.pptx

Author: mikemccand
Date: Sun Nov  6 11:14:34 2011
New Revision: 1198336

URL: http://svn.apache.org/viewvc?rev=1198336&view=rev
Log:
TIKA-714: add test case for PPTX to extract text from word art

Added:
    tika/trunk/tika-parsers/src/test/resources/test-documents/testWordArt.pptx   (with props)
Modified:
    tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/microsoft/ooxml/OOXMLParserTest.java

Modified: tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/microsoft/ooxml/OOXMLParserTest.java
URL: http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/microsoft/ooxml/OOXMLParserTest.java?rev=1198336&r1=1198335&r2=1198336&view=diff
==============================================================================
--- tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/microsoft/ooxml/OOXMLParserTest.java (original)
+++ tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/microsoft/ooxml/OOXMLParserTest.java Sun Nov  6 11:14:34 2011
@@ -661,4 +661,20 @@ public class OOXMLParserTest extends Tik
         assertContains("Text that I added to the master slide", content);
     }
     */
+
+    public void testWordArt() throws Exception {
+        ContentHandler handler = new BodyContentHandler();
+        Metadata metadata = new Metadata();
+
+        InputStream stream = OOXMLParserTest.class.getResourceAsStream(
+                "/test-documents/testWordArt.pptx");
+        try {
+            new AutoDetectParser().parse(stream, handler, metadata, new ParseContext());
+        } finally {
+            stream.close();
+        }
+        String content = handler.toString();
+        assertContains("Here is some red word Art", content);
+    }
+
 }

Added: tika/trunk/tika-parsers/src/test/resources/test-documents/testWordArt.pptx
URL: http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/test/resources/test-documents/testWordArt.pptx?rev=1198336&view=auto
==============================================================================
Binary file - no diff available.

Propchange: tika/trunk/tika-parsers/src/test/resources/test-documents/testWordArt.pptx
------------------------------------------------------------------------------
    svn:mime-type = application/octet-stream