You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by ta...@apache.org on 2017/12/08 17:39:15 UTC

[tika] branch master updated: TIKA-2521

This is an automated email from the ASF dual-hosted git repository.

tallison pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/tika.git


The following commit(s) were added to refs/heads/master by this push:
     new f57e0e7  TIKA-2521
f57e0e7 is described below

commit f57e0e78c3882c5003cf15b18375a334944d24dd
Author: tballison <ta...@mitre.org>
AuthorDate: Fri Dec 8 12:39:07 2017 -0500

    TIKA-2521
---
 .../tika/parser/microsoft/ooxml/OOXMLTikaBodyPartHandler.java | 11 +++++++++++
 1 file changed, 11 insertions(+)

diff --git a/tika-parsers/src/main/java/org/apache/tika/parser/microsoft/ooxml/OOXMLTikaBodyPartHandler.java b/tika-parsers/src/main/java/org/apache/tika/parser/microsoft/ooxml/OOXMLTikaBodyPartHandler.java
index 95cbc5b..70fe7aa 100644
--- a/tika-parsers/src/main/java/org/apache/tika/parser/microsoft/ooxml/OOXMLTikaBodyPartHandler.java
+++ b/tika-parsers/src/main/java/org/apache/tika/parser/microsoft/ooxml/OOXMLTikaBodyPartHandler.java
@@ -178,6 +178,17 @@ public class OOXMLTikaBodyPartHandler implements OOXMLWordAndPowerPointTextHandl
 
     @Override
     public void startParagraph(ParagraphProperties paragraphProperties) {
+
+        //if you're in a table cell and you're after the first paragraph
+        //make sure to prepend a \n
+        if (tableCellDepth > 0 && pWithinCell > 0) {
+            try {
+                xhtml.characters(NEWLINE, 0, 1);
+            } catch (SAXException e) {
+                //swallow
+            }
+        }
+
         if (pDepth == 0 && tableDepth == 0 && sdtDepth == 0) {
             paragraphTag = P;
             String styleClass = null;

-- 
To stop receiving notification emails like this one, please contact
['"commits@tika.apache.org" <co...@tika.apache.org>'].