You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by ta...@apache.org on 2017/12/08 17:39:15 UTC
[tika] branch master updated: TIKA-2521
This is an automated email from the ASF dual-hosted git repository.
tallison pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/tika.git
The following commit(s) were added to refs/heads/master by this push:
new f57e0e7 TIKA-2521
f57e0e7 is described below
commit f57e0e78c3882c5003cf15b18375a334944d24dd
Author: tballison <ta...@mitre.org>
AuthorDate: Fri Dec 8 12:39:07 2017 -0500
TIKA-2521
---
.../tika/parser/microsoft/ooxml/OOXMLTikaBodyPartHandler.java | 11 +++++++++++
1 file changed, 11 insertions(+)
diff --git a/tika-parsers/src/main/java/org/apache/tika/parser/microsoft/ooxml/OOXMLTikaBodyPartHandler.java b/tika-parsers/src/main/java/org/apache/tika/parser/microsoft/ooxml/OOXMLTikaBodyPartHandler.java
index 95cbc5b..70fe7aa 100644
--- a/tika-parsers/src/main/java/org/apache/tika/parser/microsoft/ooxml/OOXMLTikaBodyPartHandler.java
+++ b/tika-parsers/src/main/java/org/apache/tika/parser/microsoft/ooxml/OOXMLTikaBodyPartHandler.java
@@ -178,6 +178,17 @@ public class OOXMLTikaBodyPartHandler implements OOXMLWordAndPowerPointTextHandl
@Override
public void startParagraph(ParagraphProperties paragraphProperties) {
+
+ //if you're in a table cell and you're after the first paragraph
+ //make sure to prepend a \n
+ if (tableCellDepth > 0 && pWithinCell > 0) {
+ try {
+ xhtml.characters(NEWLINE, 0, 1);
+ } catch (SAXException e) {
+ //swallow
+ }
+ }
+
if (pDepth == 0 && tableDepth == 0 && sdtDepth == 0) {
paragraphTag = P;
String styleClass = null;
--
To stop receiving notification emails like this one, please contact
['"commits@tika.apache.org" <co...@tika.apache.org>'].