You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by ti...@apache.org on 2023/08/13 14:12:44 UTC

[tika] 02/02: TIKA-4114: add comment; TIKA-4064: avoid outdated method

This is an automated email from the ASF dual-hosted git repository.

tilman pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/tika.git

commit be4c708c13c4eca8588daa3e3ec8536eb36a158a
Author: Tilman Hausherr <ti...@apache.org>
AuthorDate: Sun Aug 13 16:12:26 2023 +0200

    TIKA-4114: add comment
    TIKA-4064: avoid outdated method
---
 .../src/main/java/org/apache/tika/parser/pdf/AbstractPDF2XHTML.java  | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/AbstractPDF2XHTML.java b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/AbstractPDF2XHTML.java
index 51fd4b63c..e03e14a4f 100644
--- a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/AbstractPDF2XHTML.java
+++ b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/AbstractPDF2XHTML.java
@@ -1397,9 +1397,10 @@ class AbstractPDF2XHTML extends PDFTextStripper {
     }
 
     @Override
-    protected void showGlyph(Matrix textRenderingMatrix, PDFont font, int code, String unicode,
+    protected void showGlyph(Matrix textRenderingMatrix, PDFont font, int code,
                              Vector displacement) throws IOException {
-        super.showGlyph(textRenderingMatrix, font, code, unicode, displacement);
+        super.showGlyph(textRenderingMatrix, font, code, displacement);
+        String unicode = font.toUnicode(code);
         if (unicode == null || unicode.isEmpty()) {
             unmappedUnicodeCharsPerPage++;
             totalUnmappedUnicodeCharacters++;