You are viewing a plain text version of this content. The canonical link for it is here.
Posted to dev@tika.apache.org by Tyler Palsulich <tp...@gmail.com> on 2015/03/06 18:29:24 UTC

Re: svn commit: r1664641 - /tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java

Thank you for this one... We can always turn it on later for debugging.

Tyler
On Mar 6, 2015 9:50 AM, <ta...@apache.org> wrote:

> Author: tallison
> Date: Fri Mar  6 14:50:46 2015
> New Revision: 1664641
>
> URL: http://svn.apache.org/r1664641
> Log:
> turn off pdfbox logging in PDFParserTest
>
> Modified:
>
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
>
> Modified:
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
> URL:
> http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java?rev=1664641&r1=1664640&r2=1664641&view=diff
>
> ==============================================================================
> ---
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
> (original)
> +++
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
> Fri Mar  6 14:50:46 2015
> @@ -31,6 +31,8 @@ import java.util.Locale;
>  import java.util.Map;
>  import java.util.Set;
>
> +import org.apache.log4j.Level;
> +import org.apache.log4j.Logger;
>  import org.apache.tika.TikaTest;
>  import org.apache.tika.exception.AccessPermissionException;
>  import org.apache.tika.exception.EncryptedDocumentException;
> @@ -53,6 +55,8 @@ import org.apache.tika.sax.BasicContentH
>  import org.apache.tika.sax.BodyContentHandler;
>  import org.apache.tika.sax.ContentHandlerDecorator;
>  import org.apache.tika.sax.ToXMLContentHandler;
> +import org.junit.AfterClass;
> +import org.junit.BeforeClass;
>  import org.junit.Test;
>  import org.xml.sax.ContentHandler;
>  /**
> @@ -65,6 +69,20 @@ public class PDFParserTest extends TikaT
>      public static final MediaType TYPE_PDF = MediaType.application("pdf");
>      public static final MediaType TYPE_DOCX =
> MediaType.application("vnd.openxmlformats-officedocument.wordprocessingml.document");
>      public static final MediaType TYPE_DOC =
> MediaType.application("msword");
> +    public static Level PDFBOX_LOG_LEVEL = Level.INFO;
> +
> +    @BeforeClass
> +    public static void setup() {
> +        //remember default logging level, but turn off for PDFParserTest
> +        PDFBOX_LOG_LEVEL = Logger.getLogger("org.apache.pdfbox").getLevel();
> +        Logger.getLogger("org.apache.pdfbox").setLevel(Level.OFF);
> +    }
> +
> +    @AfterClass
> +    public static void tearDown() {
> +        //return to regular logging level
> +        Logger.getLogger("org.apache.pdfbox").setLevel(PDFBOX_LOG_LEVEL);
> +    }
>
>      @Test
>      public void testPdfParsing() throws Exception {
>
>
>

Re: svn commit: r1664641 - /tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java

Posted by Tyler Palsulich <tp...@gmail.com>.
I'll keep an eye out for it! I'm on 1000 -- I'm afraid about halfway
through.

Have a good weekend,
Tyler

On Fri, Mar 6, 2015 at 12:47 PM, Allison, Timothy B. <ta...@mitre.org>
wrote:

> In the back of my memory, there's a ticket open for fixing the logged
> messages from PDFBox (or maybe just fixing the pdfs that triggered the
> messages), but I can't find it quickly.  It may have been a smaller part of
> something that we've already closed out, or it might still be open.
>
> Tyler, in your impressive ticket-blitz of 2015, let me know if you find
> this. :)
>
>
> Best,
>
>          Tim
> -----Original Message-----
>
> From: Tyler Palsulich [mailto:tpalsulich@gmail.com]
> Sent: Friday, March 06, 2015 12:29 PM
> To: dev@tika.apache.org
> Cc: commits@tika.apache.org
> Subject: Re: svn commit: r1664641 -
> /tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
>
> Thank you for this one... We can always turn it on later for debugging.
>
> Tyler
> On Mar 6, 2015 9:50 AM, <ta...@apache.org> wrote:
>
> > Author: tallison
> > Date: Fri Mar  6 14:50:46 2015
> > New Revision: 1664641
> >
> > URL: http://svn.apache.org/r1664641
> > Log:
> > turn off pdfbox logging in PDFParserTest
> >
> > Modified:
> >
> >
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
> >
> > Modified:
> >
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
> > URL:
> >
> http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java?rev=1664641&r1=1664640&r2=1664641&view=diff
> >
> >
> ==============================================================================
> > ---
> >
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
> > (original)
> > +++
> >
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
> > Fri Mar  6 14:50:46 2015
> > @@ -31,6 +31,8 @@ import java.util.Locale;
> >  import java.util.Map;
> >  import java.util.Set;
> >
> > +import org.apache.log4j.Level;
> > +import org.apache.log4j.Logger;
> >  import org.apache.tika.TikaTest;
> >  import org.apache.tika.exception.AccessPermissionException;
> >  import org.apache.tika.exception.EncryptedDocumentException;
> > @@ -53,6 +55,8 @@ import org.apache.tika.sax.BasicContentH
> >  import org.apache.tika.sax.BodyContentHandler;
> >  import org.apache.tika.sax.ContentHandlerDecorator;
> >  import org.apache.tika.sax.ToXMLContentHandler;
> > +import org.junit.AfterClass;
> > +import org.junit.BeforeClass;
> >  import org.junit.Test;
> >  import org.xml.sax.ContentHandler;
> >  /**
> > @@ -65,6 +69,20 @@ public class PDFParserTest extends TikaT
> >      public static final MediaType TYPE_PDF =
> MediaType.application("pdf");
> >      public static final MediaType TYPE_DOCX =
> >
> MediaType.application("vnd.openxmlformats-officedocument.wordprocessingml.document");
> >      public static final MediaType TYPE_DOC =
> > MediaType.application("msword");
> > +    public static Level PDFBOX_LOG_LEVEL = Level.INFO;
> > +
> > +    @BeforeClass
> > +    public static void setup() {
> > +        //remember default logging level, but turn off for PDFParserTest
> > +        PDFBOX_LOG_LEVEL = Logger.getLogger("org.apache.pdfbox").getLevel();
> > +        Logger.getLogger("org.apache.pdfbox").setLevel(Level.OFF);
> > +    }
> > +
> > +    @AfterClass
> > +    public static void tearDown() {
> > +        //return to regular logging level
> > +        Logger.getLogger("org.apache.pdfbox").setLevel(PDFBOX_LOG_LEVEL);
> > +    }
> >
> >      @Test
> >      public void testPdfParsing() throws Exception {
> >
> >
> >
>

RE: svn commit: r1664641 - /tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java

Posted by "Allison, Timothy B." <ta...@mitre.org>.
In the back of my memory, there's a ticket open for fixing the logged messages from PDFBox (or maybe just fixing the pdfs that triggered the messages), but I can't find it quickly.  It may have been a smaller part of something that we've already closed out, or it might still be open.  

Tyler, in your impressive ticket-blitz of 2015, let me know if you find this. :)


Best,

         Tim
-----Original Message-----

From: Tyler Palsulich [mailto:tpalsulich@gmail.com] 
Sent: Friday, March 06, 2015 12:29 PM
To: dev@tika.apache.org
Cc: commits@tika.apache.org
Subject: Re: svn commit: r1664641 - /tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java

Thank you for this one... We can always turn it on later for debugging.

Tyler
On Mar 6, 2015 9:50 AM, <ta...@apache.org> wrote:

> Author: tallison
> Date: Fri Mar  6 14:50:46 2015
> New Revision: 1664641
>
> URL: http://svn.apache.org/r1664641
> Log:
> turn off pdfbox logging in PDFParserTest
>
> Modified:
>
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
>
> Modified:
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
> URL:
> http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java?rev=1664641&r1=1664640&r2=1664641&view=diff
>
> ==============================================================================
> ---
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
> (original)
> +++
> tika/trunk/tika-parsers/src/test/java/org/apache/tika/parser/pdf/PDFParserTest.java
> Fri Mar  6 14:50:46 2015
> @@ -31,6 +31,8 @@ import java.util.Locale;
>  import java.util.Map;
>  import java.util.Set;
>
> +import org.apache.log4j.Level;
> +import org.apache.log4j.Logger;
>  import org.apache.tika.TikaTest;
>  import org.apache.tika.exception.AccessPermissionException;
>  import org.apache.tika.exception.EncryptedDocumentException;
> @@ -53,6 +55,8 @@ import org.apache.tika.sax.BasicContentH
>  import org.apache.tika.sax.BodyContentHandler;
>  import org.apache.tika.sax.ContentHandlerDecorator;
>  import org.apache.tika.sax.ToXMLContentHandler;
> +import org.junit.AfterClass;
> +import org.junit.BeforeClass;
>  import org.junit.Test;
>  import org.xml.sax.ContentHandler;
>  /**
> @@ -65,6 +69,20 @@ public class PDFParserTest extends TikaT
>      public static final MediaType TYPE_PDF = MediaType.application("pdf");
>      public static final MediaType TYPE_DOCX =
> MediaType.application("vnd.openxmlformats-officedocument.wordprocessingml.document");
>      public static final MediaType TYPE_DOC =
> MediaType.application("msword");
> +    public static Level PDFBOX_LOG_LEVEL = Level.INFO;
> +
> +    @BeforeClass
> +    public static void setup() {
> +        //remember default logging level, but turn off for PDFParserTest
> +        PDFBOX_LOG_LEVEL = Logger.getLogger("org.apache.pdfbox").getLevel();
> +        Logger.getLogger("org.apache.pdfbox").setLevel(Level.OFF);
> +    }
> +
> +    @AfterClass
> +    public static void tearDown() {
> +        //return to regular logging level
> +        Logger.getLogger("org.apache.pdfbox").setLevel(PDFBOX_LOG_LEVEL);
> +    }
>
>      @Test
>      public void testPdfParsing() throws Exception {
>
>
>