You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by ni...@apache.org on 2011/04/06 18:20:00 UTC

svn commit: r1089518 - in /tika/trunk/tika-parsers/src/main/resources: META-INF/services/ org/ org/apache/ org/apache/tika/ org/apache/tika/parser/ org/apache/tika/parser/external/

Author: nick
Date: Wed Apr  6 16:20:00 2011
New Revision: 1089518

URL: http://svn.apache.org/viewvc?rev=1089518&view=rev
Log:
TIKA-634 - Example external parsers config file

Added:
    tika/trunk/tika-parsers/src/main/resources/org/
    tika/trunk/tika-parsers/src/main/resources/org/apache/
    tika/trunk/tika-parsers/src/main/resources/org/apache/tika/
    tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/
    tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/
    tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/tika-external-parsers.xml
Modified:
    tika/trunk/tika-parsers/src/main/resources/META-INF/services/org.apache.tika.parser.Parser

Modified: tika/trunk/tika-parsers/src/main/resources/META-INF/services/org.apache.tika.parser.Parser
URL: http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/main/resources/META-INF/services/org.apache.tika.parser.Parser?rev=1089518&r1=1089517&r2=1089518&view=diff
==============================================================================
--- tika/trunk/tika-parsers/src/main/resources/META-INF/services/org.apache.tika.parser.Parser (original)
+++ tika/trunk/tika-parsers/src/main/resources/META-INF/services/org.apache.tika.parser.Parser Wed Apr  6 16:20:00 2011
@@ -29,6 +29,7 @@ org.apache.tika.parser.jpeg.JpegParser
 org.apache.tika.parser.mail.RFC822Parser
 org.apache.tika.parser.mbox.MboxParser
 org.apache.tika.parser.microsoft.OfficeParser
+org.apache.tika.parser.microsoft.TNEFParser
 org.apache.tika.parser.microsoft.ooxml.OOXMLParser
 org.apache.tika.parser.mp3.Mp3Parser
 org.apache.tika.parser.hdf.HDFParser

Added: tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/tika-external-parsers.xml
URL: http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/tika-external-parsers.xml?rev=1089518&view=auto
==============================================================================
--- tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/tika-external-parsers.xml (added)
+++ tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/tika-external-parsers.xml Wed Apr  6 16:20:00 2011
@@ -0,0 +1,39 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+  http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<!--
+  Description: This XML file defines external commands to be run by Tika
+  as parsers.
+-->
+<external-parsers>
+  <!-- Example parser definition: runs ffmpeg against the input file for the listed video MIME types and captures audio stream details as metadata -->
+  <parser>
+     <check> <!-- NOTE(review): presumably an availability probe run before the parser is used; confirm against the config reader -->
+       <command>ffmpeg -version</command>
+       <error-codes>126,127</error-codes> <!-- NOTE(review): presumably exit codes that mean the command is unavailable; confirm -->
+     </check>
+     <command>ffmpeg -i ${INPUT}</command> <!-- ${INPUT} is presumably replaced with the path of the file being parsed; confirm -->
+     <mime-types>
+       <mime-type>video/avi</mime-type>
+       <mime-type>video/mpeg</mime-type>
+     </mime-types>
+     <metadata> <!-- each match pairs a metadata key with a regex whose single capture group supplies the value (presumably applied to the command output) -->
+       <match key="xmpDM:audioChannelType">Stream.*? Audio:.*? Hz, (\w+),</match>
+       <match key="xmpDM:audioCompressor">Stream.*? Audio: (\w+),</match>
+     </metadata>
+  </parser>
+</external-parsers>