You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by ni...@apache.org on 2011/04/06 18:20:00 UTC
svn commit: r1089518 - in /tika/trunk/tika-parsers/src/main/resources:
META-INF/services/ org/ org/apache/ org/apache/tika/
org/apache/tika/parser/ org/apache/tika/parser/external/
Author: nick
Date: Wed Apr 6 16:20:00 2011
New Revision: 1089518
URL: http://svn.apache.org/viewvc?rev=1089518&view=rev
Log:
TIKA-634 - Example external parsers config file
Added:
tika/trunk/tika-parsers/src/main/resources/org/
tika/trunk/tika-parsers/src/main/resources/org/apache/
tika/trunk/tika-parsers/src/main/resources/org/apache/tika/
tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/
tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/
tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/tika-external-parsers.xml
Modified:
tika/trunk/tika-parsers/src/main/resources/META-INF/services/org.apache.tika.parser.Parser
Modified: tika/trunk/tika-parsers/src/main/resources/META-INF/services/org.apache.tika.parser.Parser
URL: http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/main/resources/META-INF/services/org.apache.tika.parser.Parser?rev=1089518&r1=1089517&r2=1089518&view=diff
==============================================================================
--- tika/trunk/tika-parsers/src/main/resources/META-INF/services/org.apache.tika.parser.Parser (original)
+++ tika/trunk/tika-parsers/src/main/resources/META-INF/services/org.apache.tika.parser.Parser Wed Apr 6 16:20:00 2011
@@ -29,6 +29,7 @@ org.apache.tika.parser.jpeg.JpegParser
org.apache.tika.parser.mail.RFC822Parser
org.apache.tika.parser.mbox.MboxParser
org.apache.tika.parser.microsoft.OfficeParser
+org.apache.tika.parser.microsoft.TNEFParser
org.apache.tika.parser.microsoft.ooxml.OOXMLParser
org.apache.tika.parser.mp3.Mp3Parser
org.apache.tika.parser.hdf.HDFParser
Added: tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/tika-external-parsers.xml
URL: http://svn.apache.org/viewvc/tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/tika-external-parsers.xml?rev=1089518&view=auto
==============================================================================
--- tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/tika-external-parsers.xml (added)
+++ tika/trunk/tika-parsers/src/main/resources/org/apache/tika/parser/external/tika-external-parsers.xml Wed Apr 6 16:20:00 2011
@@ -0,0 +1,39 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+<!--
+ Description: This XML file defines the external commands that Tika
+ runs as parsers.
+-->
+<external-parsers>
+ <!-- This example uses ffmpeg to extract audio stream metadata from video files -->
+ <parser>
+ <check>
+ <command>ffmpeg -version</command>
+ <error-codes>126,127</error-codes>
+ </check>
+ <command>ffmpeg -i ${INPUT}</command>
+ <mime-types>
+ <mime-type>video/avi</mime-type>
+ <mime-type>video/mpeg</mime-type>
+ </mime-types>
+ <metadata>
+ <match key="xmpDM:audioChannelType">Stream.*? Audio:.*? Hz, (\w+),</match>
+ <match key="xmpDM:audioCompressor">Stream.*? Audio: (\w+),</match>
+ </metadata>
+ </parser>
+</external-parsers>