You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@manifoldcf.apache.org by kw...@apache.org on 2014/06/19 02:07:28 UTC
svn commit: r1603683 - /manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java
Author: kwright
Date: Thu Jun 19 00:07:28 2014
New Revision: 1603683
URL: http://svn.apache.org/r1603683
Log:
Hook up UI to be actually functional
Modified:
manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java
Modified: manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java
URL: http://svn.apache.org/viewvc/manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java?rev=1603683&r1=1603682&r2=1603683&view=diff
==============================================================================
--- manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java (original)
+++ manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java Thu Jun 19 00:07:28 2014
@@ -101,6 +101,8 @@ public class TikaExtractor extends org.a
public int addOrReplaceDocumentWithException(String documentURI, String pipelineDescription, RepositoryDocument document, String authorityNameString, IOutputAddActivity activities)
throws ManifoldCFException, ServiceInterruption, IOException
{
+ SpecPacker sp = new SpecPacker(pipelineDescription);
+
// Tika's API reads from an input stream and writes to an output Writer.
// Since a RepositoryDocument includes readers and inputstreams exclusively, AND all downstream
// processing needs to occur in a ManifoldCF thread, we have some constraints on the architecture we need to get this done:
@@ -203,7 +205,18 @@ public class TikaExtractor extends org.a
String[] metaNames = metadata.names();
for(String mName : metaNames){
String value = metadata.get(mName);
- docCopy.addField(mName,value);
+ String target = sp.getMapping(mName);
+ if(target!=null)
+ {
+ docCopy.addField(target, value);
+ }
+ else
+ {
+ if(sp.keepAllMetadata())
+ {
+ docCopy.addField(mName, value);
+ }
+ }
}
// Send new document downstream