You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@manifoldcf.apache.org by kw...@apache.org on 2014/06/19 02:07:28 UTC

svn commit: r1603683 - /manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java

Author: kwright
Date: Thu Jun 19 00:07:28 2014
New Revision: 1603683

URL: http://svn.apache.org/r1603683
Log:
Hook up UI to be actually functional

Modified:
    manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java

Modified: manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java
URL: http://svn.apache.org/viewvc/manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java?rev=1603683&r1=1603682&r2=1603683&view=diff
==============================================================================
--- manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java (original)
+++ manifoldcf/branches/CONNECTORS-954/connectors/tika/connector/src/main/java/org/apache/manifoldcf/agents/transformer/tika/TikaExtractor.java Thu Jun 19 00:07:28 2014
@@ -101,6 +101,8 @@ public class TikaExtractor extends org.a
   public int addOrReplaceDocumentWithException(String documentURI, String pipelineDescription, RepositoryDocument document, String authorityNameString, IOutputAddActivity activities)
     throws ManifoldCFException, ServiceInterruption, IOException
   {
+    SpecPacker sp = new SpecPacker(pipelineDescription);
+
     // Tika's API reads from an input stream and writes to an output Writer.
     // Since a RepositoryDocument includes readers and inputstreams exclusively, AND all downstream
     // processing needs to occur in a ManifoldCF thread, we have some constraints on the architecture we need to get this done:
@@ -203,7 +205,18 @@ public class TikaExtractor extends org.a
         String[] metaNames = metadata.names();
         for(String mName : metaNames){
           String value = metadata.get(mName);
-          docCopy.addField(mName,value);
+          String target = sp.getMapping(mName);
+          if(target!=null)
+          {
+            docCopy.addField(target, value);
+          }
+          else
+          {
+            if(sp.keepAllMetadata())
+            {
+             docCopy.addField(mName, value);
+            }
+          }
         }
 
         // Send new document downstream