You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@jackrabbit.apache.org by mr...@apache.org on 2008/08/21 15:37:16 UTC
svn commit: r687757 -
/jackrabbit/trunk/jackrabbit-text-extractors/src/main/java/org/apache/jackrabbit/extractor/MsOutlookTextExtractor.java
Author: mreutegg
Date: Thu Aug 21 06:37:15 2008
New Revision: 687757
URL: http://svn.apache.org/viewvc?rev=687757&view=rev
Log:
JCR-1561: New MsOutlook Message Extractor
Added:
jackrabbit/trunk/jackrabbit-text-extractors/src/main/java/org/apache/jackrabbit/extractor/MsOutlookTextExtractor.java (with props)
Added: jackrabbit/trunk/jackrabbit-text-extractors/src/main/java/org/apache/jackrabbit/extractor/MsOutlookTextExtractor.java
URL: http://svn.apache.org/viewvc/jackrabbit/trunk/jackrabbit-text-extractors/src/main/java/org/apache/jackrabbit/extractor/MsOutlookTextExtractor.java?rev=687757&view=auto
==============================================================================
--- jackrabbit/trunk/jackrabbit-text-extractors/src/main/java/org/apache/jackrabbit/extractor/MsOutlookTextExtractor.java (added)
+++ jackrabbit/trunk/jackrabbit-text-extractors/src/main/java/org/apache/jackrabbit/extractor/MsOutlookTextExtractor.java Thu Aug 21 06:37:15 2008
@@ -0,0 +1,79 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.jackrabbit.extractor;
+
+import java.io.IOException;
+import java.io.InputStream;
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.poi.hsmf.MAPIMessage;
+import org.slf4j.Logger;
+import org.slf4j.LoggerFactory;
+
+/**
+ * Text extractor for Microsoft Outlook messages.
+ */
+public class MsOutlookTextExtractor extends AbstractTextExtractor {
+
+ /**
+ * Logger instance.
+ */
+ private static final Logger logger =
+ LoggerFactory.getLogger(MsOutlookTextExtractor.class);
+
+ /**
+ * Force loading of dependent class.
+ */
+ static {
+ MAPIMessage.class.getName();
+ }
+
+ /**
+ * Creates a new <code>MsOutlookTextExtractor</code> instance.
+ */
+ public MsOutlookTextExtractor() {
+ super(new String[]{"application/vnd.ms-outlook"});
+ }
+
+ //-------------------------------------------------------< TextExtractor >
+
+ /**
+ * {@inheritDoc}
+ * Returns an empty reader if an error occured extracting text from
+ * the outlook message.
+ */
+ public Reader extractText(InputStream stream,
+ String type,
+ String encoding) throws IOException {
+ try {
+ MAPIMessage message = new MAPIMessage(stream);
+ StringBuffer buffer = new StringBuffer();
+ buffer.append(message.getDisplayFrom()).append('\n');
+ buffer.append(message.getDisplayTo()).append('\n');
+ buffer.append(message.getSubject()).append('\n');
+ buffer.append(message.getTextBody());
+ return new StringReader(buffer.toString());
+ } catch (Exception e) {
+ logger.warn("Failed to extract Message content", e);
+ return new StringReader("");
+ } finally {
+ stream.close();
+ }
+ }
+
+}
Propchange: jackrabbit/trunk/jackrabbit-text-extractors/src/main/java/org/apache/jackrabbit/extractor/MsOutlookTextExtractor.java
------------------------------------------------------------------------------
svn:eol-style = native