You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nutch.apache.org by je...@apache.org on 2006/02/13 22:43:16 UTC

svn commit: r377501 - in /lucene/nutch/trunk: ./ src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/ src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/

Author: jerome
Date: Mon Feb 13 13:43:15 2006
New Revision: 377501

URL: http://svn.apache.org/viewcvs?rev=377501&view=rev
Log:
Javadoc updates for ms parsers

Added:
    lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html   (with props)
Modified:
    lucene/nutch/trunk/build.xml
    lucene/nutch/trunk/default.properties
    lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/MSBaseParser.java
    lucene/nutch/trunk/src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/FilteredStringWriter.java

Modified: lucene/nutch/trunk/build.xml
URL: http://svn.apache.org/viewcvs/lucene/nutch/trunk/build.xml?rev=377501&r1=377500&r2=377501&view=diff
==============================================================================
--- lucene/nutch/trunk/build.xml (original)
+++ lucene/nutch/trunk/build.xml Mon Feb 13 13:43:15 2006
@@ -249,6 +249,7 @@
 
     	<packageset dir="${src.dir}"/>
     	<packageset dir="${plugins.dir}/lib-http/src/java"/>
+    	<packageset dir="${plugins.dir}/lib-parsems/src/java"/>
     	<packageset dir="${plugins.dir}/ontology/src/java"/>
     	<packageset dir="${plugins.dir}/protocol-file/src/java"/>
     	<packageset dir="${plugins.dir}/protocol-ftp/src/java"/>

Modified: lucene/nutch/trunk/default.properties
URL: http://svn.apache.org/viewcvs/lucene/nutch/trunk/default.properties?rev=377501&r1=377500&r2=377501&view=diff
==============================================================================
--- lucene/nutch/trunk/default.properties (original)
+++ lucene/nutch/trunk/default.properties Mon Feb 13 13:43:15 2006
@@ -68,6 +68,7 @@
 plugin.msword=org.apache.nutch.parse.msword*
 # Unfortunately, ontology on core and plugin uses the same package:
 # plugin.ontology=org.apache.nutch.ontology*
+plugin.parsems=org.apache.nutch.parse.ms*
 plugin.pdf=org.apache.nutch.parse.pdf*
 plugin.rss=org.apache.nutch.parse.rss*
 plugin.rtf=org.apache.nutch.parse.rtf*
@@ -95,6 +96,7 @@
    ${plugin.msexcel}:\
    ${plugin.mspowerpoint}:\
    ${plugin.msword}:\
+   ${plugin.parsems}:\
    ${plugin.pdf}:\
    ${plugin.rss}:\
    ${plugin.rtf}:\

Modified: lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/MSBaseParser.java
URL: http://svn.apache.org/viewcvs/lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/MSBaseParser.java?rev=377501&r1=377500&r2=377501&view=diff
==============================================================================
--- lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/MSBaseParser.java (original)
+++ lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/MSBaseParser.java Mon Feb 13 13:43:15 2006
@@ -56,7 +56,7 @@
 
   /**
    * Parses a Content with a specific {@link MSExtractor Microsoft document
-   * extractor.
+   * extractor}.
    */
   protected Parse getParse(MSExtractor extractor, Content content) {
     

Added: lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html
URL: http://svn.apache.org/viewcvs/lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html?rev=377501&view=auto
==============================================================================
--- lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html (added)
+++ lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html Mon Feb 13 13:43:15 2006
@@ -0,0 +1,5 @@
+<html>
+<body>
+<p>Common API for parsing Microsoft &copy; documents.</p>
+</body>
+</html>

Propchange: lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html
------------------------------------------------------------------------------
    svn:eol-style = native

Modified: lucene/nutch/trunk/src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/FilteredStringWriter.java
URL: http://svn.apache.org/viewcvs/lucene/nutch/trunk/src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/FilteredStringWriter.java?rev=377501&r1=377500&r2=377501&view=diff
==============================================================================
--- lucene/nutch/trunk/src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/FilteredStringWriter.java (original)
+++ lucene/nutch/trunk/src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/FilteredStringWriter.java Mon Feb 13 13:43:15 2006
@@ -23,7 +23,6 @@
  * 
  * @author Stephan Strittmatter - http://www.sybit.de
  * @version 1.0
- * @create 19.01.2005
  */
 public class FilteredStringWriter extends StringWriter {
 
@@ -67,4 +66,4 @@
       super.write(ch);
     }
   }
-}
\ No newline at end of file
+}