You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nutch.apache.org by je...@apache.org on 2006/02/13 22:43:16 UTC
svn commit: r377501 - in /lucene/nutch/trunk: ./ src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/ src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/
Author: jerome
Date: Mon Feb 13 13:43:15 2006
New Revision: 377501
URL: http://svn.apache.org/viewcvs?rev=377501&view=rev
Log:
Javadoc updates for ms parsers
Added:
lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html (with props)
Modified:
lucene/nutch/trunk/build.xml
lucene/nutch/trunk/default.properties
lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/MSBaseParser.java
lucene/nutch/trunk/src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/FilteredStringWriter.java
Modified: lucene/nutch/trunk/build.xml
URL: http://svn.apache.org/viewcvs/lucene/nutch/trunk/build.xml?rev=377501&r1=377500&r2=377501&view=diff
==============================================================================
--- lucene/nutch/trunk/build.xml (original)
+++ lucene/nutch/trunk/build.xml Mon Feb 13 13:43:15 2006
@@ -249,6 +249,7 @@
<packageset dir="${src.dir}"/>
<packageset dir="${plugins.dir}/lib-http/src/java"/>
+ <packageset dir="${plugins.dir}/lib-parsems/src/java"/>
<packageset dir="${plugins.dir}/ontology/src/java"/>
<packageset dir="${plugins.dir}/protocol-file/src/java"/>
<packageset dir="${plugins.dir}/protocol-ftp/src/java"/>
Modified: lucene/nutch/trunk/default.properties
URL: http://svn.apache.org/viewcvs/lucene/nutch/trunk/default.properties?rev=377501&r1=377500&r2=377501&view=diff
==============================================================================
--- lucene/nutch/trunk/default.properties (original)
+++ lucene/nutch/trunk/default.properties Mon Feb 13 13:43:15 2006
@@ -68,6 +68,7 @@
plugin.msword=org.apache.nutch.parse.msword*
# Unfortunately, ontology on core and plugin uses the same package:
# plugin.ontology=org.apache.nutch.ontology*
+plugin.parsems=org.apache.nutch.parse.ms*
plugin.pdf=org.apache.nutch.parse.pdf*
plugin.rss=org.apache.nutch.parse.rss*
plugin.rtf=org.apache.nutch.parse.rtf*
@@ -95,6 +96,7 @@
${plugin.msexcel}:\
${plugin.mspowerpoint}:\
${plugin.msword}:\
+ ${plugin.parsems}:\
${plugin.pdf}:\
${plugin.rss}:\
${plugin.rtf}:\
Modified: lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/MSBaseParser.java
URL: http://svn.apache.org/viewcvs/lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/MSBaseParser.java?rev=377501&r1=377500&r2=377501&view=diff
==============================================================================
--- lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/MSBaseParser.java (original)
+++ lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/MSBaseParser.java Mon Feb 13 13:43:15 2006
@@ -56,7 +56,7 @@
/**
* Parses a Content with a specific {@link MSExtractor Microsoft document
- * extractor.
+ * extractor}.
*/
protected Parse getParse(MSExtractor extractor, Content content) {
Added: lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html
URL: http://svn.apache.org/viewcvs/lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html?rev=377501&view=auto
==============================================================================
--- lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html (added)
+++ lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html Mon Feb 13 13:43:15 2006
@@ -0,0 +1,5 @@
+<html>
+<body>
+<p>Common API for Microsoft © documents parsing.</p>
+</body>
+</html>
Propchange: lucene/nutch/trunk/src/plugin/lib-parsems/src/java/org/apache/nutch/parse/ms/package.html
------------------------------------------------------------------------------
svn:eol-style = native
Modified: lucene/nutch/trunk/src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/FilteredStringWriter.java
URL: http://svn.apache.org/viewcvs/lucene/nutch/trunk/src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/FilteredStringWriter.java?rev=377501&r1=377500&r2=377501&view=diff
==============================================================================
--- lucene/nutch/trunk/src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/FilteredStringWriter.java (original)
+++ lucene/nutch/trunk/src/plugin/parse-mspowerpoint/src/java/org/apache/nutch/parse/mspowerpoint/FilteredStringWriter.java Mon Feb 13 13:43:15 2006
@@ -23,7 +23,6 @@
*
* @author Stephan Strittmatter - http://www.sybit.de
* @version 1.0
- * @create 19.01.2005
*/
public class FilteredStringWriter extends StringWriter {
@@ -67,4 +66,4 @@
super.write(ch);
}
}
-}
\ No newline at end of file
+}