You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nutch.apache.org by do...@apache.org on 2008/09/22 18:43:33 UTC
svn commit: r697896 - in /lucene/nutch/trunk: CHANGES.txt
src/java/org/apache/nutch/fetcher/Fetcher.java
src/java/org/apache/nutch/fetcher/Fetcher2.java
Author: dogacan
Date: Mon Sep 22 09:43:33 2008
New Revision: 697896
URL: http://svn.apache.org/viewvc?rev=697896&view=rev
Log:
NUTCH-633 - ParseSegment no longer allows reparsing.
Modified:
lucene/nutch/trunk/CHANGES.txt
lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher.java
lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher2.java
Modified: lucene/nutch/trunk/CHANGES.txt
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/CHANGES.txt?rev=697896&r1=697895&r2=697896&view=diff
==============================================================================
--- lucene/nutch/trunk/CHANGES.txt (original)
+++ lucene/nutch/trunk/CHANGES.txt Mon Sep 22 09:43:33 2008
@@ -271,6 +271,9 @@
99. NUTCH-375 - Add support for Content-Encoding: deflated
(Pascal Beis, ab)
+100. NUTCH-633 - ParseSegment no longer allows reparsing.
+ (dogacan)
+
Release 0.9 - 2007-04-02
1. Changed log4j configuration to log to stdout on commandline
Modified: lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher.java
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher.java?rev=697896&r1=697895&r2=697896&view=diff
==============================================================================
--- lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher.java (original)
+++ lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher.java Mon Sep 22 09:43:33 2008
@@ -346,13 +346,10 @@
}
}
- if (!parsing) {
- /* Store status code in content if we are not parsing in fetcher.
- * So we can read this value during parsing (as a separate job) and
- * decide to parse or not.
- * */
- content.getMetadata().add(Nutch.FETCH_STATUS_KEY, Integer.toString(status));
- }
+ /* Store status code in content so we can read this value during
+ * parsing (as a separate job) and decide to parse or not.
+ */
+ content.getMetadata().add(Nutch.FETCH_STATUS_KEY, Integer.toString(status));
}
try {
Modified: lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher2.java
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher2.java?rev=697896&r1=697895&r2=697896&view=diff
==============================================================================
--- lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher2.java (original)
+++ lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher2.java Mon Sep 22 09:43:33 2008
@@ -751,13 +751,10 @@
}
}
- if (!parsing) {
- /* Store status code in content if we are not parsing in fetcher.
- * So we can read this value during parsing (as a separate job) and
- * decide to parse or not.
- * */
- content.getMetadata().add(Nutch.FETCH_STATUS_KEY, Integer.toString(status));
- }
+ /* Store status code in content so we can read this value during
+ * parsing (as a separate job) and decide to parse or not.
+ */
+ content.getMetadata().add(Nutch.FETCH_STATUS_KEY, Integer.toString(status));
}
try {