You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nutch.apache.org by do...@apache.org on 2008/09/22 18:43:33 UTC

svn commit: r697896 - in /lucene/nutch/trunk: CHANGES.txt src/java/org/apache/nutch/fetcher/Fetcher.java src/java/org/apache/nutch/fetcher/Fetcher2.java

Author: dogacan
Date: Mon Sep 22 09:43:33 2008
New Revision: 697896

URL: http://svn.apache.org/viewvc?rev=697896&view=rev
Log:
NUTCH-633 - ParseSegment no longer allows reparsing.

Modified:
    lucene/nutch/trunk/CHANGES.txt
    lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher.java
    lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher2.java

Modified: lucene/nutch/trunk/CHANGES.txt
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/CHANGES.txt?rev=697896&r1=697895&r2=697896&view=diff
==============================================================================
--- lucene/nutch/trunk/CHANGES.txt (original)
+++ lucene/nutch/trunk/CHANGES.txt Mon Sep 22 09:43:33 2008
@@ -271,6 +271,9 @@
 99. NUTCH-375 - Add support for Content-Encoding: deflated
     (Pascal Beis, ab)
 
+100. NUTCH-633 - ParseSegment no longer allows reparsing.
+     (dogacan)
+
 Release 0.9 - 2007-04-02
 
  1. Changed log4j confiquration to log to stdout on commandline

Modified: lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher.java
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher.java?rev=697896&r1=697895&r2=697896&view=diff
==============================================================================
--- lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher.java (original)
+++ lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher.java Mon Sep 22 09:43:33 2008
@@ -346,13 +346,10 @@
           }
         }
         
-        if (!parsing) {
-          /* Store status code in content if we are not parsing in fetcher. 
-           * So we can read this value during parsing (as a separate job) and
-           * decide to parse or not.
-           * */
-          content.getMetadata().add(Nutch.FETCH_STATUS_KEY, Integer.toString(status));
-        }
+        /* Store the status code in the content so that we can read this value
+         * during parsing (as a separate job) and decide whether to parse or not.
+         */
+        content.getMetadata().add(Nutch.FETCH_STATUS_KEY, Integer.toString(status));
       }
 
       try {

Modified: lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher2.java
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher2.java?rev=697896&r1=697895&r2=697896&view=diff
==============================================================================
--- lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher2.java (original)
+++ lucene/nutch/trunk/src/java/org/apache/nutch/fetcher/Fetcher2.java Mon Sep 22 09:43:33 2008
@@ -751,13 +751,10 @@
           }
         }
         
-        if (!parsing) {
-          /* Store status code in content if we are not parsing in fetcher. 
-           * So we can read this value during parsing (as a separate job) and
-           * decide to parse or not.
-           * */
-          content.getMetadata().add(Nutch.FETCH_STATUS_KEY, Integer.toString(status));
-        }
+        /* Store the status code in the content so that we can read this value
+         * during parsing (as a separate job) and decide whether to parse or not.
+         */
+        content.getMetadata().add(Nutch.FETCH_STATUS_KEY, Integer.toString(status));
       }
 
       try {