You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nutch.apache.org by ma...@apache.org on 2011/09/13 20:15:17 UTC
svn commit: r1170282 - in /nutch/branches/branch-1.4: CHANGES.txt
src/java/org/apache/nutch/crawl/CrawlDb.java
Author: markus
Date: Tue Sep 13 18:15:17 2011
New Revision: 1170282
URL: http://svn.apache.org/viewvc?rev=1170282&view=rev
Log:
NUTCH-1110 UpdateDB must not write _SUCCESS file
Modified:
nutch/branches/branch-1.4/CHANGES.txt
nutch/branches/branch-1.4/src/java/org/apache/nutch/crawl/CrawlDb.java
Modified: nutch/branches/branch-1.4/CHANGES.txt
URL: http://svn.apache.org/viewvc/nutch/branches/branch-1.4/CHANGES.txt?rev=1170282&r1=1170281&r2=1170282&view=diff
==============================================================================
--- nutch/branches/branch-1.4/CHANGES.txt (original)
+++ nutch/branches/branch-1.4/CHANGES.txt Tue Sep 13 18:15:17 2011
@@ -2,6 +2,8 @@ Nutch Change Log
Release 1.4 - Current development
+* NUTCH-1110 UpdateDB must not write _success file (markus)
+
* NUTCH-1105 Max content length option for index-basic (markus)
* NUTCH-940 static field plugin (Claudio Martella via lewismc)
Modified: nutch/branches/branch-1.4/src/java/org/apache/nutch/crawl/CrawlDb.java
URL: http://svn.apache.org/viewvc/nutch/branches/branch-1.4/src/java/org/apache/nutch/crawl/CrawlDb.java?rev=1170282&r1=1170281&r2=1170282&view=diff
==============================================================================
--- nutch/branches/branch-1.4/src/java/org/apache/nutch/crawl/CrawlDb.java (original)
+++ nutch/branches/branch-1.4/src/java/org/apache/nutch/crawl/CrawlDb.java Tue Sep 13 18:15:17 2011
@@ -139,6 +139,9 @@ public class CrawlDb extends Configured
job.setOutputKeyClass(Text.class);
job.setOutputValueClass(CrawlDatum.class);
+ // https://issues.apache.org/jira/browse/NUTCH-1110
+ job.setBoolean("mapreduce.fileoutputcommitter.marksuccessfuljobs", false);
+
return job;
}