You are viewing a plain-text version of this content. The canonical link to the original message was not preserved in this copy.
Posted to commits@nutch.apache.org by ta...@apache.org on 2014/05/03 17:26:38 UTC
svn commit: r1592218 - in /nutch/branches/2.x: CHANGES.txt
src/java/org/apache/nutch/fetcher/FetcherJob.java
Author: talat
Date: Sat May 3 15:26:38 2014
New Revision: 1592218
URL: http://svn.apache.org/r1592218
Log:
NUTCH-1618 Turn speculative execution off for Fetching (talat)
Modified:
nutch/branches/2.x/CHANGES.txt
nutch/branches/2.x/src/java/org/apache/nutch/fetcher/FetcherJob.java
Modified: nutch/branches/2.x/CHANGES.txt
URL: http://svn.apache.org/viewvc/nutch/branches/2.x/CHANGES.txt?rev=1592218&r1=1592217&r2=1592218&view=diff
==============================================================================
--- nutch/branches/2.x/CHANGES.txt (original)
+++ nutch/branches/2.x/CHANGES.txt Sat May 3 15:26:38 2014
@@ -2,6 +2,8 @@ Nutch Change Log
Current Development
+* NUTCH-1618 Turn speculative execution off for Fetching (talat)
+
* NUTCH-1657 ORIGINAL_CHAR_ENCODING and CHAR_ENCODING_FOR_CONVERSION never set in HTMLParser (talat)
* NUTCH-1725 CleaningJob's reducer does not commit deleted docs. (ilhamikalkan via talat)
Modified: nutch/branches/2.x/src/java/org/apache/nutch/fetcher/FetcherJob.java
URL: http://svn.apache.org/viewvc/nutch/branches/2.x/src/java/org/apache/nutch/fetcher/FetcherJob.java?rev=1592218&r1=1592217&r2=1592218&view=diff
==============================================================================
--- nutch/branches/2.x/src/java/org/apache/nutch/fetcher/FetcherJob.java (original)
+++ nutch/branches/2.x/src/java/org/apache/nutch/fetcher/FetcherJob.java Sat May 3 15:26:38 2014
@@ -183,6 +183,10 @@ public class FetcherJob extends NutchToo
LOG.info("FetcherJob : timelimit set for : " + getConf().getLong("fetcher.timelimit", -1));
numJobs = 1;
currentJob = new NutchJob(getConf(), "fetch");
+
+ // for politeness, don't permit parallel execution of a single task
+ currentJob.setReduceSpeculativeExecution(false);
+
Collection<WebPage.Field> fields = getFields(currentJob);
StorageUtils.initMapperJob(currentJob, fields, IntWritable.class,
FetchEntry.class, FetcherMapper.class, FetchEntryPartitioner.class, false);