You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nutch.apache.org by cu...@apache.org on 2005/07/10 23:20:47 UTC
svn commit: r210036 - /lucene/nutch/branches/mapred/src/java/org/apache/nutch/crawl/Fetcher.java
Author: cutting
Date: Sun Jul 10 14:20:46 2005
New Revision: 210036
URL: http://svn.apache.org/viewcvs?rev=210036&view=rev
Log:
Actually use the new InputFormat!
Modified:
lucene/nutch/branches/mapred/src/java/org/apache/nutch/crawl/Fetcher.java
Modified: lucene/nutch/branches/mapred/src/java/org/apache/nutch/crawl/Fetcher.java
URL: http://svn.apache.org/viewcvs/lucene/nutch/branches/mapred/src/java/org/apache/nutch/crawl/Fetcher.java?rev=210036&r1=210035&r2=210036&view=diff
==============================================================================
--- lucene/nutch/branches/mapred/src/java/org/apache/nutch/crawl/Fetcher.java (original)
+++ lucene/nutch/branches/mapred/src/java/org/apache/nutch/crawl/Fetcher.java Sun Jul 10 14:20:46 2005
@@ -38,7 +38,7 @@
public static final String DIGEST_KEY = "nutch.content.digest";
- public class InputFormat extends SequenceFileInputFormat {
+ public static class InputFormat extends SequenceFileInputFormat {
/** Don't split inputs, to keep things polite. */
public FileSplit[] getSplits(NutchFileSystem fs, JobConf job, int nSplits)
throws IOException {
@@ -253,7 +253,7 @@
job.setInt("fetcher.threads.fetch", threads);
job.setInputDir(new File(segment, CrawlDatum.GENERATE_DIR_NAME));
- job.setInputFormat(SequenceFileInputFormat.class);
+ job.setInputFormat(InputFormat.class);
job.setInputKeyClass(UTF8.class);
job.setInputValueClass(CrawlDatum.class);