You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nutch.apache.org by si...@apache.org on 2006/09/19 21:10:12 UTC
svn commit: r447931 - in /lucene/nutch/trunk: ./ src/test/org/apache/nutch/fetcher/ src/testresources/fetch-test-site/
Author: siren
Date: Tue Sep 19 12:10:11 2006
New Revision: 447931
URL: http://svn.apache.org/viewvc?view=rev&rev=447931
Log:
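Fix for the fetcher test case: copy the test resources into the test data directory for the JUnit tests, and count a fetched URL as handled only when its content contains the marker text "Nutch fetcher test page".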
Modified:
lucene/nutch/trunk/build.xml
lucene/nutch/trunk/src/test/org/apache/nutch/fetcher/TestFetcher.java
lucene/nutch/trunk/src/testresources/fetch-test-site/dup_of_pagea.html
lucene/nutch/trunk/src/testresources/fetch-test-site/index.html
lucene/nutch/trunk/src/testresources/fetch-test-site/pagea.html
lucene/nutch/trunk/src/testresources/fetch-test-site/pageb.html
Modified: lucene/nutch/trunk/build.xml
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/build.xml?view=diff&rev=447931&r1=447930&r2=447931
==============================================================================
--- lucene/nutch/trunk/build.xml (original)
+++ lucene/nutch/trunk/build.xml Tue Sep 19 12:10:11 2006
@@ -248,7 +248,12 @@
<delete dir="${test.build.data}"/>
<mkdir dir="${test.build.data}"/>
-
+ <!--
+ copy resources needed in junit tests
+ -->
+ <copy todir="${test.build.data}">
+ <fileset dir="src/testresources" includes="**/*"/>
+ </copy>
<copy file="${test.src.dir}/nutch-site.xml"
todir="${test.build.classes}"/>
Modified: lucene/nutch/trunk/src/test/org/apache/nutch/fetcher/TestFetcher.java
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/test/org/apache/nutch/fetcher/TestFetcher.java?view=diff&rev=447931&r1=447930&r2=447931
==============================================================================
--- lucene/nutch/trunk/src/test/org/apache/nutch/fetcher/TestFetcher.java (original)
+++ lucene/nutch/trunk/src/test/org/apache/nutch/fetcher/TestFetcher.java Tue Sep 19 12:10:11 2006
@@ -110,7 +110,10 @@
UTF8 key=new UTF8();
Content value=new Content();
if(!reader.next(key, value)) break READ;
- handledurls.add(key.toString());
+ String contentString=new String(value.getContent());
+ if(contentString.indexOf("Nutch fetcher test page")!=-1) {
+ handledurls.add(key.toString());
+ }
} while(true);
reader.close();
Modified: lucene/nutch/trunk/src/testresources/fetch-test-site/dup_of_pagea.html
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/testresources/fetch-test-site/dup_of_pagea.html?view=diff&rev=447931&r1=447930&r2=447931
==============================================================================
--- lucene/nutch/trunk/src/testresources/fetch-test-site/dup_of_pagea.html (original)
+++ lucene/nutch/trunk/src/testresources/fetch-test-site/dup_of_pagea.html Tue Sep 19 12:10:11 2006
@@ -5,5 +5,7 @@
<body>
This is page a
<a href="index.html">home</a>
+<hr>
+Nutch fetcher test page
</body>
</html>
Modified: lucene/nutch/trunk/src/testresources/fetch-test-site/index.html
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/testresources/fetch-test-site/index.html?view=diff&rev=447931&r1=447930&r2=447931
==============================================================================
--- lucene/nutch/trunk/src/testresources/fetch-test-site/index.html (original)
+++ lucene/nutch/trunk/src/testresources/fetch-test-site/index.html Tue Sep 19 12:10:11 2006
@@ -7,5 +7,7 @@
<a href="pagea.html">Page a</a>
<a href="pageb.html">Page b</a>
<a href="dup_of_pagea.html">dup of Page a</a>
+<hr>
+Nutch fetcher test page
</body>
</html>
Modified: lucene/nutch/trunk/src/testresources/fetch-test-site/pagea.html
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/testresources/fetch-test-site/pagea.html?view=diff&rev=447931&r1=447930&r2=447931
==============================================================================
--- lucene/nutch/trunk/src/testresources/fetch-test-site/pagea.html (original)
+++ lucene/nutch/trunk/src/testresources/fetch-test-site/pagea.html Tue Sep 19 12:10:11 2006
@@ -5,5 +5,7 @@
<body>
This is page a
<a href="index.html">home</a>
+<hr>
+Nutch fetcher test page
</body>
</html>
Modified: lucene/nutch/trunk/src/testresources/fetch-test-site/pageb.html
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/testresources/fetch-test-site/pageb.html?view=diff&rev=447931&r1=447930&r2=447931
==============================================================================
--- lucene/nutch/trunk/src/testresources/fetch-test-site/pageb.html (original)
+++ lucene/nutch/trunk/src/testresources/fetch-test-site/pageb.html Tue Sep 19 12:10:11 2006
@@ -5,5 +5,7 @@
<body>
This is page b
<a href="index.html">home</a>
+<hr>
+Nutch fetcher test page
</body>
</html>