You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nutch.apache.org by ma...@apache.org on 2012/06/26 11:18:41 UTC
svn commit: r1353884 -
/nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java
Author: markus
Date: Tue Jun 26 09:18:40 2012
New Revision: 1353884
URL: http://svn.apache.org/viewvc?rev=1353884&view=rev
Log:
NUTCH-1319 adding test to accommodate HostURLNormalizer
Modified:
nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java
Modified: nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java
URL: http://svn.apache.org/viewvc/nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java?rev=1353884&r1=1353883&r2=1353884&view=diff
==============================================================================
--- nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java (original)
+++ nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java Tue Jun 26 09:18:40 2012
@@ -42,12 +42,20 @@ public class TestURLNormalizers extends
// NUTCH-1011 - Get rid of superfluous slashes
try {
- String normalizedSlashes = normalizers.normalize("http://www.example.org//path/to//somewhere.html", URLNormalizers.SCOPE_DEFAULT);
- assertEquals(normalizedSlashes, "http://www.example.org/path/to/somewhere.html");
+ String normalizedSlashes = normalizers.normalize("http://www.example.com//path/to//somewhere.html", URLNormalizers.SCOPE_DEFAULT);
+ assertEquals(normalizedSlashes, "http://www.example.com/path/to/somewhere.html");
} catch (MalformedURLException mue) {
fail(mue.toString());
}
-
+
+ // HostNormalizer NUTCH-1319
+ try {
+ String normalizedHost = normalizers.normalize("http://www.example.org//path/to//somewhere.html", URLNormalizers.SCOPE_DEFAULT);
+ assertEquals(normalizedHost, "http://example.org/path/to/somewhere.html");
+ } catch (MalformedURLException mue) {
+ fail(mue.toString());
+ }
+
// check the order
int pos1 = -1, pos2 = -1;
URLNormalizer[] impls = normalizers.getURLNormalizers(URLNormalizers.SCOPE_DEFAULT);