You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nutch.apache.org by ma...@apache.org on 2012/06/26 11:18:41 UTC

svn commit: r1353884 - /nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java

Author: markus
Date: Tue Jun 26 09:18:40 2012
New Revision: 1353884

URL: http://svn.apache.org/viewvc?rev=1353884&view=rev
Log:
NUTCH-1319 adding test to accommodate HostURLNormalizer

Modified:
    nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java

Modified: nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java
URL: http://svn.apache.org/viewvc/nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java?rev=1353884&r1=1353883&r2=1353884&view=diff
==============================================================================
--- nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java (original)
+++ nutch/trunk/src/test/org/apache/nutch/net/TestURLNormalizers.java Tue Jun 26 09:18:40 2012
@@ -42,12 +42,20 @@ public class TestURLNormalizers extends 
 
     // NUTCH-1011 - Get rid of superfluous slashes
     try {
-      String normalizedSlashes = normalizers.normalize("http://www.example.org//path/to//somewhere.html", URLNormalizers.SCOPE_DEFAULT);
-      assertEquals(normalizedSlashes, "http://www.example.org/path/to/somewhere.html");
+      String normalizedSlashes = normalizers.normalize("http://www.example.com//path/to//somewhere.html", URLNormalizers.SCOPE_DEFAULT);
+      assertEquals(normalizedSlashes, "http://www.example.com/path/to/somewhere.html");
     } catch (MalformedURLException mue) {
       fail(mue.toString());
     }
-
+    
+    // HostNormalizer NUTCH-1319
+    try {
+      String normalizedHost = normalizers.normalize("http://www.example.org//path/to//somewhere.html", URLNormalizers.SCOPE_DEFAULT);
+      assertEquals(normalizedHost, "http://example.org/path/to/somewhere.html");
+    } catch (MalformedURLException mue) {
+      fail(mue.toString());
+    }
+    
     // check the order
     int pos1 = -1, pos2 = -1;
     URLNormalizer[] impls = normalizers.getURLNormalizers(URLNormalizers.SCOPE_DEFAULT);