You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nutch.apache.org by fe...@apache.org on 2012/05/30 11:26:13 UTC
svn commit: r1344168 - in /nutch/branches/nutchgora: CHANGES.txt
src/java/org/apache/nutch/parse/ParseUtil.java
Author: ferdy
Date: Wed May 30 09:26:12 2012
New Revision: 1344168
URL: http://svn.apache.org/viewvc?rev=1344168&view=rev
Log:
NUTCH-1379 NPE when reprUrl is null in ParseUtil
Modified:
nutch/branches/nutchgora/CHANGES.txt
nutch/branches/nutchgora/src/java/org/apache/nutch/parse/ParseUtil.java
Modified: nutch/branches/nutchgora/CHANGES.txt
URL: http://svn.apache.org/viewvc/nutch/branches/nutchgora/CHANGES.txt?rev=1344168&r1=1344167&r2=1344168&view=diff
==============================================================================
--- nutch/branches/nutchgora/CHANGES.txt (original)
+++ nutch/branches/nutchgora/CHANGES.txt Wed May 30 09:26:12 2012
@@ -2,6 +2,8 @@ Nutch Change Log
Release 2.1 (22/02/2012)
+* NUTCH-1379 NPE when reprUrl is null in ParseUtil (ferdy)
+
* NUTCH-1378 HostDb NullPointerException (ferdy)
* NUTCH-XX Commit to add configuration for separation of ant distribution targets (lewismc + jnioche)
Modified: nutch/branches/nutchgora/src/java/org/apache/nutch/parse/ParseUtil.java
URL: http://svn.apache.org/viewvc/nutch/branches/nutchgora/src/java/org/apache/nutch/parse/ParseUtil.java?rev=1344168&r1=1344167&r2=1344168&view=diff
==============================================================================
--- nutch/branches/nutchgora/src/java/org/apache/nutch/parse/ParseUtil.java (original)
+++ nutch/branches/nutchgora/src/java/org/apache/nutch/parse/ParseUtil.java Wed May 30 09:26:12 2012
@@ -209,7 +209,12 @@ public class ParseUtil extends Configure
String reprUrl = URLUtil.chooseRepr(url, newUrl,
refreshTime < FetcherJob.PERM_REFRESH_TIME);
WebPage newWebPage = new WebPage();
- page.setReprUrl(new Utf8(reprUrl));
+ if (reprUrl == null) {
+ LOG.warn("reprUrl==null for " + url);
+ return redirectedPage;
+ } else {
+ page.setReprUrl(new Utf8(reprUrl));
+ }
page.putToMetadata(FetcherJob.REDIRECT_DISCOVERED, TableUtil.YES_VAL);
redirectedPage = new URLWebPage(reprUrl, newWebPage);
}