You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@nutch.apache.org by ab...@apache.org on 2006/05/13 01:35:50 UTC

svn commit: r405946 - /lucene/nutch/trunk/src/plugin/parse-html/src/java/org/apache/nutch/parse/html/DOMBuilder.java

Author: ab
Date: Fri May 12 16:35:50 2006
New Revision: 405946

URL: http://svn.apache.org/viewcvs?rev=405946&view=rev
Log:
Fix yet another case where TagSoup supplies invalid parameters.

Modified:
    lucene/nutch/trunk/src/plugin/parse-html/src/java/org/apache/nutch/parse/html/DOMBuilder.java

Modified: lucene/nutch/trunk/src/plugin/parse-html/src/java/org/apache/nutch/parse/html/DOMBuilder.java
URL: http://svn.apache.org/viewcvs/lucene/nutch/trunk/src/plugin/parse-html/src/java/org/apache/nutch/parse/html/DOMBuilder.java?rev=405946&r1=405945&r2=405946&view=diff
==============================================================================
--- lucene/nutch/trunk/src/plugin/parse-html/src/java/org/apache/nutch/parse/html/DOMBuilder.java (original)
+++ lucene/nutch/trunk/src/plugin/parse-html/src/java/org/apache/nutch/parse/html/DOMBuilder.java Fri May 12 16:35:50 2006
@@ -551,7 +551,7 @@
   public void comment(char ch[], int start, int length) throws org.xml.sax.SAXException
   {
     // tagsoup sometimes submits invalid values here
-    if (ch == null || start < 0 || length >= ch.length) return;
+    if (ch == null || start < 0 || length >= (ch.length - start) || length < 0) return;
     append(m_doc.createComment(new String(ch, start, length)));
   }