You are viewing a plain text version of this content. The canonical link for it is here.
Posted to cvs@cocoon.apache.org by cd...@apache.org on 2012/11/23 20:26:48 UTC

svn commit: r1413037 - /cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java

Author: cdamioli
Date: Fri Nov 23 19:26:46 2012
New Revision: 1413037

URL: http://svn.apache.org/viewvc?rev=1413037&view=rev
Log:
COCOON-2002 HTML transformer only works with latin-1 characters

Modified:
    cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java

Modified: cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java
URL: http://svn.apache.org/viewvc/cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java?rev=1413037&r1=1413036&r2=1413037&view=diff
==============================================================================
--- cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java (original)
+++ cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java Fri Nov 23 19:26:46 2012
@@ -170,7 +170,7 @@ public class HTMLTransformer
 
             // Extract the document using JTidy and stream it.
             ByteArrayInputStream bais =
-                new ByteArrayInputStream(text.getBytes());
+                new ByteArrayInputStream(text.getBytes("UTF-8"));
             org.w3c.dom.Document doc =
                 tidy.parseDOM(new BufferedInputStream(bais), null);