You are viewing a plain text version of this content. The canonical link for it is here.
Posted to cvs@cocoon.apache.org by cd...@apache.org on 2012/11/23 20:26:48 UTC
svn commit: r1413037 - /cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java
Author: cdamioli
Date: Fri Nov 23 19:26:46 2012
New Revision: 1413037
URL: http://svn.apache.org/viewvc?rev=1413037&view=rev
Log:
COCOON-2002: HTML transformer only works with Latin-1 characters
Modified:
cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java
Modified: cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java
URL: http://svn.apache.org/viewvc/cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java?rev=1413037&r1=1413036&r2=1413037&view=diff
==============================================================================
--- cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java (original)
+++ cocoon/branches/BRANCH_2_1_X/src/blocks/html/java/org/apache/cocoon/transformation/HTMLTransformer.java Fri Nov 23 19:26:46 2012
@@ -170,7 +170,7 @@ public class HTMLTransformer
// Extract the document using JTidy and stream it.
ByteArrayInputStream bais =
- new ByteArrayInputStream(text.getBytes());
+ new ByteArrayInputStream(text.getBytes("UTF-8"));
org.w3c.dom.Document doc =
tidy.parseDOM(new BufferedInputStream(bais), null);