You are viewing a plain text version of this content. The canonical link for it is here.
Posted to dev@xalan.apache.org by "Andrei Gheorghe (JIRA)" <ji...@apache.org> on 2014/07/23 15:23:39 UTC
[jira] [Updated] (XALANC-756) FormatterToXML throws exception for
valid XML
[ https://issues.apache.org/jira/browse/XALANC-756?page=com.atlassian.jira.plugin.system.issuetabpanels:all-tabpanel ]
Andrei Gheorghe updated XALANC-756:
-----------------------------------
Description:
Xalan-C++ throws SAXException for this XML:
{code}<?xml version="1.0" encoding="UTF-8"?><elem attr="
"/>{code}
This XML is valid according to all the validators I have tried.
This issue can be reproduced using the following test program.
I also supplied a patch to show where the problem originates and which seems to solve the issue.
{code:title=test.cpp|borderStyle=solid}
#include <xercesc/util/PlatformUtils.hpp>
#include <xercesc/framework/MemBufInputSource.hpp>
#include <xercesc/parsers/XercesDOMParser.hpp>
#include <xalanc/XercesParserLiaison/XercesDocumentWrapper.hpp>
#include <xalanc/PlatformSupport/XalanStdOutputStream.hpp>
#include <xalanc/PlatformSupport/XalanOutputStreamPrintWriter.hpp>
#include <xalanc/XMLSupport/FormatterToXML.hpp>
#include <xalanc/XMLSupport/FormatterTreeWalker.hpp>
#include <sstream>
#include <iostream>
XERCES_CPP_NAMESPACE_USE
XALAN_CPP_NAMESPACE_USE
using namespace std;
int main()
{
try
{
XMLPlatformUtils::Initialize();
string testXML = "<?xml version=\"1.0\" encoding=\"UTF-8\"?><elem attr=\"
\"/>";
MemBufInputSource bufferMemSource( ( const XMLByte* )testXML.c_str(), testXML.size(), "testXML", false );
XercesDOMParser parser;
parser.parse(bufferMemSource);
XercesDocumentWrapper docWrapper( *XMLPlatformUtils::fgMemoryManager, parser.getDocument(), true, true, true );
XalanStdOutputStream stream( cout );
XalanOutputStreamPrintWriter printWriter( stream );
FormatterToXML formatter( printWriter );
FormatterTreeWalker walker( formatter );
formatter.setShouldWriteXMLHeader( false );
formatter.startDocument();
walker.traverseSubtree( &docWrapper ); //throws SAXException: 'A' is an invalid Unicode scalar value.
formatter.endDocument();
}
catch ( const exception& )
{}
return 0;
}
{code}
{code}
Index: src/xalanc/XMLSupport/FormatterToXML.cpp
===================================================================
--- src/xalanc/XMLSupport/FormatterToXML.cpp (revision 1612825)
+++ src/xalanc/XMLSupport/FormatterToXML.cpp (working copy)
@@ -910,7 +910,7 @@
{
if(ch < 0x20 )
{
- if(m_isXML1_1)
+ if(ch == 0x9 || ch == 0xA || ch == 0xD || m_isXML1_1)
{
writeNumberedEntityReference(ch);
}
{code}
was:
Xalan-C++ throws SAXException for this XML: <?xml version="1.0" encoding="UTF-8"?><elem attr="
"/>
This XML is valid according to all the validators I have tried.
This issue can be reproduced using the following test program.
I also supplied a patch to show where the problem originates and which seems to solve the issue.
{code:title=test.cpp|borderStyle=solid}
#include <xercesc/util/PlatformUtils.hpp>
#include <xercesc/framework/MemBufInputSource.hpp>
#include <xercesc/parsers/XercesDOMParser.hpp>
#include <xalanc/XercesParserLiaison/XercesDocumentWrapper.hpp>
#include <xalanc/PlatformSupport/XalanStdOutputStream.hpp>
#include <xalanc/PlatformSupport/XalanOutputStreamPrintWriter.hpp>
#include <xalanc/XMLSupport/FormatterToXML.hpp>
#include <xalanc/XMLSupport/FormatterTreeWalker.hpp>
#include <sstream>
#include <iostream>
XERCES_CPP_NAMESPACE_USE
XALAN_CPP_NAMESPACE_USE
using namespace std;
int main()
{
try
{
XMLPlatformUtils::Initialize();
string testXML = "<?xml version=\"1.0\" encoding=\"UTF-8\"?><elem attr=\"
\"/>";
MemBufInputSource bufferMemSource( ( const XMLByte* )testXML.c_str(), testXML.size(), "testXML", false );
XercesDOMParser parser;
parser.parse(bufferMemSource);
XercesDocumentWrapper docWrapper( *XMLPlatformUtils::fgMemoryManager, parser.getDocument(), true, true, true );
XalanStdOutputStream stream( cout );
XalanOutputStreamPrintWriter printWriter( stream );
FormatterToXML formatter( printWriter );
FormatterTreeWalker walker( formatter );
formatter.setShouldWriteXMLHeader( false );
formatter.startDocument();
walker.traverseSubtree( &docWrapper ); //throws SAXException: 'A' is an invalid Unicode scalar value.
formatter.endDocument();
}
catch ( const exception& )
{}
return 0;
}
{code}
{code}
Index: src/xalanc/XMLSupport/FormatterToXML.cpp
===================================================================
--- src/xalanc/XMLSupport/FormatterToXML.cpp (revision 1612825)
+++ src/xalanc/XMLSupport/FormatterToXML.cpp (working copy)
@@ -910,7 +910,7 @@
{
if(ch < 0x20 )
{
- if(m_isXML1_1)
+ if(ch == 0x9 || ch == 0xA || ch == 0xD || m_isXML1_1)
{
writeNumberedEntityReference(ch);
}
{code}
> FormatterToXML throws exception for valid XML
> ---------------------------------------------
>
> Key: XALANC-756
> URL: https://issues.apache.org/jira/browse/XALANC-756
> Project: XalanC
> Issue Type: Bug
> Reporter: Andrei Gheorghe
> Assignee: Steven J. Hathaway
>
> Xalan-C++ throws SAXException for this XML:
> {code}<?xml version="1.0" encoding="UTF-8"?><elem attr="
"/>{code}
> This XML is valid according to all the validators I have tried.
> This issue can be reproduced using the following test program.
> I also supplied a patch to show where the problem originates and which seems to solve the issue.
> {code:title=test.cpp|borderStyle=solid}
> #include <xercesc/util/PlatformUtils.hpp>
> #include <xercesc/framework/MemBufInputSource.hpp>
> #include <xercesc/parsers/XercesDOMParser.hpp>
> #include <xalanc/XercesParserLiaison/XercesDocumentWrapper.hpp>
> #include <xalanc/PlatformSupport/XalanStdOutputStream.hpp>
> #include <xalanc/PlatformSupport/XalanOutputStreamPrintWriter.hpp>
> #include <xalanc/XMLSupport/FormatterToXML.hpp>
> #include <xalanc/XMLSupport/FormatterTreeWalker.hpp>
> #include <sstream>
> #include <iostream>
> XERCES_CPP_NAMESPACE_USE
> XALAN_CPP_NAMESPACE_USE
> using namespace std;
> int main()
> {
> try
> {
> XMLPlatformUtils::Initialize();
> string testXML = "<?xml version=\"1.0\" encoding=\"UTF-8\"?><elem attr=\"
\"/>";
> MemBufInputSource bufferMemSource( ( const XMLByte* )testXML.c_str(), testXML.size(), "testXML", false );
> XercesDOMParser parser;
> parser.parse(bufferMemSource);
> XercesDocumentWrapper docWrapper( *XMLPlatformUtils::fgMemoryManager, parser.getDocument(), true, true, true );
> XalanStdOutputStream stream( cout );
> XalanOutputStreamPrintWriter printWriter( stream );
> FormatterToXML formatter( printWriter );
> FormatterTreeWalker walker( formatter );
> formatter.setShouldWriteXMLHeader( false );
> formatter.startDocument();
> walker.traverseSubtree( &docWrapper ); //throws SAXException: 'A' is an invalid Unicode scalar value.
> formatter.endDocument();
> }
> catch ( const exception& )
> {}
> return 0;
> }
> {code}
> {code}
> Index: src/xalanc/XMLSupport/FormatterToXML.cpp
> ===================================================================
> --- src/xalanc/XMLSupport/FormatterToXML.cpp (revision 1612825)
> +++ src/xalanc/XMLSupport/FormatterToXML.cpp (working copy)
> @@ -910,7 +910,7 @@
> {
> if(ch < 0x20 )
> {
> - if(m_isXML1_1)
> + if(ch == 0x9 || ch == 0xA || ch == 0xD || m_isXML1_1)
> {
> writeNumberedEntityReference(ch);
> }
> {code}
--
This message was sent by Atlassian JIRA
(v6.2#6252)
---------------------------------------------------------------------
To unsubscribe, e-mail: dev-unsubscribe@xalan.apache.org
For additional commands, e-mail: dev-help@xalan.apache.org