summaryrefslogtreecommitdiffstats
path: root/unoxml
diff options
context:
space:
mode:
authorRĂ¼diger Timm <rt@openoffice.org>2008-06-06 11:06:04 +0000
committerRĂ¼diger Timm <rt@openoffice.org>2008-06-06 11:06:04 +0000
commit4ed1bf8f9a8b350b6255a9e63cd5d8b8a631adfe (patch)
tree8ae2c806f9f48e9bab11a49e2561a0ba827415dc /unoxml
parentINTEGRATION: CWS xmlfix2 (1.10.2); FILE MERGED (diff)
downloadcore-4ed1bf8f9a8b350b6255a9e63cd5d8b8a631adfe.tar.gz
core-4ed1bf8f9a8b350b6255a9e63cd5d8b8a631adfe.zip
INTEGRATION: CWS xmlfix2 (1.3.50); FILE MERGED
2008/05/15 17:26:26 mst 1.3.50.6: RESYNC: (1.4-1.5); FILE MERGED 2008/04/22 11:38:14 mst 1.3.50.5: - unoxml/source/dom/documentbuilder.cxx: + fix build with gcc 4.3: include string.h 2008/04/01 08:36:53 mst 1.3.50.4: - unoxml/source/dom/documentbuilder.cxx: + wntmsci11 warning fixes 2008/03/31 14:19:29 mst 1.3.50.3: - unoxml/source/dom/{document.hxx,node.hxx,documentbuilder{.hxx,.cxx}}: + fix mess resulting from "using namespace rtl" 2008/03/26 15:07:48 mst 1.3.50.2: RESYNC: (1.3-1.4); FILE MERGED 2007/11/14 14:28:38 lo 1.3.50.1: parser improvements
Diffstat (limited to 'unoxml')
-rw-r--r--unoxml/source/dom/documentbuilder.cxx331
1 files changed, 302 insertions, 29 deletions
diff --git a/unoxml/source/dom/documentbuilder.cxx b/unoxml/source/dom/documentbuilder.cxx
index 30d71b4d6042..d556b431385e 100644
--- a/unoxml/source/dom/documentbuilder.cxx
+++ b/unoxml/source/dom/documentbuilder.cxx
@@ -7,7 +7,7 @@
* OpenOffice.org - a multi-platform office productivity suite
*
* $RCSfile: documentbuilder.cxx,v $
- * $Revision: 1.5 $
+ * $Revision: 1.6 $
*
* This file is part of OpenOffice.org.
*
@@ -32,10 +32,81 @@
#include "node.hxx"
#include "document.hxx"
+#include <rtl/alloc.h>
+#include <rtl/memory.h>
+#include <rtl/ustrbuf.hxx>
+
+#include <cppuhelper/implbase1.hxx>
+
+#include <libxml/xmlerror.h>
+
+#include <com/sun/star/xml/sax/SAXParseException.hpp>
+#include <com/sun/star/ucb/XCommandEnvironment.hpp>
+#include <com/sun/star/task/XInteractionHandler.hpp>
+#include <ucbhelper/content.hxx>
+#include <ucbhelper/commandenvironment.hxx>
+
+#include <string.h>
+#include <stdio.h>
+#include <stdarg.h>
+
+
+using ::rtl::OUStringBuffer;
+using ::rtl::OString;
+using ::com::sun::star::xml::sax::InputSource;
+using namespace ucbhelper;
+using namespace ::com::sun::star::ucb;
+using ::com::sun::star::task::XInteractionHandler;
+
+
namespace DOM
{
+ extern "C" {
+ //char *strdup(const char *s);
+ /*
+ static char* strdupfunc(const char* s)
+ {
+ sal_Int32 len = 0;
+ while (s[len] != '\0') len++;
+ char *newStr = (char*)rtl_allocateMemory(len+1);
+ if (newStr != NULL)
+ rtl_copyMemory(newStr, s, len+1);
+ return newStr;
+ }
+ */
+ }
+
+
+ class CDefaultEntityResolver : public cppu::WeakImplHelper1< XEntityResolver >
+ {
+ public:
+ virtual InputSource SAL_CALL resolveEntity( const OUString& sPublicId, const OUString& sSystemId )
+ throw (::com::sun::star::uno::RuntimeException)
+ {
+ InputSource is;
+ is.sPublicId = sPublicId;
+ is.sSystemId = sSystemId;
+ is.sEncoding = OUString();
+
+ try {
+ Reference< XCommandEnvironment > aEnvironment(
+ new CommandEnvironment(Reference< XInteractionHandler >(),
+ Reference< XProgressHandler >() ));
+ Content aContent(sSystemId, aEnvironment);
+
+ is.aInputStream = aContent.openStream();
+ } catch (com::sun::star::uno::Exception) {
+ OSL_ENSURE(sal_False, "exception in default entity resolver");
+ is.aInputStream = Reference< XInputStream >();
+ }
+ return is;
+ }
+
+ };
+
CDocumentBuilder::CDocumentBuilder(const Reference< XMultiServiceFactory >& xFactory)
: m_aFactory(xFactory)
+ , m_aEntityResolver(Reference< XEntityResolver > (new CDefaultEntityResolver()))
{
// init libxml. libxml will protect itself against multiple
// initializations so there is no problem here if this gets
@@ -119,41 +190,243 @@ namespace DOM
return Reference< XDocument >(static_cast< CDocument* >(CNode::get((xmlNodePtr)pDocument)));
}
- Reference< XDocument > SAL_CALL CDocumentBuilder::parse(const Reference< XInputStream >& is)
- throw (RuntimeException)
+ static OUString make_error_message(xmlParserCtxtPtr ctxt)
{
- sal_Int32 bsize = 4096;
- char* buffer = (char*)rtl_allocateMemory(bsize);
- sal_Int32 nbytes = 0;
- sal_Int32 nread = 0;
- sal_Int32 csize = bsize;
- Sequence< sal_Int8 > chunk(csize);
- do
+ OUStringBuffer buf;
+ buf.appendAscii(ctxt->lastError.message);
+ buf.appendAscii("Line: ");
+ buf.append(static_cast<sal_Int32>(ctxt->lastError.line));
+ buf.appendAscii("\nColumn: ");
+ buf.append(static_cast<sal_Int32>(ctxt->lastError.int2));
+ OUString msg = buf.makeStringAndClear();
+ return msg;
+ }
+
+ // -- callbacks and context struct for parsing from stream
+ // -- c-linkage, so the callbacks can be used by libxml
+ extern "C" {
+
+ // context struct passed to IO functions
+ typedef struct context {
+ CDocumentBuilder *pBuilder;
+ Reference< XInputStream > rInputStream;
+ bool close;
+ bool freeOnClose;
+ } context_t;
+
+ static int xmlIO_read_func( void *context, char *buffer, int len)
+ {
+ // get the context...
+ context_t *pctx = static_cast<context_t*>(context);
+ if (!pctx->rInputStream.is())
+ return -1;
+ try {
+ // try to read the requested number of bytes
+ Sequence< sal_Int8 > chunk(len);
+ int nread = pctx->rInputStream->readBytes(chunk, len);
+
+ // copy bytes to the provided buffer
+ rtl_copyMemory(buffer, chunk.getConstArray(), nread);
+ return nread;
+ } catch (com::sun::star::uno::Exception& ex) {
+ (void) ex;
+ OSL_ENSURE(sal_False, OUStringToOString(ex.Message, RTL_TEXTENCODING_UTF8).getStr());
+ return -1;
+ }
+ }
+
+ static int xmlIO_close_func(void* context)
+ {
+ // get the context...
+ context_t *pctx = static_cast<context_t*>(context);
+ if (!pctx->rInputStream.is())
+ return 0;
+ try
{
- // read mac csize bytes
- nread = is->readBytes(chunk, csize);
- // grow buffer?
- if ((nbytes + nread) > bsize)
- {
- bsize = 2*bsize;
- char *new_buffer = (char*)rtl_reallocateMemory(buffer, bsize);
- if (new_buffer == 0)
- throw RuntimeException();
- buffer = new_buffer;
- }
- // copy bytes to buffer
- rtl_copyMemory(buffer+nbytes, chunk.getConstArray(), nread);
- nbytes += nread;
+ if (pctx->close)
+ pctx->rInputStream->closeInput();
+ if (pctx->freeOnClose)
+ delete pctx;
+ return 0;
+ } catch (com::sun::star::uno::Exception& ex) {
+ (void) ex;
+ OSL_ENSURE(sal_False, OUStringToOString(ex.Message, RTL_TEXTENCODING_UTF8).getStr());
+ return -1;
+ }
+ }
+
+ static xmlParserInputPtr resolve_func(void *ctx,
+ const xmlChar *publicId,
+ const xmlChar *systemId)
+ {
+ // get the CDocumentBuilder object
+ xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr)ctx;
+ CDocumentBuilder *builder = static_cast< CDocumentBuilder* >(ctxt->_private);
+ Reference< XEntityResolver > resolver = builder->getEntityResolver();
+ OUString sysid;
+ if (systemId != 0)
+ sysid = OUString((sal_Char*)systemId, strlen((char*)systemId), RTL_TEXTENCODING_UTF8);
+ OUString pubid;
+ if (publicId != 0)
+ pubid = OUString((sal_Char*)publicId, strlen((char*)publicId), RTL_TEXTENCODING_UTF8);
+
+ // resolve the entity
+ InputSource src = resolver->resolveEntity(pubid, sysid);
+
+ // create IO context on heap because this call will no longer be on the stack
+ // when IO is actually performed through the callbacks. The close function must
+ // free the memory which is indicated by the freeOnClose field in the context struct
+ context_t *c = new context_t;
+ c->pBuilder = builder;
+ c->rInputStream = src.aInputStream;
+ c->close = true;
+ c->freeOnClose = true;
+
+ // set up the inputBuffer and inputPtr for libxml
+ xmlParserInputBufferPtr pBuffer =
+ xmlParserInputBufferCreateIO(xmlIO_read_func, xmlIO_close_func, c, XML_CHAR_ENCODING_NONE);
+ xmlParserInputPtr pInput =
+ xmlNewIOInputStream(ctxt, pBuffer, XML_CHAR_ENCODING_NONE);
+ return pInput;
+ }
+
+ static xmlParserInputPtr external_entity_loader(const char *URL, const char * /*ID*/, xmlParserCtxtPtr ctxt)
+ {
+ // just call our resolver function using the URL as systemId
+ return resolve_func(ctxt, 0, (const xmlChar*)URL);
+ }
+
+ // default warning handler triggers assertion
+ static void warning_func(void * ctx, const char * /*msg*/, ...)
+ {
+ OUStringBuffer buf(OUString::createFromAscii("libxml2 warning\n"));
+ buf.append(make_error_message(static_cast< xmlParserCtxtPtr >(ctx)));
+ OString msg = OUStringToOString(buf.makeStringAndClear(), RTL_TEXTENCODING_ASCII_US);
+ OSL_ENSURE(sal_False, msg.getStr());
+ }
+
+ // default error handler triggers assertion
+ static void error_func(void * ctx, const char * /*msg*/, ...)
+ {
+ OUStringBuffer buf(OUString::createFromAscii("libxml2 error\n"));
+ buf.append(make_error_message(static_cast< xmlParserCtxtPtr >(ctx)));
+ OString msg = OUStringToOString(buf.makeStringAndClear(), RTL_TEXTENCODING_ASCII_US);
+ OSL_ENSURE(sal_False, msg.getStr());
+ }
+
+ } // extern "C"
+
+ Reference< XDocument > SAL_CALL CDocumentBuilder::parse(const Reference< XInputStream >& is)
+ throw (RuntimeException, SAXParseException, IOException)
+ {
+
+ // encoding...
+ /*
+ xmlChar *encstr = (xmlChar*) OUStringToOString(src.sEncoding, RTL_TEXTENCODING_UTF8).getStr();
+ xmlCharEncoding enc = xmlParseCharEncoding(encstr);
+ */
+
+ xmlParserCtxtPtr ctxt = xmlNewParserCtxt();
+
+ // register error functions to prevent errors being printed
+ // on the console
+ ctxt->_private = this;
+ ctxt->sax->error = error_func;
+ ctxt->sax->warning = warning_func;
+ ctxt->sax->resolveEntity = resolve_func;
+
+ // IO context struct
+ context_t c;
+ c.pBuilder = this;
+ c.rInputStream = is;
+ // we did not open the stream, thus we do not close it.
+ c.close = false;
+ c.freeOnClose = false;
+ xmlDocPtr pDoc = xmlCtxtReadIO(ctxt, xmlIO_read_func, xmlIO_close_func, &c,
+ 0, 0, 0);
+
+ xmlFreeParserCtxt(ctxt);
+ if (pDoc == 0) {
+ OUString msg = make_error_message(ctxt);
+ com::sun::star::xml::sax::SAXParseException saxex;
+ saxex.Message = msg;
+ saxex.LineNumber = static_cast<sal_Int32>(ctxt->lastError.line);
+ saxex.ColumnNumber = static_cast<sal_Int32>(ctxt->lastError.int2);
+ throw saxex;
+ }
+ return Reference< XDocument >(static_cast< CDocument* >(CNode::get((xmlNodePtr)pDoc)));
+ }
+
+ Reference< XDocument > SAL_CALL CDocumentBuilder::parseSource(const InputSource& is)
+ throw (RuntimeException, SAXParseException, IOException)
+ {
+ // if there is an encoding specified in the input source, use it
+ xmlCharEncoding enc = XML_CHAR_ENCODING_NONE;
+ if (is.sEncoding.getLength() > 0) {
+ OString oEncstr = OUStringToOString(is.sEncoding, RTL_TEXTENCODING_UTF8);
+ char *encstr = (char*) oEncstr.getStr();
+ enc = xmlParseCharEncoding(encstr);
}
- while(nread == csize);
- // try to parse the buffer
- xmlDocPtr pDoc = xmlParseMemory(buffer, nbytes);
- // XXX error checking
- rtl_freeMemory(buffer);
+ // set up parser context
+ xmlParserCtxtPtr ctxt = xmlNewParserCtxt();
+ // register error functions to prevent errors being printed
+ // on the console
+ ctxt->_private = this;
+ ctxt->sax->error = error_func;
+ ctxt->sax->warning = warning_func;
+
+ // setup entity resolver binding(s)
+ ctxt->sax->resolveEntity = resolve_func;
+ xmlSetExternalEntityLoader(external_entity_loader);
+
+ // if an input stream is provided, use it
+
+ // use the systemID
+ return Reference< XDocument >();
+ }
+
+ Reference< XDocument > SAL_CALL CDocumentBuilder::parseURI(const OUString& sUri)
+ throw (RuntimeException, SAXParseException, IOException)
+ {
+ xmlParserCtxtPtr ctxt = xmlNewParserCtxt();
+ ctxt->_private = this;
+ ctxt->sax->error = error_func;
+ ctxt->sax->warning = warning_func;
+ ctxt->sax->resolveEntity = resolve_func;
+ // xmlSetExternalEntityLoader(external_entity_loader);
+ OString oUri = OUStringToOString(sUri, RTL_TEXTENCODING_UTF8);
+ char *uri = (char*) oUri.getStr();
+ xmlDocPtr pDoc = xmlCtxtReadFile(ctxt, uri, 0, 0);
+ xmlFreeParserCtxt(ctxt);
+ if (pDoc == 0) {
+ OUString msg = make_error_message(ctxt);
+ com::sun::star::xml::sax::SAXParseException saxex;
+ saxex.Message = msg;
+ saxex.LineNumber = static_cast<sal_Int32>(ctxt->lastError.line);
+ saxex.ColumnNumber = static_cast<sal_Int32>(ctxt->lastError.int2);
+ throw saxex;
+ }
return Reference< XDocument >(static_cast< CDocument* >(CNode::get((xmlNodePtr)pDoc)));
+ }
+ void SAL_CALL CDocumentBuilder::setEntityResolver(const Reference< XEntityResolver >& er)
+ throw (RuntimeException)
+ {
+ m_aEntityResolver = er;
+ }
+
+ Reference< XEntityResolver > SAL_CALL CDocumentBuilder::getEntityResolver()
+ throw (RuntimeException)
+ {
+ return m_aEntityResolver;
}
+
+ void SAL_CALL CDocumentBuilder::setErrorHandler(const Reference< XErrorHandler >& eh)
+ throw (RuntimeException)
+ {
+ m_aErrorHandler = eh;
+ }
}