arabica/include/SAX/wrappers/saxxerces.hpp

987 lines
37 KiB
C++
Raw Normal View History

#ifndef ARABICA_SAX_XERCES_H
#define ARABICA_SAX_XERCES_H
//---------------------------------------------------------------------------
// A SAX2 wrapper class for Xerces.
//---------------------------------------------------------------------------
#include <iterator>
#include <memory>
#include <string>
#include <vector>
#include <SAX/Attributes.hpp>
#include <SAX/InputSource.hpp>
#include <SAX/XMLReader.hpp>
#include <SAX/ext/ProgressiveParser.hpp>
#include <SAX/SAXParseException.hpp>
#include <SAX/SAXNotRecognizedException.hpp>
#include <SAX/SAXNotSupportedException.hpp>
#include <SAX/ext/LexicalHandler.hpp>
#include <SAX/ext/DeclHandler.hpp>
#include <SAX/IStreamHandle.hpp>
#include <SAX/wrappers/XercesPropertyNames.hpp>
#include <SAX/wrappers/XercesFeatureNames.hpp>
#include <Arabica/getparam.hpp>
// Xerces Includes
#include <xercesc/util/PlatformUtils.hpp>
#include <xercesc/sax2/SAX2XMLReader.hpp>
#include <xercesc/sax2/XMLReaderFactory.hpp>
#include <xercesc/sax2/ContentHandler.hpp>
#include <xercesc/sax2/LexicalHandler.hpp>
#include <xercesc/sax2/DeclHandler.hpp>
#include <xercesc/sax/Locator.hpp>
#include <xercesc/sax2/Attributes.hpp>
#include <xercesc/sax/EntityResolver.hpp>
#include <xercesc/sax/DTDHandler.hpp>
#include <xercesc/sax/ErrorHandler.hpp>
#include <xercesc/sax/SAXParseException.hpp>
#include <xercesc/util/BinInputStream.hpp>
#include <xercesc/sax/InputSource.hpp>
#include <xercesc/util/TransService.hpp>
#ifndef XERCES_HAS_CPP_NAMESPACE
#define XERCES_CPP_NAMESPACE
#endif
namespace Arabica
{
namespace SAX
{
namespace XercesImpl
{
///////////////////////////////
// Xerces platform initializer
/**
* Class to handle calls to XMLPlatformUtils::Initialize() and
* XMLPlatformUtils::Terminate().
*
* Without such a class, calls to Initialize() and Terminate() may be nested
* and cause evil consequences. Eg. A typical use of the old xerces_wrapper
* could have resulted in:
* <pre>
* // Construct two xerces_wrappers.
* XMLPlatformUtils::Initialize()
* XMLPlatformUtils::Initialize()
*
* // do stuff
*
* // Get rid of one of the xerces_wrappers
* XERCES_CPP_NAMESPACE::XMLPlatformUtils::Terminate()
*
* // do more stuff -- this is _after_ a call to Terminate()...
*
* XMLPlatformUtils::Terminate()
* </pre>
*/
class xerces_initializer
{
public:
xerces_initializer() { doInitialize(); }
~xerces_initializer() { doTerminate(); }
private:
void doInitialize();
void doTerminate();
static int count_;
}; // class xerces_initializer
} // namespace XercesImpl
template<class string_type,
class T0 = Arabica::nil_t,
class T1 = Arabica::nil_t>
class xerces_wrapper : public ProgressiveParser<string_type, typename Arabica::get_string_adaptor<string_type, T0, T1>::type>
{
private:
typedef XMLReaderInterface<string_type, typename Arabica::get_string_adaptor<string_type, T0, T1>::type> XMLReaderT;
typedef typename XMLReaderT::string_adaptor string_adaptor;
public:
typedef typename XMLReaderT::EntityResolverT EntityResolverT;
typedef typename XMLReaderT::DTDHandlerT DTDHandlerT;
typedef typename XMLReaderT::ContentHandlerT ContentHandlerT;
typedef typename XMLReaderT::InputSourceT InputSourceT;
typedef LexicalHandler<string_type, string_adaptor> LexicalHandlerT;
typedef Locator<string_type, string_adaptor> LocatorT;
typedef Attributes<string_type, string_adaptor> AttributesT;
typedef DeclHandler<string_type, string_adaptor> DeclHandlerT;
typedef ErrorHandler<string_type, string_adaptor> ErrorHandlerT;
typedef typename ErrorHandlerT::SAXParseExceptionT SAXParseExceptionT;
typedef SAX::XercesFeatureNames<string_type, string_adaptor> featuresT;
xerces_wrapper();
virtual ~xerces_wrapper();
/////////////////////////////////////////////////
// Configuration
virtual bool getFeature(const string_type& name) const;
virtual void setFeature(const string_type& name, bool value);
/////////////////////////////////////////////////
// Event Handlers
virtual void setEntityResolver(EntityResolverT& resolver) { entityResolverAdaptor_.setEntityResolver(resolver); }
virtual EntityResolverT* getEntityResolver() const { return entityResolverAdaptor_.getEntityResolver(); }
virtual void setDTDHandler(DTDHandlerT& handler) { dtdHandlerAdaptor_.setDTDHandler(handler); }
virtual DTDHandlerT* getDTDHandler() const { return dtdHandlerAdaptor_.getDTDHandler(); }
virtual void setContentHandler(ContentHandlerT& handler) { contentHandlerAdaptor_.setContentHandler(handler); }
virtual ContentHandlerT* getContentHandler() const { return contentHandlerAdaptor_.getContentHandler(); }
virtual void setErrorHandler(ErrorHandlerT& handler) { errorHandlerAdaptor_.setErrorHandler(handler); }
virtual ErrorHandlerT* getErrorHandler() const { return errorHandlerAdaptor_.getErrorHandler(); }
virtual void setDeclHandler(DeclHandlerT& handler) { declHandlerAdaptor_.setDeclHandler(handler); }
virtual DeclHandlerT* getDeclHandler() const { return declHandlerAdaptor_.getDeclHandler(); }
virtual void setLexicalHandler(LexicalHandlerT& handler) { lexicalHandlerAdaptor_.setLexicalHandler(handler); }
virtual LexicalHandlerT* getLexicalHandler() const { return lexicalHandlerAdaptor_.getLexicalHandler(); }
//////////////////////////////////////////////////
// Parsing
virtual void parse(InputSourceT& input);
//////////////////////////////////////////////////
// Progressive Parsing
//////////////////////////////////////////////////
/** @name Progressive Parsing */
//@{
virtual bool parseFirst(const string_type& systemId, XMLPScanToken& toFill)
{
InputSourceT is(systemId);
return parseFirst(is, toFill);
}
virtual bool parseFirst(InputSourceT& input,
XMLPScanToken& toFill);
virtual bool parseNext(XMLPScanToken& token);
virtual void parseReset(XMLPScanToken& token);
//@}
private:
///////////////////////////////
// String adaptor for XMLCh
// * For the null-terminated version, we convert the array of XMLCh to a
// null-terminated vector of wchar_t. We then pass &vector[0] to the
// parent method.
// * For the known length version, we convert the the array of XMLCh to a
// vector of wchar_t. We then pass &vector[0] and length to the parent
// method.
template<typename char_type>
class xerces_string_janitor
{
// Ordinarily you'd expect to be able to use Xerces' Array janitor class. However,
// Windows exes and dlls use seperate heaps, so you can't delete in one module that
// was allocated by another. It's a pita. The solution here is to use XMLString::release.
// Although this simply does a delete[], the deletion occurs in the Xerces DLL, so
// it will work correctly.
public:
xerces_string_janitor(char_type* ptr) : ptr_(ptr) { }
~xerces_string_janitor() { XERCES_CPP_NAMESPACE::XMLString::release(&ptr_); }
char_type const* const get() const { return ptr_; }
private:
char_type* ptr_;
xerces_string_janitor(const xerces_string_janitor&);
xerces_string_janitor& operator=(const xerces_string_janitor&) const;
}; // class xerces_string_janitor
class xerces_string_adaptor : public string_adaptor
{
public:
typedef typename string_adaptor::value_type value_type;
typedef string_adaptor base;
#ifndef ARABICA_NO_WCHAR_T
static string_type makeStringT(const XMLCh* str)
{
return makeStringT(str, XERCES_CPP_NAMESPACE::XMLString::stringLen(str));
} // makeStringT
static string_type makeStringT(const XMLCh* str, int length)
{
if(str && length)
{
std::vector<wchar_t> buffer;
std::copy(str, str+length, inserter(buffer, buffer.begin()));
return base::construct_from_utf16(&buffer[0], length);
}
else
return string_type();
} // makeStringT
#else
// alternative version for the wchar_t impaired
static string_type makeStringT(const XMLCh* str, unsigned int inputLength)
{
static XMLByte outBuff[4096];
string_type out;
unsigned int outputLength;
unsigned int eaten = 0;
unsigned int offset = 0;
while(inputLength)
{
outputLength = transcoder_->transcodeTo(str+offset,
inputLength,
outBuff, 1024,
eaten,
XERCES_CPP_NAMESPACE::XMLTranscoder::UnRep_RepChar);
base::append(out, construct_from_XMLByte(outBuff, outputLength));
offset += eaten;
inputLength -= eaten;
}
return out;
} // makeStringT
static string_type makeStringT(const XMLCh* str)
{
return makeStringT(str, XERCES_CPP_NAMESPACE::XMLString::stringLen(str));
} // makeStringT
static string_type construct_from_XMLByte(const XMLByte* bytes, int length)
{
return base::construct_from_utf8(reinterpret_cast<const char*>(bytes), length);
} // construct_from_XMLByte
static std::unique_ptr<XERCES_CPP_NAMESPACE::XMLTranscoder> transcoder_;
static void kickoff()
{
XERCES_CPP_NAMESPACE::XMLTransService::Codes res;
transcoder_.reset(XERCES_CPP_NAMESPACE::XMLPlatformUtils::fgTransService->makeNewTranscoderFor(XERCES_CPP_NAMESPACE::XMLRecognizer::UTF_8, res, 4096, XERCES_CPP_NAMESPACE::XMLPlatformUtils::fgMemoryManager));
}
static void shutdown()
{
transcoder_.reset(0);
} // shutdown
#endif
static XMLCh* asXMLChString(const string_type& s)
{
std::string str = base::asStdString(s);
return XERCES_CPP_NAMESPACE::XMLString::transcode(str.c_str());
} // asXMLChString
}; // class xerces_string_adaptor
typedef xerces_string_adaptor XSA;
///////////////////////////////
// Adaptors
class LocatorAdaptor : public LocatorT
{
public:
LocatorAdaptor() : locator_(0) { }
LocatorAdaptor(const XERCES_CPP_NAMESPACE::Locator* const locator) : locator_(locator) { }
~LocatorAdaptor() { }
string_type getPublicId() const
{
if(!locator_)
return string_type();
return xerces_string_adaptor::makeStringT(locator_->getPublicId());
} // getPublicId
string_type getSystemId() const
{
if(!locator_)
return string_type();
return XSA::makeStringT(locator_->getSystemId());
} // getSystemId
size_t getLineNumber() const
{
if(!locator_)
return -1;
return static_cast<size_t>(locator_->getLineNumber());
} // getLineNumber
size_t getColumnNumber() const
{
if(!locator_)
return -1;
return static_cast<size_t>(locator_->getColumnNumber());
} // getColumnNumber
void setLocator(const XERCES_CPP_NAMESPACE::Locator* const locator)
{
locator_ = locator;
} // setLocator
private:
const XERCES_CPP_NAMESPACE::Locator* locator_;
}; // class LocatorAdaptor
class EntityResolverAdaptor : public XERCES_CPP_NAMESPACE::EntityResolver
{
public:
EntityResolverAdaptor() : entityResolverHandler_(0) { }
~EntityResolverAdaptor() { }
void setEntityResolver(EntityResolverT& handler)
{
entityResolverHandler_ = &handler;
}
EntityResolverT* getEntityResolver() const
{
return entityResolverHandler_;
}
virtual XERCES_CPP_NAMESPACE::InputSource* resolveEntity(const XMLCh* const publicId,
const XMLCh* const systemId)
{
InputSourceT source;
if(entityResolverHandler_)
{
source = entityResolverHandler_->resolveEntity(XSA::makeStringT(publicId),
XSA::makeStringT(systemId));
}
// If all of these are empty, the EntityResolver has requested that we
// use the default entity resolver.
if ((source.getByteStream() == 0) &&
(XSA::empty(source.getPublicId())) &&
(XSA::empty(source.getSystemId())))
{
// Xerces-C takes a NULL (0) return to mean "use the default entity
// resolver".
return 0;
}
else
{
return new InputSourceAdaptor(source);
}
}
private:
EntityResolverT* entityResolverHandler_;
}; // class EntityResolverAdaptor
class DTDHandlerAdaptor : public XERCES_CPP_NAMESPACE::DTDHandler
{
public:
DTDHandlerAdaptor() : dtdHandler_(0) { }
~DTDHandlerAdaptor() { }
void setDTDHandler(DTDHandlerT& handler) { dtdHandler_ = &handler; }
DTDHandlerT* getDTDHandler() const { return dtdHandler_; }
virtual void notationDecl(const XMLCh* const name,
const XMLCh* const publicId,
const XMLCh* const systemId)
{
if(dtdHandler_)
dtdHandler_->notationDecl(XSA::makeStringT(name),
XSA::makeStringT(publicId),
XSA::makeStringT(systemId));
} // notationDecl
virtual void unparsedEntityDecl(const XMLCh* const name,
const XMLCh* const publicId,
const XMLCh* const systemId,
const XMLCh* const notationName)
{
if(dtdHandler_)
dtdHandler_->unparsedEntityDecl(XSA::makeStringT(name),
XSA::makeStringT(publicId),
XSA::makeStringT(systemId),
XSA::makeStringT(notationName));
} // unparsedEntityDecl
virtual void resetDocType()
{
// no op
} // resetDocType
private:
DTDHandlerT* dtdHandler_;
}; // class DTDHandlerAdaptor
class ContentHandlerAdaptor : public XERCES_CPP_NAMESPACE::ContentHandler
{
public:
ContentHandlerAdaptor() : contentHandler_(0) { }
~ContentHandlerAdaptor() { }
void setContentHandler(ContentHandlerT& handler) { contentHandler_ = &handler; }
ContentHandlerT* getContentHandler() const { return contentHandler_; }
virtual void setDocumentLocator(const XERCES_CPP_NAMESPACE::Locator* const locator)
{
locator_.setLocator(locator);
if(contentHandler_)
contentHandler_->setDocumentLocator(locator_);
} // putDocumentLocation
virtual void startDocument()
{
if(contentHandler_)
contentHandler_->startDocument();
} // startDocument
virtual void endDocument()
{
if(contentHandler_)
contentHandler_->endDocument();
} // endDocument
virtual void startPrefixMapping(const XMLCh* const prefix, const XMLCh* const uri)
{
if(contentHandler_)
contentHandler_->startPrefixMapping(XSA::makeStringT(prefix), XSA::makeStringT(uri));
} // startPrefixMapping
virtual void endPrefixMapping(const XMLCh* const prefix)
{
if(contentHandler_)
contentHandler_->endPrefixMapping(XSA::makeStringT(prefix));
} // endPrefixMapping
virtual void startElement(const XMLCh* const namespaceUri,
const XMLCh* const localName,
const XMLCh* const rawName,
const XERCES_CPP_NAMESPACE::Attributes& attrs)
{
if(contentHandler_)
{
AttributesAdaptor attrAdaptor(attrs);
contentHandler_->startElement(XSA::makeStringT(namespaceUri),
XSA::makeStringT(localName),
XSA::makeStringT(rawName),
attrAdaptor);
} // if ...
} // startElement
virtual void endElement(const XMLCh* const namespaceUri,
const XMLCh* const localName,
const XMLCh* const rawName)
{
if(contentHandler_)
contentHandler_->endElement(XSA::makeStringT(namespaceUri),
XSA::makeStringT(localName),
XSA::makeStringT(rawName));
} // endElement
virtual void characters(const XMLCh* const chars, const XMLSize_t length)
{
if(contentHandler_)
contentHandler_->characters(XSA::makeStringT(chars, length));
} // characters
virtual void ignorableWhitespace(const XMLCh* const chars, const XMLSize_t length)
{
if(contentHandler_)
contentHandler_->ignorableWhitespace(XSA::makeStringT(chars, length));
} // ignorableWhitespace
virtual void processingInstruction(const XMLCh* const target,
const XMLCh* const data)
{
if(contentHandler_)
contentHandler_->processingInstruction(XSA::makeStringT(target),
XSA::makeStringT(data));
} // processingInstruction
virtual void skippedEntity(const XMLCh* const name)
{
if(contentHandler_)
contentHandler_->skippedEntity(XSA::makeStringT(name));
} // skippedEntity
private:
////////////////////////////////////////////////
// member varaibles
ContentHandlerT* contentHandler_;
LocatorAdaptor locator_;
//////////////////////////////////////////////////////
// COM interface -> C++ interface adaptors
class AttributesAdaptor : public AttributesT
{
public:
AttributesAdaptor(const XERCES_CPP_NAMESPACE::Attributes& attrs) : attributes_(attrs) { }
~AttributesAdaptor() { }
/////////////////////////
// indexed access
virtual int getLength() const
{
return attributes_.getLength();
} // getLength
virtual string_type getURI(unsigned int index) const
{
return XSA::makeStringT(attributes_.getURI(index));
} // getURI
virtual string_type getLocalName(unsigned int index) const
{
return XSA::makeStringT(attributes_.getLocalName(index));
} // getLocalName
virtual string_type getQName(unsigned int index) const
{
return XSA::makeStringT(attributes_.getQName(index));
} // getQName
virtual string_type getType(unsigned int index) const
{
return XSA::makeStringT(attributes_.getType(index));
} // getType
virtual string_type getValue(unsigned int index) const
{
return XSA::makeStringT(attributes_.getValue(index));
} // getValue
/////////////////////////
// name based query
virtual int getIndex(const string_type& uri, const string_type& localName) const
{
xerces_string_janitor<XMLCh> wUri(XSA::asXMLChString(uri));
xerces_string_janitor<XMLCh> wLocalName(XSA::asXMLChString(localName));
return attributes_.getIndex(wUri.get(), wLocalName.get());
} // getIndex
virtual int getIndex(const string_type& qName) const
{
xerces_string_janitor<XMLCh> wQName(XSA::asXMLChString(qName));
return attributes_.getIndex(wQName.get());
} // getIndex
virtual string_type getType(const string_type& uri, const string_type& localName) const
{
xerces_string_janitor<XMLCh> wUri(XSA::asXMLChString(uri));
xerces_string_janitor<XMLCh> wLocalName(XSA::asXMLChString(localName));
return XSA::makeStringT(attributes_.getType(wUri.get(), wLocalName.get()));
} // getType
virtual string_type getType(const string_type& qName) const
{
xerces_string_janitor<XMLCh> wQName(XSA::asXMLChString(qName));
return XSA::makeStringT(attributes_.getType(wQName.get()));
} // getType
virtual string_type getValue(const string_type& uri, const string_type& localName) const
{
xerces_string_janitor<XMLCh> wUri(XSA::asXMLChString(uri));
xerces_string_janitor<XMLCh> wLocalName(XSA::asXMLChString(localName));
return XSA::makeStringT(attributes_.getValue(wUri.get(), wLocalName.get()));
} // getValue
virtual string_type getValue(const string_type& qname) const
{
xerces_string_janitor<XMLCh> wQName(XSA::asXMLChString(qname));
return XSA::makeStringT(attributes_.getValue(wQName.get()));
} // getValue
private:
const XERCES_CPP_NAMESPACE::Attributes& attributes_;
AttributesAdaptor();
}; // class AttributesAdaptor
}; // class ContentHandlerAdaptor
class ErrorHandlerAdaptor : public XERCES_CPP_NAMESPACE::ErrorHandler
{
public:
ErrorHandlerAdaptor() : errorHandler_(0) { }
virtual ~ErrorHandlerAdaptor() { }
void setErrorHandler(ErrorHandlerT& handler) { errorHandler_ = &handler; }
ErrorHandlerT* getErrorHandler() const { return errorHandler_; }
virtual void warning(const XERCES_CPP_NAMESPACE::SAXParseException& exception)
{
handleError(exception, &ErrorHandlerT::warning);
} // warning
virtual void error(const XERCES_CPP_NAMESPACE::SAXParseException& exception)
{
handleError(exception, &ErrorHandlerT::error);
} // error
virtual void fatalError(const XERCES_CPP_NAMESPACE::SAXParseException& exception)
{
handleError(exception, &ErrorHandlerT::fatalError);
} // fatalError
virtual void resetErrors()
{
// no op
} // resetErrors
private:
typedef void(ErrorHandlerT::* ErrorFn)(const SAXParseExceptionT&);
void handleError(const XERCES_CPP_NAMESPACE::SAXParseException& exception, ErrorFn fn)
{
if(!errorHandler_)
return;
string_type errorMsg(XSA::makeStringT(exception.getMessage()));
string_type publicId(XSA::makeStringT(exception.getPublicId()));
string_type systemId(XSA::makeStringT(exception.getSystemId()));
SAXParseExceptionT sp(XSA::asStdString(errorMsg),
publicId,
systemId,
static_cast<size_t>(exception.getLineNumber()),
static_cast<size_t>(exception.getColumnNumber()));
(errorHandler_->*fn)(sp);
} // handleError
ErrorHandlerT* errorHandler_;
}; // class ErrorHandlerAdaptor
class LexicalHandlerAdaptor : public XERCES_CPP_NAMESPACE::LexicalHandler
{
public:
LexicalHandlerAdaptor() : lexicalHandler_(0) { }
virtual ~LexicalHandlerAdaptor() { }
void setLexicalHandler(LexicalHandlerT& handler) { lexicalHandler_ = &handler; }
LexicalHandlerT* getLexicalHandler() const { return lexicalHandler_; }
virtual void startDTD(const XMLCh* const name,
const XMLCh* const publicId,
const XMLCh* const systemId)
{
if(lexicalHandler_)
lexicalHandler_->startDTD(XSA::makeStringT(name),
XSA::makeStringT(publicId),
XSA::makeStringT(systemId));
} // startDTD
virtual void endDTD()
{
if(lexicalHandler_)
lexicalHandler_->endDTD();
} // endDTD
virtual void startEntity(const XMLCh* const name)
{
if(lexicalHandler_)
lexicalHandler_->startEntity(XSA::makeStringT(name));
} // startEntity
virtual void endEntity(const XMLCh* const name)
{
if(lexicalHandler_)
lexicalHandler_->endEntity(XSA::makeStringT(name));
} // endEntity
virtual void startCDATA()
{
if(lexicalHandler_)
lexicalHandler_->startCDATA();
} // startCDATA
virtual void endCDATA()
{
if(lexicalHandler_)
lexicalHandler_->endCDATA();
} // endCDATA
virtual void comment(const XMLCh* const chars, const XMLSize_t length)
{
if(lexicalHandler_)
lexicalHandler_->comment(XSA::makeStringT(chars, length));
} // comment
private:
LexicalHandlerT* lexicalHandler_;
}; // class LexicalHandlerAdaptor
class DeclHandlerAdaptor : public XERCES_CPP_NAMESPACE::DeclHandler
{
public:
DeclHandlerAdaptor() : declHandler_(0) { }
virtual ~DeclHandlerAdaptor() { }
void setDeclHandler(DeclHandlerT& handler) { declHandler_ = &handler; }
DeclHandlerT* getDeclHandler() const { return declHandler_; }
virtual void elementDecl(const XMLCh* const name,
const XMLCh* const model)
{
if(declHandler_)
declHandler_->elementDecl(XSA::makeStringT(name),
XSA::makeStringT(model));
} // elementDecl
virtual void attributeDecl(const XMLCh* const elementName,
const XMLCh* const attributeName,
const XMLCh* const type,
const XMLCh* const valueDefault,
const XMLCh* const value)
{
if(declHandler_)
{
const XMLCh* tmpValueDefault = valueDefault;
if (tmpValueDefault == XERCES_CPP_NAMESPACE::XMLUni::fgNullString)
tmpValueDefault = 0;
declHandler_->attributeDecl(XSA::makeStringT(elementName),
XSA::makeStringT(attributeName),
XSA::makeStringT(type),
XSA::makeStringT(tmpValueDefault),
XSA::makeStringT(value));
}
} // attributeDecl
virtual void internalEntityDecl(const XMLCh* const name,
const XMLCh* const value)
{
if(declHandler_)
declHandler_->internalEntityDecl(XSA::makeStringT(name),
XSA::makeStringT(value));
} // internalEntityDecl
virtual void externalEntityDecl(const XMLCh* const name,
const XMLCh* const publicId,
const XMLCh* const systemId)
{
if(declHandler_)
declHandler_->externalEntityDecl(XSA::makeStringT(name),
XSA::makeStringT(publicId),
XSA::makeStringT(systemId));
} // externalEntityDecl
private:
DeclHandlerT* declHandler_;
}; // class DeclHandlerAdaptor
class IStreamAdaptor : public XERCES_CPP_NAMESPACE::BinInputStream
{
public:
IStreamAdaptor(IStreamHandle istream)
: istream_(istream),
curPos_(0)
{ }
virtual ~IStreamAdaptor() { }
virtual XMLFilePos curPos() const
{
return curPos_;
} // curPos
virtual XMLSize_t readBytes(XMLByte* const toFill,
const XMLSize_t maxToRead)
{
istream_.get()->read(reinterpret_cast<char*>(toFill), maxToRead);
curPos_ += istream_.get()->gcount();
return static_cast<XMLSize_t>(istream_.get()->gcount());
} // readBytes
virtual const XMLCh* getContentType() const { return 0; }
private:
IStreamHandle istream_;
XMLFilePos curPos_;
}; // IStreamAdaptor
class InputSourceAdaptor : public XERCES_CPP_NAMESPACE::InputSource
{
public:
InputSourceAdaptor(const InputSourceT& source)
: inputSource_(source)
{
xerces_string_janitor<XMLCh> wSystemId(XSA::asXMLChString(source.getSystemId()));
xerces_string_janitor<XMLCh> wPublicId(XSA::asXMLChString(source.getPublicId()));
setSystemId(wSystemId.get());
setPublicId(wPublicId.get());
} // InputSourceAdaptor
virtual ~InputSourceAdaptor() { }
virtual XERCES_CPP_NAMESPACE::BinInputStream* makeStream() const
{
return new IStreamAdaptor(inputSource_.getByteStreamHandle());
} // makeStream
private:
// This is a local copy, so we do not rely on someone else keeping
// their InputSourceT around for us.
InputSourceT inputSource_;
}; // class InputSourceAdaptor
class XercesXMLPScanToken : public SAX::XMLPScanTokenParserImpl
{
public:
XERCES_CPP_NAMESPACE::XMLPScanToken token_;
};
/////////////////////////////////////////////
// Member variables
std::unique_ptr<XercesImpl::xerces_initializer> initializer_;
XERCES_CPP_NAMESPACE::SAX2XMLReader* xerces_;
ContentHandlerAdaptor contentHandlerAdaptor_;
EntityResolverAdaptor entityResolverAdaptor_;
DTDHandlerAdaptor dtdHandlerAdaptor_;
ErrorHandlerAdaptor errorHandlerAdaptor_;
LexicalHandlerAdaptor lexicalHandlerAdaptor_;
DeclHandlerAdaptor declHandlerAdaptor_;
Arabica::SAX::XercesPropertyNames<string_type, string_adaptor> properties_;
// Property values to return by reference
string_type externalSchemaLocation_;
string_type externalNoNamespaceSchemaLocation_;
}; // class xerces_wrapper
#ifdef ARABICA_NO_WCHAR_T
template<class string_type, class T0, class T1>
std::unique_ptr<XERCES_CPP_NAMESPACE::XMLTranscoder> xerces_wrapper<string_type, T0, T1>::xerces_string_adaptor::transcoder_;
#endif
template<class string_type, class T0, class T1>
xerces_wrapper<string_type, T0, T1>::xerces_wrapper()
{
try
{
initializer_.reset(new XercesImpl::xerces_initializer());
#ifdef ARABICA_NO_WCHAR_T
xerces_string_adaptor::kickoff();
#endif
}
catch(const XERCES_CPP_NAMESPACE::XMLException& toCatch)
{
string_type s = XSA::makeStringT(toCatch.getMessage());
throw SAX::SAXException(XSA::asStdString(s));
} // catch
xerces_ = XERCES_CPP_NAMESPACE::XMLReaderFactory::createXMLReader();
xerces_->setContentHandler(&contentHandlerAdaptor_);
xerces_->setEntityResolver(&entityResolverAdaptor_);
xerces_->setDTDHandler(&dtdHandlerAdaptor_);
xerces_->setErrorHandler(&errorHandlerAdaptor_);
xerces_->setLexicalHandler(&lexicalHandlerAdaptor_);
xerces_->setDeclarationHandler(&declHandlerAdaptor_);
} // xerces_wrapper
template<class string_type, class T0, class T1>
xerces_wrapper<string_type, T0, T1>::~xerces_wrapper()
{
#ifdef ARABICA_NO_WCHAR_T
xerces_string_adaptor::shutdown();
#endif
delete xerces_;
} // ~xerces_wrapper
template<class string_type, class T0, class T1>
bool xerces_wrapper<string_type, T0, T1>::getFeature(const string_type& name) const
{
try
{
xerces_string_janitor<XMLCh> wName(XSA::asXMLChString(name));
return xerces_->getFeature(wName.get());
} // try
catch(XERCES_CPP_NAMESPACE::SAXNotSupportedException& e)
{
throw SAX::SAXNotSupportedException(XSA::asStdString(XSA::makeStringT(e.getMessage())));
} // catch(SAXNotSupportedException& e)
catch(XERCES_CPP_NAMESPACE::SAXNotRecognizedException& e)
{
throw SAX::SAXNotRecognizedException(XSA::asStdString(XSA::makeStringT(e.getMessage())));
} // catch(SAXNotRecognizedException& e)
} // getFeature
template<class string_type, class T0, class T1>
void xerces_wrapper<string_type, T0, T1>::setFeature(const string_type& name, bool value)
{
try
{
xerces_string_janitor<XMLCh> wName(XSA::asXMLChString(name));
xerces_->setFeature(wName.get(), value);
} // try
catch(XERCES_CPP_NAMESPACE::SAXNotSupportedException& e)
{
throw SAX::SAXNotSupportedException(XSA::asStdString(XSA::makeStringT(e.getMessage())));
} // catch(SAXNotSupportedException& e)
catch(XERCES_CPP_NAMESPACE::SAXNotRecognizedException& e)
{
throw SAX::SAXNotRecognizedException(XSA::asStdString(XSA::makeStringT(e.getMessage())));
} // catch(SAXNotRecognizedException& e)
} // setFeature
template<class string_type, class T0, class T1>
void xerces_wrapper<string_type, T0, T1>::parse(InputSourceT& source)
{
// if no stream is open, let Xerces deal with it
if(source.getByteStream() == 0)
xerces_->parse(XSA::asStdString(source.getSystemId()).c_str());
else
{
// we have to wrap everything up in a Xerces friendly way
InputSourceAdaptor isAdaptor(source);
xerces_->parse(isAdaptor);
} // if ...
} // parse
template<class string_type, class T0, class T1>
bool xerces_wrapper<string_type,
T0, T1>::parseFirst(InputSourceT& input,
XMLPScanToken& toFill)
{
auto newToken = std::make_unique<XercesXMLPScanToken>();
// To store the result from Xerces parseFirst().
bool result = false;
if (input.getByteStream() == 0)
{
// We can just pass the systemID to parseFirst and let Xerces open the
// stream.
const char* systemID = XSA::asStdString(input.getSystemId()).c_str();
result = xerces_->parseFirst(systemID, newToken->token_);
}
else
{
// We need to wrap input in an InputSourceAdaptor.
// isAdaptor can be a local variable because Xerces has to open any streams
// within the parseFirst() call, so it should not need the
// InputSourceAdaptor to hang around.
InputSourceAdaptor isAdaptor(input);
result = xerces_->parseFirst(isAdaptor, newToken->token_);
}
if (result) {
// We need to explicitly convert to unique_ptr<base class>.
std::unique_ptr<XMLPScanTokenParserImpl> toSet(newToken.release());
toFill.setParserData(std::move(toSet));
}
return result;
} // parseFirst
template<class string_type, class T0, class T1>
bool xerces_wrapper<string_type, T0, T1>::parseNext(XMLPScanToken& token)
{
// Extract the XercesXMLPScanToken from within token.
XercesXMLPScanToken* xercesToken =
dynamic_cast<XercesXMLPScanToken*>(token.parserImpl());
if (xercesToken == 0)
{
// If it failed to cast, we can simply refuse to parse, because this call
// clearly isn't following a successful parseFirst().
return false;
}
else
{
// Otherwise, just pass the token to Xerces.
return xerces_->parseNext(xercesToken->token_);
}
} // parseNext
template<class string_type, class T0, class T1>
void xerces_wrapper<string_type, T0, T1>::parseReset(XMLPScanToken& token)
{
// Extract the XercesXMLPScanToken from within token.
XercesXMLPScanToken* xercesToken =
dynamic_cast<XercesXMLPScanToken*>(token.parserImpl());
// If it failed to cast, we can simply ignore it, because this call clearly
// isn't following a successful parseFirst().
if (xercesToken != 0)
{
xerces_->parseReset(xercesToken->token_);
}
} // parseReset
} // namespace SAX
} // namespace Arabica
#endif
// end of file