// arabica/include/SAX/wrappers/saxmsxml2.hpp
#ifndef ARABICA_SAX_MSXML2_H
#define ARABICA_SAX_MSXML2_H
2002-06-21 13:16:28 +02:00
//---------------------------------------------------------------------------
// A SAX2 wrapper class for MSXML component.
//---------------------------------------------------------------------------
2007-09-05 00:55:47 +02:00
#include <SAX/ArabicaConfig.hpp>
#include <SAX/XMLReader.hpp>
#include <SAX/InputSource.hpp>
#include <SAX/SAXParseException.hpp>
#include <SAX/SAXNotRecognizedException.hpp>
#include <SAX/SAXNotSupportedException.hpp>
#include <SAX/helpers/PropertyNames.hpp>
#include <Arabica/StringAdaptor.hpp>
#include <iostream>
#include <Arabica/getparam.hpp>
// Include the MSXML definitions.
#include <msxml2.h>
2002-06-21 13:16:28 +02:00
//
// Declare the 'smart pointer' type to simplify COM handling.
#include <comdef.h>
_COM_SMARTPTR_TYPEDEF(ISAXXMLReader, __uuidof(ISAXXMLReader));
2002-06-21 13:16:28 +02:00
2007-09-05 11:49:18 +02:00
namespace Arabica
{
2002-06-21 13:16:28 +02:00
namespace SAX
{
// Tag base class for the COM initializer policies below; msxml2_wrapper
// hands it to Arabica::get_param to pick its COMInitializer_type.
struct COMInitializer_tag
{
};
2002-06-21 13:16:28 +02:00
/**
* use this as COMInitializer_type if you call
* CoInitialize/CoInitializeEx in your own code
*/
class COMExternalInitializer : public COMInitializer_tag
2002-06-21 13:16:28 +02:00
{
public:
COMExternalInitializer() { }
~COMExternalInitializer() { }
}; // COMExternalInitializer
class COMSingleThreadInitializer : public COMInitializer_tag
2002-06-21 13:16:28 +02:00
{
public:
COMSingleThreadInitializer() { ::CoInitialize(NULL); }
2002-06-21 13:16:28 +02:00
~COMSingleThreadInitializer() { ::CoUninitialize(); }
}; // COMSingleThreadInitializer
#if(_WIN32_WINNT >= 0x0400 ) || defined(_WIN32_DCOM)
/**
 * COM initializer policy which calls
 * CoInitializeEx(NULL, COINIT_MULTITHREADED) on construction and balances
 * it with CoUninitialize() on destruction.
 *
 * CoUninitialize() is only issued when the initialization call succeeded
 * (S_OK or S_FALSE); a failed CoInitializeEx must not be balanced.
 */
class COMMultiThreadInitializer : public COMInitializer_tag
{
public:
  COMMultiThreadInitializer() :
    initialized_(SUCCEEDED(::CoInitializeEx(NULL, COINIT_MULTITHREADED)))
  {
  }

  ~COMMultiThreadInitializer()
  {
    if(initialized_)
      ::CoUninitialize();
  }

private:
  bool initialized_;   // true when this object owes a CoUninitialize call
}; // COMMultiThreadInitializer
#endif
template<class string_type,
class T0 = Arabica::nil_t,
class T1 = Arabica::nil_t>
class msxml2_wrapper : public SAX::XMLReaderInterface<string_type, T0, T1>
2002-06-21 13:16:28 +02:00
{
2005-11-17 23:06:12 +01:00
public:
typedef SAX::XMLReaderInterface<string_type, T0, T1> XMLReaderT;
typedef typename XMLReaderT::string_adaptor string_adaptor;
typedef typename Arabica::get_param<COMInitializer_tag,
COMSingleThreadInitializer,
T1,
T0>::type COMInitializer_type;
typedef SAX::EntityResolver<string_type, string_adaptor> entityResolverT;
typedef SAX::DTDHandler<string_type, string_adaptor> dtdHandlerT;
typedef SAX::ContentHandler<string_type, string_adaptor> contentHandlerT;
typedef SAX::DeclHandler<string_type, string_adaptor> declHandlerT;
typedef SAX::LexicalHandler<string_type, string_adaptor> lexicalHandlerT;
typedef SAX::InputSource<string_type, string_adaptor> inputSourceT;
typedef SAX::Locator<string_type, string_adaptor> locatorT;
typedef SAX::ErrorHandler<string_type, string_adaptor> errorHandlerT;
typedef SAX::Attributes<string_type, string_adaptor> attributesT;
2002-06-21 13:16:28 +02:00
msxml2_wrapper();
virtual ~msxml2_wrapper();
2002-06-21 13:16:28 +02:00
/////////////////////////////////////////////////
// Configuration
virtual bool getFeature(const string_type& name) const;
virtual void setFeature(const string_type& name, bool value);
2002-06-21 13:16:28 +02:00
/////////////////////////////////////////////////
// Event Handlers
/* MSXML does not use EntityResolver currently, so the resolver passed in
   is ignored and no resolver is ever reported back */
virtual void setEntityResolver(entityResolverT& resolver)
{
}
virtual entityResolverT* getEntityResolver() const
{
  return 0;
}

// The remaining handlers are simply forwarded to the matching adaptor
// member, which stores a pointer to the handler.
virtual void setDTDHandler(dtdHandlerT& handler)
{
  dtdHandler_.setDTDHandler(handler);
}
virtual dtdHandlerT* getDTDHandler() const
{
  return dtdHandler_.getDTDHandler();
}

virtual void setContentHandler(contentHandlerT& handler)
{
  contentHandler_.setContentHandler(handler);
}
virtual contentHandlerT* getContentHandler() const
{
  return contentHandler_.getContentHandler();
}

virtual void setErrorHandler(errorHandlerT& handler);
virtual errorHandlerT* getErrorHandler() const
{
  return errorHandler_.getErrorHandler();
}

virtual void setDeclHandler(declHandlerT& handler)
{
  declHandler_.setDeclHandler(handler);
}
virtual declHandlerT* getDeclHandler() const
{
  return declHandler_.getDeclHandler();
}

virtual void setLexicalHandler(lexicalHandlerT& handler)
{
  lexicalHandler_.setLexicalHandler(handler);
}
virtual lexicalHandlerT* getLexicalHandler() const
{
  return lexicalHandler_.getLexicalHandler();
}
2002-06-21 13:16:28 +02:00
//////////////////////////////////////////////////
// Parsing
virtual void parse(inputSourceT& input);
2002-06-21 13:16:28 +02:00
protected:
virtual std::auto_ptr<typename XMLReaderT::PropertyBase> doGetProperty(const string_type& name)
{
if(name == properties_.lexicalHandler)
{
Property<lexicalHandlerT*>* prop = new Property<lexicalHandlerT*>(lexicalHandler_.getLexicalHandler());
return std::auto_ptr<XMLReaderT::PropertyBase>(prop);
}
if(name == properties_.declHandler)
{
Property<declHandlerT*>* prop = new Property<declHandlerT*>(declHandler_.getDeclHandler());
return std::auto_ptr<XMLReaderT::PropertyBase>(prop);
}
throw SAX::SAXNotRecognizedException("Property not recognized ");
} // doGetProperty
virtual void doSetProperty(const string_type& name, std::auto_ptr<typename XMLReaderT::PropertyBase> value)
{
if(name == properties_.lexicalHandler)
{
Property<lexicalHandlerT&>* prop = dynamic_cast<Property<lexicalHandlerT&>*>(value.get());
if(!prop)
throw std::runtime_error("bad_cast: Property LexicalHandler is wrong type, should be SAX::LexicalHandler&");
lexicalHandler_.setLexicalHandler(prop->get());
return;
} // if ...
if(name == properties_.declHandler)
{
Property<declHandlerT&>* prop = dynamic_cast<Property<declHandlerT&>*>(value.get());
if(!prop)
throw std::runtime_error("bad_cast: Property DeclHandler is wrong type, should be SAX::DeclHandler&");
declHandler_.setDeclHandler(prop->get());
return;
} // if ...
throw SAX::SAXNotRecognizedException("Property not recognized ");
} // doSetProperty
2002-06-21 13:16:28 +02:00
private:
//////////////////////////////////////////////////////
// COM interface -> C++ interface adaptors
class LocatorAdaptor : public locatorT
2002-06-21 13:16:28 +02:00
{
public:
LocatorAdaptor() : locator_(0) { }
LocatorAdaptor(ISAXLocator __RPC_FAR* locator) : locator_(0) { setLocator(locator); }
2002-06-21 13:16:28 +02:00
~LocatorAdaptor() { setLocator(0); }
string_type getPublicId() const
2002-06-21 13:16:28 +02:00
{
if(!locator_)
return string_type();
2002-06-21 13:16:28 +02:00
const wchar_t* pwchPublicId;
locator_->getPublicId(&pwchPublicId);
string_type publicId(string_adaptor::construct_from_utf16(pwchPublicId));
2002-06-21 13:16:28 +02:00
return publicId;
} // getPublicId
string_type getSystemId() const
2002-06-21 13:16:28 +02:00
{
if(!locator_)
return string_type();
2002-06-21 13:16:28 +02:00
const wchar_t* pwchSystemId;
locator_->getSystemId(&pwchSystemId);
string_type systemId(string_adaptor::construct_from_utf16(pwchSystemId));
2002-06-21 13:16:28 +02:00
return systemId;
} // getSystemId
int getLineNumber() const
{
if(!locator_)
return -1;
int lineNumber;
locator_->getLineNumber(&lineNumber);
2002-06-21 13:16:28 +02:00
return lineNumber;
} // getLineNumber
int getColumnNumber() const
2002-06-21 13:16:28 +02:00
{
if(!locator_)
return -1;
int columnNumber;
locator_->getColumnNumber(&columnNumber);
2002-06-21 13:16:28 +02:00
return columnNumber;
} // getColumnNumber
void setLocator(ISAXLocator __RPC_FAR* locator)
2002-06-21 13:16:28 +02:00
{
locator_ = locator;
// no need to AddRef or Release as the ISAXLocator points to the MSXML instance
// and we'll clean that up properly anyway
2002-06-21 13:16:28 +02:00
} // setLocator
private:
ISAXLocator __RPC_FAR *locator_;
2002-06-21 13:16:28 +02:00
}; // class LocatorAdaptor
class DTDHandlerAdaptor : public ISAXDTDHandler
2002-06-21 13:16:28 +02:00
{
public:
DTDHandlerAdaptor() : dtdHandler_(0) { }
~DTDHandlerAdaptor() { }
void setDTDHandler(dtdHandlerT& handler) { dtdHandler_ = &handler; }
dtdHandlerT* getDTDHandler() const { return dtdHandler_; }
2002-06-21 13:16:28 +02:00
virtual HRESULT STDMETHODCALLTYPE notationDecl(
/* [in] */ const wchar_t *pwchName,
/* [in] */ int cchName,
/* [in] */ const wchar_t *pwchPublicId,
/* [in] */ int cchPublicId,
/* [in] */ const wchar_t *pwchSystemId,
/* [in] */ int cchSystemId)
2002-06-21 13:16:28 +02:00
{
if(dtdHandler_)
dtdHandler_->notationDecl(string_adaptor::construct_from_utf16(pwchName, cchName),
string_adaptor::construct_from_utf16(pwchPublicId, cchPublicId),
string_adaptor::construct_from_utf16(pwchSystemId, cchSystemId));
2002-06-21 13:16:28 +02:00
return S_OK;
} // notationDecl
virtual HRESULT STDMETHODCALLTYPE unparsedEntityDecl(
/* [in] */ const wchar_t *pwchName,
/* [in] */ int cchName,
/* [in] */ const wchar_t *pwchPublicId,
/* [in] */ int cchPublicId,
/* [in] */ const wchar_t *pwchSystemId,
/* [in] */ int cchSystemId,
/* [in] */ const wchar_t *pwchNotationName,
/* [in] */ int cchNotationName)
{
2002-06-21 13:16:28 +02:00
if(dtdHandler_)
dtdHandler_->unparsedEntityDecl(string_adaptor::construct_from_utf16(pwchName, cchName),
string_adaptor::construct_from_utf16(pwchPublicId, cchPublicId),
string_adaptor::construct_from_utf16(pwchSystemId, cchSystemId),
string_adaptor::construct_from_utf16(pwchNotationName, cchNotationName));
2002-06-21 13:16:28 +02:00
return S_OK;
} // unparsedEntityDecl
// satify COM interface even if we're not a COM object
long __stdcall QueryInterface(const struct _GUID &riid,void **ppvObject) { return 0; }
unsigned long __stdcall AddRef() { return 0; }
unsigned long __stdcall Release() { return 0; }
private:
dtdHandlerT* dtdHandler_;
2002-06-21 13:16:28 +02:00
}; // class DTDHandlerAdaptor
class ContentHandlerAdaptor : public ISAXContentHandler
2002-06-21 13:16:28 +02:00
{
public:
ContentHandlerAdaptor() : contentHandler_(0) { }
~ContentHandlerAdaptor() { }
void setContentHandler(contentHandlerT& handler) { contentHandler_ = &handler; }
contentHandlerT* getContentHandler() const { return contentHandler_; }
2002-06-21 13:16:28 +02:00
virtual HRESULT STDMETHODCALLTYPE putDocumentLocator(
/* [in] */ ISAXLocator *pLocator)
2002-06-21 13:16:28 +02:00
{
locator_.setLocator(pLocator);
if(contentHandler_) contentHandler_->setDocumentLocator(locator_);
return S_OK;
} // putDocumentLocation
virtual HRESULT STDMETHODCALLTYPE startDocument( void)
2002-06-21 13:16:28 +02:00
{
if(contentHandler_) contentHandler_->startDocument();
return S_OK;
} // startDocument
virtual HRESULT STDMETHODCALLTYPE endDocument( void)
2002-06-21 13:16:28 +02:00
{
if(contentHandler_) contentHandler_->endDocument();
return S_OK;
} // endDocument
virtual HRESULT STDMETHODCALLTYPE startPrefixMapping(
/* [in] */ const wchar_t *pwchPrefix,
/* [in] */ int cchPrefix,
/* [in] */ const wchar_t *pwchUri,
/* [in] */ int cchUri)
2002-06-21 13:16:28 +02:00
{
2002-06-21 13:16:28 +02:00
if(contentHandler_)
contentHandler_->startPrefixMapping(string_adaptor::construct_from_utf16(pwchPrefix, cchPrefix),
string_adaptor::construct_from_utf16(pwchUri, cchUri));
2002-06-21 13:16:28 +02:00
return S_OK;
} // startPrefixMapping
virtual HRESULT STDMETHODCALLTYPE endPrefixMapping(
/* [in] */ const wchar_t *pwchPrefix,
/* [in] */ int cchPrefix)
2002-06-21 13:16:28 +02:00
{
if(contentHandler_) contentHandler_->endPrefixMapping(string_adaptor::construct_from_utf16(pwchPrefix, cchPrefix));
2002-06-21 13:16:28 +02:00
return S_OK;
} // endPrefixMapping
virtual HRESULT STDMETHODCALLTYPE startElement(
/* [in] */ const wchar_t *pwchNamespaceUri,
/* [in] */ int cchNamespaceUri,
/* [in] */ const wchar_t *pwchLocalName,
/* [in] */ int cchLocalName,
/* [in] */ const wchar_t *pwchQName,
/* [in] */ int cchQName,
/* [in] */ ISAXAttributes *pAttributes)
2002-06-21 13:16:28 +02:00
{
if(contentHandler_)
{
AttributesAdaptor attrs(pAttributes);
contentHandler_->startElement(string_adaptor::construct_from_utf16(pwchNamespaceUri, cchNamespaceUri),
string_adaptor::construct_from_utf16(pwchLocalName, cchLocalName),
string_adaptor::construct_from_utf16(pwchQName, cchQName),
2002-06-21 13:16:28 +02:00
attrs);
} // if ...
return S_OK;
} // startElement
virtual HRESULT STDMETHODCALLTYPE endElement(
/* [in] */ const wchar_t *pwchNamespaceUri,
/* [in] */ int cchNamespaceUri,
/* [in] */ const wchar_t *pwchLocalName,
/* [in] */ int cchLocalName,
/* [in] */ const wchar_t *pwchQName,
/* [in] */ int cchQName)
2002-06-21 13:16:28 +02:00
{
if(contentHandler_)
contentHandler_->endElement(string_adaptor::construct_from_utf16(pwchNamespaceUri, cchNamespaceUri),
string_adaptor::construct_from_utf16(pwchLocalName, cchLocalName),
string_adaptor::construct_from_utf16(pwchQName, cchQName));
2002-06-21 13:16:28 +02:00
return S_OK;
} // endElement
virtual HRESULT STDMETHODCALLTYPE characters(
/* [in] */ const wchar_t *pwchChars,
/* [in] */ int cchChars)
2002-06-21 13:16:28 +02:00
{
if(contentHandler_) contentHandler_->characters(string_adaptor::construct_from_utf16(pwchChars, cchChars));
2002-06-21 13:16:28 +02:00
return S_OK;
} // characters
virtual HRESULT STDMETHODCALLTYPE ignorableWhitespace(
/* [in] */ const wchar_t *pwchChars,
/* [in] */ int cchChars)
2002-06-21 13:16:28 +02:00
{
if(contentHandler_)
contentHandler_->ignorableWhitespace(string_adaptor::construct_from_utf16(pwchChars, cchChars));
2002-06-21 13:16:28 +02:00
return S_OK;
} // ignorableWhitespace
virtual HRESULT STDMETHODCALLTYPE processingInstruction(
/* [in] */ const wchar_t *pwchTarget,
/* [in] */ int cchTarget,
/* [in] */ const wchar_t *pwchData,
/* [in] */ int cchData)
2002-06-21 13:16:28 +02:00
{
if(contentHandler_)
contentHandler_->processingInstruction(string_adaptor::construct_from_utf16(pwchTarget, cchTarget),
string_adaptor::construct_from_utf16(pwchData, cchData));
2002-06-21 13:16:28 +02:00
return S_OK;
} // processingInstruction
virtual HRESULT STDMETHODCALLTYPE skippedEntity(
/* [in] */ const wchar_t *pwchName,
/* [in] */ int cchName)
2002-06-21 13:16:28 +02:00
{
if(contentHandler_)
contentHandler_->skippedEntity(string_adaptor::construct_from_utf16(pwchName, cchName));
2002-06-21 13:16:28 +02:00
return S_OK;
} // skippedEntity
// satisfy COM interface even if we're not a COM object
long __stdcall QueryInterface(const struct _GUID &riid,void **ppvObject) { return 0; }
unsigned long __stdcall AddRef() { return 0; }
unsigned long __stdcall Release() { return 0; }
private:
////////////////////////////////////////////////
// member varaibles
contentHandlerT* contentHandler_;
2002-06-21 13:16:28 +02:00
LocatorAdaptor locator_;
//////////////////////////////////////////////////////
// COM interface -> C++ interface adaptors
class AttributesAdaptor : public attributesT
2002-06-21 13:16:28 +02:00
{
public:
AttributesAdaptor(ISAXAttributes __RPC_FAR *pAttributes) : attributes_(pAttributes) { }
2002-06-21 13:16:28 +02:00
~AttributesAdaptor() { }
/////////////////////////
// indexed access
2002-06-21 13:16:28 +02:00
virtual int getLength() const
{
int length;
attributes_->getLength(&length);
2002-06-21 13:16:28 +02:00
return length;
} // getLength
virtual string_type getURI(unsigned int index) const
2002-06-21 13:16:28 +02:00
{
const wchar_t* pwchUri;
2002-06-21 13:16:28 +02:00
int cchUri;
HRESULT hr = attributes_->getURI(index, &pwchUri, &cchUri);
2002-06-21 13:16:28 +02:00
if (FAILED(hr))
return string_type();
string_type uri(string_adaptor::construct_from_utf16(pwchUri, cchUri));
2002-06-21 13:16:28 +02:00
return uri;
} // getURI
virtual string_type getLocalName(unsigned int index) const
2002-06-21 13:16:28 +02:00
{
const wchar_t* pwchLocalName;
2002-06-21 13:16:28 +02:00
int cchLocalName;
HRESULT hr = attributes_->getLocalName(index, &pwchLocalName, &cchLocalName);
2002-06-21 13:16:28 +02:00
if (FAILED(hr))
return string_type();
string_type localName(string_adaptor::construct_from_utf16(pwchLocalName, cchLocalName));
return localName;
2002-06-21 13:16:28 +02:00
} // getLocalName
virtual string_type getQName(unsigned int index) const
2002-06-21 13:16:28 +02:00
{
const wchar_t* pwchQName;
2002-06-21 13:16:28 +02:00
int cchQName;
HRESULT hr = attributes_->getQName(index, &pwchQName, &cchQName);
2002-06-21 13:16:28 +02:00
if (FAILED(hr))
return string_type();
string_type qName(string_adaptor::construct_from_utf16(pwchQName, cchQName));
2002-06-21 13:16:28 +02:00
return qName;
} // getQName
virtual string_type getType(unsigned int index) const
2002-06-21 13:16:28 +02:00
{
const wchar_t* pwchType;
2002-06-21 13:16:28 +02:00
int cchType;
HRESULT hr = attributes_->getType(index, &pwchType, &cchType);
2002-06-21 13:16:28 +02:00
if (FAILED(hr))
return string_type();
string_type type(string_adaptor::construct_from_utf16(pwchType, cchType));
2002-06-21 13:16:28 +02:00
return type;
} // getType
virtual string_type getValue(unsigned int index) const
2002-06-21 13:16:28 +02:00
{
const wchar_t* pwchValue;
2002-06-21 13:16:28 +02:00
int cchValue;
HRESULT hr = attributes_->getValue(index, &pwchValue, &cchValue);
2002-06-21 13:16:28 +02:00
if (FAILED(hr))
return string_type();
string_type value(string_adaptor::construct_from_utf16(pwchValue, cchValue));
2002-06-21 13:16:28 +02:00
return value;
} // getValue
/////////////////////////
// name based query
virtual int getIndex(const string_type& uri, const string_type& localName) const
2002-06-21 13:16:28 +02:00
{
int index = -1;
std::wstring wUri(string_adaptor::asStdWString(uri));
std::wstring wLocalName(string_adaptor::asStdWString(localName));
2003-08-27 16:28:01 +02:00
HRESULT hr = attributes_->getIndexFromName(wUri.data(), static_cast<int>(wUri.length()),
wLocalName.data(), static_cast<int>(wLocalName.length()),
2002-06-21 13:16:28 +02:00
&index);
return index;
} // getIndex
virtual int getIndex(const string_type& qName) const
2002-06-21 13:16:28 +02:00
{
int index = -1;
std::wstring wQName(string_adaptor::asStdWString(qName));
2003-08-27 16:28:01 +02:00
attributes_->getIndexFromQName(wQName.data(), static_cast<int>(wQName.length()), &index);
return index;
2002-06-21 13:16:28 +02:00
} // getIndex
virtual string_type getType(const string_type& uri, const string_type& localName) const
2002-06-21 13:16:28 +02:00
{
const wchar_t* pwchType;
2002-06-21 13:16:28 +02:00
int cchType;
std::wstring wUri(string_adaptor::asStdWString(uri));
std::wstring wLocalName(string_adaptor::asStdWString(localName));
2003-08-27 16:28:01 +02:00
HRESULT hr = attributes_->getTypeFromName(wUri.data(), static_cast<int>(wUri.length()),
wLocalName.data(), static_cast<int>(wLocalName.length()),
2002-06-21 13:16:28 +02:00
&pwchType, &cchType);
if (FAILED(hr))
return string_type();
string_type type(string_adaptor::construct_from_utf16(pwchType, cchType));
2002-06-21 13:16:28 +02:00
return type;
} // getType
virtual string_type getType(const string_type& qName) const
2002-06-21 13:16:28 +02:00
{
const wchar_t* pwchType;
2002-06-21 13:16:28 +02:00
int cchType;
std::wstring wQName(string_adaptor::asStdWString(qName));
2003-08-27 16:28:01 +02:00
HRESULT hr = attributes_->getTypeFromQName(wQName.data(), static_cast<int>(wQName.length()),
2002-06-21 13:16:28 +02:00
&pwchType, &cchType);
if (FAILED(hr))
return string_type();
string_type type(string_adaptor::construct_from_utf16(pwchType, cchType));
2002-06-21 13:16:28 +02:00
return type;
} // getType
virtual string_type getValue(const string_type& uri, const string_type& localName) const
2002-06-21 13:16:28 +02:00
{
const wchar_t* pwchValue;
2002-06-21 13:16:28 +02:00
int cchValue;
std::wstring wUri(string_adaptor::asStdWString(uri));
std::wstring wLocalName(string_adaptor::asStdWString(localName));
2003-08-27 16:28:01 +02:00
HRESULT hr = attributes_->getValueFromName(wUri.data(), static_cast<int>(wUri.length()),
wLocalName.data(), static_cast<int>(wLocalName.length()),
2002-06-21 13:16:28 +02:00
&pwchValue, &cchValue);
if (FAILED(hr))
return string_type();
string_type value(string_adaptor::construct_from_utf16(pwchValue, cchValue));
2002-06-21 13:16:28 +02:00
return value;
} // getValue
virtual string_type getValue(const string_type& qname) const
2002-06-21 13:16:28 +02:00
{
const wchar_t* pwchValue;
2002-06-21 13:16:28 +02:00
int cchValue;
std::wstring wQName(string_adaptor::asStdWString(qname));
2003-08-27 16:28:01 +02:00
HRESULT hr = attributes_->getValueFromQName(wQName.data(), static_cast<int>(wQName.length()),
2002-06-21 13:16:28 +02:00
&pwchValue, &cchValue);
if (FAILED(hr))
return string_type();
string_type value(string_adaptor::construct_from_utf16(pwchValue, cchValue));
2002-06-21 13:16:28 +02:00
return value;
} // getValue
private:
ISAXAttributes __RPC_FAR *attributes_;
2002-06-21 13:16:28 +02:00
AttributesAdaptor();
}; // class AttributesAdaptor
}; // class ContentHandlerAdaptor
class ErrorHandlerAdaptor : public ISAXErrorHandler
2002-06-21 13:16:28 +02:00
{
public:
ErrorHandlerAdaptor() : errorHandler_(0),
bWarning_(false), bError_(false), bFatal_(false),
eWarning_("none"), eError_("none"), eFatal_("none")
{ }
2002-06-21 13:16:28 +02:00
virtual ~ErrorHandlerAdaptor() { }
void setErrorHandler(errorHandlerT& handler) { errorHandler_ = &handler; }
errorHandlerT* getErrorHandler() const { return errorHandler_; }
2002-06-21 13:16:28 +02:00
virtual HRESULT STDMETHODCALLTYPE error(
/* [in] */ ISAXLocator *pLocator,
/* [in] */ const wchar_t *pwchErrorMessage,
/* [in] */ HRESULT hrErrorCode)
2002-06-21 13:16:28 +02:00
{
bError_ = true;
string_type errorMsg(string_adaptor::construct_from_utf16(pwchErrorMessage));
eError_ = SAXParseExceptionT(string_adaptor::asStdString(errorMsg), LocatorAdaptor(pLocator));
2002-06-21 13:16:28 +02:00
return S_OK;
} // error
virtual HRESULT STDMETHODCALLTYPE fatalError(
/* [in] */ ISAXLocator *pLocator,
/* [in] */ const wchar_t *pwchErrorMessage,
/* [in] */ HRESULT hrErrorCode)
2002-06-21 13:16:28 +02:00
{
bFatal_ = true;
string_type errorMsg(string_adaptor::construct_from_utf16(pwchErrorMessage));
eFatal_ = SAXParseExceptionT(string_adaptor::asStdString(errorMsg), LocatorAdaptor(pLocator));
return S_FALSE;
2002-06-21 13:16:28 +02:00
} // fatalError
virtual HRESULT STDMETHODCALLTYPE ignorableWarning(
/* [in] */ ISAXLocator *pLocator,
/* [in] */ const wchar_t *pwchErrorMessage,
/* [in] */ HRESULT hrErrorCode)
2002-06-21 13:16:28 +02:00
{
bWarning_ = true;
string_type errorMsg(string_adaptor::construct_from_utf16(pwchErrorMessage));
eWarning_ = SAXParseExceptionT(string_adaptor::asStdString(errorMsg), LocatorAdaptor(pLocator));
return S_OK;
2002-06-21 13:16:28 +02:00
} // ignorableWarning
void report()
{
if(!errorHandler_)
return;
bool bWarning = bWarning_;
bool bError = bError_;
bool bFatal = bFatal_;
bWarning_ = bError_ = bFatal_ = false;
if(bFatal)
errorHandler_->fatalError(eFatal_);
if(bError)
errorHandler_->error(eError_);
if(bWarning)
errorHandler_->warning(eWarning_);
} // report
2002-06-21 13:16:28 +02:00
// satisfy COM interface even if we're not a COM object
long __stdcall QueryInterface(const struct _GUID &riid,void **ppvObject) { return 0; }
unsigned long __stdcall AddRef() { return 0; }
unsigned long __stdcall Release() { return 0; }
private:
typedef SAX::SAXParseException<string_type, string_adaptor> SAXParseExceptionT;
bool bWarning_;
bool bError_;
bool bFatal_;
SAXParseExceptionT eWarning_;
SAXParseExceptionT eError_;
SAXParseExceptionT eFatal_;
errorHandlerT* errorHandler_;
2002-06-21 13:16:28 +02:00
}; // class ErrorHandlerAdaptor
class LexicalHandlerAdaptor : public ISAXLexicalHandler
2002-06-21 13:16:28 +02:00
{
public:
LexicalHandlerAdaptor() : lexicalHandler_(0) { }
virtual ~LexicalHandlerAdaptor() { }
void setLexicalHandler(lexicalHandlerT& handler) { lexicalHandler_ = &handler; }
lexicalHandlerT* getLexicalHandler() const { return lexicalHandler_; }
2002-06-21 13:16:28 +02:00
virtual HRESULT STDMETHODCALLTYPE startDTD(
/* [in] */ const wchar_t *pwchName,
/* [in] */ int cchName,
/* [in] */ const wchar_t *pwchPublicId,
/* [in] */ int cchPublicId,
/* [in] */ const wchar_t *pwchSystemId,
/* [in] */ int cchSystemId)
2002-06-21 13:16:28 +02:00
{
if(lexicalHandler_)
lexicalHandler_->startDTD(string_adaptor::construct_from_utf16(pwchName, cchName),
string_adaptor::construct_from_utf16(pwchPublicId, cchPublicId),
string_adaptor::construct_from_utf16(pwchSystemId, cchSystemId));
2002-06-21 13:16:28 +02:00
return S_OK;
} // startDTD
virtual HRESULT STDMETHODCALLTYPE endDTD( void)
2002-06-21 13:16:28 +02:00
{
if(lexicalHandler_)
lexicalHandler_->endDTD();
return S_OK;
} // endDTD
virtual HRESULT STDMETHODCALLTYPE startEntity(
/* [in] */ const wchar_t *pwchName,
/* [in] */ int cchName)
2002-06-21 13:16:28 +02:00
{
if(lexicalHandler_)
lexicalHandler_->startEntity(string_adaptor::construct_from_utf16(pwchName, cchName));
2002-06-21 13:16:28 +02:00
return S_OK;
} // startEntity
virtual HRESULT STDMETHODCALLTYPE endEntity(
/* [in] */ const wchar_t *pwchName,
/* [in] */ int cchName)
2002-06-21 13:16:28 +02:00
{
if(lexicalHandler_)
lexicalHandler_->endEntity(string_adaptor::construct_from_utf16(pwchName, cchName));
2002-06-21 13:16:28 +02:00
return S_OK;
} // endEntity
virtual HRESULT __stdcall startCDATA()
2002-06-21 13:16:28 +02:00
{
if(lexicalHandler_)
lexicalHandler_->startCDATA();
return S_OK;
} // startCDATA
virtual HRESULT __stdcall endCDATA()
2002-06-21 13:16:28 +02:00
{
if(lexicalHandler_)
lexicalHandler_->endCDATA();
return S_OK;
} // endCDATA
virtual HRESULT STDMETHODCALLTYPE comment(
/* [in] */ const wchar_t *pwchChars,
/* [in] */ int cchChars)
2002-06-21 13:16:28 +02:00
{
if(lexicalHandler_)
lexicalHandler_->comment(string_adaptor::construct_from_utf16(pwchChars, cchChars));
return S_OK;
2002-06-21 13:16:28 +02:00
} // comment
// satisfy COM interface even if we're not a COM object
long __stdcall QueryInterface(const struct _GUID &riid,void **ppvObject)
{
// we have to implement this, because we pass this as an IUnknown but it needs an
// ISAXLexicalHandler interface
if(riid == __uuidof(ISAXLexicalHandler))
2002-06-21 13:16:28 +02:00
*ppvObject = this;
return 0;
} // QueryInterface
unsigned long __stdcall AddRef() { return 0; }
unsigned long __stdcall Release() { return 0; }
private:
lexicalHandlerT* lexicalHandler_;
2002-06-21 13:16:28 +02:00
}; // class LexicalHandlerAdaptor
class DeclHandlerAdaptor : public ISAXDeclHandler
2002-06-21 13:16:28 +02:00
{
public:
DeclHandlerAdaptor() : declHandler_(0) { }
virtual ~DeclHandlerAdaptor() { }
void setDeclHandler(declHandlerT& handler) { declHandler_ = &handler; }
declHandlerT* getDeclHandler() const { return declHandler_; }
2002-06-21 13:16:28 +02:00
virtual HRESULT STDMETHODCALLTYPE elementDecl(
/* [in] */ const wchar_t *pwchName,
/* [in] */ int cchName,
/* [in] */ const wchar_t *pwchModel,
/* [in] */ int cchModel)
2002-06-21 13:16:28 +02:00
{
if(declHandler_)
declHandler_->elementDecl(string_adaptor::construct_from_utf16(pwchName, cchName),
string_adaptor::construct_from_utf16(pwchModel, cchModel));
2002-06-21 13:16:28 +02:00
return S_OK;
} // elementDecl
virtual HRESULT STDMETHODCALLTYPE attributeDecl(
/* [in] */ const wchar_t *pwchElementName,
/* [in] */ int cchElementName,
/* [in] */ const wchar_t *pwchAttributeName,
/* [in] */ int cchAttributeName,
/* [in] */ const wchar_t *pwchType,
/* [in] */ int cchType,
/* [in] */ const wchar_t *pwchValueDefault,
/* [in] */ int cchValueDefault,
/* [in] */ const wchar_t *pwchValue,
/* [in] */ int cchValue)
2002-06-21 13:16:28 +02:00
{
if(declHandler_)
declHandler_->attributeDecl(string_adaptor::construct_from_utf16(pwchElementName, cchElementName),
string_adaptor::construct_from_utf16(pwchAttributeName, cchAttributeName),
string_adaptor::construct_from_utf16(pwchType, cchType),
string_adaptor::construct_from_utf16(pwchValueDefault, cchValueDefault),
string_adaptor::construct_from_utf16(pwchValue, cchValue));
2002-06-21 13:16:28 +02:00
return S_OK;
} // attributeDecl
virtual HRESULT STDMETHODCALLTYPE internalEntityDecl(
/* [in] */ const wchar_t *pwchName,
/* [in] */ int cchName,
/* [in] */ const wchar_t *pwchValue,
/* [in] */ int cchValue)
2002-06-21 13:16:28 +02:00
{
if(declHandler_)
declHandler_->internalEntityDecl(string_adaptor::construct_from_utf16(pwchName, cchName),
string_adaptor::construct_from_utf16(pwchValue, cchValue));
2002-06-21 13:16:28 +02:00
return S_OK;
} // internalEntityDecl
virtual HRESULT STDMETHODCALLTYPE externalEntityDecl(
/* [in] */ const wchar_t *pwchName,
/* [in] */ int cchName,
/* [in] */ const wchar_t *pwchPublicId,
/* [in] */ int cchPublicId,
/* [in] */ const wchar_t *pwchSystemId,
/* [in] */ int cchSystemId)
2002-06-21 13:16:28 +02:00
{
if(declHandler_)
declHandler_->externalEntityDecl(string_adaptor::construct_from_utf16(pwchName, cchName),
string_adaptor::construct_from_utf16(pwchPublicId, cchPublicId),
string_adaptor::construct_from_utf16(pwchSystemId, cchSystemId));
2002-06-21 13:16:28 +02:00
return S_OK;
} // externalEntityDecl
// satisfy COM interface even if we're not a COM object
long __stdcall QueryInterface(const struct _GUID &riid,void **ppvObject)
{
// we have to implement this, because we pass this as an IUnknown but it needs an
// ISAXDeclHandler interface
if(riid == __uuidof(ISAXDeclHandler))
2002-06-21 13:16:28 +02:00
*ppvObject = reinterpret_cast<void*>(this);
return 0;
} // QueryInterface
unsigned long __stdcall AddRef() { return 0; }
unsigned long __stdcall Release() { return 0; }
private:
declHandlerT* declHandler_;
2002-06-21 13:16:28 +02:00
}; // class DeclHandlerAdaptor
class StreamAdaptor : public ISequentialStream
2002-06-21 13:16:28 +02:00
{
public:
StreamAdaptor(inputSourceT& source) :
2002-06-21 13:16:28 +02:00
source_(source)
{
} // StreamAdaptor
virtual HRESULT __stdcall Read(void* pv, ULONG cb, ULONG* pcbRead)
{
source_.getByteStream()->read(reinterpret_cast<char*>(pv), cb);
*pcbRead = source_.getByteStream()->gcount();
return S_OK;
} // Read
virtual HRESULT __stdcall Write(const void __RPC_FAR *pv, ULONG cb, ULONG __RPC_FAR *pcbWritten)
2002-06-21 13:16:28 +02:00
{
return S_FALSE;
} // Write
// satisfy COM interface even if we're not a COM object
long __stdcall QueryInterface(const struct _GUID &riid,void **ppvObject)
{
// we have to implement this, because we pass this as an IUnknown but it needs an
// IStream interface
if(riid == __uuidof(ISequentialStream))
{
2002-06-21 13:16:28 +02:00
*ppvObject = reinterpret_cast<void*>(this);
return S_OK;
} // if ...
return E_NOINTERFACE;
2002-06-21 13:16:28 +02:00
} // QueryInterface
unsigned long __stdcall AddRef() { return 1; }
unsigned long __stdcall Release() { return 1; }
2002-06-21 13:16:28 +02:00
private:
inputSourceT& source_;
2002-06-21 13:16:28 +02:00
}; // StreamAdaptor
2002-06-21 13:16:28 +02:00
//////////////////////////////////////////////////////
// member variables
COMInitializer_type init;
DTDHandlerAdaptor dtdHandler_;
ContentHandlerAdaptor contentHandler_;
ErrorHandlerAdaptor errorHandler_;
LexicalHandlerAdaptor lexicalHandler_;
DeclHandlerAdaptor declHandler_;
ISAXXMLReaderPtr reader_;
SAX::PropertyNames<string_type, string_adaptor> properties_;
2002-06-21 13:16:28 +02:00
}; // class msxml
// Creates the underlying MSXML SAX reader and wires the adaptor members
// into it.
//
// Reader versions are tried newest first (6.0, 5.0, 4.0, 3.0), followed by
// the SAXXMLReader coclass as a last resort.  Throws SAXException when no
// reader could be created.
template<class string_type, class T0, class T1>
msxml2_wrapper<string_type, T0, T1>::msxml2_wrapper()
{
  static const char* const progIds[] =
  {
    "Msxml2.SAXXMLReader.6.0",
    "Msxml2.SAXXMLReader.5.0",
    "Msxml2.SAXXMLReader.4.0",
    "Msxml2.SAXXMLReader.3.0"
  };
  const int progIdCount = static_cast<int>(sizeof(progIds) / sizeof(progIds[0]));

  for(int i = 0; (i < progIdCount) && (reader_.GetInterfacePtr() == 0); ++i)
    reader_.CreateInstance(progIds[i]);

  // CreateInstance expects a class id here; the interface id of
  // ISAXXMLReader does not name a creatable class, so use the coclass.
  if(reader_.GetInterfacePtr() == 0)
    reader_.CreateInstance(__uuidof(SAXXMLReader));

  if(reader_.GetInterfacePtr() == 0)
    throw SAXException("MSXML SAX Reader (pre-4.0) could not be instantiated");

  reader_->putContentHandler(&contentHandler_);
  reader_->putErrorHandler(&errorHandler_);
  reader_->putDTDHandler(&dtdHandler_);

  // The lexical and declaration handlers have no dedicated setter; they are
  // installed as properties carrying an IUnknown pointer.
  VARIANT wrapper;
  ::VariantInit(&wrapper);   // do not hand MSXML indeterminate reserved fields
  wrapper.vt = VT_UNKNOWN;

  wrapper.punkVal = static_cast<ISAXLexicalHandler*>(&lexicalHandler_);
  reader_->putProperty(L"http://xml.org/sax/properties/lexical-handler", wrapper);

  wrapper.punkVal = static_cast<ISAXDeclHandler*>(&declHandler_);
  reader_->putProperty(L"http://xml.org/sax/properties/declaration-handler", wrapper);
} // msxml2_wrapper
// Lets go of the MSXML reader, if one was ever obtained.
template<class string_type, class T0, class T1>
msxml2_wrapper<string_type, T0, T1>::~msxml2_wrapper()
{
  const bool haveReader = (reader_.GetInterfacePtr() != 0);
  if(haveReader)
  {
    reader_.Release();
  } // if ...
} // ~msxml2_wrapper
2002-06-21 13:16:28 +02:00
// Queries MSXML for the state of the named feature.
// Returns true only when MSXML reports the feature as VARIANT_TRUE; a
// failed query (for instance an unknown feature name) yields false.
template<class string_type, class T0, class T1>
bool msxml2_wrapper<string_type, T0, T1>::getFeature(const string_type& name) const
{
  // initialized so that a failed call cannot leave us reading garbage
  VARIANT_BOOL feature = VARIANT_FALSE;
  std::wstring wName(string_adaptor::asStdWString(name));

  if(FAILED(reader_->getFeature(wName.c_str(), &feature)))
    return false;

  return feature == VARIANT_TRUE;
} // msxml2_wrapper::getFeature
2002-06-21 13:16:28 +02:00
// Switches the named MSXML feature on or off.
// The result of the underlying call is not examined, so a feature MSXML
// rejects is silently left unchanged.
template<class string_type, class T0, class T1>
void msxml2_wrapper<string_type, T0, T1>::setFeature(const string_type& name, bool value)
{
  std::wstring wName(string_adaptor::asStdWString(name));

  // A C++ bool converts to 1, but the COM truth value VARIANT_TRUE is -1,
  // so translate explicitly instead of relying on the implicit conversion.
  const VARIANT_BOOL flag = value ? VARIANT_TRUE : VARIANT_FALSE;
  reader_->putFeature(wName.c_str(), flag);
} // setFeature
// Registers the SAX ErrorHandler with the error adaptor, which passes
// recorded problems on to it when report() is called.
template<class string_type, class T0, class T1>
void msxml2_wrapper<string_type, T0, T1>::setErrorHandler(errorHandlerT& handler)
{
  ErrorHandlerAdaptor& adaptor = errorHandler_;
  adaptor.setErrorHandler(handler);
} // setErrorHandler
// Parses the document described by source.
//
// When the source carries no byte stream, MSXML is asked to load the
// document from the source's system id.  Otherwise the byte stream is
// handed to MSXML through a StreamAdaptor.  Problems recorded during the
// parse are passed to the registered ErrorHandler afterwards.
template<class string_type, class T0, class T1>
void msxml2_wrapper<string_type, T0, T1>::parse(inputSourceT& source)
{
  if(source.getByteStream() == 0)
  {
    std::wstring wSysId(string_adaptor::asStdWString(source.getSystemId()));
    reader_->parseURL(wSysId.c_str());
  }
  else
  {
    // sa lives on the stack for exactly as long as the parse call needs it
    StreamAdaptor sa(source);

    VARIANT wrapper;
    ::VariantInit(&wrapper);   // do not hand MSXML indeterminate reserved fields
    wrapper.vt = VT_UNKNOWN;
    wrapper.punkVal = static_cast<ISequentialStream*>(&sa);

    reader_->parse(wrapper);
  } // if ...

  errorHandler_.report();
} // parse
} // namespace SAX
2007-09-05 11:49:18 +02:00
} // namespace Arabica
2002-06-21 13:16:28 +02:00
#endif
// end of file