mirror of
https://github.com/jezhiggins/arabica
synced 2025-01-17 18:12:04 +01:00
1048 lines
38 KiB
C++
1048 lines
38 KiB
C++
#ifndef ARABICA_SAX_EXPAT_H
|
|
#define ARABICA_SAX_EXPAT_H
|
|
//---------------------------------------------------------------------------
|
|
// A SAX2 wrapper class for expat.
|
|
//---------------------------------------------------------------------------
|
|
|
|
#include <SAX/ArabicaConfig.h>
|
|
#include <SAX/XMLReader.h>
|
|
#include <expat.h>
|
|
|
|
#include <sstream>
|
|
#include <SAX/InputSource.h>
|
|
#include <SAX/ContentHandler.h>
|
|
#include <SAX/SAXParseException.h>
|
|
#include <SAX/SAXNotRecognizedException.h>
|
|
#include <SAX/SAXNotSupportedException.h>
|
|
#include <SAX/ext/DeclHandler.h>
|
|
#include <SAX/ext/LexicalHandler.h>
|
|
#include <SAX/helpers/DefaultHandler.h>
|
|
#include <SAX/helpers/AttributesImpl.h>
|
|
#include <SAX/helpers/NamespaceSupport.h>
|
|
#include <SAX/helpers/InputSourceResolver.h>
|
|
#include <SAX/helpers/FeatureNames.h>
|
|
#include <SAX/helpers/PropertyNames.h>
|
|
#include <SAX/helpers/StringAdaptor.h>
|
|
#include <SAX/helpers/AttributeDefaults.h>
|
|
#include <typeinfo>
|
|
#include <map>
|
|
|
|
namespace SAX
|
|
{
|
|
|
|
////////////////////////////////////////////////////////////////////////////
|
|
// the callback functions for expat
|
|
namespace expat_wrapper_impl_mumbojumbo
|
|
{
|
|
|
|
extern "C"
|
|
{
|
|
void ewim_charHandler(void* data, const char* txt, int txtlen);
|
|
void ewim_startElement(void* data, const char* qName, const char** atts);
|
|
void ewim_endElement(void* data, const char* qName);
|
|
void ewim_processingInstruction(void* userData, const char* target, const char* data);
|
|
void ewim_elementDeclaration(void* userData,
|
|
const XML_Char* name,
|
|
XML_Content* model);
|
|
void ewim_attListDeclaration(void* userData,
|
|
const XML_Char* elname,
|
|
const XML_Char* attname,
|
|
const XML_Char* att_type,
|
|
const XML_Char* dflt,
|
|
int isrequired);
|
|
void ewim_entityDeclaration(void* userData,
|
|
const XML_Char* entityName,
|
|
int is_parameter_entity,
|
|
const XML_Char* value,
|
|
int value_length,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId,
|
|
const XML_Char* notationName);
|
|
void ewim_notationDeclaration(void* userData,
|
|
const XML_Char* notationName,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId);
|
|
void ewim_startDoctypeDecl(void* userData,
|
|
const XML_Char* doctypeName,
|
|
const XML_Char* sysid,
|
|
const XML_Char* pubid,
|
|
int has_internal_subset);
|
|
void ewim_endDoctypeDecl(void* userData);
|
|
void ewim_startCdataSection(void* userData);
|
|
void ewim_endCdataSection(void* userData);
|
|
void ewim_commentHandler(void* userData, const XML_Char* data);
|
|
int ewim_externalEntityRefHandler(XML_Parser parser,
|
|
const XML_Char* context,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId);
|
|
|
|
} // extern "C"
|
|
|
|
class expat2base
|
|
{
|
|
private:
|
|
virtual void charHandler(const char* txt, int txtlen) = 0;
|
|
virtual void startElement(const char* qName, const char** atts) = 0;
|
|
virtual void endElement(const char* qName) = 0;
|
|
virtual void processingInstruction(const char* target, const char* data) = 0;
|
|
virtual void elementDeclaration(const XML_Char* name,
|
|
const XML_Content* model) = 0;
|
|
virtual void attListDeclaration(const XML_Char* elname,
|
|
const XML_Char* attname,
|
|
const XML_Char* att_type,
|
|
const XML_Char* dflt,
|
|
int isrequired) = 0;
|
|
virtual void entityDeclaration(const XML_Char* entityName,
|
|
int is_parameter_entity,
|
|
const XML_Char* value,
|
|
int value_length,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId,
|
|
const XML_Char* notationName) = 0;
|
|
virtual void notationDeclaration(const XML_Char* notationName,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId) = 0;
|
|
virtual void startDoctypeDecl(const XML_Char* doctypeName,
|
|
const XML_Char* sysid,
|
|
const XML_Char* pubid,
|
|
int has_internal_subset) = 0;
|
|
virtual void endDoctypeDecl() = 0;
|
|
virtual void startCdataSection() = 0;
|
|
virtual void endCdataSection() = 0;
|
|
virtual void commentHandler(const XML_Char* data) = 0;
|
|
virtual int externalEntityRefHandler(XML_Parser parser,
|
|
const XML_Char* context,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId) = 0;
|
|
|
|
|
|
friend void ewim_charHandler(void*, const char*, int);
|
|
friend void ewim_startElement(void*, const char*, const char**);
|
|
friend void ewim_endElement(void*, const char*);
|
|
friend void ewim_processingInstruction(void*, const char*, const char*);
|
|
friend void ewim_elementDeclaration(void*, const XML_Char*, XML_Content*);
|
|
friend void ewim_attListDeclaration(void*, const XML_Char*, const XML_Char*, const XML_Char*, const XML_Char*, int);
|
|
friend void ewim_entityDeclaration(void*, const XML_Char*, int, const XML_Char*, int, const XML_Char*, const XML_Char*, const XML_Char*, const XML_Char*);
|
|
friend void ewim_notationDeclaration(void*, const XML_Char*, const XML_Char*, const XML_Char*, const XML_Char*);
|
|
friend void ewim_startDoctypeDecl(void*, const XML_Char*, const XML_Char*, const XML_Char*, int);
|
|
friend void ewim_endDoctypeDecl(void*);
|
|
friend void ewim_startCdataSection(void*);
|
|
friend void ewim_endCdataSection(void*);
|
|
friend void ewim_commentHandler(void*, const XML_Char*);
|
|
friend int ewim_externalEntityRefHandler(XML_Parser, const XML_Char*, const XML_Char*, const XML_Char*, const XML_Char*);
|
|
|
|
}; // class expat2base
|
|
|
|
} // namespace expat_wrapper_impl_mumbojumbo
|
|
|
|
////////////////////////////////////////////////////////////////////////////
|
|
// A SAX2 wrapper for expat. expat has an event-based interface of its own,
|
|
// so the SAX wrapper maps more or less directly to it.
|
|
|
|
/**
|
|
* expat_wrapper puts an {@link basic_XMLReader XMLReader} interface
|
|
* around <a href='http://www.libexpat.org/'>Expat</a>.
|
|
* <p>
|
|
* For general usage:<br>
|
|
* <code>
|
|
* expat_wrapper<std::string> parser;<br>
|
|
* ... <br>
|
|
* parser.parse(filename);<br>
|
|
* </code>
|
|
* expat_wrapper<std::string> will hand out std::strings containing UTF-8 encoded
|
|
* data (expat's native format).
|
|
* <p>
|
|
* If you need std::wstring containing UCS-2 or perhaps you want to use some custom
|
|
* string type, then you can simply instantiate expat_wrapper on your string type and
|
|
* a policy class which knows how to convert UTF-8 const char*s to your type.
|
|
* <p>
|
|
* The default policy is:
|
|
* <code>
|
|
* template<class stringT><br>
|
|
* class default_expat_string_convertor<br>
|
|
* {<br>
|
|
* public:<br>
|
|
* stringT makeStringT(const char* str) const<br>
|
|
* {<br>
|
|
* if(!str)<br>
|
|
* return stringT();<br>
|
|
* return stringT(str);<br>
|
|
* } // makeStringT<br>
|
|
* stringT makeStringT(const char* str, int length) const<br>
|
|
* {<br>
|
|
* return stringT(str, length);<br>
|
|
* } // makeStringT<br>
|
|
* <br>
|
|
* std::string asStdString(const stringT& str) const<br>
|
|
* {<br>
|
|
* return str;<br>
|
|
* } // asStdString<br>
|
|
* }; // class default_expat_string_convertor<br>
|
|
* </code>
|
|
* <p>
|
|
* A custom policy needs to provide the equivalent makeStringT and asStdString functions.
|
|
* <p>
|
|
* @author Jez Higgins
|
|
* <a href="mailto:jez@jezuk.co.uk">jez@jezuk.co.uk</a>
|
|
* @version $Id$
|
|
* @see SAX::basic_XMLReader
|
|
*/
|
|
template<class string_type, class string_adaptor_type = SAX::default_string_adaptor<string_type> >
|
|
class expat_wrapper : public SAX::basic_XMLReader<string_type>,
|
|
public SAX::basic_Locator<string_type>,
|
|
public expat_wrapper_impl_mumbojumbo::expat2base
|
|
{
|
|
public:
|
|
typedef string_type stringT;
|
|
typedef string_adaptor_type string_adaptorT;
|
|
typedef SAX::basic_EntityResolver<stringT> entityResolverT;
|
|
typedef SAX::basic_DTDHandler<stringT> dtdHandlerT;
|
|
typedef SAX::basic_ContentHandler<stringT> contentHandlerT;
|
|
typedef SAX::basic_DeclHandler<stringT> declHandlerT;
|
|
typedef SAX::basic_LexicalHandler<stringT> lexicalHandlerT;
|
|
typedef SAX::basic_InputSource<stringT> inputSourceT;
|
|
typedef SAX::basic_Locator<stringT> locatorT;
|
|
typedef SAX::basic_NamespaceSupport<stringT, string_adaptorT> namespaceSupportT;
|
|
typedef SAX::basic_ErrorHandler<stringT> errorHandlerT;
|
|
typedef SAX::basic_SAXParseException<stringT> SAXParseExceptionT;
|
|
typedef typename SAX::basic_XMLReader<stringT>::PropertyBase PropertyBaseT;
|
|
|
|
expat_wrapper();
|
|
virtual ~expat_wrapper();
|
|
|
|
/////////////////////////////////////////////////
|
|
// Configuration
|
|
virtual bool getFeature(const stringT& name) const;
|
|
virtual void setFeature(const stringT& name, bool value);
|
|
|
|
/////////////////////////////////////////////////
|
|
// Event Handlers
|
|
virtual void setEntityResolver(entityResolverT& resolver) { entityResolver_ = &resolver; }
|
|
virtual entityResolverT* getEntityResolver() const { return entityResolver_; }
|
|
virtual void setDTDHandler(dtdHandlerT& handler) { dtdHandler_ = &handler; }
|
|
virtual dtdHandlerT* getDTDHandler() const { return dtdHandler_; }
|
|
virtual void setContentHandler(contentHandlerT& handler) { contentHandler_ = &handler; }
|
|
virtual contentHandlerT* getContentHandler() const { return contentHandler_; }
|
|
virtual void setErrorHandler(errorHandlerT& handler) { errorHandler_ = &handler; }
|
|
virtual errorHandlerT* getErrorHandler() const { return errorHandler_; }
|
|
|
|
//////////////////////////////////////////////////
|
|
// Parsing
|
|
virtual void parse(inputSourceT& input);
|
|
private:
|
|
bool do_parse(inputSourceT& source, XML_Parser parser);
|
|
|
|
public:
|
|
//////////////////////////////////////////////////
|
|
// Locator
|
|
virtual stringT getPublicId() const;
|
|
virtual stringT getSystemId() const;
|
|
virtual int getLineNumber() const;
|
|
virtual int getColumnNumber() const;
|
|
|
|
///////////////////////////////////////////////////
|
|
// properties
|
|
protected:
|
|
virtual std::auto_ptr<PropertyBaseT> doGetProperty(const stringT& name);
|
|
virtual void doSetProperty(const stringT& name, std::auto_ptr<PropertyBaseT> value);
|
|
private:
|
|
typename namespaceSupportT::Parts processName(const stringT& qName, bool isAttribute);
|
|
void reportError(const std::string& message, bool fatal = false);
|
|
void checkNotParsing(const stringT& type, const stringT& name) const;
|
|
|
|
private:
|
|
virtual void charHandler(const char* txt, int txtlen);
|
|
virtual void startElement(const char* qName, const char** atts);
|
|
virtual void endElement(const char* qName);
|
|
virtual void processingInstruction(const char* target, const char* data);
|
|
virtual void elementDeclaration(const XML_Char* name,
|
|
const XML_Content* model);
|
|
virtual void attListDeclaration(const XML_Char* elname,
|
|
const XML_Char* attname,
|
|
const XML_Char* att_type,
|
|
const XML_Char* dflt,
|
|
int isrequired);
|
|
virtual void entityDeclaration(const XML_Char* entityName,
|
|
int is_parameter_entity,
|
|
const XML_Char* value,
|
|
int value_length,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId,
|
|
const XML_Char* notationName);
|
|
virtual void notationDeclaration(const XML_Char* notationName,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId);
|
|
virtual void startDoctypeDecl(const XML_Char* doctypeName,
|
|
const XML_Char* sysid,
|
|
const XML_Char* pubid,
|
|
int has_internal_subset);
|
|
virtual void endDoctypeDecl();
|
|
virtual void startCdataSection();
|
|
virtual void endCdataSection();
|
|
virtual void commentHandler(const XML_Char* data);
|
|
virtual int externalEntityRefHandler(XML_Parser parser,
|
|
const XML_Char* context,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId);
|
|
|
|
|
|
private:
|
|
void startElementNoNS(const char* qName, const char** atts);
|
|
void endElementNoNS(const char* qName);
|
|
void convertXML_Content(std::ostream& os, const XML_Content* model, bool isChild = false);
|
|
|
|
// member variables
|
|
entityResolverT* entityResolver_;
|
|
dtdHandlerT* dtdHandler_;
|
|
contentHandlerT* contentHandler_;
|
|
errorHandlerT* errorHandler_;
|
|
declHandlerT* declHandler_;
|
|
lexicalHandlerT* lexicalHandler_;
|
|
namespaceSupportT nsSupport_;
|
|
|
|
XML_Parser parser_;
|
|
stringT publicId_;
|
|
stringT systemId_;
|
|
bool parsing_;
|
|
|
|
// features
|
|
bool namespaces_;
|
|
bool prefixes_;
|
|
bool externalResolving_;
|
|
|
|
string_adaptorT SA_;
|
|
stringT emptyString_;
|
|
const SAX::FeatureNames<stringT, string_adaptorT> features_;
|
|
const SAX::PropertyNames<stringT, string_adaptorT> properties_;
|
|
const SAX::NamespaceConstants<stringT, string_adaptorT> nsc_;
|
|
const SAX::AttributeDefaults<stringT, string_adaptorT> attrDefaults_;
|
|
|
|
std::map<stringT, stringT> declaredExternalEnts_;
|
|
}; // class expat_wrapper
|
|
|
|
//////////////////////////////////////////////////////////////////
|
|
// expat wrapper definition
|
|
template<class stringT, class string_adaptorT>
|
|
expat_wrapper<stringT, string_adaptorT>::expat_wrapper() :
|
|
entityResolver_(0),
|
|
dtdHandler_(0),
|
|
contentHandler_(0),
|
|
errorHandler_(0),
|
|
declHandler_(0),
|
|
lexicalHandler_(0),
|
|
parser_(XML_ParserCreate(0)),
|
|
parsing_(false),
|
|
namespaces_(true),
|
|
prefixes_(true),
|
|
externalResolving_(false)
|
|
{
|
|
XML_SetUserData(parser_, reinterpret_cast<void*>(static_cast<expat_wrapper_impl_mumbojumbo::expat2base*>(this)));
|
|
XML_SetCharacterDataHandler(parser_, expat_wrapper_impl_mumbojumbo::ewim_charHandler);
|
|
XML_SetElementHandler(parser_, expat_wrapper_impl_mumbojumbo::ewim_startElement, expat_wrapper_impl_mumbojumbo::ewim_endElement);
|
|
XML_SetElementDeclHandler(parser_, expat_wrapper_impl_mumbojumbo::ewim_elementDeclaration);
|
|
XML_SetAttlistDeclHandler(parser_, expat_wrapper_impl_mumbojumbo::ewim_attListDeclaration);
|
|
XML_SetEntityDeclHandler(parser_, expat_wrapper_impl_mumbojumbo::ewim_entityDeclaration);
|
|
XML_SetNotationDeclHandler(parser_, expat_wrapper_impl_mumbojumbo::ewim_notationDeclaration);
|
|
XML_SetDoctypeDeclHandler(parser_, expat_wrapper_impl_mumbojumbo::ewim_startDoctypeDecl, expat_wrapper_impl_mumbojumbo::ewim_endDoctypeDecl);
|
|
XML_SetCdataSectionHandler(parser_, expat_wrapper_impl_mumbojumbo::ewim_startCdataSection, expat_wrapper_impl_mumbojumbo::ewim_endCdataSection);
|
|
XML_SetCommentHandler(parser_, expat_wrapper_impl_mumbojumbo::ewim_commentHandler);
|
|
XML_SetExternalEntityRefHandler(parser_, expat_wrapper_impl_mumbojumbo::ewim_externalEntityRefHandler);
|
|
XML_SetProcessingInstructionHandler(parser_, expat_wrapper_impl_mumbojumbo::ewim_processingInstruction);
|
|
} // expat
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
expat_wrapper<stringT, string_adaptorT>::~expat_wrapper()
|
|
{
|
|
XML_ParserFree(parser_);
|
|
} // ~expat
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::setFeature(const stringT& name, bool value)
|
|
{
|
|
if(name == features_.namespaces)
|
|
{
|
|
checkNotParsing(SA_.makeStringT("feature"), name);
|
|
namespaces_ = value;
|
|
if(!namespaces_ && !prefixes_)
|
|
prefixes_ = true;
|
|
return;
|
|
} // namespaces
|
|
|
|
if(name == features_.namespace_prefixes)
|
|
{
|
|
checkNotParsing(SA_.makeStringT("feature"), name);
|
|
prefixes_ = value;
|
|
if(prefixes_ && !namespaces_)
|
|
namespaces_ = true;
|
|
return;
|
|
} // namespace prefixes
|
|
|
|
if(name == features_.external_general || name == features_.external_parameter)
|
|
{
|
|
checkNotParsing(SA_.makeStringT("feature"), name);
|
|
externalResolving_ = value;
|
|
return;
|
|
} // external entity resolution
|
|
|
|
if(name == features_.validation)
|
|
{
|
|
std::ostringstream os;
|
|
os << "Feature not supported " << SA_.asStdString(name);
|
|
throw SAX::SAXNotSupportedException(os.str());
|
|
}
|
|
else
|
|
{
|
|
std::ostringstream os;
|
|
os << "Feature not recognized " << SA_.asStdString(name);
|
|
throw SAX::SAXNotRecognizedException(os.str());
|
|
}
|
|
} // setFeature
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
bool expat_wrapper<stringT, string_adaptorT>::getFeature(const stringT& name) const
|
|
{
|
|
if(name == features_.namespaces)
|
|
return namespaces_;
|
|
|
|
if(name == features_.namespace_prefixes)
|
|
return prefixes_;
|
|
|
|
if(name == features_.external_general || name == features_.external_parameter)
|
|
return externalResolving_;
|
|
|
|
if(name == features_.validation)
|
|
return false;
|
|
|
|
throw SAX::SAXNotRecognizedException(std::string("Feature not recognized ") + SA_.asStdString(name));
|
|
} // getFeature
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::parse(inputSourceT& source)
|
|
{
|
|
publicId_ = source.getPublicId();
|
|
systemId_ = source.getSystemId();
|
|
|
|
if(contentHandler_)
|
|
contentHandler_->setDocumentLocator(*this);
|
|
|
|
parsing_ = true;
|
|
|
|
if(contentHandler_)
|
|
contentHandler_->startDocument();
|
|
|
|
XML_SetParamEntityParsing(parser_, externalResolving_ ? XML_PARAM_ENTITY_PARSING_ALWAYS : XML_PARAM_ENTITY_PARSING_NEVER);
|
|
|
|
do_parse(source, parser_);
|
|
|
|
if(contentHandler_)
|
|
contentHandler_->endDocument();
|
|
|
|
parsing_ = false;
|
|
} // parse
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
bool expat_wrapper<stringT, string_adaptorT>::do_parse(inputSourceT& source, XML_Parser parser)
|
|
{
|
|
InputSourceResolver is(source, SA_);
|
|
if(is.resolve() == 0)
|
|
{
|
|
reportError("Could not resolve XML document", true);
|
|
return false;
|
|
} // if(is.resolver() == 0)
|
|
|
|
const int BUFF_SIZE = 10*1024;
|
|
while(!is.resolve()->eof())
|
|
{
|
|
char* buffer = (char*)XML_GetBuffer(parser, BUFF_SIZE);
|
|
if(buffer == NULL)
|
|
{
|
|
reportError("Could not acquire expat buffer", true);
|
|
return false;
|
|
} // if ...
|
|
|
|
is.resolve()->read(buffer, BUFF_SIZE);
|
|
if(XML_ParseBuffer(parser, is.resolve()->gcount(), is.resolve()->eof()) == 0)
|
|
{
|
|
// error
|
|
reportError(XML_ErrorString(XML_GetErrorCode(parser_)), true);
|
|
return false;
|
|
} // if ...
|
|
} // while
|
|
|
|
return true;
|
|
} // do_parse
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
#ifndef ARABICA_VS6_WORKAROUND
|
|
std::auto_ptr<typename expat_wrapper<stringT, string_adaptorT>::PropertyBaseT> expat_wrapper<stringT, string_adaptorT>::doGetProperty(const stringT& name)
|
|
#else
|
|
std::auto_ptr<expat_wrapper<stringT, string_adaptorT>::PropertyBaseT> expat_wrapper<stringT, string_adaptorT>::doGetProperty(const stringT& name)
|
|
#endif
|
|
{
|
|
if(name == properties_.lexicalHandler)
|
|
{
|
|
SAX::basic_XMLReader<stringT>::Property<lexicalHandlerT*>* prop =
|
|
new SAX::basic_XMLReader<stringT>::Property<lexicalHandlerT*>(lexicalHandler_);
|
|
return std::auto_ptr<PropertyBaseT>(prop);
|
|
}
|
|
else if(name == properties_.declHandler)
|
|
{
|
|
SAX::basic_XMLReader<stringT>::Property<declHandlerT*>* prop =
|
|
new SAX::basic_XMLReader<stringT>::Property<declHandlerT*>(declHandler_);
|
|
return std::auto_ptr<PropertyBaseT>(prop);
|
|
}
|
|
else
|
|
throw SAX::SAXNotRecognizedException(std::string("Property not recognized ") + SA_.asStdString(name));
|
|
} // doGetProperty
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::doSetProperty(const stringT& name, std::auto_ptr<PropertyBaseT> value)
|
|
{
|
|
if(name == properties_.lexicalHandler)
|
|
{
|
|
SAX::basic_XMLReader<stringT>::Property<lexicalHandlerT&>* prop =
|
|
dynamic_cast<SAX::basic_XMLReader<stringT>::Property<lexicalHandlerT&>*>(value.get());
|
|
|
|
if(!prop)
|
|
throw std::bad_cast();
|
|
|
|
lexicalHandler_ = &(prop->get());
|
|
}
|
|
else if(name == properties_.declHandler)
|
|
{
|
|
SAX::basic_XMLReader<stringT>::Property<declHandlerT&>* prop =
|
|
dynamic_cast<SAX::basic_XMLReader<stringT>::Property<declHandlerT&>*>(value.get());
|
|
|
|
if(!prop)
|
|
throw std::bad_cast();
|
|
|
|
declHandler_ = &(prop->get());
|
|
}
|
|
else
|
|
{
|
|
std::ostringstream os;
|
|
os << "Property not recognized " << SA_.asStdString(name);
|
|
throw SAX::SAXNotRecognizedException(os.str());
|
|
}
|
|
} // doSetProperty
|
|
|
|
// Locator implementation
|
|
template<class stringT, class string_adaptorT>
|
|
stringT expat_wrapper<stringT, string_adaptorT>::getPublicId() const
|
|
{
|
|
return publicId_;
|
|
} // getPublicId
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
stringT expat_wrapper<stringT, string_adaptorT>::getSystemId() const
|
|
{
|
|
return systemId_;
|
|
} // getSystemId
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
int expat_wrapper<stringT, string_adaptorT>::getLineNumber() const
|
|
{
|
|
return XML_GetCurrentLineNumber(parser_);
|
|
} // getLineNumber
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
int expat_wrapper<stringT, string_adaptorT>::getColumnNumber() const
|
|
{
|
|
return XML_GetCurrentColumnNumber(parser_);
|
|
} // getColumnNumber
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
typename SAX::basic_NamespaceSupport<stringT, string_adaptorT>::Parts expat_wrapper<stringT, string_adaptorT>::processName(const stringT& qName, bool isAttribute)
|
|
{
|
|
typename namespaceSupportT::Parts p = nsSupport_.processName(qName, isAttribute);
|
|
if(!p.URI.length() && p.prefix.length())
|
|
reportError(std::string("Undeclared prefix ") + SA_.asStdString(qName));
|
|
return p;
|
|
} // processName
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::reportError(const std::string& message, bool fatal)
|
|
{
|
|
if(!errorHandler_)
|
|
return;
|
|
|
|
SAXParseExceptionT e(message,
|
|
publicId_,
|
|
systemId_,
|
|
XML_GetCurrentLineNumber(parser_),
|
|
XML_GetCurrentColumnNumber(parser_));
|
|
if(fatal)
|
|
errorHandler_->fatalError(e);
|
|
else
|
|
errorHandler_->error(e);
|
|
} // reportError
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::checkNotParsing(const stringT& type, const stringT& name) const
|
|
{
|
|
if(parsing_)
|
|
{
|
|
std::ostringstream os;
|
|
os << "Can't change " << SA_.asStdString(type) << " " << SA_.asStdString(name) << " while parsing";
|
|
throw SAX::SAXNotSupportedException(os.str());
|
|
} // if(parsing_)
|
|
} // checkNotParsing
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::charHandler(const char* txt, int txtlen)
|
|
{
|
|
if(!contentHandler_)
|
|
return;
|
|
contentHandler_->characters(SA_.makeStringT(txt, txtlen));
|
|
} // charHandler
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::startElement(const char* qName, const char** atts)
|
|
{
|
|
if(!contentHandler_)
|
|
return;
|
|
|
|
if(!namespaces_)
|
|
{
|
|
startElementNoNS(qName, atts);
|
|
return;
|
|
} // if(!namespaces)
|
|
|
|
// OK we're doing Namespaces
|
|
nsSupport_.pushContext();
|
|
bool seenDecl = false;
|
|
SAX::basic_AttributesImpl<stringT> attributes;
|
|
|
|
// take a first pass and copy all the attributes, noting any declarations
|
|
if(atts && *atts != 0)
|
|
{
|
|
while(*atts != 0)
|
|
{
|
|
stringT attQName = SA_.makeStringT(*atts++);
|
|
stringT value = SA_.makeStringT(*atts++);
|
|
|
|
// declaration?
|
|
if(attQName.find(nsc_.xmlns) == 0)
|
|
{
|
|
stringT prefix;
|
|
size_t n = attQName.find(nsc_.colon);
|
|
if(n != stringT::npos)
|
|
prefix = stringT(attQName.begin() + n + 1, attQName.end());
|
|
if(!nsSupport_.declarePrefix(prefix, value))
|
|
reportError(std::string("Illegal Namespace prefix ") + SA_.asStdString(prefix));
|
|
contentHandler_->startPrefixMapping(prefix, value);
|
|
if(prefixes_)
|
|
attributes.addAttribute(emptyString_,
|
|
emptyString_,
|
|
attQName,
|
|
emptyString_,
|
|
value);
|
|
seenDecl = true;
|
|
}
|
|
else
|
|
{
|
|
typename namespaceSupportT::Parts attName = processName(attQName, true);
|
|
attributes.addAttribute(attName.URI, attName.localName, attName.rawName, emptyString_, value);
|
|
}
|
|
} // while ...
|
|
} // if ...
|
|
|
|
// if there was a Namespace decl we have to go around again
|
|
if(seenDecl)
|
|
{
|
|
int length = attributes.getLength();
|
|
for(int i = 0; i < length; ++i)
|
|
{
|
|
stringT attQName = attributes.getQName(i);
|
|
if(attQName.find(nsc_.xmlns))
|
|
{
|
|
typename namespaceSupportT::Parts attName = processName(attQName, true);
|
|
attributes.setURI(i, attName.URI);
|
|
attributes.setLocalName(i, attName.localName);
|
|
} // if ...
|
|
} // for ...
|
|
} // if(seenDecl)
|
|
|
|
// at last! report the event
|
|
typename namespaceSupportT::Parts name = processName(SA_.makeStringT(qName), false);
|
|
contentHandler_->startElement(name.URI, name.localName, name.rawName, attributes);
|
|
} // startElement
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::startElementNoNS(const char* qName, const char** atts)
|
|
{
|
|
SAX::basic_AttributesImpl<stringT> attributes;
|
|
|
|
if(atts && *atts != 0)
|
|
{
|
|
while(*atts != 0)
|
|
{
|
|
stringT attQName = SA_.makeStringT(*atts++);
|
|
stringT value = SA_.makeStringT(*atts++);
|
|
|
|
attributes.addAttribute(emptyString_, emptyString_, attQName, emptyString_, value);
|
|
} // while ..
|
|
} // if ...
|
|
|
|
contentHandler_->startElement(emptyString_, emptyString_, SA_.makeStringT(qName), attributes);
|
|
} // startElementNoNS
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::endElement(const char* qName)
|
|
{
|
|
if(!contentHandler_)
|
|
return;
|
|
|
|
if(!namespaces_)
|
|
{
|
|
endElementNoNS(qName);
|
|
return;
|
|
} // if(!namespaces_)
|
|
|
|
typename namespaceSupportT::Parts name = processName(SA_.makeStringT(qName), false);
|
|
contentHandler_->endElement(name.URI, name.localName, name.rawName);
|
|
typename namespaceSupportT::stringListT prefixes = nsSupport_.getDeclaredPrefixes();
|
|
for(size_t i = 1, end = prefixes.size(); i < end; ++i)
|
|
contentHandler_->endPrefixMapping(prefixes[i]);
|
|
nsSupport_.popContext();
|
|
} // endElement
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::endElementNoNS(const char* qName)
|
|
{
|
|
if(contentHandler_)
|
|
contentHandler_->endElement(emptyString_, emptyString_, SA_.makeStringT(qName));
|
|
} // endElementNoNS
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::processingInstruction(const char* target, const char* data)
|
|
{
|
|
if(contentHandler_)
|
|
contentHandler_->processingInstruction(SA_.makeStringT(target), SA_.makeStringT(data));
|
|
} // processingInstruction
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::elementDeclaration(const XML_Char* name,
|
|
const XML_Content* model)
|
|
{
|
|
if(!declHandler_)
|
|
return;
|
|
|
|
std::ostringstream os;
|
|
convertXML_Content(os, model);
|
|
declHandler_->elementDecl(SA_.makeStringT(name), SA_.makeStringT(os.str().c_str()));
|
|
} // elementDeclaration
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::convertXML_Content(std::ostream& os, const XML_Content* model, bool isChild)
|
|
{
|
|
/*
|
|
enum XML_Content_Type {
|
|
XML_CTYPE_EMPTY = 1,
|
|
XML_CTYPE_ANY,
|
|
XML_CTYPE_MIXED,
|
|
XML_CTYPE_NAME,
|
|
XML_CTYPE_CHOICE,
|
|
XML_CTYPE_SEQ
|
|
};
|
|
|
|
enum XML_Content_Quant {
|
|
XML_CQUANT_NONE,
|
|
XML_CQUANT_OPT,
|
|
XML_CQUANT_REP,
|
|
XML_CQUANT_PLUS
|
|
};
|
|
|
|
If type == XML_CTYPE_EMPTY or XML_CTYPE_ANY, then quant will be
|
|
XML_CQUANT_NONE, and the other fields will be zero or NULL.
|
|
If type == XML_CTYPE_MIXED, then quant will be NONE or REP and
|
|
numchildren will contain number of elements that may be mixed in
|
|
and children point to an array of XML_Content cells that will be
|
|
all of XML_CTYPE_NAME type with no quantification.
|
|
|
|
If type == XML_CTYPE_NAME, then the name points to the name, and
|
|
the numchildren field will be zero and children will be NULL. The
|
|
quant fields indicates any quantifiers placed on the name.
|
|
|
|
CHOICE and SEQ will have name NULL, the number of children in
|
|
numchildren and children will point, recursively, to an array
|
|
of XML_Content cells.
|
|
|
|
The EMPTY, ANY, and MIXED types will only occur at top level.
|
|
|
|
typedef struct XML_cp XML_Content;
|
|
|
|
struct XML_cp {
|
|
enum XML_Content_Type type;
|
|
enum XML_Content_Quant quant;
|
|
const XML_Char * name;
|
|
unsigned int numchildren;
|
|
XML_Content * children;
|
|
};
|
|
*/
|
|
char concatenator = ' ';
|
|
|
|
switch(model->type)
|
|
{
|
|
case XML_CTYPE_EMPTY:
|
|
os << "EMPTY";
|
|
break;
|
|
case XML_CTYPE_ANY:
|
|
os << "ANY";
|
|
break;
|
|
case XML_CTYPE_MIXED:
|
|
if(model->numchildren == 0)
|
|
os << "(#PCDATA)";
|
|
else
|
|
os << "(#PCDATA";
|
|
concatenator = '|';
|
|
break;
|
|
case XML_CTYPE_NAME:
|
|
if(!isChild)
|
|
os << '(' << model->name << ')';
|
|
else
|
|
os << model->name;
|
|
break;
|
|
case XML_CTYPE_CHOICE:
|
|
concatenator = '|';
|
|
break;
|
|
case XML_CTYPE_SEQ:
|
|
concatenator = ',';
|
|
break;
|
|
} // switch
|
|
|
|
// do children here
|
|
if(model->numchildren)
|
|
{
|
|
if(model->type != XML_CTYPE_MIXED)
|
|
os << '(';
|
|
|
|
for(unsigned int i = 0; i < model->numchildren; ++i)
|
|
{
|
|
if(i != 0)
|
|
os << concatenator;
|
|
convertXML_Content(os, &(model->children[i]), true);
|
|
} // for ...
|
|
|
|
os << ')';
|
|
} // if ...
|
|
|
|
switch(model->quant)
|
|
{
|
|
case XML_CQUANT_NONE:
|
|
break;
|
|
case XML_CQUANT_OPT:
|
|
os << "?";
|
|
break;
|
|
case XML_CQUANT_REP:
|
|
os << "*";
|
|
break;
|
|
case XML_CQUANT_PLUS:
|
|
os << "+";
|
|
break;
|
|
} // switch
|
|
} // convertXML_Content
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::attListDeclaration(const XML_Char* elname,
|
|
const XML_Char* attname,
|
|
const XML_Char* att_type,
|
|
const XML_Char* dflt,
|
|
int isrequired)
|
|
{
|
|
/* The Attlist declaration handler is called for *each* attribute. So
|
|
a single Attlist declaration with multiple attributes declared will
|
|
generate multiple calls to this handler. The "default" parameter
|
|
may be NULL in the case of the "#IMPLIED" or "#REQUIRED" keyword.
|
|
The "isrequired" parameter will be true and the default value will
|
|
be NULL in the case of "#REQUIRED". If "isrequired" is true and
|
|
default is non-NULL, then this is a "#FIXED" default. */
|
|
if(declHandler_)
|
|
{
|
|
const stringT* defType = &attrDefaults_.implied;
|
|
if(isrequired)
|
|
defType = dflt ? &attrDefaults_.fixed : &attrDefaults_.required;
|
|
declHandler_->attributeDecl(SA_.makeStringT(elname),
|
|
SA_.makeStringT(attname),
|
|
SA_.makeStringT(att_type),
|
|
*defType,
|
|
SA_.makeStringT(dflt));
|
|
}
|
|
} // attListDeclaration
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::entityDeclaration(const XML_Char* entityName,
|
|
int is_parameter_entity,
|
|
const XML_Char* value,
|
|
int value_length,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId,
|
|
const XML_Char* notationName)
|
|
{
|
|
/* For internal entities (<!ENTITY foo "bar">), value will
|
|
be non-null and systemId, publicID, and notationName will be null.
|
|
The value string is NOT null terminated; the length is provided in
|
|
the value_length argument. Since it is legal to have zero-length
|
|
values, do not use this argument to test for internal entities.
|
|
|
|
For external entities, value will be null and systemId will be non-null.
|
|
The publicId argument will be null unless a public identifier was
|
|
provided. The notationName argument will have a non-null value only
|
|
for unparsed entity declarations. */
|
|
|
|
const stringT s_entityName(SA_.makeStringT(entityName));
|
|
if(!systemId && !publicId && !notationName)
|
|
{
|
|
// internal entity!
|
|
if(declHandler_)
|
|
declHandler_->internalEntityDecl(s_entityName, SA_.makeStringT(value, value_length));
|
|
return;
|
|
}
|
|
|
|
const stringT s_publicId(SA_.makeStringT(publicId));
|
|
const stringT s_systemId(SA_.makeStringT(systemId));
|
|
if(notationName == 0)
|
|
{
|
|
if(declHandler_)
|
|
declHandler_->externalEntityDecl(s_entityName, s_publicId, s_systemId);
|
|
declaredExternalEnts_.insert(std::make_pair(s_publicId, s_entityName));
|
|
declaredExternalEnts_.insert(std::make_pair(s_systemId, s_entityName));
|
|
}
|
|
else
|
|
{
|
|
if(dtdHandler_)
|
|
dtdHandler_->unparsedEntityDecl(s_entityName, s_publicId, s_systemId, SA_.makeStringT(notationName));
|
|
}
|
|
} // entityDeclaration
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::notationDeclaration(const XML_Char* notationName,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId)
|
|
{
|
|
if(!dtdHandler_)
|
|
return;
|
|
dtdHandler_->notationDecl(SA_.makeStringT(notationName),
|
|
SA_.makeStringT(publicId),
|
|
SA_.makeStringT(systemId));
|
|
} // notationDeclaration
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::startDoctypeDecl(const XML_Char *doctypeName,
|
|
const XML_Char *systemId,
|
|
const XML_Char *publicId,
|
|
int has_internal_subset)
|
|
{
|
|
if(!lexicalHandler_)
|
|
return;
|
|
|
|
stringT s_publicId = SA_.makeStringT(publicId);
|
|
stringT s_systemId = SA_.makeStringT(systemId);
|
|
stringT dtd = SA_.makeStringT("[dtd]");
|
|
declaredExternalEnts_.insert(std::make_pair(s_publicId, dtd));
|
|
declaredExternalEnts_.insert(std::make_pair(s_systemId, dtd));
|
|
lexicalHandler_->startDTD(SA_.makeStringT(doctypeName),
|
|
s_publicId,
|
|
s_systemId);
|
|
} // startDoctypeDecl
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::endDoctypeDecl()
|
|
{
|
|
if(lexicalHandler_)
|
|
lexicalHandler_->endDTD();
|
|
} // endDoctypeDecl
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::startCdataSection()
|
|
{
|
|
if(lexicalHandler_)
|
|
lexicalHandler_->startCDATA();
|
|
} // startCdataSection
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::endCdataSection()
|
|
{
|
|
if(lexicalHandler_)
|
|
lexicalHandler_->endCDATA();
|
|
} // endCdataSection
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
void expat_wrapper<stringT, string_adaptorT>::commentHandler(const XML_Char *data)
|
|
{
|
|
if(lexicalHandler_)
|
|
lexicalHandler_->comment(SA_.makeStringT(data));
|
|
} // commentHandler
|
|
|
|
template<class stringT, class string_adaptorT>
|
|
int expat_wrapper<stringT, string_adaptorT>::externalEntityRefHandler(XML_Parser parser,
|
|
const XML_Char* context,
|
|
const XML_Char* base,
|
|
const XML_Char* systemId,
|
|
const XML_Char* publicId)
|
|
{
|
|
stringT pubId(SA_.makeStringT(publicId));
|
|
stringT sysId(SA_.makeStringT(systemId));
|
|
|
|
stringT entityName;
|
|
if(systemId)
|
|
entityName = declaredExternalEnts_[sysId];
|
|
else if(publicId)
|
|
entityName = declaredExternalEnts_[pubId];
|
|
|
|
if(!externalResolving_)
|
|
{
|
|
if(!entityName.empty() && contentHandler_)
|
|
contentHandler_->skippedEntity(entityName);
|
|
|
|
return 1;
|
|
} // if ...
|
|
|
|
////////////////////////////////////////////////////////
|
|
// resolve external entity
|
|
if(!entityName.empty() && lexicalHandler_)
|
|
lexicalHandler_->startEntity(entityName);
|
|
|
|
inputSourceT source;
|
|
if(entityResolver_)
|
|
{
|
|
source = entityResolver_->resolveEntity(pubId, sysId);
|
|
if(source.getPublicId().empty() && source.getSystemId().empty())
|
|
{
|
|
source.setPublicId(pubId);
|
|
source.setSystemId(sysId);
|
|
} // if ...
|
|
}
|
|
else
|
|
{
|
|
source.setPublicId(pubId);
|
|
source.setSystemId(sysId);
|
|
} // if ...
|
|
|
|
XML_Parser externalParser = XML_ExternalEntityParserCreate(parser, context, 0);
|
|
|
|
bool ok = do_parse(source, externalParser);
|
|
|
|
XML_ParserFree(externalParser);
|
|
|
|
if(!entityName.empty() && lexicalHandler_)
|
|
lexicalHandler_->endEntity(entityName);
|
|
|
|
return ok;
|
|
} // externalEntityRefHandler
|
|
|
|
}; // namespace SAX
|
|
|
|
#endif
|
|
// end of file
|