#ifndef ARABICA_DEFAULT_HANDLER_H #define ARABICA_DEFAULT_HANDLER_H // DefaultHandler.h // $Id$ #include #include #include #include #include #include #include #include #include #include #include namespace SAX { /** * Default base class for SAX2 event handlers. * *

This class is available as a convenience base class for SAX2 * applications: it provides default implementations for all of the * callbacks in the four core SAX2 handler classes:

* *
    *
  • {@link basic_EntityResolver EntityResolver}
  • *
  • {@link basic_DTDHandler DTDHandler}
  • *
  • {@link basic_ContentHandler ContentHandler}
  • *
  • {@link ErrorHandler ErrorHandler}
  • *
* *

Application writers can extend this class when they need to * implement only part of an interface; parser writers can * instantiate this class to provide default handlers when the * application has not supplied its own.

* *

This class replaces the deprecated SAX1 * {@link basic_HandlerBase HandlerBase} class.

* * @since SAX 2.0 * @author Jez Higgins, * jez@jezuk.co.uk * @version 2.0 * @see basic_EntityResolver * @see basic_DTDHandler * @see basic_ContentHandler * @see basic_ErrorHandler */ template class basic_DefaultHandler : public basic_EntityResolver, public basic_DTDHandler, public basic_ContentHandler, public basic_ErrorHandler, public basic_LexicalHandler, public basic_DeclHandler { public: typedef string_type stringT; typedef basic_InputSource InputSourceT; typedef basic_Locator LocatorT; typedef basic_Attributes AttributesT; typedef basic_SAXParseException SAXParseExceptionT; basic_DefaultHandler() { } virtual ~basic_DefaultHandler() { } ////////////////////////////////////////////// // EntityResolver /** * Resolve an external entity. * *

Always return a default-constructed InputSourceT, so that * the parser will use the system identifier provided in the XML document. * This method implements the SAX default behaviour: application writers can * override it in a subclass to do special translations such as catalog * lookups or URI redirection.

* * @param publicId The public identifer, or an empty string if none is * available. * @param systemId The system identifier provided in the XML * document. * @return The new input source, (empty to require the * default behaviour). * @exception SAXException Any SAX exception. * @see basic_EntityResolver#resolveEntity */ virtual InputSourceT resolveEntity(const stringT& /* publicId */, const stringT& /* systemId */) { return InputSourceT(); } // resolveEntity ////////////////////////////////////////////// // DTDHandler /** * Receive notification of a notation declaration. * *

By default, do nothing. Application writers may override this * method in a subclass if they wish to keep track of the notations * declared in a document.

* * @param name The notation name. * @param publicId The notation public identifier, or an empty string if not * available. * @param systemId The notation system identifier. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_DTDHandler#notationDecl */ virtual void notationDecl(const stringT& /* name */, const stringT& /* publicId */, const stringT& /* systemId */) { } // notationDecl /** * Receive notification of an unparsed entity declaration. * *

By default, do nothing. Application writers may override this * method in a subclass to keep track of the unparsed entities * declared in a document.

* * @param name The entity name. * @param publicId The entity public identifier, or an empty string if not * available. * @param systemId The entity system identifier. * @param notationName The name of the associated notation. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_DTDHandler#unparsedEntityDecl */ virtual void unparsedEntityDecl(const stringT& /* name */, const stringT& /* publicId */, const stringT& /* systemId */, const stringT& /* notationName */) { } // unparsedEntityDecl //////////////////////////////////////////////////// // ContentHandler /** * Receive a Locator object for document events. * *

By default, do nothing. Application writers may override this * method in a subclass if they wish to store the locator for use * with other document events.

* * @param locator A locator for all SAX document events. * @see basic_ContentHandler#setDocumentLocator * @see basic_Locator */ virtual void setDocumentLocator(const LocatorT& /* locator */) { } /** * Receive notification of the beginning of the document. * *

By default, do nothing. Application writers may override this * method in a subclass to take specific actions at the beginning * of a document (such as allocating the root node of a tree or * creating an output file).

* * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ContentHandler#startDocument */ virtual void startDocument() { } /** * Receive notification of the end of the document. * *

By default, do nothing. Application writers may override this * method in a subclass to take specific actions at the end * of a document (such as finalising a tree or closing an output * file).

* * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ContentHandler#endDocument */ virtual void endDocument() { } /** * Receive notification of the start of a Namespace mapping. * *

By default, do nothing. Application writers may override this * method in a subclass to take specific actions at the start of * each Namespace prefix scope (such as storing the prefix mapping).

* * @param prefix The Namespace prefix being declared. * @param uri The Namespace URI mapped to the prefix. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ContentHandler#startPrefixMapping */ virtual void startPrefixMapping(const stringT& /* prefix */, const stringT& /* uri */) { } /** * Receive notification of the end of a Namespace mapping. * *

By default, do nothing. Application writers may override this * method in a subclass to take specific actions at the end of * each prefix mapping.

* * @param prefix The Namespace prefix being declared. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ContentHandler#endPrefixMapping */ virtual void endPrefixMapping(const stringT& /* prefix */) { } /** * Receive notification of the start of an element. * *

By default, do nothing. Application writers may override this * method in a subclass to take specific actions at the start of * each element (such as allocating a new tree node or writing * output to a file).

* * @param namespaceURI The Namespace URI, or the empty string if the element * has no Namespace URI or if Namespace processing is not * being performed. * @param localName The local name (without prefix), or the empty string if * Namespace processing is not being performed. * @param qName The qualified name (with prefix), or the empty string if * qualified names are not available. * @param atts The attributes attached to the element. If there are no * attributes, it shall be an empty Attributes object. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ContentHandler#startElement */ virtual void startElement(const stringT& /* namespaceURI */, const stringT& /* localName */, const stringT& /* qName */, const AttributesT& /* atts */) { } /** * Receive notification of the end of an element. * *

By default, do nothing. Application writers may override this * method in a subclass to take specific actions at the end of * each element (such as finalising a tree node or writing * output to a file).

* * @param namespaceURI The Namespace URI, or the empty string if the element * has no Namespace URI or if Namespace processing is not * being performed. * @param localName The local name (without prefix), or the empty string if * Namespace processing is not being performed. * @param qName The qualified name (with prefix), or the empty string if * qualified names are not available. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ContentHandler#endElement */ virtual void endElement(const stringT& /* namespaceURI */, const stringT& /* localName */, const stringT& /* qName */) { } /** * Receive notification of character data inside an element. * *

By default, do nothing. Application writers may override this * method to take specific actions for each chunk of character data * (such as adding the data to a node or buffer, or printing it to * a file).

* * @param ch The characters. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ContentHandler#characters */ virtual void characters(const stringT& /* ch */) { } /** * Receive notification of ignorable whitespace in element content. * *

By default, do nothing. Application writers may override this * method to take specific actions for each chunk of ignorable * whitespace (such as adding data to a node or buffer, or printing * it to a file).

* * @param ch The whitespace characters. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ContentHandler#ignorableWhitespace */ virtual void ignorableWhitespace(const stringT& /* ch */) { } /** * Receive notification of a processing instruction. * *

By default, do nothing. Application writers may override this * method in a subclass to take specific actions for each * processing instruction, such as setting status variables or * invoking other methods.

* * @param target The processing instruction target. * @param data The processing instruction data, or an empty string if * none is supplied. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ContentHandler#processingInstruction */ virtual void processingInstruction(const stringT& /* target */, const stringT& /* data */) { } /** * Receive notification of a skipped entity. * *

By default, do nothing. Application writers may override this * method in a subclass to take specific actions for each * processing instruction, such as setting status variables or * invoking other methods.

* * @param name The name of the skipped entity. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ContentHandler#processingInstruction */ virtual void skippedEntity(const stringT& /* name */) { } ///////////////////////////////////////////////////// // ErrorHandler /** * Receive notification of a parser warning. * *

The default implementation does nothing. Application writers * may override this method in a subclass to take specific actions * for each warning, such as inserting the message in a log file or * printing it to the console.

* * @param e The warning information encoded as an exception. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ErrorHandler#warning * @see SAXParseException */ virtual void warning(const SAXParseExceptionT& /* e */) { } /** * Receive notification of a recoverable parser error. * *

The default implementation does nothing. Application writers * may override this method in a subclass to take specific actions * for each error, such as inserting the message in a log file or * printing it to the console.

* * @param e The warning information encoded as an exception. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ErrorHandler#error * @see SAXParseException */ virtual void error(const SAXParseExceptionT& /* e */) { } /** * Report a fatal XML parsing error. * *

The default implementation throws a SAXParseException. * Application writers may override this method in a subclass if * they need to take specific actions for each fatal error (such as * collecting all of the errors into a single report): in any case, * the application must stop all regular processing when this * method is invoked, since the document is no longer reliable, and * the parser may no longer report parsing events.

* * @param e The error information encoded as an exception. * @exception SAXException Any SAX exception, possibly * wrapping another exception. * @see basic_ErrorHandler#fatalError * @see SAXParseException */ virtual void fatalError(const SAXParseExceptionT& e) { throw SAXParseExceptionT(e); // VS.NET refuses throw e; saying the copy constructor is inaccessible // GCC likes throw e; // one of them, I presume, is wrong } // fatalError ////////////////////////////////////////////////////////// // LexicalHandler /** * Report the start of DTD declarations, if any. * *

This method is intended to report the beginning of the * DOCTYPE declaration; if the document has no DOCTYPE declaration, * this method will not be invoked.

* *

All declarations reported through * {@link basic_DTDHandler DTDHandler} or * {@link basic_DeclHandler DeclHandler} events must appear * between the startDTD and {@link #endDTD endDTD} events. * Declarations are assumed to belong to the internal DTD subset * unless they appear between {@link #startEntity startEntity} * and {@link #endEntity endEntity} events. Comments and * processing instructions from the DTD should also be reported * between the startDTD and endDTD events, in their original * order of (logical) occurrence; they are not required to * appear in their correct locations relative to DTDHandler * or DeclHandler events, however.

* *

Note that the start/endDTD events will appear within * the start/endDocument events from ContentHandler and * before the first * {@link basic_ContentHandler#startElement startElement} * event.

* * @param name The document type name. * @param publicId The declared public identifier for the * external DTD subset, or an empty string if none was declared. * @param systemId The declared system identifier for the * external DTD subset, or an empty string if none was declared. * @see #endDTD * @see #startEntity */ virtual void startDTD(const stringT& name, const stringT& publicId, const stringT& systemId) { } /** * Report the end of DTD declarations. * *

This method is intended to report the end of the * DOCTYPE declaration; if the document has no DOCTYPE declaration, * this method will not be invoked.

* * @see #startDTD */ virtual void endDTD() { } /** * Report the beginning of some internal and external XML entities. * *

The reporting of parameter entities (including * the external DTD subset) is optional, and SAX2 drivers that * support LexicalHandler may not support it; you can use the * http://xml.org/sax/features/lexical-handler/parameter-entities * feature to query or control the reporting of parameter entities.

* *

General entities are reported with their regular names, * parameter entities have '%' prepended to their names, and * the external DTD subset has the pseudo-entity name "[dtd]".

* *

When a SAX2 driver is providing these events, all other * events must be properly nested within start/end entity * events. There is no additional requirement that events from * {@link basic_DeclHandler DeclHandler} or * {@link basic_DTDHandler DTDHandler} be properly ordered.

* *

Note that skipped entities will be reported through the * {@link basic_ContentHandler#skippedEntity skippedEntity} * event, which is part of the ContentHandler interface.

* *

Because of the streaming event model that SAX uses, some * entity boundaries cannot be reported under any * circumstances:

* *
    *
  • general entities within attribute values
  • *
  • parameter entities within declarations
  • *
* *

These will be silently expanded, with no indication of where * the original entity boundaries were.

* *

Note also that the boundaries of character references (which * are not really entities anyway) are not reported.

* *

All start/endEntity events must be properly nested. * * @param name The name of the entity. If it is a parameter * entity, the name will begin with '%', and if it is the * external DTD subset, it will be "[dtd]". * @see #endEntity * @see basic_DeclHandler#internalEntityDecl * @see basic_DeclHandler#externalEntityDecl */ virtual void startEntity(const stringT& name) { } /** * Report the end of an entity. * * @param name The name of the entity that is ending. * @see #startEntity */ virtual void endEntity(const stringT& name) { } /** * Report the start of a CDATA section. * *

The contents of the CDATA section will be reported through * the regular {@link basic_ContentHandler#characters * characters} event; this event is intended only to report * the boundary.

* * @see #endCDATA */ virtual void startCDATA() { } /** * Report the end of a CDATA section. * * @see #startCDATA */ virtual void endCDATA() { } /** * Report an XML comment anywhere in the document. * *

This callback will be used for comments inside or outside the * document element, including comments in the external DTD * subset (if read). Comments in the DTD must be properly * nested inside start/endDTD and start/endEntity events (if * used).

* * @param text A string holding the comment. */ virtual void comment(const stringT& text) { } //////////////////////////////////////////////////////////// // DeclHandler /** * Report an element type declaration. * *

The content model will consist of the string "EMPTY", the * string "ANY", or a parenthesised group, optionally followed * by an occurrence indicator. The model will be normalized so * that all parameter entities are fully resolved and all whitespace * is removed,and will include the enclosing parentheses. Other * normalization (such as removing redundant parentheses or * simplifying occurrence indicators) is at the discretion of the * parser.

* * @param name The element type name. * @param model The content model as a normalized string. */ virtual void elementDecl(const stringT& name, const stringT& model) { } /** * Report an attribute type declaration. * *

Only the effective (first) declaration for an attribute will * be reported. The type will be one of the strings "CDATA", * "ID", "IDREF", "IDREFS", "NMTOKEN", "NMTOKENS", "ENTITY", * "ENTITIES", a parenthesized token group with * the separator "|" and all whitespace removed, or the word * "NOTATION" followed by a space followed by a parenthesized * token group with all whitespace removed.

* *

Any parameter entities in the attribute value will be * expanded, but general entities will not.

* * @param elementName The name of the associated element. * @param attributeName The name of the attribute. * @param type A string representing the attribute type. * @param valueDefault A string representing the attribute default * ("#IMPLIED", "#REQUIRED", or "#FIXED") or empty string if * none of these applies. * @param value A string representing the attribute's default value, * or empty string if there is none. */ virtual void attributeDecl(const stringT& elementName, const stringT& attributeName, const stringT& type, const stringT& valueDefault, const stringT& value) { } /** * Report an internal entity declaration. * *

Only the effective (first) declaration for each entity * will be reported. All parameter entities in the value * will be expanded, but general entities will not.

* * @param name The name of the entity. If it is a parameter * entity, the name will begin with '%'. * @param value The replacement text of the entity. * @see #externalEntityDecl * @see basic_DTDHandler#unparsedEntityDecl */ virtual void internalEntityDecl(const stringT& name, const stringT& value) { } /** * Report a parsed external entity declaration. * *

Only the effective (first) declaration for each entity * will be reported.

* * @param name The name of the entity. If it is a parameter * entity, the name will begin with '%'. * @param publicId The declared public identifier of the entity, or * an empty string if none was declared. * @param systemId The declared system identifier of the entity. * @see #internalEntityDecl * @see basic_DTDHandler#unparsedEntityDecl */ virtual void externalEntityDecl(const stringT& name, const stringT& publicId, const stringT& systemId) { } private: basic_DefaultHandler(const basic_DefaultHandler&); basic_DefaultHandler& operator=(const basic_DefaultHandler&); bool operator==(const basic_DefaultHandler&); }; // class basic_DefaultHandler typedef basic_DefaultHandler DefaultHandler; #ifndef ARABICA_NO_WCHAR_T typedef basic_DefaultHandler wDefaultHandler; #endif } // namespace SAX #endif