#ifndef ARABICA_INPUTSOURCE_H #define ARABICA_INPUTSOURCE_H // InputSource.h // $Id$ #include #include #include namespace SAX { /** * A single input source for an XML entity. * *

This class allows a SAX application to encapsulate information * about an input source in a single object, which may include * a public identifier, a system identifier, a byte stream (possibly * with a specified encoding), and/or a character stream.

* *

There are two places that the application will deliver this * input source to the parser: as the argument to the Parser.parse * method, or as the return value of the EntityResolver.resolveEntity * method.

* *

The SAX parser will use the InputSource object to determine how * to read XML input. If there is a character stream available, the * parser will read that stream directly; if not, the parser will use * a byte stream, if available; if neither a character stream nor a * byte stream is available, the parser will attempt to open a URI * connection to the resource identified by the system * identifier.

* *

An InputSource object belongs to the application: the SAX parser * shall never modify it in any way (it may modify a copy if * necessary).

* * InputSource is still under active consideration, and its * interface may change. * * @since SAX 1.0 * @author Jez Higgins, * jez@jezuk.co.uk * @version 2.0 * @see basic_Parser#parse * @see basic_EntityResolver#resolveEntity */ template class basic_InputSource { public: typedef string_type stringT; /** * Zero-argument default constructor. * * @see #setPublicId * @see #setSystemId * @see #setByteStream * @see #setEncoding */ basic_InputSource() : byteStream_(0) { } /** * Create a new input source with a system identifier. * *

Applications may use setPublicId to include a * public identifier as well, or setEncoding to specify * the character encoding, if known.

* *

If the system identifier is a URL, it must be full resolved.

* * @param systemId The system identifier (URI). * @see #setPublicId * @see #setSystemId * @see #setByteStream * @see #setEncoding * @see #setCharacterStream */ basic_InputSource(const stringT& systemId) : systemId_(systemId), byteStream_(0) { } basic_InputSource(const basic_InputSource& rhs) : publicId_(rhs.publicId_), systemId_(rhs.systemId_), byteStream_(rhs.byteStream_) { } /** * Create a new input source with a byte stream. * *

Application writers may use setSystemId to provide a base * for resolving relative URIs, setPublicId to include a * public identifier, and/or setEncoding to specify the object's * character encoding.

* * @param byteStream The raw byte stream containing the document. * @see #setPublicId * @see #setSystemId * @see #setEncoding * @see #setByteStream * @see #setCharacterStream */ basic_InputSource(std::istream& byteStream) : byteStream_(&byteStream) { } virtual ~basic_InputSource() { } basic_InputSource& operator=(const basic_InputSource& rhs) { publicId_ = rhs.publicId_; systemId_ = rhs.systemId_; byteStream_ = rhs.byteStream_; return *this; } // operator= /** * Set the public identifier for this input source. * *

The public identifier is always optional: if the application * writer includes one, it will be provided as part of the * location information.

* * @param publicId The public identifier as a string. * @see #getPublicId * @see basic_Locator#getPublicId * @see basic_SAXParseException#getPublicId */ void setPublicId(const stringT& publicId) { publicId_ = publicId; } /** * Get the public identifier for this input source. * * @return The public identifier, or an empty string if none was supplied. * @see #setPublicId */ const stringT& getPublicId() const { return publicId_; } /** * Set the system identifier for this input source. * *

The system identifier is optional if there is a byte stream * or a character stream, but it is still useful to provide one, * since the application can use it to resolve relative URIs * and can include it in error messages and warnings (the parser * will attempt to open a connection to the URI only if * there is no byte stream or character stream specified).

* *

If the application knows the character encoding of the * object pointed to by the system identifier, it can register * the encoding using the setEncoding method.

* *

If the system ID is a URL, it must be fully resolved.

* * @param systemId The system identifier as a string. * @see #setEncoding * @see #getSystemId * @see basic_Locator#getSystemId * @see basic_SAXParseException#getSystemId */ void setSystemId(const stringT& systemId) { systemId_ = systemId; } /** * Get the system identifier for this input source. * *

The getEncoding method will return the character encoding * of the object pointed to, or an empty string if unknown.

* *

If the system ID is a URL, it will be fully resolved.

* * @return The system identifier. * @see #setSystemId * @see #getEncoding */ const stringT& getSystemId() const { return systemId_; } /** * Set the byte stream for this input source. * *

The SAX parser will ignore this if there is also a character * stream specified, but it will use a byte stream in preference * to opening a URI connection itself.

* *

If the application knows the character encoding of the * byte stream, it should set it with the setEncoding method.

* * @param byteStream A byte stream containing an XML document or * other entity. * @see #setEncoding * @see #getByteStream * @see #getEncoding */ void setByteStream(std::istream& byteStream) { byteStream_ = &byteStream; } // setByteStream /** * Get the byte stream for this input source. * *

The getEncoding method will return the character * encoding for this byte stream, or null if unknown.

* * @return The byte stream, or null if none was supplied. * @see #getEncoding * @see #setByteStream */ std::istream* getByteStream() const { return byteStream_ ;} /** * Set the character encoding, if known. * *

The encoding must be a string acceptable for an * XML encoding declaration (see section 4.3.3 of the XML 1.0 * recommendation).

* *

This method has no effect when the application provides a * character stream.

* * @param encoding A string describing the character encoding. * @see #setSystemId * @see #setByteStream * @see #getEncoding */ void setEncoding(const stringT& encoding) { encoding_ = encoding; } /** * Get the character encoding for a byte stream or URI. * * @return The encoding, or an empty string if none was supplied. * @see #setByteStream * @see #getSystemId * @see #getByteStream */ const stringT& getEncoding() const { return encoding_; } /////////////////////////////////////////////////////////// private: stringT publicId_; stringT systemId_; std::istream* byteStream_; stringT encoding_; bool operator==(const basic_InputSource&); // no implementation }; // class basic_InputSource /* char specialization template<> basic_InputSource::basic_InputSource(std::istream& byteStream) : byteStream_(&byteStream), charStream_(&byteStream) { } // basic_InputSource template<> basic_InputSource::basic_InputSource(charStreamT& charStream, bool) : byteStream_(&charStream), charStream_(&charStream) { } // basic_InputSource template<> void basic_InputSource::setByteStream(std::istream& byteStream) { byteStream_ = &byteStream; charStream_ = &byteStream; } // setByteStream template<> void basic_InputSource::setCharacterStream(charStreamT& charStream) { byteStream_ = &charStream; charStream_ = &charStream; } // setCharStream */ /* // wchar_t specializations template<> basic_InputSource::basic_InputSource(std::istream& byteStream) : byteStream_(&byteStream), charStream_(0) { } // basic_InputStream template<> basic_InputSource::basic_InputSource(charStreamT& charStream, bool) : byteStream_(0), charStream_(&charStream) { } // basic_InputStream ///////////////////////////// template void basic_InputSource::setByteStream(std::istream& byteStream) { byteStream_ = &byteStream; charStream_ = 0; } // setByteStream template void basic_InputSource::setCharacterStream(charStreamT& charStream) { byteStream_ = 0; charStream_ = &charStream; } // setCharStream */ typedef basic_InputSource InputSource; #ifndef ARABICA_NO_WCHAR_T typedef basic_InputSource wInputSource; #endif }; // namespace SAX #endif // #define InputSourceH // end of file