2003-09-02 11:23:52 +00:00
|
|
|
#ifndef ARABICA_UTF8UCS2_CODECVT_H
|
|
|
|
#define ARABICA_UTF8UCS2_CODECVT_H
|
2002-06-21 11:16:28 +00:00
|
|
|
//---------------------------------------------------------------------------
|
2003-09-02 11:23:52 +00:00
|
|
|
// class utf8ucs2codecvt
|
2002-06-21 11:16:28 +00:00
|
|
|
// This facet converts between Unicode (UCS-2) wchar_ts and
// chars holding the UTF-8 encoding, in both directions.
|
|
|
|
//
|
|
|
|
// For the full guff on codecvts see section 22.2.1.5 of
|
|
|
|
// The C++ Standard (ISO/IEC 14882 to be pedantic).
|
|
|
|
//
|
|
|
|
// I got my information about UTF-8 from RFC 2044.
|
|
|
|
//---------------------------------------------------------------------------
|
2007-09-04 22:55:47 +00:00
|
|
|
#include <SAX/ArabicaConfig.hpp>
|
2003-09-12 23:33:19 +00:00
|
|
|
|
2008-08-06 22:31:39 +01:00
|
|
|
#ifndef ARABICA_NO_WCHAR_T
|
|
|
|
#include <Arabica/mbstate.hpp>
|
2002-06-21 11:16:28 +00:00
|
|
|
#include <locale>
|
|
|
|
|
2003-09-12 23:15:14 +00:00
|
|
|
#ifndef ARABICA_NO_CODECVT_SPECIALISATIONS
|
2007-09-19 17:30:48 +00:00
|
|
|
#include <convert/impl/codecvt_specialisations.hpp>
|
2003-09-12 23:15:14 +00:00
|
|
|
#endif
|
|
|
|
|
2003-09-11 14:05:18 +00:00
|
|
|
namespace Arabica
|
|
|
|
{
|
|
|
|
namespace convert
|
|
|
|
{
|
|
|
|
|
2003-09-02 11:23:52 +00:00
|
|
|
// Code conversion facet whose internal character type is wchar_t and whose
// external character type is char.  According to this file's header comment
// the wchar_t side holds UCS-2 and the char side holds UTF-8.
//
// Only the trivial members are defined inline here; do_out, do_in,
// do_unshift and the const-state do_length are declared here and defined
// out of line.
class utf8ucs2codecvt : public std::codecvt<wchar_t, char, std::mbstate_t>
{
protected:
  // Protected destructor: client code cannot destroy an instance directly.
  virtual ~utf8ucs2codecvt() { }

  // Internal (wchar_t) to external (char) conversion.
  //   from, from_end - input range of wchar_t
  //   from_next      - out: position reached in the input
  //   to, to_limit   - output buffer of char
  //   to_next        - out: position reached in the output
  virtual result do_out(std::mbstate_t&,
                        const wchar_t* from,
                        const wchar_t* from_end,
                        const wchar_t*& from_next,
                        char* to,
                        char* to_limit,
                        char*& to_next) const;

  // External (char) to internal (wchar_t) conversion.
  //   from, from_end - input range of char
  //   from_next      - out: position reached in the input
  //   to, to_limit   - output buffer of wchar_t
  //   to_next        - out: position reached in the output
  virtual result do_in(std::mbstate_t&,
                       const char* from,
                       const char* from_end,
                       const char*& from_next,
                       wchar_t* to,
                       wchar_t* to_limit,
                       wchar_t*& to_next) const;

  // Hook for writing any characters needed to terminate a sequence.
  virtual result do_unshift(std::mbstate_t&,
                            char*,
                            char*,
                            char*&) const;

  // 0 is the value std::codecvt defines for an external encoding that uses
  // a variable number of chars per internal character.
  virtual int do_encoding() const throw() { return 0; }

  // A conversion is always required; input is never passed through as-is.
  virtual bool do_always_noconv() const throw() { return false; }

  // Length calculation over [from, end), bounded by max.  This is the
  // historical signature taking the state by const reference; it is kept
  // unchanged because its definition lives outside this header.
  virtual int do_length(const std::mbstate_t&,
                        const char* from,
                        const char* end,
                        size_t max) const throw();

  // The C++ Standard declares std::codecvt::do_length with a non-const
  // state reference.  On libraries that follow it, the const-reference
  // declaration above does not override the base-class virtual, so calls
  // made through codecvt::length() would never reach this facet.  This
  // override has the standard signature and forwards to the declaration
  // above.  On a library whose base class still takes a const reference
  // this is simply an extra, unused overload.
  virtual int do_length(std::mbstate_t& state,
                        const char* from,
                        const char* end,
                        size_t max) const
  {
    // Binding to a const reference selects the const-state overload, so
    // this call cannot recurse into itself.  The call is left unqualified
    // so that it is still dispatched virtually.
    const std::mbstate_t& const_state = state;
    return do_length(const_state, from, end, max);
  }

  // Upper bound on the number of chars produced for one wchar_t.
  // NOTE(review): 3 is the longest UTF-8 sequence for a 16-bit value;
  // confirm the out-of-line do_out never emits longer sequences.
  virtual int do_max_length() const throw() { return 3; }
}; // class utf8ucs2codecvt
|
2002-06-21 11:16:28 +00:00
|
|
|
|
2003-09-11 14:05:18 +00:00
|
|
|
} // namespace convert
|
|
|
|
} // namespace Arabica
|
|
|
|
|
2003-09-12 23:33:19 +00:00
|
|
|
#endif
|
2003-09-12 23:15:14 +00:00
|
|
|
#endif
|