arabica/Utils/convert_adaptor.h

355 lines
12 KiB
C
Raw Normal View History

2002-06-21 13:16:28 +02:00
#ifndef ARABICA_CONVERT_ADAPTOR_H
#define ARABICA_CONVERT_ADAPTOR_H
//////////////////////////////////////////////////////
//
// $Id$
2003-08-28 14:36:33 +02:00
// Written by Jez Higgins <jez@jezuk.co.uk>
// Copyright 1999-2003 Jez UK Ltd, http://www.jezuk.co.uk/
//
// convert_adaptor is a stream that wraps around another stream. This
// may not seem like a big deal, but convert_adaptor applies codecvt
// facets along the way. This allows you to apply encryption or
// decryption (or any other transcoding) transparently. It can
// also adapt wchar_t streams to char streams, or vice versa, allowing
// you to write std::wstrings out as UTF-8 chars to a file, for instance.
2002-06-21 13:16:28 +02:00
//////////////////////////////////////////////////////
#include <locale>
#include <istream>
#include <ostream>
#include <vector>
#include <algorithm>
2003-09-10 17:15:55 +02:00
#include <SAX/ArabicaConfig.h>
2003-09-10 10:48:08 +02:00
#ifdef ARABICA_VS6_WORKAROUND
2003-09-15 18:07:35 +02:00
#include <Utils/impl/VS6Workaround.h>
2002-06-21 13:16:28 +02:00
#endif
2003-09-11 16:05:18 +02:00
namespace Arabica
{
namespace convert
{
2002-06-21 13:16:28 +02:00
template<typename charT,
typename traitsT = std::char_traits<charT>,
typename externalCharT = charT,
typename externalTraitsT = std::char_traits<externalCharT> >
class convert_bufadaptor : public std::basic_streambuf<charT, traitsT>
{
public:
typedef typename traitsT::int_type int_type;
typedef std::basic_streambuf<externalCharT, externalTraitsT> externalStreambufT;
2004-09-20 21:45:51 +02:00
typedef std::basic_streambuf<charT, traitsT> streambufT;
2002-06-21 13:16:28 +02:00
explicit convert_bufadaptor(externalStreambufT& externalbuf) : externalbuf_(&externalbuf), inEof_(false) { }
2002-06-21 13:16:28 +02:00
virtual ~convert_bufadaptor() { }
void set_buffer(externalStreambufT& externalbuf) { externalbuf_ = &externalbuf; inEof_ = false; }
2002-06-21 13:16:28 +02:00
protected:
virtual int_type overflow(int_type c = traitsT::eof());
virtual int sync();
virtual int_type underflow();
virtual int_type pbackfail(int_type c);
private:
2003-10-27 17:09:54 +01:00
typedef typename externalTraitsT::int_type external_int_type;
2002-06-21 13:16:28 +02:00
typedef typename traitsT::state_type state_t;
externalStreambufT* externalbuf_;
2002-06-21 13:16:28 +02:00
std::vector<charT> outBuffer_;
state_t outState_;
std::vector<charT> inBuffer_;
state_t inState_;
bool inEof_;
2002-06-21 13:16:28 +02:00
void growOutBuffer();
bool flushOut();
void growInBuffer();
std::streamsize readIn();
2002-06-21 13:16:28 +02:00
static const std::streamsize bufferSize_;
static const std::streamsize pbSize_;
2002-06-21 13:16:28 +02:00
}; // convert_bufadaptor
template<class charT, class traitsT, class externalCharT, class externalTraitsT>
const std::streamsize convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::bufferSize_ = 1024;
2002-06-21 13:16:28 +02:00
template<class charT, class traitsT, class externalCharT, class externalTraitsT>
const std::streamsize convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::pbSize_ = 4;
2002-06-21 13:16:28 +02:00
// why 4? both Josuttis and Langer&Kreft use 4.
template<class charT, class traitsT, class externalCharT, class externalTraitsT>
typename convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::int_type convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::overflow(int_type c)
2002-06-21 13:16:28 +02:00
{
if(traitsT::eq_int_type(traitsT::eof(), c))
return traitsT::not_eof(c);
growOutBuffer();
sputc(traitsT::to_char_type(c));
return traitsT::not_eof(c);
} // overflow
template<class charT, class traitsT, class externalCharT, class externalTraitsT>
int convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::sync()
{
return flushOut() ? 0 : -1;
} // sync
template<class charT, class traitsT, class externalCharT, class externalTraitsT>
typename convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::int_type convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::underflow()
2002-06-21 13:16:28 +02:00
{
2004-09-20 21:45:51 +02:00
if(streambufT::gptr() != 0 && streambufT::gptr() < streambufT::egptr())
return (traitsT::to_int_type(*streambufT::gptr()));
2002-06-21 13:16:28 +02:00
if(!readIn())
2002-06-21 13:16:28 +02:00
return traitsT::eof();
2004-09-20 21:45:51 +02:00
return traitsT::to_int_type(*streambufT::gptr());
2002-06-21 13:16:28 +02:00
} // underflow
template<class charT, class traitsT, class externalCharT, class externalTraitsT>
typename convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::int_type convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::pbackfail(int_type c)
2002-06-21 13:16:28 +02:00
{
2004-09-20 21:45:51 +02:00
if(streambufT::gptr() == streambufT::eback())
2002-06-21 13:16:28 +02:00
return traitsT::eof();
2004-09-20 21:45:51 +02:00
streambufT::gbump(-1);
2002-06-21 13:16:28 +02:00
if(!traitsT::eq_int_type(c, traitsT::eof()))
2004-09-20 21:45:51 +02:00
*(streambufT::gptr()) = traitsT::to_char_type(c);
2002-06-21 13:16:28 +02:00
return traitsT::not_eof(c);
} // pbackfail
template<class charT, class traitsT, class externalCharT, class externalTraitsT>
void convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::growOutBuffer()
{
size_t oldsize = outBuffer_.capacity();
size_t newsize = (oldsize ? oldsize*2 : bufferSize_);
outBuffer_.resize(newsize);
setp(&outBuffer_[0] + oldsize, &outBuffer_[0] + outBuffer_.capacity());
} // growOutBuffer
template<class charT, class traitsT, class externalCharT, class externalTraitsT>
void convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::growInBuffer()
{
size_t oldsize = inBuffer_.capacity();
size_t newsize = (oldsize ? oldsize*2 : bufferSize_) + pbSize_;
inBuffer_.resize(newsize);
} // growInBuffer
template<class charT, class traitsT, class externalCharT, class externalTraitsT>
bool convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::flushOut()
{
2004-09-20 21:45:51 +02:00
size_t length = streambufT::pptr() - &outBuffer_[0];
2002-06-21 13:16:28 +02:00
if(!length)
return true;
bool ok(true);
const std::codecvt<charT, char, state_t>& cvt =
2003-09-09 15:09:48 +02:00
#ifndef ARABICA_VS6_WORKAROUND
2003-09-10 17:15:55 +02:00
std::use_facet<std::codecvt<charT, char, std::mbstate_t> >(this->getloc());
2002-06-21 13:16:28 +02:00
#else
2003-09-10 17:15:55 +02:00
std::use_facet(this->getloc(), (std::codecvt<charT, char, std::mbstate_t>*)0, true);
2002-06-21 13:16:28 +02:00
#endif
if(cvt.always_noconv())
std::copy(&outBuffer_[0], &outBuffer_[0] + length, std::ostreambuf_iterator<externalCharT>(externalbuf_));
2002-06-21 13:16:28 +02:00
else
{
// we must do code conversion
2003-09-01 13:28:37 +02:00
length += cvt.max_length(); // add a little
2002-06-21 13:16:28 +02:00
std::vector<externalCharT> to(length);
const charT* from_next = &(outBuffer_[0]);
2002-06-21 13:16:28 +02:00
std::codecvt_base::result r;
do
{
externalCharT* to_next;
2004-09-20 21:45:51 +02:00
r = cvt.out(outState_, from_next, streambufT::pptr(), from_next,
2002-06-21 13:16:28 +02:00
&to[0], &to[0]+length, to_next);
if(r == std::codecvt_base::noconv)
{
std::copy(&outBuffer_[0], &outBuffer_[0] + length, std::ostreambuf_iterator<externalCharT>(externalbuf_));
2002-06-21 13:16:28 +02:00
break;
}
std::copy(&to[0], to_next, std::ostreambuf_iterator<externalCharT>(externalbuf_));
2002-06-21 13:16:28 +02:00
}
while(r == std::codecvt_base::partial);
ok = ok ? (r != std::codecvt_base::error) : false;
} // if(cvt.always_noconv())
if(ok)
setp(&outBuffer_[0], &outBuffer_[0] + outBuffer_.capacity());
return ok;
} // flushOut
template<class charT, class traitsT, class externalCharT, class externalTraitsT>
std::streamsize convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT>::readIn()
2002-06-21 13:16:28 +02:00
{
if(!inBuffer_.capacity())
growInBuffer();
2004-09-20 21:45:51 +02:00
size_t pbCount = std::min<size_t>(streambufT::gptr() - streambufT::eback(), pbSize_);
2002-06-21 13:16:28 +02:00
memcpy(&(inBuffer_[0]) + (pbSize_-pbCount)*sizeof(charT),
2004-09-20 21:45:51 +02:00
streambufT::gptr() - pbCount*sizeof(charT),
2002-06-21 13:16:28 +02:00
pbCount*sizeof(charT));
const std::codecvt<charT, char, state_t>& cvt =
2003-09-09 15:09:48 +02:00
#ifndef ARABICA_VS6_WORKAROUND
2003-09-10 17:15:55 +02:00
std::use_facet<std::codecvt<charT, char, std::mbstate_t> >(this->getloc());
2002-06-21 13:16:28 +02:00
#else
std::use_facet(this->getloc(), (std::codecvt<charT, char, std::mbstate_t>*)0, true);
2002-06-21 13:16:28 +02:00
#endif
externalCharT from[1024];
std::streamsize res = 0;
if(!inEof_)
{
2003-10-27 17:09:54 +01:00
external_int_type ec = externalbuf_->sgetc();
while((!externalTraitsT::eq_int_type(externalTraitsT::eof(), ec)) && (res != bufferSize_))
{
from[res++] = static_cast<externalCharT>(ec);
ec = externalbuf_->snextc();
}
inEof_ = (externalTraitsT::eq_int_type(externalTraitsT::eof(), ec));
} // if ...
std::streamsize converted = 0;
2002-06-21 13:16:28 +02:00
if(res > 0)
{
std::codecvt_base::result r;
const externalCharT* from_next = from;
2002-06-21 13:16:28 +02:00
do
{
// can't cache this as may reallocate buffer
charT* const to = &(inBuffer_[0])+pbSize_;
charT* const to_end = &(inBuffer_[0]) + inBuffer_.capacity() - pbSize_;
2002-06-21 13:16:28 +02:00
charT* to_next;
externalCharT* const from_end = from + res;
r = cvt.in(inState_, from_next, from_end, from_next,
to + converted, to_end, to_next);
2002-06-21 13:16:28 +02:00
if(r == std::codecvt_base::noconv)
{
memcpy(&(inBuffer_[0])+pbSize_, from, res);
converted = res;
}
2002-06-21 13:16:28 +02:00
else
converted += static_cast<std::streamsize>(to_next - (to + converted));
2002-06-21 13:16:28 +02:00
if(r == std::codecvt_base::partial)
{
// haven't done everything
if(to_next == to_end)
growInBuffer(); // need more room!
else
{
int shortfall = (from + res) - from_next;
memcpy(from, from_next, shortfall);
res = externalbuf_->sgetn(from + shortfall, static_cast<std::streamsize>(bufferSize_ - shortfall));
from_next = &from[0];
if(res == 0) // oh dear
break; // let's bail!
res += shortfall;
}
} // if(r == std::codecvt_base::partial)
2002-06-21 13:16:28 +02:00
}
while(r == std::codecvt_base::partial);
if(r == std::codecvt_base::error)
{
// couldn't convert - let's bail
return 0;
} // if(r == std::codecvt_base::error)
}
setg(&(inBuffer_[0]) + (pbSize_-pbCount), &(inBuffer_[0])+pbSize_, &(inBuffer_[0])+pbSize_+converted);
2002-06-21 13:16:28 +02:00
return static_cast<int_type>(res);
2002-06-21 13:16:28 +02:00
} // readIn
////////////////////////////////////////////////////
// iconvert_adaptor
template<typename charT, typename traitsT, typename externalCharT, typename externalTraitsT>
class convert_adaptor_buffer
{
protected:
typedef std::basic_streambuf<externalCharT, externalTraitsT> externalStreambufT;
explicit convert_adaptor_buffer(externalStreambufT& externalbuf) : bufadaptor_(externalbuf) { }
convert_bufadaptor<charT, traitsT, externalCharT, externalTraitsT> bufadaptor_;
}; // convert_adaptor_buffer
2002-06-21 13:16:28 +02:00
template<typename charT,
typename traitsT = std::char_traits<charT>,
typename fromCharT = charT,
typename fromTraitsT = std::char_traits<fromCharT> >
class iconvert_adaptor : private convert_adaptor_buffer<charT, traitsT, fromCharT, fromTraitsT>,
public std::basic_istream<charT, traitsT>
2002-06-21 13:16:28 +02:00
{
2004-09-20 21:45:51 +02:00
typedef std::basic_istream<charT, traitsT> baseStreamT;
2002-06-21 13:16:28 +02:00
typedef std::basic_istream<fromCharT, fromTraitsT> fromStreamT;
2004-09-20 21:45:51 +02:00
typedef convert_adaptor_buffer<charT, traitsT, fromCharT, fromTraitsT> baseBufT;
protected:
using baseBufT::bufadaptor_;
2002-06-21 13:16:28 +02:00
public:
explicit iconvert_adaptor(fromStreamT& fromstream) :
2004-09-20 21:45:51 +02:00
baseBufT(*(fromstream.rdbuf())),
baseStreamT(&bufadaptor_)
2002-06-21 13:16:28 +02:00
{
} // iconvert_adaptor
virtual ~iconvert_adaptor() { }
2004-09-20 21:45:51 +02:00
baseBufT* rdbuf() const
2002-06-21 13:16:28 +02:00
{
2004-09-20 21:45:51 +02:00
return const_cast<baseBufT*>(&bufadaptor_);
2002-06-21 13:16:28 +02:00
} // rdbuf
void set_stream(fromStreamT& fromStream) { bufadaptor_.set_buffer(*fromStream.rdbuf()); }
2003-08-28 00:11:54 +02:00
}; // class iconvert_adaptor
2002-06-21 13:16:28 +02:00
2003-09-01 13:28:37 +02:00
////////////////////////////////////////////////////////
// oconvert_adaptor
template<typename charT,
typename traitsT = std::char_traits<charT>,
typename toCharT = charT,
typename toTraitsT = std::char_traits<toCharT> >
class oconvert_adaptor : private convert_adaptor_buffer<charT, traitsT, toCharT, toTraitsT>,
public std::basic_ostream<charT, traitsT>
2003-09-01 13:28:37 +02:00
{
2004-09-20 21:45:51 +02:00
typedef std::basic_ostream<charT, traitsT> baseStreamT;
2003-09-01 13:28:37 +02:00
typedef std::basic_ostream<toCharT, toTraitsT> toStreamT;
2004-09-20 21:45:51 +02:00
typedef convert_adaptor_buffer<charT, traitsT, toCharT, toTraitsT> baseBufT;
protected:
using baseBufT::bufadaptor_;
2003-09-01 13:28:37 +02:00
public:
explicit oconvert_adaptor(toStreamT &toStream) :
2004-09-20 21:45:51 +02:00
baseBufT(*(toStream.rdbuf())),
baseStreamT(&bufadaptor_)
2003-09-01 13:28:37 +02:00
{
} // oconvert_adaptor
2003-09-17 13:09:20 +02:00
virtual ~oconvert_adaptor()
{
2004-09-20 21:45:51 +02:00
baseStreamT::flush();
2003-09-17 13:09:20 +02:00
} // ~oconvert_adaptor
2003-09-01 13:28:37 +02:00
convert_bufadaptor<charT, traitsT>* rdbuf() const
{
return const_cast<convert_bufadaptor<charT, traitsT, toCharT, toTraitsT>*>(&bufadaptor_);
} // rdbuf
void set_stream(toStreamT& toStream) { bufadaptor_.set_buffer(*toStream.rdbuf()); }
2003-09-01 13:28:37 +02:00
}; // class oconvert_adaptor
2003-09-11 16:05:18 +02:00
} // namespace convert
} // namespace Arabica
2002-06-21 13:16:28 +02:00
#endif