#include "codec.h"
#include "iso2022jp.h"
#include "iso646fi.h"
+#include "iso88591.h"
+#include "iso885915.h"
#include "jisx0201.h"
#include "jisx0208.h"
-#include "latin1.h"
#include "utf8.h"
+#include "windows1252.h"
using namespace std;
namespace Msp {
+namespace Codecs {
-/**
-Determines whether the given string can be successfully decoded with this
-codec. Note that this function returning true does not guarantee that the
-string was actually encoded with this codec. In particular, many 8-bit
-encodings are indistinguishable.
-*/
-bool StringCodec::detect(const string &str) const
+bool Codec::detect(const string &str) const
{
Decoder *dec=create_decoder();
bool result=true;
{
for(string::const_iterator i=str.begin(); i!=str.end(); )
dec->decode_char(str, i);
- dec->sync();
}
catch(const CodecError &)
{
return result;
}
-void StringCodec::Encoder::error(const string &msg)
+void Codec::Encoder::encode(const ustring &str, string &buf)
+{
+ for(ustring::const_iterator i=str.begin(); i!=str.end(); ++i)
+ encode_char(*i, buf);
+}
+
+void Codec::Encoder::error(UnicodeChar ch, string &buf, const string &msg)
{
- switch(err_mode_)
+ switch(err_mode)
{
- case IGNORE_ERRORS: break;
- case REPLACE_ERRORS: append_replacement(); break;
- default: throw CodecError(msg);
+ case TRANSLITERATE:
+ transliterate(ch, buf);
+ case IGNORE_ERRORS:
+ break;
+ default:
+ throw CodecError(msg);
}
}
-void StringCodec::Decoder::error(const string &msg)
+
+void Codec::Decoder::decode(const string &str, ustring &buf)
{
- switch(err_mode_)
+ for(string::const_iterator i=str.begin(); i!=str.end();)
{
- case IGNORE_ERRORS: break;
- case REPLACE_ERRORS: append(0xFFFD); break;
- default: throw CodecError(msg);
+ UnicodeChar c=decode_char(str, i);
+ if(c!=-1)
+ buf+=c;
}
}
-/**
-Creates a codec for the given encoding. The caller is responsible for deleting
-the codec when it's no longer needed.
-*/
-StringCodec *create_codec(const string &n)
+UnicodeChar Codec::Decoder::error(const string &msg)
+{
+ switch(err_mode)
+ {
+ case TRANSLITERATE:
+ return 0xFFFE;
+ case IGNORE_ERRORS:
+ return -1;
+ default:
+ throw CodecError(msg);
+ }
+}
+
+Codec *create_codec(const string &n)
{
string name;
for(string::const_iterator i=n.begin(); i!=n.end(); ++i)
if(name=="ascii") return new Ascii;
if(name=="iso2022jp") return new Iso2022Jp;
if(name=="iso646fi") return new Iso646Fi;
+ if(name=="iso88591" || name=="latin1") return new Iso88591;
+ if(name=="iso885915" || name=="latin9") return new Iso885915;
if(name=="jisx0201") return new JisX0201;
if(name=="jisx0208") return new JisX0208;
- if(name=="latin1") return new Latin1;
if(name=="utf8") return new Utf8;
+ if(name=="windows1252") return new Windows1252;
throw InvalidParameterValue("Unknown string codec");
}
+} // namespace Codecs
} // namespace Msp