SJISCodingSystem.cxx revision 7c478bd95313f5f23a4c958a745db2134aa03244
// Copyright (c) 1994 James Clark
// See the file COPYING for copying permission.
#pragma ident "%Z%%M% %I% %E% SMI"
#include "splib.h"
#ifdef SP_MULTI_BYTE
#include "SJISCodingSystem.h"
#ifdef SP_NAMESPACE
namespace SP_NAMESPACE {
#endif
// Decoder that turns a Shift JIS byte stream into Chars.
class SJISDecoder : public Decoder {
public:
  SJISDecoder();
  // Decodes up to slen bytes starting at s into to; *rest receives the
  // address of the first byte that was not consumed.  Returns the number
  // of Chars written.
  size_t decode(Char *to, const char *s, size_t slen, const char **rest);
};
class SJISEncoder : public RecoveringEncoder {
public:
SJISEncoder();
void output(const Char *, size_t, OutputByteStream *);
void output(Char *tmp_char, size_t tmp_size_t, OutputByteStream *tmp_obs) {
output((const Char *)tmp_char, (size_t) tmp_size_t, (OutputByteStream *)tmp_obs);
}
};
// Creates a new SJISDecoder with operator new and returns it through the
// Decoder base-class pointer.
Decoder *SJISCodingSystem::makeDecoder() const
{
  Decoder *decoder = new SJISDecoder;
  return decoder;
}
// Creates a new SJISEncoder with operator new and returns it through the
// Encoder base-class pointer.
Encoder *SJISCodingSystem::makeEncoder() const
{
  Encoder *encoder = new SJISEncoder;
  return encoder;
}
// The decoder declares no data members, so there is nothing to set up.
SJISDecoder::SJISDecoder() { }
size_t SJISDecoder::decode(Char *to, const char *s,
size_t slen, const char **rest)
{
Char *start = to;
while (slen > 0) {
unsigned char c = *(unsigned char *)s;
if (!(c & 0x80)) {
*to++ = c;
s++;
slen--;
}
else if (129 <= c && c <= 159) {
if (slen < 2)
break;
s++;
slen -= 2;
unsigned char c2 = *(unsigned char *)s++;
unsigned short n = ((c - 112) << 9) | c2;
if (64 <= c2 && c2 <= 127)
n -= 31 + (1 << 8);
else if (c2 <= 158)
n -= 32 + (1 << 8);
else if (c2 <= 252)
n -= 126;
else
continue;
n |= 0x8080;
*to++ = n;
}
else if (224 <= c && c <= 239) {
if (slen < 2)
break;
s++;
slen -= 2;
unsigned char c2 = *(unsigned char *)s++;
unsigned short n = ((c - 176) << 9) | c2;
if (64 <= c2 && c2 <= 127)
n -= 31 + (1 << 8);
else if (c2 <= 158)
n -= 32 + (1 << 8);
else if (c2 <= 252)
n -= 126;
else
continue;
n |= 0x8080;
*to++ = n;
}
else if (161 <= c && c <= 223) {
slen--;
s++;
*to++ = c;
}
else {
// 128, 160, 240-255
slen--;
s++;
}
}
*rest = s;
return to - start;
}
// The encoder declares no data members, so there is nothing to set up.
SJISEncoder::SJISEncoder() { }
void SJISEncoder::output(const Char *s, size_t n, OutputByteStream *sb)
{
for (; n > 0; s++, n--) {
Char c = *s;
unsigned short mask = (unsigned short)(c & 0x8080);
if (mask == 0)
sb->sputc((unsigned char)(c & 0xff));
else if (mask == 0x8080) {
unsigned char c1 = (c >> 8) & 0x7f;
unsigned char c2 = c & 0x7f;
unsigned char out1;
if (c1 < 33)
out1 = 0;
else if (c1 < 95)
out1 = ((c1 + 1) >> 1) + 112;
else if (c1 < 127)
out1 = ((c1 + 1) >> 1) + 176;
else
out1 = 0;
if (out1) {
unsigned char out2;
if (c1 & 1) {
if (c2 < 33)
out2 = 0;
else if (c2 <= 95)
out2 = c2 + 31;
else if (c2 <= 126)
out2 = c2 + 32;
else
out2 = 0;
}
else {
if (33 <= c2 && c2 <= 126)
out2 = c2 + 126;
else
out2 = 0;
}
if (out2) {
sb->sputc(out1);
sb->sputc(out2);
}
else
handleUnencodable(c, sb);
}
else
handleUnencodable(c, sb);
}
else if (mask == 0x0080) {
if (161 <= c && c <= 223)
sb->sputc((unsigned char)(c & 0xff));
else
handleUnencodable(c, sb);
}
else
handleUnencodable(c, sb);
}
}
#ifdef SP_NAMESPACE
}
#endif
#else /* not SP_MULTI_BYTE */
#ifndef __GNUG__
// Placeholder definition so that this translation unit is not empty when
// SP_MULTI_BYTE is not defined.  It is omitted when __GNUG__ is defined.
static char non_empty_translation_unit; // sigh
#endif
#endif /* not SP_MULTI_BYTE */