177 lines
3.2 KiB
C++
177 lines
3.2 KiB
C++
|
// Copyright (c) 1994 James Clark
|
||
|
// See the file COPYING for copying permission.
|
||
|
|
||
|
#include "splib.h"
|
||
|
|
||
|
#ifdef SP_MULTI_BYTE
|
||
|
|
||
|
#include "SJISCodingSystem.h"
|
||
|
|
||
|
#ifdef SP_NAMESPACE
|
||
|
namespace SP_NAMESPACE {
|
||
|
#endif
|
||
|
|
||
|
class SJISDecoder : public Decoder {
|
||
|
public:
|
||
|
SJISDecoder();
|
||
|
size_t decode(Char *, const char *, size_t, const char **);
|
||
|
private:
|
||
|
};
|
||
|
|
||
|
class SJISEncoder : public RecoveringEncoder {
|
||
|
public:
|
||
|
SJISEncoder();
|
||
|
void output(const Char *, size_t, OutputByteStream *);
|
||
|
};
|
||
|
|
||
|
Decoder *SJISCodingSystem::makeDecoder() const
|
||
|
{
|
||
|
return new SJISDecoder;
|
||
|
}
|
||
|
|
||
|
Encoder *SJISCodingSystem::makeEncoder() const
|
||
|
{
|
||
|
return new SJISEncoder;
|
||
|
}
|
||
|
|
||
|
|
||
|
SJISDecoder::SJISDecoder()
|
||
|
{
|
||
|
}
|
||
|
|
||
|
size_t SJISDecoder::decode(Char *to, const char *s,
|
||
|
size_t slen, const char **rest)
|
||
|
{
|
||
|
Char *start = to;
|
||
|
while (slen > 0) {
|
||
|
unsigned char c = *(unsigned char *)s;
|
||
|
if (!(c & 0x80)) {
|
||
|
*to++ = c;
|
||
|
s++;
|
||
|
slen--;
|
||
|
}
|
||
|
else if (129 <= c && c <= 159) {
|
||
|
if (slen < 2)
|
||
|
break;
|
||
|
s++;
|
||
|
slen -= 2;
|
||
|
unsigned char c2 = *(unsigned char *)s++;
|
||
|
unsigned short n = ((c - 112) << 9) | c2;
|
||
|
if (64 <= c2 && c2 <= 127)
|
||
|
n -= 31 + (1 << 8);
|
||
|
else if (c2 <= 158)
|
||
|
n -= 32 + (1 << 8);
|
||
|
else if (c2 <= 252)
|
||
|
n -= 126;
|
||
|
else
|
||
|
continue;
|
||
|
n |= 0x8080;
|
||
|
*to++ = n;
|
||
|
}
|
||
|
else if (224 <= c && c <= 239) {
|
||
|
if (slen < 2)
|
||
|
break;
|
||
|
s++;
|
||
|
slen -= 2;
|
||
|
unsigned char c2 = *(unsigned char *)s++;
|
||
|
unsigned short n = ((c - 176) << 9) | c2;
|
||
|
if (64 <= c2 && c2 <= 127)
|
||
|
n -= 31 + (1 << 8);
|
||
|
else if (c2 <= 158)
|
||
|
n -= 32 + (1 << 8);
|
||
|
else if (c2 <= 252)
|
||
|
n -= 126;
|
||
|
else
|
||
|
continue;
|
||
|
n |= 0x8080;
|
||
|
*to++ = n;
|
||
|
}
|
||
|
else if (161 <= c && c <= 223) {
|
||
|
slen--;
|
||
|
s++;
|
||
|
*to++ = c;
|
||
|
}
|
||
|
else {
|
||
|
// 128, 160, 240-255
|
||
|
slen--;
|
||
|
s++;
|
||
|
}
|
||
|
}
|
||
|
*rest = s;
|
||
|
return to - start;
|
||
|
}
|
||
|
|
||
|
SJISEncoder::SJISEncoder()
|
||
|
{
|
||
|
}
|
||
|
|
||
|
void SJISEncoder::output(const Char *s, size_t n, OutputByteStream *sb)
|
||
|
{
|
||
|
for (; n > 0; s++, n--) {
|
||
|
Char c = *s;
|
||
|
unsigned short mask = (unsigned short)(c & 0x8080);
|
||
|
if (mask == 0)
|
||
|
sb->sputc((unsigned char)(c & 0xff));
|
||
|
else if (mask == 0x8080) {
|
||
|
unsigned char c1 = (c >> 8) & 0x7f;
|
||
|
unsigned char c2 = c & 0x7f;
|
||
|
unsigned char out1;
|
||
|
if (c1 < 33)
|
||
|
out1 = 0;
|
||
|
else if (c1 < 95)
|
||
|
out1 = ((c1 + 1) >> 1) + 112;
|
||
|
else if (c1 < 127)
|
||
|
out1 = ((c1 + 1) >> 1) + 176;
|
||
|
else
|
||
|
out1 = 0;
|
||
|
if (out1) {
|
||
|
unsigned char out2;
|
||
|
if (c1 & 1) {
|
||
|
if (c2 < 33)
|
||
|
out2 = 0;
|
||
|
else if (c2 <= 95)
|
||
|
out2 = c2 + 31;
|
||
|
else if (c2 <= 126)
|
||
|
out2 = c2 + 32;
|
||
|
else
|
||
|
out2 = 0;
|
||
|
}
|
||
|
else {
|
||
|
if (33 <= c2 && c2 <= 126)
|
||
|
out2 = c2 + 126;
|
||
|
else
|
||
|
out2 = 0;
|
||
|
}
|
||
|
if (out2) {
|
||
|
sb->sputc(out1);
|
||
|
sb->sputc(out2);
|
||
|
}
|
||
|
else
|
||
|
handleUnencodable(c, sb);
|
||
|
}
|
||
|
else
|
||
|
handleUnencodable(c, sb);
|
||
|
}
|
||
|
else if (mask == 0x0080) {
|
||
|
if (161 <= c && c <= 223)
|
||
|
sb->sputc((unsigned char)(c & 0xff));
|
||
|
else
|
||
|
handleUnencodable(c, sb);
|
||
|
}
|
||
|
else
|
||
|
handleUnencodable(c, sb);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
#ifdef SP_NAMESPACE
|
||
|
}
|
||
|
#endif
|
||
|
|
||
|
#else /* not SP_MULTI_BYTE */
|
||
|
|
||
|
#ifndef __GNUG__
|
||
|
static char non_empty_translation_unit; // sigh
|
||
|
#endif
|
||
|
|
||
|
#endif /* not SP_MULTI_BYTE */
|