Blob Blame History Raw
// Copyright (c) 1994 James Clark
// See the file COPYING for copying permission.

#include "splib.h"

#ifdef SP_MULTI_BYTE

#include "SJISCodingSystem.h"

#ifdef SP_NAMESPACE
namespace SP_NAMESPACE {
#endif

class SJISDecoder : public Decoder {
public:
  SJISDecoder();
  size_t decode(Char *, const char *, size_t, const char **);
private:
};

class SJISEncoder : public RecoveringEncoder {
public:
  SJISEncoder();
  void output(const Char *, size_t, OutputByteStream *);
};

Decoder *SJISCodingSystem::makeDecoder() const
{
  return new SJISDecoder;
}

Encoder *SJISCodingSystem::makeEncoder() const
{
  return new SJISEncoder;
}


SJISDecoder::SJISDecoder()
{
}

size_t SJISDecoder::decode(Char *to, const char *s,
			   size_t slen, const char **rest)
{
  Char *start = to;
  while (slen > 0) {
    unsigned char c = *(unsigned char *)s;
    if (!(c & 0x80)) {
      *to++ = c;
      s++;
      slen--;
    }
    else if (129 <= c && c <= 159) {
      if (slen < 2)
	break;
      s++;
      slen -= 2;
      unsigned char c2 = *(unsigned char *)s++;
      unsigned short n = ((c - 112) << 9) | c2;
      if (64 <= c2 && c2 <= 127)
	n -= 31 + (1 << 8);
      else if (c2 <= 158)
	n -= 32 + (1 << 8);
      else if (c2 <= 252)
	n -= 126;
      else
	continue;
      n |= 0x8080;
      *to++ = n;
    }
    else if (224 <= c && c <= 239) {
      if (slen < 2)
	break;
      s++;
      slen -= 2;
      unsigned char c2 = *(unsigned char *)s++;
      unsigned short n = ((c - 176) << 9) | c2;
      if (64 <= c2 && c2 <= 127)
	n -= 31 + (1 << 8);
      else if (c2 <= 158)
	n -= 32 + (1 << 8);
      else if (c2 <= 252)
	n -= 126;
      else
	continue;
      n |= 0x8080;
      *to++ = n;
    }
    else if (161 <= c && c <= 223) {
      slen--;
      s++;
      *to++ = c;
    }
    else {
      // 128, 160, 240-255
      slen--;
      s++;
    }
  }
  *rest = s;
  return to - start;
}

SJISEncoder::SJISEncoder()
{
}

void SJISEncoder::output(const Char *s, size_t n, OutputByteStream *sb)
{
  for (; n > 0; s++, n--) {
    Char c = *s;
    unsigned short mask = (unsigned short)(c & 0x8080);
    if (mask == 0)
      sb->sputc((unsigned char)(c & 0xff));
    else if (mask == 0x8080) {
      unsigned char c1 = (c >> 8) & 0x7f;
      unsigned char c2 = c & 0x7f;
      unsigned char out1;
      if (c1 < 33)
	out1 = 0;
      else if (c1 < 95)
	out1 = ((c1 + 1) >> 1) + 112;
      else if (c1 < 127)
	out1 = ((c1 + 1) >> 1) + 176;
      else
	out1 = 0;
      if (out1) {
	unsigned char out2;
	if (c1 & 1) {
	  if (c2 < 33)
	    out2 = 0;
	  else if (c2 <= 95)
	    out2 = c2 + 31;
	  else if (c2 <= 126)
	    out2 = c2 + 32;
	  else
	    out2 = 0;
	}
	else {
	  if (33 <= c2 && c2 <= 126)
	    out2 = c2 + 126;
	  else
	    out2 = 0;
	}
	if (out2) {
	  sb->sputc(out1);
	  sb->sputc(out2);
	}
	else
	  handleUnencodable(c, sb);
      }
      else
	handleUnencodable(c, sb);
    }
    else if (mask == 0x0080) {
      if (161 <= c && c <= 223)
	sb->sputc((unsigned char)(c & 0xff));
      else
	handleUnencodable(c, sb);
    }
    else
      handleUnencodable(c, sb);
  }
}

#ifdef SP_NAMESPACE
}
#endif

#else /* not SP_MULTI_BYTE */

#ifndef __GNUG__
static char non_empty_translation_unit;	// sigh
#endif

#endif /* not SP_MULTI_BYTE */