Blame iconvdata/euc-kr.c

/* Mapping tables for EUC-KR handling.
   Copyright (C) 1998-2018 Free Software Foundation, Inc.
   This file is part of the GNU C Library.
   Contributed by Jungshik Shin <jshin@pantheon.yale.edu>
   and Ulrich Drepper <drepper@cygnus.com>, 1998.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   <http://www.gnu.org/licenses/>.  */
Packit 6c4009
Packit 6c4009
#include <dlfcn.h>
Packit 6c4009
#include <stdint.h>
Packit 6c4009
#include <ksc5601.h>
Packit 6c4009
Packit 6c4009
Packit 6c4009
static inline void
Packit 6c4009
__attribute ((always_inline))
Packit 6c4009
euckr_from_ucs4 (uint32_t ch, unsigned char *cp)
Packit 6c4009
{
Packit 6c4009
  if (ch > 0x9f)
Packit 6c4009
    {
Packit 6c4009
      if (__builtin_expect (ch, 0) == 0x20a9)
Packit 6c4009
	{
Packit 6c4009
	  /* Half-width Korean Currency WON sign.  There is no
Packit 6c4009
             equivalent in EUC-KR.  Some mappings use \x5c because
Packit 6c4009
             this is what some old Korean ASCII variants used but this
Packit 6c4009
             is causing problems.  We map it to the FULL WIDTH WON SIGN.  */
Packit 6c4009
	  cp[0] = '\xa3';
Packit 6c4009
	  cp[1] = '\xdc';
Packit 6c4009
	}
Packit 6c4009
      else if (__builtin_expect (ucs4_to_ksc5601 (ch, cp, 2), 0)
Packit 6c4009
	  != __UNKNOWN_10646_CHAR)
Packit 6c4009
	{
Packit 6c4009
	  cp[0] |= 0x80;
Packit 6c4009
	  cp[1] |= 0x80;
Packit 6c4009
	}
Packit 6c4009
      else
Packit 6c4009
	cp[0] = cp[1] = '\0';
Packit 6c4009
    }
Packit 6c4009
  else
Packit 6c4009
    {
Packit 6c4009
      /* There is no mapping for U005c but we nevertheless map it to
Packit 6c4009
	 \x5c.  */
Packit 6c4009
      cp[0] = (unsigned char) ch;
Packit 6c4009
      cp[1] = '\0';
Packit 6c4009
    }
Packit 6c4009
}
Packit 6c4009
Packit 6c4009
Packit 6c4009
/* Definitions used in the body of the `gconv' function.  These are
   consumed by <iconv/skeleton.c>, which is included at the end of this
   file.  */
#define CHARSET_NAME		"EUC-KR//"
#define FROM_LOOP		from_euc_kr
#define TO_LOOP			to_euc_kr
/* NOTE(review): presumably these request the default init/fini
   functions from the skeleton -- confirm against iconv/skeleton.c.  */
#define DEFINE_INIT		1
#define DEFINE_FINI		1
/* An EUC-KR character occupies one or two bytes; the other side of the
   conversion is UCS4 with four bytes per character.  */
#define MIN_NEEDED_FROM		1
#define MAX_NEEDED_FROM		2
#define MIN_NEEDED_TO		4
/* Both conversion directions are defined below.  */
#define ONE_DIRECTION		0
Packit 6c4009
Packit 6c4009
Packit 6c4009
/* First define the conversion function from EUC-KR to UCS4.

   BODY converts one character per invocation:
     - a byte <= 0x9f is passed through unchanged as a UCS4 value;
     - the byte 0xa0 is rejected as illegal input;
     - anything else is handed to ksc5601_to_ucs4 with offset 0x80.  A
       result of 0 means the second byte is not yet available, a result
       of __UNKNOWN_10646_CHAR means the sequence is invalid.
   NOTE(review): in the two-byte case BODY never advances inptr itself;
   ksc5601_to_ucs4 receives &inptr and presumably advances it on
   success -- confirm against ksc5601.h.  */
#define MIN_NEEDED_INPUT	MIN_NEEDED_FROM
#define MAX_NEEDED_INPUT	MAX_NEEDED_FROM
#define MIN_NEEDED_OUTPUT	MIN_NEEDED_TO
#define LOOPFCT			FROM_LOOP
#define BODY \
  {									      \
    uint32_t ch = *inptr;						      \
									      \
    if (ch <= 0x9f)							      \
      ++inptr;								      \
    else if (__glibc_unlikely (ch == 0xa0))				      \
      {									      \
	/* This is illegal.  */						      \
	STANDARD_FROM_LOOP_ERR_HANDLER (1);				      \
      }									      \
    else								      \
      {									      \
	/* Two-byte character.  First test whether the next byte	      \
	   is also available.  */					      \
	ch = ksc5601_to_ucs4 (&inptr, inend - inptr, 0x80);		      \
	if (__glibc_unlikely (ch == 0))					      \
	  {								      \
	    /* The second byte is not available.  */			      \
	    result = __GCONV_INCOMPLETE_INPUT;				      \
	    break;							      \
	  }								      \
	if (__glibc_unlikely (ch == __UNKNOWN_10646_CHAR))		      \
	  /* This is an illegal character.  */				      \
	  STANDARD_FROM_LOOP_ERR_HANDLER (2);				      \
      }									      \
									      \
    put32 (outptr, ch);							      \
    outptr += 4;							      \
  }
#define LOOP_NEED_FLAGS
/* Single-byte shortcut: only bytes <= 0x9f stand for a character on
   their own; everything else yields WEOF.  */
#define ONEBYTE_BODY \
  {									      \
    if (c <= 0x9f)							      \
      return c;								      \
    else								      \
      return WEOF;							      \
  }
#include <iconv/loop.c>
Packit 6c4009
Packit 6c4009
Packit 6c4009
/* Next, define the other direction.

   BODY reads one UCS4 character, converts it with euckr_from_ucs4 and
   writes one or two output bytes.  A zero first byte for a non-zero
   input character means there is no EUC-KR representation.  inptr is
   advanced only after all output bytes have been stored, so running
   out of output space leaves the current character unconsumed.  */
#define MIN_NEEDED_INPUT	MIN_NEEDED_TO
#define MIN_NEEDED_OUTPUT	MIN_NEEDED_FROM
#define MAX_NEEDED_OUTPUT	MAX_NEEDED_FROM
#define LOOPFCT			TO_LOOP
#define BODY \
  {									      \
    uint32_t ch = get32 (inptr);					      \
    unsigned char cp[2];						      \
									      \
    /* Decomposing Hangul syllables not available in KS C 5601 into	      \
       Jamos should be considered either here or in euckr_from_ucs4() */      \
    euckr_from_ucs4 (ch, cp);						      \
									      \
    if (__glibc_unlikely (cp[0] == '\0') && ch != 0)			      \
      {									      \
	UNICODE_TAG_HANDLER (ch, 4);					      \
									      \
	/* Illegal character.  */					      \
	STANDARD_TO_LOOP_ERR_HANDLER (4);				      \
      }									      \
									      \
    *outptr++ = cp[0];							      \
    /* Now test for a possible second byte and write this if possible.  */    \
    if (cp[1] != '\0')							      \
      {									      \
	if (__glibc_unlikely (outptr >= outend))			      \
	  {								      \
	    /* The result does not fit into the buffer.  Take back the	      \
	       first byte so no partial character is emitted.  */	      \
	    --outptr;							      \
	    result = __GCONV_FULL_OUTPUT;				      \
	    break;							      \
	  }								      \
	*outptr++ = cp[1];						      \
      }									      \
									      \
    inptr += 4;								      \
  }
#define LOOP_NEED_FLAGS
#include <iconv/loop.c>
Packit 6c4009
Packit 6c4009
Packit 6c4009
/* Now define the toplevel functions.  The skeleton uses the
   definitions made above (CHARSET_NAME, FROM_LOOP, TO_LOOP, ...).  */
#include <iconv/skeleton.c>