Blame gnulib-tests/test-iconv.c

Packit 33f14e
/* Test of character set conversion.
Packit 33f14e
   Copyright (C) 2007-2017 Free Software Foundation, Inc.
Packit 33f14e
Packit 33f14e
   This program is free software: you can redistribute it and/or modify
Packit 33f14e
   it under the terms of the GNU General Public License as published by
Packit 33f14e
   the Free Software Foundation; either version 3 of the License, or
Packit 33f14e
   (at your option) any later version.
Packit 33f14e
Packit 33f14e
   This program is distributed in the hope that it will be useful,
Packit 33f14e
   but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit 33f14e
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
Packit 33f14e
   GNU General Public License for more details.
Packit 33f14e
Packit 33f14e
   You should have received a copy of the GNU General Public License
Packit 33f14e
   along with this program.  If not, see <http://www.gnu.org/licenses/>.  */
Packit 33f14e
Packit 33f14e
/* Written by Bruno Haible <bruno@clisp.org>, 2007.  */
Packit 33f14e
Packit 33f14e
#include <config.h>
Packit 33f14e
Packit 33f14e
#if HAVE_ICONV
Packit 33f14e
# include <iconv.h>
Packit 33f14e
Packit 33f14e
# ifndef ICONV_CONST
Packit 33f14e
#  define ICONV_CONST /* empty */
Packit 33f14e
# endif
Packit 33f14e
Packit 33f14e
#include "signature.h"
Packit 33f14e
SIGNATURE_CHECK (iconv, size_t, (iconv_t, ICONV_CONST char **, size_t *,
Packit 33f14e
                                 char **, size_t *));
Packit 33f14e
SIGNATURE_CHECK (iconv_close, int, (iconv_t x));
Packit 33f14e
SIGNATURE_CHECK (iconv_open, iconv_t, (char const *, char const *));
Packit 33f14e
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#include <errno.h>
Packit 33f14e
#include <string.h>
Packit 33f14e
Packit 33f14e
#include "macros.h"
Packit 33f14e
Packit 33f14e
int
Packit 33f14e
main ()
Packit 33f14e
{
Packit 33f14e
#if HAVE_ICONV
Packit 33f14e
  /* Assume that iconv() supports at least the encodings ASCII, ISO-8859-1,
Packit 33f14e
     and UTF-8.  */
Packit 33f14e
  iconv_t cd_88591_to_utf8 = iconv_open ("UTF-8", "ISO8859-1");
Packit 33f14e
  iconv_t cd_utf8_to_88591 = iconv_open ("ISO8859-1", "UTF-8");
Packit 33f14e
Packit 33f14e
#if defined __MVS__ && defined __IBMC__
Packit 33f14e
  /* String literals below are in ASCII, not EBCDIC.  */
Packit 33f14e
# pragma convert("ISO8859-1")
Packit 33f14e
# define CONVERT_ENABLED
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
  ASSERT (cd_88591_to_utf8 != (iconv_t)(-1));
Packit 33f14e
  ASSERT (cd_utf8_to_88591 != (iconv_t)(-1));
Packit 33f14e
Packit 33f14e
  /* Test conversion from ISO-8859-1 to UTF-8 with no errors.  */
Packit 33f14e
  {
Packit 33f14e
    static const char input[] = "\304rger mit b\366sen B\374bchen ohne Augenma\337";
Packit 33f14e
    static const char expected[] = "\303\204rger mit b\303\266sen B\303\274bchen ohne Augenma\303\237";
Packit 33f14e
    char buf[50];
Packit 33f14e
    const char *inptr = input;
Packit 33f14e
    size_t inbytesleft = strlen (input);
Packit 33f14e
    char *outptr = buf;
Packit 33f14e
    size_t outbytesleft = sizeof (buf);
Packit 33f14e
    size_t res = iconv (cd_88591_to_utf8,
Packit 33f14e
                        (ICONV_CONST char **) &inptr, &inbytesleft,
Packit 33f14e
                        &outptr, &outbytesleft);
Packit 33f14e
    ASSERT (res == 0 && inbytesleft == 0);
Packit 33f14e
    ASSERT (outptr == buf + strlen (expected));
Packit 33f14e
    ASSERT (memcmp (buf, expected, strlen (expected)) == 0);
Packit 33f14e
  }
Packit 33f14e
Packit 33f14e
  /* Test conversion from ISO-8859-1 to UTF-8 with E2BIG.  */
Packit 33f14e
  {
Packit 33f14e
    static const char input[] = "\304";
Packit 33f14e
    static char buf[2] = { (char)0xDE, (char)0xAD };
Packit 33f14e
    const char *inptr = input;
Packit 33f14e
    size_t inbytesleft = 1;
Packit 33f14e
    char *outptr = buf;
Packit 33f14e
    size_t outbytesleft = 1;
Packit 33f14e
    size_t res = iconv (cd_88591_to_utf8,
Packit 33f14e
                        (ICONV_CONST char **) &inptr, &inbytesleft,
Packit 33f14e
                        &outptr, &outbytesleft);
Packit 33f14e
    ASSERT (res == (size_t)(-1) && errno == E2BIG);
Packit 33f14e
    ASSERT (inbytesleft == 1);
Packit 33f14e
    ASSERT (outbytesleft == 1);
Packit 33f14e
    ASSERT ((unsigned char) buf[1] == 0xAD);
Packit 33f14e
    ASSERT ((unsigned char) buf[0] == 0xDE);
Packit 33f14e
  }
Packit 33f14e
Packit 33f14e
  /* Test conversion from UTF-8 to ISO-8859-1 with no errors.  */
Packit 33f14e
  {
Packit 33f14e
    static const char input[] = "\303\204rger mit b\303\266sen B\303\274bchen ohne Augenma\303\237";
Packit 33f14e
    static const char expected[] = "\304rger mit b\366sen B\374bchen ohne Augenma\337";
Packit 33f14e
    char buf[50];
Packit 33f14e
    const char *inptr = input;
Packit 33f14e
    size_t inbytesleft = strlen (input);
Packit 33f14e
    char *outptr = buf;
Packit 33f14e
    size_t outbytesleft = sizeof (buf);
Packit 33f14e
    size_t res = iconv (cd_utf8_to_88591,
Packit 33f14e
                        (ICONV_CONST char **) &inptr, &inbytesleft,
Packit 33f14e
                        &outptr, &outbytesleft);
Packit 33f14e
    ASSERT (res == 0 && inbytesleft == 0);
Packit 33f14e
    ASSERT (outptr == buf + strlen (expected));
Packit 33f14e
    ASSERT (memcmp (buf, expected, strlen (expected)) == 0);
Packit 33f14e
  }
Packit 33f14e
Packit 33f14e
  /* Test conversion from UTF-8 to ISO-8859-1 with EILSEQ.  */
Packit 33f14e
  {
Packit 33f14e
    static const char input[] = "\342\202\254"; /* EURO SIGN */
Packit 33f14e
    char buf[10];
Packit 33f14e
    const char *inptr = input;
Packit 33f14e
    size_t inbytesleft = strlen (input);
Packit 33f14e
    char *outptr = buf;
Packit 33f14e
    size_t outbytesleft = sizeof (buf);
Packit 33f14e
    size_t res = iconv (cd_utf8_to_88591,
Packit 33f14e
                        (ICONV_CONST char **) &inptr, &inbytesleft,
Packit 33f14e
                        &outptr, &outbytesleft);
Packit 33f14e
    if (res == (size_t)(-1))
Packit 33f14e
      {
Packit 33f14e
        ASSERT (errno == EILSEQ);
Packit 33f14e
        ASSERT (inbytesleft == strlen (input) && outptr == buf);
Packit 33f14e
      }
Packit 33f14e
    else
Packit 33f14e
      {
Packit 33f14e
        ASSERT (res == 1);
Packit 33f14e
        ASSERT (inbytesleft == 0);
Packit 33f14e
      }
Packit 33f14e
  }
Packit 33f14e
Packit 33f14e
  /* Test conversion from UTF-8 to ISO-8859-1 with EINVAL.  */
Packit 33f14e
  {
Packit 33f14e
    static const char input[] = "\342";
Packit 33f14e
    char buf[10];
Packit 33f14e
    const char *inptr = input;
Packit 33f14e
    size_t inbytesleft = 1;
Packit 33f14e
    char *outptr = buf;
Packit 33f14e
    size_t outbytesleft = sizeof (buf);
Packit 33f14e
    size_t res = iconv (cd_utf8_to_88591,
Packit 33f14e
                        (ICONV_CONST char **) &inptr, &inbytesleft,
Packit 33f14e
                        &outptr, &outbytesleft);
Packit 33f14e
    ASSERT (res == (size_t)(-1) && errno == EINVAL);
Packit 33f14e
    ASSERT (inbytesleft == 1 && outptr == buf);
Packit 33f14e
  }
Packit 33f14e
Packit 33f14e
  iconv_close (cd_88591_to_utf8);
Packit 33f14e
  iconv_close (cd_utf8_to_88591);
Packit 33f14e
Packit 33f14e
#ifdef CONVERT_ENABLED
Packit 33f14e
# pragma convert(pop)
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#endif /* HAVE_ICONV */
Packit 33f14e
Packit 33f14e
  return 0;
Packit 33f14e
}