Blame glib/tests/utf8-misc.c

/* Unit tests for utilities
 * Copyright (C) 2010 Red Hat, Inc.
 *
 * This work is provided "as is"; redistribution and modification
 * in whole or in part, in any medium, physical or electronic is
 * permitted without restriction.
 *
 * This work is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 *
 * In no event shall the authors or contributors be liable for any
 * direct, indirect, incidental, special, exemplary, or consequential
 * damages (including, but not limited to, procurement of substitute
 * goods or services; loss of use, data, or profits; or business
 * interruption) however caused and on any theory of liability, whether
 * in contract, strict liability, or tort (including negligence or
 * otherwise) arising in any way out of the use of this software, even
 * if advised of the possibility of such damage.
 *
 * Author: Matthias Clasen
 */
Packit ae235b
Packit ae235b
#include "glib.h"
Packit ae235b
Packit ae235b
static void
Packit ae235b
test_utf8_strlen (void)
Packit ae235b
{
Packit ae235b
  const gchar *string = "\xe2\x82\xa0gh\xe2\x82\xa4jl";
Packit ae235b
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, -1), ==, 6);
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, 0), ==, 0);
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, 1), ==, 0);
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, 2), ==, 0);
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, 3), ==, 1);
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, 4), ==, 2);
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, 5), ==, 3);
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, 6), ==, 3);
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, 7), ==, 3);
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, 8), ==, 4);
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, 9), ==, 5);
Packit ae235b
  g_assert_cmpint (g_utf8_strlen (string, 10), ==, 6);
Packit ae235b
}
Packit ae235b
Packit ae235b
static void
Packit ae235b
test_utf8_strncpy (void)
Packit ae235b
{
Packit ae235b
  const gchar *string = "\xe2\x82\xa0gh\xe2\x82\xa4jl";
Packit ae235b
  gchar dest[20];
Packit ae235b
Packit ae235b
  g_utf8_strncpy (dest, string, 0);
Packit ae235b
  g_assert_cmpstr (dest, ==, "");
Packit ae235b
Packit ae235b
  g_utf8_strncpy (dest, string, 1);
Packit ae235b
  g_assert_cmpstr (dest, ==, "\xe2\x82\xa0");
Packit ae235b
Packit ae235b
  g_utf8_strncpy (dest, string, 2);
Packit ae235b
  g_assert_cmpstr (dest, ==, "\xe2\x82\xa0g");
Packit ae235b
Packit ae235b
  g_utf8_strncpy (dest, string, 3);
Packit ae235b
  g_assert_cmpstr (dest, ==, "\xe2\x82\xa0gh");
Packit ae235b
Packit ae235b
  g_utf8_strncpy (dest, string, 4);
Packit ae235b
  g_assert_cmpstr (dest, ==, "\xe2\x82\xa0gh\xe2\x82\xa4");
Packit ae235b
Packit ae235b
  g_utf8_strncpy (dest, string, 5);
Packit ae235b
  g_assert_cmpstr (dest, ==, "\xe2\x82\xa0gh\xe2\x82\xa4j");
Packit ae235b
Packit ae235b
  g_utf8_strncpy (dest, string, 6);
Packit ae235b
  g_assert_cmpstr (dest, ==, "\xe2\x82\xa0gh\xe2\x82\xa4jl");
Packit ae235b
Packit ae235b
  g_utf8_strncpy (dest, string, 20);
Packit ae235b
  g_assert_cmpstr (dest, ==, "\xe2\x82\xa0gh\xe2\x82\xa4jl");
Packit ae235b
}
Packit ae235b
Packit ae235b
static void
Packit ae235b
test_utf8_strrchr (void)
Packit ae235b
{
Packit ae235b
  const gchar *string = "\xe2\x82\xa0gh\xe2\x82\xa4jl\xe2\x82\xa4jl";
Packit ae235b
Packit ae235b
  g_assert (g_utf8_strrchr (string, -1, 'j') == string + 13);
Packit ae235b
  g_assert (g_utf8_strrchr (string, -1, 8356) == string + 10);
Packit ae235b
  g_assert (g_utf8_strrchr (string, 9, 8356) == string + 5);
Packit ae235b
  g_assert (g_utf8_strrchr (string, 3, 'j') == NULL);
Packit ae235b
  g_assert (g_utf8_strrchr (string, -1, 'x') == NULL);
Packit ae235b
}
Packit ae235b
Packit ae235b
static void
Packit ae235b
test_utf8_reverse (void)
Packit ae235b
{
Packit ae235b
  gchar *r;
Packit ae235b
Packit ae235b
  r = g_utf8_strreverse ("abcdef", -1);
Packit ae235b
  g_assert_cmpstr (r, ==, "fedcba");
Packit ae235b
  g_free (r);
Packit ae235b
Packit ae235b
  r = g_utf8_strreverse ("abcdef", 4);
Packit ae235b
  g_assert_cmpstr (r, ==, "dcba");
Packit ae235b
  g_free (r);
Packit ae235b
Packit ae235b
  /* U+0B0B Oriya Letter Vocalic R
Packit ae235b
   * U+10900 Phoenician Letter Alf
Packit ae235b
   * U+0041 Latin Capital Letter A
Packit ae235b
   * U+1EB6 Latin Capital Letter A With Breve And Dot Below
Packit ae235b
   */
Packit ae235b
  r = g_utf8_strreverse ("\340\254\213\360\220\244\200\101\341\272\266", -1);
Packit ae235b
  g_assert_cmpstr (r, ==, "\341\272\266\101\360\220\244\200\340\254\213");
Packit ae235b
  g_free (r);
Packit ae235b
}
Packit ae235b
Packit ae235b
static void
Packit ae235b
test_utf8_substring (void)
Packit ae235b
{
Packit ae235b
  gchar *r;
Packit ae235b
Packit ae235b
  r = g_utf8_substring ("abcd", 1, 3);
Packit ae235b
  g_assert_cmpstr (r, ==, "bc");
Packit ae235b
  g_free (r);
Packit ae235b
Packit ae235b
  r = g_utf8_substring ("abcd", 0, 4);
Packit ae235b
  g_assert_cmpstr (r, ==, "abcd");
Packit ae235b
  g_free (r);
Packit ae235b
Packit ae235b
  r = g_utf8_substring ("abcd", 2, 2);
Packit ae235b
  g_assert_cmpstr (r, ==, "");
Packit ae235b
  g_free (r);
Packit ae235b
Packit ae235b
  r = g_utf8_substring ("abc\xe2\x82\xa0gh\xe2\x82\xa4", 2, 5);
Packit ae235b
  g_assert_cmpstr (r, ==, "c\xe2\x82\xa0g");
Packit ae235b
  g_free (r);
Packit ae235b
}
Packit ae235b
Packit ae235b
static void
Packit ae235b
test_utf8_make_valid (void)
Packit ae235b
{
Packit ae235b
  gchar *r;
Packit ae235b
Packit ae235b
  /* valid UTF8 */
Packit ae235b
  r = g_utf8_make_valid ("\xe2\x82\xa0gh\xe2\x82\xa4jl", -1);
Packit ae235b
  g_assert_cmpstr (r, ==, "\xe2\x82\xa0gh\xe2\x82\xa4jl");
Packit ae235b
  g_free (r);
Packit ae235b
Packit ae235b
  /* invalid UTF8 */
Packit ae235b
  r = g_utf8_make_valid ("\xe2\x82\xa0gh\xe2\xffjl", -1);
Packit ae235b
  g_assert_cmpstr (r, ==, "\xe2\x82\xa0gh\xef\xbf\xbd\xef\xbf\xbdjl");
Packit ae235b
  g_free (r);
Packit ae235b
Packit ae235b
  /* invalid UTF8 without nul terminator followed by something unfortunate */
Packit ae235b
  r = g_utf8_make_valid ("Bj\xc3\xb8", 3);
Packit ae235b
  g_assert_cmpstr (r, ==, "Bj\xef\xbf\xbd");
Packit ae235b
  g_free (r);
Packit ae235b
Packit ae235b
  /* invalid UTF8 with embedded nul */
Packit ae235b
  r = g_utf8_make_valid ("\xe2\x82\xa0gh\xe2\x00jl", 9);
Packit ae235b
  g_assert_cmpstr (r, ==, "\xe2\x82\xa0gh\xef\xbf\xbd\xef\xbf\xbdjl");
Packit ae235b
  g_free (r);
Packit ae235b
}
Packit ae235b
Packit ae235b
int
Packit ae235b
main (int   argc,
Packit ae235b
      char *argv[])
Packit ae235b
{
Packit ae235b
  g_test_init (&argc, &argv, NULL);
Packit ae235b
Packit ae235b
  g_test_add_func ("/utf8/strlen", test_utf8_strlen);
Packit ae235b
  g_test_add_func ("/utf8/strncpy", test_utf8_strncpy);
Packit ae235b
  g_test_add_func ("/utf8/strrchr", test_utf8_strrchr);
Packit ae235b
  g_test_add_func ("/utf8/reverse", test_utf8_reverse);
Packit ae235b
  g_test_add_func ("/utf8/substring", test_utf8_substring);
Packit ae235b
  g_test_add_func ("/utf8/make-valid", test_utf8_make_valid);
Packit ae235b
Packit ae235b
  return g_test_run();
Packit ae235b
}