Blame glib/tests/utf8-performance.c

Packit ae235b
/* GLIB - Library of useful routines for C programming
Packit ae235b
 *
Packit ae235b
 * Copyright (C) 2010 Mikhail Zabaluev <mikhail.zabaluev@gmail.com>
Packit ae235b
 *
Packit ae235b
 * This library is free software; you can redistribute it and/or
Packit ae235b
 * modify it under the terms of the GNU Lesser General Public
Packit ae235b
 * License as published by the Free Software Foundation; either
Packit ae235b
 * version 2.1 of the License, or (at your option) any later version.
Packit ae235b
 *
Packit ae235b
 * This library is distributed in the hope that it will be useful,
Packit ae235b
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit ae235b
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Packit ae235b
 * Lesser General Public License for more details.
Packit ae235b
 *
Packit ae235b
 * You should have received a copy of the GNU Lesser General Public
Packit ae235b
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
Packit ae235b
 */
Packit ae235b
Packit ae235b
#include <string.h>
Packit ae235b
Packit ae235b
#include <glib.h>
Packit ae235b
Packit ae235b
#define NUM_ITERATIONS 500000
Packit ae235b
Packit ae235b
static const char str_ascii[] =
Packit ae235b
    "The quick brown fox jumps over the lazy dog";
Packit ae235b
Packit ae235b
static const gchar str_latin1[] =
Packit ae235b
    "Zwölf Boxkämpfer jagen Viktor quer über den großen Sylter Deich";
Packit ae235b
Packit ae235b
/* Energizing GOELRO-talk in Russian, used by KDE */
Packit ae235b
static const char str_cyrillic[] =
Packit ae235b
    "Широкая электрификация южных губерний даст мощный толчок подъёму "
Packit ae235b
    "сельского хозяйства.";
Packit ae235b
Packit ae235b
/* First sentence from the Wikipedia article:
Packit ae235b
 * http://zh.wikipedia.org/w/index.php?title=%E6%B1%89%E5%AD%97&oldid=13053137 */
Packit ae235b
static const char str_han[] =
Packit ae235b
    "漢字,亦稱中文字、中国字,在台灣又被稱為國字,是漢字文化圈廣泛使用的一種文字,屬於表意文字的詞素音節文字";
Packit ae235b
Packit ae235b
typedef int (* GrindFunc) (const char *, gsize);
Packit ae235b
Packit ae235b
#define GRIND_LOOP_BEGIN                 \
Packit ae235b
  {                                      \
Packit ae235b
    int i;                               \
Packit ae235b
    for (i = 0; i < NUM_ITERATIONS; i++)
Packit ae235b
Packit ae235b
#define GRIND_LOOP_END \
Packit ae235b
  }
Packit ae235b
Packit ae235b
static int
Packit ae235b
grind_get_char (const char *str, gsize len)
Packit ae235b
{
Packit ae235b
  gunichar acc = 0;
Packit ae235b
  GRIND_LOOP_BEGIN
Packit ae235b
    {
Packit ae235b
      const char *p = str;
Packit ae235b
      while (*p)
Packit ae235b
        {
Packit ae235b
          acc += g_utf8_get_char (p);
Packit ae235b
          p = g_utf8_next_char (p);
Packit ae235b
        }
Packit ae235b
    }
Packit ae235b
  GRIND_LOOP_END;
Packit ae235b
  return acc;
Packit ae235b
}
Packit ae235b
Packit ae235b
static int
Packit ae235b
grind_get_char_validated (const char *str, gsize len)
Packit ae235b
{
Packit ae235b
  gunichar acc = 0;
Packit ae235b
  GRIND_LOOP_BEGIN
Packit ae235b
    {
Packit ae235b
      const char *p = str;
Packit ae235b
      while (*p)
Packit ae235b
        {
Packit ae235b
          acc += g_utf8_get_char_validated (p, -1);
Packit ae235b
          p = g_utf8_next_char (p);
Packit ae235b
        }
Packit ae235b
    }
Packit ae235b
  GRIND_LOOP_END;
Packit ae235b
  return acc;
Packit ae235b
}
Packit ae235b
Packit ae235b
static int
Packit ae235b
grind_utf8_to_ucs4 (const char *str, gsize len)
Packit ae235b
{
Packit ae235b
  GRIND_LOOP_BEGIN
Packit ae235b
    {
Packit ae235b
      gunichar *ustr;
Packit ae235b
      ustr = g_utf8_to_ucs4 (str, -1, NULL, NULL, NULL);
Packit ae235b
      g_free (ustr);
Packit ae235b
    }
Packit ae235b
  GRIND_LOOP_END;
Packit ae235b
  return 0;
Packit ae235b
}
Packit ae235b
Packit ae235b
static int
Packit ae235b
grind_get_char_backwards (const char *str, gsize len)
Packit ae235b
{
Packit ae235b
  gunichar acc = 0;
Packit ae235b
  GRIND_LOOP_BEGIN
Packit ae235b
    {
Packit ae235b
      const char *p = str + len;
Packit ae235b
      do
Packit ae235b
	{
Packit ae235b
	  p = g_utf8_prev_char (p);
Packit ae235b
	  acc += g_utf8_get_char (p);
Packit ae235b
        }
Packit ae235b
      while (p != str);
Packit ae235b
    }
Packit ae235b
  GRIND_LOOP_END;
Packit ae235b
  return acc;
Packit ae235b
}
Packit ae235b
Packit ae235b
static int
Packit ae235b
grind_utf8_to_ucs4_sized (const char *str, gsize len)
Packit ae235b
{
Packit ae235b
  GRIND_LOOP_BEGIN
Packit ae235b
    {
Packit ae235b
      gunichar *ustr;
Packit ae235b
      ustr = g_utf8_to_ucs4 (str, len, NULL, NULL, NULL);
Packit ae235b
      g_free (ustr);
Packit ae235b
    }
Packit ae235b
  GRIND_LOOP_END;
Packit ae235b
  return 0;
Packit ae235b
}
Packit ae235b
Packit ae235b
static int
Packit ae235b
grind_utf8_to_ucs4_fast (const char *str, gsize len)
Packit ae235b
{
Packit ae235b
  GRIND_LOOP_BEGIN
Packit ae235b
    {
Packit ae235b
      gunichar *ustr;
Packit ae235b
      ustr = g_utf8_to_ucs4_fast (str, -1, NULL);
Packit ae235b
      g_free (ustr);
Packit ae235b
    }
Packit ae235b
  GRIND_LOOP_END;
Packit ae235b
  return 0;
Packit ae235b
}
Packit ae235b
Packit ae235b
static int
Packit ae235b
grind_utf8_to_ucs4_fast_sized (const char *str, gsize len)
Packit ae235b
{
Packit ae235b
  GRIND_LOOP_BEGIN
Packit ae235b
    {
Packit ae235b
      gunichar *ustr;
Packit ae235b
      ustr = g_utf8_to_ucs4_fast (str, len, NULL);
Packit ae235b
      g_free (ustr);
Packit ae235b
    }
Packit ae235b
  GRIND_LOOP_END;
Packit ae235b
  return 0;
Packit ae235b
}
Packit ae235b
Packit ae235b
static int
Packit ae235b
grind_utf8_validate (const char *str, gsize len)
Packit ae235b
{
Packit ae235b
  GRIND_LOOP_BEGIN
Packit ae235b
    g_utf8_validate (str, -1, NULL);
Packit ae235b
  GRIND_LOOP_END;
Packit ae235b
  return 0;
Packit ae235b
}
Packit ae235b
Packit ae235b
static int
Packit ae235b
grind_utf8_validate_sized (const char *str, gsize len)
Packit ae235b
{
Packit ae235b
  GRIND_LOOP_BEGIN
Packit ae235b
    g_utf8_validate (str, len, NULL);
Packit ae235b
  GRIND_LOOP_END;
Packit ae235b
  return 0;
Packit ae235b
}
Packit ae235b
Packit ae235b
typedef struct _GrindData {
Packit ae235b
  GrindFunc func;
Packit ae235b
  const char *str;
Packit ae235b
} GrindData;
Packit ae235b
Packit ae235b
static void
Packit ae235b
perform (gconstpointer data)
Packit ae235b
{
Packit ae235b
  GrindData *gd = (GrindData *) data;
Packit ae235b
  GrindFunc grind_func = gd->func;
Packit ae235b
  const char *str = gd->str;
Packit ae235b
  gsize len;
Packit ae235b
  gulong bytes_ground;
Packit ae235b
  gdouble time_elapsed;
Packit ae235b
  gdouble result;
Packit ae235b
Packit ae235b
  len = strlen (str);
Packit ae235b
  bytes_ground = (gulong) len * NUM_ITERATIONS;
Packit ae235b
Packit ae235b
  g_test_timer_start ();
Packit ae235b
Packit ae235b
  grind_func (str, len);
Packit ae235b
Packit ae235b
  time_elapsed = g_test_timer_elapsed ();
Packit ae235b
Packit ae235b
  result = ((gdouble) bytes_ground / time_elapsed) * 1.0e-6;
Packit ae235b
Packit ae235b
  g_test_maximized_result (result, "%7.1f MB/s", result);
Packit ae235b
Packit ae235b
  g_slice_free (GrindData, gd);
Packit ae235b
}
Packit ae235b
Packit ae235b
static void
Packit ae235b
add_cases(const char *path, GrindFunc func)
Packit ae235b
{
Packit ae235b
#define ADD_CASE(script)                              \
Packit ae235b
  G_STMT_START {                                      \
Packit ae235b
    GrindData *gd;                                    \
Packit ae235b
    gchar *full_path;                                 \
Packit ae235b
    gd = g_slice_new0(GrindData);                     \
Packit ae235b
    gd->func = func;                                  \
Packit ae235b
    gd->str = str_##script;                           \
Packit ae235b
    full_path = g_strdup_printf("%s/" #script, path); \
Packit ae235b
    g_test_add_data_func (full_path, gd, perform);    \
Packit ae235b
    g_free (full_path);                               \
Packit ae235b
  } G_STMT_END
Packit ae235b
Packit ae235b
  ADD_CASE(ascii);
Packit ae235b
  ADD_CASE(latin1);
Packit ae235b
  ADD_CASE(cyrillic);
Packit ae235b
  ADD_CASE(han);
Packit ae235b
Packit ae235b
#undef ADD_CASE
Packit ae235b
}
Packit ae235b
Packit ae235b
int
Packit ae235b
main (int argc, char **argv)
Packit ae235b
{
Packit ae235b
  g_test_init (&argc, &argv, NULL);
Packit ae235b
Packit ae235b
  if (g_test_perf ())
Packit ae235b
    {
Packit ae235b
      add_cases ("/utf8/perf/get_char", grind_get_char);
Packit ae235b
      add_cases ("/utf8/perf/get_char-backwards", grind_get_char_backwards);
Packit ae235b
      add_cases ("/utf8/perf/get_char_validated", grind_get_char_validated);
Packit ae235b
      add_cases ("/utf8/perf/utf8_to_ucs4", grind_utf8_to_ucs4);
Packit ae235b
      add_cases ("/utf8/perf/utf8_to_ucs4-sized", grind_utf8_to_ucs4_sized);
Packit ae235b
      add_cases ("/utf8/perf/utf8_to_ucs4_fast", grind_utf8_to_ucs4_fast);
Packit ae235b
      add_cases ("/utf8/perf/utf8_to_ucs4_fast-sized", grind_utf8_to_ucs4_fast_sized);
Packit ae235b
      add_cases ("/utf8/perf/utf8_validate", grind_utf8_validate);
Packit ae235b
      add_cases ("/utf8/perf/utf8_validate-sized", grind_utf8_validate_sized);
Packit ae235b
    }
Packit ae235b
Packit ae235b
  return g_test_run ();
Packit ae235b
}