Blame lib/unistr.in.h

Packit 33f14e
/* Elementary Unicode string functions.
Packit 33f14e
   Copyright (C) 2001-2002, 2005-2017 Free Software Foundation, Inc.
Packit 33f14e
Packit 33f14e
   This program is free software: you can redistribute it and/or modify it
Packit 33f14e
   under the terms of the GNU General Public License as published
Packit 33f14e
   by the Free Software Foundation; either version 3 of the License, or
Packit 33f14e
   (at your option) any later version.
Packit 33f14e
Packit 33f14e
   This program is distributed in the hope that it will be useful,
Packit 33f14e
   but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit 33f14e
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Packit 33f14e
   General Public License for more details.
Packit 33f14e
Packit 33f14e
   You should have received a copy of the GNU General Public License
Packit 33f14e
   along with this program.  If not, see <http://www.gnu.org/licenses/>.  */
Packit 33f14e
Packit 33f14e
#ifndef _UNISTR_H
Packit 33f14e
#define _UNISTR_H
Packit 33f14e
Packit 33f14e
#include "unitypes.h"
Packit 33f14e
Packit 33f14e
/* Get common macros for C.  */
Packit 33f14e
#include "unused-parameter.h"
Packit 33f14e
Packit 33f14e
/* Get bool.  */
Packit 33f14e
#include <stdbool.h>
Packit 33f14e
Packit 33f14e
/* Get size_t.  */
Packit 33f14e
#include <stddef.h>
Packit 33f14e
Packit 33f14e
#ifdef __cplusplus
Packit 33f14e
extern "C" {
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
Packit 33f14e
/* Conventions:
Packit 33f14e
Packit 33f14e
   All functions prefixed with u8_ operate on UTF-8 encoded strings.
Packit 33f14e
   Their unit is a uint8_t (1 byte).
Packit 33f14e
Packit 33f14e
   All functions prefixed with u16_ operate on UTF-16 encoded strings.
Packit 33f14e
   Their unit is a uint16_t (a 2-byte word).
Packit 33f14e
Packit 33f14e
   All functions prefixed with u32_ operate on UCS-4 encoded strings.
Packit 33f14e
   Their unit is a uint32_t (a 4-byte word).
Packit 33f14e
Packit 33f14e
   All argument pairs (s, n) denote a Unicode string s[0..n-1] with exactly
Packit 33f14e
   n units.
Packit 33f14e
Packit 33f14e
   All arguments starting with "str" and the arguments of functions starting
Packit 33f14e
   with u8_str/u16_str/u32_str denote a NUL terminated string, i.e. a string
Packit 33f14e
   which terminates at the first NUL unit.  This termination unit is
Packit 33f14e
   considered part of the string for all memory allocation purposes, but
Packit 33f14e
   is not considered part of the string for all other logical purposes.
Packit 33f14e
Packit 33f14e
   Functions returning a string result take a (resultbuf, lengthp) argument
Packit 33f14e
   pair.  If resultbuf is not NULL and the result fits into *lengthp units,
Packit 33f14e
   it is put in resultbuf, and resultbuf is returned.  Otherwise, a freshly
Packit 33f14e
   allocated string is returned.  In both cases, *lengthp is set to the
Packit 33f14e
   length (number of units) of the returned string.  In case of error,
Packit 33f14e
   NULL is returned and errno is set.  */
Packit 33f14e
Packit 33f14e
Packit 33f14e
/* Elementary string checks.  */
Packit 33f14e
Packit 33f14e
/* Check whether a UTF-8 string is well-formed.
Packit 33f14e
   Return NULL if valid, or a pointer to the first invalid unit otherwise.  */
Packit 33f14e
extern const uint8_t *
Packit 33f14e
       u8_check (const uint8_t *s, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Check whether a UTF-16 string is well-formed.
Packit 33f14e
   Return NULL if valid, or a pointer to the first invalid unit otherwise.  */
Packit 33f14e
extern const uint16_t *
Packit 33f14e
       u16_check (const uint16_t *s, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Check whether a UCS-4 string is well-formed.
Packit 33f14e
   Return NULL if valid, or a pointer to the first invalid unit otherwise.  */
Packit 33f14e
extern const uint32_t *
Packit 33f14e
       u32_check (const uint32_t *s, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
Packit 33f14e
/* Elementary string conversions.  */
Packit 33f14e
Packit 33f14e
/* Convert a UTF-8 string to a UTF-16 string.  */
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u8_to_u16 (const uint8_t *s, size_t n, uint16_t *resultbuf,
Packit 33f14e
                  size_t *lengthp);
Packit 33f14e
Packit 33f14e
/* Convert a UTF-8 string to a UCS-4 string.  */
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u8_to_u32 (const uint8_t *s, size_t n, uint32_t *resultbuf,
Packit 33f14e
                  size_t *lengthp);
Packit 33f14e
Packit 33f14e
/* Convert a UTF-16 string to a UTF-8 string.  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u16_to_u8 (const uint16_t *s, size_t n, uint8_t *resultbuf,
Packit 33f14e
                  size_t *lengthp);
Packit 33f14e
Packit 33f14e
/* Convert a UTF-16 string to a UCS-4 string.  */
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u16_to_u32 (const uint16_t *s, size_t n, uint32_t *resultbuf,
Packit 33f14e
                   size_t *lengthp);
Packit 33f14e
Packit 33f14e
/* Convert a UCS-4 string to a UTF-8 string.  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u32_to_u8 (const uint32_t *s, size_t n, uint8_t *resultbuf,
Packit 33f14e
                  size_t *lengthp);
Packit 33f14e
Packit 33f14e
/* Convert a UCS-4 string to a UTF-16 string.  */
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u32_to_u16 (const uint32_t *s, size_t n, uint16_t *resultbuf,
Packit 33f14e
                   size_t *lengthp);
Packit 33f14e
Packit 33f14e
Packit 33f14e
/* Elementary string functions.  */
Packit 33f14e
Packit 33f14e
/* Return the length (number of units) of the first character in S, which is
Packit 33f14e
   no longer than N.  Return 0 if it is the NUL character.  Return -1 upon
Packit 33f14e
   failure.  */
Packit 33f14e
/* Similar to mblen(), except that s must not be NULL.  */
Packit 33f14e
extern int
Packit 33f14e
       u8_mblen (const uint8_t *s, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern int
Packit 33f14e
       u16_mblen (const uint16_t *s, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern int
Packit 33f14e
       u32_mblen (const uint32_t *s, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Return the length (number of units) of the first character in S, putting
Packit 33f14e
   its 'ucs4_t' representation in *PUC.  Upon failure, *PUC is set to 0xfffd,
Packit 33f14e
   and an appropriate number of units is returned.
Packit 33f14e
   The number of available units, N, must be > 0.  */
Packit 33f14e
/* Similar to mbtowc(), except that puc and s must not be NULL, n must be > 0,
Packit 33f14e
   and the NUL character is not treated specially.  */
Packit 33f14e
/* The variants with _safe suffix are safe, even if the library is compiled
Packit 33f14e
   without --enable-safety.  */
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U8_MBTOUC_UNSAFE || HAVE_LIBUNISTRING
Packit 33f14e
# if !HAVE_INLINE
Packit 33f14e
extern int
Packit 33f14e
       u8_mbtouc_unsafe (ucs4_t *puc, const uint8_t *s, size_t n);
Packit 33f14e
# else
Packit 33f14e
extern int
Packit 33f14e
       u8_mbtouc_unsafe_aux (ucs4_t *puc, const uint8_t *s, size_t n);
Packit 33f14e
static inline int
Packit 33f14e
u8_mbtouc_unsafe (ucs4_t *puc, const uint8_t *s, size_t n)
Packit 33f14e
{
Packit 33f14e
  uint8_t c = *s;
Packit 33f14e
Packit 33f14e
  if (c < 0x80)
Packit 33f14e
    {
Packit 33f14e
      *puc = c;
Packit 33f14e
      return 1;
Packit 33f14e
    }
Packit 33f14e
  else
Packit 33f14e
    return u8_mbtouc_unsafe_aux (puc, s, n);
Packit 33f14e
}
Packit 33f14e
# endif
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U16_MBTOUC_UNSAFE || HAVE_LIBUNISTRING
Packit 33f14e
# if !HAVE_INLINE
Packit 33f14e
extern int
Packit 33f14e
       u16_mbtouc_unsafe (ucs4_t *puc, const uint16_t *s, size_t n);
Packit 33f14e
# else
Packit 33f14e
extern int
Packit 33f14e
       u16_mbtouc_unsafe_aux (ucs4_t *puc, const uint16_t *s, size_t n);
Packit 33f14e
static inline int
Packit 33f14e
u16_mbtouc_unsafe (ucs4_t *puc, const uint16_t *s, size_t n)
Packit 33f14e
{
Packit 33f14e
  uint16_t c = *s;
Packit 33f14e
Packit 33f14e
  if (c < 0xd800 || c >= 0xe000)
Packit 33f14e
    {
Packit 33f14e
      *puc = c;
Packit 33f14e
      return 1;
Packit 33f14e
    }
Packit 33f14e
  else
Packit 33f14e
    return u16_mbtouc_unsafe_aux (puc, s, n);
Packit 33f14e
}
Packit 33f14e
# endif
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U32_MBTOUC_UNSAFE || HAVE_LIBUNISTRING
Packit 33f14e
# if !HAVE_INLINE
Packit 33f14e
extern int
Packit 33f14e
       u32_mbtouc_unsafe (ucs4_t *puc, const uint32_t *s, size_t n);
Packit 33f14e
# else
Packit 33f14e
static inline int
Packit 33f14e
u32_mbtouc_unsafe (ucs4_t *puc,
Packit 33f14e
                   const uint32_t *s, size_t n _GL_UNUSED_PARAMETER)
Packit 33f14e
{
Packit 33f14e
  uint32_t c = *s;
Packit 33f14e
Packit 33f14e
  if (c < 0xd800 || (c >= 0xe000 && c < 0x110000))
Packit 33f14e
    *puc = c;
Packit 33f14e
  else
Packit 33f14e
    /* invalid multibyte character */
Packit 33f14e
    *puc = 0xfffd;
Packit 33f14e
  return 1;
Packit 33f14e
}
Packit 33f14e
# endif
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U8_MBTOUC || HAVE_LIBUNISTRING
Packit 33f14e
# if !HAVE_INLINE
Packit 33f14e
extern int
Packit 33f14e
       u8_mbtouc (ucs4_t *puc, const uint8_t *s, size_t n);
Packit 33f14e
# else
Packit 33f14e
extern int
Packit 33f14e
       u8_mbtouc_aux (ucs4_t *puc, const uint8_t *s, size_t n);
Packit 33f14e
static inline int
Packit 33f14e
u8_mbtouc (ucs4_t *puc, const uint8_t *s, size_t n)
Packit 33f14e
{
Packit 33f14e
  uint8_t c = *s;
Packit 33f14e
Packit 33f14e
  if (c < 0x80)
Packit 33f14e
    {
Packit 33f14e
      *puc = c;
Packit 33f14e
      return 1;
Packit 33f14e
    }
Packit 33f14e
  else
Packit 33f14e
    return u8_mbtouc_aux (puc, s, n);
Packit 33f14e
}
Packit 33f14e
# endif
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U16_MBTOUC || HAVE_LIBUNISTRING
Packit 33f14e
# if !HAVE_INLINE
Packit 33f14e
extern int
Packit 33f14e
       u16_mbtouc (ucs4_t *puc, const uint16_t *s, size_t n);
Packit 33f14e
# else
Packit 33f14e
extern int
Packit 33f14e
       u16_mbtouc_aux (ucs4_t *puc, const uint16_t *s, size_t n);
Packit 33f14e
static inline int
Packit 33f14e
u16_mbtouc (ucs4_t *puc, const uint16_t *s, size_t n)
Packit 33f14e
{
Packit 33f14e
  uint16_t c = *s;
Packit 33f14e
Packit 33f14e
  if (c < 0xd800 || c >= 0xe000)
Packit 33f14e
    {
Packit 33f14e
      *puc = c;
Packit 33f14e
      return 1;
Packit 33f14e
    }
Packit 33f14e
  else
Packit 33f14e
    return u16_mbtouc_aux (puc, s, n);
Packit 33f14e
}
Packit 33f14e
# endif
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U32_MBTOUC || HAVE_LIBUNISTRING
Packit 33f14e
# if !HAVE_INLINE
Packit 33f14e
extern int
Packit 33f14e
       u32_mbtouc (ucs4_t *puc, const uint32_t *s, size_t n);
Packit 33f14e
# else
Packit 33f14e
static inline int
Packit 33f14e
u32_mbtouc (ucs4_t *puc, const uint32_t *s, size_t n _GL_UNUSED_PARAMETER)
Packit 33f14e
{
Packit 33f14e
  uint32_t c = *s;
Packit 33f14e
Packit 33f14e
  if (c < 0xd800 || (c >= 0xe000 && c < 0x110000))
Packit 33f14e
    *puc = c;
Packit 33f14e
  else
Packit 33f14e
    /* invalid multibyte character */
Packit 33f14e
    *puc = 0xfffd;
Packit 33f14e
  return 1;
Packit 33f14e
}
Packit 33f14e
# endif
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
/* Return the length (number of units) of the first character in S, putting
Packit 33f14e
   its 'ucs4_t' representation in *PUC.  Upon failure, *PUC is set to 0xfffd,
Packit 33f14e
   and -1 is returned for an invalid sequence of units, -2 is returned for an
Packit 33f14e
   incomplete sequence of units.
Packit 33f14e
   The number of available units, N, must be > 0.  */
Packit 33f14e
/* Similar to u*_mbtouc(), except that the return value gives more details
Packit 33f14e
   about the failure, similar to mbrtowc().  */
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U8_MBTOUCR || HAVE_LIBUNISTRING
Packit 33f14e
extern int
Packit 33f14e
       u8_mbtoucr (ucs4_t *puc, const uint8_t *s, size_t n);
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U16_MBTOUCR || HAVE_LIBUNISTRING
Packit 33f14e
extern int
Packit 33f14e
       u16_mbtoucr (ucs4_t *puc, const uint16_t *s, size_t n);
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U32_MBTOUCR || HAVE_LIBUNISTRING
Packit 33f14e
extern int
Packit 33f14e
       u32_mbtoucr (ucs4_t *puc, const uint32_t *s, size_t n);
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
/* Put the multibyte character represented by UC in S, returning its
Packit 33f14e
   length.  Return -1 upon failure, -2 if the number of available units, N,
Packit 33f14e
   is too small.  The latter case cannot occur if N >= 6/2/1 for the
   u8_/u16_/u32_ variants, respectively.  */
Packit 33f14e
/* Similar to wctomb(), except that s must not be NULL, and the argument n
Packit 33f14e
   must be specified.  */
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U8_UCTOMB || HAVE_LIBUNISTRING
Packit 33f14e
/* Auxiliary function, also used by u8_chr, u8_strchr, u8_strrchr.  */
Packit 33f14e
extern int
Packit 33f14e
       u8_uctomb_aux (uint8_t *s, ucs4_t uc, int n);
Packit 33f14e
# if !HAVE_INLINE
Packit 33f14e
extern int
Packit 33f14e
       u8_uctomb (uint8_t *s, ucs4_t uc, int n);
Packit 33f14e
# else
Packit 33f14e
static inline int
Packit 33f14e
u8_uctomb (uint8_t *s, ucs4_t uc, int n)
Packit 33f14e
{
Packit 33f14e
  if (uc < 0x80 && n > 0)
Packit 33f14e
    {
Packit 33f14e
      s[0] = uc;
Packit 33f14e
      return 1;
Packit 33f14e
    }
Packit 33f14e
  else
Packit 33f14e
    return u8_uctomb_aux (s, uc, n);
Packit 33f14e
}
Packit 33f14e
# endif
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U16_UCTOMB || HAVE_LIBUNISTRING
Packit 33f14e
/* Auxiliary function, also used by u16_chr, u16_strchr, u16_strrchr.  */
Packit 33f14e
extern int
Packit 33f14e
       u16_uctomb_aux (uint16_t *s, ucs4_t uc, int n);
Packit 33f14e
# if !HAVE_INLINE
Packit 33f14e
extern int
Packit 33f14e
       u16_uctomb (uint16_t *s, ucs4_t uc, int n);
Packit 33f14e
# else
Packit 33f14e
static inline int
Packit 33f14e
u16_uctomb (uint16_t *s, ucs4_t uc, int n)
Packit 33f14e
{
Packit 33f14e
  if (uc < 0xd800 && n > 0)
Packit 33f14e
    {
Packit 33f14e
      s[0] = uc;
Packit 33f14e
      return 1;
Packit 33f14e
    }
Packit 33f14e
  else
Packit 33f14e
    return u16_uctomb_aux (s, uc, n);
Packit 33f14e
}
Packit 33f14e
# endif
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#if GNULIB_UNISTR_U32_UCTOMB || HAVE_LIBUNISTRING
Packit 33f14e
# if !HAVE_INLINE
Packit 33f14e
extern int
Packit 33f14e
       u32_uctomb (uint32_t *s, ucs4_t uc, int n);
Packit 33f14e
# else
Packit 33f14e
static inline int
Packit 33f14e
u32_uctomb (uint32_t *s, ucs4_t uc, int n)
Packit 33f14e
{
Packit 33f14e
  if (uc < 0xd800 || (uc >= 0xe000 && uc < 0x110000))
Packit 33f14e
    {
Packit 33f14e
      if (n > 0)
Packit 33f14e
        {
Packit 33f14e
          *s = uc;
Packit 33f14e
          return 1;
Packit 33f14e
        }
Packit 33f14e
      else
Packit 33f14e
        return -2;
Packit 33f14e
    }
Packit 33f14e
  else
Packit 33f14e
    return -1;
Packit 33f14e
}
Packit 33f14e
# endif
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
/* Copy N units from SRC to DEST.  */
Packit 33f14e
/* Similar to memcpy().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_cpy (uint8_t *dest, const uint8_t *src, size_t n);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_cpy (uint16_t *dest, const uint16_t *src, size_t n);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_cpy (uint32_t *dest, const uint32_t *src, size_t n);
Packit 33f14e
Packit 33f14e
/* Copy N units from SRC to DEST, guaranteeing correct behavior for
Packit 33f14e
   overlapping memory areas.  */
Packit 33f14e
/* Similar to memmove().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_move (uint8_t *dest, const uint8_t *src, size_t n);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_move (uint16_t *dest, const uint16_t *src, size_t n);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_move (uint32_t *dest, const uint32_t *src, size_t n);
Packit 33f14e
Packit 33f14e
/* Set the first N characters of S to UC.  UC should be a character that
Packit 33f14e
   occupies only 1 unit.  */
Packit 33f14e
/* Similar to memset().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_set (uint8_t *s, ucs4_t uc, size_t n);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_set (uint16_t *s, ucs4_t uc, size_t n);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_set (uint32_t *s, ucs4_t uc, size_t n);
Packit 33f14e
Packit 33f14e
/* Compare S1 and S2, each of length N.  */
Packit 33f14e
/* Similar to memcmp().  */
Packit 33f14e
extern int
Packit 33f14e
       u8_cmp (const uint8_t *s1, const uint8_t *s2, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern int
Packit 33f14e
       u16_cmp (const uint16_t *s1, const uint16_t *s2, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern int
Packit 33f14e
       u32_cmp (const uint32_t *s1, const uint32_t *s2, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Compare S1 and S2.  */
Packit 33f14e
/* Similar to the gnulib function memcmp2().  */
Packit 33f14e
extern int
Packit 33f14e
       u8_cmp2 (const uint8_t *s1, size_t n1, const uint8_t *s2, size_t n2)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern int
Packit 33f14e
       u16_cmp2 (const uint16_t *s1, size_t n1, const uint16_t *s2, size_t n2)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern int
Packit 33f14e
       u32_cmp2 (const uint32_t *s1, size_t n1, const uint32_t *s2, size_t n2)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Search the string at S for UC.  */
Packit 33f14e
/* Similar to memchr().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_chr (const uint8_t *s, size_t n, ucs4_t uc)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_chr (const uint16_t *s, size_t n, ucs4_t uc)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_chr (const uint32_t *s, size_t n, ucs4_t uc)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Count the number of Unicode characters in the N units from S.  */
Packit 33f14e
/* Similar to mbsnlen().  */
Packit 33f14e
extern size_t
Packit 33f14e
       u8_mbsnlen (const uint8_t *s, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern size_t
Packit 33f14e
       u16_mbsnlen (const uint16_t *s, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern size_t
Packit 33f14e
       u32_mbsnlen (const uint32_t *s, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Elementary string functions with memory allocation.  */
Packit 33f14e
Packit 33f14e
/* Make a freshly allocated copy of S, of length N.  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_cpy_alloc (const uint8_t *s, size_t n);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_cpy_alloc (const uint16_t *s, size_t n);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_cpy_alloc (const uint32_t *s, size_t n);
Packit 33f14e
Packit 33f14e
/* Elementary string functions on NUL terminated strings.  */
Packit 33f14e
Packit 33f14e
/* Return the length (number of units) of the first character in S.
Packit 33f14e
   Return 0 if it is the NUL character.  Return -1 upon failure.  */
Packit 33f14e
extern int
Packit 33f14e
       u8_strmblen (const uint8_t *s)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern int
Packit 33f14e
       u16_strmblen (const uint16_t *s)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern int
Packit 33f14e
       u32_strmblen (const uint32_t *s)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Return the length (number of units) of the first character in S, putting
Packit 33f14e
   its 'ucs4_t' representation in *PUC.  Return 0 if it is the NUL
Packit 33f14e
   character.  Return -1 upon failure.  */
Packit 33f14e
extern int
Packit 33f14e
       u8_strmbtouc (ucs4_t *puc, const uint8_t *s);
Packit 33f14e
extern int
Packit 33f14e
       u16_strmbtouc (ucs4_t *puc, const uint16_t *s);
Packit 33f14e
extern int
Packit 33f14e
       u32_strmbtouc (ucs4_t *puc, const uint32_t *s);
Packit 33f14e
Packit 33f14e
/* Forward iteration step.  Advances the pointer past the next character,
Packit 33f14e
   or returns NULL if the end of the string has been reached.  Puts the
Packit 33f14e
   character's 'ucs4_t' representation in *PUC.  */
Packit 33f14e
extern const uint8_t *
Packit 33f14e
       u8_next (ucs4_t *puc, const uint8_t *s);
Packit 33f14e
extern const uint16_t *
Packit 33f14e
       u16_next (ucs4_t *puc, const uint16_t *s);
Packit 33f14e
extern const uint32_t *
Packit 33f14e
       u32_next (ucs4_t *puc, const uint32_t *s);
Packit 33f14e
Packit 33f14e
/* Backward iteration step.  Advances the pointer to point to the previous
Packit 33f14e
   character, or returns NULL if the beginning of the string has been reached.
Packit 33f14e
   Puts the character's 'ucs4_t' representation in *PUC.  */
Packit 33f14e
extern const uint8_t *
Packit 33f14e
       u8_prev (ucs4_t *puc, const uint8_t *s, const uint8_t *start);
Packit 33f14e
extern const uint16_t *
Packit 33f14e
       u16_prev (ucs4_t *puc, const uint16_t *s, const uint16_t *start);
Packit 33f14e
extern const uint32_t *
Packit 33f14e
       u32_prev (ucs4_t *puc, const uint32_t *s, const uint32_t *start);
Packit 33f14e
Packit 33f14e
/* Return the number of units in S.  */
Packit 33f14e
/* Similar to strlen(), wcslen().  */
Packit 33f14e
extern size_t
Packit 33f14e
       u8_strlen (const uint8_t *s)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern size_t
Packit 33f14e
       u16_strlen (const uint16_t *s)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern size_t
Packit 33f14e
       u32_strlen (const uint32_t *s)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Return the number of units in S, but at most MAXLEN.  */
Packit 33f14e
/* Similar to strnlen(), wcsnlen().  */
Packit 33f14e
extern size_t
Packit 33f14e
       u8_strnlen (const uint8_t *s, size_t maxlen)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern size_t
Packit 33f14e
       u16_strnlen (const uint16_t *s, size_t maxlen)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern size_t
Packit 33f14e
       u32_strnlen (const uint32_t *s, size_t maxlen)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Copy SRC to DEST.  */
Packit 33f14e
/* Similar to strcpy(), wcscpy().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_strcpy (uint8_t *dest, const uint8_t *src);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_strcpy (uint16_t *dest, const uint16_t *src);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_strcpy (uint32_t *dest, const uint32_t *src);
Packit 33f14e
Packit 33f14e
/* Copy SRC to DEST, returning the address of the terminating NUL in DEST.  */
Packit 33f14e
/* Similar to stpcpy().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_stpcpy (uint8_t *dest, const uint8_t *src);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_stpcpy (uint16_t *dest, const uint16_t *src);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_stpcpy (uint32_t *dest, const uint32_t *src);
Packit 33f14e
Packit 33f14e
/* Copy no more than N units of SRC to DEST.  */
Packit 33f14e
/* Similar to strncpy(), wcsncpy().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_strncpy (uint8_t *dest, const uint8_t *src, size_t n);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_strncpy (uint16_t *dest, const uint16_t *src, size_t n);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_strncpy (uint32_t *dest, const uint32_t *src, size_t n);
Packit 33f14e
Packit 33f14e
/* Copy no more than N units of SRC to DEST.  Return a pointer past the last
Packit 33f14e
   non-NUL unit written into DEST.  */
Packit 33f14e
/* Similar to stpncpy().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_stpncpy (uint8_t *dest, const uint8_t *src, size_t n);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_stpncpy (uint16_t *dest, const uint16_t *src, size_t n);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_stpncpy (uint32_t *dest, const uint32_t *src, size_t n);
Packit 33f14e
Packit 33f14e
/* Append SRC onto DEST.  */
Packit 33f14e
/* Similar to strcat(), wcscat().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_strcat (uint8_t *dest, const uint8_t *src);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_strcat (uint16_t *dest, const uint16_t *src);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_strcat (uint32_t *dest, const uint32_t *src);
Packit 33f14e
Packit 33f14e
/* Append no more than N units of SRC onto DEST.  */
Packit 33f14e
/* Similar to strncat(), wcsncat().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_strncat (uint8_t *dest, const uint8_t *src, size_t n);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_strncat (uint16_t *dest, const uint16_t *src, size_t n);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_strncat (uint32_t *dest, const uint32_t *src, size_t n);
Packit 33f14e
Packit 33f14e
/* Compare S1 and S2.  */
Packit 33f14e
/* Similar to strcmp(), wcscmp().  */
Packit 33f14e
#ifdef __sun
Packit 33f14e
/* Avoid a collision with the u8_strcmp() function in Solaris 11 libc.  */
Packit 33f14e
extern int
Packit 33f14e
       u8_strcmp_gnu (const uint8_t *s1, const uint8_t *s2)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
# define u8_strcmp u8_strcmp_gnu
Packit 33f14e
#else
Packit 33f14e
extern int
Packit 33f14e
       u8_strcmp (const uint8_t *s1, const uint8_t *s2)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
#endif
Packit 33f14e
extern int
Packit 33f14e
       u16_strcmp (const uint16_t *s1, const uint16_t *s2)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern int
Packit 33f14e
       u32_strcmp (const uint32_t *s1, const uint32_t *s2)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Compare S1 and S2 using the collation rules of the current locale.
Packit 33f14e
   Return -1 if S1 < S2, 0 if S1 = S2, 1 if S1 > S2.
Packit 33f14e
   Upon failure, set errno and return any value.  */
Packit 33f14e
/* Similar to strcoll(), wcscoll().  */
Packit 33f14e
extern int
Packit 33f14e
       u8_strcoll (const uint8_t *s1, const uint8_t *s2);
Packit 33f14e
extern int
Packit 33f14e
       u16_strcoll (const uint16_t *s1, const uint16_t *s2);
Packit 33f14e
extern int
Packit 33f14e
       u32_strcoll (const uint32_t *s1, const uint32_t *s2);
Packit 33f14e
Packit 33f14e
/* Compare no more than N units of S1 and S2.  */
Packit 33f14e
/* Similar to strncmp(), wcsncmp().  */
Packit 33f14e
extern int
Packit 33f14e
       u8_strncmp (const uint8_t *s1, const uint8_t *s2, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern int
Packit 33f14e
       u16_strncmp (const uint16_t *s1, const uint16_t *s2, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern int
Packit 33f14e
       u32_strncmp (const uint32_t *s1, const uint32_t *s2, size_t n)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Duplicate S, returning an identical malloc'd string.  */
Packit 33f14e
/* Similar to strdup(), wcsdup().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_strdup (const uint8_t *s);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_strdup (const uint16_t *s);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_strdup (const uint32_t *s);
Packit 33f14e
Packit 33f14e
/* Find the first occurrence of UC in STR.  */
Packit 33f14e
/* Similar to strchr(), wcschr().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_strchr (const uint8_t *str, ucs4_t uc)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_strchr (const uint16_t *str, ucs4_t uc)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_strchr (const uint32_t *str, ucs4_t uc)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Find the last occurrence of UC in STR.  */
Packit 33f14e
/* Similar to strrchr(), wcsrchr().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_strrchr (const uint8_t *str, ucs4_t uc)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_strrchr (const uint16_t *str, ucs4_t uc)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_strrchr (const uint32_t *str, ucs4_t uc)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Return the length of the initial segment of STR which consists entirely
Packit 33f14e
   of Unicode characters not in REJECT.  */
Packit 33f14e
/* Similar to strcspn(), wcscspn().  */
Packit 33f14e
extern size_t
Packit 33f14e
       u8_strcspn (const uint8_t *str, const uint8_t *reject)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern size_t
Packit 33f14e
       u16_strcspn (const uint16_t *str, const uint16_t *reject)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern size_t
Packit 33f14e
       u32_strcspn (const uint32_t *str, const uint32_t *reject)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Return the length of the initial segment of STR which consists entirely
Packit 33f14e
   of Unicode characters in ACCEPT.  */
Packit 33f14e
/* Similar to strspn(), wcsspn().  */
Packit 33f14e
extern size_t
Packit 33f14e
       u8_strspn (const uint8_t *str, const uint8_t *accept)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern size_t
Packit 33f14e
       u16_strspn (const uint16_t *str, const uint16_t *accept)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern size_t
Packit 33f14e
       u32_strspn (const uint32_t *str, const uint32_t *accept)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Find the first occurrence in STR of any character in ACCEPT.  */
Packit 33f14e
/* Similar to strpbrk(), wcspbrk().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_strpbrk (const uint8_t *str, const uint8_t *accept)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_strpbrk (const uint16_t *str, const uint16_t *accept)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_strpbrk (const uint32_t *str, const uint32_t *accept)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Find the first occurrence of NEEDLE in HAYSTACK.  */
Packit 33f14e
/* Similar to strstr(), wcsstr().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_strstr (const uint8_t *haystack, const uint8_t *needle)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_strstr (const uint16_t *haystack, const uint16_t *needle)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_strstr (const uint32_t *haystack, const uint32_t *needle)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Test whether STR starts with PREFIX.  */
Packit 33f14e
extern bool
Packit 33f14e
       u8_startswith (const uint8_t *str, const uint8_t *prefix)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern bool
Packit 33f14e
       u16_startswith (const uint16_t *str, const uint16_t *prefix)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern bool
Packit 33f14e
       u32_startswith (const uint32_t *str, const uint32_t *prefix)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Test whether STR ends with SUFFIX.  */
Packit 33f14e
extern bool
Packit 33f14e
       u8_endswith (const uint8_t *str, const uint8_t *suffix)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern bool
Packit 33f14e
       u16_endswith (const uint16_t *str, const uint16_t *suffix)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
extern bool
Packit 33f14e
       u32_endswith (const uint32_t *str, const uint32_t *suffix)
Packit 33f14e
       _UC_ATTRIBUTE_PURE;
Packit 33f14e
Packit 33f14e
/* Divide STR into tokens separated by characters in DELIM.
Packit 33f14e
   This interface is actually more similar to wcstok than to strtok.  */
Packit 33f14e
/* Similar to strtok_r(), wcstok().  */
Packit 33f14e
extern uint8_t *
Packit 33f14e
       u8_strtok (uint8_t *str, const uint8_t *delim, uint8_t **ptr);
Packit 33f14e
extern uint16_t *
Packit 33f14e
       u16_strtok (uint16_t *str, const uint16_t *delim, uint16_t **ptr);
Packit 33f14e
extern uint32_t *
Packit 33f14e
       u32_strtok (uint32_t *str, const uint32_t *delim, uint32_t **ptr);
Packit 33f14e
Packit 33f14e
Packit 33f14e
#ifdef __cplusplus
Packit 33f14e
}
Packit 33f14e
#endif
Packit 33f14e
Packit 33f14e
#endif /* _UNISTR_H */