Blame lib/unistr.in.h

Packit Service a2489d
/* Elementary Unicode string functions.
Packit Service a2489d
   Copyright (C) 2001-2002, 2005-2018 Free Software Foundation, Inc.
Packit Service a2489d
Packit Service a2489d
   This program is free software: you can redistribute it and/or modify it
Packit Service a2489d
   under the terms of the GNU General Public License as published
Packit Service a2489d
   by the Free Software Foundation; either version 3 of the License, or
Packit Service a2489d
   (at your option) any later version.
Packit Service a2489d
Packit Service a2489d
   This program is distributed in the hope that it will be useful,
Packit Service a2489d
   but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit Service a2489d
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Packit Service a2489d
   General Public License for more details.
Packit Service a2489d
Packit Service a2489d
   You should have received a copy of the GNU General Public License
Packit Service a2489d
   along with this program.  If not, see <https://www.gnu.org/licenses/>.  */
Packit Service a2489d
Packit Service a2489d
#ifndef _UNISTR_H
Packit Service a2489d
#define _UNISTR_H
Packit Service a2489d
Packit Service a2489d
#include "unitypes.h"
Packit Service a2489d
Packit Service a2489d
/* Get common macros for C.  */
Packit Service a2489d
#include "unused-parameter.h"
Packit Service a2489d
Packit Service a2489d
/* Get bool.  */
Packit Service a2489d
#include <stdbool.h>
Packit Service a2489d
Packit Service a2489d
/* Get size_t.  */
Packit Service a2489d
#include <stddef.h>
Packit Service a2489d
Packit Service a2489d
#ifdef __cplusplus
Packit Service a2489d
extern "C" {
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
Packit Service a2489d
/* Conventions:
Packit Service a2489d
Packit Service a2489d
   All functions prefixed with u8_ operate on UTF-8 encoded strings.
Packit Service a2489d
   Their unit is a uint8_t (1 byte).
Packit Service a2489d
Packit Service a2489d
   All functions prefixed with u16_ operate on UTF-16 encoded strings.
Packit Service a2489d
   Their unit is a uint16_t (a 2-byte word).
Packit Service a2489d
Packit Service a2489d
   All functions prefixed with u32_ operate on UCS-4 encoded strings.
Packit Service a2489d
   Their unit is a uint32_t (a 4-byte word).
Packit Service a2489d
Packit Service a2489d
   All argument pairs (s, n) denote a Unicode string s[0..n-1] with exactly
Packit Service a2489d
   n units.
Packit Service a2489d
Packit Service a2489d
   All arguments starting with "str" and the arguments of functions starting
Packit Service a2489d
   with u8_str/u16_str/u32_str denote a NUL terminated string, i.e. a string
Packit Service a2489d
   which terminates at the first NUL unit.  This termination unit is
Packit Service a2489d
   considered part of the string for all memory allocation purposes, but
Packit Service a2489d
   is not considered part of the string for all other logical purposes.
Packit Service a2489d
Packit Service a2489d
   Functions returning a string result take a (resultbuf, lengthp) argument
Packit Service a2489d
   pair.  If resultbuf is not NULL and the result fits into *lengthp units,
Packit Service a2489d
   it is put in resultbuf, and resultbuf is returned.  Otherwise, a freshly
Packit Service a2489d
   allocated string is returned.  In both cases, *lengthp is set to the
Packit Service a2489d
   length (number of units) of the returned string.  In case of error,
Packit Service a2489d
   NULL is returned and errno is set.  */
Packit Service a2489d
Packit Service a2489d
Packit Service a2489d
/* Elementary string checks.  */
Packit Service a2489d
Packit Service a2489d
/* Check whether a UTF-8 string is well-formed.
Packit Service a2489d
   Return NULL if valid, or a pointer to the first invalid unit otherwise.  */
Packit Service a2489d
extern const uint8_t *
Packit Service a2489d
       u8_check (const uint8_t *s, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Check whether a UTF-16 string is well-formed.
Packit Service a2489d
   Return NULL if valid, or a pointer to the first invalid unit otherwise.  */
Packit Service a2489d
extern const uint16_t *
Packit Service a2489d
       u16_check (const uint16_t *s, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Check whether a UCS-4 string is well-formed.
Packit Service a2489d
   Return NULL if valid, or a pointer to the first invalid unit otherwise.  */
Packit Service a2489d
extern const uint32_t *
Packit Service a2489d
       u32_check (const uint32_t *s, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
Packit Service a2489d
/* Elementary string conversions.  */
Packit Service a2489d
Packit Service a2489d
/* Convert a UTF-8 string to a UTF-16 string.  */
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u8_to_u16 (const uint8_t *s, size_t n, uint16_t *resultbuf,
Packit Service a2489d
                  size_t *lengthp);
Packit Service a2489d
Packit Service a2489d
/* Convert a UTF-8 string to a UCS-4 string.  */
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u8_to_u32 (const uint8_t *s, size_t n, uint32_t *resultbuf,
Packit Service a2489d
                  size_t *lengthp);
Packit Service a2489d
Packit Service a2489d
/* Convert a UTF-16 string to a UTF-8 string.  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u16_to_u8 (const uint16_t *s, size_t n, uint8_t *resultbuf,
Packit Service a2489d
                  size_t *lengthp);
Packit Service a2489d
Packit Service a2489d
/* Convert a UTF-16 string to a UCS-4 string.  */
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u16_to_u32 (const uint16_t *s, size_t n, uint32_t *resultbuf,
Packit Service a2489d
                   size_t *lengthp);
Packit Service a2489d
Packit Service a2489d
/* Convert a UCS-4 string to a UTF-8 string.  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u32_to_u8 (const uint32_t *s, size_t n, uint8_t *resultbuf,
Packit Service a2489d
                  size_t *lengthp);
Packit Service a2489d
Packit Service a2489d
/* Convert a UCS-4 string to a UTF-16 string.  */
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u32_to_u16 (const uint32_t *s, size_t n, uint16_t *resultbuf,
Packit Service a2489d
                   size_t *lengthp);
Packit Service a2489d
Packit Service a2489d
Packit Service a2489d
/* Elementary string functions.  */
Packit Service a2489d
Packit Service a2489d
/* Return the length (number of units) of the first character in S, which is
Packit Service a2489d
   no longer than N.  Return 0 if it is the NUL character.  Return -1 upon
Packit Service a2489d
   failure.  */
Packit Service a2489d
/* Similar to mblen(), except that s must not be NULL.  */
Packit Service a2489d
extern int
Packit Service a2489d
       u8_mblen (const uint8_t *s, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern int
Packit Service a2489d
       u16_mblen (const uint16_t *s, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern int
Packit Service a2489d
       u32_mblen (const uint32_t *s, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Return the length (number of units) of the first character in S, putting
Packit Service a2489d
   its 'ucs4_t' representation in *PUC.  Upon failure, *PUC is set to 0xfffd,
Packit Service a2489d
   and an appropriate number of units is returned.
Packit Service a2489d
   The number of available units, N, must be > 0.  */
Packit Service a2489d
/* Similar to mbtowc(), except that puc and s must not be NULL, n must be > 0,
Packit Service a2489d
   and the NUL character is not treated specially.  */
Packit Service a2489d
/* The variants with _unsafe suffix are for backward compatibility with
Packit Service a2489d
   libunistring versions < 0.9.7.  */
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U8_MBTOUC_UNSAFE || HAVE_LIBUNISTRING
Packit Service a2489d
# if !HAVE_INLINE
Packit Service a2489d
extern int
Packit Service a2489d
       u8_mbtouc_unsafe (ucs4_t *puc, const uint8_t *s, size_t n);
Packit Service a2489d
# else
Packit Service a2489d
extern int
Packit Service a2489d
       u8_mbtouc_unsafe_aux (ucs4_t *puc, const uint8_t *s, size_t n);
Packit Service a2489d
static inline int
Packit Service a2489d
u8_mbtouc_unsafe (ucs4_t *puc, const uint8_t *s, size_t n)
Packit Service a2489d
{
Packit Service a2489d
  uint8_t c = *s;
Packit Service a2489d
Packit Service a2489d
  if (c < 0x80)
Packit Service a2489d
    {
Packit Service a2489d
      *puc = c;
Packit Service a2489d
      return 1;
Packit Service a2489d
    }
Packit Service a2489d
  else
Packit Service a2489d
    return u8_mbtouc_unsafe_aux (puc, s, n);
Packit Service a2489d
}
Packit Service a2489d
# endif
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U16_MBTOUC_UNSAFE || HAVE_LIBUNISTRING
Packit Service a2489d
# if !HAVE_INLINE
Packit Service a2489d
extern int
Packit Service a2489d
       u16_mbtouc_unsafe (ucs4_t *puc, const uint16_t *s, size_t n);
Packit Service a2489d
# else
Packit Service a2489d
extern int
Packit Service a2489d
       u16_mbtouc_unsafe_aux (ucs4_t *puc, const uint16_t *s, size_t n);
Packit Service a2489d
static inline int
Packit Service a2489d
u16_mbtouc_unsafe (ucs4_t *puc, const uint16_t *s, size_t n)
Packit Service a2489d
{
Packit Service a2489d
  uint16_t c = *s;
Packit Service a2489d
Packit Service a2489d
  if (c < 0xd800 || c >= 0xe000)
Packit Service a2489d
    {
Packit Service a2489d
      *puc = c;
Packit Service a2489d
      return 1;
Packit Service a2489d
    }
Packit Service a2489d
  else
Packit Service a2489d
    return u16_mbtouc_unsafe_aux (puc, s, n);
Packit Service a2489d
}
Packit Service a2489d
# endif
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U32_MBTOUC_UNSAFE || HAVE_LIBUNISTRING
Packit Service a2489d
# if !HAVE_INLINE
Packit Service a2489d
extern int
Packit Service a2489d
       u32_mbtouc_unsafe (ucs4_t *puc, const uint32_t *s, size_t n);
Packit Service a2489d
# else
Packit Service a2489d
static inline int
Packit Service a2489d
u32_mbtouc_unsafe (ucs4_t *puc,
Packit Service a2489d
                   const uint32_t *s, size_t n _GL_UNUSED_PARAMETER)
Packit Service a2489d
{
Packit Service a2489d
  uint32_t c = *s;
Packit Service a2489d
Packit Service a2489d
  if (c < 0xd800 || (c >= 0xe000 && c < 0x110000))
Packit Service a2489d
    *puc = c;
Packit Service a2489d
  else
Packit Service a2489d
    /* invalid multibyte character */
Packit Service a2489d
    *puc = 0xfffd;
Packit Service a2489d
  return 1;
Packit Service a2489d
}
Packit Service a2489d
# endif
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U8_MBTOUC || HAVE_LIBUNISTRING
Packit Service a2489d
# if !HAVE_INLINE
Packit Service a2489d
extern int
Packit Service a2489d
       u8_mbtouc (ucs4_t *puc, const uint8_t *s, size_t n);
Packit Service a2489d
# else
Packit Service a2489d
extern int
Packit Service a2489d
       u8_mbtouc_aux (ucs4_t *puc, const uint8_t *s, size_t n);
Packit Service a2489d
static inline int
Packit Service a2489d
u8_mbtouc (ucs4_t *puc, const uint8_t *s, size_t n)
Packit Service a2489d
{
Packit Service a2489d
  uint8_t c = *s;
Packit Service a2489d
Packit Service a2489d
  if (c < 0x80)
Packit Service a2489d
    {
Packit Service a2489d
      *puc = c;
Packit Service a2489d
      return 1;
Packit Service a2489d
    }
Packit Service a2489d
  else
Packit Service a2489d
    return u8_mbtouc_aux (puc, s, n);
Packit Service a2489d
}
Packit Service a2489d
# endif
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U16_MBTOUC || HAVE_LIBUNISTRING
Packit Service a2489d
# if !HAVE_INLINE
Packit Service a2489d
extern int
Packit Service a2489d
       u16_mbtouc (ucs4_t *puc, const uint16_t *s, size_t n);
Packit Service a2489d
# else
Packit Service a2489d
extern int
Packit Service a2489d
       u16_mbtouc_aux (ucs4_t *puc, const uint16_t *s, size_t n);
Packit Service a2489d
static inline int
Packit Service a2489d
u16_mbtouc (ucs4_t *puc, const uint16_t *s, size_t n)
Packit Service a2489d
{
Packit Service a2489d
  uint16_t c = *s;
Packit Service a2489d
Packit Service a2489d
  if (c < 0xd800 || c >= 0xe000)
Packit Service a2489d
    {
Packit Service a2489d
      *puc = c;
Packit Service a2489d
      return 1;
Packit Service a2489d
    }
Packit Service a2489d
  else
Packit Service a2489d
    return u16_mbtouc_aux (puc, s, n);
Packit Service a2489d
}
Packit Service a2489d
# endif
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U32_MBTOUC || HAVE_LIBUNISTRING
Packit Service a2489d
# if !HAVE_INLINE
Packit Service a2489d
extern int
Packit Service a2489d
       u32_mbtouc (ucs4_t *puc, const uint32_t *s, size_t n);
Packit Service a2489d
# else
Packit Service a2489d
static inline int
Packit Service a2489d
u32_mbtouc (ucs4_t *puc, const uint32_t *s, size_t n _GL_UNUSED_PARAMETER)
Packit Service a2489d
{
Packit Service a2489d
  uint32_t c = *s;
Packit Service a2489d
Packit Service a2489d
  if (c < 0xd800 || (c >= 0xe000 && c < 0x110000))
Packit Service a2489d
    *puc = c;
Packit Service a2489d
  else
Packit Service a2489d
    /* invalid multibyte character */
Packit Service a2489d
    *puc = 0xfffd;
Packit Service a2489d
  return 1;
Packit Service a2489d
}
Packit Service a2489d
# endif
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
/* Return the length (number of units) of the first character in S, putting
Packit Service a2489d
   its 'ucs4_t' representation in *PUC.  Upon failure, *PUC is set to 0xfffd,
Packit Service a2489d
   and -1 is returned for an invalid sequence of units, -2 is returned for an
Packit Service a2489d
   incomplete sequence of units.
Packit Service a2489d
   The number of available units, N, must be > 0.  */
Packit Service a2489d
/* Similar to u*_mbtouc(), except that the return value gives more details
Packit Service a2489d
   about the failure, similar to mbrtowc().  */
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U8_MBTOUCR || HAVE_LIBUNISTRING
Packit Service a2489d
extern int
Packit Service a2489d
       u8_mbtoucr (ucs4_t *puc, const uint8_t *s, size_t n);
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U16_MBTOUCR || HAVE_LIBUNISTRING
Packit Service a2489d
extern int
Packit Service a2489d
       u16_mbtoucr (ucs4_t *puc, const uint16_t *s, size_t n);
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U32_MBTOUCR || HAVE_LIBUNISTRING
Packit Service a2489d
extern int
Packit Service a2489d
       u32_mbtoucr (ucs4_t *puc, const uint32_t *s, size_t n);
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
/* Put the multibyte character represented by UC in S, returning its
Packit Service a2489d
   length.  Return -1 upon failure, -2 if the number of available units, N,
Packit Service a2489d
   is too small.  The latter case cannot occur if N >= 6/2/1, respectively.  */
Packit Service a2489d
/* Similar to wctomb(), except that s must not be NULL, and the argument n
Packit Service a2489d
   must be specified.  */
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U8_UCTOMB || HAVE_LIBUNISTRING
Packit Service a2489d
/* Auxiliary function, also used by u8_chr, u8_strchr, u8_strrchr.  */
Packit Service a2489d
extern int
Packit Service a2489d
       u8_uctomb_aux (uint8_t *s, ucs4_t uc, int n);
Packit Service a2489d
# if !HAVE_INLINE
Packit Service a2489d
extern int
Packit Service a2489d
       u8_uctomb (uint8_t *s, ucs4_t uc, int n);
Packit Service a2489d
# else
Packit Service a2489d
static inline int
Packit Service a2489d
u8_uctomb (uint8_t *s, ucs4_t uc, int n)
Packit Service a2489d
{
Packit Service a2489d
  if (uc < 0x80 && n > 0)
Packit Service a2489d
    {
Packit Service a2489d
      s[0] = uc;
Packit Service a2489d
      return 1;
Packit Service a2489d
    }
Packit Service a2489d
  else
Packit Service a2489d
    return u8_uctomb_aux (s, uc, n);
Packit Service a2489d
}
Packit Service a2489d
# endif
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U16_UCTOMB || HAVE_LIBUNISTRING
Packit Service a2489d
/* Auxiliary function, also used by u16_chr, u16_strchr, u16_strrchr.  */
Packit Service a2489d
extern int
Packit Service a2489d
       u16_uctomb_aux (uint16_t *s, ucs4_t uc, int n);
Packit Service a2489d
# if !HAVE_INLINE
Packit Service a2489d
extern int
Packit Service a2489d
       u16_uctomb (uint16_t *s, ucs4_t uc, int n);
Packit Service a2489d
# else
Packit Service a2489d
static inline int
Packit Service a2489d
u16_uctomb (uint16_t *s, ucs4_t uc, int n)
Packit Service a2489d
{
Packit Service a2489d
  if (uc < 0xd800 && n > 0)
Packit Service a2489d
    {
Packit Service a2489d
      s[0] = uc;
Packit Service a2489d
      return 1;
Packit Service a2489d
    }
Packit Service a2489d
  else
Packit Service a2489d
    return u16_uctomb_aux (s, uc, n);
Packit Service a2489d
}
Packit Service a2489d
# endif
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
#if GNULIB_UNISTR_U32_UCTOMB || HAVE_LIBUNISTRING
Packit Service a2489d
# if !HAVE_INLINE
Packit Service a2489d
extern int
Packit Service a2489d
       u32_uctomb (uint32_t *s, ucs4_t uc, int n);
Packit Service a2489d
# else
Packit Service a2489d
static inline int
Packit Service a2489d
u32_uctomb (uint32_t *s, ucs4_t uc, int n)
Packit Service a2489d
{
Packit Service a2489d
  if (uc < 0xd800 || (uc >= 0xe000 && uc < 0x110000))
Packit Service a2489d
    {
Packit Service a2489d
      if (n > 0)
Packit Service a2489d
        {
Packit Service a2489d
          *s = uc;
Packit Service a2489d
          return 1;
Packit Service a2489d
        }
Packit Service a2489d
      else
Packit Service a2489d
        return -2;
Packit Service a2489d
    }
Packit Service a2489d
  else
Packit Service a2489d
    return -1;
Packit Service a2489d
}
Packit Service a2489d
# endif
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
/* Copy N units from SRC to DEST.  */
Packit Service a2489d
/* Similar to memcpy().  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u8_cpy (uint8_t *dest, const uint8_t *src, size_t n);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_cpy (uint16_t *dest, const uint16_t *src, size_t n);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_cpy (uint32_t *dest, const uint32_t *src, size_t n);
Packit Service a2489d
Packit Service a2489d
/* Copy N units from SRC to DEST, guaranteeing correct behavior for
Packit Service a2489d
   overlapping memory areas.  */
Packit Service a2489d
/* Similar to memmove().  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u8_move (uint8_t *dest, const uint8_t *src, size_t n);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_move (uint16_t *dest, const uint16_t *src, size_t n);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_move (uint32_t *dest, const uint32_t *src, size_t n);
Packit Service a2489d
Packit Service a2489d
/* Set the first N characters of S to UC.  UC should be a character that
Packit Service a2489d
   occupies only 1 unit.  */
Packit Service a2489d
/* Similar to memset().  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u8_set (uint8_t *s, ucs4_t uc, size_t n);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_set (uint16_t *s, ucs4_t uc, size_t n);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_set (uint32_t *s, ucs4_t uc, size_t n);
Packit Service a2489d
Packit Service a2489d
/* Compare S1 and S2, each of length N.  */
Packit Service a2489d
/* Similar to memcmp().  */
Packit Service a2489d
extern int
Packit Service a2489d
       u8_cmp (const uint8_t *s1, const uint8_t *s2, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern int
Packit Service a2489d
       u16_cmp (const uint16_t *s1, const uint16_t *s2, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern int
Packit Service a2489d
       u32_cmp (const uint32_t *s1, const uint32_t *s2, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Compare S1 and S2.  */
Packit Service a2489d
/* Similar to the gnulib function memcmp2().  */
Packit Service a2489d
extern int
Packit Service a2489d
       u8_cmp2 (const uint8_t *s1, size_t n1, const uint8_t *s2, size_t n2)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern int
Packit Service a2489d
       u16_cmp2 (const uint16_t *s1, size_t n1, const uint16_t *s2, size_t n2)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern int
Packit Service a2489d
       u32_cmp2 (const uint32_t *s1, size_t n1, const uint32_t *s2, size_t n2)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Search the string at S for UC.  */
Packit Service a2489d
/* Similar to memchr().  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u8_chr (const uint8_t *s, size_t n, ucs4_t uc)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_chr (const uint16_t *s, size_t n, ucs4_t uc)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_chr (const uint32_t *s, size_t n, ucs4_t uc)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Count the number of Unicode characters in the N units from S.  */
Packit Service a2489d
/* Similar to mbsnlen().  */
Packit Service a2489d
extern size_t
Packit Service a2489d
       u8_mbsnlen (const uint8_t *s, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern size_t
Packit Service a2489d
       u16_mbsnlen (const uint16_t *s, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern size_t
Packit Service a2489d
       u32_mbsnlen (const uint32_t *s, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Elementary string functions with memory allocation.  */
Packit Service a2489d
Packit Service a2489d
/* Make a freshly allocated copy of S, of length N.  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u8_cpy_alloc (const uint8_t *s, size_t n);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_cpy_alloc (const uint16_t *s, size_t n);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_cpy_alloc (const uint32_t *s, size_t n);
Packit Service a2489d
Packit Service a2489d
/* Elementary string functions on NUL terminated strings.  */
Packit Service a2489d
Packit Service a2489d
/* Return the length (number of units) of the first character in S.
Packit Service a2489d
   Return 0 if it is the NUL character.  Return -1 upon failure.  */
Packit Service a2489d
extern int
Packit Service a2489d
       u8_strmblen (const uint8_t *s)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern int
Packit Service a2489d
       u16_strmblen (const uint16_t *s)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern int
Packit Service a2489d
       u32_strmblen (const uint32_t *s)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Return the length (number of units) of the first character in S, putting
Packit Service a2489d
   its 'ucs4_t' representation in *PUC.  Return 0 if it is the NUL
Packit Service a2489d
   character.  Return -1 upon failure.  */
Packit Service a2489d
extern int
Packit Service a2489d
       u8_strmbtouc (ucs4_t *puc, const uint8_t *s);
Packit Service a2489d
extern int
Packit Service a2489d
       u16_strmbtouc (ucs4_t *puc, const uint16_t *s);
Packit Service a2489d
extern int
Packit Service a2489d
       u32_strmbtouc (ucs4_t *puc, const uint32_t *s);
Packit Service a2489d
Packit Service a2489d
/* Forward iteration step.  Advances the pointer past the next character,
Packit Service a2489d
   or returns NULL if the end of the string has been reached.  Puts the
Packit Service a2489d
   character's 'ucs4_t' representation in *PUC.  */
Packit Service a2489d
extern const uint8_t *
Packit Service a2489d
       u8_next (ucs4_t *puc, const uint8_t *s);
Packit Service a2489d
extern const uint16_t *
Packit Service a2489d
       u16_next (ucs4_t *puc, const uint16_t *s);
Packit Service a2489d
extern const uint32_t *
Packit Service a2489d
       u32_next (ucs4_t *puc, const uint32_t *s);
Packit Service a2489d
Packit Service a2489d
/* Backward iteration step.  Advances the pointer to point to the previous
Packit Service a2489d
   character, or returns NULL if the beginning of the string had been reached.
Packit Service a2489d
   Puts the character's 'ucs4_t' representation in *PUC.  */
Packit Service a2489d
extern const uint8_t *
Packit Service a2489d
       u8_prev (ucs4_t *puc, const uint8_t *s, const uint8_t *start);
Packit Service a2489d
extern const uint16_t *
Packit Service a2489d
       u16_prev (ucs4_t *puc, const uint16_t *s, const uint16_t *start);
Packit Service a2489d
extern const uint32_t *
Packit Service a2489d
       u32_prev (ucs4_t *puc, const uint32_t *s, const uint32_t *start);
Packit Service a2489d
Packit Service a2489d
/* Return the number of units in S.  */
Packit Service a2489d
/* Similar to strlen(), wcslen().  */
Packit Service a2489d
extern size_t
Packit Service a2489d
       u8_strlen (const uint8_t *s)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern size_t
Packit Service a2489d
       u16_strlen (const uint16_t *s)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern size_t
Packit Service a2489d
       u32_strlen (const uint32_t *s)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Return the number of units in S, but at most MAXLEN.  */
Packit Service a2489d
/* Similar to strnlen(), wcsnlen().  */
Packit Service a2489d
extern size_t
Packit Service a2489d
       u8_strnlen (const uint8_t *s, size_t maxlen)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern size_t
Packit Service a2489d
       u16_strnlen (const uint16_t *s, size_t maxlen)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern size_t
Packit Service a2489d
       u32_strnlen (const uint32_t *s, size_t maxlen)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Copy SRC to DEST.  */
Packit Service a2489d
/* Similar to strcpy(), wcscpy().  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u8_strcpy (uint8_t *dest, const uint8_t *src);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_strcpy (uint16_t *dest, const uint16_t *src);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_strcpy (uint32_t *dest, const uint32_t *src);
Packit Service a2489d
Packit Service a2489d
/* Copy SRC to DEST, returning the address of the terminating NUL in DEST.  */
Packit Service a2489d
/* Similar to stpcpy().  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u8_stpcpy (uint8_t *dest, const uint8_t *src);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_stpcpy (uint16_t *dest, const uint16_t *src);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_stpcpy (uint32_t *dest, const uint32_t *src);
Packit Service a2489d
Packit Service a2489d
/* Copy no more than N units of SRC to DEST.  */
Packit Service a2489d
/* Similar to strncpy(), wcsncpy().  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u8_strncpy (uint8_t *dest, const uint8_t *src, size_t n);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_strncpy (uint16_t *dest, const uint16_t *src, size_t n);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_strncpy (uint32_t *dest, const uint32_t *src, size_t n);
Packit Service a2489d
Packit Service a2489d
/* Copy no more than N units of SRC to DEST.  Return a pointer past the last
Packit Service a2489d
   non-NUL unit written into DEST.  */
Packit Service a2489d
/* Similar to stpncpy().  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u8_stpncpy (uint8_t *dest, const uint8_t *src, size_t n);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_stpncpy (uint16_t *dest, const uint16_t *src, size_t n);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_stpncpy (uint32_t *dest, const uint32_t *src, size_t n);
Packit Service a2489d
Packit Service a2489d
/* Append SRC onto DEST.  */
Packit Service a2489d
/* Similar to strcat(), wcscat().  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u8_strcat (uint8_t *dest, const uint8_t *src);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_strcat (uint16_t *dest, const uint16_t *src);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_strcat (uint32_t *dest, const uint32_t *src);
Packit Service a2489d
Packit Service a2489d
/* Append no more than N units of SRC onto DEST.  */
Packit Service a2489d
/* Similar to strncat(), wcsncat().  */
Packit Service a2489d
extern uint8_t *
Packit Service a2489d
       u8_strncat (uint8_t *dest, const uint8_t *src, size_t n);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_strncat (uint16_t *dest, const uint16_t *src, size_t n);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_strncat (uint32_t *dest, const uint32_t *src, size_t n);
Packit Service a2489d
Packit Service a2489d
/* Compare S1 and S2.  */
Packit Service a2489d
/* Similar to strcmp(), wcscmp().  */
Packit Service a2489d
/* Neither string is modified.  The result is an int; its sign convention
   is presumably that of strcmp() (confirm against the implementation).
   _UC_ATTRIBUTE_PURE is defined outside this part of the file; presumably
   it marks the function as free of side effects for the compiler.

   When __sun is defined, the 8-bit variant is declared under the name
   u8_strcmp_gnu and u8_strcmp becomes a macro that expands to it, so
   callers keep writing u8_strcmp in both configurations.  */
#ifdef __sun
Packit Service a2489d
/* Avoid a collision with the u8_strcmp() function in Solaris 11 libc.  */
Packit Service a2489d
extern int
Packit Service a2489d
       u8_strcmp_gnu (const uint8_t *s1, const uint8_t *s2)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
# define u8_strcmp u8_strcmp_gnu
Packit Service a2489d
#else
Packit Service a2489d
extern int
Packit Service a2489d
       u8_strcmp (const uint8_t *s1, const uint8_t *s2)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
#endif
Packit Service a2489d
extern int
Packit Service a2489d
       u16_strcmp (const uint16_t *s1, const uint16_t *s2)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern int
Packit Service a2489d
       u32_strcmp (const uint32_t *s1, const uint32_t *s2)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Compare S1 and S2 using the collation rules of the current locale.
Packit Service a2489d
   Return -1 if S1 < S2, 0 if S1 = S2, 1 if S1 > S2.
Packit Service a2489d
   Upon failure, set errno and return any value.  */
Packit Service a2489d
/* Similar to strcoll(), wcscoll().  */
Packit Service a2489d
/* Because the return value is unspecified on failure, it cannot signal an
   error by itself; a caller that needs to detect failure presumably has
   to set errno to 0 before the call and inspect it afterwards (confirm
   against the implementation).  Unlike the u8_strcmp family, these
   declarations do not carry _UC_ATTRIBUTE_PURE, which is consistent with
   their documented dependence on the current locale and use of errno.  */
extern int
Packit Service a2489d
       u8_strcoll (const uint8_t *s1, const uint8_t *s2);
Packit Service a2489d
extern int
Packit Service a2489d
       u16_strcoll (const uint16_t *s1, const uint16_t *s2);
Packit Service a2489d
extern int
Packit Service a2489d
       u32_strcoll (const uint32_t *s1, const uint32_t *s2);
Packit Service a2489d
Packit Service a2489d
/* Compare no more than N units of S1 and S2.  */
Packit Service a2489d
/* Similar to strncmp(), wcsncmp().  */
Packit Service a2489d
/* N is counted in units (uint8_t, uint16_t or uint32_t respectively), not
   in characters.  Neither string is modified.  The sign convention of the
   int result is presumably that of strncmp() (confirm against the
   implementation).  */
extern int
Packit Service a2489d
       u8_strncmp (const uint8_t *s1, const uint8_t *s2, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern int
Packit Service a2489d
       u16_strncmp (const uint16_t *s1, const uint16_t *s2, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern int
Packit Service a2489d
       u32_strncmp (const uint32_t *s1, const uint32_t *s2, size_t n)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Duplicate S, returning an identical malloc'd string.  */
Packit Service a2489d
/* Similar to strdup(), wcsdup().  */
Packit Service a2489d
/* S is only read.  Since the result is malloc'd, the caller presumably
   owns it and releases it with free().  The behaviour on allocation
   failure is not visible here; presumably NULL is returned, as for
   strdup() (confirm against the implementation).  */
extern uint8_t *
Packit Service a2489d
       u8_strdup (const uint8_t *s);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_strdup (const uint16_t *s);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_strdup (const uint32_t *s);
Packit Service a2489d
Packit Service a2489d
/* Find the first occurrence of UC in STR.  */
Packit Service a2489d
/* Similar to strchr(), wcschr().  */
Packit Service a2489d
/* UC is passed as a ucs4_t in all three variants, whatever the unit width
   of STR.  The result is a non-const pointer although STR is const, the
   same shape as strchr().  The value returned when UC does not occur is
   not visible here; presumably NULL (confirm against the
   implementation).  */
extern uint8_t *
Packit Service a2489d
       u8_strchr (const uint8_t *str, ucs4_t uc)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_strchr (const uint16_t *str, ucs4_t uc)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_strchr (const uint32_t *str, ucs4_t uc)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Find the last occurrence of UC in STR.  */
Packit Service a2489d
/* Similar to strrchr(), wcsrchr().  */
Packit Service a2489d
/* Same parameter shape as the u8_strchr family: UC is a ucs4_t in all
   three variants, and the result is a non-const pointer although STR is
   const.  The value returned when UC does not occur is not visible here;
   presumably NULL (confirm against the implementation).  */
extern uint8_t *
Packit Service a2489d
       u8_strrchr (const uint8_t *str, ucs4_t uc)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_strrchr (const uint16_t *str, ucs4_t uc)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_strrchr (const uint32_t *str, ucs4_t uc)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Return the length of the initial segment of STR which consists entirely
Packit Service a2489d
   of Unicode characters not in REJECT.  */
Packit Service a2489d
/* Similar to strcspn(), wcscspn().  */
Packit Service a2489d
/* REJECT is itself a string in the same encoding as STR and is treated as
   a set of characters.  Neither argument is modified.  The size_t result
   is presumably counted in units rather than in characters (confirm
   against the implementation).  */
extern size_t
Packit Service a2489d
       u8_strcspn (const uint8_t *str, const uint8_t *reject)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern size_t
Packit Service a2489d
       u16_strcspn (const uint16_t *str, const uint16_t *reject)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern size_t
Packit Service a2489d
       u32_strcspn (const uint32_t *str, const uint32_t *reject)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Return the length of the initial segment of STR which consists entirely
Packit Service a2489d
   of Unicode characters in ACCEPT.  */
Packit Service a2489d
/* Similar to strspn(), wcsspn().  */
Packit Service a2489d
/* ACCEPT is itself a string in the same encoding as STR and is treated as
   a set of characters.  Neither argument is modified.  The size_t result
   is presumably counted in units rather than in characters (confirm
   against the implementation).  */
extern size_t
Packit Service a2489d
       u8_strspn (const uint8_t *str, const uint8_t *accept)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern size_t
Packit Service a2489d
       u16_strspn (const uint16_t *str, const uint16_t *accept)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern size_t
Packit Service a2489d
       u32_strspn (const uint32_t *str, const uint32_t *accept)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Find the first occurrence in STR of any character in ACCEPT.  */
Packit Service a2489d
/* Similar to strpbrk(), wcspbrk().  */
Packit Service a2489d
/* ACCEPT is a string in the same encoding as STR and is treated as a set
   of characters.  The result is a non-const pointer although STR is
   const, the same shape as strpbrk().  The value returned when no
   character of ACCEPT occurs is not visible here; presumably NULL
   (confirm against the implementation).  */
extern uint8_t *
Packit Service a2489d
       u8_strpbrk (const uint8_t *str, const uint8_t *accept)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_strpbrk (const uint16_t *str, const uint16_t *accept)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_strpbrk (const uint32_t *str, const uint32_t *accept)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Find the first occurrence of NEEDLE in HAYSTACK.  */
Packit Service a2489d
/* Similar to strstr(), wcsstr().  */
Packit Service a2489d
/* Both arguments are strings in the same encoding and neither is
   modified.  The result is a non-const pointer although HAYSTACK is
   const, the same shape as strstr().  The value returned when NEEDLE does
   not occur, and the treatment of an empty NEEDLE, are not visible here;
   presumably both follow strstr() (confirm against the implementation).  */
extern uint8_t *
Packit Service a2489d
       u8_strstr (const uint8_t *haystack, const uint8_t *needle)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_strstr (const uint16_t *haystack, const uint16_t *needle)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_strstr (const uint32_t *haystack, const uint32_t *needle)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Test whether STR starts with PREFIX.  */
Packit Service a2489d
/* Both arguments are strings in the same encoding and neither is
   modified.  The result is a bool.  The result for an empty PREFIX is not
   visible here; presumably true (confirm against the implementation).  */
extern bool
Packit Service a2489d
       u8_startswith (const uint8_t *str, const uint8_t *prefix)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern bool
Packit Service a2489d
       u16_startswith (const uint16_t *str, const uint16_t *prefix)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern bool
Packit Service a2489d
       u32_startswith (const uint32_t *str, const uint32_t *prefix)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Test whether STR ends with SUFFIX.  */
Packit Service a2489d
/* Both arguments are strings in the same encoding and neither is
   modified.  The result is a bool.  The result for an empty SUFFIX is not
   visible here; presumably true (confirm against the implementation).  */
extern bool
Packit Service a2489d
       u8_endswith (const uint8_t *str, const uint8_t *suffix)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern bool
Packit Service a2489d
       u16_endswith (const uint16_t *str, const uint16_t *suffix)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
extern bool
Packit Service a2489d
       u32_endswith (const uint32_t *str, const uint32_t *suffix)
Packit Service a2489d
       _UC_ATTRIBUTE_PURE;
Packit Service a2489d
Packit Service a2489d
/* Divide STR into tokens separated by characters in DELIM.
Packit Service a2489d
   This interface is actually more similar to wcstok than to strtok.  */
Packit Service a2489d
/* Similar to strtok_r(), wcstok().  */
Packit Service a2489d
/* STR is non-const, so the string is presumably modified in place while
   it is being split, as strtok_r() does.  DELIM is only read and is
   treated as a set of characters.  PTR points to caller-provided storage
   for a pointer into the string; presumably it keeps the scan position
   between calls, like the save pointer of strtok_r() and wcstok(), with
   STR passed as NULL on follow-up calls (confirm against the
   implementation).  */
extern uint8_t *
Packit Service a2489d
       u8_strtok (uint8_t *str, const uint8_t *delim, uint8_t **ptr);
Packit Service a2489d
extern uint16_t *
Packit Service a2489d
       u16_strtok (uint16_t *str, const uint16_t *delim, uint16_t **ptr);
Packit Service a2489d
extern uint32_t *
Packit Service a2489d
       u32_strtok (uint32_t *str, const uint32_t *delim, uint32_t **ptr);
Packit Service a2489d
Packit Service a2489d
Packit Service a2489d
#ifdef __cplusplus
Packit Service a2489d
}
Packit Service a2489d
#endif
Packit Service a2489d
Packit Service a2489d
#endif /* _UNISTR_H */