Blame lib/unistr.in.h

Packit 8f70b4
/* Elementary Unicode string functions.
Packit 8f70b4
   Copyright (C) 2001-2002, 2005-2018 Free Software Foundation, Inc.
Packit 8f70b4
Packit 8f70b4
   This program is free software: you can redistribute it and/or modify it
Packit 8f70b4
   under the terms of the GNU General Public License as published
Packit 8f70b4
   by the Free Software Foundation; either version 3 of the License, or
Packit 8f70b4
   (at your option) any later version.
Packit 8f70b4
Packit 8f70b4
   This program is distributed in the hope that it will be useful,
Packit 8f70b4
   but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit 8f70b4
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Packit 8f70b4
   General Public License for more details.
Packit 8f70b4
Packit 8f70b4
   You should have received a copy of the GNU General Public License
Packit 8f70b4
   along with this program.  If not, see <https://www.gnu.org/licenses/>.  */
Packit 8f70b4
Packit 8f70b4
#ifndef _UNISTR_H
Packit 8f70b4
#define _UNISTR_H
Packit 8f70b4
Packit 8f70b4
#include "unitypes.h"
Packit 8f70b4
Packit 8f70b4
/* Get common macros for C.  */
Packit 8f70b4
#include "unused-parameter.h"
Packit 8f70b4
Packit 8f70b4
/* Get bool.  */
Packit 8f70b4
#include <stdbool.h>
Packit 8f70b4
Packit 8f70b4
/* Get size_t.  */
Packit 8f70b4
#include <stddef.h>
Packit 8f70b4
Packit 8f70b4
#ifdef __cplusplus
Packit 8f70b4
extern "C" {
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
Packit 8f70b4
/* Conventions:
Packit 8f70b4
Packit 8f70b4
   All functions prefixed with u8_ operate on UTF-8 encoded strings.
Packit 8f70b4
   Their unit is a uint8_t (1 byte).
Packit 8f70b4
Packit 8f70b4
   All functions prefixed with u16_ operate on UTF-16 encoded strings.
Packit 8f70b4
   Their unit is a uint16_t (a 2-byte word).
Packit 8f70b4
Packit 8f70b4
   All functions prefixed with u32_ operate on UCS-4 encoded strings.
Packit 8f70b4
   Their unit is a uint32_t (a 4-byte word).
Packit 8f70b4
Packit 8f70b4
   All argument pairs (s, n) denote a Unicode string s[0..n-1] with exactly
Packit 8f70b4
   n units.
Packit 8f70b4
Packit 8f70b4
   All arguments starting with "str" and the arguments of functions starting
Packit 8f70b4
   with u8_str/u16_str/u32_str denote a NUL terminated string, i.e. a string
Packit 8f70b4
   which terminates at the first NUL unit.  This termination unit is
Packit 8f70b4
   considered part of the string for all memory allocation purposes, but
Packit 8f70b4
   is not considered part of the string for all other logical purposes.
Packit 8f70b4
Packit 8f70b4
   Functions returning a string result take a (resultbuf, lengthp) argument
Packit 8f70b4
   pair.  If resultbuf is not NULL and the result fits into *lengthp units,
Packit 8f70b4
   it is put in resultbuf, and resultbuf is returned.  Otherwise, a freshly
Packit 8f70b4
   allocated string is returned.  In both cases, *lengthp is set to the
Packit 8f70b4
   length (number of units) of the returned string.  In case of error,
Packit 8f70b4
   NULL is returned and errno is set.  */
Packit 8f70b4
Packit 8f70b4
Packit 8f70b4
/* Elementary string checks.  */
Packit 8f70b4
Packit 8f70b4
/* Check whether a UTF-8 string is well-formed.
Packit 8f70b4
   Return NULL if valid, or a pointer to the first invalid unit otherwise.  */
Packit 8f70b4
extern const uint8_t *
Packit 8f70b4
       u8_check (const uint8_t *s, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Check whether a UTF-16 string is well-formed.
Packit 8f70b4
   Return NULL if valid, or a pointer to the first invalid unit otherwise.  */
Packit 8f70b4
extern const uint16_t *
Packit 8f70b4
       u16_check (const uint16_t *s, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Check whether a UCS-4 string is well-formed.
Packit 8f70b4
   Return NULL if valid, or a pointer to the first invalid unit otherwise.  */
Packit 8f70b4
extern const uint32_t *
Packit 8f70b4
       u32_check (const uint32_t *s, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
Packit 8f70b4
/* Elementary string conversions.  */
Packit 8f70b4
Packit 8f70b4
/* Convert a UTF-8 string to a UTF-16 string.  */
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u8_to_u16 (const uint8_t *s, size_t n, uint16_t *resultbuf,
Packit 8f70b4
                  size_t *lengthp);
Packit 8f70b4
Packit 8f70b4
/* Convert a UTF-8 string to a UCS-4 string.  */
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u8_to_u32 (const uint8_t *s, size_t n, uint32_t *resultbuf,
Packit 8f70b4
                  size_t *lengthp);
Packit 8f70b4
Packit 8f70b4
/* Convert a UTF-16 string to a UTF-8 string.  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u16_to_u8 (const uint16_t *s, size_t n, uint8_t *resultbuf,
Packit 8f70b4
                  size_t *lengthp);
Packit 8f70b4
Packit 8f70b4
/* Convert a UTF-16 string to a UCS-4 string.  */
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u16_to_u32 (const uint16_t *s, size_t n, uint32_t *resultbuf,
Packit 8f70b4
                   size_t *lengthp);
Packit 8f70b4
Packit 8f70b4
/* Convert a UCS-4 string to a UTF-8 string.  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u32_to_u8 (const uint32_t *s, size_t n, uint8_t *resultbuf,
Packit 8f70b4
                  size_t *lengthp);
Packit 8f70b4
Packit 8f70b4
/* Convert a UCS-4 string to a UTF-16 string.  */
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u32_to_u16 (const uint32_t *s, size_t n, uint16_t *resultbuf,
Packit 8f70b4
                   size_t *lengthp);
Packit 8f70b4
Packit 8f70b4
Packit 8f70b4
/* Elementary string functions.  */
Packit 8f70b4
Packit 8f70b4
/* Return the length (number of units) of the first character in S, which is
Packit 8f70b4
   no longer than N.  Return 0 if it is the NUL character.  Return -1 upon
Packit 8f70b4
   failure.  */
Packit 8f70b4
/* Similar to mblen(), except that s must not be NULL.  */
Packit 8f70b4
extern int
Packit 8f70b4
       u8_mblen (const uint8_t *s, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern int
Packit 8f70b4
       u16_mblen (const uint16_t *s, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern int
Packit 8f70b4
       u32_mblen (const uint32_t *s, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Return the length (number of units) of the first character in S, putting
Packit 8f70b4
   its 'ucs4_t' representation in *PUC.  Upon failure, *PUC is set to 0xfffd,
Packit 8f70b4
   and an appropriate number of units is returned.
Packit 8f70b4
   The number of available units, N, must be > 0.  */
Packit 8f70b4
/* Similar to mbtowc(), except that puc and s must not be NULL, n must be > 0,
Packit 8f70b4
   and the NUL character is not treated specially.  */
Packit 8f70b4
/* The variants with _unsafe suffix are for backward compatibility with
Packit 8f70b4
   libunistring versions < 0.9.7.  */
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U8_MBTOUC_UNSAFE || HAVE_LIBUNISTRING
Packit 8f70b4
# if !HAVE_INLINE
Packit 8f70b4
extern int
Packit 8f70b4
       u8_mbtouc_unsafe (ucs4_t *puc, const uint8_t *s, size_t n);
Packit 8f70b4
# else
Packit 8f70b4
extern int
Packit 8f70b4
       u8_mbtouc_unsafe_aux (ucs4_t *puc, const uint8_t *s, size_t n);
Packit 8f70b4
static inline int
Packit 8f70b4
u8_mbtouc_unsafe (ucs4_t *puc, const uint8_t *s, size_t n)
Packit 8f70b4
{
Packit 8f70b4
  uint8_t c = *s;
Packit 8f70b4
Packit 8f70b4
  if (c < 0x80)
Packit 8f70b4
    {
Packit 8f70b4
      *puc = c;
Packit 8f70b4
      return 1;
Packit 8f70b4
    }
Packit 8f70b4
  else
Packit 8f70b4
    return u8_mbtouc_unsafe_aux (puc, s, n);
Packit 8f70b4
}
Packit 8f70b4
# endif
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U16_MBTOUC_UNSAFE || HAVE_LIBUNISTRING
Packit 8f70b4
# if !HAVE_INLINE
Packit 8f70b4
extern int
Packit 8f70b4
       u16_mbtouc_unsafe (ucs4_t *puc, const uint16_t *s, size_t n);
Packit 8f70b4
# else
Packit 8f70b4
extern int
Packit 8f70b4
       u16_mbtouc_unsafe_aux (ucs4_t *puc, const uint16_t *s, size_t n);
Packit 8f70b4
static inline int
Packit 8f70b4
u16_mbtouc_unsafe (ucs4_t *puc, const uint16_t *s, size_t n)
Packit 8f70b4
{
Packit 8f70b4
  uint16_t c = *s;
Packit 8f70b4
Packit 8f70b4
  if (c < 0xd800 || c >= 0xe000)
Packit 8f70b4
    {
Packit 8f70b4
      *puc = c;
Packit 8f70b4
      return 1;
Packit 8f70b4
    }
Packit 8f70b4
  else
Packit 8f70b4
    return u16_mbtouc_unsafe_aux (puc, s, n);
Packit 8f70b4
}
Packit 8f70b4
# endif
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U32_MBTOUC_UNSAFE || HAVE_LIBUNISTRING
Packit 8f70b4
# if !HAVE_INLINE
Packit 8f70b4
extern int
Packit 8f70b4
       u32_mbtouc_unsafe (ucs4_t *puc, const uint32_t *s, size_t n);
Packit 8f70b4
# else
Packit 8f70b4
static inline int
Packit 8f70b4
u32_mbtouc_unsafe (ucs4_t *puc,
Packit 8f70b4
                   const uint32_t *s, size_t n _GL_UNUSED_PARAMETER)
Packit 8f70b4
{
Packit 8f70b4
  uint32_t c = *s;
Packit 8f70b4
Packit 8f70b4
  if (c < 0xd800 || (c >= 0xe000 && c < 0x110000))
Packit 8f70b4
    *puc = c;
Packit 8f70b4
  else
Packit 8f70b4
    /* invalid multibyte character */
Packit 8f70b4
    *puc = 0xfffd;
Packit 8f70b4
  return 1;
Packit 8f70b4
}
Packit 8f70b4
# endif
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U8_MBTOUC || HAVE_LIBUNISTRING
Packit 8f70b4
# if !HAVE_INLINE
Packit 8f70b4
extern int
Packit 8f70b4
       u8_mbtouc (ucs4_t *puc, const uint8_t *s, size_t n);
Packit 8f70b4
# else
Packit 8f70b4
extern int
Packit 8f70b4
       u8_mbtouc_aux (ucs4_t *puc, const uint8_t *s, size_t n);
Packit 8f70b4
static inline int
Packit 8f70b4
u8_mbtouc (ucs4_t *puc, const uint8_t *s, size_t n)
Packit 8f70b4
{
Packit 8f70b4
  uint8_t c = *s;
Packit 8f70b4
Packit 8f70b4
  if (c < 0x80)
Packit 8f70b4
    {
Packit 8f70b4
      *puc = c;
Packit 8f70b4
      return 1;
Packit 8f70b4
    }
Packit 8f70b4
  else
Packit 8f70b4
    return u8_mbtouc_aux (puc, s, n);
Packit 8f70b4
}
Packit 8f70b4
# endif
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U16_MBTOUC || HAVE_LIBUNISTRING
Packit 8f70b4
# if !HAVE_INLINE
Packit 8f70b4
extern int
Packit 8f70b4
       u16_mbtouc (ucs4_t *puc, const uint16_t *s, size_t n);
Packit 8f70b4
# else
Packit 8f70b4
extern int
Packit 8f70b4
       u16_mbtouc_aux (ucs4_t *puc, const uint16_t *s, size_t n);
Packit 8f70b4
static inline int
Packit 8f70b4
u16_mbtouc (ucs4_t *puc, const uint16_t *s, size_t n)
Packit 8f70b4
{
Packit 8f70b4
  uint16_t c = *s;
Packit 8f70b4
Packit 8f70b4
  if (c < 0xd800 || c >= 0xe000)
Packit 8f70b4
    {
Packit 8f70b4
      *puc = c;
Packit 8f70b4
      return 1;
Packit 8f70b4
    }
Packit 8f70b4
  else
Packit 8f70b4
    return u16_mbtouc_aux (puc, s, n);
Packit 8f70b4
}
Packit 8f70b4
# endif
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U32_MBTOUC || HAVE_LIBUNISTRING
Packit 8f70b4
# if !HAVE_INLINE
Packit 8f70b4
extern int
Packit 8f70b4
       u32_mbtouc (ucs4_t *puc, const uint32_t *s, size_t n);
Packit 8f70b4
# else
Packit 8f70b4
static inline int
Packit 8f70b4
u32_mbtouc (ucs4_t *puc, const uint32_t *s, size_t n _GL_UNUSED_PARAMETER)
Packit 8f70b4
{
Packit 8f70b4
  uint32_t c = *s;
Packit 8f70b4
Packit 8f70b4
  if (c < 0xd800 || (c >= 0xe000 && c < 0x110000))
Packit 8f70b4
    *puc = c;
Packit 8f70b4
  else
Packit 8f70b4
    /* invalid multibyte character */
Packit 8f70b4
    *puc = 0xfffd;
Packit 8f70b4
  return 1;
Packit 8f70b4
}
Packit 8f70b4
# endif
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
/* Return the length (number of units) of the first character in S, putting
Packit 8f70b4
   its 'ucs4_t' representation in *PUC.  Upon failure, *PUC is set to 0xfffd,
Packit 8f70b4
   and -1 is returned for an invalid sequence of units, -2 is returned for an
Packit 8f70b4
   incomplete sequence of units.
Packit 8f70b4
   The number of available units, N, must be > 0.  */
Packit 8f70b4
/* Similar to u*_mbtouc(), except that the return value gives more details
Packit 8f70b4
   about the failure, similar to mbrtowc().  */
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U8_MBTOUCR || HAVE_LIBUNISTRING
Packit 8f70b4
extern int
Packit 8f70b4
       u8_mbtoucr (ucs4_t *puc, const uint8_t *s, size_t n);
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U16_MBTOUCR || HAVE_LIBUNISTRING
Packit 8f70b4
extern int
Packit 8f70b4
       u16_mbtoucr (ucs4_t *puc, const uint16_t *s, size_t n);
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U32_MBTOUCR || HAVE_LIBUNISTRING
Packit 8f70b4
extern int
Packit 8f70b4
       u32_mbtoucr (ucs4_t *puc, const uint32_t *s, size_t n);
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
/* Put the multibyte character represented by UC in S, returning its
Packit 8f70b4
   length.  Return -1 upon failure, -2 if the number of available units, N,
Packit 8f70b4
   is too small.  The latter case cannot occur if N >= 6/2/1, respectively.  */
Packit 8f70b4
/* Similar to wctomb(), except that s must not be NULL, and the argument n
Packit 8f70b4
   must be specified.  */
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U8_UCTOMB || HAVE_LIBUNISTRING
Packit 8f70b4
/* Auxiliary function, also used by u8_chr, u8_strchr, u8_strrchr.  */
Packit 8f70b4
extern int
Packit 8f70b4
       u8_uctomb_aux (uint8_t *s, ucs4_t uc, int n);
Packit 8f70b4
# if !HAVE_INLINE
Packit 8f70b4
extern int
Packit 8f70b4
       u8_uctomb (uint8_t *s, ucs4_t uc, int n);
Packit 8f70b4
# else
Packit 8f70b4
static inline int
Packit 8f70b4
u8_uctomb (uint8_t *s, ucs4_t uc, int n)
Packit 8f70b4
{
Packit 8f70b4
  if (uc < 0x80 && n > 0)
Packit 8f70b4
    {
Packit 8f70b4
      s[0] = uc;
Packit 8f70b4
      return 1;
Packit 8f70b4
    }
Packit 8f70b4
  else
Packit 8f70b4
    return u8_uctomb_aux (s, uc, n);
Packit 8f70b4
}
Packit 8f70b4
# endif
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U16_UCTOMB || HAVE_LIBUNISTRING
Packit 8f70b4
/* Auxiliary function, also used by u16_chr, u16_strchr, u16_strrchr.  */
Packit 8f70b4
extern int
Packit 8f70b4
       u16_uctomb_aux (uint16_t *s, ucs4_t uc, int n);
Packit 8f70b4
# if !HAVE_INLINE
Packit 8f70b4
extern int
Packit 8f70b4
       u16_uctomb (uint16_t *s, ucs4_t uc, int n);
Packit 8f70b4
# else
Packit 8f70b4
static inline int
Packit 8f70b4
u16_uctomb (uint16_t *s, ucs4_t uc, int n)
Packit 8f70b4
{
Packit 8f70b4
  if (uc < 0xd800 && n > 0)
Packit 8f70b4
    {
Packit 8f70b4
      s[0] = uc;
Packit 8f70b4
      return 1;
Packit 8f70b4
    }
Packit 8f70b4
  else
Packit 8f70b4
    return u16_uctomb_aux (s, uc, n);
Packit 8f70b4
}
Packit 8f70b4
# endif
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
#if GNULIB_UNISTR_U32_UCTOMB || HAVE_LIBUNISTRING
Packit 8f70b4
# if !HAVE_INLINE
Packit 8f70b4
extern int
Packit 8f70b4
       u32_uctomb (uint32_t *s, ucs4_t uc, int n);
Packit 8f70b4
# else
Packit 8f70b4
static inline int
Packit 8f70b4
u32_uctomb (uint32_t *s, ucs4_t uc, int n)
Packit 8f70b4
{
Packit 8f70b4
  if (uc < 0xd800 || (uc >= 0xe000 && uc < 0x110000))
Packit 8f70b4
    {
Packit 8f70b4
      if (n > 0)
Packit 8f70b4
        {
Packit 8f70b4
          *s = uc;
Packit 8f70b4
          return 1;
Packit 8f70b4
        }
Packit 8f70b4
      else
Packit 8f70b4
        return -2;
Packit 8f70b4
    }
Packit 8f70b4
  else
Packit 8f70b4
    return -1;
Packit 8f70b4
}
Packit 8f70b4
# endif
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
/* Copy N units from SRC to DEST.  */
Packit 8f70b4
/* Similar to memcpy().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_cpy (uint8_t *dest, const uint8_t *src, size_t n);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_cpy (uint16_t *dest, const uint16_t *src, size_t n);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_cpy (uint32_t *dest, const uint32_t *src, size_t n);
Packit 8f70b4
Packit 8f70b4
/* Copy N units from SRC to DEST, guaranteeing correct behavior for
Packit 8f70b4
   overlapping memory areas.  */
Packit 8f70b4
/* Similar to memmove().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_move (uint8_t *dest, const uint8_t *src, size_t n);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_move (uint16_t *dest, const uint16_t *src, size_t n);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_move (uint32_t *dest, const uint32_t *src, size_t n);
Packit 8f70b4
Packit 8f70b4
/* Set the first N characters of S to UC.  UC should be a character that
Packit 8f70b4
   occupies only 1 unit.  */
Packit 8f70b4
/* Similar to memset().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_set (uint8_t *s, ucs4_t uc, size_t n);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_set (uint16_t *s, ucs4_t uc, size_t n);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_set (uint32_t *s, ucs4_t uc, size_t n);
Packit 8f70b4
Packit 8f70b4
/* Compare S1 and S2, each of length N.  */
Packit 8f70b4
/* Similar to memcmp().  */
Packit 8f70b4
extern int
Packit 8f70b4
       u8_cmp (const uint8_t *s1, const uint8_t *s2, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern int
Packit 8f70b4
       u16_cmp (const uint16_t *s1, const uint16_t *s2, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern int
Packit 8f70b4
       u32_cmp (const uint32_t *s1, const uint32_t *s2, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Compare S1 and S2.  */
Packit 8f70b4
/* Similar to the gnulib function memcmp2().  */
Packit 8f70b4
extern int
Packit 8f70b4
       u8_cmp2 (const uint8_t *s1, size_t n1, const uint8_t *s2, size_t n2)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern int
Packit 8f70b4
       u16_cmp2 (const uint16_t *s1, size_t n1, const uint16_t *s2, size_t n2)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern int
Packit 8f70b4
       u32_cmp2 (const uint32_t *s1, size_t n1, const uint32_t *s2, size_t n2)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Search the string at S for UC.  */
Packit 8f70b4
/* Similar to memchr().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_chr (const uint8_t *s, size_t n, ucs4_t uc)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_chr (const uint16_t *s, size_t n, ucs4_t uc)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_chr (const uint32_t *s, size_t n, ucs4_t uc)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Count the number of Unicode characters in the N units from S.  */
Packit 8f70b4
/* Similar to mbsnlen().  */
Packit 8f70b4
extern size_t
Packit 8f70b4
       u8_mbsnlen (const uint8_t *s, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern size_t
Packit 8f70b4
       u16_mbsnlen (const uint16_t *s, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern size_t
Packit 8f70b4
       u32_mbsnlen (const uint32_t *s, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Elementary string functions with memory allocation.  */
Packit 8f70b4
Packit 8f70b4
/* Make a freshly allocated copy of S, of length N.  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_cpy_alloc (const uint8_t *s, size_t n);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_cpy_alloc (const uint16_t *s, size_t n);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_cpy_alloc (const uint32_t *s, size_t n);
Packit 8f70b4
Packit 8f70b4
/* Elementary string functions on NUL terminated strings.  */
Packit 8f70b4
Packit 8f70b4
/* Return the length (number of units) of the first character in S.
Packit 8f70b4
   Return 0 if it is the NUL character.  Return -1 upon failure.  */
Packit 8f70b4
extern int
Packit 8f70b4
       u8_strmblen (const uint8_t *s)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern int
Packit 8f70b4
       u16_strmblen (const uint16_t *s)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern int
Packit 8f70b4
       u32_strmblen (const uint32_t *s)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Return the length (number of units) of the first character in S, putting
Packit 8f70b4
   its 'ucs4_t' representation in *PUC.  Return 0 if it is the NUL
Packit 8f70b4
   character.  Return -1 upon failure.  */
Packit 8f70b4
extern int
Packit 8f70b4
       u8_strmbtouc (ucs4_t *puc, const uint8_t *s);
Packit 8f70b4
extern int
Packit 8f70b4
       u16_strmbtouc (ucs4_t *puc, const uint16_t *s);
Packit 8f70b4
extern int
Packit 8f70b4
       u32_strmbtouc (ucs4_t *puc, const uint32_t *s);
Packit 8f70b4
Packit 8f70b4
/* Forward iteration step.  Advances the pointer past the next character,
Packit 8f70b4
   or returns NULL if the end of the string has been reached.  Puts the
Packit 8f70b4
   character's 'ucs4_t' representation in *PUC.  */
Packit 8f70b4
extern const uint8_t *
Packit 8f70b4
       u8_next (ucs4_t *puc, const uint8_t *s);
Packit 8f70b4
extern const uint16_t *
Packit 8f70b4
       u16_next (ucs4_t *puc, const uint16_t *s);
Packit 8f70b4
extern const uint32_t *
Packit 8f70b4
       u32_next (ucs4_t *puc, const uint32_t *s);
Packit 8f70b4
Packit 8f70b4
/* Backward iteration step.  Advances the pointer to point to the previous
Packit 8f70b4
   character, or returns NULL if the beginning of the string had been reached.
Packit 8f70b4
   Puts the character's 'ucs4_t' representation in *PUC.  */
Packit 8f70b4
extern const uint8_t *
Packit 8f70b4
       u8_prev (ucs4_t *puc, const uint8_t *s, const uint8_t *start);
Packit 8f70b4
extern const uint16_t *
Packit 8f70b4
       u16_prev (ucs4_t *puc, const uint16_t *s, const uint16_t *start);
Packit 8f70b4
extern const uint32_t *
Packit 8f70b4
       u32_prev (ucs4_t *puc, const uint32_t *s, const uint32_t *start);
Packit 8f70b4
Packit 8f70b4
/* Return the number of units in S.  */
Packit 8f70b4
/* Similar to strlen(), wcslen().  */
Packit 8f70b4
extern size_t
Packit 8f70b4
       u8_strlen (const uint8_t *s)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern size_t
Packit 8f70b4
       u16_strlen (const uint16_t *s)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern size_t
Packit 8f70b4
       u32_strlen (const uint32_t *s)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Return the number of units in S, but at most MAXLEN.  */
Packit 8f70b4
/* Similar to strnlen(), wcsnlen().  */
Packit 8f70b4
extern size_t
Packit 8f70b4
       u8_strnlen (const uint8_t *s, size_t maxlen)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern size_t
Packit 8f70b4
       u16_strnlen (const uint16_t *s, size_t maxlen)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern size_t
Packit 8f70b4
       u32_strnlen (const uint32_t *s, size_t maxlen)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Copy SRC to DEST.  */
Packit 8f70b4
/* Similar to strcpy(), wcscpy().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_strcpy (uint8_t *dest, const uint8_t *src);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_strcpy (uint16_t *dest, const uint16_t *src);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_strcpy (uint32_t *dest, const uint32_t *src);
Packit 8f70b4
Packit 8f70b4
/* Copy SRC to DEST, returning the address of the terminating NUL in DEST.  */
Packit 8f70b4
/* Similar to stpcpy().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_stpcpy (uint8_t *dest, const uint8_t *src);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_stpcpy (uint16_t *dest, const uint16_t *src);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_stpcpy (uint32_t *dest, const uint32_t *src);
Packit 8f70b4
Packit 8f70b4
/* Copy no more than N units of SRC to DEST.  */
Packit 8f70b4
/* Similar to strncpy(), wcsncpy().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_strncpy (uint8_t *dest, const uint8_t *src, size_t n);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_strncpy (uint16_t *dest, const uint16_t *src, size_t n);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_strncpy (uint32_t *dest, const uint32_t *src, size_t n);
Packit 8f70b4
Packit 8f70b4
/* Copy no more than N units of SRC to DEST.  Return a pointer past the last
Packit 8f70b4
   non-NUL unit written into DEST.  */
Packit 8f70b4
/* Similar to stpncpy().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_stpncpy (uint8_t *dest, const uint8_t *src, size_t n);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_stpncpy (uint16_t *dest, const uint16_t *src, size_t n);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_stpncpy (uint32_t *dest, const uint32_t *src, size_t n);
Packit 8f70b4
Packit 8f70b4
/* Append SRC onto DEST.  */
Packit 8f70b4
/* Similar to strcat(), wcscat().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_strcat (uint8_t *dest, const uint8_t *src);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_strcat (uint16_t *dest, const uint16_t *src);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_strcat (uint32_t *dest, const uint32_t *src);
Packit 8f70b4
Packit 8f70b4
/* Append no more than N units of SRC onto DEST.  */
Packit 8f70b4
/* Similar to strncat(), wcsncat().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_strncat (uint8_t *dest, const uint8_t *src, size_t n);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_strncat (uint16_t *dest, const uint16_t *src, size_t n);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_strncat (uint32_t *dest, const uint32_t *src, size_t n);
Packit 8f70b4
Packit 8f70b4
/* Compare S1 and S2.  */
Packit 8f70b4
/* Similar to strcmp(), wcscmp().  */
Packit 8f70b4
#ifdef __sun
Packit 8f70b4
/* Avoid a collision with the u8_strcmp() function in Solaris 11 libc.  */
Packit 8f70b4
extern int
Packit 8f70b4
       u8_strcmp_gnu (const uint8_t *s1, const uint8_t *s2)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
# define u8_strcmp u8_strcmp_gnu
Packit 8f70b4
#else
Packit 8f70b4
extern int
Packit 8f70b4
       u8_strcmp (const uint8_t *s1, const uint8_t *s2)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
#endif
Packit 8f70b4
extern int
Packit 8f70b4
       u16_strcmp (const uint16_t *s1, const uint16_t *s2)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern int
Packit 8f70b4
       u32_strcmp (const uint32_t *s1, const uint32_t *s2)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Compare S1 and S2 using the collation rules of the current locale.
Packit 8f70b4
   Return -1 if S1 < S2, 0 if S1 = S2, 1 if S1 > S2.
Packit 8f70b4
   Upon failure, set errno and return any value.  */
Packit 8f70b4
/* Similar to strcoll(), wcscoll().  */
Packit 8f70b4
extern int
Packit 8f70b4
       u8_strcoll (const uint8_t *s1, const uint8_t *s2);
Packit 8f70b4
extern int
Packit 8f70b4
       u16_strcoll (const uint16_t *s1, const uint16_t *s2);
Packit 8f70b4
extern int
Packit 8f70b4
       u32_strcoll (const uint32_t *s1, const uint32_t *s2);
Packit 8f70b4
Packit 8f70b4
/* Compare no more than N units of S1 and S2.  */
Packit 8f70b4
/* Similar to strncmp(), wcsncmp().  */
Packit 8f70b4
extern int
Packit 8f70b4
       u8_strncmp (const uint8_t *s1, const uint8_t *s2, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern int
Packit 8f70b4
       u16_strncmp (const uint16_t *s1, const uint16_t *s2, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern int
Packit 8f70b4
       u32_strncmp (const uint32_t *s1, const uint32_t *s2, size_t n)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Duplicate S, returning an identical malloc'd string.  */
Packit 8f70b4
/* Similar to strdup(), wcsdup().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_strdup (const uint8_t *s);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_strdup (const uint16_t *s);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_strdup (const uint32_t *s);
Packit 8f70b4
Packit 8f70b4
/* Find the first occurrence of UC in STR.  */
Packit 8f70b4
/* Similar to strchr(), wcschr().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_strchr (const uint8_t *str, ucs4_t uc)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_strchr (const uint16_t *str, ucs4_t uc)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_strchr (const uint32_t *str, ucs4_t uc)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Find the last occurrence of UC in STR.  */
Packit 8f70b4
/* Similar to strrchr(), wcsrchr().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_strrchr (const uint8_t *str, ucs4_t uc)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_strrchr (const uint16_t *str, ucs4_t uc)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_strrchr (const uint32_t *str, ucs4_t uc)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Return the length of the initial segment of STR which consists entirely
Packit 8f70b4
   of Unicode characters not in REJECT.  */
Packit 8f70b4
/* Similar to strcspn(), wcscspn().  */
Packit 8f70b4
extern size_t
Packit 8f70b4
       u8_strcspn (const uint8_t *str, const uint8_t *reject)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern size_t
Packit 8f70b4
       u16_strcspn (const uint16_t *str, const uint16_t *reject)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern size_t
Packit 8f70b4
       u32_strcspn (const uint32_t *str, const uint32_t *reject)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Return the length of the initial segment of STR which consists entirely
Packit 8f70b4
   of Unicode characters in ACCEPT.  */
Packit 8f70b4
/* Similar to strspn(), wcsspn().  */
Packit 8f70b4
extern size_t
Packit 8f70b4
       u8_strspn (const uint8_t *str, const uint8_t *accept)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern size_t
Packit 8f70b4
       u16_strspn (const uint16_t *str, const uint16_t *accept)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern size_t
Packit 8f70b4
       u32_strspn (const uint32_t *str, const uint32_t *accept)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Find the first occurrence in STR of any character in ACCEPT.  */
Packit 8f70b4
/* Similar to strpbrk(), wcspbrk().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_strpbrk (const uint8_t *str, const uint8_t *accept)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_strpbrk (const uint16_t *str, const uint16_t *accept)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_strpbrk (const uint32_t *str, const uint32_t *accept)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Find the first occurrence of NEEDLE in HAYSTACK.  */
Packit 8f70b4
/* Similar to strstr(), wcsstr().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_strstr (const uint8_t *haystack, const uint8_t *needle)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_strstr (const uint16_t *haystack, const uint16_t *needle)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_strstr (const uint32_t *haystack, const uint32_t *needle)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Test whether STR starts with PREFIX.  */
Packit 8f70b4
extern bool
Packit 8f70b4
       u8_startswith (const uint8_t *str, const uint8_t *prefix)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern bool
Packit 8f70b4
       u16_startswith (const uint16_t *str, const uint16_t *prefix)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern bool
Packit 8f70b4
       u32_startswith (const uint32_t *str, const uint32_t *prefix)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Test whether STR ends with SUFFIX.  */
Packit 8f70b4
extern bool
Packit 8f70b4
       u8_endswith (const uint8_t *str, const uint8_t *suffix)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern bool
Packit 8f70b4
       u16_endswith (const uint16_t *str, const uint16_t *suffix)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
extern bool
Packit 8f70b4
       u32_endswith (const uint32_t *str, const uint32_t *suffix)
Packit 8f70b4
       _UC_ATTRIBUTE_PURE;
Packit 8f70b4
Packit 8f70b4
/* Divide STR into tokens separated by characters in DELIM.
Packit 8f70b4
   This interface is actually more similar to wcstok than to strtok.  */
Packit 8f70b4
/* Similar to strtok_r(), wcstok().  */
Packit 8f70b4
extern uint8_t *
Packit 8f70b4
       u8_strtok (uint8_t *str, const uint8_t *delim, uint8_t **ptr);
Packit 8f70b4
extern uint16_t *
Packit 8f70b4
       u16_strtok (uint16_t *str, const uint16_t *delim, uint16_t **ptr);
Packit 8f70b4
extern uint32_t *
Packit 8f70b4
       u32_strtok (uint32_t *str, const uint32_t *delim, uint32_t **ptr);
Packit 8f70b4
Packit 8f70b4
Packit 8f70b4
#ifdef __cplusplus
Packit 8f70b4
}
Packit 8f70b4
#endif
Packit 8f70b4
Packit 8f70b4
#endif /* _UNISTR_H */