Blame support/regex_internal.h

Packit Service f629e6
/* Extended regular expression matching and search library.
Packit Service f629e6
   Copyright (C) 2002-2017 Free Software Foundation, Inc.
Packit Service f629e6
   This file is part of the GNU C Library.
Packit Service f629e6
   Contributed by Isamu Hasegawa <isamu@yamato.ibm.com>.
Packit Service f629e6
Packit Service f629e6
   The GNU C Library is free software; you can redistribute it and/or
Packit Service f629e6
   modify it under the terms of the GNU Lesser General Public
Packit Service f629e6
   License as published by the Free Software Foundation; either
Packit Service f629e6
   version 2.1 of the License, or (at your option) any later version.
Packit Service f629e6
Packit Service f629e6
   The GNU C Library is distributed in the hope that it will be useful,
Packit Service f629e6
   but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit Service f629e6
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Packit Service f629e6
   Lesser General Public License for more details.
Packit Service f629e6
Packit Service f629e6
   You should have received a copy of the GNU Lesser General Public
Packit Service f629e6
   License along with the GNU C Library; if not, see
Packit Service f629e6
   <http://www.gnu.org/licenses/>.  */
Packit Service f629e6
Packit Service f629e6
#ifndef _REGEX_INTERNAL_H
Packit Service f629e6
#define _REGEX_INTERNAL_H 1
Packit Service f629e6
Packit Service f629e6
#include <assert.h>
Packit Service f629e6
#include <ctype.h>
Packit Service f629e6
#include <stdio.h>
Packit Service f629e6
#include <stdlib.h>
Packit Service f629e6
#include <string.h>
Packit Service f629e6
Packit Service f629e6
#if defined HAVE_LANGINFO_H || defined HAVE_LANGINFO_CODESET || defined _LIBC
Packit Service f629e6
# include <langinfo.h>
Packit Service f629e6
#endif
Packit Service f629e6
#if defined HAVE_LOCALE_H || defined _LIBC
Packit Service f629e6
# include <locale.h>
Packit Service f629e6
#endif
Packit Service f629e6
#if defined HAVE_WCHAR_H || defined _LIBC
Packit Service f629e6
# include <wchar.h>
Packit Service f629e6
#endif /* HAVE_WCHAR_H || _LIBC */
Packit Service f629e6
#if defined HAVE_WCTYPE_H || defined _LIBC
Packit Service f629e6
# include <wctype.h>
Packit Service f629e6
#endif /* HAVE_WCTYPE_H || _LIBC */
Packit Service f629e6
#if defined HAVE_STDBOOL_H || defined _LIBC
Packit Service f629e6
# include <stdbool.h>
Packit Service f629e6
#endif /* HAVE_STDBOOL_H || _LIBC */
Packit Service f629e6
#if defined HAVE_STDINT_H || defined _LIBC
Packit Service f629e6
# include <stdint.h>
Packit Service f629e6
#endif /* HAVE_STDINT_H || _LIBC */
Packit Service f629e6
#if defined _LIBC
Packit Service f629e6
# include <libc-lock.h>
Packit Service f629e6
#else
Packit Service f629e6
# define __libc_lock_init(NAME) do { } while (0)
Packit Service f629e6
# define __libc_lock_lock(NAME) do { } while (0)
Packit Service f629e6
# define __libc_lock_unlock(NAME) do { } while (0)
Packit Service f629e6
#endif
Packit Service f629e6
Packit Service f629e6
#ifdef GAWK
/*
 * glibc only exposes isblank() from <ctype.h> when a feature-test
 * constant is defined, because it is a C99 function.  Rather than
 * fight with that, supply a private test the same way dfa.c does.
 */

static int
is_blank (int c)
{
   switch (c)
     {
     case ' ':
     case '\t':
       return 1;
     default:
       return 0;
     }
}
#else /* not GAWK */
/* Supply isblank() when neither the C library nor the build
   configuration provides one.  */
# if !defined _LIBC && !defined HAVE_ISBLANK && !defined isblank
#  define isblank(ch) ((ch) == ' ' || (ch) == '\t')
# endif
#endif /* GAWK */
Packit Service f629e6
Packit Service f629e6
#ifdef _LIBC
Packit Service f629e6
# ifndef _RE_DEFINE_LOCALE_FUNCTIONS
Packit Service f629e6
#  define _RE_DEFINE_LOCALE_FUNCTIONS 1
Packit Service f629e6
#   include <locale/localeinfo.h>
Packit Service f629e6
#   include <locale/coll-lookup.h>
Packit Service f629e6
# endif
Packit Service f629e6
#endif
Packit Service f629e6
Packit Service f629e6
/* This is for other GNU distributions with internationalized messages.  */
Packit Service f629e6
#if (HAVE_LIBINTL_H && ENABLE_NLS) || defined _LIBC
Packit Service f629e6
# include <libintl.h>
Packit Service f629e6
# ifdef _LIBC
Packit Service f629e6
#  undef gettext
Packit Service f629e6
#  define gettext(msgid) \
Packit Service f629e6
  __dcgettext (_libc_intl_domainname, msgid, LC_MESSAGES)
Packit Service f629e6
# endif
Packit Service f629e6
#else
Packit Service f629e6
# define gettext(msgid) (msgid)
Packit Service f629e6
#endif
Packit Service f629e6
Packit Service f629e6
#ifndef gettext_noop
Packit Service f629e6
/* This define is so xgettext can find the internationalizable
Packit Service f629e6
   strings.  */
Packit Service f629e6
# define gettext_noop(String) String
Packit Service f629e6
#endif
Packit Service f629e6
Packit Service f629e6
/* Fallback for systems whose headers do not define SIZE_MAX.  */
Packit Service f629e6
#ifndef SIZE_MAX
Packit Service f629e6
# define SIZE_MAX ((size_t) -1)
Packit Service f629e6
#endif
Packit Service f629e6
Packit Service f629e6
#if ! defined(__DJGPP__) && (defined(GAWK) || _LIBC)
Packit Service f629e6
# define RE_ENABLE_I18N
Packit Service f629e6
#endif
Packit Service f629e6
Packit Service f629e6
#if __GNUC__ >= 3
Packit Service f629e6
# define BE(expr, val) __builtin_expect (expr, val)
Packit Service f629e6
#else
Packit Service f629e6
# define BE(expr, val) (expr)
Packit Service f629e6
# ifdef inline
Packit Service f629e6
# undef inline
Packit Service f629e6
# endif
Packit Service f629e6
# define inline
Packit Service f629e6
#endif
Packit Service f629e6
Packit Service f629e6
/* Number of distinct single-byte character values.  */
Packit Service f629e6
#define SBC_MAX 256
Packit Service f629e6
Packit Service f629e6
#define COLL_ELEM_LEN_MAX 8
Packit Service f629e6
Packit Service f629e6
/* The character which represents newline.  */
Packit Service f629e6
#define NEWLINE_CHAR '\n'
Packit Service f629e6
#define WIDE_NEWLINE_CHAR L'\n'
Packit Service f629e6
Packit Service f629e6
/* Map glibc-internal names onto the standard API when building outside glibc.  */
Packit Service f629e6
#ifndef _LIBC
Packit Service f629e6
# ifdef __wctype
Packit Service f629e6
# undef __wctype
Packit Service f629e6
# endif
Packit Service f629e6
# define __wctype wctype
Packit Service f629e6
# ifdef __iswctype
Packit Service f629e6
# undef __iswctype
Packit Service f629e6
# endif
Packit Service f629e6
# define __iswctype iswctype
Packit Service f629e6
# define __btowc btowc
Packit Service f629e6
# define __mbrtowc mbrtowc
Packit Service f629e6
#undef __mempcpy	/* GAWK */
Packit Service f629e6
# define __mempcpy mempcpy
Packit Service f629e6
# define __wcrtomb wcrtomb
Packit Service f629e6
# define __regfree regfree
Packit Service f629e6
#endif /* not _LIBC */
Packit Service f629e6
Packit Service f629e6
#if __GNUC__ < 3 + (__GNUC_MINOR__ < 1)
Packit Service f629e6
# define __attribute__(arg)
Packit Service f629e6
#endif
Packit Service f629e6
Packit Service f629e6
#ifdef GAWK
Packit Service f629e6
/*
Packit Service f629e6
 * Instead of trying to figure out which GCC version introduced
Packit Service f629e6
 * this symbol, just define it out and be done.
Packit Service f629e6
 */
Packit Service f629e6
# undef __attribute_warn_unused_result__
Packit Service f629e6
# define __attribute_warn_unused_result__
Packit Service f629e6
#endif
Packit Service f629e6
Packit Service f629e6
/* An integer used to represent a set of bits.  It must be unsigned,
Packit Service f629e6
   and must be at least as wide as unsigned int.  */
Packit Service f629e6
typedef unsigned long int bitset_word_t;
Packit Service f629e6
/* All bits set in a bitset_word_t.  */
Packit Service f629e6
#define BITSET_WORD_MAX ULONG_MAX
Packit Service f629e6
/* Number of bits in a bitset_word_t.  */
Packit Service f629e6
#define BITSET_WORD_BITS (sizeof (bitset_word_t) * CHAR_BIT)
Packit Service f629e6
/* Number of bitset_word_t words in a bitset_t.  */
Packit Service f629e6
#define BITSET_WORDS (SBC_MAX / BITSET_WORD_BITS)
Packit Service f629e6
typedef bitset_word_t bitset_t[BITSET_WORDS];
Packit Service f629e6
typedef bitset_word_t *re_bitset_ptr_t;
Packit Service f629e6
typedef const bitset_word_t *re_const_bitset_ptr_t;
Packit Service f629e6
Packit Service f629e6
/* Bit-set primitives.  SET is a bitset_t (or a pointer to its first
   word) and I is a bit index; valid indices are those below
   BITSET_WORDS * BITSET_WORD_BITS.  Every macro argument is
   parenthesized so that compound expressions such as `base + ch' or
   `dfa->sb_char' expand with the intended precedence.  The single-bit
   macros still evaluate I twice, so I must not have side effects.  */

/* Turn bit I of SET on.  */
#define bitset_set(set,i) \
  ((set)[(i) / BITSET_WORD_BITS] \
   |= ((bitset_word_t) 1 << ((i) % BITSET_WORD_BITS)))
/* Turn bit I of SET off.  */
#define bitset_clear(set,i) \
  ((set)[(i) / BITSET_WORD_BITS] \
   &= ~((bitset_word_t) 1 << ((i) % BITSET_WORD_BITS)))
/* Nonzero (the masked word, not necessarily 1) if bit I of SET is on.  */
#define bitset_contain(set,i) \
  ((set)[(i) / BITSET_WORD_BITS] \
   & ((bitset_word_t) 1 << ((i) % BITSET_WORD_BITS)))
/* Whole-set operations; each works on exactly sizeof (bitset_t) bytes.  */
#define bitset_empty(set) memset ((set), '\0', sizeof (bitset_t))
#define bitset_set_all(set) memset ((set), '\xff', sizeof (bitset_t))
#define bitset_copy(dest,src) memcpy ((dest), (src), sizeof (bitset_t))
Packit Service f629e6
Packit Service f629e6
#define PREV_WORD_CONSTRAINT 0x0001
Packit Service f629e6
#define PREV_NOTWORD_CONSTRAINT 0x0002
Packit Service f629e6
#define NEXT_WORD_CONSTRAINT 0x0004
Packit Service f629e6
#define NEXT_NOTWORD_CONSTRAINT 0x0008
Packit Service f629e6
#define PREV_NEWLINE_CONSTRAINT 0x0010
Packit Service f629e6
#define NEXT_NEWLINE_CONSTRAINT 0x0020
Packit Service f629e6
#define PREV_BEGBUF_CONSTRAINT 0x0040
Packit Service f629e6
#define NEXT_ENDBUF_CONSTRAINT 0x0080
Packit Service f629e6
#define WORD_DELIM_CONSTRAINT 0x0100
Packit Service f629e6
#define NOT_WORD_DELIM_CONSTRAINT 0x0200
Packit Service f629e6
Packit Service f629e6
typedef enum
Packit Service f629e6
{
Packit Service f629e6
  INSIDE_WORD = PREV_WORD_CONSTRAINT | NEXT_WORD_CONSTRAINT,
Packit Service f629e6
  WORD_FIRST = PREV_NOTWORD_CONSTRAINT | NEXT_WORD_CONSTRAINT,
Packit Service f629e6
  WORD_LAST = PREV_WORD_CONSTRAINT | NEXT_NOTWORD_CONSTRAINT,
Packit Service f629e6
  INSIDE_NOTWORD = PREV_NOTWORD_CONSTRAINT | NEXT_NOTWORD_CONSTRAINT,
Packit Service f629e6
  LINE_FIRST = PREV_NEWLINE_CONSTRAINT,
Packit Service f629e6
  LINE_LAST = NEXT_NEWLINE_CONSTRAINT,
Packit Service f629e6
  BUF_FIRST = PREV_BEGBUF_CONSTRAINT,
Packit Service f629e6
  BUF_LAST = NEXT_ENDBUF_CONSTRAINT,
Packit Service f629e6
  WORD_DELIM = WORD_DELIM_CONSTRAINT,
Packit Service f629e6
  NOT_WORD_DELIM = NOT_WORD_DELIM_CONSTRAINT
Packit Service f629e6
} re_context_type;
Packit Service f629e6
Packit Service f629e6
typedef struct
Packit Service f629e6
{
Packit Service f629e6
  int alloc;
Packit Service f629e6
  int nelem;
Packit Service f629e6
  int *elems;
Packit Service f629e6
} re_node_set;
Packit Service f629e6
Packit Service f629e6
typedef enum
Packit Service f629e6
{
Packit Service f629e6
  NON_TYPE = 0,
Packit Service f629e6
Packit Service f629e6
  /* Node types; these are used by token, node, and tree.  */
Packit Service f629e6
  CHARACTER = 1,
Packit Service f629e6
  END_OF_RE = 2,
Packit Service f629e6
  SIMPLE_BRACKET = 3,
Packit Service f629e6
  OP_BACK_REF = 4,
Packit Service f629e6
  OP_PERIOD = 5,
Packit Service f629e6
#ifdef RE_ENABLE_I18N
Packit Service f629e6
  COMPLEX_BRACKET = 6,
Packit Service f629e6
  OP_UTF8_PERIOD = 7,
Packit Service f629e6
#endif /* RE_ENABLE_I18N */
Packit Service f629e6
Packit Service f629e6
  /* We define EPSILON_BIT as a macro so that OP_OPEN_SUBEXP is used
Packit Service f629e6
     when the debugger shows values of this enum type.  */
Packit Service f629e6
#define EPSILON_BIT 8
Packit Service f629e6
  OP_OPEN_SUBEXP = EPSILON_BIT | 0,
Packit Service f629e6
  OP_CLOSE_SUBEXP = EPSILON_BIT | 1,
Packit Service f629e6
  OP_ALT = EPSILON_BIT | 2,
Packit Service f629e6
  OP_DUP_ASTERISK = EPSILON_BIT | 3,
Packit Service f629e6
  ANCHOR = EPSILON_BIT | 4,
Packit Service f629e6
Packit Service f629e6
  /* Tree type, these are used only by tree. */
Packit Service f629e6
  CONCAT = 16,
Packit Service f629e6
  SUBEXP = 17,
Packit Service f629e6
Packit Service f629e6
  /* Token type, these are used only by token.  */
Packit Service f629e6
  OP_DUP_PLUS = 18,
Packit Service f629e6
  OP_DUP_QUESTION,
Packit Service f629e6
  OP_OPEN_BRACKET,
Packit Service f629e6
  OP_CLOSE_BRACKET,
Packit Service f629e6
  OP_CHARSET_RANGE,
Packit Service f629e6
  OP_OPEN_DUP_NUM,
Packit Service f629e6
  OP_CLOSE_DUP_NUM,
Packit Service f629e6
  OP_NON_MATCH_LIST,
Packit Service f629e6
  OP_OPEN_COLL_ELEM,
Packit Service f629e6
  OP_CLOSE_COLL_ELEM,
Packit Service f629e6
  OP_OPEN_EQUIV_CLASS,
Packit Service f629e6
  OP_CLOSE_EQUIV_CLASS,
Packit Service f629e6
  OP_OPEN_CHAR_CLASS,
Packit Service f629e6
  OP_CLOSE_CHAR_CLASS,
Packit Service f629e6
  OP_WORD,
Packit Service f629e6
  OP_NOTWORD,
Packit Service f629e6
  OP_SPACE,
Packit Service f629e6
  OP_NOTSPACE,
Packit Service f629e6
  BACK_SLASH
Packit Service f629e6
Packit Service f629e6
} re_token_type_t;
Packit Service f629e6
Packit Service f629e6
#ifdef RE_ENABLE_I18N
Packit Service f629e6
typedef struct
Packit Service f629e6
{
Packit Service f629e6
  /* Multibyte characters.  */
Packit Service f629e6
  wchar_t *mbchars;
Packit Service f629e6
Packit Service f629e6
  /* Collating symbols.  */
Packit Service f629e6
# ifdef _LIBC
Packit Service f629e6
  int32_t *coll_syms;
Packit Service f629e6
# endif
Packit Service f629e6
Packit Service f629e6
  /* Equivalence classes. */
Packit Service f629e6
# ifdef _LIBC
Packit Service f629e6
  int32_t *equiv_classes;
Packit Service f629e6
# endif
Packit Service f629e6
Packit Service f629e6
  /* Range expressions. */
Packit Service f629e6
# ifdef _LIBC
Packit Service f629e6
  uint32_t *range_starts;
Packit Service f629e6
  uint32_t *range_ends;
Packit Service f629e6
# else /* not _LIBC */
Packit Service f629e6
  wchar_t *range_starts;
Packit Service f629e6
  wchar_t *range_ends;
Packit Service f629e6
# endif /* not _LIBC */
Packit Service f629e6
Packit Service f629e6
  /* Character classes. */
Packit Service f629e6
  wctype_t *char_classes;
Packit Service f629e6
Packit Service f629e6
  /* If this character set is the non-matching list.  */
Packit Service f629e6
  unsigned int non_match : 1;
Packit Service f629e6
Packit Service f629e6
  /* # of multibyte characters.  */
Packit Service f629e6
  int nmbchars;
Packit Service f629e6
Packit Service f629e6
  /* # of collating symbols.  */
Packit Service f629e6
  int ncoll_syms;
Packit Service f629e6
Packit Service f629e6
  /* # of equivalence classes. */
Packit Service f629e6
  int nequiv_classes;
Packit Service f629e6
Packit Service f629e6
  /* # of range expressions. */
Packit Service f629e6
  int nranges;
Packit Service f629e6
Packit Service f629e6
  /* # of character classes. */
Packit Service f629e6
  int nchar_classes;
Packit Service f629e6
} re_charset_t;
Packit Service f629e6
#endif /* RE_ENABLE_I18N */
Packit Service f629e6
Packit Service f629e6
typedef struct
Packit Service f629e6
{
Packit Service f629e6
  union
Packit Service f629e6
  {
Packit Service f629e6
    unsigned char c;		/* for CHARACTER */
Packit Service f629e6
    re_bitset_ptr_t sbcset;	/* for SIMPLE_BRACKET */
Packit Service f629e6
#ifdef RE_ENABLE_I18N
Packit Service f629e6
    re_charset_t *mbcset;	/* for COMPLEX_BRACKET */
Packit Service f629e6
#endif /* RE_ENABLE_I18N */
Packit Service f629e6
    int idx;			/* for BACK_REF */
Packit Service f629e6
    re_context_type ctx_type;	/* for ANCHOR */
Packit Service f629e6
  } opr;
Packit Service f629e6
#if __GNUC__ >= 2
Packit Service f629e6
  re_token_type_t type : 8;
Packit Service f629e6
#else
Packit Service f629e6
  re_token_type_t type;
Packit Service f629e6
#endif
Packit Service f629e6
  unsigned int constraint : 10;	/* context constraint */
Packit Service f629e6
  unsigned int duplicated : 1;
Packit Service f629e6
  unsigned int opt_subexp : 1;
Packit Service f629e6
#ifdef RE_ENABLE_I18N
Packit Service f629e6
  unsigned int accept_mb : 1;
Packit Service f629e6
  /* These 2 bits can be moved into the union if needed (e.g. if running out
Packit Service f629e6
     of bits; move opr.c to opr.c.c and move the flags to opr.c.flags).  */
Packit Service f629e6
  unsigned int mb_partial : 1;
Packit Service f629e6
#endif
Packit Service f629e6
  unsigned int word_char : 1;
Packit Service f629e6
} re_token_t;
Packit Service f629e6
Packit Service f629e6
#define IS_EPSILON_NODE(type) ((type) & EPSILON_BIT)
Packit Service f629e6
Packit Service f629e6
struct re_string_t
Packit Service f629e6
{
Packit Service f629e6
  /* Indicate the raw buffer which is the original string passed as an
Packit Service f629e6
     argument of regexec(), re_search(), etc.  */
Packit Service f629e6
  const unsigned char *raw_mbs;
Packit Service f629e6
  /* Store the multibyte string.  In case of "case insensitive mode" like
Packit Service f629e6
     REG_ICASE, the upper-cased string is stored; otherwise MBS points
Packit Service f629e6
     to the same address as RAW_MBS.  */
Packit Service f629e6
  unsigned char *mbs;
Packit Service f629e6
#ifdef RE_ENABLE_I18N
Packit Service f629e6
  /* Store the wide character string which is corresponding to MBS.  */
Packit Service f629e6
  wint_t *wcs;
Packit Service f629e6
  int *offsets;
Packit Service f629e6
  mbstate_t cur_state;
Packit Service f629e6
#endif
Packit Service f629e6
  /* Index in RAW_MBS.  Each character mbs[i] corresponds to
Packit Service f629e6
     raw_mbs[raw_mbs_idx + i].  */
Packit Service f629e6
  int raw_mbs_idx;
Packit Service f629e6
  /* The length of the valid characters in the buffers.  */
Packit Service f629e6
  int valid_len;
Packit Service f629e6
  /* The corresponding number of bytes in raw_mbs array.  */
Packit Service f629e6
  int valid_raw_len;
Packit Service f629e6
  /* The length of the buffers MBS and WCS.  */
Packit Service f629e6
  int bufs_len;
Packit Service f629e6
  /* The index in MBS, which is updated by re_string_fetch_byte.  */
Packit Service f629e6
  int cur_idx;
Packit Service f629e6
  /* The length of the RAW_MBS array.  */
Packit Service f629e6
  int raw_len;
Packit Service f629e6
  /* This is RAW_LEN - RAW_MBS_IDX + VALID_LEN - VALID_RAW_LEN.  */
Packit Service f629e6
  int len;
Packit Service f629e6
  /* End of the buffer may be shorter than its length in the cases such
Packit Service f629e6
     as re_match_2, re_search_2.  Then, we use STOP for end of the buffer
Packit Service f629e6
     instead of LEN.  */
Packit Service f629e6
  int raw_stop;
Packit Service f629e6
  /* This is RAW_STOP - RAW_MBS_IDX adjusted through OFFSETS.  */
Packit Service f629e6
  int stop;
Packit Service f629e6
Packit Service f629e6
  /* The context of mbs[0].  We store the context independently, since
Packit Service f629e6
     the context of mbs[0] may be different from raw_mbs[0], which is
Packit Service f629e6
     the beginning of the input string.  */
Packit Service f629e6
  unsigned int tip_context;
Packit Service f629e6
  /* The translation passed as a part of an argument of re_compile_pattern.  */
Packit Service f629e6
  RE_TRANSLATE_TYPE trans;
Packit Service f629e6
  /* Copy of re_dfa_t's word_char.  */
Packit Service f629e6
  re_const_bitset_ptr_t word_char;
Packit Service f629e6
  /* 1 if REG_ICASE.  */
Packit Service f629e6
  unsigned char icase;
Packit Service f629e6
  unsigned char is_utf8;
Packit Service f629e6
  unsigned char map_notascii;
Packit Service f629e6
  unsigned char mbs_allocated;
Packit Service f629e6
  unsigned char offsets_needed;
Packit Service f629e6
  unsigned char newline_anchor;
Packit Service f629e6
  unsigned char word_ops_used;
Packit Service f629e6
  int mb_cur_max;
Packit Service f629e6
};
Packit Service f629e6
typedef struct re_string_t re_string_t;
Packit Service f629e6
Packit Service f629e6
Packit Service f629e6
struct re_dfa_t;
Packit Service f629e6
typedef struct re_dfa_t re_dfa_t;
Packit Service f629e6
Packit Service f629e6
#ifndef NOT_IN_libc
Packit Service f629e6
static reg_errcode_t re_string_realloc_buffers (re_string_t *pstr,
Packit Service f629e6
						int new_buf_len);
Packit Service f629e6
# ifdef RE_ENABLE_I18N
Packit Service f629e6
static void build_wcs_buffer (re_string_t *pstr);
Packit Service f629e6
static reg_errcode_t build_wcs_upper_buffer (re_string_t *pstr);
Packit Service f629e6
# endif /* RE_ENABLE_I18N */
Packit Service f629e6
static void build_upper_buffer (re_string_t *pstr);
Packit Service f629e6
static void re_string_translate_buffer (re_string_t *pstr);
Packit Service f629e6
static unsigned int re_string_context_at (const re_string_t *input, int idx,
Packit Service f629e6
					  int eflags) __attribute__ ((pure));
Packit Service f629e6
#endif
Packit Service f629e6
/* Accessor macros for re_string_t.  PSTR is a pointer to the string
   object.  Every argument is parenthesized so that compound
   expressions (for example an OFFSET of `n << 1') expand with the
   intended precedence.  */

/* The byte OFFSET positions away from the current index; the index is
   not changed.  */
#define re_string_peek_byte(pstr, offset) \
  ((pstr)->mbs[(pstr)->cur_idx + (offset)])
/* The byte at the current index; the index is then advanced by one.  */
#define re_string_fetch_byte(pstr) \
  ((pstr)->mbs[(pstr)->cur_idx++])
/* Nonzero if IDX equals VALID_LEN or wcs[IDX] is not WEOF.  */
#define re_string_first_byte(pstr, idx) \
  ((idx) == (pstr)->valid_len || (pstr)->wcs[(idx)] != WEOF)
/* Nonzero if wcs[IDX] is not WEOF and IDX is either the last valid
   position or is followed by a slot that is not WEOF.  */
#define re_string_is_single_byte_char(pstr, idx) \
  ((pstr)->wcs[(idx)] != WEOF && ((pstr)->valid_len == (idx) + 1 \
				  || (pstr)->wcs[(idx) + 1] != WEOF))
/* Nonzero once the current index has reached STOP.  */
#define re_string_eoi(pstr) ((pstr)->stop <= (pstr)->cur_idx)
#define re_string_cur_idx(pstr) ((pstr)->cur_idx)
#define re_string_get_buffer(pstr) ((pstr)->mbs)
#define re_string_length(pstr) ((pstr)->len)
#define re_string_byte_at(pstr,idx) ((pstr)->mbs[(idx)])
/* Advance the current index by IDX bytes.  */
#define re_string_skip_bytes(pstr,idx) ((pstr)->cur_idx += (idx))
/* Set the current index to IDX.  */
#define re_string_set_index(pstr,idx) ((pstr)->cur_idx = (idx))
Packit Service f629e6
Packit Service f629e6
#ifndef _LIBC
Packit Service f629e6
# if HAVE_ALLOCA
Packit Service f629e6
#  include <alloca.h>
Packit Service f629e6
/* The OS usually guarantees only one guard page at the bottom of the stack,
Packit Service f629e6
   and a page size can be as small as 4096 bytes.  So we cannot safely
Packit Service f629e6
   allocate anything larger than 4096 bytes.  Also care for the possibility
Packit Service f629e6
   of a few compiler-allocated temporary stack slots.  */
Packit Service f629e6
#  define __libc_use_alloca(n) ((n) < 4032)
Packit Service f629e6
# else
Packit Service f629e6
/* alloca is implemented with malloc, so just use malloc.  */
Packit Service f629e6
#  define __libc_use_alloca(n) 0
Packit Service f629e6
# endif
Packit Service f629e6
#endif
Packit Service f629e6
Packit Service f629e6
/*
Packit Service f629e6
 * GAWK checks for zero-size allocations everywhere else,
Packit Service f629e6
 * do it here too.
Packit Service f629e6
 */
Packit Service f629e6
#ifdef GAWK
/* Allocate COUNT bytes with malloc.  A request for zero bytes is
   reported on stderr, tagged with FILE and LINE, and terminates the
   program with exit status 1.  */
static void *
test_malloc(size_t count, const char *file, size_t line)
{
	void *result = NULL;

	if (count != 0)
		result = malloc(count);
	else {
		fprintf(stderr, "%s:%lu: allocation of zero bytes\n",
				file, (unsigned long) line);
		exit(1);
	}
	return result;
}

/* Resize P to COUNT bytes with realloc.  A request for zero bytes is
   reported on stderr, tagged with FILE and LINE, and terminates the
   program with exit status 1.  */
static void *
test_realloc(void *p, size_t count, const char *file, size_t line)
{
	void *result = NULL;

	if (count != 0)
		result = realloc(p, count);
	else {
		fprintf(stderr, "%s:%lu: reallocation of zero bytes\n",
				file, (unsigned long) line);
		exit(1);
	}
	return result;
}

/* Typed allocation of N objects of type T through the checking wrappers.  */
# define re_malloc(t,n) \
  ((t *) test_malloc (((n) * sizeof (t)), __FILE__, __LINE__))
# define re_realloc(p,t,n) \
  ((t *) test_realloc (p, (n) * sizeof (t), __FILE__, __LINE__))
#else /* not GAWK */
/* Typed allocation of N objects of type T straight from the C library.  */
# define re_malloc(t,n) \
  ((t *) malloc ((n) * sizeof (t)))
# define re_realloc(p,t,n) \
  ((t *) realloc (p, (n) * sizeof (t)))
#endif /* GAWK */
/* Release storage obtained from re_malloc or re_realloc.  */
#define re_free(p) free (p)
Packit Service f629e6
Packit Service f629e6
struct bin_tree_t
Packit Service f629e6
{
Packit Service f629e6
  struct bin_tree_t *parent;
Packit Service f629e6
  struct bin_tree_t *left;
Packit Service f629e6
  struct bin_tree_t *right;
Packit Service f629e6
  struct bin_tree_t *first;
Packit Service f629e6
  struct bin_tree_t *next;
Packit Service f629e6
Packit Service f629e6
  re_token_t token;
Packit Service f629e6
Packit Service f629e6
  /* `node_idx' is the index in dfa->nodes, if `type' == 0.
Packit Service f629e6
     Otherwise `type' indicates the type of this node.  */
Packit Service f629e6
  int node_idx;
Packit Service f629e6
};
Packit Service f629e6
typedef struct bin_tree_t bin_tree_t;
Packit Service f629e6
Packit Service f629e6
#define BIN_TREE_STORAGE_SIZE \
Packit Service f629e6
  ((1024 - sizeof (void *)) / sizeof (bin_tree_t))
Packit Service f629e6
Packit Service f629e6
struct bin_tree_storage_t
Packit Service f629e6
{
Packit Service f629e6
  struct bin_tree_storage_t *next;
Packit Service f629e6
  bin_tree_t data[BIN_TREE_STORAGE_SIZE];
Packit Service f629e6
};
Packit Service f629e6
typedef struct bin_tree_storage_t bin_tree_storage_t;
Packit Service f629e6
Packit Service f629e6
#define CONTEXT_WORD 1
Packit Service f629e6
#define CONTEXT_NEWLINE (CONTEXT_WORD << 1)
Packit Service f629e6
#define CONTEXT_BEGBUF (CONTEXT_NEWLINE << 1)
Packit Service f629e6
#define CONTEXT_ENDBUF (CONTEXT_BEGBUF << 1)
Packit Service f629e6
Packit Service f629e6
#define IS_WORD_CONTEXT(c) ((c) & CONTEXT_WORD)
Packit Service f629e6
#define IS_NEWLINE_CONTEXT(c) ((c) & CONTEXT_NEWLINE)
Packit Service f629e6
#define IS_BEGBUF_CONTEXT(c) ((c) & CONTEXT_BEGBUF)
Packit Service f629e6
#define IS_ENDBUF_CONTEXT(c) ((c) & CONTEXT_ENDBUF)
Packit Service f629e6
#define IS_ORDINARY_CONTEXT(c) ((c) == 0)
Packit Service f629e6
Packit Service f629e6
#define IS_WORD_CHAR(ch) (isalnum (ch) || (ch) == '_')
Packit Service f629e6
#define IS_NEWLINE(ch) ((ch) == NEWLINE_CHAR)
Packit Service f629e6
#define IS_WIDE_WORD_CHAR(ch) (iswalnum (ch) || (ch) == L'_')
Packit Service f629e6
#define IS_WIDE_NEWLINE(ch) ((ch) == WIDE_NEWLINE_CHAR)
Packit Service f629e6
Packit Service f629e6
/* Evaluate to nonzero if CONTEXT (a mask of CONTEXT_* bits) fails one
   of the PREV_* requirements set in CONSTRAINT.  CONSTRAINT is
   parenthesized at every use so that an argument such as `a | b' is
   masked as a whole.  Both arguments are evaluated more than once.  */
#define NOT_SATISFY_PREV_CONSTRAINT(constraint,context) \
 ((((constraint) & PREV_WORD_CONSTRAINT) && !IS_WORD_CONTEXT (context)) \
  || (((constraint) & PREV_NOTWORD_CONSTRAINT) && IS_WORD_CONTEXT (context)) \
  || (((constraint) & PREV_NEWLINE_CONSTRAINT) && !IS_NEWLINE_CONTEXT (context)) \
  || (((constraint) & PREV_BEGBUF_CONSTRAINT) && !IS_BEGBUF_CONTEXT (context)))

/* Evaluate to nonzero if CONTEXT (a mask of CONTEXT_* bits) fails one
   of the NEXT_* requirements set in CONSTRAINT.  Both arguments are
   evaluated more than once.  */
#define NOT_SATISFY_NEXT_CONSTRAINT(constraint,context) \
 ((((constraint) & NEXT_WORD_CONSTRAINT) && !IS_WORD_CONTEXT (context)) \
  || (((constraint) & NEXT_NOTWORD_CONSTRAINT) && IS_WORD_CONTEXT (context)) \
  || (((constraint) & NEXT_NEWLINE_CONSTRAINT) && !IS_NEWLINE_CONTEXT (context)) \
  || (((constraint) & NEXT_ENDBUF_CONSTRAINT) && !IS_ENDBUF_CONTEXT (context)))
Packit Service f629e6
Packit Service f629e6
struct re_dfastate_t
Packit Service f629e6
{
Packit Service f629e6
  unsigned int hash;
Packit Service f629e6
  re_node_set nodes;
Packit Service f629e6
  re_node_set non_eps_nodes;
Packit Service f629e6
  re_node_set inveclosure;
Packit Service f629e6
  re_node_set *entrance_nodes;
Packit Service f629e6
  struct re_dfastate_t **trtable, **word_trtable;
Packit Service f629e6
  unsigned int context : 4;
Packit Service f629e6
  unsigned int halt : 1;
Packit Service f629e6
  /* If this state can accept `multi byte'.
Packit Service f629e6
     Note that we refer to multibyte characters, and multi character
Packit Service f629e6
     collating elements as `multi byte'.  */
Packit Service f629e6
  unsigned int accept_mb : 1;
Packit Service f629e6
  /* If this state has backreference node(s).  */
Packit Service f629e6
  unsigned int has_backref : 1;
Packit Service f629e6
  unsigned int has_constraint : 1;
Packit Service f629e6
};
Packit Service f629e6
typedef struct re_dfastate_t re_dfastate_t;
Packit Service f629e6
Packit Service f629e6
struct re_state_table_entry
Packit Service f629e6
{
Packit Service f629e6
  int num;
Packit Service f629e6
  int alloc;
Packit Service f629e6
  re_dfastate_t **array;
Packit Service f629e6
};
Packit Service f629e6
Packit Service f629e6
/* Array type used in re_sub_match_last_t and re_sub_match_top_t.  */
Packit Service f629e6
Packit Service f629e6
typedef struct
Packit Service f629e6
{
Packit Service f629e6
  int next_idx;
Packit Service f629e6
  int alloc;
Packit Service f629e6
  re_dfastate_t **array;
Packit Service f629e6
} state_array_t;
Packit Service f629e6
Packit Service f629e6
/* Store information about the node NODE whose type is OP_CLOSE_SUBEXP.  */
Packit Service f629e6
Packit Service f629e6
typedef struct
Packit Service f629e6
{
Packit Service f629e6
  int node; /* NODE itself; presumably an index into dfa->nodes (TODO confirm).  */
Packit Service f629e6
  int str_idx; /* The position NODE matches at.  */
Packit Service f629e6
  state_array_t path; /* State array held by value for this entry.  */
Packit Service f629e6
} re_sub_match_last_t;
Packit Service f629e6
Packit Service f629e6
/* Store information about the node NODE whose type is OP_OPEN_SUBEXP.
Packit Service f629e6
   And information about the node, whose type is OP_CLOSE_SUBEXP,
Packit Service f629e6
   corresponding to NODE is stored in LASTS.  */
Packit Service f629e6
Packit Service f629e6
typedef struct
Packit Service f629e6
{
Packit Service f629e6
  int str_idx;
Packit Service f629e6
  int node;
Packit Service f629e6
  state_array_t *path;
Packit Service f629e6
  int alasts; /* Allocation size of LASTS.  */
Packit Service f629e6
  int nlasts; /* The number of LASTS.  */
Packit Service f629e6
  re_sub_match_last_t **lasts;
Packit Service f629e6
} re_sub_match_top_t;
Packit Service f629e6
Packit Service f629e6
struct re_backref_cache_entry
Packit Service f629e6
{
Packit Service f629e6
  int node;
Packit Service f629e6
  int str_idx;
Packit Service f629e6
  int subexp_from;
Packit Service f629e6
  int subexp_to;
Packit Service f629e6
  char more;
Packit Service f629e6
  char unused;
Packit Service f629e6
  unsigned short int eps_reachable_subexps_map;
Packit Service f629e6
};
Packit Service f629e6
Packit Service f629e6
typedef struct
Packit Service f629e6
{
Packit Service f629e6
  /* The string object corresponding to the input string.  */
Packit Service f629e6
  re_string_t input;
Packit Service f629e6
#if defined _LIBC || (defined __STDC_VERSION__ && __STDC_VERSION__ >= 199901L)
Packit Service f629e6
  const re_dfa_t *const dfa;
Packit Service f629e6
#else
Packit Service f629e6
  const re_dfa_t *dfa;
Packit Service f629e6
#endif
Packit Service f629e6
  /* EFLAGS of the argument of regexec.  */
Packit Service f629e6
  int eflags;
Packit Service f629e6
  /* Where the matching ends.  */
Packit Service f629e6
  int match_last;
Packit Service f629e6
  int last_node;
Packit Service f629e6
  /* The state log used by the matcher.  */
Packit Service f629e6
  re_dfastate_t **state_log;
Packit Service f629e6
  int state_log_top;
Packit Service f629e6
  /* Back reference cache.  */
Packit Service f629e6
  int nbkref_ents;
Packit Service f629e6
  int abkref_ents;
Packit Service f629e6
  struct re_backref_cache_entry *bkref_ents;
Packit Service f629e6
  int max_mb_elem_len;
Packit Service f629e6
  int nsub_tops;
Packit Service f629e6
  int asub_tops;
Packit Service f629e6
  re_sub_match_top_t **sub_tops;
Packit Service f629e6
} re_match_context_t;
Packit Service f629e6
Packit Service f629e6
typedef struct
Packit Service f629e6
{
Packit Service f629e6
  re_dfastate_t **sifted_states;
Packit Service f629e6
  re_dfastate_t **limited_states;
Packit Service f629e6
  int last_node;
Packit Service f629e6
  int last_str_idx;
Packit Service f629e6
  re_node_set limits;
Packit Service f629e6
} re_sift_context_t;
Packit Service f629e6
Packit Service f629e6
struct re_fail_stack_ent_t
Packit Service f629e6
{
Packit Service f629e6
  int idx;
Packit Service f629e6
  int node;
Packit Service f629e6
  regmatch_t *regs;
Packit Service f629e6
  re_node_set eps_via_nodes;
Packit Service f629e6
};
Packit Service f629e6
Packit Service f629e6
/* A stack of struct re_fail_stack_ent_t entries.  NOTE(review): NUM and
   ALLOC are presumably the used and the allocated entry counts --
   confirm against the push/pop code.  */
struct re_fail_stack_t
{
  int num, alloc;
  struct re_fail_stack_ent_t *stack;
};
Packit Service f629e6
Packit Service f629e6
struct re_dfa_t
Packit Service f629e6
{
Packit Service f629e6
  re_token_t *nodes;
Packit Service f629e6
  size_t nodes_alloc;
Packit Service f629e6
  size_t nodes_len;
Packit Service f629e6
  int *nexts;
Packit Service f629e6
  int *org_indices;
Packit Service f629e6
  re_node_set *edests;
Packit Service f629e6
  re_node_set *eclosures;
Packit Service f629e6
  re_node_set *inveclosures;
Packit Service f629e6
  struct re_state_table_entry *state_table;
Packit Service f629e6
  re_dfastate_t *init_state;
Packit Service f629e6
  re_dfastate_t *init_state_word;
Packit Service f629e6
  re_dfastate_t *init_state_nl;
Packit Service f629e6
  re_dfastate_t *init_state_begbuf;
Packit Service f629e6
  bin_tree_t *str_tree;
Packit Service f629e6
  bin_tree_storage_t *str_tree_storage;
Packit Service f629e6
  re_bitset_ptr_t sb_char;
Packit Service f629e6
  int str_tree_storage_idx;
Packit Service f629e6
Packit Service f629e6
  /* number of subexpressions `re_nsub' is in regex_t.  */
Packit Service f629e6
  unsigned int state_hash_mask;
Packit Service f629e6
  int init_node;
Packit Service f629e6
  int nbackref; /* The number of backreference in this dfa.  */
Packit Service f629e6
Packit Service f629e6
  /* Bitmap expressing which backreference is used.  */
Packit Service f629e6
  bitset_word_t used_bkref_map;
Packit Service f629e6
  bitset_word_t completed_bkref_map;
Packit Service f629e6
Packit Service f629e6
  unsigned int has_plural_match : 1;
Packit Service f629e6
  /* If this dfa has "multibyte node", which is a backreference or
Packit Service f629e6
     a node which can accept multibyte character or multi character
Packit Service f629e6
     collating element.  */
Packit Service f629e6
  unsigned int has_mb_node : 1;
Packit Service f629e6
  unsigned int is_utf8 : 1;
Packit Service f629e6
  unsigned int map_notascii : 1;
Packit Service f629e6
  unsigned int word_ops_used : 1;
Packit Service f629e6
  int mb_cur_max;
Packit Service f629e6
  bitset_t word_char;
Packit Service f629e6
  reg_syntax_t syntax;
Packit Service f629e6
  int *subexp_map;
Packit Service f629e6
#ifdef DEBUG
Packit Service f629e6
  char* re_str;
Packit Service f629e6
#endif
Packit Service f629e6
#ifdef _LIBC
Packit Service f629e6
  __libc_lock_define (, lock)
Packit Service f629e6
#endif
Packit Service f629e6
};
Packit Service f629e6
Packit Service f629e6
/* Helper macros for re_node_set objects.  SET / P are pointers.  */

/* Zero every byte of *SET.  */
#define re_node_set_init_empty(set) \
  memset ((set), 0, sizeof (re_node_set))

/* Pass the result of re_node_set_contains (SET, ID), minus one, to
   re_node_set_remove_at.  */
#define re_node_set_remove(set, id) \
  (re_node_set_remove_at ((set), re_node_set_contains ((set), (id)) - 1))

/* Reset the element count of *P to zero; nothing else is touched.  */
#define re_node_set_empty(p) ((p)->nelem = 0)

/* Release the element array of *SET with re_free.  */
#define re_node_set_free(set) re_free ((set)->elems)
Packit Service f629e6

Packit Service f629e6
Packit Service f629e6
/* Tag stored in the `type' member of bracket_elem_t.  The numeric
   values are spelled out; they equal the implicit ones.  */
typedef enum
{
  SB_CHAR = 0,
  MB_CHAR = 1,
  EQUIV_CLASS = 2,
  COLL_SYM = 3,
  CHAR_CLASS = 4
} bracket_elem_type;
Packit Service f629e6
Packit Service f629e6
typedef struct
Packit Service f629e6
{
Packit Service f629e6
  bracket_elem_type type;
Packit Service f629e6
  union
Packit Service f629e6
  {
Packit Service f629e6
    unsigned char ch;
Packit Service f629e6
    unsigned char *name;
Packit Service f629e6
    wchar_t wch;
Packit Service f629e6
  } opr;
Packit Service f629e6
} bracket_elem_t;
Packit Service f629e6
Packit Service f629e6
Packit Service f629e6
/* Inline functions for bitset operations.  */
Packit Service f629e6
static void __attribute__ ((unused))
Packit Service f629e6
bitset_not (bitset_t set)
Packit Service f629e6
{
Packit Service f629e6
  int bitset_i;
Packit Service f629e6
  for (bitset_i = 0; bitset_i < BITSET_WORDS; ++bitset_i)
Packit Service f629e6
    set[bitset_i] = ~set[bitset_i];
Packit Service f629e6
}
Packit Service f629e6
Packit Service f629e6
static void __attribute__ ((unused))
Packit Service f629e6
bitset_merge (bitset_t dest, const bitset_t src)
Packit Service f629e6
{
Packit Service f629e6
  int bitset_i;
Packit Service f629e6
  for (bitset_i = 0; bitset_i < BITSET_WORDS; ++bitset_i)
Packit Service f629e6
    dest[bitset_i] |= src[bitset_i];
Packit Service f629e6
}
Packit Service f629e6
Packit Service f629e6
static void __attribute__ ((unused))
Packit Service f629e6
bitset_mask (bitset_t dest, const bitset_t src)
Packit Service f629e6
{
Packit Service f629e6
  int bitset_i;
Packit Service f629e6
  for (bitset_i = 0; bitset_i < BITSET_WORDS; ++bitset_i)
Packit Service f629e6
    dest[bitset_i] &= src[bitset_i];
Packit Service f629e6
}
Packit Service f629e6
Packit Service f629e6
#ifdef RE_ENABLE_I18N
Packit Service f629e6
/* Inline functions for re_string.  */
Packit Service f629e6
static int
Packit Service f629e6
__attribute__ ((pure, unused))
Packit Service f629e6
re_string_char_size_at (const re_string_t *pstr, int idx)
Packit Service f629e6
{
Packit Service f629e6
  int byte_idx;
Packit Service f629e6
  if (pstr->mb_cur_max == 1)
Packit Service f629e6
    return 1;
Packit Service f629e6
  for (byte_idx = 1; idx + byte_idx < pstr->valid_len; ++byte_idx)
Packit Service f629e6
    if (pstr->wcs[idx + byte_idx] != WEOF)
Packit Service f629e6
      break;
Packit Service f629e6
  return byte_idx;
Packit Service f629e6
}
Packit Service f629e6
Packit Service f629e6
static wint_t
Packit Service f629e6
__attribute__ ((pure, unused))
Packit Service f629e6
re_string_wchar_at (const re_string_t *pstr, int idx)
Packit Service f629e6
{
Packit Service f629e6
  if (pstr->mb_cur_max == 1)
Packit Service f629e6
    return (wint_t) pstr->mbs[idx];
Packit Service f629e6
  return (wint_t) pstr->wcs[idx];
Packit Service f629e6
}
Packit Service f629e6
Packit Service f629e6
# ifndef NOT_IN_libc
Packit Service f629e6
#  ifdef _LIBC
Packit Service f629e6
#   include <locale/weight.h>
Packit Service f629e6
#  endif
Packit Service f629e6
Packit Service f629e6
static int
Packit Service f629e6
__attribute__ ((pure, unused))
Packit Service f629e6
re_string_elem_size_at (const re_string_t *pstr, int idx)
Packit Service f629e6
{
Packit Service f629e6
#  ifdef _LIBC
Packit Service f629e6
  const unsigned char *p, *extra;
Packit Service f629e6
  const int32_t *table, *indirect;
Packit Service f629e6
  uint_fast32_t nrules = _NL_CURRENT_WORD (LC_COLLATE, _NL_COLLATE_NRULES);
Packit Service f629e6
Packit Service f629e6
  if (nrules != 0)
Packit Service f629e6
    {
Packit Service f629e6
      table = (const int32_t *) _NL_CURRENT (LC_COLLATE, _NL_COLLATE_TABLEMB);
Packit Service f629e6
      extra = (const unsigned char *)
Packit Service f629e6
	_NL_CURRENT (LC_COLLATE, _NL_COLLATE_EXTRAMB);
Packit Service f629e6
      indirect = (const int32_t *) _NL_CURRENT (LC_COLLATE,
Packit Service f629e6
						_NL_COLLATE_INDIRECTMB);
Packit Service f629e6
      p = pstr->mbs + idx;
Packit Service f629e6
      findidx (table, indirect, extra, &p, pstr->len - idx);
Packit Service f629e6
      return p - pstr->mbs - idx;
Packit Service f629e6
    }
Packit Service f629e6
  else
Packit Service f629e6
#  endif /* _LIBC */
Packit Service f629e6
    return 1;
Packit Service f629e6
}
Packit Service f629e6
# endif
Packit Service f629e6
#endif /* RE_ENABLE_I18N */
Packit Service f629e6
Packit Service f629e6
#endif /*  _REGEX_INTERNAL_H */