Blame lex.c

Packit 991819
/*	$OpenBSD: lex.c,v 1.51 2015/09/10 22:48:58 nicm Exp $	*/
Packit 991819
Packit 991819
/*-
Packit 991819
 * Copyright (c) 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010,
Packit 991819
 *		 2011, 2012, 2013, 2014, 2015, 2016, 2017, 2018
Packit 991819
 *	mirabilos <m@mirbsd.org>
Packit 991819
 *
Packit 991819
 * Provided that these terms and disclaimer and all copyright notices
Packit 991819
 * are retained or reproduced in an accompanying document, permission
Packit 991819
 * is granted to deal in this work without restriction, including un-
Packit 991819
 * limited rights to use, publicly perform, distribute, sell, modify,
Packit 991819
 * merge, give away, or sublicence.
Packit 991819
 *
Packit 991819
 * This work is provided "AS IS" and WITHOUT WARRANTY of any kind, to
Packit 991819
 * the utmost extent permitted by applicable law, neither express nor
Packit 991819
 * implied; without malicious intent or gross negligence. In no event
Packit 991819
 * may a licensor, author or contributor be held liable for indirect,
Packit 991819
 * direct, other damage, loss, or other issues arising in any way out
Packit 991819
 * of dealing in the work, even if advised of the possibility of such
Packit 991819
 * damage or existence of a defect, except proven that it results out
Packit 991819
 * of said person's immediate fault when using the work as intended.
Packit 991819
 */
Packit 991819
Packit 991819
#include "sh.h"
Packit 991819
Packit 991819
__RCSID("$MirOS: src/bin/mksh/lex.c,v 1.247 2018/01/14 01:44:01 tg Exp $");
Packit 991819
Packit 991819
/*
Packit 991819
 * states while lexing word
Packit 991819
 */
Packit 991819
#define SBASE		0	/* outside any lexical constructs */
Packit 991819
#define SWORD		1	/* implicit quoting for substitute() */
Packit 991819
#define SLETPAREN	2	/* inside (( )), implicit quoting */
Packit 991819
#define SSQUOTE		3	/* inside '' */
Packit 991819
#define SDQUOTE		4	/* inside "" */
Packit 991819
#define SEQUOTE		5	/* inside $'' */
Packit 991819
#define SBRACE		6	/* inside ${} */
Packit 991819
#define SQBRACE		7	/* inside "${}" */
Packit 991819
#define SBQUOTE		8	/* inside `` */
Packit 991819
#define SASPAREN	9	/* inside $(( )) */
Packit 991819
#define SHEREDELIM	10	/* parsing << or <<- delimiter */
Packit 991819
#define SHEREDQUOTE	11	/* parsing " in << or <<- delimiter */
Packit 991819
#define SPATTERN	12	/* parsing *(...|...) pattern (*+?@!) */
Packit 991819
#define SADELIM		13	/* like SBASE, looking for delimiter */
Packit 991819
#define STBRACEKORN	14	/* parsing ${...[#%]...} !FSH */
Packit 991819
#define STBRACEBOURNE	15	/* parsing ${...[#%]...} FSH */
Packit 991819
#define SINVALID	255	/* invalid state */
Packit 991819
Packit 991819
struct sretrace_info {
Packit 991819
	struct sretrace_info *next;
Packit 991819
	XString xs;
Packit 991819
	char *xp;
Packit 991819
};
Packit 991819
Packit 991819
/*
Packit 991819
 * Structure to keep track of the lexing state and the various pieces of info
Packit 991819
 * needed for each particular state.
Packit 991819
 */
Packit 991819
typedef struct lex_state {
Packit 991819
	union {
Packit 991819
		/* point to the next state block */
Packit 991819
		struct lex_state *base;
Packit 991819
		/* marks start of state output in output string */
Packit 991819
		size_t start;
Packit 991819
		/* SBQUOTE: true if in double quotes: "`...`" */
Packit 991819
		/* SEQUOTE: got NUL, ignore rest of string */
Packit 991819
		bool abool;
Packit 991819
		/* SADELIM information */
Packit 991819
		struct {
Packit 991819
			/* character to search for */
Packit 991819
			unsigned char delimiter;
Packit 991819
			/* max. number of delimiters */
Packit 991819
			unsigned char num;
Packit 991819
		} adelim;
Packit 991819
	} u;
Packit 991819
	/* count open parentheses */
Packit 991819
	short nparen;
Packit 991819
	/* type of this state */
Packit 991819
	uint8_t type;
Packit 991819
} Lex_state;
Packit 991819
#define ls_base		u.base
Packit 991819
#define ls_start	u.start
Packit 991819
#define ls_bool		u.abool
Packit 991819
#define ls_adelim	u.adelim
Packit 991819
Packit 991819
typedef struct {
Packit 991819
	Lex_state *base;
Packit 991819
	Lex_state *end;
Packit 991819
} State_info;
Packit 991819
Packit 991819
static void readhere(struct ioword *);
Packit 991819
static void ungetsc(int);
Packit 991819
static void ungetsc_i(int);
Packit 991819
static int getsc_uu(void);
Packit 991819
static void getsc_line(Source *);
Packit 991819
static int getsc_bn(void);
Packit 991819
static int getsc_i(void);
Packit 991819
static char *get_brace_var(XString *, char *);
Packit 991819
static bool arraysub(char **);
Packit 991819
static void gethere(void);
Packit 991819
static Lex_state *push_state_i(State_info *, Lex_state *);
Packit 991819
static Lex_state *pop_state_i(State_info *, Lex_state *);
Packit 991819
Packit 991819
static int backslash_skip;
Packit 991819
static int ignore_backslash_newline;
Packit 991819
Packit 991819
/* optimised getsc_bn() */
Packit 991819
#define o_getsc()	(*source->str != '\0' && *source->str != '\\' && \
Packit 991819
			    !backslash_skip ? *source->str++ : getsc_bn())
Packit 991819
/* optimised getsc_uu() */
Packit 991819
#define	o_getsc_u()	((*source->str != '\0') ? *source->str++ : getsc_uu())
Packit 991819
Packit 991819
/* retrace helper */
Packit 991819
#define o_getsc_r(carg)					\
Packit 991819
	int cev = (carg);				\
Packit 991819
	struct sretrace_info *rp = retrace_info;	\
Packit 991819
							\
Packit 991819
	while (rp) {					\
Packit 991819
		Xcheck(rp->xs, rp->xp);			\
Packit 991819
		*rp->xp++ = cev;			\
Packit 991819
		rp = rp->next;				\
Packit 991819
	}						\
Packit 991819
							\
Packit 991819
	return (cev);
Packit 991819
Packit 991819
/* callback */
Packit 991819
static int
Packit 991819
getsc_i(void)
Packit 991819
{
Packit 991819
	o_getsc_r((unsigned int)(unsigned char)o_getsc());
Packit 991819
}
Packit 991819
Packit 991819
#if defined(MKSH_SMALL) && !defined(MKSH_SMALL_BUT_FAST)
Packit 991819
#define getsc()		getsc_i()
Packit 991819
#else
Packit 991819
static int getsc_r(int);
Packit 991819
Packit 991819
static int
Packit 991819
getsc_r(int c)
Packit 991819
{
Packit 991819
	o_getsc_r(c);
Packit 991819
}
Packit 991819
Packit 991819
#define getsc()		getsc_r((unsigned int)(unsigned char)o_getsc())
Packit 991819
#endif
Packit 991819
Packit 991819
#define STATE_BSIZE	8
Packit 991819
Packit 991819
#define PUSH_STATE(s)	do {					\
Packit 991819
	if (++statep == state_info.end)				\
Packit 991819
		statep = push_state_i(&state_info, statep);	\
Packit 991819
	state = statep->type = (s);				\
Packit 991819
} while (/* CONSTCOND */ 0)
Packit 991819
Packit 991819
#define POP_STATE()	do {					\
Packit 991819
	if (--statep == state_info.base)			\
Packit 991819
		statep = pop_state_i(&state_info, statep);	\
Packit 991819
	state = statep->type;					\
Packit 991819
} while (/* CONSTCOND */ 0)
Packit 991819
Packit 991819
#define PUSH_SRETRACE(s) do {					\
Packit 991819
	struct sretrace_info *ri;				\
Packit 991819
								\
Packit 991819
	PUSH_STATE(s);						\
Packit 991819
	statep->ls_start = Xsavepos(ws, wp);			\
Packit 991819
	ri = alloc(sizeof(struct sretrace_info), ATEMP);	\
Packit 991819
	Xinit(ri->xs, ri->xp, 64, ATEMP);			\
Packit 991819
	ri->next = retrace_info;				\
Packit 991819
	retrace_info = ri;					\
Packit 991819
} while (/* CONSTCOND */ 0)
Packit 991819
Packit 991819
#define POP_SRETRACE()	do {					\
Packit 991819
	wp = Xrestpos(ws, wp, statep->ls_start);		\
Packit 991819
	*retrace_info->xp = '\0';				\
Packit 991819
	sp = Xstring(retrace_info->xs, retrace_info->xp);	\
Packit 991819
	dp = (void *)retrace_info;				\
Packit 991819
	retrace_info = retrace_info->next;			\
Packit 991819
	afree(dp, ATEMP);					\
Packit 991819
	POP_STATE();						\
Packit 991819
} while (/* CONSTCOND */ 0)
Packit 991819
Packit 991819
/**
Packit 991819
 * Lexical analyser
Packit 991819
 *
Packit 991819
 * tokens are not regular expressions, they are LL(1).
Packit 991819
 * for example, "${var:-${PWD}}", and "$(size $(whence ksh))".
Packit 991819
 * hence the state stack. Note "$(...)" are now parsed recursively.
Packit 991819
 */
Packit 991819
Packit 991819
int
Packit 991819
yylex(int cf)
Packit 991819
{
Packit 991819
	Lex_state states[STATE_BSIZE], *statep, *s2, *base;
Packit 991819
	State_info state_info;
Packit 991819
	int c, c2, state;
Packit 991819
	size_t cz;
Packit 991819
	XString ws;		/* expandable output word */
Packit 991819
	char *wp;		/* output word pointer */
Packit 991819
	char *sp, *dp;
Packit 991819
Packit 991819
 Again:
Packit 991819
	states[0].type = SINVALID;
Packit 991819
	states[0].ls_base = NULL;
Packit 991819
	statep = &states[1];
Packit 991819
	state_info.base = states;
Packit 991819
	state_info.end = &state_info.base[STATE_BSIZE];
Packit 991819
Packit 991819
	Xinit(ws, wp, 64, ATEMP);
Packit 991819
Packit 991819
	backslash_skip = 0;
Packit 991819
	ignore_backslash_newline = 0;
Packit 991819
Packit 991819
	if (cf & ONEWORD)
Packit 991819
		state = SWORD;
Packit 991819
	else if (cf & LETEXPR) {
Packit 991819
		/* enclose arguments in (double) quotes */
Packit 991819
		*wp++ = OQUOTE;
Packit 991819
		state = SLETPAREN;
Packit 991819
		statep->nparen = 0;
Packit 991819
	} else {
Packit 991819
		/* normal lexing */
Packit 991819
		state = (cf & HEREDELIM) ? SHEREDELIM : SBASE;
Packit 991819
		do {
Packit 991819
			c = getsc();
Packit 991819
		} while (ctype(c, C_BLANK));
Packit 991819
		if (c == '#') {
Packit 991819
			ignore_backslash_newline++;
Packit 991819
			do {
Packit 991819
				c = getsc();
Packit 991819
			} while (!ctype(c, C_NUL | C_LF));
Packit 991819
			ignore_backslash_newline--;
Packit 991819
		}
Packit 991819
		ungetsc(c);
Packit 991819
	}
Packit 991819
	if (source->flags & SF_ALIAS) {
Packit 991819
		/* trailing ' ' in alias definition */
Packit 991819
		source->flags &= ~SF_ALIAS;
Packit 991819
		/* POSIX: trailing space only counts if parsing simple cmd */
Packit 991819
		if (!Flag(FPOSIX) || (cf & CMDWORD))
Packit 991819
			cf |= ALIAS;
Packit 991819
	}
Packit 991819
Packit 991819
	/* Initial state: one of SWORD SLETPAREN SHEREDELIM SBASE */
Packit 991819
	statep->type = state;
Packit 991819
Packit 991819
	/* collect non-special or quoted characters to form word */
Packit 991819
	while (!((c = getsc()) == 0 ||
Packit 991819
	    ((state == SBASE || state == SHEREDELIM) && ctype(c, C_LEX1)))) {
Packit 991819
		if (state == SBASE &&
Packit 991819
		    subshell_nesting_type == ORD(/*{*/ '}') &&
Packit 991819
		    (unsigned int)c == ORD(/*{*/ '}'))
Packit 991819
			/* possibly end ${ :;} */
Packit 991819
			break;
Packit 991819
		Xcheck(ws, wp);
Packit 991819
		switch (state) {
Packit 991819
		case SADELIM:
Packit 991819
			if ((unsigned int)c == ORD('('))
Packit 991819
				statep->nparen++;
Packit 991819
			else if ((unsigned int)c == ORD(')'))
Packit 991819
				statep->nparen--;
Packit 991819
			else if (statep->nparen == 0 &&
Packit 991819
			    ((unsigned int)c == ORD(/*{*/ '}') ||
Packit 991819
			    c == (int)statep->ls_adelim.delimiter)) {
Packit 991819
				*wp++ = ADELIM;
Packit 991819
				*wp++ = c;
Packit 991819
				if ((unsigned int)c == ORD(/*{*/ '}') ||
Packit 991819
				    --statep->ls_adelim.num == 0)
Packit 991819
					POP_STATE();
Packit 991819
				if ((unsigned int)c == ORD(/*{*/ '}'))
Packit 991819
					POP_STATE();
Packit 991819
				break;
Packit 991819
			}
Packit 991819
			/* FALLTHROUGH */
Packit 991819
		case SBASE:
Packit 991819
			if ((unsigned int)c == ORD('[') && (cf & CMDASN)) {
Packit 991819
				/* temporary */
Packit 991819
				*wp = EOS;
Packit 991819
				if (is_wdvarname(Xstring(ws, wp), false)) {
Packit 991819
					char *p, *tmp;
Packit 991819
Packit 991819
					if (arraysub(&tmp)) {
Packit 991819
						*wp++ = CHAR;
Packit 991819
						*wp++ = c;
Packit 991819
						for (p = tmp; *p; ) {
Packit 991819
							Xcheck(ws, wp);
Packit 991819
							*wp++ = CHAR;
Packit 991819
							*wp++ = *p++;
Packit 991819
						}
Packit 991819
						afree(tmp, ATEMP);
Packit 991819
						break;
Packit 991819
					}
Packit 991819
				}
Packit 991819
				*wp++ = CHAR;
Packit 991819
				*wp++ = c;
Packit 991819
				break;
Packit 991819
			}
Packit 991819
			/* FALLTHROUGH */
Packit 991819
 Sbase1:		/* includes *(...|...) pattern (*+?@!) */
Packit 991819
			if (ctype(c, C_PATMO)) {
Packit 991819
				c2 = getsc();
Packit 991819
				if ((unsigned int)c2 == ORD('(' /*)*/)) {
Packit 991819
					*wp++ = OPAT;
Packit 991819
					*wp++ = c;
Packit 991819
					PUSH_STATE(SPATTERN);
Packit 991819
					break;
Packit 991819
				}
Packit 991819
				ungetsc(c2);
Packit 991819
			}
Packit 991819
			/* FALLTHROUGH */
Packit 991819
 Sbase2:		/* doesn't include *(...|...) pattern (*+?@!) */
Packit 991819
			switch (c) {
Packit 991819
			case ORD('\\'):
Packit 991819
 getsc_qchar:
Packit 991819
				if ((c = getsc())) {
Packit 991819
					/* trailing \ is lost */
Packit 991819
					*wp++ = QCHAR;
Packit 991819
					*wp++ = c;
Packit 991819
				}
Packit 991819
				break;
Packit 991819
			case ORD('\''):
Packit 991819
 open_ssquote_unless_heredoc:
Packit 991819
				if ((cf & HEREDOC))
Packit 991819
					goto store_char;
Packit 991819
				*wp++ = OQUOTE;
Packit 991819
				ignore_backslash_newline++;
Packit 991819
				PUSH_STATE(SSQUOTE);
Packit 991819
				break;
Packit 991819
			case ORD('"'):
Packit 991819
 open_sdquote:
Packit 991819
				*wp++ = OQUOTE;
Packit 991819
				PUSH_STATE(SDQUOTE);
Packit 991819
				break;
Packit 991819
			case ORD('$'):
Packit 991819
				/*
Packit 991819
				 * processing of dollar sign belongs into
Packit 991819
				 * Subst, except for those which can open
Packit 991819
				 * a string: $'…' and $"…"
Packit 991819
				 */
Packit 991819
 subst_dollar_ex:
Packit 991819
				c = getsc();
Packit 991819
				switch (c) {
Packit 991819
				case ORD('"'):
Packit 991819
					goto open_sdquote;
Packit 991819
				case ORD('\''):
Packit 991819
					goto open_sequote;
Packit 991819
				default:
Packit 991819
					goto SubstS;
Packit 991819
				}
Packit 991819
			default:
Packit 991819
				goto Subst;
Packit 991819
			}
Packit 991819
			break;
Packit 991819
Packit 991819
 Subst:
Packit 991819
			switch (c) {
Packit 991819
			case ORD('\\'):
Packit 991819
				c = getsc();
Packit 991819
				switch (c) {
Packit 991819
				case ORD('"'):
Packit 991819
					if ((cf & HEREDOC))
Packit 991819
						goto heredocquote;
Packit 991819
					/* FALLTHROUGH */
Packit 991819
				case ORD('\\'):
Packit 991819
				case ORD('$'):
Packit 991819
				case ORD('`'):
Packit 991819
 store_qchar:
Packit 991819
					*wp++ = QCHAR;
Packit 991819
					*wp++ = c;
Packit 991819
					break;
Packit 991819
				default:
Packit 991819
 heredocquote:
Packit 991819
					Xcheck(ws, wp);
Packit 991819
					if (c) {
Packit 991819
						/* trailing \ is lost */
Packit 991819
						*wp++ = CHAR;
Packit 991819
						*wp++ = '\\';
Packit 991819
						*wp++ = CHAR;
Packit 991819
						*wp++ = c;
Packit 991819
					}
Packit 991819
					break;
Packit 991819
				}
Packit 991819
				break;
Packit 991819
			case ORD('$'):
Packit 991819
				c = getsc();
Packit 991819
 SubstS:
Packit 991819
				if ((unsigned int)c == ORD('(' /*)*/)) {
Packit 991819
					c = getsc();
Packit 991819
					if ((unsigned int)c == ORD('(' /*)*/)) {
Packit 991819
						*wp++ = EXPRSUB;
Packit 991819
						PUSH_SRETRACE(SASPAREN);
Packit 991819
						statep->nparen = 2;
Packit 991819
						*retrace_info->xp++ = '(';
Packit 991819
					} else {
Packit 991819
						ungetsc(c);
Packit 991819
 subst_command:
Packit 991819
						c = COMSUB;
Packit 991819
 subst_command2:
Packit 991819
						sp = yyrecursive(c);
Packit 991819
						cz = strlen(sp) + 1;
Packit 991819
						XcheckN(ws, wp, cz);
Packit 991819
						*wp++ = c;
Packit 991819
						memcpy(wp, sp, cz);
Packit 991819
						wp += cz;
Packit 991819
					}
Packit 991819
				} else if ((unsigned int)c == ORD('{' /*}*/)) {
Packit 991819
					if ((unsigned int)(c = getsc()) == ORD('|')) {
Packit 991819
						/*
Packit 991819
						 * non-subenvironment
Packit 991819
						 * value substitution
Packit 991819
						 */
Packit 991819
						c = VALSUB;
Packit 991819
						goto subst_command2;
Packit 991819
					} else if (ctype(c, C_IFSWS)) {
Packit 991819
						/*
Packit 991819
						 * non-subenvironment
Packit 991819
						 * "command" substitution
Packit 991819
						 */
Packit 991819
						c = FUNSUB;
Packit 991819
						goto subst_command2;
Packit 991819
					}
Packit 991819
					ungetsc(c);
Packit 991819
					*wp++ = OSUBST;
Packit 991819
					*wp++ = '{' /*}*/;
Packit 991819
					wp = get_brace_var(&ws, wp);
Packit 991819
					c = getsc();
Packit 991819
					/* allow :# and :% (ksh88 compat) */
Packit 991819
					if ((unsigned int)c == ORD(':')) {
Packit 991819
						*wp++ = CHAR;
Packit 991819
						*wp++ = c;
Packit 991819
						c = getsc();
Packit 991819
						if ((unsigned int)c == ORD(':')) {
Packit 991819
							*wp++ = CHAR;
Packit 991819
							*wp++ = '0';
Packit 991819
							*wp++ = ADELIM;
Packit 991819
							*wp++ = ':';
Packit 991819
							PUSH_STATE(SBRACE);
Packit 991819
							PUSH_STATE(SADELIM);
Packit 991819
							statep->ls_adelim.delimiter = ':';
Packit 991819
							statep->ls_adelim.num = 1;
Packit 991819
							statep->nparen = 0;
Packit 991819
							break;
Packit 991819
						} else if (ctype(c, C_DIGIT | C_DOLAR | C_SPC) ||
Packit 991819
						    /*XXX what else? */
Packit 991819
						    c == '(' /*)*/) {
Packit 991819
							/* substring subst. */
Packit 991819
							if (c != ' ') {
Packit 991819
								*wp++ = CHAR;
Packit 991819
								*wp++ = ' ';
Packit 991819
							}
Packit 991819
							ungetsc(c);
Packit 991819
							PUSH_STATE(SBRACE);
Packit 991819
							PUSH_STATE(SADELIM);
Packit 991819
							statep->ls_adelim.delimiter = ':';
Packit 991819
							statep->ls_adelim.num = 2;
Packit 991819
							statep->nparen = 0;
Packit 991819
							break;
Packit 991819
						}
Packit 991819
					} else if (c == '/') {
Packit 991819
						c2 = ADELIM;
Packit 991819
 parse_adelim_slash:
Packit 991819
						*wp++ = CHAR;
Packit 991819
						*wp++ = c;
Packit 991819
						if ((unsigned int)(c = getsc()) == ORD('/')) {
Packit 991819
							*wp++ = c2;
Packit 991819
							*wp++ = c;
Packit 991819
						} else
Packit 991819
							ungetsc(c);
Packit 991819
						PUSH_STATE(SBRACE);
Packit 991819
						PUSH_STATE(SADELIM);
Packit 991819
						statep->ls_adelim.delimiter = '/';
Packit 991819
						statep->ls_adelim.num = 1;
Packit 991819
						statep->nparen = 0;
Packit 991819
						break;
Packit 991819
					} else if (c == '@') {
Packit 991819
						c2 = getsc();
Packit 991819
						ungetsc(c2);
Packit 991819
						if ((unsigned int)c2 == ORD('/')) {
Packit 991819
							c2 = CHAR;
Packit 991819
							goto parse_adelim_slash;
Packit 991819
						}
Packit 991819
					}
Packit 991819
					/*
Packit 991819
					 * If this is a trim operation,
Packit 991819
					 * treat (,|,) specially in STBRACE.
Packit 991819
					 */
Packit 991819
					if (ctype(c, C_SUB2)) {
Packit 991819
						ungetsc(c);
Packit 991819
						if (Flag(FSH))
Packit 991819
							PUSH_STATE(STBRACEBOURNE);
Packit 991819
						else
Packit 991819
							PUSH_STATE(STBRACEKORN);
Packit 991819
					} else {
Packit 991819
						ungetsc(c);
Packit 991819
						if (state == SDQUOTE ||
Packit 991819
						    state == SQBRACE)
Packit 991819
							PUSH_STATE(SQBRACE);
Packit 991819
						else
Packit 991819
							PUSH_STATE(SBRACE);
Packit 991819
					}
Packit 991819
				} else if (ctype(c, C_ALPHX)) {
Packit 991819
					*wp++ = OSUBST;
Packit 991819
					*wp++ = 'X';
Packit 991819
					do {
Packit 991819
						Xcheck(ws, wp);
Packit 991819
						*wp++ = c;
Packit 991819
						c = getsc();
Packit 991819
					} while (ctype(c, C_ALNUX));
Packit 991819
					*wp++ = '\0';
Packit 991819
					*wp++ = CSUBST;
Packit 991819
					*wp++ = 'X';
Packit 991819
					ungetsc(c);
Packit 991819
				} else if (ctype(c, C_VAR1 | C_DIGIT)) {
Packit 991819
					Xcheck(ws, wp);
Packit 991819
					*wp++ = OSUBST;
Packit 991819
					*wp++ = 'X';
Packit 991819
					*wp++ = c;
Packit 991819
					*wp++ = '\0';
Packit 991819
					*wp++ = CSUBST;
Packit 991819
					*wp++ = 'X';
Packit 991819
				} else {
Packit 991819
					*wp++ = CHAR;
Packit 991819
					*wp++ = '$';
Packit 991819
					ungetsc(c);
Packit 991819
				}
Packit 991819
				break;
Packit 991819
			case ORD('`'):
Packit 991819
 subst_gravis:
Packit 991819
				PUSH_STATE(SBQUOTE);
Packit 991819
				*wp++ = COMASUB;
Packit 991819
				/*
Packit 991819
				 * We need to know whether we are within double
Packit 991819
				 * quotes in order to translate \" to " within
Packit 991819
				 * "…`…\"…`…" because, unlike for COMSUBs, the
Packit 991819
				 * outer double quoteing changes the backslash
Packit 991819
				 * meaning for the inside. For more details:
Packit 991819
				 * http://austingroupbugs.net/view.php?id=1015
Packit 991819
				 */
Packit 991819
				statep->ls_bool = false;
Packit 991819
				s2 = statep;
Packit 991819
				base = state_info.base;
Packit 991819
				while (/* CONSTCOND */ 1) {
Packit 991819
					for (; s2 != base; s2--) {
Packit 991819
						if (s2->type == SDQUOTE) {
Packit 991819
							statep->ls_bool = true;
Packit 991819
							break;
Packit 991819
						}
Packit 991819
					}
Packit 991819
					if (s2 != base)
Packit 991819
						break;
Packit 991819
					if (!(s2 = s2->ls_base))
Packit 991819
						break;
Packit 991819
					base = s2-- - STATE_BSIZE;
Packit 991819
				}
Packit 991819
				break;
Packit 991819
			case QCHAR:
Packit 991819
				if (cf & LQCHAR) {
Packit 991819
					*wp++ = QCHAR;
Packit 991819
					*wp++ = getsc();
Packit 991819
					break;
Packit 991819
				}
Packit 991819
				/* FALLTHROUGH */
Packit 991819
			default:
Packit 991819
 store_char:
Packit 991819
				*wp++ = CHAR;
Packit 991819
				*wp++ = c;
Packit 991819
			}
Packit 991819
			break;
Packit 991819
Packit 991819
		case SEQUOTE:
Packit 991819
			if ((unsigned int)c == ORD('\'')) {
Packit 991819
				POP_STATE();
Packit 991819
				*wp++ = CQUOTE;
Packit 991819
				ignore_backslash_newline--;
Packit 991819
			} else if ((unsigned int)c == ORD('\\')) {
Packit 991819
				if ((c2 = unbksl(true, getsc_i, ungetsc)) == -1)
Packit 991819
					c2 = getsc();
Packit 991819
				if (c2 == 0)
Packit 991819
					statep->ls_bool = true;
Packit 991819
				if (!statep->ls_bool) {
Packit 991819
					char ts[4];
Packit 991819
Packit 991819
					if ((unsigned int)c2 < 0x100) {
Packit 991819
						*wp++ = QCHAR;
Packit 991819
						*wp++ = c2;
Packit 991819
					} else {
Packit 991819
						cz = utf_wctomb(ts, c2 - 0x100);
Packit 991819
						ts[cz] = 0;
Packit 991819
						cz = 0;
Packit 991819
						do {
Packit 991819
							*wp++ = QCHAR;
Packit 991819
							*wp++ = ts[cz];
Packit 991819
						} while (ts[++cz]);
Packit 991819
					}
Packit 991819
				}
Packit 991819
			} else if (!statep->ls_bool) {
Packit 991819
				*wp++ = QCHAR;
Packit 991819
				*wp++ = c;
Packit 991819
			}
Packit 991819
			break;
Packit 991819
Packit 991819
		case SSQUOTE:
Packit 991819
			if ((unsigned int)c == ORD('\'')) {
Packit 991819
				POP_STATE();
Packit 991819
				if ((cf & HEREDOC) || state == SQBRACE)
Packit 991819
					goto store_char;
Packit 991819
				*wp++ = CQUOTE;
Packit 991819
				ignore_backslash_newline--;
Packit 991819
			} else {
Packit 991819
				*wp++ = QCHAR;
Packit 991819
				*wp++ = c;
Packit 991819
			}
Packit 991819
			break;
Packit 991819
Packit 991819
		case SDQUOTE:
Packit 991819
			if ((unsigned int)c == ORD('"')) {
Packit 991819
				POP_STATE();
Packit 991819
				*wp++ = CQUOTE;
Packit 991819
			} else
Packit 991819
				goto Subst;
Packit 991819
			break;
Packit 991819
Packit 991819
		/* $(( ... )) */
Packit 991819
		case SASPAREN:
Packit 991819
			if ((unsigned int)c == ORD('('))
Packit 991819
				statep->nparen++;
Packit 991819
			else if ((unsigned int)c == ORD(')')) {
Packit 991819
				statep->nparen--;
Packit 991819
				if (statep->nparen == 1) {
Packit 991819
					/* end of EXPRSUB */
Packit 991819
					POP_SRETRACE();
Packit 991819
Packit 991819
					if ((unsigned int)(c2 = getsc()) == ORD(/*(*/ ')')) {
Packit 991819
						cz = strlen(sp) - 2;
Packit 991819
						XcheckN(ws, wp, cz);
Packit 991819
						memcpy(wp, sp + 1, cz);
Packit 991819
						wp += cz;
Packit 991819
						afree(sp, ATEMP);
Packit 991819
						*wp++ = '\0';
Packit 991819
						break;
Packit 991819
					} else {
Packit 991819
						Source *s;
Packit 991819
Packit 991819
						ungetsc(c2);
Packit 991819
						/*
Packit 991819
						 * mismatched parenthesis -
Packit 991819
						 * assume we were really
Packit 991819
						 * parsing a $(...) expression
Packit 991819
						 */
Packit 991819
						--wp;
Packit 991819
						s = pushs(SREREAD,
Packit 991819
						    source->areap);
Packit 991819
						s->start = s->str =
Packit 991819
						    s->u.freeme = sp;
Packit 991819
						s->next = source;
Packit 991819
						source = s;
Packit 991819
						goto subst_command;
Packit 991819
					}
Packit 991819
				}
Packit 991819
			}
Packit 991819
			/* reuse existing state machine */
Packit 991819
			goto Sbase2;
Packit 991819
Packit 991819
		case SQBRACE:
Packit 991819
			if ((unsigned int)c == ORD('\\')) {
Packit 991819
				/*
Packit 991819
				 * perform POSIX "quote removal" if the back-
Packit 991819
				 * slash is "special", i.e. same cases as the
Packit 991819
				 * {case '\\':} in Subst: plus closing brace;
Packit 991819
				 * in mksh code "quote removal" on '\c' means
Packit 991819
				 * write QCHAR+c, otherwise CHAR+\+CHAR+c are
Packit 991819
				 * emitted (in heredocquote:)
Packit 991819
				 */
Packit 991819
				if ((unsigned int)(c = getsc()) == ORD('"') ||
Packit 991819
				    (unsigned int)c == ORD('\\') ||
Packit 991819
				    ctype(c, C_DOLAR | C_GRAVE) ||
Packit 991819
				    (unsigned int)c == ORD(/*{*/ '}'))
Packit 991819
					goto store_qchar;
Packit 991819
				goto heredocquote;
Packit 991819
			}
Packit 991819
			goto common_SQBRACE;
Packit 991819
Packit 991819
		case SBRACE:
Packit 991819
			if ((unsigned int)c == ORD('\''))
Packit 991819
				goto open_ssquote_unless_heredoc;
Packit 991819
			else if ((unsigned int)c == ORD('\\'))
Packit 991819
				goto getsc_qchar;
Packit 991819
 common_SQBRACE:
Packit 991819
			if ((unsigned int)c == ORD('"'))
Packit 991819
				goto open_sdquote;
Packit 991819
			else if ((unsigned int)c == ORD('$'))
Packit 991819
				goto subst_dollar_ex;
Packit 991819
			else if ((unsigned int)c == ORD('`'))
Packit 991819
				goto subst_gravis;
Packit 991819
			else if ((unsigned int)c != ORD(/*{*/ '}'))
Packit 991819
				goto store_char;
Packit 991819
			POP_STATE();
Packit 991819
			*wp++ = CSUBST;
Packit 991819
			*wp++ = /*{*/ '}';
Packit 991819
			break;
Packit 991819
Packit 991819
		/* Same as SBASE, except (,|,) treated specially */
Packit 991819
		case STBRACEKORN:
Packit 991819
			if ((unsigned int)c == ORD('|'))
Packit 991819
				*wp++ = SPAT;
Packit 991819
			else if ((unsigned int)c == ORD('(')) {
Packit 991819
				*wp++ = OPAT;
Packit 991819
				/* simile for @ */
Packit 991819
				*wp++ = ' ';
Packit 991819
				PUSH_STATE(SPATTERN);
Packit 991819
			} else /* FALLTHROUGH */
Packit 991819
		case STBRACEBOURNE:
Packit 991819
			  if ((unsigned int)c == ORD(/*{*/ '}')) {
Packit 991819
				POP_STATE();
Packit 991819
				*wp++ = CSUBST;
Packit 991819
				*wp++ = /*{*/ '}';
Packit 991819
			} else
Packit 991819
				goto Sbase1;
Packit 991819
			break;
Packit 991819
Packit 991819
		case SBQUOTE:
Packit 991819
			if ((unsigned int)c == ORD('`')) {
Packit 991819
				*wp++ = 0;
Packit 991819
				POP_STATE();
Packit 991819
			} else if ((unsigned int)c == ORD('\\')) {
Packit 991819
				switch (c = getsc()) {
Packit 991819
				case 0:
Packit 991819
					/* trailing \ is lost */
Packit 991819
					break;
Packit 991819
				case ORD('$'):
Packit 991819
				case ORD('`'):
Packit 991819
				case ORD('\\'):
Packit 991819
					*wp++ = c;
Packit 991819
					break;
Packit 991819
				case ORD('"'):
Packit 991819
					if (statep->ls_bool) {
Packit 991819
						*wp++ = c;
Packit 991819
						break;
Packit 991819
					}
Packit 991819
					/* FALLTHROUGH */
Packit 991819
				default:
Packit 991819
					*wp++ = '\\';
Packit 991819
					*wp++ = c;
Packit 991819
					break;
Packit 991819
				}
Packit 991819
			} else
Packit 991819
				*wp++ = c;
Packit 991819
			break;
Packit 991819
Packit 991819
		/* ONEWORD */
Packit 991819
		case SWORD:
Packit 991819
			goto Subst;
Packit 991819
Packit 991819
		/* LETEXPR: (( ... )) */
Packit 991819
		case SLETPAREN:
Packit 991819
			if ((unsigned int)c == ORD(/*(*/ ')')) {
Packit 991819
				if (statep->nparen > 0)
Packit 991819
					--statep->nparen;
Packit 991819
				else if ((unsigned int)(c2 = getsc()) == ORD(/*(*/ ')')) {
Packit 991819
					c = 0;
Packit 991819
					*wp++ = CQUOTE;
Packit 991819
					goto Done;
Packit 991819
				} else {
Packit 991819
					Source *s;
Packit 991819
Packit 991819
					ungetsc(c2);
Packit 991819
					ungetsc(c);
Packit 991819
					/*
Packit 991819
					 * mismatched parenthesis -
Packit 991819
					 * assume we were really
Packit 991819
					 * parsing a (...) expression
Packit 991819
					 */
Packit 991819
					*wp = EOS;
Packit 991819
					sp = Xstring(ws, wp);
Packit 991819
					dp = wdstrip(sp + 1, WDS_TPUTS);
Packit 991819
					s = pushs(SREREAD, source->areap);
Packit 991819
					s->start = s->str = s->u.freeme = dp;
Packit 991819
					s->next = source;
Packit 991819
					source = s;
Packit 991819
					ungetsc('(' /*)*/);
Packit 991819
					return (ORD('(' /*)*/));
Packit 991819
				}
Packit 991819
			} else if ((unsigned int)c == ORD('('))
Packit 991819
				/*
Packit 991819
				 * parentheses inside quotes and
Packit 991819
				 * backslashes are lost, but AT&T ksh
Packit 991819
				 * doesn't count them either
Packit 991819
				 */
Packit 991819
				++statep->nparen;
Packit 991819
			goto Sbase2;
Packit 991819
Packit 991819
		/* << or <<- delimiter */
Packit 991819
		case SHEREDELIM:
Packit 991819
			/*
Packit 991819
			 * here delimiters need a special case since
Packit 991819
			 * $ and `...` are not to be treated specially
Packit 991819
			 */
Packit 991819
			switch (c) {
Packit 991819
			case ORD('\\'):
Packit 991819
				if ((c = getsc())) {
Packit 991819
					/* trailing \ is lost */
Packit 991819
					*wp++ = QCHAR;
Packit 991819
					*wp++ = c;
Packit 991819
				}
Packit 991819
				break;
Packit 991819
			case ORD('\''):
Packit 991819
				goto open_ssquote_unless_heredoc;
Packit 991819
			case ORD('$'):
Packit 991819
				if ((unsigned int)(c2 = getsc()) == ORD('\'')) {
Packit 991819
 open_sequote:
Packit 991819
					*wp++ = OQUOTE;
Packit 991819
					ignore_backslash_newline++;
Packit 991819
					PUSH_STATE(SEQUOTE);
Packit 991819
					statep->ls_bool = false;
Packit 991819
					break;
Packit 991819
				} else if ((unsigned int)c2 == ORD('"')) {
Packit 991819
					/* FALLTHROUGH */
Packit 991819
			case ORD('"'):
Packit 991819
					PUSH_SRETRACE(SHEREDQUOTE);
Packit 991819
					break;
Packit 991819
				}
Packit 991819
				ungetsc(c2);
Packit 991819
				/* FALLTHROUGH */
Packit 991819
			default:
Packit 991819
				*wp++ = CHAR;
Packit 991819
				*wp++ = c;
Packit 991819
			}
Packit 991819
			break;
Packit 991819
Packit 991819
		/* " in << or <<- delimiter */
Packit 991819
		case SHEREDQUOTE:
Packit 991819
			if ((unsigned int)c != ORD('"'))
Packit 991819
				goto Subst;
Packit 991819
			POP_SRETRACE();
Packit 991819
			dp = strnul(sp) - 1;
Packit 991819
			/* remove the trailing double quote */
Packit 991819
			*dp = '\0';
Packit 991819
			/* store the quoted string */
Packit 991819
			*wp++ = OQUOTE;
Packit 991819
			XcheckN(ws, wp, (dp - sp) * 2);
Packit 991819
			dp = sp;
Packit 991819
			while ((c = *dp++)) {
Packit 991819
				if (c == '\\') {
Packit 991819
					switch ((c = *dp++)) {
Packit 991819
					case ORD('\\'):
Packit 991819
					case ORD('"'):
Packit 991819
					case ORD('$'):
Packit 991819
					case ORD('`'):
Packit 991819
						break;
Packit 991819
					default:
Packit 991819
						*wp++ = CHAR;
Packit 991819
						*wp++ = '\\';
Packit 991819
						break;
Packit 991819
					}
Packit 991819
				}
Packit 991819
				*wp++ = CHAR;
Packit 991819
				*wp++ = c;
Packit 991819
			}
Packit 991819
			afree(sp, ATEMP);
Packit 991819
			*wp++ = CQUOTE;
Packit 991819
			state = statep->type = SHEREDELIM;
Packit 991819
			break;
Packit 991819
Packit 991819
		/* in *(...|...) pattern (*+?@!) */
Packit 991819
		case SPATTERN:
Packit 991819
			if ((unsigned int)c == ORD(/*(*/ ')')) {
Packit 991819
				*wp++ = CPAT;
Packit 991819
				POP_STATE();
Packit 991819
			} else if ((unsigned int)c == ORD('|')) {
Packit 991819
				*wp++ = SPAT;
Packit 991819
			} else if ((unsigned int)c == ORD('(')) {
Packit 991819
				*wp++ = OPAT;
Packit 991819
				/* simile for @ */
Packit 991819
				*wp++ = ' ';
Packit 991819
				PUSH_STATE(SPATTERN);
Packit 991819
			} else
Packit 991819
				goto Sbase1;
Packit 991819
			break;
Packit 991819
		}
Packit 991819
	}
Packit 991819
 Done:
Packit 991819
	Xcheck(ws, wp);
Packit 991819
	if (statep != &states[1])
Packit 991819
		/* XXX figure out what is missing */
Packit 991819
		yyerror("no closing quote");
Packit 991819
Packit 991819
	/* This done to avoid tests for SHEREDELIM wherever SBASE tested */
Packit 991819
	if (state == SHEREDELIM)
Packit 991819
		state = SBASE;
Packit 991819
Packit 991819
	dp = Xstring(ws, wp);
Packit 991819
	if (state == SBASE && (
Packit 991819
	    (c == '&' && !Flag(FSH) && !Flag(FPOSIX)) ||
Packit 991819
	    ctype(c, C_ANGLE)) && ((c2 = Xlength(ws, wp)) == 0 ||
Packit 991819
	    (c2 == 2 && dp[0] == CHAR && ctype(dp[1], C_DIGIT)))) {
Packit 991819
		struct ioword *iop = alloc(sizeof(struct ioword), ATEMP);
Packit 991819
Packit 991819
		iop->unit = c2 == 2 ? ksh_numdig(dp[1]) : c == '<' ? 0 : 1;
Packit 991819
Packit 991819
		if (c == '&') {
Packit 991819
			if ((unsigned int)(c2 = getsc()) != ORD('>')) {
Packit 991819
				ungetsc(c2);
Packit 991819
				goto no_iop;
Packit 991819
			}
Packit 991819
			c = c2;
Packit 991819
			iop->ioflag = IOBASH;
Packit 991819
		} else
Packit 991819
			iop->ioflag = 0;
Packit 991819
Packit 991819
		c2 = getsc();
Packit 991819
		/* <<, >>, <> are ok, >< is not */
Packit 991819
		if (c == c2 || ((unsigned int)c == ORD('<') &&
Packit 991819
		    (unsigned int)c2 == ORD('>'))) {
Packit 991819
			iop->ioflag |= c == c2 ?
Packit 991819
			    ((unsigned int)c == ORD('>') ? IOCAT : IOHERE) : IORDWR;
Packit 991819
			if (iop->ioflag == IOHERE) {
Packit 991819
				if ((unsigned int)(c2 = getsc()) == ORD('-'))
Packit 991819
					iop->ioflag |= IOSKIP;
Packit 991819
				else if ((unsigned int)c2 == ORD('<'))
Packit 991819
					iop->ioflag |= IOHERESTR;
Packit 991819
				else
Packit 991819
					ungetsc(c2);
Packit 991819
			}
Packit 991819
		} else if ((unsigned int)c2 == ORD('&'))
Packit 991819
			iop->ioflag |= IODUP | ((unsigned int)c == ORD('<') ? IORDUP : 0);
Packit 991819
		else {
Packit 991819
			iop->ioflag |= (unsigned int)c == ORD('>') ? IOWRITE : IOREAD;
Packit 991819
			if ((unsigned int)c == ORD('>') && (unsigned int)c2 == ORD('|'))
Packit 991819
				iop->ioflag |= IOCLOB;
Packit 991819
			else
Packit 991819
				ungetsc(c2);
Packit 991819
		}
Packit 991819
Packit 991819
		iop->ioname = NULL;
Packit 991819
		iop->delim = NULL;
Packit 991819
		iop->heredoc = NULL;
Packit 991819
		/* free word */
Packit 991819
		Xfree(ws, wp);
Packit 991819
		yylval.iop = iop;
Packit 991819
		return (REDIR);
Packit 991819
 no_iop:
Packit 991819
		afree(iop, ATEMP);
Packit 991819
	}
Packit 991819
Packit 991819
	if (wp == dp && state == SBASE) {
Packit 991819
		/* free word */
Packit 991819
		Xfree(ws, wp);
Packit 991819
		/* no word, process LEX1 character */
Packit 991819
		if (((unsigned int)c == ORD('|')) ||
Packit 991819
		    ((unsigned int)c == ORD('&')) ||
Packit 991819
		    ((unsigned int)c == ORD(';')) ||
Packit 991819
		    ((unsigned int)c == ORD('(' /*)*/))) {
Packit 991819
			if ((c2 = getsc()) == c)
Packit 991819
				c = ((unsigned int)c == ORD(';')) ? BREAK :
Packit 991819
				    ((unsigned int)c == ORD('|')) ? LOGOR :
Packit 991819
				    ((unsigned int)c == ORD('&')) ? LOGAND :
Packit 991819
				    /* (unsigned int)c == ORD('(' )) */ MDPAREN;
Packit 991819
			else if ((unsigned int)c == ORD('|') && (unsigned int)c2 == ORD('&'))
Packit 991819
				c = COPROC;
Packit 991819
			else if ((unsigned int)c == ORD(';') && (unsigned int)c2 == ORD('|'))
Packit 991819
				c = BRKEV;
Packit 991819
			else if ((unsigned int)c == ORD(';') && (unsigned int)c2 == ORD('&'))
Packit 991819
				c = BRKFT;
Packit 991819
			else
Packit 991819
				ungetsc(c2);
Packit 991819
#ifndef MKSH_SMALL
Packit 991819
			if (c == BREAK) {
Packit 991819
				if ((unsigned int)(c2 = getsc()) == ORD('&'))
Packit 991819
					c = BRKEV;
Packit 991819
				else
Packit 991819
					ungetsc(c2);
Packit 991819
			}
Packit 991819
#endif
Packit 991819
		} else if ((unsigned int)c == ORD('\n')) {
Packit 991819
			if (cf & HEREDELIM)
Packit 991819
				ungetsc(c);
Packit 991819
			else {
Packit 991819
				gethere();
Packit 991819
				if (cf & CONTIN)
Packit 991819
					goto Again;
Packit 991819
			}
Packit 991819
		} else if (c == '\0' && !(cf & HEREDELIM)) {
Packit 991819
			struct ioword **p = heres;
Packit 991819
Packit 991819
			while (p < herep)
Packit 991819
				if ((*p)->ioflag & IOHERESTR)
Packit 991819
					++p;
Packit 991819
				else
Packit 991819
					/* ksh -c 'cat <
Packit 991819
					yyerror(Tf_heredoc,
Packit 991819
					    evalstr((*p)->delim, 0));
Packit 991819
		}
Packit 991819
		return (c);
Packit 991819
	}
Packit 991819
Packit 991819
	/* terminate word */
Packit 991819
	*wp++ = EOS;
Packit 991819
	yylval.cp = Xclose(ws, wp);
Packit 991819
	if (state == SWORD || state == SLETPAREN
Packit 991819
	    /* XXX ONEWORD? */)
Packit 991819
		return (LWORD);
Packit 991819
Packit 991819
	/* unget terminator */
Packit 991819
	ungetsc(c);
Packit 991819
Packit 991819
	/*
Packit 991819
	 * note: the alias-vs-function code below depends on several
Packit 991819
	 * interna: starting from here, source->str is not modified;
Packit 991819
	 * the way getsc() and ungetsc() operate; etc.
Packit 991819
	 */
Packit 991819
Packit 991819
	/* copy word to unprefixed string ident */
Packit 991819
	sp = yylval.cp;
Packit 991819
	dp = ident;
Packit 991819
	while ((dp - ident) < IDENT && (c = *sp++) == CHAR)
Packit 991819
		*dp++ = *sp++;
Packit 991819
	if (c != EOS)
Packit 991819
		/* word is not unquoted, or space ran out */
Packit 991819
		dp = ident;
Packit 991819
	/* make sure the ident array stays NUL padded */
Packit 991819
	memset(dp, 0, (ident + IDENT) - dp + 1);
Packit 991819
Packit 991819
	if (*ident != '\0' && (cf & (KEYWORD | ALIAS))) {
Packit 991819
		struct tbl *p;
Packit 991819
		uint32_t h = hash(ident);
Packit 991819
Packit 991819
		if ((cf & KEYWORD) && (p = ktsearch(&keywords, ident, h)) &&
Packit 991819
		    (!(cf & ESACONLY) || p->val.i == ESAC ||
Packit 991819
		    (unsigned int)p->val.i == ORD(/*{*/ '}'))) {
Packit 991819
			afree(yylval.cp, ATEMP);
Packit 991819
			return (p->val.i);
Packit 991819
		}
Packit 991819
		if ((cf & ALIAS) && (p = ktsearch(&aliases, ident, h)) &&
Packit 991819
		    (p->flag & ISSET)) {
Packit 991819
			/*
Packit 991819
			 * this still points to the same character as the
Packit 991819
			 * ungetsc'd terminator from above
Packit 991819
			 */
Packit 991819
			const char *cp = source->str;
Packit 991819
Packit 991819
			/* prefer POSIX but not Korn functions over aliases */
Packit 991819
			while (ctype(*cp, C_BLANK))
Packit 991819
				/*
Packit 991819
				 * this is like getsc() without skipping
Packit 991819
				 * over Source boundaries (including not
Packit 991819
				 * parsing ungetsc'd characters that got
Packit 991819
				 * pushed into an SREREAD) which is what
Packit 991819
				 * we want here anyway: find out whether
Packit 991819
				 * the alias name is followed by a POSIX
Packit 991819
				 * function definition
Packit 991819
				 */
Packit 991819
				++cp;
Packit 991819
			/* prefer functions over aliases */
Packit 991819
			if (cp[0] != '(' || cp[1] != ')') {
Packit 991819
				Source *s = source;
Packit 991819
Packit 991819
				while (s && (s->flags & SF_HASALIAS))
Packit 991819
					if (s->u.tblp == p)
Packit 991819
						return (LWORD);
Packit 991819
					else
Packit 991819
						s = s->next;
Packit 991819
				/* push alias expansion */
Packit 991819
				s = pushs(SALIAS, source->areap);
Packit 991819
				s->start = s->str = p->val.s;
Packit 991819
				s->u.tblp = p;
Packit 991819
				s->flags |= SF_HASALIAS;
Packit 991819
				s->line = source->line;
Packit 991819
				s->next = source;
Packit 991819
				if (source->type == SEOF) {
Packit 991819
					/* prevent infinite recursion at EOS */
Packit 991819
					source->u.tblp = p;
Packit 991819
					source->flags |= SF_HASALIAS;
Packit 991819
				}
Packit 991819
				source = s;
Packit 991819
				afree(yylval.cp, ATEMP);
Packit 991819
				goto Again;
Packit 991819
			}
Packit 991819
		}
Packit 991819
	} else if (*ident == '\0') {
Packit 991819
		/* retain typeset et al. even when quoted */
Packit 991819
		struct tbl *tt = get_builtin((dp = wdstrip(yylval.cp, 0)));
Packit 991819
		uint32_t flag = tt ? tt->flag : 0;
Packit 991819
Packit 991819
		if (flag & (DECL_UTIL | DECL_FWDR))
Packit 991819
			strlcpy(ident, dp, sizeof(ident));
Packit 991819
		afree(dp, ATEMP);
Packit 991819
	}
Packit 991819
Packit 991819
	return (LWORD);
Packit 991819
}
Packit 991819
Packit 991819
static void
Packit 991819
gethere(void)
Packit 991819
{
Packit 991819
	struct ioword **p;
Packit 991819
Packit 991819
	for (p = heres; p < herep; p++)
Packit 991819
		if (!((*p)->ioflag & IOHERESTR))
Packit 991819
			readhere(*p);
Packit 991819
	herep = heres;
Packit 991819
}
Packit 991819
Packit 991819
/*
Packit 991819
 * read "<
Packit 991819
 */
Packit 991819
Packit 991819
static void
Packit 991819
readhere(struct ioword *iop)
Packit 991819
{
Packit 991819
	int c;
Packit 991819
	const char *eof, *eofp;
Packit 991819
	XString xs;
Packit 991819
	char *xp;
Packit 991819
	size_t xpos;
Packit 991819
Packit 991819
	eof = evalstr(iop->delim, 0);
Packit 991819
Packit 991819
	if (!(iop->ioflag & IOEVAL))
Packit 991819
		ignore_backslash_newline++;
Packit 991819
Packit 991819
	Xinit(xs, xp, 256, ATEMP);
Packit 991819
Packit 991819
 heredoc_read_line:
Packit 991819
	/* beginning of line */
Packit 991819
	eofp = eof;
Packit 991819
	xpos = Xsavepos(xs, xp);
Packit 991819
	if (iop->ioflag & IOSKIP) {
Packit 991819
		/* skip over leading tabs */
Packit 991819
		while ((c = getsc()) == '\t')
Packit 991819
			;	/* nothing */
Packit 991819
		goto heredoc_parse_char;
Packit 991819
	}
Packit 991819
 heredoc_read_char:
Packit 991819
	c = getsc();
Packit 991819
 heredoc_parse_char:
Packit 991819
	/* compare with here document marker */
Packit 991819
	if (!*eofp) {
Packit 991819
		/* end of here document marker, what to do? */
Packit 991819
		switch (c) {
Packit 991819
		case ORD(/*(*/ ')'):
Packit 991819
			if (!subshell_nesting_type)
Packit 991819
				/*-
Packit 991819
				 * not allowed outside $(...) or (...)
Packit 991819
				 * => mismatch
Packit 991819
				 */
Packit 991819
				break;
Packit 991819
			/* allow $(...) or (...) to close here */
Packit 991819
			ungetsc(/*(*/ ')');
Packit 991819
			/* FALLTHROUGH */
Packit 991819
		case 0:
Packit 991819
			/*
Packit 991819
			 * Allow EOF here to commands without trailing
Packit 991819
			 * newlines (mksh -c '...') will work as well.
Packit 991819
			 */
Packit 991819
		case ORD('\n'):
Packit 991819
			/* Newline terminates here document marker */
Packit 991819
			goto heredoc_found_terminator;
Packit 991819
		}
Packit 991819
	} else if (c == *eofp++)
Packit 991819
		/* store; then read and compare next character */
Packit 991819
		goto heredoc_store_and_loop;
Packit 991819
	/* nope, mismatch; read until end of line */
Packit 991819
	while (c != '\n') {
Packit 991819
		if (!c)
Packit 991819
			/* oops, reached EOF */
Packit 991819
			yyerror(Tf_heredoc, eof);
Packit 991819
		/* store character */
Packit 991819
		Xcheck(xs, xp);
Packit 991819
		Xput(xs, xp, c);
Packit 991819
		/* read next character */
Packit 991819
		c = getsc();
Packit 991819
	}
Packit 991819
	/* we read a newline as last character */
Packit 991819
 heredoc_store_and_loop:
Packit 991819
	/* store character */
Packit 991819
	Xcheck(xs, xp);
Packit 991819
	Xput(xs, xp, c);
Packit 991819
	if (c == '\n')
Packit 991819
		goto heredoc_read_line;
Packit 991819
	goto heredoc_read_char;
Packit 991819
Packit 991819
 heredoc_found_terminator:
Packit 991819
	/* jump back to saved beginning of line */
Packit 991819
	xp = Xrestpos(xs, xp, xpos);
Packit 991819
	/* terminate, close and store */
Packit 991819
	Xput(xs, xp, '\0');
Packit 991819
	iop->heredoc = Xclose(xs, xp);
Packit 991819
Packit 991819
	if (!(iop->ioflag & IOEVAL))
Packit 991819
		ignore_backslash_newline--;
Packit 991819
}
Packit 991819
Packit 991819
void
Packit 991819
yyerror(const char *fmt, ...)
Packit 991819
{
Packit 991819
	va_list va;
Packit 991819
Packit 991819
	/* pop aliases and re-reads */
Packit 991819
	while (source->type == SALIAS || source->type == SREREAD)
Packit 991819
		source = source->next;
Packit 991819
	/* zap pending input */
Packit 991819
	source->str = null;
Packit 991819
Packit 991819
	error_prefix(true);
Packit 991819
	va_start(va, fmt);
Packit 991819
	shf_vfprintf(shl_out, fmt, va);
Packit 991819
	shf_putc('\n', shl_out);
Packit 991819
	va_end(va);
Packit 991819
	errorfz();
Packit 991819
}
Packit 991819
Packit 991819
/*
Packit 991819
 * input for yylex with alias expansion
Packit 991819
 */
Packit 991819
Packit 991819
Source *
Packit 991819
pushs(int type, Area *areap)
Packit 991819
{
Packit 991819
	Source *s;
Packit 991819
Packit 991819
	s = alloc(sizeof(Source), areap);
Packit 991819
	memset(s, 0, sizeof(Source));
Packit 991819
	s->type = type;
Packit 991819
	s->str = null;
Packit 991819
	s->areap = areap;
Packit 991819
	if (type == SFILE || type == SSTDIN)
Packit 991819
		XinitN(s->xs, 256, s->areap);
Packit 991819
	return (s);
Packit 991819
}
Packit 991819
Packit 991819
static int
Packit 991819
getsc_uu(void)
Packit 991819
{
Packit 991819
	Source *s = source;
Packit 991819
	int c;
Packit 991819
Packit 991819
	while ((c = ord(*s->str++)) == 0) {
Packit 991819
		/* return 0 for EOF by default */
Packit 991819
		s->str = NULL;
Packit 991819
		switch (s->type) {
Packit 991819
		case SEOF:
Packit 991819
			s->str = null;
Packit 991819
			return (0);
Packit 991819
Packit 991819
		case SSTDIN:
Packit 991819
		case SFILE:
Packit 991819
			getsc_line(s);
Packit 991819
			break;
Packit 991819
Packit 991819
		case SWSTR:
Packit 991819
			break;
Packit 991819
Packit 991819
		case SSTRING:
Packit 991819
		case SSTRINGCMDLINE:
Packit 991819
			break;
Packit 991819
Packit 991819
		case SWORDS:
Packit 991819
			s->start = s->str = *s->u.strv++;
Packit 991819
			s->type = SWORDSEP;
Packit 991819
			break;
Packit 991819
Packit 991819
		case SWORDSEP:
Packit 991819
			if (*s->u.strv == NULL) {
Packit 991819
				s->start = s->str = "\n";
Packit 991819
				s->type = SEOF;
Packit 991819
			} else {
Packit 991819
				s->start = s->str = T1space;
Packit 991819
				s->type = SWORDS;
Packit 991819
			}
Packit 991819
			break;
Packit 991819
Packit 991819
		case SALIAS:
Packit 991819
			if (s->flags & SF_ALIASEND) {
Packit 991819
				/* pass on an unused SF_ALIAS flag */
Packit 991819
				source = s->next;
Packit 991819
				source->flags |= s->flags & SF_ALIAS;
Packit 991819
				s = source;
Packit 991819
			} else if (*s->u.tblp->val.s &&
Packit 991819
			    ctype((c = strnul(s->u.tblp->val.s)[-1]), C_SPACE)) {
Packit 991819
				/* pop source stack */
Packit 991819
				source = s = s->next;
Packit 991819
				/*
Packit 991819
				 * Note that this alias ended with a
Packit 991819
				 * space, enabling alias expansion on
Packit 991819
				 * the following word.
Packit 991819
				 */
Packit 991819
				s->flags |= SF_ALIAS;
Packit 991819
			} else {
Packit 991819
				/*
Packit 991819
				 * At this point, we need to keep the current
Packit 991819
				 * alias in the source list so recursive
Packit 991819
				 * aliases can be detected and we also need to
Packit 991819
				 * return the next character. Do this by
Packit 991819
				 * temporarily popping the alias to get the
Packit 991819
				 * next character and then put it back in the
Packit 991819
				 * source list with the SF_ALIASEND flag set.
Packit 991819
				 */
Packit 991819
				/* pop source stack */
Packit 991819
				source = s->next;
Packit 991819
				source->flags |= s->flags & SF_ALIAS;
Packit 991819
				c = getsc_uu();
Packit 991819
				if (c) {
Packit 991819
					s->flags |= SF_ALIASEND;
Packit 991819
					s->ugbuf[0] = c; s->ugbuf[1] = '\0';
Packit 991819
					s->start = s->str = s->ugbuf;
Packit 991819
					s->next = source;
Packit 991819
					source = s;
Packit 991819
				} else {
Packit 991819
					s = source;
Packit 991819
					/* avoid reading EOF twice */
Packit 991819
					s->str = NULL;
Packit 991819
					break;
Packit 991819
				}
Packit 991819
			}
Packit 991819
			continue;
Packit 991819
Packit 991819
		case SREREAD:
Packit 991819
			if (s->start != s->ugbuf)
Packit 991819
				/* yuck */
Packit 991819
				afree(s->u.freeme, ATEMP);
Packit 991819
			source = s = s->next;
Packit 991819
			continue;
Packit 991819
		}
Packit 991819
		if (s->str == NULL) {
Packit 991819
			s->type = SEOF;
Packit 991819
			s->start = s->str = null;
Packit 991819
			return ('\0');
Packit 991819
		}
Packit 991819
		if (s->flags & SF_ECHO) {
Packit 991819
			shf_puts(s->str, shl_out);
Packit 991819
			shf_flush(shl_out);
Packit 991819
		}
Packit 991819
	}
Packit 991819
	return (c);
Packit 991819
}
Packit 991819
Packit 991819
static void
Packit 991819
getsc_line(Source *s)
Packit 991819
{
Packit 991819
	char *xp = Xstring(s->xs, xp), *cp;
Packit 991819
	bool interactive = Flag(FTALKING) && s->type == SSTDIN;
Packit 991819
	bool have_tty = tobool(interactive && (s->flags & SF_TTY));
Packit 991819
Packit 991819
	/* Done here to ensure nothing odd happens when a timeout occurs */
Packit 991819
	XcheckN(s->xs, xp, LINE);
Packit 991819
	*xp = '\0';
Packit 991819
	s->start = s->str = xp;
Packit 991819
Packit 991819
	if (have_tty && ksh_tmout) {
Packit 991819
		ksh_tmout_state = TMOUT_READING;
Packit 991819
		alarm(ksh_tmout);
Packit 991819
	}
Packit 991819
	if (interactive) {
Packit 991819
		if (cur_prompt == PS1)
Packit 991819
			histsave(&s->line, NULL, HIST_FLUSH, true);
Packit 991819
		change_winsz();
Packit 991819
	}
Packit 991819
#ifndef MKSH_NO_CMDLINE_EDITING
Packit 991819
	if (have_tty && (
Packit 991819
#if !MKSH_S_NOVI
Packit 991819
	    Flag(FVI) ||
Packit 991819
#endif
Packit 991819
	    Flag(FEMACS) || Flag(FGMACS))) {
Packit 991819
		int nread;
Packit 991819
Packit 991819
		nread = x_read(xp);
Packit 991819
		if (nread < 0)
Packit 991819
			/* read error */
Packit 991819
			nread = 0;
Packit 991819
		xp[nread] = '\0';
Packit 991819
		xp += nread;
Packit 991819
	} else
Packit 991819
#endif
Packit 991819
	  {
Packit 991819
		if (interactive)
Packit 991819
			pprompt(prompt, 0);
Packit 991819
		else
Packit 991819
			s->line++;
Packit 991819
Packit 991819
		while (/* CONSTCOND */ 1) {
Packit 991819
			char *p = shf_getse(xp, Xnleft(s->xs, xp), s->u.shf);
Packit 991819
Packit 991819
			if (!p && shf_error(s->u.shf) &&
Packit 991819
			    shf_errno(s->u.shf) == EINTR) {
Packit 991819
				shf_clearerr(s->u.shf);
Packit 991819
				if (trap)
Packit 991819
					runtraps(0);
Packit 991819
				continue;
Packit 991819
			}
Packit 991819
			if (!p || (xp = p, xp[-1] == '\n'))
Packit 991819
				break;
Packit 991819
			/* double buffer size */
Packit 991819
			/* move past NUL so doubling works... */
Packit 991819
			xp++;
Packit 991819
			XcheckN(s->xs, xp, Xlength(s->xs, xp));
Packit 991819
			/* ...and move back again */
Packit 991819
			xp--;
Packit 991819
		}
Packit 991819
		/*
Packit 991819
		 * flush any unwanted input so other programs/builtins
Packit 991819
		 * can read it. Not very optimal, but less error prone
Packit 991819
		 * than flushing else where, dealing with redirections,
Packit 991819
		 * etc.
Packit 991819
		 * TODO: reduce size of shf buffer (~128?) if SSTDIN
Packit 991819
		 */
Packit 991819
		if (s->type == SSTDIN)
Packit 991819
			shf_flush(s->u.shf);
Packit 991819
	}
Packit 991819
	/*
Packit 991819
	 * XXX: temporary kludge to restore source after a
Packit 991819
	 * trap may have been executed.
Packit 991819
	 */
Packit 991819
	source = s;
Packit 991819
	if (have_tty && ksh_tmout) {
Packit 991819
		ksh_tmout_state = TMOUT_EXECUTING;
Packit 991819
		alarm(0);
Packit 991819
	}
Packit 991819
	cp = Xstring(s->xs, xp);
Packit 991819
	rndpush(cp);
Packit 991819
	s->start = s->str = cp;
Packit 991819
	strip_nuls(Xstring(s->xs, xp), Xlength(s->xs, xp));
Packit 991819
	/* Note: if input is all nulls, this is not eof */
Packit 991819
	if (Xlength(s->xs, xp) == 0) {
Packit 991819
		/* EOF */
Packit 991819
		if (s->type == SFILE)
Packit 991819
			shf_fdclose(s->u.shf);
Packit 991819
		s->str = NULL;
Packit 991819
	} else if (interactive && *s->str) {
Packit 991819
		if (cur_prompt != PS1)
Packit 991819
			histsave(&s->line, s->str, HIST_APPEND, true);
Packit 991819
		else if (!ctype(*s->str, C_IFS | C_IFSWS))
Packit 991819
			histsave(&s->line, s->str, HIST_QUEUE, true);
Packit 991819
#if !defined(MKSH_SMALL) && HAVE_PERSISTENT_HISTORY
Packit 991819
		else
Packit 991819
			goto check_for_sole_return;
Packit 991819
	} else if (interactive && cur_prompt == PS1) {
Packit 991819
 check_for_sole_return:
Packit 991819
		cp = Xstring(s->xs, xp);
Packit 991819
		while (ctype(*cp, C_IFSWS))
Packit 991819
			++cp;
Packit 991819
		if (!*cp) {
Packit 991819
			histsave(&s->line, NULL, HIST_FLUSH, true);
Packit 991819
			histsync();
Packit 991819
		}
Packit 991819
#endif
Packit 991819
	}
Packit 991819
	if (interactive)
Packit 991819
		set_prompt(PS2, NULL);
Packit 991819
}
Packit 991819
Packit 991819
void
Packit 991819
set_prompt(int to, Source *s)
Packit 991819
{
Packit 991819
	cur_prompt = (uint8_t)to;
Packit 991819
Packit 991819
	switch (to) {
Packit 991819
	/* command */
Packit 991819
	case PS1:
Packit 991819
		/*
Packit 991819
		 * Substitute ! and !! here, before substitutions are done
Packit 991819
		 * so ! in expanded variables are not expanded.
Packit 991819
		 * NOTE: this is not what AT&T ksh does (it does it after
Packit 991819
		 * substitutions, POSIX doesn't say which is to be done.
Packit 991819
		 */
Packit 991819
		{
Packit 991819
			struct shf *shf;
Packit 991819
			char * volatile ps1;
Packit 991819
			Area *saved_atemp;
Packit 991819
			int saved_lineno;
Packit 991819
Packit 991819
			ps1 = str_val(global("PS1"));
Packit 991819
			shf = shf_sopen(NULL, strlen(ps1) * 2,
Packit 991819
			    SHF_WR | SHF_DYNAMIC, NULL);
Packit 991819
			while (*ps1)
Packit 991819
				if (*ps1 != '!' || *++ps1 == '!')
Packit 991819
					shf_putchar(*ps1++, shf);
Packit 991819
				else
Packit 991819
					shf_fprintf(shf, Tf_lu, s ?
Packit 991819
					    (unsigned long)s->line + 1 : 0UL);
Packit 991819
			ps1 = shf_sclose(shf);
Packit 991819
			saved_lineno = current_lineno;
Packit 991819
			if (s)
Packit 991819
				current_lineno = s->line + 1;
Packit 991819
			saved_atemp = ATEMP;
Packit 991819
			newenv(E_ERRH);
Packit 991819
			if (kshsetjmp(e->jbuf)) {
Packit 991819
				prompt = safe_prompt;
Packit 991819
				/*
Packit 991819
				 * Don't print an error - assume it has already
Packit 991819
				 * been printed. Reason is we may have forked
Packit 991819
				 * to run a command and the child may be
Packit 991819
				 * unwinding its stack through this code as it
Packit 991819
				 * exits.
Packit 991819
				 */
Packit 991819
			} else {
Packit 991819
				char *cp = substitute(ps1, 0);
Packit 991819
				strdupx(prompt, cp, saved_atemp);
Packit 991819
			}
Packit 991819
			current_lineno = saved_lineno;
Packit 991819
			quitenv(NULL);
Packit 991819
		}
Packit 991819
		break;
Packit 991819
	/* command continuation */
Packit 991819
	case PS2:
Packit 991819
		prompt = str_val(global("PS2"));
Packit 991819
		break;
Packit 991819
	}
Packit 991819
}
Packit 991819
Packit 991819
int
Packit 991819
pprompt(const char *cp, int ntruncate)
Packit 991819
{
Packit 991819
	char delimiter = 0;
Packit 991819
	bool doprint = (ntruncate != -1);
Packit 991819
	bool indelimit = false;
Packit 991819
	int columns = 0, lines = 0;
Packit 991819
Packit 991819
	/*
Packit 991819
	 * Undocumented AT&T ksh feature:
Packit 991819
	 * If the second char in the prompt string is \r then the first
Packit 991819
	 * char is taken to be a non-printing delimiter and any chars
Packit 991819
	 * between two instances of the delimiter are not considered to
Packit 991819
	 * be part of the prompt length
Packit 991819
	 */
Packit 991819
	if (*cp && cp[1] == '\r') {
Packit 991819
		delimiter = *cp;
Packit 991819
		cp += 2;
Packit 991819
	}
Packit 991819
	for (; *cp; cp++) {
Packit 991819
		if (indelimit && *cp != delimiter)
Packit 991819
			;
Packit 991819
		else if (ctype(*cp, C_CR | C_LF)) {
Packit 991819
			lines += columns / x_cols + ((*cp == '\n') ? 1 : 0);
Packit 991819
			columns = 0;
Packit 991819
		} else if (*cp == '\t') {
Packit 991819
			columns = (columns | 7) + 1;
Packit 991819
		} else if (*cp == '\b') {
Packit 991819
			if (columns > 0)
Packit 991819
				columns--;
Packit 991819
		} else if (*cp == delimiter)
Packit 991819
			indelimit = !indelimit;
Packit 991819
		else if (UTFMODE && (rtt2asc(*cp) > 0x7F)) {
Packit 991819
			const char *cp2;
Packit 991819
			columns += utf_widthadj(cp, &cp2);
Packit 991819
			if (doprint && (indelimit ||
Packit 991819
			    (ntruncate < (x_cols * lines + columns))))
Packit 991819
				shf_write(cp, cp2 - cp, shl_out);
Packit 991819
			cp = cp2 - /* loop increment */ 1;
Packit 991819
			continue;
Packit 991819
		} else
Packit 991819
			columns++;
Packit 991819
		if (doprint && (*cp != delimiter) &&
Packit 991819
		    (indelimit || (ntruncate < (x_cols * lines + columns))))
Packit 991819
			shf_putc(*cp, shl_out);
Packit 991819
	}
Packit 991819
	if (doprint)
Packit 991819
		shf_flush(shl_out);
Packit 991819
	return (x_cols * lines + columns);
Packit 991819
}
Packit 991819
Packit 991819
/*
Packit 991819
 * Read the variable part of a ${...} expression (i.e. up to but not
Packit 991819
 * including the :[-+?=#%] or close-brace).
Packit 991819
 */
Packit 991819
static char *
Packit 991819
get_brace_var(XString *wsp, char *wp)
Packit 991819
{
Packit 991819
	char c;
Packit 991819
	enum parse_state {
Packit 991819
		PS_INITIAL, PS_SAW_PERCENT, PS_SAW_HASH, PS_SAW_BANG,
Packit 991819
		PS_IDENT, PS_NUMBER, PS_VAR1
Packit 991819
	} state = PS_INITIAL;
Packit 991819
Packit 991819
	while (/* CONSTCOND */ 1) {
Packit 991819
		c = getsc();
Packit 991819
		/* State machine to figure out where the variable part ends. */
Packit 991819
		switch (state) {
Packit 991819
		case PS_SAW_HASH:
Packit 991819
			if (ctype(c, C_VAR1)) {
Packit 991819
				char c2;
Packit 991819
Packit 991819
				c2 = getsc();
Packit 991819
				ungetsc(c2);
Packit 991819
				if (ord(c2) != ORD(/*{*/ '}')) {
Packit 991819
					ungetsc(c);
Packit 991819
					goto out;
Packit 991819
				}
Packit 991819
			}
Packit 991819
			goto ps_common;
Packit 991819
		case PS_SAW_BANG:
Packit 991819
			switch (ord(c)) {
Packit 991819
			case ORD('@'):
Packit 991819
			case ORD('#'):
Packit 991819
			case ORD('-'):
Packit 991819
			case ORD('?'):
Packit 991819
				goto out;
Packit 991819
			}
Packit 991819
			goto ps_common;
Packit 991819
		case PS_INITIAL:
Packit 991819
			switch (ord(c)) {
Packit 991819
			case ORD('%'):
Packit 991819
				state = PS_SAW_PERCENT;
Packit 991819
				goto next;
Packit 991819
			case ORD('#'):
Packit 991819
				state = PS_SAW_HASH;
Packit 991819
				goto next;
Packit 991819
			case ORD('!'):
Packit 991819
				state = PS_SAW_BANG;
Packit 991819
				goto next;
Packit 991819
			}
Packit 991819
			/* FALLTHROUGH */
Packit 991819
		case PS_SAW_PERCENT:
Packit 991819
 ps_common:
Packit 991819
			if (ctype(c, C_ALPHX))
Packit 991819
				state = PS_IDENT;
Packit 991819
			else if (ctype(c, C_DIGIT))
Packit 991819
				state = PS_NUMBER;
Packit 991819
			else if (ctype(c, C_VAR1))
Packit 991819
				state = PS_VAR1;
Packit 991819
			else
Packit 991819
				goto out;
Packit 991819
			break;
Packit 991819
		case PS_IDENT:
Packit 991819
			if (!ctype(c, C_ALNUX)) {
Packit 991819
				if (ord(c) == ORD('[')) {
Packit 991819
					char *tmp, *p;
Packit 991819
Packit 991819
					if (!arraysub(&tmp))
Packit 991819
						yyerror("missing ]");
Packit 991819
					*wp++ = c;
Packit 991819
					p = tmp;
Packit 991819
					while (*p) {
Packit 991819
						Xcheck(*wsp, wp);
Packit 991819
						*wp++ = *p++;
Packit 991819
					}
Packit 991819
					afree(tmp, ATEMP);
Packit 991819
					/* the ] */
Packit 991819
					c = getsc();
Packit 991819
				}
Packit 991819
				goto out;
Packit 991819
			}
Packit 991819
 next:
Packit 991819
			break;
Packit 991819
		case PS_NUMBER:
Packit 991819
			if (!ctype(c, C_DIGIT))
Packit 991819
				goto out;
Packit 991819
			break;
Packit 991819
		case PS_VAR1:
Packit 991819
			goto out;
Packit 991819
		}
Packit 991819
		Xcheck(*wsp, wp);
Packit 991819
		*wp++ = c;
Packit 991819
	}
Packit 991819
 out:
Packit 991819
	/* end of variable part */
Packit 991819
	*wp++ = '\0';
Packit 991819
	ungetsc(c);
Packit 991819
	return (wp);
Packit 991819
}
Packit 991819
Packit 991819
/*
Packit 991819
 * Save an array subscript - returns true if matching bracket found, false
Packit 991819
 * if eof or newline was found.
Packit 991819
 * (Returned string double null terminated)
Packit 991819
 */
Packit 991819
static bool
Packit 991819
arraysub(char **strp)
Packit 991819
{
Packit 991819
	XString ws;
Packit 991819
	char *wp, c;
Packit 991819
	/* we are just past the initial [ */
Packit 991819
	unsigned int depth = 1;
Packit 991819
Packit 991819
	Xinit(ws, wp, 32, ATEMP);
Packit 991819
Packit 991819
	do {
Packit 991819
		c = getsc();
Packit 991819
		Xcheck(ws, wp);
Packit 991819
		*wp++ = c;
Packit 991819
		if (ord(c) == ORD('['))
Packit 991819
			depth++;
Packit 991819
		else if (ord(c) == ORD(']'))
Packit 991819
			depth--;
Packit 991819
	} while (depth > 0 && c && c != '\n');
Packit 991819
Packit 991819
	*wp++ = '\0';
Packit 991819
	*strp = Xclose(ws, wp);
Packit 991819
Packit 991819
	return (tobool(depth == 0));
Packit 991819
}
Packit 991819
Packit 991819
/* Unget a char: handles case when we are already at the start of the buffer */
Packit 991819
static void
Packit 991819
ungetsc(int c)
Packit 991819
{
Packit 991819
	struct sretrace_info *rp = retrace_info;
Packit 991819
Packit 991819
	if (backslash_skip)
Packit 991819
		backslash_skip--;
Packit 991819
	/* Don't unget EOF... */
Packit 991819
	if (source->str == null && c == '\0')
Packit 991819
		return;
Packit 991819
	while (rp) {
Packit 991819
		if (Xlength(rp->xs, rp->xp))
Packit 991819
			rp->xp--;
Packit 991819
		rp = rp->next;
Packit 991819
	}
Packit 991819
	ungetsc_i(c);
Packit 991819
}
Packit 991819
static void
Packit 991819
ungetsc_i(int c)
Packit 991819
{
Packit 991819
	if (source->str > source->start)
Packit 991819
		source->str--;
Packit 991819
	else {
Packit 991819
		Source *s;
Packit 991819
Packit 991819
		s = pushs(SREREAD, source->areap);
Packit 991819
		s->ugbuf[0] = c; s->ugbuf[1] = '\0';
Packit 991819
		s->start = s->str = s->ugbuf;
Packit 991819
		s->next = source;
Packit 991819
		source = s;
Packit 991819
	}
Packit 991819
}
Packit 991819
Packit 991819
Packit 991819
/* Called to get a char that isn't a \newline sequence. */
Packit 991819
static int
Packit 991819
getsc_bn(void)
Packit 991819
{
Packit 991819
	int c, c2;
Packit 991819
Packit 991819
	if (ignore_backslash_newline)
Packit 991819
		return (o_getsc_u());
Packit 991819
Packit 991819
	if (backslash_skip == 1) {
Packit 991819
		backslash_skip = 2;
Packit 991819
		return (o_getsc_u());
Packit 991819
	}
Packit 991819
Packit 991819
	backslash_skip = 0;
Packit 991819
Packit 991819
	while (/* CONSTCOND */ 1) {
Packit 991819
		c = o_getsc_u();
Packit 991819
		if (c == '\\') {
Packit 991819
			if ((c2 = o_getsc_u()) == '\n')
Packit 991819
				/* ignore the \newline; get the next char... */
Packit 991819
				continue;
Packit 991819
			ungetsc_i(c2);
Packit 991819
			backslash_skip = 1;
Packit 991819
		}
Packit 991819
		return (c);
Packit 991819
	}
Packit 991819
}
Packit 991819
Packit 991819
void
Packit 991819
yyskiputf8bom(void)
Packit 991819
{
Packit 991819
	int c;
Packit 991819
Packit 991819
	if (rtt2asc((c = o_getsc_u())) != 0xEF) {
Packit 991819
		ungetsc_i(c);
Packit 991819
		return;
Packit 991819
	}
Packit 991819
	if (rtt2asc((c = o_getsc_u())) != 0xBB) {
Packit 991819
		ungetsc_i(c);
Packit 991819
		ungetsc_i(asc2rtt(0xEF));
Packit 991819
		return;
Packit 991819
	}
Packit 991819
	if (rtt2asc((c = o_getsc_u())) != 0xBF) {
Packit 991819
		ungetsc_i(c);
Packit 991819
		ungetsc_i(asc2rtt(0xBB));
Packit 991819
		ungetsc_i(asc2rtt(0xEF));
Packit 991819
		return;
Packit 991819
	}
Packit 991819
	UTFMODE |= 8;
Packit 991819
}
Packit 991819
Packit 991819
static Lex_state *
Packit 991819
push_state_i(State_info *si, Lex_state *old_end)
Packit 991819
{
Packit 991819
	Lex_state *news = alloc2(STATE_BSIZE, sizeof(Lex_state), ATEMP);
Packit 991819
Packit 991819
	news[0].ls_base = old_end;
Packit 991819
	si->base = &news[0];
Packit 991819
	si->end = &news[STATE_BSIZE];
Packit 991819
	return (&news[1]);
Packit 991819
}
Packit 991819
Packit 991819
static Lex_state *
Packit 991819
pop_state_i(State_info *si, Lex_state *old_end)
Packit 991819
{
Packit 991819
	Lex_state *old_base = si->base;
Packit 991819
Packit 991819
	si->base = old_end->ls_base - STATE_BSIZE;
Packit 991819
	si->end = old_end->ls_base;
Packit 991819
Packit 991819
	afree(old_base, ATEMP);
Packit 991819
Packit 991819
	return (si->base + STATE_BSIZE - 1);
Packit 991819
}