Home | History | Annotate | Line # | Download | only in sh
parser.h revision 1.30
      1  1.30       kre /*	$NetBSD: parser.h,v 1.30 2024/10/21 15:57:45 kre Exp $	*/
      2   1.9       cgd 
      3   1.1       cgd /*-
      4   1.5       jtc  * Copyright (c) 1991, 1993
      5   1.5       jtc  *	The Regents of the University of California.  All rights reserved.
      6   1.1       cgd  *
      7   1.1       cgd  * This code is derived from software contributed to Berkeley by
      8   1.1       cgd  * Kenneth Almquist.
      9   1.1       cgd  *
     10   1.1       cgd  * Redistribution and use in source and binary forms, with or without
     11   1.1       cgd  * modification, are permitted provided that the following conditions
     12   1.1       cgd  * are met:
     13   1.1       cgd  * 1. Redistributions of source code must retain the above copyright
     14   1.1       cgd  *    notice, this list of conditions and the following disclaimer.
     15   1.1       cgd  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.1       cgd  *    notice, this list of conditions and the following disclaimer in the
     17   1.1       cgd  *    documentation and/or other materials provided with the distribution.
     18  1.16       agc  * 3. Neither the name of the University nor the names of its contributors
     19   1.1       cgd  *    may be used to endorse or promote products derived from this software
     20   1.1       cgd  *    without specific prior written permission.
     21   1.1       cgd  *
     22   1.1       cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     23   1.1       cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     24   1.1       cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     25   1.1       cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     26   1.1       cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     27   1.1       cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     28   1.1       cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     29   1.1       cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     30   1.1       cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     31   1.1       cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     32   1.1       cgd  * SUCH DAMAGE.
     33   1.1       cgd  *
     34  1.10  christos  *	@(#)parser.h	8.3 (Berkeley) 5/4/95
     35   1.1       cgd  */
     36   1.1       cgd 
     37   1.1       cgd /* control characters in argument strings */
     38  1.15  christos #define CTL_FIRST '\201'	/* first 'special' character (same value as CTLESC) */
     39  1.15  christos #define CTLESC '\201'		/* escape next character */
     40  1.15  christos #define CTLVAR '\202'		/* variable defn */
     41   1.1       cgd #define CTLENDVAR '\203'	/* presumably ends a CTLVAR sequence -- confirm in parser.c */
     42   1.1       cgd #define CTLBACKQ '\204'	/* presumably a command substitution -- confirm in parser.c */
     43   1.1       cgd #define CTLQUOTE 01		/* ored with CTLBACKQ code if in quotes */
     44   1.5       jtc /*	CTLBACKQ | CTLQUOTE == '\205', so that value is taken although no macro names it */
     45  1.15  christos #define	CTLARI	'\206'		/* arithmetic expression */
     46   1.5       jtc #define	CTLENDARI '\207'	/* presumably ends a CTLARI expression -- confirm in parser.c */
     47  1.12   mycroft #define	CTLQUOTEMARK '\210'
     48  1.17       dsl #define	CTLQUOTEEND '\211'	/* only inside ${...} */
     49  1.24       kre #define	CTLNONL '\212'		/* The \n in a deleted \ \n sequence */
     50  1.22       kre 			/* pure coincidence that (CTLNONL & 0x7f) == '\n' */
     51  1.24       kre #define	CTLCNL	'\213'		/* A $'\n' - newline not counted */
     52  1.30       kre #define	CTLVARMOD '\214'	/* a modifier in a variable expansion */
     53  1.30       kre #define	CTL_LAST '\214'		/* last 'special' character (same value as CTLVARMOD) */
     54   1.1       cgd 
     55   1.1       cgd /* variable substitution byte (follows CTLVAR): low 4 bits are the type, the rest are flag bits */
     56  1.18  christos #define VSTYPE		0x0f	/* type of variable substitution */
     57  1.18  christos #define VSNUL		0x10	/* colon--treat the empty string as unset */
     58  1.18  christos #define VSLINENO	0x20	/* expansion of $LINENO, the line number
     59  1.18  christos 				   follows immediately */
     60  1.19  christos #define VSPATQ		0x40	/* ensure correct pattern quoting in ${x#pat} */
     61  1.18  christos #define VSQUOTE	 	0x80	/* inside double quotes--suppress splitting */
     62   1.1       cgd 
     63  1.30       kre /* values of VSTYPE field (nb: 0 reserved for "not determined yet"; 0xb-0xe unassigned here) */
     64   1.8  christos #define VSNORMAL	0x1		/* normal variable:  $var or ${var} */
     65   1.8  christos #define VSMINUS		0x2		/* ${var-text} */
     66   1.8  christos #define VSPLUS		0x3		/* ${var+text} */
     67   1.8  christos #define VSQUESTION	0x4		/* ${var?message} */
     68   1.8  christos #define VSASSIGN	0x5		/* ${var=text} */
     69   1.8  christos #define VSTRIMLEFT	0x6		/* ${var#pattern} */
     70   1.8  christos #define VSTRIMLEFTMAX	0x7		/* ${var##pattern} */
     71   1.8  christos #define VSTRIMRIGHT	0x8		/* ${var%pattern} */
     72   1.8  christos #define VSTRIMRIGHTMAX 	0x9		/* ${var%%pattern} */
     73   1.8  christos #define VSLENGTH	0xa		/* ${#var} */
     74  1.30       kre #define VSUNKNOWN	0xf		/* unknown modifier (all VSTYPE bits set) */
     75   1.1       cgd 
     76  1.23       kre union node *parsecmd(int);	/* returns NEOF at end of file */
     77  1.23       kre void fixredir(union node *, const char *, int);
     78  1.25       kre int goodname(const char *);
     79  1.26       kre int isassignment(const char *);
     80  1.23       kre const char *getprompt(void *);
     81  1.23       kre const char *expandstr(char *, int);
     82  1.29       kre const char *expandvar(char *, int);
     83  1.27       kre const char *expandenv(char *);
     84  1.23       kre 
     85  1.23       kre struct HereDoc;	/* incomplete types: this header only uses pointers to them */
     86  1.23       kre union node;
     87  1.23       kre struct nodelist;
     88  1.23       kre 
     89  1.23       kre struct parse_state {	/* one parser's state; fields are reached via the macros below */
     90  1.23       kre 	struct HereDoc *ps_heredoclist;	/* list of here documents to read */
     91  1.23       kre 	int ps_parsebackquote;		/* nonzero inside backquotes */
     92  1.23       kre 	int ps_doprompt;		/* if set, prompt the user */
     93  1.23       kre 	int ps_needprompt;		/* true if interactive at line start */
     94  1.23       kre 	int ps_lasttoken;		/* last token read */
     95  1.23       kre 	int ps_tokpushback;		/* last token pushed back */
     96  1.23       kre 	char *ps_wordtext;	/* text of last word returned by readtoken */
     97  1.26       kre 	int ps_checkkwd;		/* word expansion flags: CHKKWD, CHKNL, CHKALIAS (defined below) */
     98  1.23       kre 	struct nodelist *ps_backquotelist; /* list of cmdsubs to process */
     99  1.23       kre 	union node *ps_redirnode;	/* node for current redirect */
    100  1.28       kre 	struct HereDoc *ps_heredoc;	/* current heredoc << being parsed */
    101  1.23       kre 	int ps_quoteflag;		/* set if (part) of token was quoted */
    102  1.23       kre 	int ps_startlinno;		/* line # where last token started */
    103  1.23       kre 	int ps_funclinno;		/* line # of the current function */
    104  1.23       kre 	int ps_elided_nl;		/* count of \ \n pairs we have seen */
    105  1.23       kre };
    106  1.23       kre 
    107  1.23       kre /*
    108  1.23       kre  * The parser references the elements of struct parse_state quite
    109  1.23       kre  * frequently - they used to be simple globals, so one memory ref
    110  1.28       kre  * per access, adding an indirect through a global ptr would not be
    111  1.23       kre  * nice.   The following gross hack allows most of that cost to be
    112  1.23       kre  * avoided, by allowing the compiler to understand that the global
    113  1.23       kre  * pointer is in fact constant in any function, and so its value can
    114  1.23       kre  * be cached, rather than needing to be fetched every time in case
    115  1.23       kre  * some other called function has changed it.
    116  1.23       kre  *
    117  1.23       kre  * The rule to make this work is that any function that wants
    118  1.23       kre  * to alter the global must restore it before it returns (and thus
    119  1.23       kre  * must have an error trap handler).  That means that the struct
    120  1.23       kre  * used for the new parser state can be a local in that function's
    121  1.23       kre  * stack frame, it never needs to be malloc'd.
    122  1.23       kre  */
    123  1.23       kre 
    124  1.23       kre union parse_state_p {	/* two views of the same pointer */
    125  1.23       kre 	struct parse_state *const	c_current_parser;	/* const view, read via current_parser */
    126  1.23       kre 	struct parse_state *		v_current_parser;	/* writable view, for code that switches state and restores it */
    127  1.23       kre };
    128  1.23       kre 
    129  1.23       kre extern union parse_state_p psp;	/* defined elsewhere; its address doubles as NEOF */
    130  1.23       kre 
    131  1.23       kre #define	current_parser (psp.c_current_parser)	/* always the const member */
    132  1.23       kre 
    133  1.23       kre /*
    134  1.23       kre  * Perhaps one day emulate "static" by moving most of these definitions into
    135  1.23       kre  * parser.c ...  (only checkkwd & tokpushback are used outside parser.c,
    136  1.23       kre  * and only in init.c as a RESET activity)
    137  1.23       kre  */
    138  1.23       kre #define	tokpushback	(current_parser->ps_tokpushback)	/* also reset from init.c */
    139  1.23       kre #define	checkkwd	(current_parser->ps_checkkwd)	/* also reset from init.c */
    140  1.23       kre 
    141  1.23       kre #define	heredoclist	(current_parser->ps_heredoclist)	/* this one and the rest: parser.c only */
    142  1.23       kre #define	parsebackquote	(current_parser->ps_parsebackquote)
    143  1.23       kre #define	doprompt	(current_parser->ps_doprompt)
    144  1.23       kre #define	needprompt	(current_parser->ps_needprompt)
    145  1.23       kre #define	lasttoken	(current_parser->ps_lasttoken)
    146  1.23       kre #define	wordtext	(current_parser->ps_wordtext)
    147  1.23       kre #define	backquotelist	(current_parser->ps_backquotelist)
    148  1.23       kre #define	redirnode	(current_parser->ps_redirnode)
    149  1.23       kre #define	heredoc		(current_parser->ps_heredoc)
    150  1.23       kre #define	quoteflag	(current_parser->ps_quoteflag)
    151  1.23       kre #define	startlinno	(current_parser->ps_startlinno)
    152  1.23       kre #define	funclinno	(current_parser->ps_funclinno)
    153  1.23       kre #define	elided_nl	(current_parser->ps_elided_nl)
    154   1.1       cgd 
    155   1.1       cgd /*
    156  1.26       kre  * Values that can be set in checkkwd
    157  1.26       kre  */
    158  1.26       kre #define CHKKWD		0x01		/* turn word into keyword (if it is) */
    159  1.26       kre #define CHKNL		0x02		/* ignore leading \n's */
    160  1.26       kre #define CHKALIAS	0x04		/* lookup words as aliases and ... (separate bit, like the two above) */
    161  1.26       kre 
    162  1.26       kre /*
    163   1.1       cgd  * NEOF is returned by parsecmd when it encounters an end of file.  It
    164   1.1       cgd  * must be distinct from NULL, so we use the address of a variable that
    165   1.1       cgd  * happens to be handy.
    166   1.1       cgd  */
    167  1.23       kre #define NEOF ((union node *)&psp)	/* sentinel: psp is not a node, so only compare against it */
    168  1.22       kre 
    169  1.22       kre #ifdef DEBUG
    170  1.22       kre extern int parsing;	/* declared only when DEBUG is defined */
    171  1.22       kre #endif	/* DEBUG */
    172