/*	$NetBSD: parser.h,v 1.30 2024/10/21 15:57:45 kre Exp $	*/

/*-
 * Copyright (c) 1991, 1993
 *	The Regents of the University of California.  All rights reserved.
 *
 * This code is derived from software contributed to Berkeley by
 * Kenneth Almquist.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *	@(#)parser.h	8.3 (Berkeley) 5/4/95
 */

/*
 * Parser interface: the control characters and variable-substitution
 * codes embedded in argument strings, the parser entry points, and the
 * per-parse state block together with its accessor macros.
 */

#ifndef SH_PARSER_H
#define SH_PARSER_H

/*
 * Control characters in argument strings.
 *
 * The codes form one contiguous range, CTL_FIRST .. CTL_LAST; a new code
 * must be added inside that range and CTL_LAST updated to match.
 */
#define CTL_FIRST	'\201'	/* first 'special' character */
#define CTLESC		'\201'	/* escape next character */
#define CTLVAR		'\202'	/* variable defn */
#define CTLENDVAR	'\203'
#define CTLBACKQ	'\204'
#define CTLQUOTE	01	/* ored with CTLBACKQ code if in quotes */
				/* CTLBACKQ | CTLQUOTE == '\205' */
#define CTLARI		'\206'	/* arithmetic expression */
#define CTLENDARI	'\207'
#define CTLQUOTEMARK	'\210'
#define CTLQUOTEEND	'\211'	/* only inside ${...} */
#define CTLNONL		'\212'	/* The \n in a deleted \ \n sequence */
				/* pure coincidence that (CTLNONL & 0x7f) == '\n' */
#define CTLCNL		'\213'	/* A $'\n' - newline not counted */
#define CTLVARMOD	'\214'	/* a modifier in a variable expansion */
#define CTL_LAST	'\214'	/* last 'special' character */

/*
 * Variable substitution byte (follows CTLVAR).
 *
 * The low four bits (VSTYPE) hold one of the VS* type values listed
 * further down; the remaining bits are independent flags.
 */
#define VSTYPE		0x0f	/* type of variable substitution */
#define VSNUL		0x10	/* colon--treat the empty string as unset */
#define VSLINENO	0x20	/* expansion of $LINENO, the line number
				   follows immediately */
#define VSPATQ		0x40	/* ensure correct pattern quoting in ${x#pat} */
#define VSQUOTE		0x80	/* inside double quotes--suppress splitting */

/* values of VSTYPE field (nb: 0 reserved for "not determined yet") */
#define VSNORMAL	0x1	/* normal variable:  $var or ${var} */
#define VSMINUS		0x2	/* ${var-text} */
#define VSPLUS		0x3	/* ${var+text} */
#define VSQUESTION	0x4	/* ${var?message} */
#define VSASSIGN	0x5	/* ${var=text} */
#define VSTRIMLEFT	0x6	/* ${var#pattern} */
#define VSTRIMLEFTMAX	0x7	/* ${var##pattern} */
#define VSTRIMRIGHT	0x8	/* ${var%pattern} */
#define VSTRIMRIGHTMAX	0x9	/* ${var%%pattern} */
#define VSLENGTH	0xa	/* ${#var} */
#define VSUNKNOWN	0xf	/* unknown modifier */

/*
 * Incomplete types used below only through pointers.  They are declared
 * ahead of the prototypes so that every tag is introduced at file scope
 * before its first use, whatever order the prototypes appear in.
 */
struct HereDoc;
union node;
struct nodelist;

/*
 * Parser entry points.  parsecmd() returns NEOF (defined at the end of
 * this header) when it encounters an end of file.
 */
union node *parsecmd(int);
void fixredir(union node *, const char *, int);
int goodname(const char *);
int isassignment(const char *);
const char *getprompt(void *);
const char *expandstr(char *, int);
const char *expandvar(char *, int);
const char *expandenv(char *);

/*
 * Everything the parser needs to remember while parsing; reached through
 * the current_parser pointer and the accessor macros defined below.
 */
struct parse_state {
	struct HereDoc *ps_heredoclist;	/* list of here documents to read */
	int ps_parsebackquote;		/* nonzero inside backquotes */
	int ps_doprompt;		/* if set, prompt the user */
	int ps_needprompt;		/* true if interactive at line start */
	int ps_lasttoken;		/* last token read */
	int ps_tokpushback;		/* last token pushed back */
	char *ps_wordtext;	/* text of last word returned by readtoken */
	int ps_checkkwd;		/* word expansion flags, see below */
	struct nodelist *ps_backquotelist; /* list of cmdsubs to process */
	union node *ps_redirnode;	/* node for current redirect */
	struct HereDoc *ps_heredoc;	/* current heredoc << being parsed */
	int ps_quoteflag;		/* set if (part) of token was quoted */
	int ps_startlinno;		/* line # where last token started */
	int ps_funclinno;		/* line # of the current function */
	int ps_elided_nl;		/* count of \ \n pairs we have seen */
};

/*
 * The parser references the elements of struct parse_state quite
 * frequently - they used to be simple globals, so one memory ref
 * per access, adding an indirect through a global ptr would not be
 * nice.   The following gross hack allows most of that cost to be
 * avoided, by allowing the compiler to understand that the global
 * pointer is in fact constant in any function, and so its value can
 * be cached, rather than needing to be fetched every time in case
 * some other called function has changed it.
 *
 * The rule to make this work is that any function that wants
 * to alter the global must restore it before it returns (and thus
 * must have an error trap handler).  That means that the struct
 * used for the new parser state can be a local in that function's
 * stack frame, it never needs to be malloc'd.
 */

union parse_state_p {
	/* const-qualified view; this is what current_parser expands to */
	struct parse_state *const	c_current_parser;
	/*
	 * Writable view of the same pointer.
	 * NOTE(review): presumably the member assigned by the functions
	 * that switch (and then restore) the parser state - confirm
	 * against parser.c.
	 */
	struct parse_state *		v_current_parser;
};

extern union parse_state_p psp;

#define	current_parser	(psp.c_current_parser)

/*
 * Perhaps one day emulate "static" by moving most of these definitions into
 * parser.c ...  (only checkkwd & tokpushback are used outside parser.c,
 * and only in init.c as a RESET activity)
 */
#define	tokpushback	(current_parser->ps_tokpushback)
#define	checkkwd	(current_parser->ps_checkkwd)

#define	heredoclist	(current_parser->ps_heredoclist)
#define	parsebackquote	(current_parser->ps_parsebackquote)
#define	doprompt	(current_parser->ps_doprompt)
#define	needprompt	(current_parser->ps_needprompt)
#define	lasttoken	(current_parser->ps_lasttoken)
#define	wordtext	(current_parser->ps_wordtext)
#define	backquotelist	(current_parser->ps_backquotelist)
#define	redirnode	(current_parser->ps_redirnode)
#define	heredoc		(current_parser->ps_heredoc)
#define	quoteflag	(current_parser->ps_quoteflag)
#define	startlinno	(current_parser->ps_startlinno)
#define	funclinno	(current_parser->ps_funclinno)
#define	elided_nl	(current_parser->ps_elided_nl)

/*
 * Values that can be set in checkkwd
 */
#define CHKKWD		0x01	/* turn word into keyword (if it is) */
#define CHKNL		0x02	/* ignore leading \n's */
#define CHKALIAS	0x04	/* lookup words as aliases and ... */

/*
 * NEOF is returned by parsecmd when it encounters an end of file.  It
 * must be distinct from NULL, so we use the address of a variable that
 * happens to be handy.
 */
#define NEOF ((union node *)&psp)

#ifdef DEBUG
extern int parsing;
#endif

#endif /* SH_PARSER_H */