parser.h revision 1.23 1 1.23 kre /* $NetBSD: parser.h,v 1.23 2017/06/30 23:02:56 kre Exp $ */
2 1.9 cgd
3 1.1 cgd /*-
4 1.5 jtc * Copyright (c) 1991, 1993
5 1.5 jtc * The Regents of the University of California. All rights reserved.
6 1.1 cgd *
7 1.1 cgd * This code is derived from software contributed to Berkeley by
8 1.1 cgd * Kenneth Almquist.
9 1.1 cgd *
10 1.1 cgd * Redistribution and use in source and binary forms, with or without
11 1.1 cgd * modification, are permitted provided that the following conditions
12 1.1 cgd * are met:
13 1.1 cgd * 1. Redistributions of source code must retain the above copyright
14 1.1 cgd * notice, this list of conditions and the following disclaimer.
15 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 cgd * notice, this list of conditions and the following disclaimer in the
17 1.1 cgd * documentation and/or other materials provided with the distribution.
18 1.16 agc * 3. Neither the name of the University nor the names of its contributors
19 1.1 cgd * may be used to endorse or promote products derived from this software
20 1.1 cgd * without specific prior written permission.
21 1.1 cgd *
22 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 1.1 cgd * SUCH DAMAGE.
33 1.1 cgd *
34 1.10 christos * @(#)parser.h 8.3 (Berkeley) 5/4/95
35 1.1 cgd */
36 1.1 cgd
37 1.1 cgd /* control characters in argument strings; all values lie in CTL_FIRST..CTL_LAST */
38 1.15 christos #define CTL_FIRST '\201' /* first 'special' character (same value as CTLESC) */
39 1.15 christos #define CTLESC '\201' /* escape next character */
40 1.15 christos #define CTLVAR '\202' /* variable defn; the variable substitution byte follows it */
41 1.1 cgd #define CTLENDVAR '\203' /* NOTE(review): presumably ends a CTLVAR substitution -- confirm */
42 1.1 cgd #define CTLBACKQ '\204' /* NOTE(review): presumably a backquote command substitution -- confirm */
43 1.1 cgd #define CTLQUOTE 01 /* ored with CTLBACKQ code if in quotes */
44 1.5 jtc /* CTLBACKQ | CTLQUOTE == '\205' */
45 1.15 christos #define CTLARI '\206' /* arithmetic expression */
46 1.5 jtc #define CTLENDARI '\207' /* NOTE(review): presumably ends a CTLARI expression -- confirm */
47 1.12 mycroft #define CTLQUOTEMARK '\210' /* NOTE(review): meaning not shown in this header -- see the parser */
48 1.17 dsl #define CTLQUOTEEND '\211' /* only inside ${...} */
49 1.22 kre #define CTLNONL '\212' /* The \n in a deleted \ \n sequence */
50 1.22 kre /* pure coincidence that (CTLNONL & 0x7f) == '\n' */
51 1.22 kre #define CTL_LAST '\212' /* last 'special' character (same value as CTLNONL) */
52 1.1 cgd
53 1.1 cgd /* variable substitution byte (follows CTLVAR): low 4 bits select the type, the upper 4 bits are flags */
54 1.18 christos #define VSTYPE 0x0f /* mask for the type of variable substitution */
55 1.18 christos #define VSNUL 0x10 /* colon--treat the empty string as unset */
56 1.18 christos #define VSLINENO 0x20 /* expansion of $LINENO, the line number
57 1.18 christos follows immediately */
58 1.19 christos #define VSPATQ 0x40 /* ensure correct pattern quoting in ${x#pat} */
59 1.18 christos #define VSQUOTE 0x80 /* inside double quotes--suppress splitting */
60 1.1 cgd
61 1.1 cgd /* values of VSTYPE field (every value fits within the 0x0f VSTYPE mask) */
62 1.8 christos #define VSNORMAL 0x1 /* normal variable: $var or ${var} */
63 1.8 christos #define VSMINUS 0x2 /* ${var-text} */
64 1.8 christos #define VSPLUS 0x3 /* ${var+text} */
65 1.8 christos #define VSQUESTION 0x4 /* ${var?message} */
66 1.8 christos #define VSASSIGN 0x5 /* ${var=text} */
67 1.8 christos #define VSTRIMLEFT 0x6 /* ${var#pattern} */
68 1.8 christos #define VSTRIMLEFTMAX 0x7 /* ${var##pattern} */
69 1.8 christos #define VSTRIMRIGHT 0x8 /* ${var%pattern} */
70 1.8 christos #define VSTRIMRIGHTMAX 0x9 /* ${var%%pattern} */
71 1.8 christos #define VSLENGTH 0xa /* ${#var} */
72 1.1 cgd
73 1.23 kre union node *parsecmd(int); /* returns NEOF when it encounters an end of file */
74 1.23 kre void fixredir(union node *, const char *, int); /* NOTE(review): semantics live in the parser source, not visible here */
75 1.23 kre int goodname(char *); /* NOTE(review): presumably tests whether the string is a valid name -- confirm */
76 1.23 kre const char *getprompt(void *); /* takes an untyped pointer; result is a read-only string */
77 1.23 kre const char *expandstr(char *, int); /* result is a read-only string; NOTE(review): meaning of the int is not shown here */
78 1.23 kre
79 1.23 kre struct HereDoc; /* incomplete type: this header only uses pointers to it */
80 1.23 kre union node; /* incomplete type: this header only uses pointers to it */
81 1.23 kre struct nodelist; /* incomplete type: this header only uses pointers to it */
82 1.23 kre
83 1.23 kre struct parse_state { /* state of one parser; reached through current_parser by the accessor macros in this header */
84 1.23 kre int ps_noalias; /* when set, don't handle aliases */
85 1.23 kre struct HereDoc *ps_heredoclist; /* list of here documents to read */
86 1.23 kre int ps_parsebackquote; /* nonzero inside backquotes */
87 1.23 kre int ps_doprompt; /* if set, prompt the user */
88 1.23 kre int ps_needprompt; /* true if interactive at line start */
89 1.23 kre int ps_lasttoken; /* last token read */
90 1.23 kre int ps_tokpushback; /* last token pushed back */
91 1.23 kre char *ps_wordtext; /* text of last word returned by readtoken */
92 1.23 kre int ps_checkkwd; /* 1 == check for kwds, 2 += eat newlines */
93 1.23 kre struct nodelist *ps_backquotelist; /* list of cmdsubs to process */
94 1.23 kre union node *ps_redirnode; /* node for current redirect */
95 1.23 kre struct HereDoc *ps_heredoc; /* current heredoc << being parsed */
96 1.23 kre int ps_quoteflag; /* set if (part) of token was quoted */
97 1.23 kre int ps_startlinno; /* line # where last token started */
98 1.23 kre int ps_funclinno; /* line # of the current function */
99 1.23 kre int ps_elided_nl; /* count of \ \n pairs we have seen */
100 1.23 kre };
101 1.23 kre
102 1.23 kre /*
103 1.23 kre * The parser references the elements of struct parse_state quite
104 1.23 kre * frequently - they used to be simple globals, so one memory ref
105 1.23 kre * per access, adding an indirect through global ptr would not be
106 1.23 kre * nice. The following gross hack allows most of that cost to be
107 1.23 kre * avoided, by allowing the compiler to understand that the global
108 1.23 kre * pointer is in fact constant in any function, and so its value can
109 1.23 kre * be cached, rather than needing to be fetched every time in case
110 1.23 kre * some other called function has changed it.
111 1.23 kre *
112 1.23 kre * The rule to make this work is that any function that wants
113 1.23 kre * to alter the global must restore it before it returns (and thus
114 1.23 kre * must have an error trap handler). That means that the struct
115 1.23 kre * used for the new parser state can be a local in that function's
116 1.23 kre * stack frame, it never needs to be malloc'd.
117 1.23 kre */
118 1.23 kre
119 1.23 kre union parse_state_p { /* two views of a single pointer to the active struct parse_state */
120 1.23 kre struct parse_state *const c_current_parser; /* const-qualified view; this is what current_parser expands to */
121 1.23 kre struct parse_state * v_current_parser; /* writable view of the same pointer, for code that must change it */
122 1.23 kre };
123 1.23 kre
124 1.23 kre extern union parse_state_p psp; /* declaration only; the definition is not in this header */
125 1.23 kre
126 1.23 kre #define current_parser (psp.c_current_parser) /* the active parser state, seen through the const member */
127 1.23 kre
128 1.23 kre /*
129 1.23 kre * Perhaps one day emulate "static" by moving most of these definitions into
130 1.23 kre * parser.c ... (only checkkwd & tokpushback are used outside parser.c,
131 1.23 kre * and only in init.c as a RESET activity)
132 1.23 kre */
133 1.23 kre #define tokpushback (current_parser->ps_tokpushback) /* this one and checkkwd are the two also used outside parser.c */
134 1.23 kre #define checkkwd (current_parser->ps_checkkwd)
135 1.23 kre
136 1.23 kre #define noalias (current_parser->ps_noalias) /* each remaining macro names the like-named ps_ member of *current_parser */
137 1.23 kre #define heredoclist (current_parser->ps_heredoclist)
138 1.23 kre #define parsebackquote (current_parser->ps_parsebackquote)
139 1.23 kre #define doprompt (current_parser->ps_doprompt)
140 1.23 kre #define needprompt (current_parser->ps_needprompt)
141 1.23 kre #define lasttoken (current_parser->ps_lasttoken)
142 1.23 kre #define wordtext (current_parser->ps_wordtext)
143 1.23 kre #define backquotelist (current_parser->ps_backquotelist)
144 1.23 kre #define redirnode (current_parser->ps_redirnode)
145 1.23 kre #define heredoc (current_parser->ps_heredoc)
146 1.23 kre #define quoteflag (current_parser->ps_quoteflag)
147 1.23 kre #define startlinno (current_parser->ps_startlinno)
148 1.23 kre #define funclinno (current_parser->ps_funclinno)
149 1.23 kre #define elided_nl (current_parser->ps_elided_nl)
150 1.1 cgd
151 1.1 cgd /*
152 1.1 cgd * NEOF is returned by parsecmd when it encounters an end of file. It
153 1.1 cgd * must be distinct from NULL, so we use the address of a variable that
154 1.1 cgd * happens to be handy.
155 1.1 cgd */
156 1.23 kre #define NEOF ((union node *)&psp) /* psp is a union parse_state_p, not a union node: compare against NEOF, never dereference it */
157 1.22 kre
158 1.22 kre #ifdef DEBUG
159 1.22 kre extern int parsing; /* declared only when DEBUG is defined; NOTE(review): defined and used outside this header -- purpose not shown here */
160 1.22 kre #endif
161