parser.c revision 1.48 1 1.48 christos /* $NetBSD: parser.c,v 1.48 2001/11/02 23:49:14 christos Exp $ */
2 1.24 cgd
3 1.1 cgd /*-
4 1.11 jtc * Copyright (c) 1991, 1993
5 1.11 jtc * The Regents of the University of California. All rights reserved.
6 1.1 cgd *
7 1.1 cgd * This code is derived from software contributed to Berkeley by
8 1.1 cgd * Kenneth Almquist.
9 1.1 cgd *
10 1.1 cgd * Redistribution and use in source and binary forms, with or without
11 1.1 cgd * modification, are permitted provided that the following conditions
12 1.1 cgd * are met:
13 1.1 cgd * 1. Redistributions of source code must retain the above copyright
14 1.1 cgd * notice, this list of conditions and the following disclaimer.
15 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 cgd * notice, this list of conditions and the following disclaimer in the
17 1.1 cgd * documentation and/or other materials provided with the distribution.
18 1.1 cgd * 3. All advertising materials mentioning features or use of this software
19 1.1 cgd * must display the following acknowledgement:
20 1.1 cgd * This product includes software developed by the University of
21 1.1 cgd * California, Berkeley and its contributors.
22 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
23 1.1 cgd * may be used to endorse or promote products derived from this software
24 1.1 cgd * without specific prior written permission.
25 1.1 cgd *
26 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
27 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
28 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
29 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
30 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
31 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
32 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
33 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
34 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
35 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
36 1.1 cgd * SUCH DAMAGE.
37 1.1 cgd */
38 1.1 cgd
39 1.36 christos #include <sys/cdefs.h>
40 1.1 cgd #ifndef lint
41 1.24 cgd #if 0
42 1.26 christos static char sccsid[] = "@(#)parser.c 8.7 (Berkeley) 5/16/95";
43 1.24 cgd #else
44 1.48 christos __RCSID("$NetBSD: parser.c,v 1.48 2001/11/02 23:49:14 christos Exp $");
45 1.24 cgd #endif
46 1.1 cgd #endif /* not lint */
47 1.1 cgd
48 1.25 christos #include <stdlib.h>
49 1.25 christos
50 1.1 cgd #include "shell.h"
51 1.1 cgd #include "parser.h"
52 1.1 cgd #include "nodes.h"
53 1.1 cgd #include "expand.h" /* defines rmescapes() */
54 1.46 christos #include "eval.h" /* defines commandname */
55 1.1 cgd #include "redir.h" /* defines copyfd() */
56 1.1 cgd #include "syntax.h"
57 1.1 cgd #include "options.h"
58 1.1 cgd #include "input.h"
59 1.1 cgd #include "output.h"
60 1.1 cgd #include "var.h"
61 1.1 cgd #include "error.h"
62 1.1 cgd #include "memalloc.h"
63 1.1 cgd #include "mystring.h"
64 1.11 jtc #include "alias.h"
65 1.25 christos #include "show.h"
66 1.35 christos #ifndef SMALL
67 1.11 jtc #include "myhistedit.h"
68 1.14 cgd #endif
69 1.1 cgd
70 1.1 cgd /*
71 1.1 cgd * Shell command parser.
72 1.1 cgd */
73 1.1 cgd
74 1.1 cgd #define EOFMARKLEN 79
75 1.1 cgd
76 1.1 cgd /* values returned by readtoken */
77 1.30 christos #include "token.h"
78 1.1 cgd
79 1.1 cgd
80 1.1 cgd
/*
 * One here document that has been announced by a redirection but whose
 * body has not been read yet.  Entries are chained through `next' on
 * heredoclist until parseheredoc() consumes them.
 */
struct heredoc {
	struct heredoc *next;	/* following entry on the pending list */
	union node *here;	/* redirection node that receives the text */
	char *eofmark;		/* word that terminates the document */
	int striptabs;		/* nonzero: remove leading tabs */
};
87 1.1 cgd
88 1.1 cgd
89 1.1 cgd
90 1.48 christos static int noalias = 0; /* when set, don't handle aliases */
91 1.1 cgd struct heredoc *heredoclist; /* list of here documents to read */
92 1.1 cgd int parsebackquote; /* nonzero if we are inside backquotes */
93 1.1 cgd int doprompt; /* if set, prompt the user */
94 1.1 cgd int needprompt; /* true if interactive and at start of line */
95 1.1 cgd int lasttoken; /* last token read */
96 1.1 cgd MKINIT int tokpushback; /* last token pushed back */
97 1.1 cgd char *wordtext; /* text of last word returned by readtoken */
98 1.11 jtc MKINIT int checkkwd; /* 1 == check for kwds, 2 == also eat newlines */
99 1.1 cgd struct nodelist *backquotelist;
100 1.1 cgd union node *redirnode;
101 1.1 cgd struct heredoc *heredoc;
102 1.1 cgd int quoteflag; /* set if (part of) last token was quoted */
103 1.1 cgd int startlinno; /* line # where last token started */
104 1.1 cgd
105 1.1 cgd
106 1.1 cgd STATIC union node *list __P((int));
107 1.1 cgd STATIC union node *andor __P((void));
108 1.1 cgd STATIC union node *pipeline __P((void));
109 1.1 cgd STATIC union node *command __P((void));
110 1.5 sef STATIC union node *simplecmd __P((union node **, union node *));
111 1.18 jtc STATIC union node *makename __P((void));
112 1.1 cgd STATIC void parsefname __P((void));
113 1.1 cgd STATIC void parseheredoc __P((void));
114 1.25 christos STATIC int peektoken __P((void));
115 1.1 cgd STATIC int readtoken __P((void));
116 1.25 christos STATIC int xxreadtoken __P((void));
117 1.1 cgd STATIC int readtoken1 __P((int, char const *, char *, int));
118 1.1 cgd STATIC int noexpand __P((char *));
119 1.39 mycroft STATIC void synexpect __P((int)) __attribute__((noreturn));
120 1.43 christos STATIC void synerror __P((const char *)) __attribute__((noreturn));
121 1.30 christos STATIC void setprompt __P((int));
122 1.1 cgd
123 1.22 cgd
124 1.1 cgd /*
125 1.1 cgd * Read and parse a command. Returns NEOF on end of file. (NULL is a
126 1.1 cgd * valid parse tree indicating a blank line.)
127 1.1 cgd */
128 1.1 cgd
129 1.1 cgd union node *
130 1.45 cgd parsecmd(int interact)
131 1.22 cgd {
132 1.1 cgd int t;
133 1.1 cgd
134 1.47 christos tokpushback = 0;
135 1.1 cgd doprompt = interact;
136 1.1 cgd if (doprompt)
137 1.11 jtc setprompt(1);
138 1.11 jtc else
139 1.11 jtc setprompt(0);
140 1.1 cgd needprompt = 0;
141 1.11 jtc t = readtoken();
142 1.11 jtc if (t == TEOF)
143 1.1 cgd return NEOF;
144 1.1 cgd if (t == TNL)
145 1.1 cgd return NULL;
146 1.1 cgd tokpushback++;
147 1.1 cgd return list(1);
148 1.1 cgd }
149 1.1 cgd
150 1.1 cgd
151 1.1 cgd STATIC union node *
152 1.30 christos list(nlflag)
153 1.22 cgd int nlflag;
154 1.22 cgd {
155 1.1 cgd union node *n1, *n2, *n3;
156 1.12 jtc int tok;
157 1.1 cgd
158 1.1 cgd checkkwd = 2;
159 1.1 cgd if (nlflag == 0 && tokendlist[peektoken()])
160 1.1 cgd return NULL;
161 1.12 jtc n1 = NULL;
162 1.1 cgd for (;;) {
163 1.12 jtc n2 = andor();
164 1.12 jtc tok = readtoken();
165 1.12 jtc if (tok == TBACKGND) {
166 1.12 jtc if (n2->type == NCMD || n2->type == NPIPE) {
167 1.12 jtc n2->ncmd.backgnd = 1;
168 1.12 jtc } else if (n2->type == NREDIR) {
169 1.12 jtc n2->type = NBACKGND;
170 1.1 cgd } else {
171 1.1 cgd n3 = (union node *)stalloc(sizeof (struct nredir));
172 1.1 cgd n3->type = NBACKGND;
173 1.12 jtc n3->nredir.n = n2;
174 1.1 cgd n3->nredir.redirect = NULL;
175 1.12 jtc n2 = n3;
176 1.1 cgd }
177 1.12 jtc }
178 1.12 jtc if (n1 == NULL) {
179 1.12 jtc n1 = n2;
180 1.12 jtc }
181 1.12 jtc else {
182 1.12 jtc n3 = (union node *)stalloc(sizeof (struct nbinary));
183 1.12 jtc n3->type = NSEMI;
184 1.12 jtc n3->nbinary.ch1 = n1;
185 1.12 jtc n3->nbinary.ch2 = n2;
186 1.12 jtc n1 = n3;
187 1.12 jtc }
188 1.12 jtc switch (tok) {
189 1.12 jtc case TBACKGND:
190 1.12 jtc case TSEMI:
191 1.12 jtc tok = readtoken();
192 1.12 jtc /* fall through */
193 1.1 cgd case TNL:
194 1.12 jtc if (tok == TNL) {
195 1.1 cgd parseheredoc();
196 1.1 cgd if (nlflag)
197 1.1 cgd return n1;
198 1.1 cgd } else {
199 1.1 cgd tokpushback++;
200 1.1 cgd }
201 1.1 cgd checkkwd = 2;
202 1.1 cgd if (tokendlist[peektoken()])
203 1.1 cgd return n1;
204 1.1 cgd break;
205 1.1 cgd case TEOF:
206 1.1 cgd if (heredoclist)
207 1.1 cgd parseheredoc();
208 1.1 cgd else
209 1.1 cgd pungetc(); /* push back EOF on input */
210 1.1 cgd return n1;
211 1.1 cgd default:
212 1.1 cgd if (nlflag)
213 1.1 cgd synexpect(-1);
214 1.1 cgd tokpushback++;
215 1.1 cgd return n1;
216 1.1 cgd }
217 1.1 cgd }
218 1.1 cgd }
219 1.1 cgd
220 1.1 cgd
221 1.1 cgd
222 1.1 cgd STATIC union node *
223 1.1 cgd andor() {
224 1.1 cgd union node *n1, *n2, *n3;
225 1.1 cgd int t;
226 1.1 cgd
227 1.1 cgd n1 = pipeline();
228 1.1 cgd for (;;) {
229 1.1 cgd if ((t = readtoken()) == TAND) {
230 1.1 cgd t = NAND;
231 1.1 cgd } else if (t == TOR) {
232 1.1 cgd t = NOR;
233 1.1 cgd } else {
234 1.1 cgd tokpushback++;
235 1.1 cgd return n1;
236 1.1 cgd }
237 1.1 cgd n2 = pipeline();
238 1.1 cgd n3 = (union node *)stalloc(sizeof (struct nbinary));
239 1.1 cgd n3->type = t;
240 1.1 cgd n3->nbinary.ch1 = n1;
241 1.1 cgd n3->nbinary.ch2 = n2;
242 1.1 cgd n1 = n3;
243 1.1 cgd }
244 1.1 cgd }
245 1.1 cgd
246 1.1 cgd
247 1.1 cgd
248 1.1 cgd STATIC union node *
249 1.1 cgd pipeline() {
250 1.44 christos union node *n1, *n2, *pipenode;
251 1.1 cgd struct nodelist *lp, *prev;
252 1.44 christos int negate;
253 1.1 cgd
254 1.44 christos negate = 0;
255 1.11 jtc TRACE(("pipeline: entered\n"));
256 1.44 christos while (readtoken() == TNOT)
257 1.44 christos negate = !negate;
258 1.44 christos tokpushback++;
259 1.1 cgd n1 = command();
260 1.1 cgd if (readtoken() == TPIPE) {
261 1.1 cgd pipenode = (union node *)stalloc(sizeof (struct npipe));
262 1.1 cgd pipenode->type = NPIPE;
263 1.1 cgd pipenode->npipe.backgnd = 0;
264 1.1 cgd lp = (struct nodelist *)stalloc(sizeof (struct nodelist));
265 1.1 cgd pipenode->npipe.cmdlist = lp;
266 1.1 cgd lp->n = n1;
267 1.1 cgd do {
268 1.1 cgd prev = lp;
269 1.1 cgd lp = (struct nodelist *)stalloc(sizeof (struct nodelist));
270 1.1 cgd lp->n = command();
271 1.1 cgd prev->next = lp;
272 1.1 cgd } while (readtoken() == TPIPE);
273 1.1 cgd lp->next = NULL;
274 1.1 cgd n1 = pipenode;
275 1.1 cgd }
276 1.1 cgd tokpushback++;
277 1.44 christos if (negate) {
278 1.44 christos n2 = (union node *)stalloc(sizeof (struct nnot));
279 1.44 christos n2->type = NNOT;
280 1.44 christos n2->nnot.com = n1;
281 1.44 christos return n2;
282 1.44 christos } else
283 1.44 christos return n1;
284 1.1 cgd }
285 1.1 cgd
286 1.1 cgd
287 1.1 cgd
288 1.1 cgd STATIC union node *
289 1.1 cgd command() {
290 1.1 cgd union node *n1, *n2;
291 1.1 cgd union node *ap, **app;
292 1.1 cgd union node *cp, **cpp;
293 1.1 cgd union node *redir, **rpp;
294 1.31 christos int t, negate = 0;
295 1.1 cgd
296 1.1 cgd checkkwd = 2;
297 1.25 christos redir = NULL;
298 1.25 christos n1 = NULL;
299 1.5 sef rpp = &redir;
300 1.31 christos
301 1.5 sef /* Check for redirection which may precede command */
302 1.5 sef while (readtoken() == TREDIR) {
303 1.5 sef *rpp = n2 = redirnode;
304 1.5 sef rpp = &n2->nfile.next;
305 1.5 sef parsefname();
306 1.5 sef }
307 1.5 sef tokpushback++;
308 1.5 sef
309 1.31 christos while (readtoken() == TNOT) {
310 1.31 christos TRACE(("command: TNOT recognized\n"));
311 1.31 christos negate = !negate;
312 1.31 christos }
313 1.31 christos tokpushback++;
314 1.31 christos
315 1.1 cgd switch (readtoken()) {
316 1.1 cgd case TIF:
317 1.1 cgd n1 = (union node *)stalloc(sizeof (struct nif));
318 1.1 cgd n1->type = NIF;
319 1.1 cgd n1->nif.test = list(0);
320 1.1 cgd if (readtoken() != TTHEN)
321 1.1 cgd synexpect(TTHEN);
322 1.1 cgd n1->nif.ifpart = list(0);
323 1.1 cgd n2 = n1;
324 1.1 cgd while (readtoken() == TELIF) {
325 1.1 cgd n2->nif.elsepart = (union node *)stalloc(sizeof (struct nif));
326 1.1 cgd n2 = n2->nif.elsepart;
327 1.1 cgd n2->type = NIF;
328 1.1 cgd n2->nif.test = list(0);
329 1.1 cgd if (readtoken() != TTHEN)
330 1.1 cgd synexpect(TTHEN);
331 1.1 cgd n2->nif.ifpart = list(0);
332 1.1 cgd }
333 1.1 cgd if (lasttoken == TELSE)
334 1.1 cgd n2->nif.elsepart = list(0);
335 1.1 cgd else {
336 1.1 cgd n2->nif.elsepart = NULL;
337 1.1 cgd tokpushback++;
338 1.1 cgd }
339 1.1 cgd if (readtoken() != TFI)
340 1.1 cgd synexpect(TFI);
341 1.1 cgd checkkwd = 1;
342 1.1 cgd break;
343 1.1 cgd case TWHILE:
344 1.1 cgd case TUNTIL: {
345 1.1 cgd int got;
346 1.1 cgd n1 = (union node *)stalloc(sizeof (struct nbinary));
347 1.1 cgd n1->type = (lasttoken == TWHILE)? NWHILE : NUNTIL;
348 1.1 cgd n1->nbinary.ch1 = list(0);
349 1.1 cgd if ((got=readtoken()) != TDO) {
350 1.1 cgd TRACE(("expecting DO got %s %s\n", tokname[got], got == TWORD ? wordtext : ""));
351 1.1 cgd synexpect(TDO);
352 1.1 cgd }
353 1.1 cgd n1->nbinary.ch2 = list(0);
354 1.1 cgd if (readtoken() != TDONE)
355 1.1 cgd synexpect(TDONE);
356 1.1 cgd checkkwd = 1;
357 1.1 cgd break;
358 1.1 cgd }
359 1.1 cgd case TFOR:
360 1.1 cgd if (readtoken() != TWORD || quoteflag || ! goodname(wordtext))
361 1.1 cgd synerror("Bad for loop variable");
362 1.1 cgd n1 = (union node *)stalloc(sizeof (struct nfor));
363 1.1 cgd n1->type = NFOR;
364 1.1 cgd n1->nfor.var = wordtext;
365 1.1 cgd if (readtoken() == TWORD && ! quoteflag && equal(wordtext, "in")) {
366 1.1 cgd app = ≈
367 1.1 cgd while (readtoken() == TWORD) {
368 1.1 cgd n2 = (union node *)stalloc(sizeof (struct narg));
369 1.1 cgd n2->type = NARG;
370 1.1 cgd n2->narg.text = wordtext;
371 1.1 cgd n2->narg.backquote = backquotelist;
372 1.1 cgd *app = n2;
373 1.1 cgd app = &n2->narg.next;
374 1.1 cgd }
375 1.1 cgd *app = NULL;
376 1.1 cgd n1->nfor.args = ap;
377 1.5 sef if (lasttoken != TNL && lasttoken != TSEMI)
378 1.5 sef synexpect(-1);
379 1.1 cgd } else {
380 1.43 christos static char argvars[5] = {CTLVAR, VSNORMAL|VSQUOTE,
381 1.1 cgd '@', '=', '\0'};
382 1.1 cgd n2 = (union node *)stalloc(sizeof (struct narg));
383 1.1 cgd n2->type = NARG;
384 1.43 christos n2->narg.text = argvars;
385 1.1 cgd n2->narg.backquote = NULL;
386 1.1 cgd n2->narg.next = NULL;
387 1.1 cgd n1->nfor.args = n2;
388 1.11 jtc /*
389 1.11 jtc * Newline or semicolon here is optional (but note
390 1.11 jtc * that the original Bourne shell only allowed NL).
391 1.11 jtc */
392 1.11 jtc if (lasttoken != TNL && lasttoken != TSEMI)
393 1.11 jtc tokpushback++;
394 1.1 cgd }
395 1.1 cgd checkkwd = 2;
396 1.1 cgd if ((t = readtoken()) == TDO)
397 1.1 cgd t = TDONE;
398 1.1 cgd else if (t == TBEGIN)
399 1.1 cgd t = TEND;
400 1.1 cgd else
401 1.1 cgd synexpect(-1);
402 1.1 cgd n1->nfor.body = list(0);
403 1.1 cgd if (readtoken() != t)
404 1.1 cgd synexpect(t);
405 1.1 cgd checkkwd = 1;
406 1.1 cgd break;
407 1.1 cgd case TCASE:
408 1.1 cgd n1 = (union node *)stalloc(sizeof (struct ncase));
409 1.1 cgd n1->type = NCASE;
410 1.1 cgd if (readtoken() != TWORD)
411 1.1 cgd synexpect(TWORD);
412 1.1 cgd n1->ncase.expr = n2 = (union node *)stalloc(sizeof (struct narg));
413 1.1 cgd n2->type = NARG;
414 1.1 cgd n2->narg.text = wordtext;
415 1.1 cgd n2->narg.backquote = backquotelist;
416 1.1 cgd n2->narg.next = NULL;
417 1.1 cgd while (readtoken() == TNL);
418 1.1 cgd if (lasttoken != TWORD || ! equal(wordtext, "in"))
419 1.1 cgd synerror("expecting \"in\"");
420 1.1 cgd cpp = &n1->ncase.cases;
421 1.48 christos noalias = 1;
422 1.15 jtc checkkwd = 2, readtoken();
423 1.15 jtc do {
424 1.1 cgd *cpp = cp = (union node *)stalloc(sizeof (struct nclist));
425 1.1 cgd cp->type = NCLIST;
426 1.1 cgd app = &cp->nclist.pattern;
427 1.1 cgd for (;;) {
428 1.1 cgd *app = ap = (union node *)stalloc(sizeof (struct narg));
429 1.1 cgd ap->type = NARG;
430 1.1 cgd ap->narg.text = wordtext;
431 1.1 cgd ap->narg.backquote = backquotelist;
432 1.15 jtc if (checkkwd = 2, readtoken() != TPIPE)
433 1.1 cgd break;
434 1.1 cgd app = &ap->narg.next;
435 1.16 jtc readtoken();
436 1.1 cgd }
437 1.1 cgd ap->narg.next = NULL;
438 1.48 christos noalias = 0;
439 1.48 christos if (lasttoken != TRP) {
440 1.1 cgd synexpect(TRP);
441 1.48 christos }
442 1.1 cgd cp->nclist.body = list(0);
443 1.15 jtc
444 1.15 jtc checkkwd = 2;
445 1.15 jtc if ((t = readtoken()) != TESAC) {
446 1.48 christos if (t != TENDCASE) {
447 1.48 christos noalias = 0;
448 1.15 jtc synexpect(TENDCASE);
449 1.48 christos } else {
450 1.48 christos noalias = 1;
451 1.48 christos checkkwd = 2;
452 1.48 christos readtoken();
453 1.48 christos }
454 1.15 jtc }
455 1.1 cgd cpp = &cp->nclist.next;
456 1.15 jtc } while(lasttoken != TESAC);
457 1.48 christos noalias = 0;
458 1.1 cgd *cpp = NULL;
459 1.1 cgd checkkwd = 1;
460 1.1 cgd break;
461 1.1 cgd case TLP:
462 1.1 cgd n1 = (union node *)stalloc(sizeof (struct nredir));
463 1.1 cgd n1->type = NSUBSHELL;
464 1.1 cgd n1->nredir.n = list(0);
465 1.1 cgd n1->nredir.redirect = NULL;
466 1.1 cgd if (readtoken() != TRP)
467 1.1 cgd synexpect(TRP);
468 1.1 cgd checkkwd = 1;
469 1.1 cgd break;
470 1.1 cgd case TBEGIN:
471 1.1 cgd n1 = list(0);
472 1.1 cgd if (readtoken() != TEND)
473 1.1 cgd synexpect(TEND);
474 1.1 cgd checkkwd = 1;
475 1.1 cgd break;
476 1.5 sef /* Handle an empty command like other simple commands. */
477 1.19 mycroft case TSEMI:
478 1.19 mycroft /*
479 1.19 mycroft * An empty command before a ; doesn't make much sense, and
480 1.19 mycroft * should certainly be disallowed in the case of `if ;'.
481 1.19 mycroft */
482 1.19 mycroft if (!redir)
483 1.19 mycroft synexpect(-1);
484 1.30 christos case TAND:
485 1.30 christos case TOR:
486 1.5 sef case TNL:
487 1.20 mycroft case TEOF:
488 1.1 cgd case TWORD:
489 1.19 mycroft case TRP:
490 1.1 cgd tokpushback++;
491 1.31 christos n1 = simplecmd(rpp, redir);
492 1.31 christos goto checkneg;
493 1.1 cgd default:
494 1.1 cgd synexpect(-1);
495 1.39 mycroft /* NOTREACHED */
496 1.1 cgd }
497 1.1 cgd
498 1.1 cgd /* Now check for redirection which may follow command */
499 1.1 cgd while (readtoken() == TREDIR) {
500 1.1 cgd *rpp = n2 = redirnode;
501 1.1 cgd rpp = &n2->nfile.next;
502 1.1 cgd parsefname();
503 1.1 cgd }
504 1.1 cgd tokpushback++;
505 1.1 cgd *rpp = NULL;
506 1.1 cgd if (redir) {
507 1.1 cgd if (n1->type != NSUBSHELL) {
508 1.1 cgd n2 = (union node *)stalloc(sizeof (struct nredir));
509 1.1 cgd n2->type = NREDIR;
510 1.1 cgd n2->nredir.n = n1;
511 1.1 cgd n1 = n2;
512 1.1 cgd }
513 1.1 cgd n1->nredir.redirect = redir;
514 1.1 cgd }
515 1.31 christos
516 1.31 christos checkneg:
517 1.31 christos if (negate) {
518 1.31 christos n2 = (union node *)stalloc(sizeof (struct nnot));
519 1.31 christos n2->type = NNOT;
520 1.31 christos n2->nnot.com = n1;
521 1.31 christos return n2;
522 1.31 christos }
523 1.31 christos else
524 1.31 christos return n1;
525 1.1 cgd }
526 1.1 cgd
527 1.1 cgd
528 1.1 cgd STATIC union node *
529 1.30 christos simplecmd(rpp, redir)
530 1.5 sef union node **rpp, *redir;
531 1.5 sef {
532 1.1 cgd union node *args, **app;
533 1.5 sef union node **orig_rpp = rpp;
534 1.31 christos union node *n = NULL, *n2;
535 1.31 christos int negate = 0;
536 1.1 cgd
537 1.11 jtc /* If we don't have any redirections already, then we must reset */
538 1.11 jtc /* rpp to be the address of the local redir variable. */
539 1.5 sef if (redir == 0)
540 1.5 sef rpp = &redir;
541 1.5 sef
542 1.1 cgd args = NULL;
543 1.1 cgd app = &args;
544 1.30 christos /*
545 1.11 jtc * We save the incoming value, because we need this for shell
546 1.11 jtc * functions. There can not be a redirect or an argument between
547 1.30 christos * the function name and the open parenthesis.
548 1.11 jtc */
549 1.5 sef orig_rpp = rpp;
550 1.11 jtc
551 1.31 christos while (readtoken() == TNOT) {
552 1.31 christos TRACE(("command: TNOT recognized\n"));
553 1.31 christos negate = !negate;
554 1.31 christos }
555 1.31 christos tokpushback++;
556 1.31 christos
557 1.1 cgd for (;;) {
558 1.1 cgd if (readtoken() == TWORD) {
559 1.1 cgd n = (union node *)stalloc(sizeof (struct narg));
560 1.1 cgd n->type = NARG;
561 1.1 cgd n->narg.text = wordtext;
562 1.1 cgd n->narg.backquote = backquotelist;
563 1.1 cgd *app = n;
564 1.1 cgd app = &n->narg.next;
565 1.1 cgd } else if (lasttoken == TREDIR) {
566 1.1 cgd *rpp = n = redirnode;
567 1.1 cgd rpp = &n->nfile.next;
568 1.1 cgd parsefname(); /* read name of redirection file */
569 1.1 cgd } else if (lasttoken == TLP && app == &args->narg.next
570 1.5 sef && rpp == orig_rpp) {
571 1.1 cgd /* We have a function */
572 1.1 cgd if (readtoken() != TRP)
573 1.1 cgd synexpect(TRP);
574 1.1 cgd #ifdef notdef
575 1.1 cgd if (! goodname(n->narg.text))
576 1.1 cgd synerror("Bad function name");
577 1.1 cgd #endif
578 1.1 cgd n->type = NDEFUN;
579 1.1 cgd n->narg.next = command();
580 1.31 christos goto checkneg;
581 1.1 cgd } else {
582 1.1 cgd tokpushback++;
583 1.1 cgd break;
584 1.1 cgd }
585 1.1 cgd }
586 1.1 cgd *app = NULL;
587 1.1 cgd *rpp = NULL;
588 1.1 cgd n = (union node *)stalloc(sizeof (struct ncmd));
589 1.1 cgd n->type = NCMD;
590 1.1 cgd n->ncmd.backgnd = 0;
591 1.1 cgd n->ncmd.args = args;
592 1.1 cgd n->ncmd.redirect = redir;
593 1.31 christos
594 1.31 christos checkneg:
595 1.31 christos if (negate) {
596 1.31 christos n2 = (union node *)stalloc(sizeof (struct nnot));
597 1.31 christos n2->type = NNOT;
598 1.31 christos n2->nnot.com = n;
599 1.31 christos return n2;
600 1.31 christos }
601 1.31 christos else
602 1.31 christos return n;
603 1.1 cgd }
604 1.1 cgd
605 1.18 jtc STATIC union node *
606 1.18 jtc makename() {
607 1.18 jtc union node *n;
608 1.18 jtc
609 1.18 jtc n = (union node *)stalloc(sizeof (struct narg));
610 1.18 jtc n->type = NARG;
611 1.18 jtc n->narg.next = NULL;
612 1.18 jtc n->narg.text = wordtext;
613 1.18 jtc n->narg.backquote = backquotelist;
614 1.18 jtc return n;
615 1.18 jtc }
616 1.18 jtc
617 1.45 cgd void fixredir(union node *n, const char *text, int err)
618 1.18 jtc {
619 1.18 jtc TRACE(("Fix redir %s %d\n", text, err));
620 1.18 jtc if (!err)
621 1.18 jtc n->ndup.vname = NULL;
622 1.18 jtc
623 1.18 jtc if (is_digit(text[0]) && text[1] == '\0')
624 1.18 jtc n->ndup.dupfd = digit_val(text[0]);
625 1.18 jtc else if (text[0] == '-' && text[1] == '\0')
626 1.18 jtc n->ndup.dupfd = -1;
627 1.18 jtc else {
628 1.30 christos
629 1.18 jtc if (err)
630 1.18 jtc synerror("Bad fd number");
631 1.18 jtc else
632 1.18 jtc n->ndup.vname = makename();
633 1.18 jtc }
634 1.18 jtc }
635 1.18 jtc
636 1.1 cgd
637 1.1 cgd STATIC void
638 1.1 cgd parsefname() {
639 1.1 cgd union node *n = redirnode;
640 1.1 cgd
641 1.1 cgd if (readtoken() != TWORD)
642 1.1 cgd synexpect(-1);
643 1.1 cgd if (n->type == NHERE) {
644 1.1 cgd struct heredoc *here = heredoc;
645 1.1 cgd struct heredoc *p;
646 1.1 cgd int i;
647 1.1 cgd
648 1.1 cgd if (quoteflag == 0)
649 1.1 cgd n->type = NXHERE;
650 1.1 cgd TRACE(("Here document %d\n", n->type));
651 1.1 cgd if (here->striptabs) {
652 1.1 cgd while (*wordtext == '\t')
653 1.1 cgd wordtext++;
654 1.1 cgd }
655 1.1 cgd if (! noexpand(wordtext) || (i = strlen(wordtext)) == 0 || i > EOFMARKLEN)
656 1.1 cgd synerror("Illegal eof marker for << redirection");
657 1.1 cgd rmescapes(wordtext);
658 1.1 cgd here->eofmark = wordtext;
659 1.1 cgd here->next = NULL;
660 1.1 cgd if (heredoclist == NULL)
661 1.1 cgd heredoclist = here;
662 1.1 cgd else {
663 1.1 cgd for (p = heredoclist ; p->next ; p = p->next);
664 1.1 cgd p->next = here;
665 1.1 cgd }
666 1.1 cgd } else if (n->type == NTOFD || n->type == NFROMFD) {
667 1.18 jtc fixredir(n, wordtext, 0);
668 1.1 cgd } else {
669 1.18 jtc n->nfile.fname = makename();
670 1.1 cgd }
671 1.1 cgd }
672 1.1 cgd
673 1.1 cgd
674 1.1 cgd /*
675 1.1 cgd * Input any here documents.
676 1.1 cgd */
677 1.1 cgd
678 1.1 cgd STATIC void
679 1.1 cgd parseheredoc() {
680 1.1 cgd struct heredoc *here;
681 1.1 cgd union node *n;
682 1.1 cgd
683 1.1 cgd while (heredoclist) {
684 1.1 cgd here = heredoclist;
685 1.1 cgd heredoclist = here->next;
686 1.1 cgd if (needprompt) {
687 1.11 jtc setprompt(2);
688 1.1 cgd needprompt = 0;
689 1.1 cgd }
690 1.1 cgd readtoken1(pgetc(), here->here->type == NHERE? SQSYNTAX : DQSYNTAX,
691 1.1 cgd here->eofmark, here->striptabs);
692 1.1 cgd n = (union node *)stalloc(sizeof (struct narg));
693 1.1 cgd n->narg.type = NARG;
694 1.1 cgd n->narg.next = NULL;
695 1.1 cgd n->narg.text = wordtext;
696 1.1 cgd n->narg.backquote = backquotelist;
697 1.1 cgd here->here->nhere.doc = n;
698 1.1 cgd }
699 1.1 cgd }
700 1.1 cgd
701 1.1 cgd STATIC int
702 1.1 cgd peektoken() {
703 1.1 cgd int t;
704 1.1 cgd
705 1.1 cgd t = readtoken();
706 1.1 cgd tokpushback++;
707 1.1 cgd return (t);
708 1.1 cgd }
709 1.1 cgd
710 1.1 cgd STATIC int
711 1.1 cgd readtoken() {
712 1.1 cgd int t;
713 1.11 jtc int savecheckkwd = checkkwd;
714 1.1 cgd #ifdef DEBUG
715 1.1 cgd int alreadyseen = tokpushback;
716 1.1 cgd #endif
717 1.48 christos struct alias *ap;
718 1.30 christos
719 1.11 jtc top:
720 1.1 cgd t = xxreadtoken();
721 1.1 cgd
722 1.1 cgd if (checkkwd) {
723 1.1 cgd /*
724 1.1 cgd * eat newlines
725 1.1 cgd */
726 1.1 cgd if (checkkwd == 2) {
727 1.1 cgd checkkwd = 0;
728 1.1 cgd while (t == TNL) {
729 1.1 cgd parseheredoc();
730 1.1 cgd t = xxreadtoken();
731 1.1 cgd }
732 1.1 cgd } else
733 1.1 cgd checkkwd = 0;
734 1.1 cgd /*
735 1.11 jtc * check for keywords and aliases
736 1.1 cgd */
737 1.30 christos if (t == TWORD && !quoteflag)
738 1.22 cgd {
739 1.43 christos const char *const *pp;
740 1.1 cgd
741 1.43 christos for (pp = parsekwd; *pp; pp++) {
742 1.30 christos if (**pp == *wordtext && equal(*pp, wordtext))
743 1.22 cgd {
744 1.43 christos lasttoken = t = pp -
745 1.43 christos parsekwd + KWDOFFSET;
746 1.1 cgd TRACE(("keyword %s recognized\n", tokname[t]));
747 1.11 jtc goto out;
748 1.1 cgd }
749 1.1 cgd }
750 1.48 christos if(!noalias &&
751 1.48 christos (ap = lookupalias(wordtext, 1)) != NULL) {
752 1.11 jtc pushstring(ap->val, strlen(ap->val), ap);
753 1.11 jtc checkkwd = savecheckkwd;
754 1.11 jtc goto top;
755 1.11 jtc }
756 1.1 cgd }
757 1.11 jtc out:
758 1.31 christos checkkwd = (t == TNOT) ? savecheckkwd : 0;
759 1.1 cgd }
760 1.1 cgd #ifdef DEBUG
761 1.1 cgd if (!alreadyseen)
762 1.1 cgd TRACE(("token %s %s\n", tokname[t], t == TWORD ? wordtext : ""));
763 1.1 cgd else
764 1.1 cgd TRACE(("reread token %s %s\n", tokname[t], t == TWORD ? wordtext : ""));
765 1.1 cgd #endif
766 1.1 cgd return (t);
767 1.1 cgd }
768 1.1 cgd
769 1.1 cgd
770 1.1 cgd /*
771 1.1 cgd * Read the next input token.
772 1.1 cgd * If the token is a word, we set backquotelist to the list of cmds in
773 1.1 cgd * backquotes. We set quoteflag to true if any part of the word was
774 1.1 cgd * quoted.
775 1.1 cgd * If the token is TREDIR, then we set redirnode to a structure containing
776 1.1 cgd * the redirection.
777 1.1 cgd * In all cases, the variable startlinno is set to the number of the line
778 1.1 cgd * on which the token starts.
779 1.1 cgd *
780 1.1 cgd * [Change comment: here documents and internal procedures]
781 1.1 cgd * [Readtoken shouldn't have any arguments. Perhaps we should make the
782 1.1 cgd * word parsing code into a separate routine. In this case, readtoken
783 1.1 cgd * doesn't need to have any internal procedures, but parseword does.
784 1.1 cgd * We could also make parseoperator in essence the main routine, and
785 1.1 cgd * have parseword (readtoken1?) handle both words and redirection.]
786 1.1 cgd */
787 1.1 cgd
788 1.1 cgd #define RETURN(token) return lasttoken = token
789 1.1 cgd
790 1.1 cgd STATIC int
791 1.1 cgd xxreadtoken() {
792 1.32 tls int c;
793 1.1 cgd
794 1.1 cgd if (tokpushback) {
795 1.1 cgd tokpushback = 0;
796 1.1 cgd return lasttoken;
797 1.1 cgd }
798 1.1 cgd if (needprompt) {
799 1.11 jtc setprompt(2);
800 1.1 cgd needprompt = 0;
801 1.1 cgd }
802 1.1 cgd startlinno = plinno;
803 1.1 cgd for (;;) { /* until token or start of word found */
804 1.1 cgd c = pgetc_macro();
805 1.1 cgd if (c == ' ' || c == '\t')
806 1.1 cgd continue; /* quick check for white space first */
807 1.1 cgd switch (c) {
808 1.1 cgd case ' ': case '\t':
809 1.1 cgd continue;
810 1.1 cgd case '#':
811 1.1 cgd while ((c = pgetc()) != '\n' && c != PEOF);
812 1.1 cgd pungetc();
813 1.1 cgd continue;
814 1.1 cgd case '\\':
815 1.1 cgd if (pgetc() == '\n') {
816 1.1 cgd startlinno = ++plinno;
817 1.1 cgd if (doprompt)
818 1.11 jtc setprompt(2);
819 1.11 jtc else
820 1.11 jtc setprompt(0);
821 1.1 cgd continue;
822 1.1 cgd }
823 1.1 cgd pungetc();
824 1.1 cgd goto breakloop;
825 1.1 cgd case '\n':
826 1.1 cgd plinno++;
827 1.1 cgd needprompt = doprompt;
828 1.1 cgd RETURN(TNL);
829 1.1 cgd case PEOF:
830 1.1 cgd RETURN(TEOF);
831 1.1 cgd case '&':
832 1.1 cgd if (pgetc() == '&')
833 1.1 cgd RETURN(TAND);
834 1.1 cgd pungetc();
835 1.1 cgd RETURN(TBACKGND);
836 1.1 cgd case '|':
837 1.1 cgd if (pgetc() == '|')
838 1.1 cgd RETURN(TOR);
839 1.1 cgd pungetc();
840 1.1 cgd RETURN(TPIPE);
841 1.1 cgd case ';':
842 1.1 cgd if (pgetc() == ';')
843 1.1 cgd RETURN(TENDCASE);
844 1.1 cgd pungetc();
845 1.1 cgd RETURN(TSEMI);
846 1.1 cgd case '(':
847 1.1 cgd RETURN(TLP);
848 1.1 cgd case ')':
849 1.1 cgd RETURN(TRP);
850 1.1 cgd default:
851 1.1 cgd goto breakloop;
852 1.1 cgd }
853 1.1 cgd }
854 1.1 cgd breakloop:
855 1.1 cgd return readtoken1(c, BASESYNTAX, (char *)NULL, 0);
856 1.1 cgd #undef RETURN
857 1.1 cgd }
858 1.1 cgd
859 1.1 cgd
860 1.1 cgd
861 1.1 cgd /*
862 1.1 cgd * If eofmark is NULL, read a word or a redirection symbol. If eofmark
863 1.1 cgd * is not NULL, read a here document. In the latter case, eofmark is the
864 1.1 cgd * word which marks the end of the document and striptabs is true if
865 1.1 cgd * leading tabs should be stripped from the document. The argument firstc
866 1.1 cgd * is the first character of the input token or document.
867 1.1 cgd *
868 1.1 cgd * Because C does not have internal subroutines, I have simulated them
869 1.1 cgd * using goto's to implement the subroutine linkage. The following macros
870 1.1 cgd * will run code that appears at the end of readtoken1.
871 1.1 cgd */
872 1.1 cgd
873 1.1 cgd #define CHECKEND() {goto checkend; checkend_return:;}
874 1.1 cgd #define PARSEREDIR() {goto parseredir; parseredir_return:;}
875 1.1 cgd #define PARSESUB() {goto parsesub; parsesub_return:;}
876 1.1 cgd #define PARSEBACKQOLD() {oldstyle = 1; goto parsebackq; parsebackq_oldreturn:;}
877 1.1 cgd #define PARSEBACKQNEW() {oldstyle = 0; goto parsebackq; parsebackq_newreturn:;}
878 1.11 jtc #define PARSEARITH() {goto parsearith; parsearith_return:;}
879 1.1 cgd
880 1.1 cgd STATIC int
881 1.1 cgd readtoken1(firstc, syntax, eofmark, striptabs)
882 1.1 cgd int firstc;
883 1.1 cgd char const *syntax;
884 1.1 cgd char *eofmark;
885 1.1 cgd int striptabs;
886 1.1 cgd {
887 1.25 christos int c = firstc;
888 1.25 christos char *out;
889 1.1 cgd int len;
890 1.1 cgd char line[EOFMARKLEN + 1];
891 1.1 cgd struct nodelist *bqlist;
892 1.1 cgd int quotef;
893 1.1 cgd int dblquote;
894 1.11 jtc int varnest; /* levels of variables expansion */
895 1.11 jtc int arinest; /* levels of arithmetic expansion */
896 1.11 jtc int parenlevel; /* levels of parens in arithmetic */
897 1.1 cgd int oldstyle;
898 1.11 jtc char const *prevsyntax; /* syntax before arithmetic */
899 1.25 christos #if __GNUC__
900 1.25 christos /* Avoid longjmp clobbering */
901 1.25 christos (void) &out;
902 1.25 christos (void) "ef;
903 1.25 christos (void) &dblquote;
904 1.25 christos (void) &varnest;
905 1.25 christos (void) &arinest;
906 1.25 christos (void) &parenlevel;
907 1.25 christos (void) &oldstyle;
908 1.25 christos (void) &prevsyntax;
909 1.25 christos (void) &syntax;
910 1.25 christos #endif
911 1.1 cgd
912 1.1 cgd startlinno = plinno;
913 1.1 cgd dblquote = 0;
914 1.1 cgd if (syntax == DQSYNTAX)
915 1.1 cgd dblquote = 1;
916 1.1 cgd quotef = 0;
917 1.1 cgd bqlist = NULL;
918 1.1 cgd varnest = 0;
919 1.11 jtc arinest = 0;
920 1.11 jtc parenlevel = 0;
921 1.11 jtc
922 1.1 cgd STARTSTACKSTR(out);
923 1.1 cgd loop: { /* for each line, until end of word */
924 1.1 cgd #if ATTY
925 1.1 cgd if (c == '\034' && doprompt
926 1.1 cgd && attyset() && ! equal(termval(), "emacs")) {
927 1.1 cgd attyline();
928 1.1 cgd if (syntax == BASESYNTAX)
929 1.1 cgd return readtoken();
930 1.1 cgd c = pgetc();
931 1.1 cgd goto loop;
932 1.1 cgd }
933 1.1 cgd #endif
934 1.1 cgd CHECKEND(); /* set c to PEOF if at end of here document */
935 1.1 cgd for (;;) { /* until end of line or end of word */
936 1.1 cgd CHECKSTRSPACE(3, out); /* permit 3 calls to USTPUTC */
937 1.1 cgd switch(syntax[c]) {
938 1.1 cgd case CNL: /* '\n' */
939 1.1 cgd if (syntax == BASESYNTAX)
940 1.1 cgd goto endword; /* exit outer loop */
941 1.1 cgd USTPUTC(c, out);
942 1.1 cgd plinno++;
943 1.11 jtc if (doprompt)
944 1.11 jtc setprompt(2);
945 1.11 jtc else
946 1.11 jtc setprompt(0);
947 1.1 cgd c = pgetc();
948 1.1 cgd goto loop; /* continue outer loop */
949 1.1 cgd case CWORD:
950 1.1 cgd USTPUTC(c, out);
951 1.1 cgd break;
952 1.1 cgd case CCTL:
953 1.1 cgd if (eofmark == NULL || dblquote)
954 1.1 cgd USTPUTC(CTLESC, out);
955 1.1 cgd USTPUTC(c, out);
956 1.1 cgd break;
957 1.1 cgd case CBACK: /* backslash */
958 1.1 cgd c = pgetc();
959 1.1 cgd if (c == PEOF) {
960 1.1 cgd USTPUTC('\\', out);
961 1.1 cgd pungetc();
962 1.1 cgd } else if (c == '\n') {
963 1.1 cgd if (doprompt)
964 1.11 jtc setprompt(2);
965 1.11 jtc else
966 1.11 jtc setprompt(0);
967 1.1 cgd } else {
968 1.1 cgd if (dblquote && c != '\\' && c != '`' && c != '$'
969 1.1 cgd && (c != '"' || eofmark != NULL))
970 1.1 cgd USTPUTC('\\', out);
971 1.1 cgd if (SQSYNTAX[c] == CCTL)
972 1.1 cgd USTPUTC(CTLESC, out);
973 1.41 mycroft else if (eofmark == NULL)
974 1.41 mycroft USTPUTC(CTLQUOTEMARK, out);
975 1.1 cgd USTPUTC(c, out);
976 1.1 cgd quotef++;
977 1.1 cgd }
978 1.1 cgd break;
979 1.1 cgd case CSQUOTE:
980 1.41 mycroft if (eofmark == NULL)
981 1.41 mycroft USTPUTC(CTLQUOTEMARK, out);
982 1.1 cgd syntax = SQSYNTAX;
983 1.1 cgd break;
984 1.1 cgd case CDQUOTE:
985 1.41 mycroft if (eofmark == NULL)
986 1.41 mycroft USTPUTC(CTLQUOTEMARK, out);
987 1.1 cgd syntax = DQSYNTAX;
988 1.1 cgd dblquote = 1;
989 1.1 cgd break;
990 1.1 cgd case CENDQUOTE:
991 1.41 mycroft if (eofmark != NULL && arinest == 0 &&
992 1.41 mycroft varnest == 0) {
993 1.1 cgd USTPUTC(c, out);
994 1.1 cgd } else {
995 1.41 mycroft if (arinest) {
996 1.11 jtc syntax = ARISYNTAX;
997 1.41 mycroft dblquote = 0;
998 1.41 mycroft } else if (eofmark == NULL) {
999 1.11 jtc syntax = BASESYNTAX;
1000 1.41 mycroft dblquote = 0;
1001 1.41 mycroft }
1002 1.1 cgd quotef++;
1003 1.1 cgd }
1004 1.1 cgd break;
1005 1.1 cgd case CVAR: /* '$' */
1006 1.1 cgd PARSESUB(); /* parse substitution */
1007 1.1 cgd break;
1008 1.1 cgd case CENDVAR: /* '}' */
1009 1.1 cgd if (varnest > 0) {
1010 1.1 cgd varnest--;
1011 1.1 cgd USTPUTC(CTLENDVAR, out);
1012 1.1 cgd } else {
1013 1.1 cgd USTPUTC(c, out);
1014 1.1 cgd }
1015 1.1 cgd break;
1016 1.11 jtc case CLP: /* '(' in arithmetic */
1017 1.11 jtc parenlevel++;
1018 1.11 jtc USTPUTC(c, out);
1019 1.11 jtc break;
1020 1.11 jtc case CRP: /* ')' in arithmetic */
1021 1.11 jtc if (parenlevel > 0) {
1022 1.11 jtc USTPUTC(c, out);
1023 1.11 jtc --parenlevel;
1024 1.11 jtc } else {
1025 1.11 jtc if (pgetc() == ')') {
1026 1.11 jtc if (--arinest == 0) {
1027 1.11 jtc USTPUTC(CTLENDARI, out);
1028 1.11 jtc syntax = prevsyntax;
1029 1.41 mycroft if (syntax == DQSYNTAX)
1030 1.41 mycroft dblquote = 1;
1031 1.41 mycroft else
1032 1.41 mycroft dblquote = 0;
1033 1.11 jtc } else
1034 1.11 jtc USTPUTC(')', out);
1035 1.11 jtc } else {
1036 1.30 christos /*
1037 1.11 jtc * unbalanced parens
1038 1.11 jtc * (don't 2nd guess - no error)
1039 1.11 jtc */
1040 1.11 jtc pungetc();
1041 1.11 jtc USTPUTC(')', out);
1042 1.11 jtc }
1043 1.11 jtc }
1044 1.11 jtc break;
1045 1.1 cgd case CBQUOTE: /* '`' */
1046 1.1 cgd PARSEBACKQOLD();
1047 1.1 cgd break;
1048 1.1 cgd case CEOF:
1049 1.1 cgd goto endword; /* exit outer loop */
1050 1.1 cgd default:
1051 1.1 cgd if (varnest == 0)
1052 1.1 cgd goto endword; /* exit outer loop */
1053 1.1 cgd USTPUTC(c, out);
1054 1.1 cgd }
1055 1.1 cgd c = pgetc_macro();
1056 1.1 cgd }
1057 1.1 cgd }
1058 1.1 cgd endword:
1059 1.11 jtc if (syntax == ARISYNTAX)
1060 1.11 jtc synerror("Missing '))'");
1061 1.5 sef if (syntax != BASESYNTAX && ! parsebackquote && eofmark == NULL)
1062 1.1 cgd synerror("Unterminated quoted string");
1063 1.1 cgd if (varnest != 0) {
1064 1.1 cgd startlinno = plinno;
1065 1.1 cgd synerror("Missing '}'");
1066 1.1 cgd }
1067 1.1 cgd USTPUTC('\0', out);
1068 1.1 cgd len = out - stackblock();
1069 1.1 cgd out = stackblock();
1070 1.1 cgd if (eofmark == NULL) {
1071 1.1 cgd if ((c == '>' || c == '<')
1072 1.1 cgd && quotef == 0
1073 1.1 cgd && len <= 2
1074 1.1 cgd && (*out == '\0' || is_digit(*out))) {
1075 1.1 cgd PARSEREDIR();
1076 1.1 cgd return lasttoken = TREDIR;
1077 1.1 cgd } else {
1078 1.1 cgd pungetc();
1079 1.1 cgd }
1080 1.1 cgd }
1081 1.1 cgd quoteflag = quotef;
1082 1.1 cgd backquotelist = bqlist;
1083 1.1 cgd grabstackblock(len);
1084 1.1 cgd wordtext = out;
1085 1.1 cgd return lasttoken = TWORD;
1086 1.1 cgd /* end of readtoken routine */
1087 1.1 cgd
1088 1.1 cgd
1089 1.1 cgd
1090 1.1 cgd /*
1091 1.1 cgd * Check to see whether we are at the end of the here document. When this
1092 1.1 cgd * is called, c is set to the first character of the next input line. If
1093 1.1 cgd * we are at the end of the here document, this routine sets the c to PEOF.
1094 1.1 cgd */
1095 1.1 cgd
1096 1.1 cgd checkend: {
1097 1.1 cgd if (eofmark) {
1098 1.1 cgd if (striptabs) {
1099 1.1 cgd while (c == '\t')
1100 1.1 cgd c = pgetc();
1101 1.1 cgd }
1102 1.1 cgd if (c == *eofmark) {
1103 1.1 cgd if (pfgets(line, sizeof line) != NULL) {
1104 1.32 tls char *p, *q;
1105 1.1 cgd
1106 1.1 cgd p = line;
1107 1.1 cgd for (q = eofmark + 1 ; *q && *p == *q ; p++, q++);
1108 1.1 cgd if (*p == '\n' && *q == '\0') {
1109 1.1 cgd c = PEOF;
1110 1.1 cgd plinno++;
1111 1.1 cgd needprompt = doprompt;
1112 1.1 cgd } else {
1113 1.11 jtc pushstring(line, strlen(line), NULL);
1114 1.1 cgd }
1115 1.1 cgd }
1116 1.1 cgd }
1117 1.1 cgd }
1118 1.1 cgd goto checkend_return;
1119 1.1 cgd }
1120 1.1 cgd
1121 1.1 cgd
1122 1.1 cgd /*
1123 1.1 cgd * Parse a redirection operator. The variable "out" points to a string
1124 1.1 cgd * specifying the fd to be redirected. The variable "c" contains the
1125 1.1 cgd * first character of the redirection operator.
1126 1.1 cgd */
1127 1.1 cgd
1128 1.1 cgd parseredir: {
1129 1.1 cgd char fd = *out;
1130 1.1 cgd union node *np;
1131 1.1 cgd
1132 1.1 cgd np = (union node *)stalloc(sizeof (struct nfile));
1133 1.1 cgd if (c == '>') {
1134 1.1 cgd np->nfile.fd = 1;
1135 1.1 cgd c = pgetc();
1136 1.1 cgd if (c == '>')
1137 1.1 cgd np->type = NAPPEND;
1138 1.1 cgd else if (c == '&')
1139 1.1 cgd np->type = NTOFD;
1140 1.1 cgd else {
1141 1.1 cgd np->type = NTO;
1142 1.1 cgd pungetc();
1143 1.1 cgd }
1144 1.1 cgd } else { /* c == '<' */
1145 1.1 cgd np->nfile.fd = 0;
1146 1.42 christos switch (c = pgetc()) {
1147 1.42 christos case '<':
1148 1.1 cgd if (sizeof (struct nfile) != sizeof (struct nhere)) {
1149 1.1 cgd np = (union node *)stalloc(sizeof (struct nhere));
1150 1.1 cgd np->nfile.fd = 0;
1151 1.1 cgd }
1152 1.1 cgd np->type = NHERE;
1153 1.1 cgd heredoc = (struct heredoc *)stalloc(sizeof (struct heredoc));
1154 1.1 cgd heredoc->here = np;
1155 1.1 cgd if ((c = pgetc()) == '-') {
1156 1.1 cgd heredoc->striptabs = 1;
1157 1.1 cgd } else {
1158 1.1 cgd heredoc->striptabs = 0;
1159 1.1 cgd pungetc();
1160 1.1 cgd }
1161 1.42 christos break;
1162 1.42 christos
1163 1.42 christos case '&':
1164 1.1 cgd np->type = NFROMFD;
1165 1.42 christos break;
1166 1.42 christos
1167 1.42 christos case '>':
1168 1.42 christos np->type = NFROMTO;
1169 1.42 christos break;
1170 1.42 christos
1171 1.42 christos default:
1172 1.1 cgd np->type = NFROM;
1173 1.1 cgd pungetc();
1174 1.42 christos break;
1175 1.1 cgd }
1176 1.1 cgd }
1177 1.1 cgd if (fd != '\0')
1178 1.1 cgd np->nfile.fd = digit_val(fd);
1179 1.1 cgd redirnode = np;
1180 1.1 cgd goto parseredir_return;
1181 1.1 cgd }
1182 1.1 cgd
1183 1.1 cgd
1184 1.1 cgd /*
1185 1.1 cgd * Parse a substitution. At this point, we have read the dollar sign
1186 1.1 cgd * and nothing else.
1187 1.1 cgd */
1188 1.1 cgd
1189 1.1 cgd parsesub: {
1190 1.1 cgd int subtype;
1191 1.1 cgd int typeloc;
1192 1.1 cgd int flags;
1193 1.1 cgd char *p;
1194 1.1 cgd static const char types[] = "}-+?=";
1195 1.1 cgd
1196 1.1 cgd c = pgetc();
1197 1.1 cgd if (c != '(' && c != '{' && !is_name(c) && !is_special(c)) {
1198 1.1 cgd USTPUTC('$', out);
1199 1.1 cgd pungetc();
1200 1.11 jtc } else if (c == '(') { /* $(command) or $((arith)) */
1201 1.11 jtc if (pgetc() == '(') {
1202 1.11 jtc PARSEARITH();
1203 1.11 jtc } else {
1204 1.11 jtc pungetc();
1205 1.11 jtc PARSEBACKQNEW();
1206 1.11 jtc }
1207 1.1 cgd } else {
1208 1.1 cgd USTPUTC(CTLVAR, out);
1209 1.1 cgd typeloc = out - stackblock();
1210 1.1 cgd USTPUTC(VSNORMAL, out);
1211 1.1 cgd subtype = VSNORMAL;
1212 1.1 cgd if (c == '{') {
1213 1.1 cgd c = pgetc();
1214 1.23 christos if (c == '#') {
1215 1.26 christos if ((c = pgetc()) == '}')
1216 1.26 christos c = '#';
1217 1.26 christos else
1218 1.26 christos subtype = VSLENGTH;
1219 1.23 christos }
1220 1.23 christos else
1221 1.23 christos subtype = 0;
1222 1.1 cgd }
1223 1.1 cgd if (is_name(c)) {
1224 1.1 cgd do {
1225 1.1 cgd STPUTC(c, out);
1226 1.1 cgd c = pgetc();
1227 1.1 cgd } while (is_in_name(c));
1228 1.34 christos } else if (is_digit(c)) {
1229 1.33 christos do {
1230 1.33 christos USTPUTC(c, out);
1231 1.33 christos c = pgetc();
1232 1.34 christos } while (is_digit(c));
1233 1.34 christos }
1234 1.34 christos else if (is_special(c)) {
1235 1.34 christos USTPUTC(c, out);
1236 1.34 christos c = pgetc();
1237 1.1 cgd }
1238 1.33 christos else
1239 1.33 christos badsub: synerror("Bad substitution");
1240 1.33 christos
1241 1.1 cgd STPUTC('=', out);
1242 1.1 cgd flags = 0;
1243 1.1 cgd if (subtype == 0) {
1244 1.23 christos switch (c) {
1245 1.23 christos case ':':
1246 1.1 cgd flags = VSNUL;
1247 1.1 cgd c = pgetc();
1248 1.23 christos /*FALLTHROUGH*/
1249 1.23 christos default:
1250 1.23 christos p = strchr(types, c);
1251 1.23 christos if (p == NULL)
1252 1.23 christos goto badsub;
1253 1.23 christos subtype = p - types + VSNORMAL;
1254 1.23 christos break;
1255 1.23 christos case '%':
1256 1.30 christos case '#':
1257 1.23 christos {
1258 1.23 christos int cc = c;
1259 1.23 christos subtype = c == '#' ? VSTRIMLEFT :
1260 1.23 christos VSTRIMRIGHT;
1261 1.23 christos c = pgetc();
1262 1.23 christos if (c == cc)
1263 1.23 christos subtype++;
1264 1.23 christos else
1265 1.23 christos pungetc();
1266 1.23 christos break;
1267 1.23 christos }
1268 1.1 cgd }
1269 1.1 cgd } else {
1270 1.1 cgd pungetc();
1271 1.1 cgd }
1272 1.11 jtc if (dblquote || arinest)
1273 1.1 cgd flags |= VSQUOTE;
1274 1.1 cgd *(stackblock() + typeloc) = subtype | flags;
1275 1.1 cgd if (subtype != VSNORMAL)
1276 1.1 cgd varnest++;
1277 1.1 cgd }
1278 1.1 cgd goto parsesub_return;
1279 1.1 cgd }
1280 1.1 cgd
1281 1.1 cgd
1282 1.1 cgd /*
1283 1.1 cgd * Called to parse command substitutions. Newstyle is set if the command
1284 1.1 cgd * is enclosed inside $(...); nlpp is a pointer to the head of the linked
1285 1.1 cgd * list of commands (passed by reference), and savelen is the number of
1286 1.1 cgd * characters on the top of the stack which must be preserved.
1287 1.1 cgd */
1288 1.1 cgd
1289 1.1 cgd parsebackq: {
1290 1.1 cgd struct nodelist **nlpp;
1291 1.1 cgd int savepbq;
1292 1.1 cgd union node *n;
1293 1.1 cgd char *volatile str;
1294 1.1 cgd struct jmploc jmploc;
1295 1.1 cgd struct jmploc *volatile savehandler;
1296 1.1 cgd int savelen;
1297 1.28 christos int saveprompt;
1298 1.36 christos #ifdef __GNUC__
1299 1.36 christos (void) &saveprompt;
1300 1.36 christos #endif
1301 1.1 cgd
1302 1.1 cgd savepbq = parsebackquote;
1303 1.1 cgd if (setjmp(jmploc.loc)) {
1304 1.1 cgd if (str)
1305 1.1 cgd ckfree(str);
1306 1.1 cgd parsebackquote = 0;
1307 1.1 cgd handler = savehandler;
1308 1.4 dpassage longjmp(handler->loc, 1);
1309 1.1 cgd }
1310 1.1 cgd INTOFF;
1311 1.1 cgd str = NULL;
1312 1.1 cgd savelen = out - stackblock();
1313 1.1 cgd if (savelen > 0) {
1314 1.1 cgd str = ckmalloc(savelen);
1315 1.21 mycroft memcpy(str, stackblock(), savelen);
1316 1.1 cgd }
1317 1.1 cgd savehandler = handler;
1318 1.1 cgd handler = &jmploc;
1319 1.1 cgd INTON;
1320 1.11 jtc if (oldstyle) {
1321 1.11 jtc /* We must read until the closing backquote, giving special
1322 1.11 jtc treatment to some slashes, and then push the string and
1323 1.11 jtc reread it as input, interpreting it normally. */
1324 1.43 christos char *pout;
1325 1.43 christos int pc;
1326 1.43 christos int psavelen;
1327 1.43 christos char *pstr;
1328 1.28 christos
1329 1.30 christos
1330 1.43 christos STARTSTACKSTR(pout);
1331 1.28 christos for (;;) {
1332 1.28 christos if (needprompt) {
1333 1.28 christos setprompt(2);
1334 1.28 christos needprompt = 0;
1335 1.28 christos }
1336 1.43 christos switch (pc = pgetc()) {
1337 1.28 christos case '`':
1338 1.28 christos goto done;
1339 1.28 christos
1340 1.28 christos case '\\':
1341 1.43 christos if ((pc = pgetc()) == '\n') {
1342 1.28 christos plinno++;
1343 1.28 christos if (doprompt)
1344 1.28 christos setprompt(2);
1345 1.28 christos else
1346 1.28 christos setprompt(0);
1347 1.29 christos /*
1348 1.29 christos * If eating a newline, avoid putting
1349 1.29 christos * the newline into the new character
1350 1.29 christos * stream (via the STPUTC after the
1351 1.29 christos * switch).
1352 1.29 christos */
1353 1.29 christos continue;
1354 1.28 christos }
1355 1.43 christos if (pc != '\\' && pc != '`' && pc != '$'
1356 1.43 christos && (!dblquote || pc != '"'))
1357 1.43 christos STPUTC('\\', pout);
1358 1.28 christos break;
1359 1.28 christos
1360 1.28 christos case '\n':
1361 1.28 christos plinno++;
1362 1.28 christos needprompt = doprompt;
1363 1.28 christos break;
1364 1.28 christos
1365 1.30 christos case PEOF:
1366 1.30 christos startlinno = plinno;
1367 1.30 christos synerror("EOF in backquote substitution");
1368 1.30 christos break;
1369 1.30 christos
1370 1.28 christos default:
1371 1.28 christos break;
1372 1.28 christos }
1373 1.43 christos STPUTC(pc, pout);
1374 1.11 jtc }
1375 1.28 christos done:
1376 1.43 christos STPUTC('\0', pout);
1377 1.43 christos psavelen = pout - stackblock();
1378 1.43 christos if (psavelen > 0) {
1379 1.43 christos pstr = grabstackstr(pout);
1380 1.43 christos setinputstring(pstr, 1);
1381 1.11 jtc }
1382 1.11 jtc }
1383 1.1 cgd nlpp = &bqlist;
1384 1.1 cgd while (*nlpp)
1385 1.1 cgd nlpp = &(*nlpp)->next;
1386 1.1 cgd *nlpp = (struct nodelist *)stalloc(sizeof (struct nodelist));
1387 1.1 cgd (*nlpp)->next = NULL;
1388 1.1 cgd parsebackquote = oldstyle;
1389 1.28 christos
1390 1.28 christos if (oldstyle) {
1391 1.28 christos saveprompt = doprompt;
1392 1.28 christos doprompt = 0;
1393 1.28 christos }
1394 1.28 christos
1395 1.1 cgd n = list(0);
1396 1.28 christos
1397 1.28 christos if (oldstyle)
1398 1.28 christos doprompt = saveprompt;
1399 1.28 christos else {
1400 1.28 christos if (readtoken() != TRP)
1401 1.28 christos synexpect(TRP);
1402 1.28 christos }
1403 1.28 christos
1404 1.1 cgd (*nlpp)->n = n;
1405 1.27 christos if (oldstyle) {
1406 1.27 christos /*
1407 1.27 christos * Start reading from old file again, ignoring any pushed back
1408 1.27 christos * tokens left from the backquote parsing
1409 1.27 christos */
1410 1.11 jtc popfile();
1411 1.27 christos tokpushback = 0;
1412 1.27 christos }
1413 1.1 cgd while (stackblocksize() <= savelen)
1414 1.1 cgd growstackblock();
1415 1.1 cgd STARTSTACKSTR(out);
1416 1.1 cgd if (str) {
1417 1.21 mycroft memcpy(out, str, savelen);
1418 1.1 cgd STADJUST(savelen, out);
1419 1.1 cgd INTOFF;
1420 1.1 cgd ckfree(str);
1421 1.1 cgd str = NULL;
1422 1.1 cgd INTON;
1423 1.1 cgd }
1424 1.1 cgd parsebackquote = savepbq;
1425 1.1 cgd handler = savehandler;
1426 1.11 jtc if (arinest || dblquote)
1427 1.11 jtc USTPUTC(CTLBACKQ | CTLQUOTE, out);
1428 1.11 jtc else
1429 1.11 jtc USTPUTC(CTLBACKQ, out);
1430 1.1 cgd if (oldstyle)
1431 1.1 cgd goto parsebackq_oldreturn;
1432 1.1 cgd else
1433 1.1 cgd goto parsebackq_newreturn;
1434 1.1 cgd }
1435 1.1 cgd
1436 1.1 cgd /*
1437 1.11 jtc * Parse an arithmetic expansion (indicate start of one and set state)
1438 1.1 cgd */
1439 1.11 jtc parsearith: {
1440 1.1 cgd
1441 1.11 jtc if (++arinest == 1) {
1442 1.11 jtc prevsyntax = syntax;
1443 1.11 jtc syntax = ARISYNTAX;
1444 1.11 jtc USTPUTC(CTLARI, out);
1445 1.41 mycroft if (dblquote)
1446 1.41 mycroft USTPUTC('"',out);
1447 1.41 mycroft else
1448 1.41 mycroft USTPUTC(' ',out);
1449 1.11 jtc } else {
1450 1.11 jtc /*
1451 1.11 jtc * we collapse embedded arithmetic expansion to
1452 1.11 jtc * parenthesis, which should be equivalent
1453 1.11 jtc */
1454 1.11 jtc USTPUTC('(', out);
1455 1.1 cgd }
1456 1.11 jtc goto parsearith_return;
1457 1.1 cgd }
1458 1.1 cgd
1459 1.11 jtc } /* end of readtoken */
1460 1.1 cgd
1461 1.1 cgd
1462 1.1 cgd
/*
 * Seen only when `mkinit' is defined (presumably by the mkinit generator,
 * which would collect this into the shell's reset code -- confirm against
 * the build).  Discards any pushed-back token and clears the pending
 * keyword check.
 */
#ifdef mkinit
RESET {
	checkkwd = 0;
	tokpushback = 0;
}
#endif
1469 1.1 cgd
1470 1.1 cgd /*
1471 1.1 cgd * Returns true if the text contains nothing to expand (no dollar signs
1472 1.1 cgd * or backquotes).
1473 1.1 cgd */
1474 1.1 cgd
1475 1.1 cgd STATIC int
1476 1.1 cgd noexpand(text)
1477 1.1 cgd char *text;
1478 1.1 cgd {
1479 1.32 tls char *p;
1480 1.32 tls char c;
1481 1.1 cgd
1482 1.1 cgd p = text;
1483 1.1 cgd while ((c = *p++) != '\0') {
1484 1.41 mycroft if (c == CTLQUOTEMARK)
1485 1.41 mycroft continue;
1486 1.1 cgd if (c == CTLESC)
1487 1.1 cgd p++;
1488 1.38 mrg else if (BASESYNTAX[(int)c] == CCTL)
1489 1.1 cgd return 0;
1490 1.1 cgd }
1491 1.1 cgd return 1;
1492 1.1 cgd }
1493 1.1 cgd
1494 1.1 cgd
/*
 * Decide whether `name' is a legal variable name: the first character must
 * satisfy is_name() and every following character up to the terminating
 * NUL must satisfy is_in_name().  Returns 1 if so, 0 otherwise.
 */

int
goodname(char *name)
{
	char *cp = name;

	/* the leading character has the stricter rule */
	if (! is_name(*cp))
		return 0;
	for (cp++; *cp != '\0'; cp++) {
		if (! is_in_name(*cp))
			return 0;
	}
	return 1;
}
1514 1.1 cgd
1515 1.1 cgd
1516 1.1 cgd /*
1517 1.1 cgd * Called when an unexpected token is read during the parse. The argument
1518 1.1 cgd * is the token that is expected, or -1 if more than one type of token can
1519 1.1 cgd * occur at this point.
1520 1.1 cgd */
1521 1.1 cgd
1522 1.1 cgd STATIC void
1523 1.30 christos synexpect(token)
1524 1.22 cgd int token;
1525 1.22 cgd {
1526 1.1 cgd char msg[64];
1527 1.1 cgd
1528 1.1 cgd if (token >= 0) {
1529 1.1 cgd fmtstr(msg, 64, "%s unexpected (expecting %s)",
1530 1.1 cgd tokname[lasttoken], tokname[token]);
1531 1.1 cgd } else {
1532 1.1 cgd fmtstr(msg, 64, "%s unexpected", tokname[lasttoken]);
1533 1.1 cgd }
1534 1.1 cgd synerror(msg);
1535 1.39 mycroft /* NOTREACHED */
1536 1.1 cgd }
1537 1.1 cgd
1538 1.1 cgd
1539 1.1 cgd STATIC void
1540 1.1 cgd synerror(msg)
1541 1.43 christos const char *msg;
1542 1.1 cgd {
1543 1.1 cgd if (commandname)
1544 1.1 cgd outfmt(&errout, "%s: %d: ", commandname, startlinno);
1545 1.1 cgd outfmt(&errout, "Syntax error: %s\n", msg);
1546 1.1 cgd error((char *)NULL);
1547 1.39 mycroft /* NOTREACHED */
1548 1.11 jtc }
1549 1.11 jtc
1550 1.11 jtc STATIC void
1551 1.11 jtc setprompt(which)
1552 1.11 jtc int which;
1553 1.11 jtc {
1554 1.11 jtc whichprompt = which;
1555 1.11 jtc
1556 1.35 christos #ifndef SMALL
1557 1.11 jtc if (!el)
1558 1.14 cgd #endif
1559 1.11 jtc out2str(getprompt(NULL));
1560 1.11 jtc }
1561 1.11 jtc
1562 1.11 jtc /*
1563 1.11 jtc * called by editline -- any expansions to the prompt
1564 1.11 jtc * should be added here.
1565 1.11 jtc */
1566 1.43 christos const char *
1567 1.45 cgd getprompt(void *unused)
1568 1.11 jtc {
1569 1.11 jtc switch (whichprompt) {
1570 1.11 jtc case 0:
1571 1.11 jtc return "";
1572 1.11 jtc case 1:
1573 1.11 jtc return ps1val();
1574 1.11 jtc case 2:
1575 1.11 jtc return ps2val();
1576 1.11 jtc default:
1577 1.11 jtc return "<internal prompt error>";
1578 1.11 jtc }
1579 1.1 cgd }
1580