cond.c revision 1.209 1 /* $NetBSD: cond.c,v 1.209 2020/11/12 20:16:20 rillig Exp $ */
2
3 /*
4 * Copyright (c) 1988, 1989, 1990 The Regents of the University of California.
5 * All rights reserved.
6 *
7 * This code is derived from software contributed to Berkeley by
8 * Adam de Boor.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 * 3. Neither the name of the University nor the names of its contributors
19 * may be used to endorse or promote products derived from this software
20 * without specific prior written permission.
21 *
22 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 * SUCH DAMAGE.
33 */
34
35 /*
36 * Copyright (c) 1988, 1989 by Adam de Boor
37 * Copyright (c) 1989 by Berkeley Softworks
38 * All rights reserved.
39 *
40 * This code is derived from software contributed to Berkeley by
41 * Adam de Boor.
42 *
43 * Redistribution and use in source and binary forms, with or without
44 * modification, are permitted provided that the following conditions
45 * are met:
46 * 1. Redistributions of source code must retain the above copyright
47 * notice, this list of conditions and the following disclaimer.
48 * 2. Redistributions in binary form must reproduce the above copyright
49 * notice, this list of conditions and the following disclaimer in the
50 * documentation and/or other materials provided with the distribution.
51 * 3. All advertising materials mentioning features or use of this software
52 * must display the following acknowledgement:
53 * This product includes software developed by the University of
54 * California, Berkeley and its contributors.
55 * 4. Neither the name of the University nor the names of its contributors
56 * may be used to endorse or promote products derived from this software
57 * without specific prior written permission.
58 *
59 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
60 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
61 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
62 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
63 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
64 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
65 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
66 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
67 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
68 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
69 * SUCH DAMAGE.
70 */
71
72 /* Handling of conditionals in a makefile.
73 *
74 * Interface:
75 * Cond_EvalLine Evaluate the conditional directive, such as
76 * '.if <cond>', '.elifnmake <cond>', '.else', '.endif'.
77 *
78 * Cond_EvalCondition
79 * Evaluate the conditional, which is either the argument
80 * of one of the .if directives or the condition in a
81 * ':?then:else' variable modifier.
82 *
83 * Cond_save_depth
84 * Cond_restore_depth
85 * Save and restore the nesting of the conditions, at
86 * the start and end of including another makefile, to
87 * ensure that in each makefile the conditional
88 * directives are well-balanced.
89 */
90
91 #include <errno.h>
92
93 #include "make.h"
94 #include "dir.h"
95
96 /* "@(#)cond.c 8.2 (Berkeley) 1/2/94" */
97 MAKE_RCSID("$NetBSD: cond.c,v 1.209 2020/11/12 20:16:20 rillig Exp $");
98
99 /*
100 * The parsing of conditional expressions is based on this grammar:
101 * E -> F || E
102 * E -> F
103 * F -> T && F
104 * F -> T
105 * T -> defined(variable)
106 * T -> make(target)
107 * T -> exists(file)
108 * T -> empty(varspec)
109 * T -> target(name)
110 * T -> commands(name)
111 * T -> symbol
112 * T -> $(varspec) op value
113 * T -> $(varspec) == "string"
114 * T -> $(varspec) != "string"
115 * T -> "string"
116 * T -> ( E )
117 * T -> ! T
118 * op -> == | != | > | < | >= | <=
119 *
120 * 'symbol' is some other symbol to which the default function is applied.
121 *
122 * The tokens are scanned by CondToken, which returns:
123 * TOK_AND for '&' or '&&'
124 * TOK_OR for '|' or '||'
125 * TOK_NOT for '!'
126 * TOK_LPAREN for '('
127 * TOK_RPAREN for ')'
 * All other terminal symbols are evaluated right away, using either the
 * function named in the terminal or the default function of the directive;
 * for these, CondToken returns either TOK_TRUE or TOK_FALSE.
131 *
132 * TOK_FALSE is 0 and TOK_TRUE 1 so we can directly assign C comparisons.
133 *
134 * All non-terminal functions (CondParser_Expr, CondParser_Factor and
135 * CondParser_Term) return either TOK_FALSE, TOK_TRUE, or TOK_ERROR on error.
136 */
typedef enum Token {
    TOK_FALSE = 0,      /* must be 0 so that C comparisons can be assigned */
    TOK_TRUE = 1,       /* must be 1 so that C comparisons can be assigned */
    TOK_AND,
    TOK_OR,
    TOK_NOT,
    TOK_LPAREN,
    TOK_RPAREN,
    TOK_EOF,
    TOK_NONE,           /* marks an empty push-back slot */
    TOK_ERROR
} Token;
141
142 typedef struct CondParser {
143 const struct If *if_info; /* Info for current statement */
144 const char *p; /* The remaining condition to parse */
145 Token curr; /* Single push-back token used in parsing */
146
147 /* Whether an error message has already been printed for this condition.
148 * The first available error message is usually the most specific one,
149 * therefore it makes sense to suppress the standard "Malformed
150 * conditional" message. */
151 Boolean printedError;
152 } CondParser;
153
154 static Token CondParser_Expr(CondParser *par, Boolean);
155
156 static unsigned int cond_depth = 0; /* current .if nesting level */
157 static unsigned int cond_min_depth = 0; /* depth at makefile open */
158
159 /*
160 * Indicate when we should be strict about lhs of comparisons.
161 * In strict mode, the lhs must be a variable expression or a string literal
162 * in quotes. In non-strict mode it may also be an unquoted string literal.
163 *
164 * TRUE when CondEvalExpression is called from Cond_EvalLine (.if etc)
165 * FALSE when CondEvalExpression is called from ApplyModifier_IfElse
166 * since lhs is already expanded, and at that point we cannot tell if
167 * it was a variable reference or not.
168 */
169 static Boolean lhsStrict;
170
/*
 * Return nonzero if str starts with the first len bytes of tok and the
 * character following that prefix in str is not a letter.
 */
static int
is_token(const char *str, const char *tok, size_t len)
{
    if (strncmp(str, tok, len) != 0)
        return 0;
    return !ch_isalpha(str[len]);
}
176
177 static Token
178 ToToken(Boolean cond)
179 {
180 return cond ? TOK_TRUE : TOK_FALSE;
181 }
182
183 /* Push back the most recent token read. We only need one level of this. */
184 static void
185 CondParser_PushBack(CondParser *par, Token t)
186 {
187 assert(par->curr == TOK_NONE);
188 assert(t != TOK_NONE);
189
190 par->curr = t;
191 }
192
193 static void
194 CondParser_SkipWhitespace(CondParser *par)
195 {
196 cpp_skip_whitespace(&par->p);
197 }
198
199 /* Parse the argument of a built-in function.
200 *
201 * Arguments:
202 * *pp initially points at the '(',
203 * upon successful return it points right after the ')'.
204 *
205 * *out_arg receives the argument as string.
206 *
207 * func says whether the argument belongs to an actual function, or
208 * whether the parsed argument is passed to the default function.
209 *
210 * Return the length of the argument, or 0 on error. */
211 static size_t
212 ParseFuncArg(const char **pp, Boolean doEval, const char *func,
213 char **out_arg) {
214 const char *p = *pp;
215 Buffer argBuf;
216 int paren_depth;
217 size_t argLen;
218
219 if (func != NULL)
220 p++; /* Skip opening '(' - verified by caller */
221
222 if (*p == '\0') {
223 *out_arg = NULL; /* Missing closing parenthesis: */
224 return 0; /* .if defined( */
225 }
226
227 cpp_skip_hspace(&p);
228
229 Buf_InitSize(&argBuf, 16);
230
231 paren_depth = 0;
232 for (;;) {
233 char ch = *p;
234 if (ch == '\0' || ch == ' ' || ch == '\t')
235 break;
236 if ((ch == '&' || ch == '|') && paren_depth == 0)
237 break;
238 if (*p == '$') {
239 /*
240 * Parse the variable spec and install it as part of the argument
241 * if it's valid. We tell Var_Parse to complain on an undefined
242 * variable, so we don't need to do it. Nor do we return an error,
243 * though perhaps we should...
244 */
245 void *nestedVal_freeIt;
246 VarEvalFlags eflags = doEval ? VARE_WANTRES | VARE_UNDEFERR
247 : VARE_NONE;
248 const char *nestedVal;
249 (void)Var_Parse(&p, VAR_CMDLINE, eflags, &nestedVal,
250 &nestedVal_freeIt);
251 /* TODO: handle errors */
252 Buf_AddStr(&argBuf, nestedVal);
253 free(nestedVal_freeIt);
254 continue;
255 }
256 if (ch == '(')
257 paren_depth++;
258 else if (ch == ')' && --paren_depth < 0)
259 break;
260 Buf_AddByte(&argBuf, *p);
261 p++;
262 }
263
264 *out_arg = Buf_GetAll(&argBuf, &argLen);
265 Buf_Destroy(&argBuf, FALSE);
266
267 cpp_skip_hspace(&p);
268
269 if (func != NULL && *p++ != ')') {
270 Parse_Error(PARSE_WARNING, "Missing closing parenthesis for %s()",
271 func);
272 /* The PARSE_FATAL is done as a follow-up by CondEvalExpression. */
273 return 0;
274 }
275
276 *pp = p;
277 return argLen;
278 }
279
280 /* Test whether the given variable is defined. */
281 static Boolean
282 FuncDefined(size_t argLen MAKE_ATTR_UNUSED, const char *arg)
283 {
284 void *freeIt;
285 Boolean result = Var_Value(arg, VAR_CMDLINE, &freeIt) != NULL;
286 bmake_free(freeIt);
287 return result;
288 }
289
290 /* See if the given target is being made. */
291 static Boolean
292 FuncMake(size_t argLen MAKE_ATTR_UNUSED, const char *arg)
293 {
294 StringListNode *ln;
295
296 for (ln = opts.create->first; ln != NULL; ln = ln->next)
297 if (Str_Match(ln->datum, arg))
298 return TRUE;
299 return FALSE;
300 }
301
302 /* See if the given file exists. */
303 static Boolean
304 FuncExists(size_t argLen MAKE_ATTR_UNUSED, const char *arg)
305 {
306 Boolean result;
307 char *path;
308
309 path = Dir_FindFile(arg, dirSearchPath);
310 DEBUG2(COND, "exists(%s) result is \"%s\"\n",
311 arg, path != NULL ? path : "");
312 result = path != NULL;
313 free(path);
314 return result;
315 }
316
317 /* See if the given node exists and is an actual target. */
318 static Boolean
319 FuncTarget(size_t argLen MAKE_ATTR_UNUSED, const char *arg)
320 {
321 GNode *gn = Targ_FindNode(arg);
322 return gn != NULL && GNode_IsTarget(gn);
323 }
324
325 /* See if the given node exists and is an actual target with commands
326 * associated with it. */
327 static Boolean
328 FuncCommands(size_t argLen MAKE_ATTR_UNUSED, const char *arg)
329 {
330 GNode *gn = Targ_FindNode(arg);
331 return gn != NULL && GNode_IsTarget(gn) && !Lst_IsEmpty(gn->commands);
332 }
333
334 /*
335 * Convert the given number into a double.
336 * We try a base 10 or 16 integer conversion first, if that fails
337 * then we try a floating point conversion instead.
338 *
339 * Results:
340 * Returns TRUE if the conversion succeeded.
341 * Sets 'out_value' to the converted number.
342 */
343 static Boolean
344 TryParseNumber(const char *str, double *out_value)
345 {
346 char *end;
347 unsigned long ul_val;
348 double dbl_val;
349
350 errno = 0;
351 if (str[0] == '\0') { /* XXX: why is an empty string a number? */
352 *out_value = 0.0;
353 return TRUE;
354 }
355
356 ul_val = strtoul(str, &end, str[1] == 'x' ? 16 : 10);
357 if (*end == '\0' && errno != ERANGE) {
358 *out_value = str[0] == '-' ? -(double)-ul_val : (double)ul_val;
359 return TRUE;
360 }
361
362 if (*end != '\0' && *end != '.' && *end != 'e' && *end != 'E')
363 return FALSE; /* skip the expensive strtod call */
364 dbl_val = strtod(str, &end);
365 if (*end != '\0')
366 return FALSE;
367
368 *out_value = dbl_val;
369 return TRUE;
370 }
371
372 static Boolean
373 is_separator(char ch)
374 {
375 return ch == '\0' || ch_isspace(ch) || strchr("!=><)", ch) != NULL;
376 }
377
378 /*-
379 * Parse a string from a variable reference or an optionally quoted
380 * string. This is called for the lhs and rhs of string comparisons.
381 *
382 * Results:
383 * Returns the string, absent any quotes, or NULL on error.
384 * Sets out_quoted if the string was quoted.
385 * Sets out_freeIt.
386 */
387 /* coverity:[+alloc : arg-*4] */
388 static const char *
389 CondParser_String(CondParser *par, Boolean doEval, Boolean strictLHS,
390 Boolean *out_quoted, void **out_freeIt)
391 {
392 Buffer buf;
393 const char *str;
394 Boolean atStart;
395 const char *nested_p;
396 Boolean quoted;
397 const char *start;
398 VarEvalFlags eflags;
399 VarParseResult parseResult;
400
401 Buf_Init(&buf);
402 str = NULL;
403 *out_freeIt = NULL;
404 *out_quoted = quoted = par->p[0] == '"';
405 start = par->p;
406 if (quoted)
407 par->p++;
408 while (par->p[0] != '\0' && str == NULL) {
409 switch (par->p[0]) {
410 case '\\':
411 par->p++;
412 if (par->p[0] != '\0') {
413 Buf_AddByte(&buf, par->p[0]);
414 par->p++;
415 }
416 continue;
417 case '"':
418 if (quoted) {
419 par->p++; /* skip the closing quote */
420 goto got_str;
421 }
422 Buf_AddByte(&buf, par->p[0]); /* likely? */
423 par->p++;
424 continue;
425 case ')': /* see is_separator */
426 case '!':
427 case '=':
428 case '>':
429 case '<':
430 case ' ':
431 case '\t':
432 if (!quoted)
433 goto got_str;
434 Buf_AddByte(&buf, par->p[0]);
435 par->p++;
436 continue;
437 case '$':
438 /* if we are in quotes, an undefined variable is ok */
439 eflags = doEval && !quoted ? VARE_WANTRES | VARE_UNDEFERR :
440 doEval ? VARE_WANTRES :
441 VARE_NONE;
442
443 nested_p = par->p;
444 atStart = nested_p == start;
445 parseResult = Var_Parse(&nested_p, VAR_CMDLINE, eflags, &str,
446 out_freeIt);
447 /* TODO: handle errors */
448 if (str == var_Error) {
449 if (parseResult & VPR_ANY_MSG)
450 par->printedError = TRUE;
451 if (*out_freeIt != NULL) {
452 /* XXX: Can there be any situation in which a returned
453 * var_Error requires freeIt? */
454 free(*out_freeIt);
455 *out_freeIt = NULL;
456 }
457 /*
458 * Even if !doEval, we still report syntax errors, which
459 * is what getting var_Error back with !doEval means.
460 */
461 str = NULL;
462 goto cleanup;
463 }
464 par->p = nested_p;
465
466 /*
467 * If the '$' started the string literal (which means no quotes),
468 * and the variable expression is followed by a space, looks like
469 * a comparison operator or is the end of the expression, we are
470 * done.
471 */
472 if (atStart && is_separator(par->p[0]))
473 goto cleanup;
474
475 Buf_AddStr(&buf, str);
476 if (*out_freeIt) {
477 free(*out_freeIt);
478 *out_freeIt = NULL;
479 }
480 str = NULL; /* not finished yet */
481 continue;
482 default:
483 if (strictLHS && !quoted && *start != '$' && !ch_isdigit(*start)) {
484 /* lhs must be quoted, a variable reference or number */
485 str = NULL;
486 goto cleanup;
487 }
488 Buf_AddByte(&buf, par->p[0]);
489 par->p++;
490 continue;
491 }
492 }
493 got_str:
494 *out_freeIt = Buf_GetAll(&buf, NULL);
495 str = *out_freeIt;
496 cleanup:
497 Buf_Destroy(&buf, FALSE);
498 return str;
499 }
500
501 struct If {
502 const char *form; /* Form of if */
503 size_t formlen; /* Length of form */
504 Boolean doNot; /* TRUE if default function should be negated */
505 Boolean (*defProc)(size_t, const char *); /* Default function to apply */
506 };
507
508 /* The different forms of .if directives. */
509 static const struct If ifs[] = {
510 { "def", 3, FALSE, FuncDefined },
511 { "ndef", 4, TRUE, FuncDefined },
512 { "make", 4, FALSE, FuncMake },
513 { "nmake", 5, TRUE, FuncMake },
514 { "", 0, FALSE, FuncDefined },
515 { NULL, 0, FALSE, NULL }
516 };
517 enum { PLAIN_IF_INDEX = 4 };
518
519 static Boolean
520 If_Eval(const struct If *if_info, const char *arg, size_t arglen)
521 {
522 Boolean res = if_info->defProc(arglen, arg);
523 return if_info->doNot ? !res : res;
524 }
525
526 /* Evaluate a "comparison without operator", such as in ".if ${VAR}" or
527 * ".if 0". */
528 static Boolean
529 EvalNotEmpty(CondParser *par, const char *value, Boolean quoted)
530 {
531 double num;
532
533 /* For .ifxxx "...", check for non-empty string. */
534 if (quoted)
535 return value[0] != '\0';
536
537 /* For .ifxxx <number>, compare against zero */
538 if (TryParseNumber(value, &num))
539 return num != 0.0;
540
541 /* For .if ${...}, check for non-empty string. This is different from
542 * the evaluation function from that .if variant, which would test
543 * whether a variable of the given name were defined. */
544 /* XXX: Whitespace should count as empty, just as in ParseEmptyArg. */
545 if (par->if_info->form[0] == '\0')
546 return value[0] != '\0';
547
548 /* For the other variants of .ifxxx ${...}, use its default function. */
549 return If_Eval(par->if_info, value, strlen(value));
550 }
551
552 /* Evaluate a numerical comparison, such as in ".if ${VAR} >= 9". */
553 static Token
554 EvalCompareNum(double lhs, const char *op, double rhs)
555 {
556 DEBUG3(COND, "lhs = %f, rhs = %f, op = %.2s\n", lhs, rhs, op);
557
558 switch (op[0]) {
559 case '!':
560 if (op[1] != '=') {
561 Parse_Error(PARSE_WARNING, "Unknown operator");
562 /* The PARSE_FATAL is done as a follow-up by CondEvalExpression. */
563 return TOK_ERROR;
564 }
565 return ToToken(lhs != rhs);
566 case '=':
567 if (op[1] != '=') {
568 Parse_Error(PARSE_WARNING, "Unknown operator");
569 /* The PARSE_FATAL is done as a follow-up by CondEvalExpression. */
570 return TOK_ERROR;
571 }
572 return ToToken(lhs == rhs);
573 case '<':
574 return ToToken(op[1] == '=' ? lhs <= rhs : lhs < rhs);
575 case '>':
576 return ToToken(op[1] == '=' ? lhs >= rhs : lhs > rhs);
577 }
578 return TOK_ERROR;
579 }
580
581 static Token
582 EvalCompareStr(const char *lhs, const char *op, const char *rhs)
583 {
584 if (!((op[0] == '!' || op[0] == '=') && op[1] == '=')) {
585 Parse_Error(PARSE_WARNING,
586 "String comparison operator must be either == or !=");
587 /* The PARSE_FATAL is done as a follow-up by CondEvalExpression. */
588 return TOK_ERROR;
589 }
590
591 DEBUG3(COND, "lhs = \"%s\", rhs = \"%s\", op = %.2s\n", lhs, rhs, op);
592 return ToToken((*op == '=') == (strcmp(lhs, rhs) == 0));
593 }
594
595 /* Evaluate a comparison, such as "${VAR} == 12345". */
596 static Token
597 EvalCompare(const char *lhs, Boolean lhsQuoted, const char *op,
598 const char *rhs, Boolean rhsQuoted)
599 {
600 double left, right;
601
602 if (!rhsQuoted && !lhsQuoted)
603 if (TryParseNumber(lhs, &left) && TryParseNumber(rhs, &right))
604 return EvalCompareNum(left, op, right);
605
606 return EvalCompareStr(lhs, op, rhs);
607 }
608
609 /* Parse a comparison condition such as:
610 *
611 * 0
612 * ${VAR:Mpattern}
613 * ${VAR} == value
614 * ${VAR:U0} < 12345
615 */
616 static Token
617 CondParser_Comparison(CondParser *par, Boolean doEval)
618 {
619 Token t = TOK_ERROR;
620 const char *lhs, *op, *rhs;
621 void *lhs_freeIt, *rhs_freeIt;
622 Boolean lhsQuoted, rhsQuoted;
623
624 /*
625 * Parse the variable spec and skip over it, saving its
626 * value in lhs.
627 */
628 lhs = CondParser_String(par, doEval, lhsStrict, &lhsQuoted, &lhs_freeIt);
629 if (lhs == NULL)
630 goto done_lhs;
631
632 CondParser_SkipWhitespace(par);
633
634 op = par->p;
635 switch (par->p[0]) {
636 case '!':
637 case '=':
638 case '<':
639 case '>':
640 if (par->p[1] == '=')
641 par->p += 2;
642 else
643 par->p++;
644 break;
645 default:
646 /* Unknown operator, compare against an empty string or 0. */
647 t = ToToken(doEval && EvalNotEmpty(par, lhs, lhsQuoted));
648 goto done_lhs;
649 }
650
651 CondParser_SkipWhitespace(par);
652
653 if (par->p[0] == '\0') {
654 Parse_Error(PARSE_WARNING, "Missing right-hand-side of operator");
655 /* The PARSE_FATAL is done as a follow-up by CondEvalExpression. */
656 goto done_lhs;
657 }
658
659 rhs = CondParser_String(par, doEval, FALSE, &rhsQuoted, &rhs_freeIt);
660 if (rhs == NULL)
661 goto done_rhs;
662
663 if (!doEval) {
664 t = TOK_FALSE;
665 goto done_rhs;
666 }
667
668 t = EvalCompare(lhs, lhsQuoted, op, rhs, rhsQuoted);
669
670 done_rhs:
671 free(rhs_freeIt);
672 done_lhs:
673 free(lhs_freeIt);
674 return t;
675 }
676
677 /* The argument to empty() is a variable name, optionally followed by
678 * variable modifiers. */
679 static size_t
680 ParseEmptyArg(const char **pp, Boolean doEval,
681 const char *func MAKE_ATTR_UNUSED, char **out_arg)
682 {
683 void *val_freeIt;
684 const char *val;
685 size_t magic_res;
686
687 /* We do all the work here and return the result as the length */
688 *out_arg = NULL;
689
690 (*pp)--; /* Make (*pp)[1] point to the '('. */
691 (void)Var_Parse(pp, VAR_CMDLINE, doEval ? VARE_WANTRES : VARE_NONE,
692 &val, &val_freeIt);
693 /* TODO: handle errors */
694 /* If successful, *pp points beyond the closing ')' now. */
695
696 if (val == var_Error) {
697 free(val_freeIt);
698 return (size_t)-1;
699 }
700
701 /* A variable is empty when it just contains spaces... 4/15/92, christos */
702 cpp_skip_whitespace(&val);
703
704 /*
705 * For consistency with the other functions we can't generate the
706 * true/false here.
707 */
708 magic_res = *val != '\0' ? 2 : 1;
709 free(val_freeIt);
710 return magic_res;
711 }
712
713 static Boolean
714 FuncEmpty(size_t arglen, const char *arg MAKE_ATTR_UNUSED)
715 {
716 /* Magic values ahead, see ParseEmptyArg. */
717 return arglen == 1;
718 }
719
720 static Boolean
721 CondParser_Func(CondParser *par, Boolean doEval, Token *out_token)
722 {
723 static const struct fn_def {
724 const char *fn_name;
725 size_t fn_name_len;
726 size_t (*fn_parse)(const char **, Boolean, const char *, char **);
727 Boolean (*fn_eval)(size_t, const char *);
728 } fns[] = {
729 { "defined", 7, ParseFuncArg, FuncDefined },
730 { "make", 4, ParseFuncArg, FuncMake },
731 { "exists", 6, ParseFuncArg, FuncExists },
732 { "empty", 5, ParseEmptyArg, FuncEmpty },
733 { "target", 6, ParseFuncArg, FuncTarget },
734 { "commands", 8, ParseFuncArg, FuncCommands }
735 };
736 const struct fn_def *fn;
737 char *arg = NULL;
738 size_t arglen;
739 const char *cp = par->p;
740 const struct fn_def *fns_end = fns + sizeof fns / sizeof fns[0];
741
742 for (fn = fns; fn != fns_end; fn++) {
743 if (!is_token(cp, fn->fn_name, fn->fn_name_len))
744 continue;
745
746 cp += fn->fn_name_len;
747 cpp_skip_whitespace(&cp);
748 if (*cp != '(')
749 break;
750
751 arglen = fn->fn_parse(&cp, doEval, fn->fn_name, &arg);
752 if (arglen == 0 || arglen == (size_t)-1) {
753 par->p = cp;
754 *out_token = arglen == 0 ? TOK_FALSE : TOK_ERROR;
755 return TRUE;
756 }
757
758 /* Evaluate the argument using the required function. */
759 *out_token = ToToken(!doEval || fn->fn_eval(arglen, arg));
760 free(arg);
761 par->p = cp;
762 return TRUE;
763 }
764
765 return FALSE;
766 }
767
768 /* Parse a function call, a number, a variable expression or a string
769 * literal. */
770 static Token
771 CondParser_LeafToken(CondParser *par, Boolean doEval)
772 {
773 Token t;
774 char *arg = NULL;
775 size_t arglen;
776 const char *cp = par->p;
777 const char *cp1;
778
779 if (CondParser_Func(par, doEval, &t))
780 return t;
781
782 /* Push anything numeric through the compare expression */
783 cp = par->p;
784 if (ch_isdigit(cp[0]) || cp[0] == '-' || cp[0] == '+')
785 return CondParser_Comparison(par, doEval);
786
787 /*
788 * Most likely we have a naked token to apply the default function to.
789 * However ".if a == b" gets here when the "a" is unquoted and doesn't
790 * start with a '$'. This surprises people.
791 * If what follows the function argument is a '=' or '!' then the syntax
792 * would be invalid if we did "defined(a)" - so instead treat as an
793 * expression.
794 */
795 arglen = ParseFuncArg(&cp, doEval, NULL, &arg);
796 cp1 = cp;
797 cpp_skip_whitespace(&cp1);
798 if (*cp1 == '=' || *cp1 == '!')
799 return CondParser_Comparison(par, doEval);
800 par->p = cp;
801
802 /*
803 * Evaluate the argument using the default function.
804 * This path always treats .if as .ifdef. To get here, the character
805 * after .if must have been taken literally, so the argument cannot
806 * be empty - even if it contained a variable expansion.
807 */
808 t = ToToken(!doEval || If_Eval(par->if_info, arg, arglen));
809 free(arg);
810 return t;
811 }
812
813 /* Return the next token or comparison result from the parser. */
814 static Token
815 CondParser_Token(CondParser *par, Boolean doEval)
816 {
817 Token t;
818
819 t = par->curr;
820 if (t != TOK_NONE) {
821 par->curr = TOK_NONE;
822 return t;
823 }
824
825 cpp_skip_hspace(&par->p);
826
827 switch (par->p[0]) {
828
829 case '(':
830 par->p++;
831 return TOK_LPAREN;
832
833 case ')':
834 par->p++;
835 return TOK_RPAREN;
836
837 case '|':
838 par->p++;
839 if (par->p[0] == '|')
840 par->p++;
841 else if (opts.lint) {
842 Parse_Error(PARSE_FATAL, "Unknown operator '|'");
843 par->printedError = TRUE;
844 return TOK_ERROR;
845 }
846 return TOK_OR;
847
848 case '&':
849 par->p++;
850 if (par->p[0] == '&')
851 par->p++;
852 else if (opts.lint) {
853 Parse_Error(PARSE_FATAL, "Unknown operator '&'");
854 par->printedError = TRUE;
855 return TOK_ERROR;
856 }
857 return TOK_AND;
858
859 case '!':
860 par->p++;
861 return TOK_NOT;
862
863 case '#': /* XXX: see unit-tests/cond-token-plain.mk */
864 case '\n': /* XXX: why should this end the condition? */
865 /* Probably obsolete now, from 1993-03-21. */
866 case '\0':
867 return TOK_EOF;
868
869 case '"':
870 case '$':
871 return CondParser_Comparison(par, doEval);
872
873 default:
874 return CondParser_LeafToken(par, doEval);
875 }
876 }
877
878 /* Parse a single term in the expression. This consists of a terminal symbol
879 * or TOK_NOT and a term (not including the binary operators):
880 *
881 * T -> defined(variable) | make(target) | exists(file) | symbol
882 * T -> ! T | ( E )
883 *
884 * Results:
885 * TOK_TRUE, TOK_FALSE or TOK_ERROR.
886 */
887 static Token
888 CondParser_Term(CondParser *par, Boolean doEval)
889 {
890 Token t;
891
892 t = CondParser_Token(par, doEval);
893
894 if (t == TOK_EOF) {
895 /*
896 * If we reached the end of the expression, the expression
897 * is malformed...
898 */
899 t = TOK_ERROR;
900 } else if (t == TOK_LPAREN) {
901 /*
902 * T -> ( E )
903 */
904 t = CondParser_Expr(par, doEval);
905 if (t != TOK_ERROR) {
906 if (CondParser_Token(par, doEval) != TOK_RPAREN) {
907 t = TOK_ERROR;
908 }
909 }
910 } else if (t == TOK_NOT) {
911 t = CondParser_Term(par, doEval);
912 if (t == TOK_TRUE) {
913 t = TOK_FALSE;
914 } else if (t == TOK_FALSE) {
915 t = TOK_TRUE;
916 }
917 }
918 return t;
919 }
920
921 /* Parse a conjunctive factor (nice name, wot?)
922 *
923 * F -> T && F | T
924 *
925 * Results:
926 * TOK_TRUE, TOK_FALSE or TOK_ERROR
927 */
928 static Token
929 CondParser_Factor(CondParser *par, Boolean doEval)
930 {
931 Token l, o;
932
933 l = CondParser_Term(par, doEval);
934 if (l != TOK_ERROR) {
935 o = CondParser_Token(par, doEval);
936
937 if (o == TOK_AND) {
938 /*
939 * F -> T && F
940 *
941 * If T is TOK_FALSE, the whole thing will be TOK_FALSE, but we
942 * have to parse the r.h.s. anyway (to throw it away).
943 * If T is TOK_TRUE, the result is the r.h.s., be it a TOK_ERROR
944 * or not.
945 */
946 if (l == TOK_TRUE) {
947 l = CondParser_Factor(par, doEval);
948 } else {
949 (void)CondParser_Factor(par, FALSE);
950 }
951 } else {
952 /*
953 * F -> T
954 */
955 CondParser_PushBack(par, o);
956 }
957 }
958 return l;
959 }
960
961 /* Main expression production.
962 *
963 * E -> F || E | F
964 *
965 * Results:
966 * TOK_TRUE, TOK_FALSE or TOK_ERROR.
967 */
968 static Token
969 CondParser_Expr(CondParser *par, Boolean doEval)
970 {
971 Token l, o;
972
973 l = CondParser_Factor(par, doEval);
974 if (l != TOK_ERROR) {
975 o = CondParser_Token(par, doEval);
976
977 if (o == TOK_OR) {
978 /*
979 * E -> F || E
980 *
981 * A similar thing occurs for ||, except that here we make sure
982 * the l.h.s. is TOK_FALSE before we bother to evaluate the r.h.s.
983 * Once again, if l is TOK_FALSE, the result is the r.h.s. and once
984 * again if l is TOK_TRUE, we parse the r.h.s. to throw it away.
985 */
986 if (l == TOK_FALSE) {
987 l = CondParser_Expr(par, doEval);
988 } else {
989 (void)CondParser_Expr(par, FALSE);
990 }
991 } else {
992 /*
993 * E -> F
994 */
995 CondParser_PushBack(par, o);
996 }
997 }
998 return l;
999 }
1000
1001 static CondEvalResult
1002 CondParser_Eval(CondParser *par, Boolean *value)
1003 {
1004 Token res;
1005
1006 DEBUG1(COND, "CondParser_Eval: %s\n", par->p);
1007
1008 res = CondParser_Expr(par, TRUE);
1009 if (res != TOK_FALSE && res != TOK_TRUE)
1010 return COND_INVALID;
1011
1012 if (CondParser_Token(par, TRUE /* XXX: Why TRUE? */) != TOK_EOF)
1013 return COND_INVALID;
1014
1015 *value = res == TOK_TRUE;
1016 return COND_PARSE;
1017 }
1018
1019 /* Evaluate the condition, including any side effects from the variable
1020 * expressions in the condition. The condition consists of &&, ||, !,
1021 * function(arg), comparisons and parenthetical groupings thereof.
1022 *
1023 * Results:
1024 * COND_PARSE if the condition was valid grammatically
1025 * COND_INVALID if not a valid conditional.
1026 *
1027 * (*value) is set to the boolean value of the condition
1028 */
1029 static CondEvalResult
1030 CondEvalExpression(const struct If *info, const char *cond, Boolean *value,
1031 Boolean eprint, Boolean strictLHS)
1032 {
1033 CondParser par;
1034 CondEvalResult rval;
1035
1036 lhsStrict = strictLHS;
1037
1038 cpp_skip_hspace(&cond);
1039
1040 par.if_info = info != NULL ? info : ifs + PLAIN_IF_INDEX;
1041 par.p = cond;
1042 par.curr = TOK_NONE;
1043 par.printedError = FALSE;
1044
1045 rval = CondParser_Eval(&par, value);
1046
1047 if (rval == COND_INVALID && eprint && !par.printedError)
1048 Parse_Error(PARSE_FATAL, "Malformed conditional (%s)", cond);
1049
1050 return rval;
1051 }
1052
1053 /* Evaluate a condition in a :? modifier, such as
1054 * ${"${VAR}" == value:?yes:no}. */
1055 CondEvalResult
1056 Cond_EvalCondition(const char *cond, Boolean *out_value)
1057 {
1058 return CondEvalExpression(NULL, cond, out_value, FALSE, FALSE);
1059 }
1060
1061 /* Evaluate the conditional directive in the line, which is one of:
1062 *
1063 * .if <cond>
1064 * .ifmake <cond>
1065 * .ifnmake <cond>
1066 * .ifdef <cond>
1067 * .ifndef <cond>
1068 * .elif <cond>
1069 * .elifmake <cond>
1070 * .elifnmake <cond>
1071 * .elifdef <cond>
1072 * .elifndef <cond>
1073 * .else
1074 * .endif
1075 *
1076 * In these directives, <cond> consists of &&, ||, !, function(arg),
1077 * comparisons, expressions, bare words, numbers and strings, and
1078 * parenthetical groupings thereof.
1079 *
1080 * Results:
1081 * COND_PARSE to continue parsing the lines that follow the
1082 * conditional (when <cond> evaluates to TRUE)
1083 * COND_SKIP to skip the lines after the conditional
1084 * (when <cond> evaluates to FALSE, or when a previous
1085 * branch has already been taken)
1086 * COND_INVALID if the conditional was not valid, either because of
1087 * a syntax error or because some variable was undefined
1088 * or because the condition could not be evaluated
1089 */
1090 CondEvalResult
1091 Cond_EvalLine(const char *const line)
1092 {
1093 typedef enum IfState {
1094
1095 /* The previous <cond> evaluated to TRUE. The lines following this
1096 * condition are interpreted. */
1097 IF_ACTIVE,
1098
1099 /* The previous '.else' evaluated to TRUE. The lines following this
1100 * condition are interpreted. The only difference to IF_ACTIVE is
1101 * that no other '.else' may follow. */
1102 ELSE_ACTIVE,
1103
1104 /* None of the previous <cond> evaluated to TRUE. Still searching
1105 * for an '.elif' or an 'else' that evaluates to TRUE. */
1106 SEARCH_FOR_ELIF,
1107
1108 /* One of the previous <cond> evaluated to TRUE. There was no '.else'
1109 * yet. */
1110 SKIP_TO_ELSE,
1111
1112 /* One of the previous <cond> evaluated to TRUE, and '.else' was
1113 * already seen. No other '.else' may follow. */
1114 SKIP_TO_ENDIF
1115
1116 } IfState;
1117
1118 static enum IfState *cond_states = NULL;
1119 static unsigned int cond_states_cap = 128;
1120
1121 const struct If *ifp;
1122 Boolean isElif;
1123 Boolean value;
1124 IfState state;
1125 const char *p = line;
1126
1127 if (cond_states == NULL) {
1128 cond_states = bmake_malloc(cond_states_cap * sizeof *cond_states);
1129 cond_states[0] = IF_ACTIVE;
1130 }
1131 p++; /* skip the leading '.' */
1132 cpp_skip_hspace(&p);
1133
1134 /* Find what type of if we're dealing with. */
1135 if (p[0] == 'e') {
1136 if (p[1] != 'l') {
1137 if (!is_token(p + 1, "ndif", 4)) { /* It is an '.endif'. */
1138 /* TODO: check for extraneous <cond> */
1139 return COND_INVALID;
1140 }
1141 /* End of conditional section */
1142 if (cond_depth == cond_min_depth) {
1143 Parse_Error(PARSE_FATAL, "if-less endif");
1144 return COND_PARSE;
1145 }
1146 /* Return state for previous conditional */
1147 cond_depth--;
1148 return cond_states[cond_depth] <= ELSE_ACTIVE
1149 ? COND_PARSE : COND_SKIP;
1150 }
1151
1152 /* Quite likely this is 'else' or 'elif' */
1153 p += 2;
1154 if (is_token(p, "se", 2)) { /* It is an 'else'. */
1155
1156 /* TODO: check for extraneous <cond> */
1157
1158 if (cond_depth == cond_min_depth) {
1159 Parse_Error(PARSE_FATAL, "if-less else");
1160 return COND_PARSE;
1161 }
1162
1163 state = cond_states[cond_depth];
1164 switch (state) {
1165 case SEARCH_FOR_ELIF:
1166 state = ELSE_ACTIVE;
1167 break;
1168 case ELSE_ACTIVE:
1169 case SKIP_TO_ENDIF:
1170 Parse_Error(PARSE_WARNING, "extra else");
1171 /* FALLTHROUGH */
1172 default:
1173 case IF_ACTIVE:
1174 case SKIP_TO_ELSE:
1175 state = SKIP_TO_ENDIF;
1176 break;
1177 }
1178 cond_states[cond_depth] = state;
1179 return state <= ELSE_ACTIVE ? COND_PARSE : COND_SKIP;
1180 }
1181 /* Assume for now it is an elif */
1182 isElif = TRUE;
1183 } else
1184 isElif = FALSE;
1185
1186 if (p[0] != 'i' || p[1] != 'f') {
1187 /* TODO: Add error message about unknown directive.
1188 * See directive-elif.mk:23 */
1189 return COND_INVALID; /* Not an ifxxx or elifxxx line */
1190 }
1191
1192 /*
1193 * Figure out what sort of conditional it is -- what its default
1194 * function is, etc. -- by looking in the table of valid "ifs"
1195 */
1196 p += 2;
1197 for (ifp = ifs;; ifp++) {
1198 if (ifp->form == NULL) {
1199 /* TODO: Add error message about unknown directive,
1200 * since there is no other known directive that starts with 'el'
1201 * or 'if'.
1202 * Example: .elifx 123 */
1203 return COND_INVALID;
1204 }
1205 if (is_token(p, ifp->form, ifp->formlen)) {
1206 p += ifp->formlen;
1207 break;
1208 }
1209 }
1210
1211 /* Now we know what sort of 'if' it is... */
1212
1213 if (isElif) {
1214 if (cond_depth == cond_min_depth) {
1215 Parse_Error(PARSE_FATAL, "if-less elif");
1216 return COND_PARSE;
1217 }
1218 state = cond_states[cond_depth];
1219 if (state == SKIP_TO_ENDIF || state == ELSE_ACTIVE) {
1220 Parse_Error(PARSE_WARNING, "extra elif");
1221 cond_states[cond_depth] = SKIP_TO_ENDIF;
1222 return COND_SKIP;
1223 }
1224 if (state != SEARCH_FOR_ELIF) {
1225 /* Either just finished the 'true' block, or already SKIP_TO_ELSE */
1226 cond_states[cond_depth] = SKIP_TO_ELSE;
1227 return COND_SKIP;
1228 }
1229 } else {
1230 /* Normal .if */
1231 if (cond_depth + 1 >= cond_states_cap) {
1232 /*
1233 * This is rare, but not impossible.
1234 * In meta mode, dirdeps.mk (only runs at level 0)
1235 * can need more than the default.
1236 */
1237 cond_states_cap += 32;
1238 cond_states = bmake_realloc(cond_states,
1239 cond_states_cap * sizeof *cond_states);
1240 }
1241 state = cond_states[cond_depth];
1242 cond_depth++;
1243 if (state > ELSE_ACTIVE) {
1244 /* If we aren't parsing the data, treat as always false */
1245 cond_states[cond_depth] = SKIP_TO_ELSE;
1246 return COND_SKIP;
1247 }
1248 }
1249
1250 /* And evaluate the conditional expression */
1251 if (CondEvalExpression(ifp, p, &value, TRUE, TRUE) == COND_INVALID) {
1252 /* Syntax error in conditional, error message already output. */
1253 /* Skip everything to matching .endif */
1254 cond_states[cond_depth] = SKIP_TO_ELSE;
1255 return COND_SKIP;
1256 }
1257
1258 if (!value) {
1259 cond_states[cond_depth] = SEARCH_FOR_ELIF;
1260 return COND_SKIP;
1261 }
1262 cond_states[cond_depth] = IF_ACTIVE;
1263 return COND_PARSE;
1264 }
1265
1266 void
1267 Cond_restore_depth(unsigned int saved_depth)
1268 {
1269 unsigned int open_conds = cond_depth - cond_min_depth;
1270
1271 if (open_conds != 0 || saved_depth > cond_depth) {
1272 Parse_Error(PARSE_FATAL, "%u open conditional%s", open_conds,
1273 open_conds == 1 ? "" : "s");
1274 cond_depth = cond_min_depth;
1275 }
1276
1277 cond_min_depth = saved_depth;
1278 }
1279
1280 unsigned int
1281 Cond_save_depth(void)
1282 {
1283 unsigned int depth = cond_min_depth;
1284
1285 cond_min_depth = cond_depth;
1286 return depth;
1287 }
1288