Home | History | Annotate | Line # | Download | only in expr
expr.y revision 1.48
      1  1.48    rillig /* $NetBSD: expr.y,v 1.48 2025/03/15 09:33:02 rillig Exp $ */
      2  1.17  jdolecek 
      3  1.17  jdolecek /*_
      4  1.17  jdolecek  * Copyright (c) 2000 The NetBSD Foundation, Inc.
      5  1.17  jdolecek  * All rights reserved.
      6   1.2       cgd  *
      7  1.17  jdolecek  * This code is derived from software contributed to The NetBSD Foundation
      8  1.29     grant  * by Jaromir Dolecek <jdolecek (at) NetBSD.org> and J.T. Conklin <jtc (at) NetBSD.org>.
      9  1.11       jtc  *
     10  1.17  jdolecek  * Redistribution and use in source and binary forms, with or without
     11  1.17  jdolecek  * modification, are permitted provided that the following conditions
     12  1.17  jdolecek  * are met:
     13  1.17  jdolecek  * 1. Redistributions of source code must retain the above copyright
     14  1.17  jdolecek  *    notice, this list of conditions and the following disclaimer.
     15  1.17  jdolecek  * 2. Redistributions in binary form must reproduce the above copyright
     16  1.17  jdolecek  *    notice, this list of conditions and the following disclaimer in the
     17  1.17  jdolecek  *    documentation and/or other materials provided with the distribution.
     18  1.34    martin  *
     19  1.34    martin  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20  1.34    martin  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21  1.34    martin  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22  1.34    martin  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23  1.34    martin  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24  1.34    martin  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25  1.34    martin  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26  1.34    martin  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27  1.34    martin  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28  1.34    martin  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29  1.34    martin  * POSSIBILITY OF SUCH DAMAGE.
     30   1.1       cgd  */
     31  1.12       jtc 
     32  1.17  jdolecek %{
     33  1.17  jdolecek #include <sys/cdefs.h>
     34  1.17  jdolecek #ifndef lint
     35  1.48    rillig __RCSID("$NetBSD: expr.y,v 1.48 2025/03/15 09:33:02 rillig Exp $");
     36  1.17  jdolecek #endif /* not lint */
     37  1.17  jdolecek 
     38  1.17  jdolecek #include <sys/types.h>
     39  1.28       wiz 
     40  1.17  jdolecek #include <err.h>
     41  1.17  jdolecek #include <errno.h>
     42  1.17  jdolecek #include <limits.h>
     43  1.17  jdolecek #include <locale.h>
     44  1.17  jdolecek #include <regex.h>
     45  1.17  jdolecek #include <stdarg.h>
     46   1.1       cgd #include <stdio.h>
     47   1.4       cgd #include <stdlib.h>
     48   1.4       cgd #include <string.h>
     49   1.1       cgd 
     50  1.23  jdolecek static const char * const *av;
     51   1.1       cgd 
     52  1.37     joerg static void yyerror(const char *, ...) __dead;
     53  1.17  jdolecek static int yylex(void);
     54  1.17  jdolecek static int is_zero_or_null(const char *);
     55  1.17  jdolecek static int is_integer(const char *);
     56  1.48    rillig static const char *eval_arith(const char *, const char *, const char *);
     57  1.48    rillig static int eval_compare(const char *, const char *, const char *);
     58  1.48    rillig static const char *eval_match(const char *, const char *);
     59  1.26       jmc 
     60  1.17  jdolecek #define YYSTYPE	const char *
     61   1.1       cgd 
     62  1.17  jdolecek %}
     63  1.20  jdolecek %token STRING
     64  1.22   thorpej %left SPEC_OR
     65  1.22   thorpej %left SPEC_AND
     66  1.26       jmc %left COMPARE
     67  1.26       jmc %left ADD_SUB_OPERATOR
     68  1.26       jmc %left MUL_DIV_MOD_OPERATOR
     69  1.26       jmc %left SPEC_REG
     70  1.31  jdolecek %left LENGTH
     71  1.17  jdolecek %left LEFT_PARENT RIGHT_PARENT
     72   1.1       cgd 
     73   1.1       cgd %%
     74   1.1       cgd 
/*
 * Start symbol: print the value of the complete expression followed by
 * a newline, then leave the parser.  The parser's return value is 1 if
 * that value is empty or zero and 0 otherwise.
 */
exp:	expr {
		const char *result = $1;

		(void) printf("%s\n", result);
		return is_zero_or_null(result);
		}
	;
     80   1.1       cgd 
/*
 * An expression: a single item, a binary operation on two expressions,
 * a parenthesized expression, or the "length" keyword applied to an
 * expression.  Every semantic value is a string.
 */
expr:	item { $$ = $1; }
	| expr SPEC_OR expr {
		/* the left operand unless it is empty or zero */
		if (!is_zero_or_null($1))
			$$ = $1;
		else
			$$ = $3;
		}
	| expr SPEC_AND expr {
		/* the left operand if neither side is empty or zero */
		if (!is_zero_or_null($1) && !is_zero_or_null($3))
			$$ = $1;
		else
			$$ = "0";
		}
	| expr SPEC_REG expr {
		/* match the left operand against the pattern on the right */
		$$ = eval_match($1, $3);
		}
	| expr ADD_SUB_OPERATOR expr {
		$$ = eval_arith($1, $2, $3);
		}
	| expr MUL_DIV_MOD_OPERATOR expr {
		$$ = eval_arith($1, $2, $3);
		}
	| expr COMPARE expr {
		$$ = eval_compare($1, $2, $3) ? "1" : "0";
		}
	| LEFT_PARENT expr RIGHT_PARENT { $$ = $2; }
	| LENGTH expr {
		/*
		 * Return length of 'expr' in bytes.
		 */
		char *ln;

		/*
		 * Test the return value: what asprintf() leaves in 'ln'
		 * on failure differs between C libraries.
		 */
		if (asprintf(&ln, "%ld", (long) strlen($2)) < 0)
			err(1, NULL);
		$$ = ln;
		}
	;
    120   1.4       cgd 
/*
 * A single operand.  Besides plain strings, the operator tokens and the
 * "length" keyword are accepted here as well; in each case the value of
 * the item is the token's own text.
 */
item:	STRING			{ $$ = $1; }
	| ADD_SUB_OPERATOR	{ $$ = $1; }
	| MUL_DIV_MOD_OPERATOR	{ $$ = $1; }
	| COMPARE		{ $$ = $1; }
	| SPEC_OR		{ $$ = $1; }
	| SPEC_AND		{ $$ = $1; }
	| SPEC_REG		{ $$ = $1; }
	| LENGTH		{ $$ = $1; }
	;
    130  1.17  jdolecek %%
    131   1.1       cgd 
/*
 * Returns 1 if str is the empty string or parses in its entirety as a
 * decimal integer whose value is zero; returns 0 otherwise.
 */
static int
is_zero_or_null(const char *str)
{
	char *end;
	long long value;

	if (*str == '\0')
		return 1;

	value = strtoll(str, &end, 10);
	if (*end != '\0')
		return 0;	/* trailing text that is not part of a number */

	return value == 0LL;
}
    144   1.1       cgd 
/*
 * Returns 1 if strtoll() in base 10 consumes the whole of str, and 0 if
 * any text is left over.  The empty string is deliberately accepted as
 * a valid number.
 */
static int
is_integer(const char *str)
{
	char *rest;

	/* only the end position matters here, not the converted value */
	(void) strtoll(str, &rest, 10);

	if (*rest != '\0')
		return 0;
	return 1;
}
    157   1.1       cgd 
/*
 * Convert the decimal string str to a 64-bit integer.  The caller must
 * already have checked str with is_integer().  If the value is out of
 * range, the error is reported through yyerror() together with the
 * limit that was exceeded.
 */
static int64_t
arith_operand(const char *str)
{
	long long val;

	errno = 0;
	val = strtoll(str, NULL, 10);
	if (errno == ERANGE) {
		/* the sign of the clamped result tells which limit was hit */
		yyerror("value '%s' is %s is %lld", str,
		    (val > 0) ? "too big, maximum" : "too small, minimum",
		    (val > 0) ? LLONG_MAX : LLONG_MIN);
		/* NOTREACHED */
	}
	return val;
}

/*
 * Evaluate the integer operation "left op right", where op[0] is one of
 * '+', '-', '*', '/' or '%', and return the result as a newly allocated
 * decimal string.
 *
 * Errors are reported through yyerror(): a non-integer operand, an
 * operand outside the range of long long, division or remainder by
 * zero, and any result that does not fit into a 64-bit signed integer.
 */
static const char *
eval_arith(const char *left, const char *op, const char *right)
{
	int64_t res, l, r;

	res = 0;

	if (!is_integer(left)) {
		yyerror("non-integer argument '%s'", left);
		/* NOTREACHED */
	}
	if (!is_integer(right)) {
		yyerror("non-integer argument '%s'", right);
		/* NOTREACHED */
	}

	/*
	 * Each operand is range-checked on its own value, so the
	 * diagnostic names the limit that this operand exceeded.
	 */
	l = arith_operand(left);
	r = arith_operand(right);

	switch(op[0]) {
	case '+':
		/*
		 * Check for over-& underflow.
		 */
		if ((l >= 0 && r <= INT64_MAX - l) ||
		    (l <= 0 && r >= INT64_MIN - l)) {
			res = l + r;
		} else {
			yyerror("integer overflow or underflow occurred for "
                            "operation '%s %s %s'", left, op, right);
		}
		break;
	case '-':
		/*
		 * Check for over-& underflow.
		 */
		if ((r > 0 && l < INT64_MIN + r) ||
		    (r < 0 && l > INT64_MAX + r)) {
			yyerror("integer overflow or underflow occurred for "
			    "operation '%s %s %s'", left, op, right);
		} else {
			res = l - r;
		}
		break;
	case '/':
		if (r == 0)
			yyerror("second argument to '%s' must not be zero", op);
		/* INT64_MIN / -1 is not representable */
		if (l == INT64_MIN && r == -1)
			yyerror("integer overflow or underflow occurred for "
			    "operation '%s %s %s'", left, op, right);
		res = l / r;

		break;
	case '%':
		if (r == 0)
			yyerror("second argument to '%s' must not be zero", op);
		if (l == INT64_MIN && r == -1)
			yyerror("integer overflow or underflow occurred for "
			    "operation '%s %s %s'", left, op, right);
		res = l % r;
		break;
	case '*':
		/*
		 * Check for over-& underflow.
		 */

		/*
		 * Simplify the conditions:
		 *  - remove the case of both negative arguments
		 *    unless the operation will cause an overflow
		 */
		if (l < 0 && r < 0 && l != INT64_MIN && r != INT64_MIN) {
			l = -l;
			r = -r;
		}

		/* - remove the case of negative l and positive r */
		if (l < 0 && r >= 0) {
			/* Use res as a temporary variable */
			res = l;
			l = r;
			r = res;
		}

		if ((l < 0 && r < 0) ||
		    (r > 0 && l > INT64_MAX / r) ||
		    (r <= 0 && l != 0 && r < INT64_MIN / l)) {
			yyerror("integer overflow or underflow occurred for "
			    "operation '%s %s %s'", left, op, right);
			/* NOTREACHED */
		} else {
			res = l * r;
		}
		break;
	}

	char *val;
	/*
	 * Test the return value: what asprintf() leaves in 'val' on
	 * failure differs between C libraries.
	 */
	if (asprintf(&val, "%lld", (long long int)res) < 0)
		err(1, NULL);
	return val;
}
    275  1.48    rillig 
/*
 * Evaluate the comparison "left op right"; the result is nonzero if it
 * holds and zero if it does not.
 *
 * When both operands pass is_integer() they are compared by numeric
 * value, otherwise they are compared as strings with strcoll().  The
 * operators "=", ">", ">=", "<" and "<=" are recognized; any other
 * operator is evaluated as "not equal".
 */
static int
eval_compare(const char *left, const char *op, const char *right)
{
	int64_t lhs, rhs;

	if (!is_integer(left) || !is_integer(right)) {
		/* string comparison: reduce it to "strcoll result op 0" */
		lhs = strcoll(left, right);
		rhs = 0;
	} else {
		lhs = strtoll(left, NULL, 10);
		rhs = strtoll(right, NULL, 10);
	}

	if (op[0] == '=')
		return lhs == rhs;
	if (op[0] == '>')
		return (op[1] == '=') ? lhs >= rhs : lhs > rhs;
	if (op[0] == '<')
		return (op[1] == '=') ? lhs <= rhs : lhs < rhs;

	return lhs != rhs;
}
    306  1.48    rillig 
    307  1.48    rillig static const char *
    308  1.48    rillig eval_match(const char *str, const char *re)
    309  1.48    rillig {
    310  1.48    rillig 	regex_t rp;
    311  1.48    rillig 	regmatch_t rm[2];
    312  1.48    rillig 	int eval;
    313  1.48    rillig 
    314  1.48    rillig 	if ((eval = regcomp(&rp, re, REG_BASIC)) != 0) {
    315  1.48    rillig 		char errbuf[256];
    316  1.48    rillig 		(void)regerror(eval, &rp, errbuf, sizeof(errbuf));
    317  1.48    rillig 		yyerror("%s", errbuf);
    318  1.48    rillig 	}
    319  1.48    rillig 
    320  1.48    rillig 	if (regexec(&rp, str, 2, rm, 0) == 0 && rm[0].rm_so == 0) {
    321  1.48    rillig 		char *val;
    322  1.48    rillig 		if (rm[1].rm_so >= 0) {
    323  1.48    rillig 			(void)asprintf(&val, "%.*s",
    324  1.48    rillig 				(int)(rm[1].rm_eo - rm[1].rm_so),
    325  1.48    rillig 				str + rm[1].rm_so);
    326  1.48    rillig 		} else {
    327  1.48    rillig 			(void)asprintf(&val, "%d",
    328  1.48    rillig 				(int)(rm[0].rm_eo - rm[0].rm_so));
    329  1.48    rillig 		}
    330  1.48    rillig 		if (val == NULL)
    331  1.48    rillig 			err(1, NULL);
    332  1.48    rillig 		return val;
    333  1.48    rillig 	}
    334  1.48    rillig 
    335  1.48    rillig 	if (rp.re_nsub == 0)
    336  1.48    rillig 		return "0";
    337  1.48    rillig 	else
    338  1.48    rillig 		return "";
    339  1.26       jmc }
    340   1.4       cgd 
    341  1.23  jdolecek static const char *x = "|&=<>+-*/%:()";
    342  1.23  jdolecek static const int x_token[] = {
    343  1.26       jmc 	SPEC_OR, SPEC_AND, COMPARE, COMPARE, COMPARE, ADD_SUB_OPERATOR,
    344  1.26       jmc 	ADD_SUB_OPERATOR, MUL_DIV_MOD_OPERATOR, MUL_DIV_MOD_OPERATOR,
    345  1.26       jmc 	MUL_DIV_MOD_OPERATOR, SPEC_REG, LEFT_PARENT, RIGHT_PARENT
    346  1.17  jdolecek };
    347   1.1       cgd 
    348  1.23  jdolecek static int handle_ddash = 1;
    349  1.23  jdolecek 
    350  1.17  jdolecek int
    351  1.17  jdolecek yylex(void)
    352   1.1       cgd {
    353  1.17  jdolecek 	const char *p = *av++;
    354  1.23  jdolecek 	int retval;
    355   1.4       cgd 
    356  1.23  jdolecek 	if (!p)
    357  1.23  jdolecek 		retval = 0;
    358  1.47    rillig 	else if (p[0] == '\0')
    359  1.47    rillig 		retval = STRING;
    360  1.23  jdolecek 	else if (p[1] == '\0') {
    361  1.17  jdolecek 		const char *w = strchr(x, p[0]);
    362  1.17  jdolecek 		if (w) {
    363  1.17  jdolecek 			retval = x_token[w-x];
    364  1.17  jdolecek 		} else {
    365  1.17  jdolecek 			retval = STRING;
    366  1.17  jdolecek 		}
    367  1.17  jdolecek 	} else if (p[1] == '=' && p[2] == '\0'
    368  1.17  jdolecek 			&& (p[0] == '>' || p[0] == '<' || p[0] == '!'))
    369  1.17  jdolecek 		retval = COMPARE;
    370  1.23  jdolecek 	else if (handle_ddash && p[0] == '-' && p[1] == '-' && p[2] == '\0') {
    371  1.23  jdolecek 		/* ignore "--" if passed as first argument and isn't followed
    372  1.23  jdolecek 		 * by another STRING */
    373  1.23  jdolecek 		retval = yylex();
    374  1.23  jdolecek 		if (retval != STRING && retval != LEFT_PARENT
    375  1.23  jdolecek 		    && retval != RIGHT_PARENT) {
    376  1.23  jdolecek 			/* is not followed by string or parenthesis, use as
    377  1.23  jdolecek 			 * STRING */
    378  1.23  jdolecek 			retval = STRING;
    379  1.23  jdolecek 			av--;	/* was increased in call to yylex() above */
    380  1.23  jdolecek 			p = "--";
    381  1.23  jdolecek 		} else {
    382  1.23  jdolecek 			/* "--" is to be ignored */
    383  1.23  jdolecek 			p = yylval;
    384  1.23  jdolecek 		}
    385  1.31  jdolecek 	} else if (strcmp(p, "length") == 0)
    386  1.31  jdolecek 		retval = LENGTH;
    387  1.31  jdolecek 	else
    388  1.17  jdolecek 		retval = STRING;
    389   1.1       cgd 
    390  1.23  jdolecek 	handle_ddash = 0;
    391  1.17  jdolecek 	yylval = p;
    392   1.4       cgd 
    393  1.17  jdolecek 	return retval;
    394   1.1       cgd }
    395   1.4       cgd 
    396  1.17  jdolecek /*
    397  1.17  jdolecek  * Print error message and exit with error 2 (syntax error).
    398  1.17  jdolecek  */
    399  1.38     joerg static __printflike(1, 2) void
    400  1.17  jdolecek yyerror(const char *fmt, ...)
    401   1.1       cgd {
    402  1.17  jdolecek 	va_list arg;
    403   1.4       cgd 
    404  1.17  jdolecek 	va_start(arg, fmt);
    405  1.17  jdolecek 	verrx(2, fmt, arg);
    406  1.17  jdolecek 	va_end(arg);
    407   1.1       cgd }
    408   1.1       cgd 
    409  1.17  jdolecek int
    410  1.23  jdolecek main(int argc, const char * const *argv)
    411   1.1       cgd {
    412  1.28       wiz 	setprogname(argv[0]);
    413  1.28       wiz 	(void)setlocale(LC_ALL, "");
    414   1.6       jtc 
    415  1.36     joerg 	if (argc == 1) {
    416  1.36     joerg 		(void)fprintf(stderr, "usage: %s expression\n",
    417  1.36     joerg 		    getprogname());
    418  1.36     joerg 		exit(2);
    419  1.36     joerg 	}
    420  1.36     joerg 
    421  1.36     joerg 	av = argv + 1;
    422   1.5       cgd 
    423  1.42  christos 	return yyparse();
    424   1.1       cgd }
    425