Home | History | Annotate | Line # | Download | only in unit-tests
varmod-ifelse.mk revision 1.40
      1 # $NetBSD: varmod-ifelse.mk,v 1.40 2025/06/28 22:39:29 rillig Exp $
      2 #
      3 # Tests for the ${cond:?then:else} variable modifier, which evaluates either
      4 # the then-expression or the else-expression, depending on the condition.
      5 #
      6 # The modifier was added on 1998-04-01.
      7 #
      8 # Until 2015-10-11, the modifier always evaluated both the "then" and the
      9 # "else" expressions.
     10 
     11 # TODO: Implementation
     12 
     13 # The variable name of the expression is expanded and then taken as the
     14 # condition.  In the below example it becomes:
     15 #
     16 #	bare words == "literal"
     17 #
     18 # This confuses the parser, which expects an operator instead of the bare
     19 # word "expression".  If the name were expanded lazily, everything would be
     20 # fine since the condition would be:
     21 #
     22 #	${:Ubare words} == "literal"
     23 #
     24 # Evaluating the variable name lazily would require additional code in
     25 # Var_Parse and ParseVarname, it would be more useful and predictable
     26 # though.
     27 # expect+1: Bad condition
     28 .if ${${:Ubare words} == "literal":?bad:bad}
     29 .  error
     30 .else
     31 .  error
     32 .endif
     33 
     34 # In a variable assignment, undefined variables are not an error.
     35 # Because of the early expansion, the whole condition evaluates to
     36 # ' == ""' though, which cannot be parsed because the left-hand side looks
     37 # empty.
     38 # expect+1: Bad condition
     39 COND:=	${${UNDEF} == "":?bad-assign:bad-assign}
     40 
     41 # In a conditional directive, undefined variables are reported as such.  In a
     42 # ':?' modifier, though, the "variable name" is expanded first, and in that
     43 # context, an undefined expression is not an error. The "variable name" then
     44 # becomes the condition, in this case ' == ""', which is malformed because the
     45 # left-hand side looks empty.
     46 # expect+1: Bad condition
     47 .if ${${UNDEF} == "":?bad-cond:bad-cond}
     48 .  error
     49 .else
     50 .  error
     51 .endif
     52 
     53 # When the :? is parsed, it is greedy.  The else branch spans all the
     54 # text, up until the closing character '}', even if the text looks like
     55 # another modifier.
     56 .if ${1:?then:else:Q} != "then"
     57 .  error
     58 .endif
     59 .if ${0:?then:else:Q} != "else:Q"
     60 .  error
     61 .endif
     62 
     63 # This line generates 2 error messages.  The first comes from evaluating the
     64 # malformed conditional "1 == == 2", which is reported as "Bad conditional
     65 # expression" by ApplyModifier_IfElse.  The expression containing that
     66 # conditional therefore returns a parse error from Var_Parse, and this parse
     67 # error propagates to CondEvalExpression, where the "Malformed conditional"
     68 # comes from.
     69 # expect+1: Bad condition
     70 .if ${1 == == 2:?yes:no} != ""
     71 .  error
     72 .else
     73 .  error
     74 .endif
     75 
     76 # If the "Bad conditional expression" appears in a quoted string literal, the
     77 # error message "Malformed conditional" is not printed, leaving only the "Bad
     78 # conditional expression".
     79 #
     80 # XXX: The left-hand side is enclosed in quotes.  This results in Var_Parse
     81 # being called without VARE_EVAL_DEFINED.  When ApplyModifier_IfElse
     82 # returns AMR_CLEANUP as result, Var_Parse returns varUndefined since the
     83 # value of the expression is still undefined.  CondParser_String is
     84 # then supposed to do proper error handling, but since varUndefined is local
     85 # to var.c, it cannot distinguish this return value from an ordinary empty
     86 # string.  The left-hand side of the comparison is therefore just an empty
     87 # string, which is obviously equal to the empty string on the right-hand side.
     88 #
     89 # XXX: The debug log for -dc shows a comparison between 1.0 and 0.0.  The
     90 # condition should be detected as being malformed before any comparison is
     91 # done since there is no well-formed comparison in the condition at all.
     92 .MAKEFLAGS: -dc
     93 # expect+1: Bad condition
     94 .if "${1 == == 2:?yes:no}" != ""
     95 .  error
     96 .else
     97 # expect+1: warning: Oops, the parse error should have been propagated.
     98 .  warning Oops, the parse error should have been propagated.
     99 .endif
    100 .MAKEFLAGS: -d0
    101 
    102 # As of 2020-12-10, the variable "VAR" is first expanded, and the result of
    103 # this expansion is then taken as the condition.  To force the
    104 # expression in the condition to be evaluated at exactly the right point,
    105 # the '$' of the intended '${VAR}' escapes from the parser in form of the
    106 # expression ${:U\$}.  Because of this escaping, the variable "VAR" and thus
    107 # the condition ends up as "${VAR} == value", just as intended.
    108 #
    109 # This hack does not work for variables from .for loops since these are
    110 # expanded at parse time to their corresponding ${:Uvalue} expressions.
    111 # Making the '$' of the '${VAR}' expression indirect hides this expression
    112 # from the parser of the .for loop body.  See ForLoop_SubstVarLong.
    113 .MAKEFLAGS: -dc
    114 VAR=	value
    115 .if ${ ${:U\$}{VAR} == value:?ok:bad} != "ok"
    116 .  error
    117 .endif
    118 .MAKEFLAGS: -d0
    119 
    120 # On 2021-04-19, when building external/bsd/tmux with HAVE_LLVM=yes and
    121 # HAVE_GCC=no, the following conditional generated this error message:
    122 #
    123 #	make: Bad conditional expression 'string == "literal" && no >= 10'
    124 #	    in 'string == "literal" && no >= 10?yes:no'
    125 #
    126 # Despite the error message (which was not clearly marked with "error:"),
    127 # the build continued, for historical reasons, see main_Exit.
    128 #
    129 # The tricky detail here is that the condition that looks so obvious in the
    130 # form written in the makefile becomes tricky when it is actually evaluated.
    131 # This is because the condition is written in the place of the variable name
    132 # of the expression, and in an expression, the variable name is always
    133 # expanded first, before even looking at the modifiers.  This happens for the
    134 # modifier ':?' as well, so when CondEvalExpression gets to see the
    135 # expression, it already looks like this:
    136 #
    137 #	string == "literal" && no >= 10
    138 #
    139 # When parsing such an expression, the parser used to be strict.  It first
    140 # evaluated the left-hand side of the operator '&&' and then started parsing
    141 # the right-hand side 'no >= 10'.  The word 'no' is obviously a string
    142 # literal, not enclosed in quotes, which is OK, even on the left-hand side of
    143 # the comparison operator, but only because this is a condition in the
    144 # modifier ':?'.  In an ordinary directive '.if', this would be a parse error.
    145 # For strings, only the comparison operators '==' and '!=' are defined,
    146 # therefore parsing stopped at the '>', producing the 'Bad conditional
    147 # expression'.
    148 #
    149 # Ideally, the conditional expression would not be expanded before parsing
    150 # it.  This would allow to write the conditions exactly as seen below.  That
    151 # change has a high chance of breaking _some_ existing code and would need
    152 # to be thoroughly tested.
    153 #
    154 # Since cond.c 1.262 from 2021-04-20, make reports a more specific error
    155 # message in situations like these, pointing directly to the specific problem
    156 # instead of just saying that the whole condition is bad.
    157 STRING=		string
    158 NUMBER=		no		# not really a number
    159 # expect+1: no.
    160 .info ${${STRING} == "literal" && ${NUMBER} >= 10:?yes:no}.
    161 # expect+2: Comparison with ">=" requires both operands "no" and "10" to be numeric
    162 # expect+1: .
    163 .info ${${STRING} == "literal" || ${NUMBER} >= 10:?yes:no}.
    164 
    165 # The following situation occasionally occurs with MKINET6 or similar
    166 # variables.
    167 NUMBER=		# empty, not really a number either
    168 # expect+2: Bad condition
    169 # expect+1: .
    170 .info ${${STRING} == "literal" && ${NUMBER} >= 10:?yes:no}.
    171 # expect+2: Bad condition
    172 # expect+1: .
    173 .info ${${STRING} == "literal" || ${NUMBER} >= 10:?yes:no}.
    174 
    175 # CondParser_LeafToken handles [0-9-+] specially, treating them as a number.
    176 PLUS=		+
    177 ASTERISK=	*
    178 EMPTY=		# empty
    179 # "true" since "+" is not the empty string.
    180 # expect+1: <true>
    181 .info <${${PLUS}		:?true:false}>
    182 # "false" since the variable named "*" is not defined.
    183 # expect+1: <false>
    184 .info <${${ASTERISK}	:?true:false}>
    185 # syntax error since the condition is completely blank.
    186 # expect+2: Bad condition
    187 # expect+1: <>
    188 .info <${${EMPTY}	:?true:false}>
    189 
    190 
    191 # Since the condition of the '?:' modifier is expanded before being parsed and
    192 # evaluated, it is common practice to enclose expressions in quotes, to avoid
    193 # producing syntactically invalid conditions such as ' == value'.  This only
    194 # works if the expanded values neither contain quotes nor backslashes.  For
    195 # strings containing quotes or backslashes, the '?:' modifier should not be
    196 # used.
    197 PRIMES=	2 3 5 7 11
    198 .if ${1 2 3 4 5:L:@n@$n:${ ("${PRIMES:M$n}" != "") :?prime:not_prime}@} != \
    199   "1:not_prime 2:prime 3:prime 4:not_prime 5:prime"
    200 .  error
    201 .endif
    202 
    203 # When parsing the modifier ':?', there are 3 possible cases:
    204 #
    205 #	1. The whole expression is only parsed.
    206 #	2. The expression is parsed and the 'then' branch is evaluated.
    207 #	3. The expression is parsed and the 'else' branch is evaluated.
    208 #
    209 # In all of these cases, the expression must be parsed in the same way,
    210 # especially when one of the branches contains unbalanced '{}' braces.
    211 #
    212 # At 2020-01-01, the expressions from the 'then' and 'else' branches were
    213 # parsed differently, depending on whether the branch was taken or not.  When
    214 # the branch was taken, the parser recognized that in the modifier ':S,}},,',
    215 # the '}}' were ordinary characters.  When the branch was not taken, the
    216 # parser only counted balanced '{' and '}', ignoring any escaping or other
    217 # changes in the interpretation.
    218 #
    219 # In var.c 1.285 from 2020-07-20, the parsing of the expressions changed so
    220 # that in both cases the expression is parsed in the same way, taking the
    221 # unbalanced braces in the ':S' modifiers into account.  This change was not
    222 # on purpose, the commit message mentioned 'has the same effect', which was a
    223 # wrong assumption.
    224 #
    225 # In var.c 1.323 from 2020-07-26, the unintended fix from var.c 1.285 was
    226 # reverted, still not knowing about the difference between regular parsing and
    227 # balanced-mode parsing.
    228 #
    229 # In var.c 1.1028 from 2022-08-08, there was another attempt at fixing this
    230 # inconsistency in parsing, but since that broke parsing of the modifier ':@',
    231 # it was reverted in var.c 1.1029 from 2022-08-23.
    232 #
    233 # In var.c 1.1047 from 2023-02-18, the inconsistency in parsing was finally
    234 # fixed.  The modifier ':@' now parses the body in balanced mode, while
    235 # everywhere else the modifier parts have their subexpressions parsed in the
    236 # same way, no matter whether they are evaluated or not.
    237 #
    238 # The modifiers ':@' and ':?' are similar in that they conceptually contain
    239 # text to be evaluated later or conditionally, still they parse that text
    240 # differently.  The crucial difference is that the body of the modifier ':@'
    241 # is always parsed using balanced mode.  The modifier ':?', on the other hand,
    242 # must parse both of its branches in the same way, no matter whether they are
    243 # evaluated or not.  Since balanced mode and standard mode are incompatible,
    244 # it's impossible to use balanced mode in the modifier ':?'.
    245 .MAKEFLAGS: -dc
    246 .if 0 && ${1:?${:Uthen0:S,}},,}:${:Uelse0:S,}},,}} != "not evaluated"
    247 # At 2020-01-07, the expression evaluated to 'then0,,}}', even though it was
    248 # irrelevant as the '0' had already been evaluated to 'false'.
    249 .  error
    250 .endif
    251 .if 1 && ${0:?${:Uthen1:S,}},,}:${:Uelse1:S,}},,}} != "else1"
    252 .  error
    253 .endif
    254 .if 2 && ${1:?${:Uthen2:S,}},,}:${:Uelse2:S,}},,}} != "then2"
    255 # At 2020-01-07, the whole expression evaluated to 'then2,,}}' instead of the
    256 # expected 'then2'.  The 'then' branch of the ':?' modifier was parsed
    257 # normally, parsing and evaluating the ':S' modifier, thereby treating the
    258 # '}}' as ordinary characters and resulting in 'then2'.  The 'else' branch was
    259 # parsed in balanced mode, ignoring that the inner '}}' were ordinary
    260 # characters.  The '}}' were thus interpreted as the end of the 'else' branch
    261 # and the whole expression.  This left the trailing ',,}}', which together
    262 # with the 'then2' formed the result 'then2,,}}'.
    263 .  error
    264 .endif
    265 
    266 
    267 # Since the condition is taken from the variable name of the expression, not
    268 # from its value, it is evaluated early.  It is possible though to construct
    269 # conditions that are evaluated lazily, at exactly the right point.  There is
    270 # no way to escape a '$' directly in the variable name, but there are
    271 # alternative ways to bring a '$' into the condition.
    272 #
    273 #	In an indirect condition using the ':U' modifier, each '$', ':' and
    274 #	'}' must be escaped as '\$', '\:' and '\}', respectively, but '{' must
    275 #	not be escaped.
    276 #
    277 #	In an indirect condition using a separate variable, each '$' must be
    278 #	escaped as '$$'.
    279 #
    280 # These two forms allow the variables to contain arbitrary characters, as the
    281 # condition parser does not see them.
    282 DELAYED=	two
    283 # expect+1: no
    284 .info ${ ${:U \${DELAYED\} == "one"}:?yes:no}
    285 # expect+1: yes
    286 .info ${ ${:U \${DELAYED\} == "two"}:?yes:no}
    287 INDIRECT_COND1=	$${DELAYED} == "one"
    288 # expect+1: no
    289 .info ${ ${INDIRECT_COND1}:?yes:no}
    290 INDIRECT_COND2=	$${DELAYED} == "two"
    291 # expect+1: yes
    292 .info ${ ${INDIRECT_COND2}:?yes:no}
    293 
    294 
    295 .MAKEFLAGS: -d0
    296 
    297 
    298 # In the modifier parts for the 'then' and 'else' branches, subexpressions are
    299 # parsed by inspecting the actual modifiers.  In 2008, 2015, 2020, 2022 and
    300 # 2023, the exact parsing algorithm switched a few times, counting balanced
    301 # braces instead of proper subexpressions, which meant that unbalanced braces
    302 # were parsed differently, depending on whether the branch was active or not.
    303 BRACES=	}}}
    304 NO=	${0:?${BRACES:S,}}},yes,}:${BRACES:S,}}},no,}}
    305 YES=	${1:?${BRACES:S,}}},yes,}:${BRACES:S,}}},no,}}
    306 BOTH=	<${YES}> <${NO}>
    307 .if ${BOTH} != "<yes> <no>"
    308 .  error
    309 .endif
    310 
    311 
    312 # expect+2: Unknown modifier ":X-then"
    313 # expect+1: Unknown modifier ":X-else"
    314 .if ${1:?${:X-then}:${:X-else}}
    315 .endif
    316 
    317 
    318 # expect+4: Bad condition
    319 # expect+3: Unknown modifier ":Z1"
    320 # expect+2: Unknown modifier ":Z2"
    321 # expect+1: <>
    322 .info <${ < 0 :?${:Z1}:${:Z2}}>
    323