lint1.h revision 1.109 1 /* $NetBSD: lint1.h,v 1.109 2021/07/02 18:22:09 rillig Exp $ */
2
3 /*
4 * Copyright (c) 1996 Christopher G. Demetriou. All Rights Reserved.
5 * Copyright (c) 1994, 1995 Jochen Pohl
6 * All Rights Reserved.
7 *
8 * Redistribution and use in source and binary forms, with or without
9 * modification, are permitted provided that the following conditions
10 * are met:
11 * 1. Redistributions of source code must retain the above copyright
12 * notice, this list of conditions and the following disclaimer.
13 * 2. Redistributions in binary form must reproduce the above copyright
14 * notice, this list of conditions and the following disclaimer in the
15 * documentation and/or other materials provided with the distribution.
16 * 3. All advertising materials mentioning features or use of this software
17 * must display the following acknowledgement:
18 * This product includes software developed by Jochen Pohl for
19 * The NetBSD Project.
20 * 4. The name of the author may not be used to endorse or promote products
21 * derived from this software without specific prior written permission.
22 *
23 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
24 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
25 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
26 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
27 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
28 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
29 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
30 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
31 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
32 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
33 */
34
#include "lint.h"
#include "err-msgs.h"
#include "op.h"

#include <limits.h>	/* CHAR_BIT, used by the err_set bitmap */
38
/*
 * XXX - Super conservative so that it works for most systems, but we should
 * not depend on the host settings but on the target settings in determining
 * the alignment.  The only valid use for this is in mem1.c; uses in decl.c
 * are bogus.
 */
/*
 * Unless the build already provides WORST_ALIGN, define it to round x up
 * to the next multiple of (AVAL + 1): 16 when _LP64 is defined, 8 otherwise.
 */
#if !defined(WORST_ALIGN)
#  if defined(_LP64)
#    define AVAL 15
#  else
#    define AVAL 7
#  endif
#  define WORST_ALIGN(x) (((x) + AVAL) & ~AVAL)
#endif
53
/*
 * Negative sentinel values of the LWARN family.
 * NOTE(review): presumably used where a non-negative warning number is
 * otherwise expected; confirm against the users of these constants.
 */
#define LWARN_NONE	(-1)
#define LWARN_ALL	(-2)
#define LWARN_BAD	(-3)
57
58 /*
59 * Describes the position of a declaration or anything else.
60 *
61 * FIXME: Just a single file:lineno pair is not enough to accurately describe
62 * the position of a symbol. The whole inclusion path at that point must be
63 * stored as well. This makes a difference for symbols from included
64 * headers, see print_stack_trace.
65 */
/* A file:line position plus a counter that keeps positions distinct. */
typedef struct {
	const char	*p_file;	/* file of the position */
	int		p_line;		/* line number in p_file */
	int		p_uniq;		/* uniquifier */
} pos_t;
71
72 /* Copies curr_pos, keeping things unique. */
/*
 * Store a copy of curr_pos in 'pos', then advance the uniquifier of
 * curr_pos so that the next copy differs.  When curr_pos and csrc_pos
 * refer to the same file (same p_file pointer), csrc_pos is advanced too.
 */
#define UNIQUE_CURR_POS(pos) \
	do { \
		(pos) = curr_pos; \
		++curr_pos.p_uniq; \
		if (csrc_pos.p_file == curr_pos.p_file) \
			++csrc_pos.p_uniq; \
	} while (false)
80
/*
 * A string cannot be referred to simply by a pointer to its first
 * char.  This is because strings can contain NUL characters other than the
 * trailing NUL.
 *
 * Strings are stored with a trailing NUL.
 */
88 typedef struct strg {
89 tspec_t st_tspec; /* CHAR or WCHAR */
90 size_t st_len; /* length without trailing NUL */
91 union {
92 u_char *_st_cp;
93 wchar_t *_st_wcp;
94 } st_u;
95 } strg_t;
96
97 #define st_cp st_u._st_cp
98 #define st_wcp st_u._st_wcp
99
100 /*
101 * qualifiers (only for lex/yacc interface)
102 */
/* Type qualifiers, as passed between the lexer and the parser. */
typedef enum {
	CONST,
	VOLATILE,
	RESTRICT,
	THREAD
} tqual_t;
106
107 /* An integer or floating-point value. */
108 typedef struct {
109 tspec_t v_tspec;
110 /*
111 * Set if an integer constant is unsigned only in C90 and later, but
112 * not in traditional C.
113 *
114 * See the operators table in ops.def, columns "l r".
115 */
116 bool v_unsigned_since_c90;
117 union {
118 int64_t _v_quad; /* integers */
119 ldbl_t _v_ldbl; /* floats */
120 } v_u;
121 } val_t;
122
123 #define v_quad v_u._v_quad
124 #define v_ldbl v_u._v_ldbl
125
126 /*
127 * Structures of type struct_or_union uniquely identify structures. This can't
128 * be done in structures of type type_t, because these are copied
129 * if they must be modified. So it would not be possible to check
130 * if two structures are identical by comparing the pointers to
131 * the type structures.
132 *
133 * The typename is used if the structure is unnamed to identify
134 * the structure type in pass 2.
135 */
136 typedef struct {
137 u_int sou_size_in_bits;
138 u_int sou_align_in_bits : 15;
139 bool sou_incomplete : 1;
140 struct sym *sou_first_member;
141 struct sym *sou_tag;
142 struct sym *sou_first_typedef;
143 } struct_or_union;
144
145 /*
146 * same as above for enums
147 */
/* Identity information shared by all copies of an enum type. */
typedef struct {
	bool	en_incomplete : 1;		/* incomplete flag */
	struct sym *en_first_enumerator;	/* head of the enumerator list */
	struct sym *en_tag;			/* tag symbol */
	struct sym *en_first_typedef;		/* first typedef symbol */
} enumeration;
154
155 /*
156 * The type of an expression or object. Complex types are formed via t_subt
157 * (for arrays, pointers and functions), as well as t_str.
158 */
159 struct lint1_type {
160 tspec_t t_tspec; /* type specifier */
161 bool t_incomplete_array : 1;
162 bool t_const : 1; /* const modifier */
163 bool t_volatile : 1; /* volatile modifier */
164 bool t_proto : 1; /* function prototype (t_args valid) */
165 bool t_vararg : 1; /* prototype with '...' */
166 bool t_typedef : 1; /* type defined with typedef */
167 bool t_bitfield : 1;
168 /*
169 * Either the type is currently an enum (having t_tspec ENUM), or
170 * it is an integer type (typically INT) that has been implicitly
171 * converted from an enum type. In both cases, t_enum is valid.
172 *
173 * The information about a former enum type is retained to allow
174 * type checks in expressions such as ((var1 & 0x0001) == var2), to
175 * detect when var1 and var2 are from incompatible enum types.
176 */
177 bool t_is_enum : 1;
178 bool t_packed : 1;
179 union {
180 int _t_dim; /* dimension (if ARRAY) */
181 struct_or_union *_t_str;
182 enumeration *_t_enum;
183 struct sym *_t_args; /* arguments (if t_proto) */
184 } t_u;
185 struct {
186 u_int _t_flen : 8; /* length of bit-field */
187 u_int _t_foffs : 24; /* offset of bit-field */
188 } t_b;
189 struct lint1_type *t_subt; /* element type (if ARRAY),
190 * return value (if FUNC),
191 * target type (if PTR) */
192 };
193
194 #define t_dim t_u._t_dim
195 #define t_str t_u._t_str
196 #define t_enum t_u._t_enum
197 #define t_args t_u._t_args
198 #define t_flen t_b._t_flen
199 #define t_foffs t_b._t_foffs
200
201 /*
202 * types of symbols
203 */
/* The kinds of symbols that are distinguished. */
typedef enum {
	FVFT,		/* variables, functions, type names, enums */
	FMEMBER,	/* members of structs or unions */
	FTAG,		/* tags */
	FLABEL		/* labels */
} symt_t;
210
211 /*
212 * storage classes
213 */
/* Storage classes of symbols; also used for declaration contexts. */
typedef enum {
	NOSCL,
	EXTERN,		/* external symbols (indep. of decl_t) */
	STATIC,		/* static symbols (local and global) */
	AUTO,		/* automatic symbols (except register) */
	REG,		/* register */
	TYPEDEF,	/* typedef */
	STRUCT_TAG,
	UNION_TAG,
	ENUM_TAG,
	MOS,		/* member of struct */
	MOU,		/* member of union */
	CTCONST,	/* enumerator, enum constant or bool constant */
	ABSTRACT,	/* abstract symbol (sizeof, casts, unnamed
			 * argument) */
	ARG,		/* argument */
	PROTO_ARG,	/* used in declaration stack during prototype
			 * declaration */
	INLINE		/* only used by the parser */
} scl_t;
233
234 /*
235 * symbol table entry
236 */
237 typedef struct sym {
238 const char *s_name;
239 const char *s_rename; /* renamed symbol's given name */
240 pos_t s_def_pos; /* position of last (prototype) definition,
241 prototype declaration, no-prototype-def.,
242 tentative definition or declaration,
243 in this order */
244 pos_t s_set_pos; /* position of first initialization */
245 pos_t s_use_pos; /* position of first use */
246 symt_t s_kind; /* type of symbol */
247 void *s_keyword;
248 bool s_bitfield : 1;
249 bool s_set : 1; /* variable set, label defined */
250 bool s_used : 1; /* variable/label used */
251 bool s_arg : 1; /* symbol is function argument */
252 bool s_reg : 1; /* symbol is register variable */
253 bool s_defarg : 1; /* undefined symbol in old style function
254 definition */
255 bool s_return_type_implicit_int : 1;
256 bool s_osdef : 1; /* symbol stems from old style function def. */
257 bool s_inline : 1; /* true if this is an inline function */
258 struct sym *s_ext_sym; /* for local declared external symbols pointer
259 to external symbol with same name */
260 def_t s_def; /* declared, tentative defined, defined */
261 scl_t s_scl; /* storage class */
262 int s_block_level; /* level of declaration, -1 if not in symbol
263 table */
264 type_t *s_type;
265 val_t s_value; /* value (if enum or bool constant) */
266 union {
267 struct_or_union *_s_st;
268 enumeration *_s_et;
269 tspec_t _s_tsp; /* type (only for keywords) */
270 tqual_t _s_tqu; /* qualifier (only for keywords) */
271 struct sym *_s_args; /* arguments in old style function
272 definitions */
273 } u;
274 struct sym *s_link; /* next symbol with same hash value */
275 struct sym **s_rlink; /* pointer to s_link of prev. symbol */
276 struct sym *s_next; /* next struct/union member, enumerator,
277 argument */
278 struct sym *s_dlnxt; /* next symbol declared on same level */
279 } sym_t;
280
281 #define s_styp u._s_st
282 #define s_etyp u._s_et
283 #define s_tspec u._s_tsp
284 #define s_tqual u._s_tqu
285 #define s_args u._s_args
286
287 /*
288 * Used to keep some information about symbols before they are entered
289 * into the symbol table.
290 */
291 typedef struct sbuf {
292 const char *sb_name; /* name of symbol */
293 size_t sb_len; /* length (without '\0') */
294 int sb_hash; /* hash value */
295 sym_t *sb_sym; /* symbol table entry */
296 struct sbuf *sb_next; /* for freelist */
297 } sbuf_t;
298
299
300 /*
301 * tree node
302 */
303 typedef struct tnode {
304 op_t tn_op; /* operator */
305 type_t *tn_type; /* type */
306 bool tn_lvalue : 1; /* node is lvalue */
307 bool tn_cast : 1; /* if tn_op == CVT, it's an explicit cast */
308 bool tn_parenthesized : 1;
309 bool tn_from_system_header : 1;
310 bool tn_system_dependent : 1; /* depends on sizeof or offsetof */
311 union {
312 struct {
313 struct tnode *_tn_left; /* (left) operand */
314 struct tnode *_tn_right; /* right operand */
315 } tn_s;
316 sym_t *_tn_sym; /* symbol if op == NAME */
317 val_t *_tn_val; /* value if op == CON */
318 strg_t *_tn_string; /* string if op == STRING */
319 } tn_u;
320 } tnode_t;
321
322 #define tn_left tn_u.tn_s._tn_left
323 #define tn_right tn_u.tn_s._tn_right
324 #define tn_sym tn_u._tn_sym
325 #define tn_val tn_u._tn_val
326 #define tn_string tn_u._tn_string
327
328 struct generic_association_types {
329 type_t *gat_arg; /* NULL means default or error */
330 tnode_t *gat_result; /* NULL means error */
331 struct generic_association_types *gat_prev;
332 };
333
334 /*
335 * For nested declarations a stack exists, which holds all information
336 * needed for the current level. dcs points to the innermost element of this
337 * stack.
338 *
339 * d_ctx describes the context of the current declaration. Its value is
340 * one of
341 * EXTERN global declarations
342 * MOS or MOU declarations of struct or union members
343 * CTCONST declarations of enums or boolean constants
344 * ARG declaration of arguments in old-style function
345 * definitions
346 * PROTO_ARG declaration of arguments in function prototypes
347 * AUTO declaration of local symbols
348 * ABSTRACT abstract declarations (sizeof, casts)
349 *
350 */
351 typedef struct dinfo {
352 tspec_t d_abstract_type;/* VOID, BOOL, CHAR, INT or COMPLEX */
353 tspec_t d_complex_mod; /* FLOAT or DOUBLE */
354 tspec_t d_sign_mod; /* SIGNED or UNSIGN */
355 tspec_t d_rank_mod; /* SHORT, LONG or QUAD */
356 scl_t d_scl; /* storage class */
357 type_t *d_type; /* after deftyp() pointer to the type used
358 for all declarators */
359 sym_t *d_redeclared_symbol;
360 int d_offset; /* offset of next structure member */
361 int d_stralign; /* alignment required for current structure */
362 scl_t d_ctx; /* context of declaration */
363 bool d_const : 1; /* const in declaration specifiers */
364 bool d_volatile : 1; /* volatile in declaration specifiers */
365 bool d_inline : 1; /* inline in declaration specifiers */
366 bool d_mscl : 1; /* multiple storage classes */
367 bool d_terr : 1; /* invalid type combination */
368 bool d_nonempty_decl : 1; /* if at least one tag is declared
369 * ... in the current function decl. */
370 bool d_vararg : 1;
371 bool d_proto : 1; /* current function decl. is prototype */
372 bool d_notyp : 1; /* set if no type specifier was present */
373 bool d_asm : 1; /* set if d_ctx == AUTO and asm() present */
374 bool d_packed : 1;
375 bool d_used : 1;
376 type_t *d_tagtyp; /* tag during member declaration */
377 sym_t *d_func_args; /* list of arguments during function def. */
378 pos_t d_func_def_pos; /* position of function definition */
379 sym_t *d_dlsyms; /* first symbol declared at this level */
380 sym_t **d_ldlsym; /* points to s_dlnxt in last symbol decl.
381 at this level */
382 sym_t *d_func_proto_syms; /* symbols defined in prototype */
383 struct dinfo *d_next; /* next level */
384 } dinfo_t;
385
386 /* One level of pointer indirection in declarators, including qualifiers. */
/* A list element carrying the const/volatile/pointer flags of a declarator. */
typedef struct qual_ptr {
	bool	p_const : 1;
	bool	p_volatile : 1;
	bool	p_pointer : 1;
	struct qual_ptr *p_next;	/* next element of the list */
} qual_ptr;
393
394 /*
395 * The values of the 'case' labels, linked via cl_next in reverse order of
396 * appearance in the code, that is from bottom to top.
397 */
398 typedef struct case_label {
399 val_t cl_val;
400 struct case_label *cl_next;
401 } case_label_t;
402
/* The kinds of control statements that are tracked. */
typedef enum {
	CS_DO_WHILE,		/* do ... while */
	CS_FOR,			/* for */
	CS_FUNCTION_BODY,	/* function body */
	CS_IF,			/* if */
	CS_SWITCH,		/* switch */
	CS_WHILE		/* while */
} control_statement_kind;
411
412 /*
413 * Used to keep information about nested control statements.
414 */
415 typedef struct control_statement {
416 control_statement_kind c_kind; /* to ensure proper nesting */
417 bool c_loop : 1; /* 'continue' and 'break' are valid */
418 bool c_switch : 1; /* 'case' and 'break' are valid */
419 bool c_break : 1; /* the loop/switch has a reachable
420 * 'break' statement */
421 bool c_continue : 1; /* the loop has a reachable 'continue'
422 * statement */
423 bool c_default : 1; /* the switch has a 'default' label */
424 bool c_maybe_endless : 1; /* the controlling expression is
425 * always true (as in 'for (;;)' or
426 * 'while (1)'), there may be break
427 * statements though */
428 bool c_always_then : 1;
429 bool c_reached_end_of_then : 1;
430 bool c_had_return_noval : 1; /* had "return;" */
431 bool c_had_return_value : 1; /* had "return expr;" */
432
433 type_t *c_switch_type; /* type of switch expression */
434 tnode_t *c_switch_expr;
435 case_label_t *c_case_labels; /* list of case values */
436
437 struct memory_block *c_for_expr3_mem; /* saved memory for end of loop
438 * expression in for() */
439 tnode_t *c_for_expr3; /* end of loop expr in for() */
440 pos_t c_for_expr3_pos; /* position of end of loop expr */
441 pos_t c_for_expr3_csrc_pos; /* same for csrc_pos */
442
443 struct control_statement *c_surrounding;
444 } cstk_t;
445
/* A closed interval [lo, hi] of size_t values. */
typedef struct {
	size_t	lo;	/* inclusive */
	size_t	hi;	/* inclusive */
} range_t;
450
451 #include "externs1.h"
452
/*
 * A set of message IDs in the range [0, ERR_SETSIZE), stored as a bitmap
 * with one bit per ID.
 *
 * __NERRBITS is the number of bits in one element of errs_bits.  It used to
 * be sizeof(unsigned int), which is a byte count; that made the macros use
 * only the lowest few bits of each element and the array several times
 * larger than necessary.  The masks are built from 1U instead of 1 since
 * shifting a signed 1 into the sign bit is undefined.
 *
 * The ID 'n' must be non-negative and less than ERR_SETSIZE; the macros do
 * not check this.  'n' is evaluated twice by ERR_SET, ERR_CLR and ERR_ISSET.
 */
#define ERR_SETSIZE	1024
#define __NERRBITS	(sizeof(unsigned int) * CHAR_BIT)

typedef struct err_set {
	unsigned int	errs_bits[(ERR_SETSIZE + __NERRBITS-1) / __NERRBITS];
} err_set;

/* Add message ID 'n' to the set '*p'. */
#define ERR_SET(n, p) \
	((p)->errs_bits[(n)/__NERRBITS] |= (1U << ((n) % __NERRBITS)))
/* Remove message ID 'n' from the set '*p'. */
#define ERR_CLR(n, p) \
	((p)->errs_bits[(n)/__NERRBITS] &= ~(1U << ((n) % __NERRBITS)))
/* Whether message ID 'n' is in the set '*p'. */
#define ERR_ISSET(n, p) \
	(((p)->errs_bits[(n)/__NERRBITS] & (1U << ((n) % __NERRBITS))) != 0)
/* Make the set '*p' empty. */
#define ERR_ZERO(p)	(void)memset((p), 0, sizeof(*(p)))
467
/*
 * Call internal_error with the current file and line, followed by the
 * format string and its optional arguments.
 */
#define INTERNAL_ERROR(fmt, args...) \
	internal_error(__FILE__, __LINE__, fmt, ##args)
470
/*
 * If 'cond' is false, call assert_failed with the current file, line and
 * function, and the text of the condition.  Unlike assert(3), this macro
 * does not depend on NDEBUG.
 */
#define lint_assert(cond) \
	do { \
		if (!(cond)) \
			assert_failed(__FILE__, __LINE__, __func__, #cond); \
	} while (false)
476
/*
 * ZERO is 0 in normal builds and 0xa5 when BLKDEBUG is defined.
 * NOTE(review): presumably the byte used to fill memory blocks, so that
 * BLKDEBUG builds expose reads of uninitialized memory; confirm in the
 * memory management code.
 */
#if defined(BLKDEBUG)
#  define ZERO	0xa5
#else
#  define ZERO	0
#endif
482
483 extern err_set msgset;
484
485
/*
 * In DEBUG builds, each diagnostic function is shadowed by a macro of the
 * same name.  The macro first passes the message text MSG_<msgid> and the
 * arguments to check_printf, which does nothing at run time but lets the
 * compiler check the arguments against the printf-style format, and then
 * calls the real function.  Writing the function name in parentheses
 * prevents the macro from expanding again.
 */
#ifdef DEBUG
#  include "err-msgs.h"

/* ARGSUSED */
static inline void __attribute__((format(printf, 1, 2)))
check_printf(const char *fmt, ...)
{
}

/* Wrapper for the functions that take a message ID and a position. */
#  define wrap_check_printf_at(func, msgid, pos, args...) \
	do { \
		check_printf(__CONCAT(MSG_, msgid), ##args); \
		(func)(msgid, pos, ##args); \
	} while (false)

#  define error_at(msgid, pos, args...) \
	wrap_check_printf_at(error_at, msgid, pos, ##args)
#  define warning_at(msgid, pos, args...) \
	wrap_check_printf_at(warning_at, msgid, pos, ##args)
#  define message_at(msgid, pos, args...) \
	wrap_check_printf_at(message_at, msgid, pos, ##args)

/* Wrapper for the functions that take only a message ID. */
#  define wrap_check_printf(func, msgid, args...) \
	do { \
		check_printf(__CONCAT(MSG_, msgid), ##args); \
		(func)(msgid, ##args); \
	} while (false)

#  define error(msgid, args...)   wrap_check_printf(error, msgid, ##args)
#  define warning(msgid, args...) wrap_check_printf(warning, msgid, ##args)
#  define message(msgid, args...) wrap_check_printf(message, msgid, ##args)
#  define gnuism(msgid, args...)  wrap_check_printf(gnuism, msgid, ##args)
#  define c99ism(msgid, args...)  wrap_check_printf(c99ism, msgid, ##args)
#  define c11ism(msgid, args...)  wrap_check_printf(c11ism, msgid, ##args)
#endif
521
522 static inline bool
523 is_nonzero_val(const val_t *val)
524 {
525 return is_floating(val->v_tspec)
526 ? val->v_ldbl != 0.0
527 : val->v_quad != 0;
528 }
529
530 static inline bool
531 constant_is_nonzero(const tnode_t *tn)
532 {
533 lint_assert(tn->tn_op == CON);
534 lint_assert(tn->tn_type->t_tspec == tn->tn_val->v_tspec);
535 return is_nonzero_val(tn->tn_val);
536 }
537
538 static inline bool
539 is_zero(const tnode_t *tn)
540 {
541 return tn != NULL && tn->tn_op == CON && !is_nonzero_val(tn->tn_val);
542 }
543
544 static inline bool
545 is_nonzero(const tnode_t *tn)
546 {
547 return tn != NULL && tn->tn_op == CON && is_nonzero_val(tn->tn_val);
548 }
549
/* Returns the 64-bit value in which only bit 'i' is set; 'i' must be < 64. */
static inline uint64_t
bit(unsigned i)
{
	const uint64_t one = 1;

	lint_assert(i < 64);
	return one << i;
}
556
/*
 * Returns a mask with the lowest 'bitsize' bits set, saturating at all
 * 64 bits.  'bitsize' must be greater than 0.
 */
static inline uint64_t
value_bits(unsigned bitsize)
{
	lint_assert(bitsize > 0);

	if (bitsize < 64)
		return ((uint64_t)1 << bitsize) - 1;

	/*
	 * Sizes of 64 and above occur for long double (80 or 128) and
	 * double _Complex (128).
	 *
	 * XXX: double _Complex does not have 128 bits of precision,
	 * therefore it should never be necessary to query the value bits
	 * of such a type; see d_c99_complex_split.c to trigger this case.
	 */
	return ~(uint64_t)0;
}
573
574 /* C99 6.7.8p7 */
575 static inline bool
576 is_struct_or_union(tspec_t t)
577 {
578 return t == STRUCT || t == UNION;
579 }
580