emit1.c revision 1.2 1 /* $NetBSD: emit1.c,v 1.2 1995/07/03 21:24:02 cgd Exp $ */
2
3 /*
4 * Copyright (c) 1994, 1995 Jochen Pohl
5 * All Rights Reserved.
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
9 * are met:
10 * 1. Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 * 3. All advertising materials mentioning features or use of this software
16 * must display the following acknowledgement:
17 * This product includes software developed by Jochen Pohl for
18 * The NetBSD Project.
19 * 4. The name of the author may not be used to endorse or promote products
20 * derived from this software without specific prior written permission.
21 *
22 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
23 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
24 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
25 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
26 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
27 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
31 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32 */
33
34 #ifndef lint
35 static char rcsid[] = "$NetBSD: emit1.c,v 1.2 1995/07/03 21:24:02 cgd Exp $";
36 #endif
37
38 #include <ctype.h>
39
40 #include "lint1.h"
41
42 static void outtt __P((sym_t *, sym_t *));
43 static void outfstrg __P((strg_t *));
44
45 /*
46 * Write type into the output buffer.
47 * The type is written as a sequence of substrings, each of which describes a
48 * node of type type_t
49 * a node is coded as follows:
50 * char C
51 * signed char s C
52 * unsigned char u C
53 * short S
54 * unsigned short u S
55 * int I
56 * unsigned int u I
57 * long L
58 * unsigned long u L
59 * long long Q
60 * unsigned long long u Q
61 * float s D
62 * double D
63 * long double l D
64 * void V
65 * * P
66 * [n] A n
67 * () F
68 * (void) F 0
69 * (n arguments) F n arg1 arg2 ... argn
70 * (n arguments, ...) F n arg1 arg2 ... argn-1 E
71 * (a, b, c, ...) f n arg1 arg2 ...
72 * enum tag e T tag_or_typename
73 * struct tag s T tag_or_typename
74 * union tag u T tag_or_typename
75 *
76 * tag_or_typename 0 no tag or type name
77 * 1 n tag Tag
78 * 2 n typename only type name
79 *
80 * spaces are only for better readability
81 * additionaly it is possible to prepend the characters 'c' (for const)
82 * and 'v' (for volatile)
83 */
84 void
85 outtype(tp)
86 type_t *tp;
87 {
88 int t, s, na;
89 sym_t *arg;
90 tspec_t ts;
91
92 while (tp != NULL) {
93 if ((ts = tp->t_tspec) == INT && tp->t_isenum)
94 ts = ENUM;
95 switch (ts) {
96 case CHAR: t = 'C'; s = '\0'; break;
97 case SCHAR: t = 'C'; s = 's'; break;
98 case UCHAR: t = 'C'; s = 'u'; break;
99 case SHORT: t = 'S'; s = '\0'; break;
100 case USHORT: t = 'S'; s = 'u'; break;
101 case INT: t = 'I'; s = '\0'; break;
102 case UINT: t = 'I'; s = 'u'; break;
103 case LONG: t = 'L'; s = '\0'; break;
104 case ULONG: t = 'L'; s = 'u'; break;
105 case QUAD: t = 'Q'; s = '\0'; break;
106 case UQUAD: t = 'Q'; s = 'u'; break;
107 case FLOAT: t = 'D'; s = 's'; break;
108 case DOUBLE: t = 'D'; s = '\0'; break;
109 case LDOUBLE: t = 'D'; s = 'l'; break;
110 case VOID: t = 'V'; s = '\0'; break;
111 case PTR: t = 'P'; s = '\0'; break;
112 case ARRAY: t = 'A'; s = '\0'; break;
113 case FUNC: t = 'F'; s = '\0'; break;
114 case ENUM: t = 'T'; s = 'e'; break;
115 case STRUCT: t = 'T'; s = 's'; break;
116 case UNION: t = 'T'; s = 'u'; break;
117 default:
118 lerror("outtyp() 1");
119 }
120 if (tp->t_const)
121 outchar('c');
122 if (tp->t_volatile)
123 outchar('v');
124 if (s != '\0')
125 outchar(s);
126 outchar(t);
127 if (ts == ARRAY) {
128 outint(tp->t_dim);
129 } else if (ts == ENUM) {
130 outtt(tp->t_enum->etag, tp->t_enum->etdef);
131 } else if (ts == STRUCT || ts == UNION) {
132 outtt(tp->t_str->stag, tp->t_str->stdef);
133 } else if (ts == FUNC && tp->t_proto) {
134 na = 0;
135 for (arg = tp->t_args; arg != NULL; arg = arg->s_nxt)
136 na++;
137 if (tp->t_vararg)
138 na++;
139 outint(na);
140 for (arg = tp->t_args; arg != NULL; arg = arg->s_nxt)
141 outtype(arg->s_type);
142 if (tp->t_vararg)
143 outchar('E');
144 }
145 tp = tp->t_subt;
146 }
147 }
148
149 /*
150 * type to string
151 * used for debugging output
152 *
153 * it uses its own output buffer for conversion
154 */
155 const char *
156 ttos(tp)
157 type_t *tp;
158 {
159 static ob_t tob;
160 ob_t tmp;
161
162 if (tob.o_buf == NULL) {
163 tob.o_len = 64;
164 tob.o_buf = tob.o_nxt = xmalloc(tob.o_len);
165 tob.o_end = tob.o_buf + tob.o_len;
166 }
167
168 tmp = ob;
169 ob = tob;
170 ob.o_nxt = ob.o_buf;
171 outtype(tp);
172 outchar('\0');
173 tob = ob;
174 ob = tmp;
175
176 return (tob.o_buf);
177 }
178
179 /*
180 * write the name of a tag or typename
181 *
182 * if the tag is named, the name of the
183 * tag is written, otherwise, if a typename exists which
184 * refers to this tag, this typename is written
185 */
186 static void
187 outtt(tag, tdef)
188 sym_t *tag, *tdef;
189 {
190 if (tag->s_name != unnamed) {
191 outint(1);
192 outname(tag->s_name);
193 } else if (tdef != NULL) {
194 outint(2);
195 outname(tdef->s_name);
196 } else {
197 outint(0);
198 }
199 }
200
201 /*
202 * write information about an global with storage class extern
203 * declared/defined symbol
204 *
205 * informations about function definitions are written in outfdef(),
206 * not here
207 */
208 void
209 outsym(sym, sc)
210 sym_t *sym;
211 scl_t sc;
212 {
213 /*
214 * Static function declarations must also be written to the output
215 * file. Compatibility of function declarations (for both static
216 * and extern functions) must be checked in lint2. Lint1 can't do
217 * this, especially not, if functions are declared at block level
218 * before their first declaration at level 0.
219 */
220 if (sc != EXTERN && !(sc == STATIC && sym->s_type->t_tspec == FUNC))
221 return;
222
223 /* reset buffer */
224 outclr();
225
226 /*
227 * line number of .c source, 'd' for declaration, Id of current
228 * source (.c or .h), and line in current source.
229 */
230 outint(csrc_pos.p_line);
231 outchar('d');
232 outint(getfnid(sym->s_dpos.p_file));
233 outchar('.');
234 outint(sym->s_dpos.p_line);
235
236 /* flags */
237
238 switch (sym->s_def) {
239 case DEF:
240 /* defined */
241 outchar('d');
242 break;
243 case TDEF:
244 /* tentative defined */
245 outchar('t');
246 break;
247 case DECL:
248 /* declared */
249 outchar('e');
250 break;
251 default:
252 lerror("outsym() 2");
253 }
254 if (llibflg && sym->s_def != DECL) {
255 /*
256 * mark it as used so we get no warnings from lint2 about
257 * unused symbols in libraries.
258 */
259 outchar('u');
260 }
261
262 if (sc == STATIC)
263 outchar('s');
264
265 /* name of the symbol */
266 outname(sym->s_name);
267
268 /* type of the symbol */
269 outtype(sym->s_type);
270 }
271
272 /*
273 * write information about function definition
274 *
275 * this is also done for static functions so we are able to check if
276 * they are called with proper argument types
277 */
278 void
279 outfdef(fsym, tp, posp, rval, osdef, args)
280 sym_t *fsym, *args;
281 type_t *tp;
282 pos_t *posp;
283 int rval, osdef;
284 {
285 int narg;
286 sym_t *arg;
287
288 /* reset the buffer */
289 outclr();
290
291 /*
292 * line number of .c source, 'd' for declaration, Id of current
293 * source (.c or .h), and line in current source
294 *
295 * we are already at the end of the function. If we are in the
296 * .c source, posp->p_line is correct, otherwise csrc_pos.p_line
297 * (for functions defined in header files).
298 */
299 if (posp->p_file == csrc_pos.p_file) {
300 outint(posp->p_line);
301 } else {
302 outint(csrc_pos.p_line);
303 }
304 outchar('d');
305 outint(getfnid(posp->p_file));
306 outchar('.');
307 outint(posp->p_line);
308
309 /* flags */
310
311 /* both SCANFLIKE and PRINTFLIKE imply VARARGS */
312 if (prflstrg != -1) {
313 nvararg = prflstrg;
314 } else if (scflstrg != -1) {
315 nvararg = scflstrg;
316 }
317
318 if (nvararg != -1) {
319 outchar('v');
320 outint(nvararg);
321 }
322 if (scflstrg != -1) {
323 outchar('S');
324 outint(scflstrg);
325 }
326 if (prflstrg != -1) {
327 outchar('P');
328 outint(prflstrg);
329 }
330 nvararg = prflstrg = scflstrg = -1;
331
332 outchar('d');
333
334 if (rval)
335 /* has return value */
336 outchar('r');
337
338 if (llibflg)
339 /*
340 * mark it as used so lint2 does not complain about
341 * unused symbols in libraries
342 */
343 outchar('u');
344
345 if (osdef)
346 /* old style function definition */
347 outchar('o');
348
349 if (fsym->s_scl == STATIC)
350 outchar('s');
351
352 /* name of function */
353 outname(fsym->s_name);
354
355 /* argument types and return value */
356 if (osdef) {
357 narg = 0;
358 for (arg = args; arg != NULL; arg = arg->s_nxt)
359 narg++;
360 outchar('f');
361 outint(narg);
362 for (arg = args; arg != NULL; arg = arg->s_nxt)
363 outtype(arg->s_type);
364 outtype(tp->t_subt);
365 } else {
366 outtype(tp);
367 }
368 }
369
370 /*
371 * write out all information necessary for lint2 to check function
372 * calls
373 *
374 * rvused is set if the return value is used (asigned to a variable)
375 * rvdisc is set if the return value is not used and not ignored
376 * (casted to void)
377 */
378 void
379 outcall(tn, rvused, rvdisc)
380 tnode_t *tn;
381 int rvused, rvdisc;
382 {
383 tnode_t *args, *arg;
384 int narg, n, i;
385 quad_t q;
386 tspec_t t;
387
388 /* reset buffer */
389 outclr();
390
391 /*
392 * line number of .c source, 'c' for function call, Id of current
393 * source (.c or .h), and line in current source
394 */
395 outint(csrc_pos.p_line);
396 outchar('c');
397 outint(getfnid(curr_pos.p_file));
398 outchar('.');
399 outint(curr_pos.p_line);
400
401 /*
402 * flags; 'u' and 'i' must be last to make sure a letter
403 * is between the numeric argument of a flag and the name of
404 * the function
405 */
406 narg = 0;
407 args = tn->tn_right;
408 for (arg = args; arg != NULL; arg = arg->tn_right)
409 narg++;
410 /* informations about arguments */
411 for (n = 1; n <= narg; n++) {
412 /* the last argument is the top one in the tree */
413 for (i = narg, arg = args; i > n; i--, arg = arg->tn_right) ;
414 arg = arg->tn_left;
415 if (arg->tn_op == CON) {
416 if (isityp(t = arg->tn_type->t_tspec)) {
417 /*
418 * XXX it would probably be better to
419 * explizitly test the sign
420 */
421 if ((q = arg->tn_val->v_quad) == 0) {
422 /* zero constant */
423 outchar('z');
424 } else if (msb(q, t, 0) == 0) {
425 /* positive if casted to signed */
426 outchar('p');
427 } else {
428 /* negative if casted to signed */
429 outchar('n');
430 }
431 outint(n);
432 }
433 } else if (arg->tn_op == AMPER &&
434 arg->tn_left->tn_op == STRING &&
435 arg->tn_left->tn_strg->st_tspec == CHAR) {
436 /* constant string, write all format specifiers */
437 outchar('s');
438 outint(n);
439 outfstrg(arg->tn_left->tn_strg);
440 }
441
442 }
443 /* return value discarded/used/ignored */
444 outchar(rvdisc ? 'd' : (rvused ? 'u' : 'i'));
445
446 /* name of the called function */
447 outname(tn->tn_left->tn_left->tn_sym->s_name);
448
449 /* types of arguments */
450 outchar('f');
451 outint(narg);
452 for (n = 1; n <= narg; n++) {
453 /* the last argument is the top one in the tree */
454 for (i = narg, arg = args; i > n; i--, arg = arg->tn_right) ;
455 outtype(arg->tn_left->tn_type);
456 }
457 /* expected type of return value */
458 outtype(tn->tn_type);
459 }
460
461 /*
462 * extracts potential format specifiers for printf() and scanf() and
463 * writes them, enclosed in "" and qouted if necessary, to the output buffer
464 */
465 static void
466 outfstrg(strg)
467 strg_t *strg;
468 {
469 int c, oc, first;
470 u_char *cp;
471
472 if (strg->st_tspec != CHAR)
473 lerror("outfstrg() 1");
474
475 cp = strg->st_cp;
476
477 outchar('"');
478
479 c = *cp++;
480
481 while (c != '\0') {
482
483 if (c != '%') {
484 c = *cp++;
485 continue;
486 }
487
488 outqchar('%');
489 c = *cp++;
490
491 /* flags for printf and scanf and *-fieldwidth for printf */
492 while (c != '\0' && (c == '-' || c == '+' || c == ' ' ||
493 c == '#' || c == '0' || c == '*')) {
494 outqchar(c);
495 c = *cp++;
496 }
497
498 /* numeric field width */
499 while (c != '\0' && isdigit(c)) {
500 outqchar(c);
501 c = *cp++;
502 }
503
504 /* precision for printf */
505 if (c == '.') {
506 outqchar(c);
507 if ((c = *cp++) == '*') {
508 outqchar(c);
509 c = *cp++;
510 } else {
511 while (c != '\0' && isdigit(c)) {
512 outqchar(c);
513 c = *cp++;
514 }
515 }
516 }
517
518 /* h, l, L and q flags fpr printf and scanf */
519 if (c == 'h' || c == 'l' || c == 'L' || c == 'q') {
520 outqchar(c);
521 c = *cp++;
522 }
523
524 /*
525 * The last character. It is always written so we can detect
526 * invalid format specifiers.
527 */
528 if (c != '\0') {
529 outqchar(c);
530 oc = c;
531 c = *cp++;
532 /*
533 * handle [ for scanf. [-] means that a minus sign
534 * was found at an undefined position.
535 */
536 if (oc == '[') {
537 if (c == '^')
538 c = *cp++;
539 if (c == ']')
540 c = *cp++;
541 first = 1;
542 while (c != '\0' && c != ']') {
543 if (c == '-') {
544 if (!first && *cp != ']')
545 outqchar(c);
546 }
547 first = 0;
548 c = *cp++;
549 }
550 if (c == ']') {
551 outqchar(c);
552 c = *cp++;
553 }
554 }
555 }
556
557 }
558
559 outchar('"');
560 }
561
562 /*
563 * writes a record if sym was used
564 */
565 void
566 outusg(sym)
567 sym_t *sym;
568 {
569 /* reset buffer */
570 outclr();
571
572 /*
573 * line number of .c source, 'u' for used, Id of current
574 * source (.c or .h), and line in current source
575 */
576 outint(csrc_pos.p_line);
577 outchar('u');
578 outint(getfnid(curr_pos.p_file));
579 outchar('.');
580 outint(curr_pos.p_line);
581
582 /* necessary to delimit both numbers */
583 outchar('x');
584
585 /* Den Namen des Symbols ausgeben */
586 outname(sym->s_name);
587 }
588