indent.c revision 1.376 1 /* $NetBSD: indent.c,v 1.376 2023/06/16 14:12:10 rillig Exp $ */
2
3 /*-
4 * SPDX-License-Identifier: BSD-4-Clause
5 *
6 * Copyright (c) 1985 Sun Microsystems, Inc.
7 * Copyright (c) 1976 Board of Trustees of the University of Illinois.
8 * Copyright (c) 1980, 1993
9 * The Regents of the University of California. All rights reserved.
10 *
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
13 * are met:
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 * 3. All advertising materials mentioning features or use of this software
20 * must display the following acknowledgement:
21 * This product includes software developed by the University of
22 * California, Berkeley and its contributors.
23 * 4. Neither the name of the University nor the names of its contributors
24 * may be used to endorse or promote products derived from this software
25 * without specific prior written permission.
26 *
27 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
28 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
29 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
30 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
31 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
32 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
33 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
34 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
35 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
36 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
37 * SUCH DAMAGE.
38 */
39
40 #include <sys/cdefs.h>
41 __RCSID("$NetBSD: indent.c,v 1.376 2023/06/16 14:12:10 rillig Exp $");
42
43 #include <sys/param.h>
44 #include <err.h>
45 #include <stdarg.h>
46 #include <stdio.h>
47 #include <stdlib.h>
48 #include <string.h>
49
50 #include "indent.h"
51
52 struct options opt = {
53 .brace_same_line = true,
54 .comment_delimiter_on_blank_line = true,
55 .cuddle_else = true,
56 .comment_column = 33,
57 .decl_indent = 16,
58 .else_if_in_same_line = true,
59 .function_brace_split = true,
60 .format_col1_comments = true,
61 .format_block_comments = true,
62 .indent_parameters = true,
63 .indent_size = 8,
64 .local_decl_indent = -1,
65 .lineup_to_parens = true,
66 .procnames_start_line = true,
67 .star_comment_cont = true,
68 .tabsize = 8,
69 .max_line_length = 78,
70 .use_tabs = true,
71 };
72
73 struct parser_state ps;
74
75 struct buffer token;
76
77 struct buffer lab;
78 struct buffer code;
79 struct buffer com;
80
81 bool found_err;
82 bool had_eof;
83 int line_no = 1;
84
85 static struct {
86 struct parser_state *item;
87 size_t len;
88 size_t cap;
89 } ifdef;
90
91 FILE *input;
92 FILE *output;
93
94 static const char *in_name = "Standard Input";
95 static char backup_name[PATH_MAX];
96 static const char *backup_suffix = ".BAK";
97
98
/*
 * Return 'p' unchanged if it is a valid pointer; otherwise terminate the
 * program with EXIT_FAILURE, reporting the current errno via err(3).
 * Intended for wrapping the result of an allocation.
 */
void *
nonnull(void *p)
{
	if (p != NULL)
		return p;
	err(EXIT_FAILURE, NULL);
	/* NOTREACHED */
}
106
107 static void
108 buf_expand(struct buffer *buf, size_t add_size)
109 {
110 buf->cap = buf->cap + add_size + 400;
111 buf->s = nonnull(realloc(buf->s, buf->cap));
112 }
113
#ifdef debug
/*
 * Store a '\0' directly after the buffer content, without counting it in
 * the length.  Only compiled in debug builds.
 * NOTE(review): the other builds still reference buf_terminate, so they
 * presumably get a replacement from a header -- confirm.
 */
void
buf_terminate(struct buffer *buf)
{
	if (buf->cap == buf->len)
		buf_expand(buf, 1);
	*(buf->s + buf->len) = '\0';
}
#endif
123
124 void
125 buf_add_char(struct buffer *buf, char ch)
126 {
127 if (buf->len == buf->cap)
128 buf_expand(buf, 1);
129 buf->s[buf->len++] = ch;
130 buf_terminate(buf);
131 }
132
133 void
134 buf_add_chars(struct buffer *buf, const char *s, size_t len)
135 {
136 if (len == 0)
137 return;
138 if (len > buf->cap - buf->len)
139 buf_expand(buf, len);
140 memcpy(buf->s + buf->len, s, len);
141 buf->len += len;
142 buf_terminate(buf);
143 }
144
145 static void
146 buf_add_buf(struct buffer *buf, const struct buffer *add)
147 {
148 buf_add_chars(buf, add->s, add->len);
149 }
150
151 void
152 diag(int level, const char *msg, ...)
153 {
154 va_list ap;
155
156 if (level != 0)
157 found_err = true;
158
159 va_start(ap, msg);
160 fprintf(stderr, "%s: %s:%d: ",
161 level == 0 ? "warning" : "error", in_name, line_no);
162 vfprintf(stderr, msg, ap);
163 fprintf(stderr, "\n");
164 va_end(ap);
165 }
166
/*
 * Return the indentation that results from starting at 'ind' and then
 * writing the 'len' characters at 's'.  A newline resets the indentation, a
 * tab advances to the next tab stop, a backspace steps back by one, and
 * every other character advances by one.
 */
int
ind_add(int ind, const char *s, size_t len)
{
	for (size_t i = 0; i < len; i++) {
		switch (s[i]) {
		case '\n':
			ind = 0;
			break;
		case '\t':
			ind = next_tab(ind);
			break;
		case '\b':
			ind--;
			break;
		default:
			ind++;
			break;
		}
	}
	return ind;
}
186
187 static void
188 init_globals(void)
189 {
190 ps_push(psym_stmt, false); /* as a stop symbol */
191 ps.prev_lsym = lsym_semicolon;
192 ps.lbrace_kind = psym_lbrace_block;
193
194 const char *suffix = getenv("SIMPLE_BACKUP_SUFFIX");
195 if (suffix != NULL)
196 backup_suffix = suffix;
197 }
198
/*
 * Load the profile files, unless '-npro' occurs anywhere on the command
 * line.  The last '-P<name>' argument with a non-empty name selects the
 * profile name that is passed on; without one, NULL is passed.
 */
static void
load_profiles(int argc, char **argv)
{
	const char *profile_name = NULL;
	int i = 1;

	while (i < argc) {
		const char *arg = argv[i++];

		if (strcmp(arg, "-npro") == 0)
			return;
		if (strncmp(arg, "-P", 2) == 0 && arg[2] != '\0')
			profile_name = &arg[2];
	}

	load_profile_files(profile_name);
}
215
216 /*
217 * Copy the input file to the backup file, then make the backup file the input
218 * and the original input file the output.
219 */
220 static void
221 copy_to_bak_file(void)
222 {
223 size_t n;
224 char buff[BUFSIZ];
225
226 const char *last_slash = strrchr(in_name, '/');
227 const char *base = last_slash != NULL ? last_slash + 1 : in_name;
228 snprintf(backup_name, sizeof(backup_name), "%s%s", base, backup_suffix);
229
230 /* copy the input file to the backup file */
231 FILE *bak = fopen(backup_name, "w");
232 if (bak == NULL)
233 err(1, "%s", backup_name);
234
235 while ((n = fread(buff, 1, sizeof(buff), input)) > 0)
236 if (fwrite(buff, 1, n, bak) != n)
237 err(1, "%s", backup_name);
238 if (fclose(input) != 0)
239 err(1, "%s", in_name);
240 if (fclose(bak) != 0)
241 err(1, "%s", backup_name);
242
243 /* re-open the backup file as the input file */
244 input = fopen(backup_name, "r");
245 if (input == NULL)
246 err(1, "%s", backup_name);
247 /* now the original input file will be the output */
248 output = fopen(in_name, "w");
249 if (output == NULL) {
250 remove(backup_name);
251 err(1, "%s", in_name);
252 }
253 }
254
255 static void
256 parse_command_line(int argc, char **argv)
257 {
258 for (int i = 1; i < argc; ++i) {
259 const char *arg = argv[i];
260
261 if (arg[0] == '-') {
262 set_option(arg, "Command line");
263
264 } else if (input == NULL) {
265 in_name = arg;
266 if ((input = fopen(in_name, "r")) == NULL)
267 err(1, "%s", in_name);
268
269 } else if (output == NULL) {
270 if (strcmp(arg, in_name) == 0)
271 errx(1, "input and output files "
272 "must be different");
273 if ((output = fopen(arg, "w")) == NULL)
274 err(1, "%s", arg);
275
276 } else
277 errx(1, "too many arguments: %s", arg);
278 }
279
280 if (input == NULL) {
281 input = stdin;
282 output = stdout;
283 } else if (output == NULL)
284 copy_to_bak_file();
285
286 if (opt.comment_column <= 1)
287 opt.comment_column = 2; /* don't put normal comments in column
288 * 1, see opt.format_col1_comments */
289 if (opt.block_comment_max_line_length <= 0)
290 opt.block_comment_max_line_length = opt.max_line_length;
291 if (opt.local_decl_indent < 0)
292 opt.local_decl_indent = opt.decl_indent;
293 if (opt.decl_comment_column <= 0)
294 opt.decl_comment_column = opt.left_justify_decl
295 ? (opt.comment_column <= 10 ? 2 : opt.comment_column - 8)
296 : opt.comment_column;
297 if (opt.continuation_indent == 0)
298 opt.continuation_indent = opt.indent_size;
299 }
300
301 static void
302 set_initial_indentation(void)
303 {
304 inp_read_line();
305
306 int ind = 0;
307 for (const char *p = inp_p;; p++) {
308 if (*p == ' ')
309 ind++;
310 else if (*p == '\t')
311 ind = next_tab(ind);
312 else
313 break;
314 }
315
316 ps.ind_level = ps.ind_level_follow = ind / opt.indent_size;
317 }
318
319 static bool
320 should_break_line(lexer_symbol lsym)
321 {
322 if (lsym == lsym_semicolon)
323 return false;
324 if (ps.prev_lsym == lsym_lbrace || ps.prev_lsym == lsym_semicolon)
325 return true;
326 if (lsym == lsym_lbrace && opt.brace_same_line)
327 return false;
328 return true;
329 }
330
331 static void
332 move_com_to_code(lexer_symbol lsym)
333 {
334 if (ps.want_blank)
335 buf_add_char(&code, ' ');
336 buf_add_buf(&code, &com);
337 buf_clear(&com);
338 ps.want_blank = lsym != lsym_rparen && lsym != lsym_rbracket;
339 }
340
341 static void
342 update_ps_lbrace_kind(lexer_symbol lsym)
343 {
344 if (lsym == lsym_tag) {
345 ps.lbrace_kind = token.s[0] == 's' ? psym_lbrace_struct :
346 token.s[0] == 'u' ? psym_lbrace_union :
347 psym_lbrace_enum;
348 } else if (lsym == lsym_type_outside_parentheses
349 || lsym == lsym_word
350 || lsym == lsym_lbrace) {
351 /* Keep the current '{' kind. */
352 } else
353 ps.lbrace_kind = psym_lbrace_block;
354 }
355
356 static void
357 indent_declarator(int decl_ind, bool tabs_to_var)
358 {
359 int base = ps.ind_level * opt.indent_size;
360 int ind = ind_add(base, code.s, code.len);
361 int target = base + decl_ind;
362 size_t orig_code_len = code.len;
363
364 if (tabs_to_var)
365 for (int next; (next = next_tab(ind)) <= target; ind = next)
366 buf_add_char(&code, '\t');
367 for (; ind < target; ind++)
368 buf_add_char(&code, ' ');
369 if (code.len == orig_code_len && ps.want_blank)
370 buf_add_char(&code, ' ');
371
372 ps.want_blank = false;
373 ps.decl_indent_done = true;
374 }
375
376 static bool
377 is_function_pointer_declaration(void)
378 {
379 return ps.in_decl
380 && !ps.in_typedef_decl
381 && !ps.in_init
382 && !ps.decl_indent_done
383 && !ps.line_has_func_def
384 && ps.ind_paren_level == 0;
385 }
386
387 static int
388 process_eof(void)
389 {
390 finish_output();
391
392 if (ps.psyms.len > 2) /* check for balanced braces */
393 diag(1, "Stuff missing from end of file");
394
395 return found_err ? EXIT_FAILURE : EXIT_SUCCESS;
396 }
397
398 /* move the whole line to the 'label' buffer */
399 static void
400 read_preprocessing_line(void)
401 {
402 enum {
403 PLAIN, STR, CHR, COMM
404 } state = PLAIN;
405
406 buf_add_char(&lab, '#');
407
408 while (inp_p[0] != '\n' || (state == COMM && !had_eof)) {
409 buf_add_char(&lab, inp_next());
410 switch (lab.s[lab.len - 1]) {
411 case '\\':
412 if (state != COMM)
413 buf_add_char(&lab, inp_next());
414 break;
415 case '/':
416 if (inp_p[0] == '*' && state == PLAIN) {
417 state = COMM;
418 buf_add_char(&lab, *inp_p++);
419 }
420 break;
421 case '"':
422 if (state == STR)
423 state = PLAIN;
424 else if (state == PLAIN)
425 state = STR;
426 break;
427 case '\'':
428 if (state == CHR)
429 state = PLAIN;
430 else if (state == PLAIN)
431 state = CHR;
432 break;
433 case '*':
434 if (inp_p[0] == '/' && state == COMM) {
435 state = PLAIN;
436 buf_add_char(&lab, *inp_p++);
437 }
438 break;
439 }
440 }
441
442 while (lab.len > 0 && ch_isblank(lab.s[lab.len - 1]))
443 lab.len--;
444 buf_terminate(&lab);
445 }
446
447 static void
448 paren_stack_push(struct paren_stack *s, int indent, enum paren_level_cast cast)
449 {
450 if (s->len == s->cap) {
451 s->cap = 10 + s->cap;
452 s->item = nonnull(realloc(s->item,
453 sizeof(s->item[0]) * s->cap));
454 }
455 s->item[s->len++] = (struct paren_level){indent, cast};
456 }
457
/*
 * Return a newly allocated copy of the 'size' bytes at 'src'.  The caller
 * owns the result and must free() it.  Terminates the program if memory
 * runs out.
 *
 * A size of 0 is valid, even together with a null 'src', as happens for an
 * array that has never been allocated.  In that case at least 1 byte is
 * requested, since malloc(0) may legitimately return NULL, which nonnull
 * would mistake for an allocation failure, and nothing is copied, since
 * passing a null pointer to memcpy is undefined even for 0 bytes.
 */
static void *
dup_mem(const void *src, size_t size)
{
	void *dst = nonnull(malloc(size > 0 ? size : 1));

	if (size > 0)
		memcpy(dst, src, size);
	return dst;
}
463
/* Return a newly allocated copy of the first 'n' elements of 'arr'. */
#define dup_array(arr, n) \
	dup_mem((arr), (n) * sizeof((arr)[0]))
/* Copy the first 'n' elements from 'from' to 'to'; sized by 'to'. */
#define copy_array(to, from, n) \
	memcpy((to), (from), (n) * sizeof((to)[0]))
468
469 static void
470 parser_state_back_up(struct parser_state *dst)
471 {
472 *dst = ps;
473
474 dst->paren.item = dup_array(ps.paren.item, ps.paren.len);
475 dst->psyms.sym = dup_array(ps.psyms.sym, ps.psyms.len);
476 dst->psyms.ind_level = dup_array(ps.psyms.ind_level, ps.psyms.len);
477 }
478
479 static void
480 parser_state_restore(const struct parser_state *src)
481 {
482 struct paren_level *ps_paren_item = ps.paren.item;
483 size_t ps_paren_cap = ps.paren.cap;
484 enum parser_symbol *ps_psyms_sym = ps.psyms.sym;
485 int *ps_psyms_ind_level = ps.psyms.ind_level;
486 size_t ps_psyms_cap = ps.psyms.cap;
487
488 ps = *src;
489
490 ps.paren.item = ps_paren_item;
491 ps.paren.cap = ps_paren_cap;
492 ps.psyms.sym = ps_psyms_sym;
493 ps.psyms.ind_level = ps_psyms_ind_level;
494 ps.psyms.cap = ps_psyms_cap;
495
496 copy_array(ps.paren.item, src->paren.item, src->paren.len);
497 copy_array(ps.psyms.sym, src->psyms.sym, src->psyms.len);
498 copy_array(ps.psyms.ind_level, src->psyms.ind_level, src->psyms.len);
499 }
500
501 static void
502 parser_state_free(struct parser_state *pst)
503 {
504 free(pst->paren.item);
505 free(pst->psyms.sym);
506 free(pst->psyms.ind_level);
507 }
508
509 static void
510 process_preprocessing(void)
511 {
512 if (lab.len > 0 || code.len > 0 || com.len > 0)
513 output_line();
514
515 read_preprocessing_line();
516
517 const char *dir = lab.s + 1, *line_end = lab.s + lab.len;
518 while (dir < line_end && ch_isblank(*dir))
519 dir++;
520 size_t dir_len = 0;
521 while (dir + dir_len < line_end && ch_isalpha(dir[dir_len]))
522 dir_len++;
523
524 if (dir_len >= 2 && memcmp(dir, "if", 2) == 0) {
525 if (ifdef.len >= ifdef.cap) {
526 ifdef.cap += 5;
527 ifdef.item = nonnull(realloc(ifdef.item,
528 sizeof(ifdef.item[0]) * ifdef.cap));
529 }
530 parser_state_back_up(ifdef.item + ifdef.len++);
531 out.line_kind = lk_pre_if;
532
533 } else if (dir_len >= 2 && memcmp(dir, "el", 2) == 0) {
534 if (ifdef.len == 0)
535 diag(1, "Unmatched #%.*s", (int)dir_len, dir);
536 else
537 parser_state_restore(ifdef.item + ifdef.len - 1);
538 out.line_kind = lk_pre_other;
539
540 } else if (dir_len == 5 && memcmp(dir, "endif", 5) == 0) {
541 if (ifdef.len == 0)
542 diag(1, "Unmatched #endif");
543 else
544 parser_state_free(ifdef.item + --ifdef.len);
545 out.line_kind = lk_pre_endif;
546 } else
547 out.line_kind = lk_pre_other;
548 }
549
550 static void
551 process_newline(void)
552 {
553 if (ps.prev_lsym == lsym_comma
554 && ps.paren.len == 0 && !ps.in_init
555 && !opt.break_after_comma && ps.break_after_comma
556 && lab.len == 0 /* for preprocessing lines */
557 && com.len == 0)
558 goto stay_in_line;
559 if (ps.psyms.sym[ps.psyms.len - 1] == psym_switch_expr
560 && opt.brace_same_line
561 && com.len == 0) {
562 ps.want_newline = true;
563 goto stay_in_line;
564 }
565
566 output_line();
567
568 stay_in_line:
569 ++line_no;
570 }
571
572 static bool
573 want_blank_before_lparen(void)
574 {
575 if (opt.proc_calls_space)
576 return true;
577 if (ps.prev_lsym == lsym_rparen || ps.prev_lsym == lsym_rbracket)
578 return false;
579 if (ps.prev_lsym == lsym_offsetof)
580 return false;
581 if (ps.prev_lsym == lsym_sizeof)
582 return opt.blank_after_sizeof;
583 if (ps.prev_lsym == lsym_word || ps.prev_lsym == lsym_funcname)
584 return false;
585 return true;
586 }
587
588 static void
589 process_lparen(void)
590 {
591
592 if (is_function_pointer_declaration())
593 indent_declarator(ps.decl_ind, ps.tabs_to_var);
594 else if (ps.want_blank && want_blank_before_lparen())
595 buf_add_char(&code, ' ');
596 ps.want_blank = false;
597 buf_add_buf(&code, &token);
598
599 if (opt.extra_expr_indent && ps.spaced_expr_psym != psym_0)
600 ps.extra_expr_indent = eei_maybe;
601
602 if (ps.in_var_decl && ps.psyms.len <= 3 && !ps.in_init) {
603 parse(psym_stmt); /* prepare for function definition */
604 ps.in_var_decl = false;
605 }
606
607 enum paren_level_cast cast = cast_unknown;
608 if (ps.prev_lsym == lsym_offsetof
609 || ps.prev_lsym == lsym_sizeof
610 || ps.prev_lsym == lsym_for
611 || ps.prev_lsym == lsym_if
612 || ps.prev_lsym == lsym_switch
613 || ps.prev_lsym == lsym_while
614 || ps.line_has_func_def)
615 cast = cast_no;
616
617 paren_stack_push(&ps.paren, ind_add(0, code.s, code.len), cast);
618 }
619
620 static bool
621 rparen_is_cast(bool paren_cast)
622 {
623 if (ps.in_func_def_params)
624 return false;
625 if (ps.prev_lsym == lsym_unary_op)
626 return true;
627 if (ps.line_has_decl && !ps.in_init)
628 return false;
629 return paren_cast || ch_isalpha(inp_p[0]);
630 }
631
632 static void
633 process_rparen(void)
634 {
635 if (ps.paren.len == 0)
636 diag(0, "Extra '%c'", *token.s);
637
638 bool paren_cast = ps.paren.len > 0
639 && ps.paren.item[--ps.paren.len].cast == cast_maybe;
640 ps.prev_paren_was_cast = rparen_is_cast(paren_cast);
641 if (ps.prev_paren_was_cast) {
642 ps.next_unary = true;
643 ps.want_blank = opt.space_after_cast;
644 } else
645 ps.want_blank = true;
646
647 if (code.len == 0)
648 ps.ind_paren_level = (int)ps.paren.len;
649
650 buf_add_buf(&code, &token);
651
652 if (ps.spaced_expr_psym != psym_0 && ps.paren.len == 0) {
653 parse(ps.spaced_expr_psym);
654 ps.spaced_expr_psym = psym_0;
655
656 ps.want_newline = true;
657 ps.next_unary = true;
658 ps.in_stmt_or_decl = false;
659 ps.want_blank = true;
660 out.line_kind = lk_stmt_head;
661 if (ps.extra_expr_indent == eei_maybe)
662 ps.extra_expr_indent = eei_last;
663 }
664 }
665
666 static void
667 process_lbracket(void)
668 {
669 if (code.len > 0
670 && (ps.prev_lsym == lsym_comma || ps.prev_lsym == lsym_binary_op))
671 buf_add_char(&code, ' ');
672 buf_add_buf(&code, &token);
673 ps.want_blank = false;
674
675 paren_stack_push(&ps.paren, ind_add(0, code.s, code.len), cast_no);
676 }
677
678 static void
679 process_rbracket(void)
680 {
681 if (ps.paren.len == 0)
682 diag(0, "Extra '%c'", *token.s);
683 if (ps.paren.len > 0)
684 ps.paren.len--;
685
686 if (code.len == 0)
687 ps.ind_paren_level = (int)ps.paren.len;
688
689 buf_add_buf(&code, &token);
690 ps.want_blank = true;
691 }
692
693 static void
694 process_lbrace(void)
695 {
696 if (ps.prev_lsym == lsym_rparen && ps.prev_paren_was_cast) {
697 ps.in_var_decl = true; // XXX: not really
698 ps.in_init = true;
699 }
700
701 if (out.line_kind == lk_stmt_head)
702 out.line_kind = lk_other;
703
704 ps.in_stmt_or_decl = false; /* don't indent the {} */
705
706 if (ps.in_init)
707 ps.init_level++;
708 else
709 ps.want_newline = true;
710
711 if (code.len > 0 && !ps.in_init) {
712 if (!opt.brace_same_line ||
713 (code.len > 0 && code.s[code.len - 1] == '}'))
714 output_line();
715 else if (ps.in_func_def_params && !ps.in_var_decl) {
716 ps.ind_level_follow = 0;
717 if (opt.function_brace_split)
718 output_line();
719 else
720 ps.want_blank = true;
721 }
722 }
723
724 if (ps.paren.len > 0 && ps.init_level == 0) {
725 diag(1, "Unbalanced parentheses");
726 ps.paren.len = 0;
727 if (ps.spaced_expr_psym != psym_0) {
728 parse(ps.spaced_expr_psym);
729 ps.spaced_expr_psym = psym_0;
730 ps.ind_level = ps.ind_level_follow;
731 }
732 }
733
734 if (code.len == 0)
735 ps.line_is_stmt_cont = false;
736 if (ps.in_decl && ps.in_var_decl) {
737 ps.di_stack[ps.decl_level] = ps.decl_ind;
738 if (++ps.decl_level == (int)array_length(ps.di_stack)) {
739 diag(0, "Reached internal limit of %zu struct levels",
740 array_length(ps.di_stack));
741 ps.decl_level--;
742 }
743 } else {
744 ps.line_has_decl = false; /* don't do special indentation
745 * of comments */
746 ps.in_func_def_params = false;
747 ps.in_decl = false;
748 }
749
750 ps.decl_ind = 0;
751 parse(ps.lbrace_kind);
752 if (ps.want_blank)
753 buf_add_char(&code, ' ');
754 ps.want_blank = false;
755 buf_add_char(&code, '{');
756 ps.declaration = decl_no;
757 }
758
759 static void
760 process_rbrace(void)
761 {
762 if (ps.paren.len > 0 && ps.init_level == 0) {
763 diag(1, "Unbalanced parentheses");
764 ps.paren.len = 0;
765 ps.spaced_expr_psym = psym_0;
766 }
767
768 ps.declaration = decl_no;
769 if (ps.init_level > 0)
770 ps.init_level--;
771
772 if (code.len > 0 && !ps.in_init)
773 output_line();
774
775 buf_add_char(&code, '}');
776 ps.want_blank = true;
777 ps.in_stmt_or_decl = false; // XXX: Initializers don't end a stmt
778 ps.line_is_stmt_cont = false;
779
780 if (ps.decl_level > 0) { /* multi-level structure declaration */
781 ps.decl_ind = ps.di_stack[--ps.decl_level];
782 if (ps.decl_level == 0 && !ps.in_func_def_params) {
783 ps.declaration = decl_begin;
784 ps.decl_ind = ps.ind_level == 0
785 ? opt.decl_indent : opt.local_decl_indent;
786 }
787 ps.in_decl = true;
788 }
789
790 if (ps.psyms.len == 3)
791 out.line_kind = lk_func_end;
792
793 parse(psym_rbrace);
794
795 if (!ps.in_var_decl
796 && ps.psyms.sym[ps.psyms.len - 1] != psym_do_stmt
797 && ps.psyms.sym[ps.psyms.len - 1] != psym_if_expr_stmt)
798 ps.want_newline = true;
799 }
800
801 static void
802 process_period(void)
803 {
804 if (code.len > 0 && code.s[code.len - 1] == ',')
805 buf_add_char(&code, ' ');
806 buf_add_char(&code, '.');
807 ps.want_blank = false;
808 }
809
810 static void
811 process_unary_op(void)
812 {
813 if (is_function_pointer_declaration()) {
814 int ind = ps.decl_ind - (int)token.len;
815 indent_declarator(ind, ps.tabs_to_var);
816 } else if ((token.s[0] == '+' || token.s[0] == '-')
817 && code.len > 0 && code.s[code.len - 1] == token.s[0])
818 ps.want_blank = true;
819
820 if (ps.want_blank)
821 buf_add_char(&code, ' ');
822 buf_add_buf(&code, &token);
823 ps.want_blank = false;
824 }
825
826 static void
827 process_postfix_op(void)
828 {
829 buf_add_buf(&code, &token);
830 ps.want_blank = true;
831 }
832
833 static void
834 process_comma(void)
835 {
836 ps.want_blank = code.len > 0; /* only put blank after comma if comma
837 * does not start the line */
838
839 if (ps.in_decl && ps.ind_paren_level == 0
840 && !ps.line_has_func_def && !ps.in_init && !ps.decl_indent_done) {
841 /* indent leading commas and not the actual identifiers */
842 indent_declarator(ps.decl_ind - 1, ps.tabs_to_var);
843 }
844
845 buf_add_char(&code, ',');
846
847 if (ps.paren.len == 0) {
848 if (ps.init_level == 0)
849 ps.in_init = false;
850 int typical_varname_length = 8;
851 if (ps.break_after_comma && (opt.break_after_comma ||
852 ind_add(compute_code_indent(), code.s, code.len)
853 >= opt.max_line_length - typical_varname_length))
854 ps.want_newline = true;
855 }
856 }
857
858 static void
859 process_label_colon(void)
860 {
861 buf_add_buf(&lab, &code);
862 buf_add_char(&lab, ':');
863 buf_clear(&code);
864
865 if (ps.seen_case)
866 out.line_kind = lk_case_or_default;
867 ps.in_stmt_or_decl = false;
868 ps.want_newline = ps.seen_case;
869 ps.seen_case = false;
870 ps.want_blank = false;
871 }
872
873 static void
874 process_other_colon(void)
875 {
876 buf_add_char(&code, ':');
877 ps.want_blank = ps.decl_level == 0;
878 }
879
880 static void
881 process_semicolon(void)
882 {
883 if (out.line_kind == lk_stmt_head)
884 out.line_kind = lk_other;
885 if (ps.decl_level == 0) {
886 ps.in_var_decl = false;
887 ps.in_typedef_decl = false;
888 }
889 ps.seen_case = false; /* only needs to be reset on error */
890 ps.quest_level = 0; /* only needs to be reset on error */
891 if (ps.prev_lsym == lsym_rparen)
892 ps.in_func_def_params = false;
893 ps.in_init = false;
894 ps.init_level = 0;
895 ps.declaration = ps.declaration == decl_begin ? decl_end : decl_no;
896
897 if (ps.in_decl && code.len == 0 && !ps.in_init &&
898 !ps.decl_indent_done && ps.ind_paren_level == 0) {
899 /* indent stray semicolons in declarations */
900 indent_declarator(ps.decl_ind - 1, ps.tabs_to_var);
901 }
902
903 ps.in_decl = ps.decl_level > 0; /* if we were in a first level
904 * structure declaration before, we
905 * aren't anymore */
906
907 if (ps.paren.len > 0 && ps.spaced_expr_psym != psym_for_exprs) {
908 diag(1, "Unbalanced parentheses");
909 ps.paren.len = 0;
910 if (ps.spaced_expr_psym != psym_0) {
911 parse(ps.spaced_expr_psym);
912 ps.spaced_expr_psym = psym_0;
913 }
914 }
915 buf_add_char(&code, ';');
916 ps.want_blank = true;
917 ps.in_stmt_or_decl = ps.paren.len > 0;
918 ps.decl_ind = 0;
919
920 if (ps.spaced_expr_psym == psym_0) {
921 parse(psym_stmt);
922 ps.want_newline = true;
923 }
924 }
925
926 static void
927 process_type_outside_parentheses(void)
928 {
929 parse(psym_decl); /* let the parser worry about indentation */
930
931 if (ps.prev_lsym == lsym_rparen && ps.psyms.len <= 2 && code.len > 0)
932 output_line();
933
934 if (ps.in_func_def_params && opt.indent_parameters &&
935 ps.decl_level == 0) {
936 ps.ind_level = ps.ind_level_follow = 1;
937 ps.line_is_stmt_cont = false;
938 }
939
940 ps.in_var_decl = /* maybe */ true;
941 ps.in_decl = true;
942 ps.line_has_decl = ps.in_decl;
943 if (ps.decl_level == 0)
944 ps.declaration = decl_begin;
945
946 int ind = ps.ind_level > 0 && ps.decl_level == 0
947 ? opt.local_decl_indent /* local variable */
948 : opt.decl_indent; /* global variable, or member */
949 if (ind == 0) {
950 int ind0 = code.len > 0 ? ind_add(0, code.s, code.len) + 1 : 0;
951 ps.decl_ind = ind_add(ind0, token.s, token.len) + 1;
952 } else
953 ps.decl_ind = ind;
954 ps.tabs_to_var = opt.use_tabs && ind > 0;
955 }
956
957 static void
958 process_word(lexer_symbol lsym)
959 {
960 if (ps.in_decl) {
961 if (lsym == lsym_funcname) {
962 ps.in_decl = false;
963 if (opt.procnames_start_line && code.len > 0)
964 output_line();
965 else if (ps.want_blank)
966 buf_add_char(&code, ' ');
967 ps.want_blank = false;
968 } else if (ps.in_typedef_decl && ps.decl_level == 0) {
969 /* Do not indent typedef declarators. */
970 } else if (!ps.in_init && !ps.decl_indent_done &&
971 ps.ind_paren_level == 0) {
972 if (opt.decl_indent == 0
973 && code.len > 0 && code.s[code.len - 1] == '}')
974 ps.decl_ind = ind_add(0, code.s, code.len) + 1;
975 indent_declarator(ps.decl_ind, ps.tabs_to_var);
976 }
977
978 } else if (ps.spaced_expr_psym != psym_0 && ps.paren.len == 0) {
979 parse(ps.spaced_expr_psym);
980 ps.spaced_expr_psym = psym_0;
981 ps.want_newline = true;
982 ps.in_stmt_or_decl = false;
983 ps.next_unary = true;
984 }
985 }
986
987 static void
988 process_do(void)
989 {
990 ps.in_stmt_or_decl = false;
991 ps.in_decl = false;
992
993 if (code.len > 0)
994 output_line();
995
996 parse(psym_do);
997 ps.want_newline = true;
998 }
999
1000 static void
1001 process_else(void)
1002 {
1003 ps.in_stmt_or_decl = false;
1004 ps.in_decl = false;
1005
1006 if (code.len > 0
1007 && !(opt.cuddle_else && code.s[code.len - 1] == '}'))
1008 output_line();
1009
1010 parse(psym_else);
1011 ps.want_newline = true;
1012 }
1013
1014 static void
1015 process_lsym(lexer_symbol lsym)
1016 {
1017 switch (lsym) {
1018 /* INDENT OFF */
1019 case lsym_preprocessing: process_preprocessing(); break;
1020 case lsym_newline: process_newline(); break;
1021 case lsym_comment: process_comment(); break;
1022 case lsym_lparen: process_lparen(); break;
1023 case lsym_lbracket: process_lbracket(); break;
1024 case lsym_rparen: process_rparen(); break;
1025 case lsym_rbracket: process_rbracket(); break;
1026 case lsym_lbrace: process_lbrace(); break;
1027 case lsym_rbrace: process_rbrace(); break;
1028 case lsym_period: process_period(); break;
1029 case lsym_unary_op: process_unary_op(); break;
1030 case lsym_postfix_op: process_postfix_op(); break;
1031 case lsym_binary_op: goto copy_token;
1032 case lsym_question: ps.quest_level++; goto copy_token;
1033 case lsym_question_colon: goto copy_token;
1034 case lsym_label_colon: process_label_colon(); break;
1035 case lsym_other_colon: process_other_colon(); break;
1036 case lsym_comma: process_comma(); break;
1037 case lsym_semicolon: process_semicolon(); break;
1038 case lsym_typedef: ps.in_typedef_decl = true; goto copy_token;
1039 case lsym_modifier: goto copy_token;
1040 case lsym_case: ps.seen_case = true; goto copy_token;
1041 case lsym_default: ps.seen_case = true; goto copy_token;
1042 case lsym_do: process_do(); goto copy_token;
1043 case lsym_else: process_else(); goto copy_token;
1044 case lsym_for: ps.spaced_expr_psym = psym_for_exprs; goto copy_token;
1045 case lsym_if: ps.spaced_expr_psym = psym_if_expr; goto copy_token;
1046 case lsym_switch: ps.spaced_expr_psym = psym_switch_expr; goto copy_token;
1047 case lsym_while: ps.spaced_expr_psym = psym_while_expr; goto copy_token;
1048 /* INDENT ON */
1049
1050 case lsym_tag:
1051 if (ps.paren.len > 0)
1052 goto copy_token;
1053 /* FALLTHROUGH */
1054 case lsym_type_outside_parentheses:
1055 process_type_outside_parentheses();
1056 goto copy_token;
1057
1058 case lsym_type_in_parentheses:
1059 case lsym_sizeof:
1060 case lsym_offsetof:
1061 case lsym_word:
1062 case lsym_funcname:
1063 case lsym_return:
1064 process_word(lsym);
1065 copy_token:
1066 if (ps.want_blank)
1067 buf_add_char(&code, ' ');
1068 buf_add_buf(&code, &token);
1069 if (lsym != lsym_funcname)
1070 ps.want_blank = true;
1071 break;
1072
1073 default:
1074 break;
1075 }
1076 }
1077
1078 static int
1079 indent(void)
1080 {
1081 debug_parser_state();
1082
1083 for (;;) { /* loop until we reach eof */
1084 lexer_symbol lsym = lexi();
1085
1086 debug_blank_line();
1087 debug_printf("line %d: %s", line_no, lsym_name[lsym]);
1088 debug_print_buf("token", &token);
1089 debug_buffers();
1090 debug_blank_line();
1091
1092 if (lsym == lsym_eof)
1093 return process_eof();
1094
1095 if (lsym == lsym_preprocessing || lsym == lsym_newline)
1096 ps.want_newline = false;
1097 else if (lsym == lsym_comment) {
1098 /* no special processing */
1099 } else {
1100 if (lsym == lsym_if && ps.prev_lsym == lsym_else
1101 && opt.else_if_in_same_line)
1102 ps.want_newline = false;
1103
1104 if (ps.want_newline && should_break_line(lsym)) {
1105 ps.want_newline = false;
1106 output_line();
1107 }
1108 ps.in_stmt_or_decl = true;
1109 if (com.len > 0)
1110 move_com_to_code(lsym);
1111 update_ps_lbrace_kind(lsym);
1112 }
1113
1114 process_lsym(lsym);
1115
1116 if (lsym != lsym_preprocessing
1117 && lsym != lsym_newline
1118 && lsym != lsym_comment)
1119 ps.prev_lsym = lsym;
1120
1121 debug_parser_state();
1122 }
1123 }
1124
/*
 * The program entry point: set up the global state, load the profiles,
 * process the command line, then format the input.
 */
int
main(int argc, char **argv)
{
	int status;

	init_globals();
	load_profiles(argc, argv);
	parse_command_line(argc, argv);
	set_initial_indentation();

	status = indent();
	return status;
}
1134