indent.c revision 1.91 1 1.91 rillig /* $NetBSD: indent.c,v 1.91 2021/09/27 20:00:41 rillig Exp $ */
2 1.4 tls
3 1.25 kamil /*-
4 1.25 kamil * SPDX-License-Identifier: BSD-4-Clause
5 1.25 kamil *
6 1.25 kamil * Copyright (c) 1985 Sun Microsystems, Inc.
7 1.25 kamil * Copyright (c) 1976 Board of Trustees of the University of Illinois.
8 1.5 mrg * Copyright (c) 1980, 1993
9 1.5 mrg * The Regents of the University of California. All rights reserved.
10 1.15 agc *
11 1.15 agc * Redistribution and use in source and binary forms, with or without
12 1.15 agc * modification, are permitted provided that the following conditions
13 1.15 agc * are met:
14 1.15 agc * 1. Redistributions of source code must retain the above copyright
15 1.15 agc * notice, this list of conditions and the following disclaimer.
16 1.15 agc * 2. Redistributions in binary form must reproduce the above copyright
17 1.15 agc * notice, this list of conditions and the following disclaimer in the
18 1.15 agc * documentation and/or other materials provided with the distribution.
19 1.1 cgd * 3. All advertising materials mentioning features or use of this software
20 1.1 cgd * must display the following acknowledgement:
21 1.1 cgd * This product includes software developed by the University of
22 1.1 cgd * California, Berkeley and its contributors.
23 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
24 1.1 cgd * may be used to endorse or promote products derived from this software
25 1.1 cgd * without specific prior written permission.
26 1.1 cgd *
27 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
28 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
29 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
30 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
31 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
32 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
33 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
34 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
35 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
36 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
37 1.1 cgd * SUCH DAMAGE.
38 1.1 cgd */
39 1.1 cgd
40 1.25 kamil #if 0
41 1.25 kamil static char sccsid[] = "@(#)indent.c 5.17 (Berkeley) 6/7/93";
42 1.25 kamil #endif
43 1.1 cgd
44 1.25 kamil #include <sys/cdefs.h>
45 1.25 kamil #if defined(__NetBSD__)
46 1.91 rillig __RCSID("$NetBSD: indent.c,v 1.91 2021/09/27 20:00:41 rillig Exp $");
47 1.25 kamil #elif defined(__FreeBSD__)
48 1.25 kamil __FBSDID("$FreeBSD: head/usr.bin/indent/indent.c 340138 2018-11-04 19:24:49Z oshogbo $");
49 1.25 kamil #endif
50 1.1 cgd
51 1.1 cgd #include <sys/param.h>
52 1.25 kamil #if HAVE_CAPSICUM
53 1.25 kamil #include <sys/capsicum.h>
54 1.25 kamil #include <capsicum_helpers.h>
55 1.25 kamil #endif
56 1.82 rillig #include <ctype.h>
57 1.6 lukem #include <err.h>
58 1.6 lukem #include <errno.h>
59 1.1 cgd #include <fcntl.h>
60 1.1 cgd #include <stdio.h>
61 1.1 cgd #include <stdlib.h>
62 1.1 cgd #include <string.h>
63 1.82 rillig #include <unistd.h>
64 1.29 rillig
65 1.25 kamil #include "indent.h"
66 1.25 kamil
67 1.71 rillig struct options opt = {
68 1.86 rillig .btype_2 = true,
69 1.86 rillig .comment_delimiter_on_blankline = true,
70 1.86 rillig .cuddle_else = true,
71 1.86 rillig .comment_column = 33,
72 1.86 rillig .decl_indent = 16,
73 1.86 rillig .else_if = true,
74 1.86 rillig .function_brace_split = true,
75 1.86 rillig .format_col1_comments = true,
76 1.86 rillig .format_block_comments = true,
77 1.86 rillig .indent_parameters = true,
78 1.86 rillig .indent_size = 8,
79 1.86 rillig .local_decl_indent = -1,
80 1.86 rillig .lineup_to_parens = true,
81 1.86 rillig .procnames_start_line = true,
82 1.86 rillig .star_comment_cont = true,
83 1.86 rillig .tabsize = 8,
84 1.86 rillig .max_line_length = 78,
85 1.86 rillig .use_tabs = true,
86 1.71 rillig };
87 1.71 rillig
88 1.27 joerg struct parser_state ps;
89 1.27 joerg
90 1.63 rillig struct buffer lab;
91 1.65 rillig struct buffer code;
92 1.63 rillig struct buffer com;
93 1.67 rillig struct buffer token;
94 1.27 joerg
95 1.86 rillig char *in_buffer;
96 1.86 rillig char *in_buffer_limit;
97 1.86 rillig char *buf_ptr;
98 1.86 rillig char *buf_end;
99 1.86 rillig
100 1.86 rillig char sc_buf[sc_size];
101 1.86 rillig char *save_com;
102 1.88 rillig static char *sc_end; /* pointer into save_com buffer */
103 1.86 rillig
104 1.86 rillig char *bp_save;
105 1.86 rillig char *be_save;
106 1.86 rillig
107 1.86 rillig bool found_err;
108 1.86 rillig int n_real_blanklines;
109 1.86 rillig bool prefix_blankline_requested;
110 1.86 rillig bool postfix_blankline_requested;
111 1.86 rillig bool break_comma;
112 1.86 rillig float case_ind;
113 1.86 rillig bool had_eof;
114 1.86 rillig int line_no;
115 1.86 rillig bool inhibit_formatting;
116 1.27 joerg
117 1.88 rillig static int ifdef_level;
118 1.88 rillig static struct parser_state state_stack[5];
119 1.27 joerg
120 1.86 rillig FILE *input;
121 1.86 rillig FILE *output;
122 1.27 joerg
123 1.25 kamil static void bakcopy(void);
124 1.75 rillig static void indent_declaration(int, bool);
125 1.1 cgd
126 1.88 rillig static const char *in_name = "Standard Input";
127 1.88 rillig static const char *out_name = "Standard Output";
128 1.88 rillig static const char *backup_suffix = ".BAK";
129 1.88 rillig static char bakfile[MAXPATHLEN] = "";
130 1.1 cgd
131 1.34 rillig static void
132 1.34 rillig check_size_code(size_t desired_size)
133 1.34 rillig {
134 1.81 rillig if (code.e + desired_size >= code.l)
135 1.81 rillig buf_expand(&code, desired_size);
136 1.34 rillig }
137 1.34 rillig
138 1.34 rillig static void
139 1.34 rillig check_size_label(size_t desired_size)
140 1.34 rillig {
141 1.81 rillig if (lab.e + desired_size >= lab.l)
142 1.81 rillig buf_expand(&lab, desired_size);
143 1.34 rillig }
144 1.34 rillig
#if HAVE_CAPSICUM
/*
 * Limit the output descriptor to CAP_FSTAT and CAP_WRITE and the input
 * descriptor to CAP_FSTAT and CAP_READ, then enter capability mode.
 * Any failure terminates the program with EXIT_FAILURE.
 */
static void
init_capsicum(void)
{
    cap_rights_t out_rights;
    cap_rights_t in_rights;

    cap_rights_init(&out_rights, CAP_FSTAT, CAP_WRITE);
    if (caph_rights_limit(fileno(output), &out_rights) < 0)
	err(EXIT_FAILURE, "unable to limit rights for %s", out_name);

    cap_rights_init(&in_rights, CAP_FSTAT, CAP_READ);
    if (caph_rights_limit(fileno(input), &in_rights) < 0)
	err(EXIT_FAILURE, "unable to limit rights for %s", in_name);

    if (caph_enter() < 0)
	err(EXIT_FAILURE, "unable to enter capability mode");
}
#endif
162 1.41 rillig
163 1.41 rillig static void
164 1.91 rillig search_brace_newline(bool *inout_force_nl)
165 1.91 rillig {
166 1.91 rillig if (sc_end == NULL) {
167 1.91 rillig save_com = sc_buf;
168 1.91 rillig save_com[0] = save_com[1] = ' ';
169 1.91 rillig sc_end = &save_com[2];
170 1.91 rillig }
171 1.91 rillig *sc_end++ = '\n';
172 1.91 rillig
173 1.91 rillig /*
174 1.91 rillig * We may have inherited a force_nl == true from the previous
175 1.91 rillig * token (like a semicolon). But once we know that a newline has
176 1.91 rillig * been scanned in this loop, force_nl should be false.
177 1.91 rillig *
178 1.91 rillig * However, the force_nl == true must be preserved if newline is
179 1.91 rillig * never scanned in this loop, so this assignment cannot be done
180 1.91 rillig * earlier.
181 1.91 rillig */
182 1.91 rillig *inout_force_nl = false;
183 1.91 rillig }
184 1.91 rillig
185 1.91 rillig static void
186 1.91 rillig search_brace_comment(bool *inout_comment_buffered)
187 1.91 rillig {
188 1.91 rillig if (sc_end == NULL) {
189 1.91 rillig /*
190 1.91 rillig * Copy everything from the start of the line, because
191 1.91 rillig * process_comment() will use that to calculate original
192 1.91 rillig * indentation of a boxed comment.
193 1.91 rillig */
194 1.91 rillig memcpy(sc_buf, in_buffer, (size_t)(buf_ptr - in_buffer) - 4);
195 1.91 rillig save_com = sc_buf + (buf_ptr - in_buffer - 4);
196 1.91 rillig save_com[0] = save_com[1] = ' ';
197 1.91 rillig sc_end = &save_com[2];
198 1.91 rillig }
199 1.91 rillig *inout_comment_buffered = true;
200 1.91 rillig *sc_end++ = '/'; /* copy in start of comment */
201 1.91 rillig *sc_end++ = '*';
202 1.91 rillig for (;;) { /* loop until the end of the comment */
203 1.91 rillig *sc_end = *buf_ptr++;
204 1.91 rillig if (buf_ptr >= buf_end)
205 1.91 rillig fill_buffer();
206 1.91 rillig if (*sc_end++ == '*' && *buf_ptr == '/')
207 1.91 rillig break; /* we are at end of comment */
208 1.91 rillig if (sc_end >= &save_com[sc_size]) { /* check for temp buffer
209 1.91 rillig * overflow */
210 1.91 rillig diag(1, "Internal buffer overflow - Move big comment from right after if, while, or whatever");
211 1.91 rillig fflush(output);
212 1.91 rillig exit(1);
213 1.91 rillig }
214 1.91 rillig }
215 1.91 rillig *sc_end++ = '/'; /* add ending slash */
216 1.91 rillig if (++buf_ptr >= buf_end) /* get past / in buffer */
217 1.91 rillig fill_buffer();
218 1.91 rillig }
219 1.91 rillig
220 1.91 rillig static bool
221 1.91 rillig search_brace_lbrace(void)
222 1.91 rillig {
223 1.91 rillig /*
224 1.91 rillig * Put KNF-style lbraces before the buffered up tokens and jump
225 1.91 rillig * out of this loop in order to avoid copying the token again
226 1.91 rillig * under the default case of the switch below.
227 1.91 rillig */
228 1.91 rillig if (sc_end != NULL && opt.btype_2) {
229 1.91 rillig save_com[0] = '{';
230 1.91 rillig /*
231 1.91 rillig * Originally the lbrace may have been alone on its own line,
232 1.91 rillig * but it will be moved into "the else's line", so if there
233 1.91 rillig * was a newline resulting from the "{" before, it must be
234 1.91 rillig * scanned now and ignored.
235 1.91 rillig */
236 1.91 rillig while (isspace((unsigned char)*buf_ptr)) {
237 1.91 rillig if (++buf_ptr >= buf_end)
238 1.91 rillig fill_buffer();
239 1.91 rillig if (*buf_ptr == '\n')
240 1.91 rillig break;
241 1.91 rillig }
242 1.91 rillig return true;
243 1.91 rillig }
244 1.91 rillig return false;
245 1.91 rillig }
246 1.91 rillig
247 1.91 rillig static bool
248 1.91 rillig search_brace_other(token_type ttype, bool *inout_force_nl,
249 1.91 rillig bool comment_buffered, bool last_else)
250 1.91 rillig {
251 1.91 rillig bool remove_newlines;
252 1.91 rillig
253 1.91 rillig remove_newlines =
254 1.91 rillig /* "} else" */
255 1.91 rillig (ttype == keyword_do_else && *token.s == 'e' &&
256 1.91 rillig code.e != code.s && code.e[-1] == '}')
257 1.91 rillig /* "else if" */
258 1.91 rillig || (ttype == keyword_for_if_while &&
259 1.91 rillig *token.s == 'i' && last_else && opt.else_if);
260 1.91 rillig if (remove_newlines)
261 1.91 rillig *inout_force_nl = false;
262 1.91 rillig if (sc_end == NULL) { /* ignore buffering if comment wasn't saved
263 1.91 rillig * up */
264 1.91 rillig ps.search_brace = false;
265 1.91 rillig return false;
266 1.91 rillig }
267 1.91 rillig while (sc_end > save_com && isblank((unsigned char)sc_end[-1])) {
268 1.91 rillig sc_end--;
269 1.91 rillig }
270 1.91 rillig if (opt.swallow_optional_blanklines ||
271 1.91 rillig (!comment_buffered && remove_newlines)) {
272 1.91 rillig *inout_force_nl = !remove_newlines;
273 1.91 rillig while (sc_end > save_com && sc_end[-1] == '\n') {
274 1.91 rillig sc_end--;
275 1.91 rillig }
276 1.91 rillig }
277 1.91 rillig if (*inout_force_nl) { /* if we should insert a nl here, put it into
278 1.91 rillig * the buffer */
279 1.91 rillig *inout_force_nl = false;
280 1.91 rillig --line_no; /* this will be re-increased when the newline
281 1.91 rillig * is read from the buffer */
282 1.91 rillig *sc_end++ = '\n';
283 1.91 rillig *sc_end++ = ' ';
284 1.91 rillig if (opt.verbose) /* print error msg if the line was not already
285 1.91 rillig * broken */
286 1.91 rillig diag(0, "Line broken");
287 1.91 rillig }
288 1.91 rillig for (const char *t_ptr = token.s; *t_ptr != '\0'; ++t_ptr)
289 1.91 rillig *sc_end++ = *t_ptr;
290 1.91 rillig return true;
291 1.91 rillig }
292 1.91 rillig
293 1.91 rillig static void
294 1.91 rillig switch_buffer(void)
295 1.91 rillig {
296 1.91 rillig ps.search_brace = false; /* stop looking for start of stmt */
297 1.91 rillig bp_save = buf_ptr; /* save current input buffer */
298 1.91 rillig be_save = buf_end;
299 1.91 rillig buf_ptr = save_com; /* fix so that subsequent calls to lexi will
300 1.91 rillig * take tokens out of save_com */
301 1.91 rillig *sc_end++ = ' '; /* add trailing blank, just in case */
302 1.91 rillig buf_end = sc_end;
303 1.91 rillig sc_end = NULL;
304 1.91 rillig debug_println("switched buf_ptr to save_com");
305 1.91 rillig }
306 1.91 rillig
307 1.91 rillig static void
308 1.91 rillig search_brace_lookahead(token_type *inout_ttype)
309 1.91 rillig {
310 1.91 rillig /*
311 1.91 rillig * We must make this check, just in case there was an unexpected EOF.
312 1.91 rillig */
313 1.91 rillig if (*inout_ttype != end_of_file) {
314 1.91 rillig /*
315 1.91 rillig * The only intended purpose of calling lexi() below is to categorize
316 1.91 rillig * the next token in order to decide whether to continue buffering
317 1.91 rillig * forthcoming tokens. Once the buffering is over, lexi() will be
318 1.91 rillig * called again elsewhere on all of the tokens - this time for normal
319 1.91 rillig * processing.
320 1.91 rillig *
321 1.91 rillig * Calling it for this purpose is a bug, because lexi() also changes
322 1.91 rillig * the parser state and discards leading whitespace, which is needed
323 1.91 rillig * mostly for comment-related considerations.
324 1.91 rillig *
325 1.91 rillig * Work around the former problem by giving lexi() a copy of the
326 1.91 rillig * current parser state and discard it if the call turned out to be
327 1.91 rillig * just a look ahead.
328 1.91 rillig *
329 1.91 rillig * Work around the latter problem by copying all whitespace characters
330 1.91 rillig * into the buffer so that the later lexi() call will read them.
331 1.91 rillig */
332 1.91 rillig if (sc_end != NULL) {
333 1.91 rillig while (*buf_ptr == ' ' || *buf_ptr == '\t') {
334 1.91 rillig *sc_end++ = *buf_ptr++;
335 1.91 rillig if (sc_end >= &save_com[sc_size]) {
336 1.91 rillig errx(1, "input too long");
337 1.91 rillig }
338 1.91 rillig }
339 1.91 rillig if (buf_ptr >= buf_end) {
340 1.91 rillig fill_buffer();
341 1.91 rillig }
342 1.91 rillig }
343 1.91 rillig
344 1.91 rillig struct parser_state transient_state;
345 1.91 rillig transient_state = ps;
346 1.91 rillig *inout_ttype = lexi(&transient_state); /* read another token */
347 1.91 rillig if (*inout_ttype != newline && *inout_ttype != form_feed &&
348 1.91 rillig *inout_ttype != comment && !transient_state.search_brace) {
349 1.91 rillig ps = transient_state;
350 1.91 rillig }
351 1.91 rillig }
352 1.91 rillig }
353 1.91 rillig
354 1.91 rillig static void
355 1.75 rillig search_brace(token_type *inout_ttype, bool *inout_force_nl,
356 1.86 rillig bool *inout_comment_buffered, bool *inout_last_else)
357 1.41 rillig {
358 1.41 rillig while (ps.search_brace) {
359 1.64 rillig switch (*inout_ttype) {
360 1.41 rillig case newline:
361 1.91 rillig search_brace_newline(inout_force_nl);
362 1.59 rillig break;
363 1.41 rillig case form_feed:
364 1.41 rillig break;
365 1.41 rillig case comment:
366 1.91 rillig search_brace_comment(inout_comment_buffered);
367 1.41 rillig break;
368 1.41 rillig case lbrace:
369 1.91 rillig if (search_brace_lbrace())
370 1.41 rillig goto sw_buffer;
371 1.41 rillig /* FALLTHROUGH */
372 1.41 rillig default: /* it is the start of a normal statement */
373 1.91 rillig if (!search_brace_other(*inout_ttype, inout_force_nl,
374 1.91 rillig *inout_comment_buffered, *inout_last_else))
375 1.41 rillig return;
376 1.91 rillig sw_buffer:
377 1.91 rillig switch_buffer();
378 1.41 rillig }
379 1.91 rillig search_brace_lookahead(inout_ttype);
380 1.41 rillig }
381 1.40 rillig
382 1.73 rillig *inout_last_else = false;
383 1.41 rillig }
384 1.1 cgd
385 1.53 rillig static void
386 1.72 rillig buf_init(struct buffer *buf)
387 1.72 rillig {
388 1.72 rillig buf->buf = xmalloc(bufsize);
389 1.86 rillig buf->buf[0] = ' '; /* allow accessing buf->e[-1] */
390 1.72 rillig buf->buf[1] = '\0';
391 1.72 rillig buf->s = buf->buf + 1;
392 1.72 rillig buf->e = buf->s;
393 1.72 rillig buf->l = buf->buf + bufsize - 5; /* safety margin, though unreliable */
394 1.72 rillig }
395 1.72 rillig
396 1.81 rillig void
397 1.81 rillig buf_expand(struct buffer *buf, size_t desired_size)
398 1.81 rillig {
399 1.81 rillig size_t nsize = buf->l - buf->s + 400 + desired_size;
400 1.81 rillig size_t code_len = buf->e - buf->s;
401 1.81 rillig buf->buf = xrealloc(buf->buf, nsize);
402 1.81 rillig buf->e = buf->buf + code_len + 1;
403 1.81 rillig buf->l = buf->buf + nsize - 5;
404 1.81 rillig buf->s = buf->buf + 1;
405 1.81 rillig }
406 1.81 rillig
407 1.72 rillig static void
408 1.53 rillig main_init_globals(void)
409 1.40 rillig {
410 1.83 rillig found_err = false;
411 1.1 cgd
412 1.25 kamil ps.p_stack[0] = stmt; /* this is the parser's stack */
413 1.25 kamil ps.last_nl = true; /* this is true if the last thing scanned was
414 1.1 cgd * a newline */
415 1.25 kamil ps.last_token = semicolon;
416 1.72 rillig buf_init(&com);
417 1.72 rillig buf_init(&lab);
418 1.72 rillig buf_init(&code);
419 1.72 rillig buf_init(&token);
420 1.73 rillig opt.else_if = true; /* XXX: redundant? */
421 1.25 kamil
422 1.68 rillig in_buffer = xmalloc(10);
423 1.25 kamil in_buffer_limit = in_buffer + 8;
424 1.25 kamil buf_ptr = buf_end = in_buffer;
425 1.25 kamil line_no = 1;
426 1.74 rillig had_eof = ps.in_decl = ps.decl_on_line = (break_comma = false);
427 1.25 kamil ps.in_or_st = false;
428 1.25 kamil ps.want_blank = ps.in_stmt = ps.ind_stmt = false;
429 1.25 kamil
430 1.53 rillig ps.pcase = false;
431 1.25 kamil sc_end = NULL;
432 1.25 kamil bp_save = NULL;
433 1.25 kamil be_save = NULL;
434 1.25 kamil
435 1.25 kamil output = NULL;
436 1.25 kamil
437 1.53 rillig const char *suffix = getenv("SIMPLE_BACKUP_SUFFIX");
438 1.53 rillig if (suffix != NULL)
439 1.88 rillig backup_suffix = suffix;
440 1.53 rillig }
441 1.53 rillig
442 1.53 rillig static void
443 1.53 rillig main_parse_command_line(int argc, char **argv)
444 1.53 rillig {
445 1.53 rillig int i;
446 1.53 rillig const char *profile_name = NULL;
447 1.1 cgd
448 1.25 kamil for (i = 1; i < argc; ++i)
449 1.25 kamil if (strcmp(argv[i], "-npro") == 0)
450 1.25 kamil break;
451 1.25 kamil else if (argv[i][0] == '-' && argv[i][1] == 'P' && argv[i][2] != '\0')
452 1.25 kamil profile_name = argv[i]; /* non-empty -P (set profile) */
453 1.25 kamil if (i >= argc)
454 1.25 kamil set_profile(profile_name);
455 1.1 cgd
456 1.25 kamil for (i = 1; i < argc; ++i) {
457 1.80 rillig if (argv[i][0] == '-') {
458 1.80 rillig set_option(argv[i]);
459 1.80 rillig
460 1.80 rillig } else if (input == NULL) {
461 1.80 rillig in_name = argv[i];
462 1.80 rillig input = fopen(in_name, "r");
463 1.80 rillig if (input == NULL)
464 1.80 rillig err(1, "%s", in_name);
465 1.80 rillig
466 1.80 rillig } else if (output == NULL) {
467 1.80 rillig out_name = argv[i];
468 1.80 rillig if (strcmp(in_name, out_name) == 0)
469 1.80 rillig errx(1, "input and output files must be different");
470 1.80 rillig output = fopen(out_name, "w");
471 1.80 rillig if (output == NULL)
472 1.80 rillig err(1, "%s", out_name);
473 1.1 cgd
474 1.80 rillig } else
475 1.25 kamil errx(1, "unknown parameter: %s", argv[i]);
476 1.80 rillig }
477 1.80 rillig
478 1.25 kamil if (input == NULL)
479 1.25 kamil input = stdin;
480 1.25 kamil if (output == NULL) {
481 1.25 kamil if (input == stdin)
482 1.25 kamil output = stdout;
483 1.25 kamil else {
484 1.25 kamil out_name = in_name;
485 1.25 kamil bakcopy();
486 1.1 cgd }
487 1.25 kamil }
488 1.25 kamil
489 1.57 rillig if (opt.comment_column <= 1)
490 1.57 rillig opt.comment_column = 2; /* don't put normal comments before column 2 */
491 1.51 rillig if (opt.block_comment_max_line_length <= 0)
492 1.51 rillig opt.block_comment_max_line_length = opt.max_line_length;
493 1.25 kamil if (opt.local_decl_indent < 0) /* if not specified by user, set this */
494 1.25 kamil opt.local_decl_indent = opt.decl_indent;
495 1.57 rillig if (opt.decl_comment_column <= 0) /* if not specified by user, set this */
496 1.57 rillig opt.decl_comment_column = opt.ljust_decl
497 1.57 rillig ? (opt.comment_column <= 10 ? 2 : opt.comment_column - 8)
498 1.57 rillig : opt.comment_column;
499 1.25 kamil if (opt.continuation_indent == 0)
500 1.57 rillig opt.continuation_indent = opt.indent_size;
501 1.53 rillig }
502 1.53 rillig
503 1.53 rillig static void
504 1.53 rillig main_prepare_parsing(void)
505 1.53 rillig {
506 1.25 kamil fill_buffer(); /* get first batch of stuff into input buffer */
507 1.25 kamil
508 1.25 kamil parse(semicolon);
509 1.53 rillig
510 1.53 rillig char *p = buf_ptr;
511 1.53 rillig int col = 1;
512 1.53 rillig
513 1.59 rillig for (;;) {
514 1.53 rillig if (*p == ' ')
515 1.53 rillig col++;
516 1.53 rillig else if (*p == '\t')
517 1.53 rillig col = opt.tabsize * (1 + (col - 1) / opt.tabsize) + 1;
518 1.53 rillig else
519 1.53 rillig break;
520 1.53 rillig p++;
521 1.25 kamil }
522 1.57 rillig if (col > opt.indent_size)
523 1.79 rillig ps.ind_level = ps.ind_level_follow = col / opt.indent_size;
524 1.53 rillig }
525 1.25 kamil
526 1.60 rillig static void __attribute__((__noreturn__))
527 1.54 rillig process_end_of_file(void)
528 1.54 rillig {
529 1.65 rillig if (lab.s != lab.e || code.s != code.e || com.s != com.e)
530 1.54 rillig dump_line();
531 1.54 rillig
532 1.54 rillig if (ps.tos > 1) /* check for balanced braces */
533 1.54 rillig diag(1, "Stuff missing from end of file");
534 1.54 rillig
535 1.54 rillig if (opt.verbose) {
536 1.54 rillig printf("There were %d output lines and %d comments\n",
537 1.86 rillig ps.stats.lines, ps.stats.comments);
538 1.54 rillig printf("(Lines with comments)/(Lines with code): %6.3f\n",
539 1.86 rillig (1.0 * ps.stats.comment_lines) / ps.stats.code_lines);
540 1.54 rillig }
541 1.54 rillig
542 1.54 rillig fflush(output);
543 1.83 rillig exit(found_err ? EXIT_FAILURE : EXIT_SUCCESS);
544 1.54 rillig }
545 1.54 rillig
546 1.54 rillig static void
547 1.75 rillig process_comment_in_code(token_type ttype, bool *inout_force_nl)
548 1.54 rillig {
549 1.54 rillig if (*inout_force_nl &&
550 1.64 rillig ttype != semicolon &&
551 1.64 rillig (ttype != lbrace || !opt.btype_2)) {
552 1.54 rillig
553 1.54 rillig /* we should force a broken line here */
554 1.54 rillig if (opt.verbose)
555 1.54 rillig diag(0, "Line broken");
556 1.54 rillig dump_line();
557 1.54 rillig ps.want_blank = false; /* dont insert blank at line start */
558 1.54 rillig *inout_force_nl = false;
559 1.54 rillig }
560 1.54 rillig
561 1.54 rillig ps.in_stmt = true; /* turn on flag which causes an extra level of
562 1.84 rillig * indentation. this is turned off by a ';' or
563 1.54 rillig * '}' */
564 1.86 rillig if (com.s != com.e) { /* the turkey has embedded a comment in a
565 1.86 rillig * line. fix it */
566 1.62 rillig size_t len = com.e - com.s;
567 1.54 rillig
568 1.54 rillig check_size_code(len + 3);
569 1.65 rillig *code.e++ = ' ';
570 1.65 rillig memcpy(code.e, com.s, len);
571 1.65 rillig code.e += len;
572 1.65 rillig *code.e++ = ' ';
573 1.65 rillig *code.e = '\0';
574 1.54 rillig ps.want_blank = false;
575 1.62 rillig com.e = com.s;
576 1.54 rillig }
577 1.54 rillig }
578 1.54 rillig
579 1.54 rillig static void
580 1.54 rillig process_form_feed(void)
581 1.54 rillig {
582 1.54 rillig ps.use_ff = true; /* a form feed is treated much like a newline */
583 1.54 rillig dump_line();
584 1.54 rillig ps.want_blank = false;
585 1.54 rillig }
586 1.54 rillig
587 1.54 rillig static void
588 1.54 rillig process_newline(void)
589 1.54 rillig {
590 1.87 rillig if (ps.last_token != comma || ps.p_l_follow > 0 || opt.break_after_comma
591 1.87 rillig || ps.block_init || !break_comma || com.s != com.e) {
592 1.54 rillig dump_line();
593 1.54 rillig ps.want_blank = false;
594 1.54 rillig }
595 1.54 rillig ++line_no; /* keep track of input line number */
596 1.54 rillig }
597 1.54 rillig
598 1.54 rillig static void
599 1.75 rillig process_lparen_or_lbracket(int dec_ind, bool tabs_to_var, bool sp_sw)
600 1.54 rillig {
601 1.54 rillig /* count parens to make Healy happy */
602 1.54 rillig if (++ps.p_l_follow == nitems(ps.paren_indents)) {
603 1.54 rillig diag(0, "Reached internal limit of %zu unclosed parens",
604 1.54 rillig nitems(ps.paren_indents));
605 1.54 rillig ps.p_l_follow--;
606 1.54 rillig }
607 1.67 rillig if (*token.s == '[')
608 1.54 rillig /* not a function pointer declaration or a function call */;
609 1.54 rillig else if (ps.in_decl && !ps.block_init && !ps.dumped_decl_indent &&
610 1.54 rillig ps.procname[0] == '\0' && ps.paren_level == 0) {
611 1.54 rillig /* function pointer declarations */
612 1.54 rillig indent_declaration(dec_ind, tabs_to_var);
613 1.54 rillig ps.dumped_decl_indent = true;
614 1.54 rillig } else if (ps.want_blank &&
615 1.54 rillig ((ps.last_token != ident && ps.last_token != funcname) ||
616 1.54 rillig opt.proc_calls_space ||
617 1.89 rillig (ps.keyword == kw_sizeof ? opt.blank_after_sizeof :
618 1.89 rillig ps.keyword != kw_0 && ps.keyword != kw_offsetof)))
619 1.65 rillig *code.e++ = ' ';
620 1.54 rillig ps.want_blank = false;
621 1.67 rillig *code.e++ = token.s[0];
622 1.58 rillig
623 1.54 rillig ps.paren_indents[ps.p_l_follow - 1] =
624 1.65 rillig indentation_after_range(0, code.s, code.e);
625 1.58 rillig debug_println("paren_indent[%d] is now %d",
626 1.58 rillig ps.p_l_follow - 1, ps.paren_indents[ps.p_l_follow - 1]);
627 1.58 rillig
628 1.54 rillig if (sp_sw && ps.p_l_follow == 1 && opt.extra_expression_indent
629 1.58 rillig && ps.paren_indents[0] < 2 * opt.indent_size) {
630 1.57 rillig ps.paren_indents[0] = 2 * opt.indent_size;
631 1.58 rillig debug_println("paren_indent[0] is now %d", ps.paren_indents[0]);
632 1.58 rillig }
633 1.67 rillig if (ps.in_or_st && *token.s == '(' && ps.tos <= 2) {
634 1.54 rillig /*
635 1.86 rillig * this is a kluge to make sure that declarations will be aligned
636 1.86 rillig * right if proc decl has an explicit type on it, i.e. "int a(x) {..."
637 1.54 rillig */
638 1.54 rillig parse(semicolon); /* I said this was a kluge... */
639 1.54 rillig ps.in_or_st = false; /* turn off flag for structure decl or
640 1.54 rillig * initialization */
641 1.54 rillig }
642 1.54 rillig /* parenthesized type following sizeof or offsetof is not a cast */
643 1.89 rillig if (ps.keyword == kw_offsetof || ps.keyword == kw_sizeof)
644 1.54 rillig ps.not_cast_mask |= 1 << ps.p_l_follow;
645 1.54 rillig }
646 1.54 rillig
647 1.54 rillig static void
648 1.75 rillig process_rparen_or_rbracket(bool *inout_sp_sw, bool *inout_force_nl,
649 1.86 rillig token_type hd_type)
650 1.54 rillig {
651 1.73 rillig if ((ps.cast_mask & (1 << ps.p_l_follow) & ~ps.not_cast_mask) != 0) {
652 1.54 rillig ps.last_u_d = true;
653 1.54 rillig ps.cast_mask &= (1 << ps.p_l_follow) - 1;
654 1.54 rillig ps.want_blank = opt.space_after_cast;
655 1.54 rillig } else
656 1.54 rillig ps.want_blank = true;
657 1.54 rillig ps.not_cast_mask &= (1 << ps.p_l_follow) - 1;
658 1.54 rillig
659 1.54 rillig if (--ps.p_l_follow < 0) {
660 1.54 rillig ps.p_l_follow = 0;
661 1.67 rillig diag(0, "Extra %c", *token.s);
662 1.54 rillig }
663 1.54 rillig
664 1.65 rillig if (code.e == code.s) /* if the paren starts the line */
665 1.54 rillig ps.paren_level = ps.p_l_follow; /* then indent it */
666 1.54 rillig
667 1.67 rillig *code.e++ = token.s[0];
668 1.54 rillig
669 1.86 rillig if (*inout_sp_sw && (ps.p_l_follow == 0)) { /* check for end of if (...),
670 1.86 rillig * or some such */
671 1.54 rillig *inout_sp_sw = false;
672 1.54 rillig *inout_force_nl = true; /* must force newline after if */
673 1.86 rillig ps.last_u_d = true; /* inform lexi that a following operator is
674 1.86 rillig * unary */
675 1.54 rillig ps.in_stmt = false; /* dont use stmt continuation indentation */
676 1.54 rillig
677 1.54 rillig parse(hd_type); /* let parser worry about if, or whatever */
678 1.54 rillig }
679 1.86 rillig ps.search_brace = opt.btype_2; /* this should ensure that constructs
680 1.86 rillig * such as main(){...} and int[]{...}
681 1.86 rillig * have their braces put in the right
682 1.86 rillig * place */
683 1.54 rillig }
684 1.54 rillig
685 1.54 rillig static void
686 1.75 rillig process_unary_op(int dec_ind, bool tabs_to_var)
687 1.54 rillig {
688 1.54 rillig if (!ps.dumped_decl_indent && ps.in_decl && !ps.block_init &&
689 1.54 rillig ps.procname[0] == '\0' && ps.paren_level == 0) {
690 1.54 rillig /* pointer declarations */
691 1.82 rillig indent_declaration(dec_ind - (int)strlen(token.s), tabs_to_var);
692 1.54 rillig ps.dumped_decl_indent = true;
693 1.54 rillig } else if (ps.want_blank)
694 1.65 rillig *code.e++ = ' ';
695 1.54 rillig
696 1.54 rillig {
697 1.67 rillig size_t len = token.e - token.s;
698 1.54 rillig
699 1.54 rillig check_size_code(len);
700 1.67 rillig memcpy(code.e, token.s, len);
701 1.65 rillig code.e += len;
702 1.54 rillig }
703 1.54 rillig ps.want_blank = false;
704 1.54 rillig }
705 1.54 rillig
706 1.54 rillig static void
707 1.54 rillig process_binary_op(void)
708 1.54 rillig {
709 1.67 rillig size_t len = token.e - token.s;
710 1.54 rillig
711 1.54 rillig check_size_code(len + 1);
712 1.54 rillig if (ps.want_blank)
713 1.65 rillig *code.e++ = ' ';
714 1.67 rillig memcpy(code.e, token.s, len);
715 1.65 rillig code.e += len;
716 1.54 rillig
717 1.54 rillig ps.want_blank = true;
718 1.54 rillig }
719 1.54 rillig
720 1.54 rillig static void
721 1.54 rillig process_postfix_op(void)
722 1.54 rillig {
723 1.67 rillig *code.e++ = token.s[0];
724 1.67 rillig *code.e++ = token.s[1];
725 1.54 rillig ps.want_blank = true;
726 1.54 rillig }
727 1.54 rillig
728 1.54 rillig static void
729 1.54 rillig process_question(int *inout_squest)
730 1.54 rillig {
731 1.54 rillig (*inout_squest)++; /* this will be used when a later colon
732 1.54 rillig * appears so we can distinguish the
733 1.54 rillig * <c>?<n>:<n> construct */
734 1.54 rillig if (ps.want_blank)
735 1.65 rillig *code.e++ = ' ';
736 1.65 rillig *code.e++ = '?';
737 1.54 rillig ps.want_blank = true;
738 1.54 rillig }
739 1.54 rillig
740 1.54 rillig static void
741 1.75 rillig process_colon(int *inout_squest, bool *inout_force_nl, bool *inout_scase)
742 1.54 rillig {
743 1.54 rillig if (*inout_squest > 0) { /* it is part of the <c>?<n>: <n> construct */
744 1.54 rillig --*inout_squest;
745 1.54 rillig if (ps.want_blank)
746 1.65 rillig *code.e++ = ' ';
747 1.65 rillig *code.e++ = ':';
748 1.54 rillig ps.want_blank = true;
749 1.54 rillig return;
750 1.54 rillig }
751 1.54 rillig if (ps.in_or_st) {
752 1.65 rillig *code.e++ = ':';
753 1.54 rillig ps.want_blank = false;
754 1.54 rillig return;
755 1.54 rillig }
756 1.54 rillig ps.in_stmt = false; /* seeing a label does not imply we are in a
757 1.54 rillig * stmt */
758 1.54 rillig /*
759 1.54 rillig * turn everything so far into a label
760 1.54 rillig */
761 1.54 rillig {
762 1.65 rillig size_t len = code.e - code.s;
763 1.54 rillig
764 1.54 rillig check_size_label(len + 3);
765 1.65 rillig memcpy(lab.e, code.s, len);
766 1.63 rillig lab.e += len;
767 1.63 rillig *lab.e++ = ':';
768 1.63 rillig *lab.e = '\0';
769 1.65 rillig code.e = code.s;
770 1.54 rillig }
771 1.54 rillig *inout_force_nl = ps.pcase = *inout_scase; /* ps.pcase will be used by
772 1.54 rillig * dump_line to decide how to
773 1.54 rillig * indent the label. force_nl
774 1.54 rillig * will force a case n: to be
775 1.54 rillig * on a line by itself */
776 1.54 rillig *inout_scase = false;
777 1.54 rillig ps.want_blank = false;
778 1.54 rillig }
779 1.54 rillig
780 1.54 rillig static void
781 1.75 rillig process_semicolon(bool *inout_scase, int *inout_squest, int dec_ind,
782 1.86 rillig bool tabs_to_var, bool *inout_sp_sw,
783 1.86 rillig token_type hd_type,
784 1.86 rillig bool *inout_force_nl)
785 1.54 rillig {
786 1.79 rillig if (ps.decl_nest == 0)
787 1.54 rillig ps.in_or_st = false; /* we are not in an initialization or
788 1.54 rillig * structure declaration */
789 1.86 rillig *inout_scase = false; /* these will only need resetting in an error */
790 1.54 rillig *inout_squest = 0;
791 1.54 rillig if (ps.last_token == rparen)
792 1.73 rillig ps.in_parameter_declaration = false;
793 1.54 rillig ps.cast_mask = 0;
794 1.54 rillig ps.not_cast_mask = 0;
795 1.73 rillig ps.block_init = false;
796 1.54 rillig ps.block_init_level = 0;
797 1.54 rillig ps.just_saw_decl--;
798 1.54 rillig
799 1.65 rillig if (ps.in_decl && code.s == code.e && !ps.block_init &&
800 1.54 rillig !ps.dumped_decl_indent && ps.paren_level == 0) {
801 1.54 rillig /* indent stray semicolons in declarations */
802 1.54 rillig indent_declaration(dec_ind - 1, tabs_to_var);
803 1.54 rillig ps.dumped_decl_indent = true;
804 1.54 rillig }
805 1.54 rillig
806 1.79 rillig ps.in_decl = (ps.decl_nest > 0); /* if we were in a first level
807 1.86 rillig * structure declaration, we arent any
808 1.86 rillig * more */
809 1.54 rillig
810 1.54 rillig if ((!*inout_sp_sw || hd_type != for_exprs) && ps.p_l_follow > 0) {
811 1.54 rillig
812 1.54 rillig /*
813 1.86 rillig * This should be true iff there were unbalanced parens in the stmt.
814 1.86 rillig * It is a bit complicated, because the semicolon might be in a for
815 1.86 rillig * stmt
816 1.54 rillig */
817 1.54 rillig diag(1, "Unbalanced parens");
818 1.54 rillig ps.p_l_follow = 0;
819 1.54 rillig if (*inout_sp_sw) { /* this is a check for an if, while, etc. with
820 1.54 rillig * unbalanced parens */
821 1.54 rillig *inout_sp_sw = false;
822 1.54 rillig parse(hd_type); /* dont lose the if, or whatever */
823 1.54 rillig }
824 1.54 rillig }
825 1.65 rillig *code.e++ = ';';
826 1.54 rillig ps.want_blank = true;
827 1.86 rillig ps.in_stmt = (ps.p_l_follow > 0); /* we are no longer in the middle of a
828 1.86 rillig * stmt */
829 1.54 rillig
830 1.54 rillig if (!*inout_sp_sw) { /* if not if for (;;) */
831 1.54 rillig parse(semicolon); /* let parser know about end of stmt */
832 1.86 rillig *inout_force_nl = true; /* force newline after an end of stmt */
833 1.54 rillig }
834 1.54 rillig }
835 1.54 rillig
836 1.54 rillig static void
837 1.75 rillig process_lbrace(bool *inout_force_nl, bool *inout_sp_sw, token_type hd_type,
838 1.86 rillig int *di_stack, int di_stack_cap, int *inout_dec_ind)
839 1.54 rillig {
840 1.86 rillig ps.in_stmt = false; /* dont indent the {} */
841 1.54 rillig if (!ps.block_init)
842 1.54 rillig *inout_force_nl = true; /* force other stuff on same line as '{' onto
843 1.54 rillig * new line */
844 1.54 rillig else if (ps.block_init_level <= 0)
845 1.54 rillig ps.block_init_level = 1;
846 1.54 rillig else
847 1.54 rillig ps.block_init_level++;
848 1.54 rillig
849 1.65 rillig if (code.s != code.e && !ps.block_init) {
850 1.54 rillig if (!opt.btype_2) {
851 1.54 rillig dump_line();
852 1.54 rillig ps.want_blank = false;
853 1.54 rillig } else if (ps.in_parameter_declaration && !ps.in_or_st) {
854 1.79 rillig ps.ind_level_follow = 0;
855 1.86 rillig if (opt.function_brace_split) { /* dump the line prior to the
856 1.86 rillig * brace ... */
857 1.54 rillig dump_line();
858 1.54 rillig ps.want_blank = false;
859 1.54 rillig } else /* add a space between the decl and brace */
860 1.54 rillig ps.want_blank = true;
861 1.54 rillig }
862 1.54 rillig }
863 1.54 rillig if (ps.in_parameter_declaration)
864 1.73 rillig prefix_blankline_requested = false;
865 1.54 rillig
866 1.86 rillig if (ps.p_l_follow > 0) { /* check for preceding unbalanced parens */
867 1.54 rillig diag(1, "Unbalanced parens");
868 1.54 rillig ps.p_l_follow = 0;
869 1.54 rillig if (*inout_sp_sw) { /* check for unclosed if, for, etc. */
870 1.54 rillig *inout_sp_sw = false;
871 1.54 rillig parse(hd_type);
872 1.79 rillig ps.ind_level = ps.ind_level_follow;
873 1.54 rillig }
874 1.54 rillig }
875 1.65 rillig if (code.s == code.e)
876 1.54 rillig ps.ind_stmt = false; /* dont put extra indentation on line
877 1.54 rillig * with '{' */
878 1.54 rillig if (ps.in_decl && ps.in_or_st) { /* this is either a structure
879 1.86 rillig * declaration or an init */
880 1.79 rillig di_stack[ps.decl_nest] = *inout_dec_ind;
881 1.79 rillig if (++ps.decl_nest == di_stack_cap) {
882 1.54 rillig diag(0, "Reached internal limit of %d struct levels",
883 1.86 rillig di_stack_cap);
884 1.79 rillig ps.decl_nest--;
885 1.54 rillig }
886 1.54 rillig /* ? dec_ind = 0; */
887 1.54 rillig } else {
888 1.86 rillig ps.decl_on_line = false; /* we can't be in the middle of a
889 1.86 rillig * declaration, so don't do special
890 1.86 rillig * indentation of comments */
891 1.54 rillig if (opt.blanklines_after_declarations_at_proctop
892 1.54 rillig && ps.in_parameter_declaration)
893 1.73 rillig postfix_blankline_requested = true;
894 1.73 rillig ps.in_parameter_declaration = false;
895 1.54 rillig ps.in_decl = false;
896 1.54 rillig }
897 1.54 rillig *inout_dec_ind = 0;
898 1.86 rillig parse(lbrace); /* let parser know about this */
899 1.86 rillig if (ps.want_blank) /* put a blank before '{' if '{' is not at
900 1.54 rillig * start of line */
901 1.65 rillig *code.e++ = ' ';
902 1.54 rillig ps.want_blank = false;
903 1.65 rillig *code.e++ = '{';
904 1.54 rillig ps.just_saw_decl = 0;
905 1.54 rillig }
906 1.54 rillig
907 1.54 rillig static void
908 1.75 rillig process_rbrace(bool *inout_sp_sw, int *inout_dec_ind, const int *di_stack)
909 1.54 rillig {
910 1.54 rillig if (ps.p_stack[ps.tos] == decl && !ps.block_init) /* semicolons can be
911 1.86 rillig * omitted in
912 1.86 rillig * declarations */
913 1.54 rillig parse(semicolon);
914 1.73 rillig if (ps.p_l_follow != 0) { /* check for unclosed if, for, else. */
915 1.54 rillig diag(1, "Unbalanced parens");
916 1.54 rillig ps.p_l_follow = 0;
917 1.54 rillig *inout_sp_sw = false;
918 1.54 rillig }
919 1.54 rillig ps.just_saw_decl = 0;
920 1.54 rillig ps.block_init_level--;
921 1.65 rillig if (code.s != code.e && !ps.block_init) { /* '}' must be first on line */
922 1.54 rillig if (opt.verbose)
923 1.54 rillig diag(0, "Line broken");
924 1.54 rillig dump_line();
925 1.54 rillig }
926 1.65 rillig *code.e++ = '}';
927 1.54 rillig ps.want_blank = true;
928 1.54 rillig ps.in_stmt = ps.ind_stmt = false;
929 1.79 rillig if (ps.decl_nest > 0) { /* we are in multi-level structure declaration */
930 1.79 rillig *inout_dec_ind = di_stack[--ps.decl_nest];
931 1.79 rillig if (ps.decl_nest == 0 && !ps.in_parameter_declaration)
932 1.54 rillig ps.just_saw_decl = 2;
933 1.54 rillig ps.in_decl = true;
934 1.54 rillig }
935 1.73 rillig prefix_blankline_requested = false;
936 1.54 rillig parse(rbrace); /* let parser know about this */
937 1.54 rillig ps.search_brace = opt.cuddle_else
938 1.86 rillig && ps.p_stack[ps.tos] == if_expr_stmt
939 1.86 rillig && ps.il[ps.tos] >= ps.ind_level;
940 1.79 rillig if (ps.tos <= 1 && opt.blanklines_after_procs && ps.decl_nest <= 0)
941 1.73 rillig postfix_blankline_requested = true;
942 1.54 rillig }
943 1.54 rillig
944 1.54 rillig static void
945 1.75 rillig process_keyword_do_else(bool *inout_force_nl, bool *inout_last_else)
946 1.54 rillig {
947 1.54 rillig ps.in_stmt = false;
948 1.67 rillig if (*token.s == 'e') {
949 1.65 rillig if (code.e != code.s && (!opt.cuddle_else || code.e[-1] != '}')) {
950 1.54 rillig if (opt.verbose)
951 1.54 rillig diag(0, "Line broken");
952 1.54 rillig dump_line(); /* make sure this starts a line */
953 1.54 rillig ps.want_blank = false;
954 1.54 rillig }
955 1.54 rillig *inout_force_nl = true;/* also, following stuff must go onto new line */
956 1.73 rillig *inout_last_else = true;
957 1.54 rillig parse(keyword_else);
958 1.54 rillig } else {
959 1.65 rillig if (code.e != code.s) { /* make sure this starts a line */
960 1.54 rillig if (opt.verbose)
961 1.54 rillig diag(0, "Line broken");
962 1.54 rillig dump_line();
963 1.54 rillig ps.want_blank = false;
964 1.54 rillig }
965 1.54 rillig *inout_force_nl = true;/* also, following stuff must go onto new line */
966 1.73 rillig *inout_last_else = false;
967 1.54 rillig parse(keyword_do);
968 1.54 rillig }
969 1.54 rillig }
970 1.54 rillig
971 1.54 rillig static void
972 1.75 rillig process_decl(int *out_dec_ind, bool *out_tabs_to_var)
973 1.54 rillig {
974 1.54 rillig parse(decl); /* let parser worry about indentation */
975 1.54 rillig if (ps.last_token == rparen && ps.tos <= 1) {
976 1.65 rillig if (code.s != code.e) {
977 1.54 rillig dump_line();
978 1.73 rillig ps.want_blank = false;
979 1.54 rillig }
980 1.54 rillig }
981 1.79 rillig if (ps.in_parameter_declaration && opt.indent_parameters &&
982 1.79 rillig ps.decl_nest == 0) {
983 1.79 rillig ps.ind_level = ps.ind_level_follow = 1;
984 1.73 rillig ps.ind_stmt = false;
985 1.54 rillig }
986 1.54 rillig ps.in_or_st = true; /* this might be a structure or initialization
987 1.54 rillig * declaration */
988 1.54 rillig ps.in_decl = ps.decl_on_line = ps.last_token != type_def;
989 1.79 rillig if ( /* !ps.in_or_st && */ ps.decl_nest <= 0)
990 1.54 rillig ps.just_saw_decl = 2;
991 1.73 rillig prefix_blankline_requested = false;
992 1.54 rillig
993 1.82 rillig int len = (int)strlen(token.s) + 1;
994 1.82 rillig int ind = ps.ind_level == 0 || ps.decl_nest > 0
995 1.82 rillig ? opt.decl_indent /* global variable or local member */
996 1.82 rillig : opt.local_decl_indent; /* local variable */
997 1.82 rillig *out_dec_ind = ind > 0 ? ind : len;
998 1.82 rillig *out_tabs_to_var = opt.use_tabs ? ind > 0 : false;
999 1.54 rillig }
1000 1.54 rillig
1001 1.54 rillig static void
1002 1.75 rillig process_ident(token_type ttype, int dec_ind, bool tabs_to_var,
1003 1.86 rillig bool *inout_sp_sw, bool *inout_force_nl, token_type hd_type)
1004 1.54 rillig {
1005 1.54 rillig if (ps.in_decl) {
1006 1.64 rillig if (ttype == funcname) {
1007 1.54 rillig ps.in_decl = false;
1008 1.65 rillig if (opt.procnames_start_line && code.s != code.e) {
1009 1.65 rillig *code.e = '\0';
1010 1.54 rillig dump_line();
1011 1.54 rillig } else if (ps.want_blank) {
1012 1.65 rillig *code.e++ = ' ';
1013 1.54 rillig }
1014 1.54 rillig ps.want_blank = false;
1015 1.54 rillig } else if (!ps.block_init && !ps.dumped_decl_indent &&
1016 1.86 rillig ps.paren_level == 0) { /* if we are in a declaration, we must
1017 1.86 rillig * indent identifier */
1018 1.54 rillig indent_declaration(dec_ind, tabs_to_var);
1019 1.54 rillig ps.dumped_decl_indent = true;
1020 1.54 rillig ps.want_blank = false;
1021 1.54 rillig }
1022 1.54 rillig } else if (*inout_sp_sw && ps.p_l_follow == 0) {
1023 1.54 rillig *inout_sp_sw = false;
1024 1.54 rillig *inout_force_nl = true;
1025 1.54 rillig ps.last_u_d = true;
1026 1.54 rillig ps.in_stmt = false;
1027 1.54 rillig parse(hd_type);
1028 1.54 rillig }
1029 1.54 rillig }
1030 1.54 rillig
1031 1.54 rillig static void
1032 1.54 rillig copy_id(void)
1033 1.54 rillig {
1034 1.67 rillig size_t len = token.e - token.s;
1035 1.54 rillig
1036 1.54 rillig check_size_code(len + 1);
1037 1.54 rillig if (ps.want_blank)
1038 1.65 rillig *code.e++ = ' ';
1039 1.67 rillig memcpy(code.e, token.s, len);
1040 1.65 rillig code.e += len;
1041 1.54 rillig }
1042 1.54 rillig
1043 1.54 rillig static void
1044 1.54 rillig process_string_prefix(void)
1045 1.54 rillig {
1046 1.67 rillig size_t len = token.e - token.s;
1047 1.54 rillig
1048 1.54 rillig check_size_code(len + 1);
1049 1.54 rillig if (ps.want_blank)
1050 1.65 rillig *code.e++ = ' ';
1051 1.67 rillig memcpy(code.e, token.s, len);
1052 1.65 rillig code.e += len;
1053 1.54 rillig
1054 1.54 rillig ps.want_blank = false;
1055 1.54 rillig }
1056 1.54 rillig
1057 1.54 rillig static void
1058 1.54 rillig process_period(void)
1059 1.54 rillig {
1060 1.85 rillig if (code.e[-1] == ',')
1061 1.85 rillig *code.e++ = ' ';
1062 1.65 rillig *code.e++ = '.'; /* move the period into line */
1063 1.54 rillig ps.want_blank = false; /* dont put a blank after a period */
1064 1.54 rillig }
1065 1.54 rillig
1066 1.54 rillig static void
1067 1.75 rillig process_comma(int dec_ind, bool tabs_to_var, bool *inout_force_nl)
1068 1.54 rillig {
1069 1.86 rillig ps.want_blank = (code.s != code.e); /* only put blank after comma if comma
1070 1.86 rillig * does not start the line */
1071 1.54 rillig if (ps.in_decl && ps.procname[0] == '\0' && !ps.block_init &&
1072 1.54 rillig !ps.dumped_decl_indent && ps.paren_level == 0) {
1073 1.54 rillig /* indent leading commas and not the actual identifiers */
1074 1.54 rillig indent_declaration(dec_ind - 1, tabs_to_var);
1075 1.54 rillig ps.dumped_decl_indent = true;
1076 1.54 rillig }
1077 1.65 rillig *code.e++ = ',';
1078 1.54 rillig if (ps.p_l_follow == 0) {
1079 1.54 rillig if (ps.block_init_level <= 0)
1080 1.73 rillig ps.block_init = false;
1081 1.87 rillig if (break_comma && (opt.break_after_comma ||
1082 1.54 rillig indentation_after_range(
1083 1.65 rillig compute_code_indent(), code.s, code.e)
1084 1.54 rillig >= opt.max_line_length - opt.tabsize))
1085 1.54 rillig *inout_force_nl = true;
1086 1.54 rillig }
1087 1.54 rillig }
1088 1.54 rillig
1089 1.54 rillig static void
1090 1.54 rillig process_preprocessing(void)
1091 1.54 rillig {
1092 1.65 rillig if (com.s != com.e || lab.s != lab.e || code.s != code.e)
1093 1.54 rillig dump_line();
1094 1.54 rillig check_size_label(1);
1095 1.86 rillig *lab.e++ = '#'; /* move whole line to 'label' buffer */
1096 1.54 rillig
1097 1.54 rillig {
1098 1.75 rillig bool in_comment = false;
1099 1.86 rillig int com_start = 0;
1100 1.86 rillig char quote = '\0';
1101 1.86 rillig int com_end = 0;
1102 1.54 rillig
1103 1.54 rillig while (*buf_ptr == ' ' || *buf_ptr == '\t') {
1104 1.54 rillig buf_ptr++;
1105 1.54 rillig if (buf_ptr >= buf_end)
1106 1.54 rillig fill_buffer();
1107 1.54 rillig }
1108 1.54 rillig while (*buf_ptr != '\n' || (in_comment && !had_eof)) {
1109 1.54 rillig check_size_label(2);
1110 1.63 rillig *lab.e = *buf_ptr++;
1111 1.54 rillig if (buf_ptr >= buf_end)
1112 1.54 rillig fill_buffer();
1113 1.63 rillig switch (*lab.e++) {
1114 1.54 rillig case '\\':
1115 1.54 rillig if (!in_comment) {
1116 1.63 rillig *lab.e++ = *buf_ptr++;
1117 1.54 rillig if (buf_ptr >= buf_end)
1118 1.54 rillig fill_buffer();
1119 1.54 rillig }
1120 1.54 rillig break;
1121 1.54 rillig case '/':
1122 1.55 rillig if (*buf_ptr == '*' && !in_comment && quote == '\0') {
1123 1.73 rillig in_comment = true;
1124 1.63 rillig *lab.e++ = *buf_ptr++;
1125 1.63 rillig com_start = (int)(lab.e - lab.s) - 2;
1126 1.54 rillig }
1127 1.54 rillig break;
1128 1.54 rillig case '"':
1129 1.54 rillig if (quote == '"')
1130 1.55 rillig quote = '\0';
1131 1.55 rillig else if (quote == '\0')
1132 1.55 rillig quote = '"';
1133 1.54 rillig break;
1134 1.54 rillig case '\'':
1135 1.54 rillig if (quote == '\'')
1136 1.55 rillig quote = '\0';
1137 1.55 rillig else if (quote == '\0')
1138 1.55 rillig quote = '\'';
1139 1.54 rillig break;
1140 1.54 rillig case '*':
1141 1.54 rillig if (*buf_ptr == '/' && in_comment) {
1142 1.73 rillig in_comment = false;
1143 1.63 rillig *lab.e++ = *buf_ptr++;
1144 1.63 rillig com_end = (int)(lab.e - lab.s);
1145 1.54 rillig }
1146 1.54 rillig break;
1147 1.54 rillig }
1148 1.54 rillig }
1149 1.54 rillig
1150 1.63 rillig while (lab.e > lab.s && (lab.e[-1] == ' ' || lab.e[-1] == '\t'))
1151 1.63 rillig lab.e--;
1152 1.63 rillig if (lab.e - lab.s == com_end && bp_save == NULL) {
1153 1.54 rillig /* comment on preprocessor line */
1154 1.86 rillig if (sc_end == NULL) { /* if this is the first comment, we
1155 1.86 rillig * must set up the buffer */
1156 1.54 rillig save_com = sc_buf;
1157 1.54 rillig sc_end = &save_com[0];
1158 1.54 rillig } else {
1159 1.86 rillig *sc_end++ = '\n'; /* add newline between comments */
1160 1.54 rillig *sc_end++ = ' ';
1161 1.54 rillig --line_no;
1162 1.54 rillig }
1163 1.54 rillig if (sc_end - save_com + com_end - com_start > sc_size)
1164 1.54 rillig errx(1, "input too long");
1165 1.63 rillig memmove(sc_end, lab.s + com_start, (size_t)(com_end - com_start));
1166 1.54 rillig sc_end += com_end - com_start;
1167 1.63 rillig lab.e = lab.s + com_start;
1168 1.63 rillig while (lab.e > lab.s && (lab.e[-1] == ' ' || lab.e[-1] == '\t'))
1169 1.63 rillig lab.e--;
1170 1.54 rillig bp_save = buf_ptr; /* save current input buffer */
1171 1.54 rillig be_save = buf_end;
1172 1.58 rillig buf_ptr = save_com; /* fix so that subsequent calls to lexi will
1173 1.58 rillig * take tokens out of save_com */
1174 1.54 rillig *sc_end++ = ' '; /* add trailing blank, just in case */
1175 1.54 rillig buf_end = sc_end;
1176 1.54 rillig sc_end = NULL;
1177 1.58 rillig debug_println("switched buf_ptr to save_com");
1178 1.54 rillig }
1179 1.54 rillig check_size_label(1);
1180 1.86 rillig *lab.e = '\0'; /* null terminate line */
1181 1.54 rillig ps.pcase = false;
1182 1.54 rillig }
1183 1.54 rillig
1184 1.86 rillig if (strncmp(lab.s, "#if", 3) == 0) { /* also ifdef, ifndef */
1185 1.88 rillig if ((size_t)ifdef_level < nitems(state_stack))
1186 1.54 rillig state_stack[ifdef_level++] = ps;
1187 1.88 rillig else
1188 1.54 rillig diag(1, "#if stack overflow");
1189 1.86 rillig } else if (strncmp(lab.s, "#el", 3) == 0) { /* else, elif */
1190 1.54 rillig if (ifdef_level <= 0)
1191 1.63 rillig diag(1, lab.s[3] == 'i' ? "Unmatched #elif" : "Unmatched #else");
1192 1.88 rillig else
1193 1.54 rillig ps = state_stack[ifdef_level - 1];
1194 1.63 rillig } else if (strncmp(lab.s, "#endif", 6) == 0) {
1195 1.54 rillig if (ifdef_level <= 0)
1196 1.54 rillig diag(1, "Unmatched #endif");
1197 1.54 rillig else
1198 1.54 rillig ifdef_level--;
1199 1.54 rillig } else {
1200 1.63 rillig if (strncmp(lab.s + 1, "pragma", 6) != 0 &&
1201 1.63 rillig strncmp(lab.s + 1, "error", 5) != 0 &&
1202 1.63 rillig strncmp(lab.s + 1, "line", 4) != 0 &&
1203 1.63 rillig strncmp(lab.s + 1, "undef", 5) != 0 &&
1204 1.63 rillig strncmp(lab.s + 1, "define", 6) != 0 &&
1205 1.63 rillig strncmp(lab.s + 1, "include", 7) != 0) {
1206 1.54 rillig diag(1, "Unrecognized cpp directive");
1207 1.54 rillig return;
1208 1.54 rillig }
1209 1.54 rillig }
1210 1.54 rillig if (opt.blanklines_around_conditional_compilation) {
1211 1.73 rillig postfix_blankline_requested = true;
1212 1.54 rillig n_real_blanklines = 0;
1213 1.54 rillig } else {
1214 1.73 rillig postfix_blankline_requested = false;
1215 1.73 rillig prefix_blankline_requested = false;
1216 1.54 rillig }
1217 1.54 rillig
1218 1.54 rillig /*
1219 1.54 rillig * subsequent processing of the newline character will cause the line to
1220 1.54 rillig * be printed
1221 1.54 rillig */
1222 1.54 rillig }
1223 1.54 rillig
1224 1.60 rillig static void __attribute__((__noreturn__))
1225 1.53 rillig main_loop(void)
1226 1.53 rillig {
1227 1.64 rillig token_type ttype;
1228 1.75 rillig bool force_nl; /* when true, code must be broken */
1229 1.75 rillig bool last_else = false; /* true iff last keyword was an else */
1230 1.86 rillig int dec_ind; /* current indentation for declarations */
1231 1.86 rillig int di_stack[20]; /* a stack of structure indentation levels */
1232 1.75 rillig bool tabs_to_var; /* true if using tabs to indent to var name */
1233 1.75 rillig bool sp_sw; /* when true, we are in the expression of
1234 1.53 rillig * if(...), while(...), etc. */
1235 1.86 rillig token_type hd_type = end_of_file; /* used to store type of stmt for if
1236 1.86 rillig * (...), for (...), etc */
1237 1.73 rillig int squest; /* when this is positive, we have seen a '?'
1238 1.73 rillig * without the matching ':' in a <c>?<s>:<s>
1239 1.53 rillig * construct */
1240 1.84 rillig bool scase; /* set to true when we see a 'case', so we
1241 1.53 rillig * know what to do with the following colon */
1242 1.53 rillig
1243 1.53 rillig sp_sw = force_nl = false;
1244 1.53 rillig dec_ind = 0;
1245 1.79 rillig di_stack[ps.decl_nest = 0] = 0;
1246 1.53 rillig scase = false;
1247 1.53 rillig squest = 0;
1248 1.73 rillig tabs_to_var = false;
1249 1.1 cgd
1250 1.59 rillig for (;;) { /* this is the main loop. it will go until we
1251 1.1 cgd * reach eof */
1252 1.75 rillig bool comment_buffered = false;
1253 1.1 cgd
1254 1.64 rillig ttype = lexi(&ps); /* Read the next token. The actual characters
1255 1.64 rillig * read are stored in "token". */
1256 1.1 cgd
1257 1.25 kamil /*
1258 1.25 kamil * The following code moves newlines and comments following an if (),
1259 1.86 rillig * while (), else, etc. up to the start of the following stmt to a
1260 1.86 rillig * buffer. This allows proper handling of both kinds of brace
1261 1.25 kamil * placement (-br, -bl) and cuddling "else" (-ce).
1262 1.25 kamil */
1263 1.64 rillig search_brace(&ttype, &force_nl, &comment_buffered, &last_else);
1264 1.25 kamil
1265 1.64 rillig if (ttype == end_of_file) {
1266 1.54 rillig process_end_of_file();
1267 1.60 rillig /* NOTREACHED */
1268 1.54 rillig }
1269 1.25 kamil
1270 1.25 kamil if (
1271 1.64 rillig ttype != comment &&
1272 1.64 rillig ttype != newline &&
1273 1.64 rillig ttype != preprocessing &&
1274 1.64 rillig ttype != form_feed) {
1275 1.64 rillig process_comment_in_code(ttype, &force_nl);
1276 1.25 kamil
1277 1.86 rillig } else if (ttype != comment) /* preserve force_nl through a comment */
1278 1.25 kamil force_nl = false; /* cancel forced newline after newline, form
1279 1.25 kamil * feed, etc */
1280 1.1 cgd
1281 1.1 cgd
1282 1.1 cgd
1283 1.25 kamil /*-----------------------------------------------------*\
1284 1.25 kamil | do switch on type of token scanned |
1285 1.25 kamil \*-----------------------------------------------------*/
1286 1.65 rillig check_size_code(3); /* maximum number of increments of code.e
1287 1.34 rillig * before the next check_size_code or
1288 1.25 kamil * dump_line() is 2. After that there's the
1289 1.25 kamil * final increment for the null character. */
1290 1.64 rillig switch (ttype) {
1291 1.25 kamil
1292 1.64 rillig case form_feed:
1293 1.54 rillig process_form_feed();
1294 1.25 kamil break;
1295 1.25 kamil
1296 1.25 kamil case newline:
1297 1.54 rillig process_newline();
1298 1.25 kamil break;
1299 1.25 kamil
1300 1.25 kamil case lparen: /* got a '(' or '[' */
1301 1.54 rillig process_lparen_or_lbracket(dec_ind, tabs_to_var, sp_sw);
1302 1.25 kamil break;
1303 1.25 kamil
1304 1.25 kamil case rparen: /* got a ')' or ']' */
1305 1.54 rillig process_rparen_or_rbracket(&sp_sw, &force_nl, hd_type);
1306 1.25 kamil break;
1307 1.25 kamil
1308 1.25 kamil case unary_op: /* this could be any unary operation */
1309 1.54 rillig process_unary_op(dec_ind, tabs_to_var);
1310 1.25 kamil break;
1311 1.25 kamil
1312 1.36 rillig case binary_op: /* any binary operation */
1313 1.54 rillig process_binary_op();
1314 1.25 kamil break;
1315 1.25 kamil
1316 1.39 rillig case postfix_op: /* got a trailing ++ or -- */
1317 1.54 rillig process_postfix_op();
1318 1.25 kamil break;
1319 1.25 kamil
1320 1.25 kamil case question: /* got a ? */
1321 1.54 rillig process_question(&squest);
1322 1.25 kamil break;
1323 1.25 kamil
1324 1.38 rillig case case_label: /* got word 'case' or 'default' */
1325 1.25 kamil scase = true; /* so we can process the later colon properly */
1326 1.25 kamil goto copy_id;
1327 1.25 kamil
1328 1.25 kamil case colon: /* got a ':' */
1329 1.54 rillig process_colon(&squest, &force_nl, &scase);
1330 1.25 kamil break;
1331 1.25 kamil
1332 1.54 rillig case semicolon: /* got a ';' */
1333 1.54 rillig process_semicolon(&scase, &squest, dec_ind, tabs_to_var, &sp_sw,
1334 1.54 rillig hd_type, &force_nl);
1335 1.25 kamil break;
1336 1.25 kamil
1337 1.25 kamil case lbrace: /* got a '{' */
1338 1.54 rillig process_lbrace(&force_nl, &sp_sw, hd_type, di_stack,
1339 1.59 rillig (int)nitems(di_stack), &dec_ind);
1340 1.25 kamil break;
1341 1.25 kamil
1342 1.25 kamil case rbrace: /* got a '}' */
1343 1.54 rillig process_rbrace(&sp_sw, &dec_ind, di_stack);
1344 1.25 kamil break;
1345 1.25 kamil
1346 1.38 rillig case switch_expr: /* got keyword "switch" */
1347 1.25 kamil sp_sw = true;
1348 1.86 rillig hd_type = switch_expr; /* keep this for when we have seen the
1349 1.86 rillig * expression */
1350 1.25 kamil goto copy_id; /* go move the token into buffer */
1351 1.25 kamil
1352 1.37 rillig case keyword_for_if_while:
1353 1.25 kamil sp_sw = true; /* the interesting stuff is done after the
1354 1.25 kamil * expression is scanned */
1355 1.67 rillig hd_type = (*token.s == 'i' ? if_expr :
1356 1.86 rillig (*token.s == 'w' ? while_expr : for_exprs));
1357 1.25 kamil
1358 1.54 rillig /* remember the type of header for later use by parser */
1359 1.25 kamil goto copy_id; /* copy the token into line */
1360 1.25 kamil
1361 1.37 rillig case keyword_do_else:
1362 1.54 rillig process_keyword_do_else(&force_nl, &last_else);
1363 1.25 kamil goto copy_id; /* move the token into line */
1364 1.25 kamil
1365 1.25 kamil case type_def:
1366 1.39 rillig case storage_class:
1367 1.73 rillig prefix_blankline_requested = false;
1368 1.25 kamil goto copy_id;
1369 1.25 kamil
1370 1.39 rillig case keyword_struct_union_enum:
1371 1.25 kamil if (ps.p_l_follow > 0)
1372 1.25 kamil goto copy_id;
1373 1.25 kamil /* FALLTHROUGH */
1374 1.25 kamil case decl: /* we have a declaration type (int, etc.) */
1375 1.54 rillig process_decl(&dec_ind, &tabs_to_var);
1376 1.25 kamil goto copy_id;
1377 1.25 kamil
1378 1.25 kamil case funcname:
1379 1.25 kamil case ident: /* got an identifier or constant */
1380 1.64 rillig process_ident(ttype, dec_ind, tabs_to_var, &sp_sw, &force_nl,
1381 1.86 rillig hd_type);
1382 1.25 kamil copy_id:
1383 1.54 rillig copy_id();
1384 1.64 rillig if (ttype != funcname)
1385 1.25 kamil ps.want_blank = true;
1386 1.25 kamil break;
1387 1.25 kamil
1388 1.39 rillig case string_prefix:
1389 1.54 rillig process_string_prefix();
1390 1.25 kamil break;
1391 1.1 cgd
1392 1.54 rillig case period:
1393 1.54 rillig process_period();
1394 1.25 kamil break;
1395 1.25 kamil
1396 1.25 kamil case comma:
1397 1.54 rillig process_comma(dec_ind, tabs_to_var, &force_nl);
1398 1.25 kamil break;
1399 1.25 kamil
1400 1.39 rillig case preprocessing: /* '#' */
1401 1.54 rillig process_preprocessing();
1402 1.54 rillig break;
1403 1.56 rillig case comment: /* the initial '/' '*' or '//' of a comment */
1404 1.56 rillig process_comment();
1405 1.25 kamil break;
1406 1.30 rillig
1407 1.30 rillig default:
1408 1.30 rillig break;
1409 1.64 rillig }
1410 1.25 kamil
1411 1.65 rillig *code.e = '\0';
1412 1.64 rillig if (ttype != comment &&
1413 1.64 rillig ttype != newline &&
1414 1.64 rillig ttype != preprocessing)
1415 1.64 rillig ps.last_token = ttype;
1416 1.53 rillig }
1417 1.53 rillig }
1418 1.53 rillig
/*
 * Program entry point: set up the global state, evaluate the command line,
 * optionally set up Capsicum, prepare the parser and run the main loop.
 */
int
main(int argc, char **argv)
{
    main_init_globals();
    main_parse_command_line(argc, argv);

#if HAVE_CAPSICUM
    init_capsicum();
#endif

    main_prepare_parsing();

    /* main_loop is declared noreturn, hence no return statement */
    main_loop();
}
1430 1.6 lukem
1431 1.1 cgd /*
1432 1.1 cgd * copy input file to backup file if in_name is /blah/blah/blah/file, then
1433 1.1 cgd * backup file will be ".Bfile" then make the backup file the input and
1434 1.1 cgd * original input file the output
1435 1.1 cgd */
1436 1.25 kamil static void
1437 1.13 wiz bakcopy(void)
1438 1.1 cgd {
1439 1.59 rillig ssize_t n;
1440 1.59 rillig int bakchn;
1441 1.59 rillig char buff[8 * 1024];
1442 1.25 kamil const char *p;
1443 1.25 kamil
1444 1.25 kamil /* construct file name .Bfile */
1445 1.73 rillig for (p = in_name; *p != '\0'; p++); /* skip to end of string */
1446 1.25 kamil while (p > in_name && *p != '/') /* find last '/' */
1447 1.25 kamil p--;
1448 1.25 kamil if (*p == '/')
1449 1.25 kamil p++;
1450 1.88 rillig sprintf(bakfile, "%s%s", p, backup_suffix);
1451 1.25 kamil
1452 1.25 kamil /* copy in_name to backup file */
1453 1.25 kamil bakchn = creat(bakfile, 0600);
1454 1.25 kamil if (bakchn < 0)
1455 1.25 kamil err(1, "%s", bakfile);
1456 1.25 kamil while ((n = read(fileno(input), buff, sizeof(buff))) > 0)
1457 1.59 rillig if (write(bakchn, buff, (size_t)n) != n)
1458 1.25 kamil err(1, "%s", bakfile);
1459 1.25 kamil if (n < 0)
1460 1.25 kamil err(1, "%s", in_name);
1461 1.25 kamil close(bakchn);
1462 1.25 kamil fclose(input);
1463 1.25 kamil
1464 1.25 kamil /* re-open backup file as the input file */
1465 1.25 kamil input = fopen(bakfile, "r");
1466 1.25 kamil if (input == NULL)
1467 1.25 kamil err(1, "%s", bakfile);
1468 1.25 kamil /* now the original input file will be the output */
1469 1.25 kamil output = fopen(in_name, "w");
1470 1.25 kamil if (output == NULL) {
1471 1.25 kamil unlink(bakfile);
1472 1.25 kamil err(1, "%s", in_name);
1473 1.25 kamil }
1474 1.25 kamil }
1475 1.25 kamil
1476 1.25 kamil static void
1477 1.75 rillig indent_declaration(int cur_dec_ind, bool tabs_to_var)
1478 1.25 kamil {
1479 1.65 rillig int pos = (int)(code.e - code.s);
1480 1.65 rillig char *startpos = code.e;
1481 1.25 kamil
1482 1.25 kamil /*
1483 1.86 rillig * get the tab math right for indentations that are not multiples of
1484 1.86 rillig * tabsize
1485 1.25 kamil */
1486 1.57 rillig if ((ps.ind_level * opt.indent_size) % opt.tabsize != 0) {
1487 1.57 rillig pos += (ps.ind_level * opt.indent_size) % opt.tabsize;
1488 1.57 rillig cur_dec_ind += (ps.ind_level * opt.indent_size) % opt.tabsize;
1489 1.25 kamil }
1490 1.25 kamil if (tabs_to_var) {
1491 1.25 kamil int tpos;
1492 1.25 kamil
1493 1.61 rillig check_size_code((size_t)(cur_dec_ind / opt.tabsize));
1494 1.25 kamil while ((tpos = opt.tabsize * (1 + pos / opt.tabsize)) <= cur_dec_ind) {
1495 1.65 rillig *code.e++ = '\t';
1496 1.25 kamil pos = tpos;
1497 1.6 lukem }
1498 1.25 kamil }
1499 1.61 rillig check_size_code((size_t)(cur_dec_ind - pos + 1));
1500 1.25 kamil while (pos < cur_dec_ind) {
1501 1.65 rillig *code.e++ = ' ';
1502 1.25 kamil pos++;
1503 1.25 kamil }
1504 1.65 rillig if (code.e == startpos && ps.want_blank) {
1505 1.65 rillig *code.e++ = ' ';
1506 1.25 kamil ps.want_blank = false;
1507 1.25 kamil }
1508 1.1 cgd }
1509 1.48 rillig
1510 1.48 rillig #ifdef debug
1511 1.48 rillig void
1512 1.48 rillig debug_printf(const char *fmt, ...)
1513 1.48 rillig {
1514 1.48 rillig FILE *f = output == stdout ? stderr : stdout;
1515 1.48 rillig va_list ap;
1516 1.48 rillig
1517 1.48 rillig va_start(ap, fmt);
1518 1.48 rillig vfprintf(f, fmt, ap);
1519 1.48 rillig va_end(ap);
1520 1.48 rillig }
1521 1.48 rillig
1522 1.48 rillig void
1523 1.48 rillig debug_println(const char *fmt, ...)
1524 1.48 rillig {
1525 1.48 rillig FILE *f = output == stdout ? stderr : stdout;
1526 1.48 rillig va_list ap;
1527 1.48 rillig
1528 1.48 rillig va_start(ap, fmt);
1529 1.48 rillig vfprintf(f, fmt, ap);
1530 1.48 rillig va_end(ap);
1531 1.48 rillig fprintf(f, "\n");
1532 1.48 rillig }
1533 1.48 rillig
/*
 * Print the characters from s up to but excluding e in a visible form,
 * between the given prefix and suffix.
 *
 * Printable characters other than backslash and double quote are printed
 * as they are, newline and tab as \n and \t, and every other character as
 * \x followed by the two hex digits of its byte value.
 */
void
debug_vis_range(const char *prefix, const char *s, const char *e,
    const char *suffix)
{
    debug_printf("%s", prefix);
    for (const char *p = s; p < e; p++) {
        if (isprint((unsigned char)*p) && *p != '\\' && *p != '"')
            debug_printf("%c", *p);
        else if (*p == '\n')
            debug_printf("\\n");
        else if (*p == '\t')
            debug_printf("\\t");
        else {
            /*
             * Go through unsigned char; where char is signed, a negative
             * value would otherwise be sign-extended and printed with 8
             * hex digits.
             */
            debug_printf("\\x%02x", (unsigned int)(unsigned char)*p);
        }
    }
    debug_printf("%s", suffix);
}
1551 1.48 rillig #endif
1552 1.68 rillig
/*
 * Return p if it is not a null pointer; otherwise terminate the program
 * via err with EXIT_FAILURE.  Used for checking the results of the
 * allocation functions.
 */
static void *
nonnull(void *p)
{
    if (p != NULL)
        return p;

    err(EXIT_FAILURE, NULL);
    /* NOTREACHED */
}
1560 1.68 rillig
/*
 * Allocate size bytes like malloc; if malloc returns a null pointer, the
 * program is terminated instead of returning to the caller.
 */
void *
xmalloc(size_t size)
{
    void *mem = malloc(size);

    return nonnull(mem);
}
1566 1.68 rillig
/*
 * Resize the allocation p to new_size bytes like realloc; if realloc
 * returns a null pointer, the program is terminated instead of returning
 * to the caller.
 */
void *
xrealloc(void *p, size_t new_size)
{
    void *mem = realloc(p, new_size);

    return nonnull(mem);
}
1572 1.68 rillig
/*
 * Duplicate the string s like strdup; if strdup returns a null pointer,
 * the program is terminated instead of returning to the caller.
 */
char *
xstrdup(const char *s)
{
    char *copy = strdup(s);

    return nonnull(copy);
}
1578