Home | History | Annotate | Line # | Download | only in indent
io.c revision 1.26
      1 /*	$NetBSD: io.c,v 1.26 2021/03/08 22:26:17 rillig Exp $	*/
      2 
      3 /*-
      4  * SPDX-License-Identifier: BSD-4-Clause
      5  *
      6  * Copyright (c) 1985 Sun Microsystems, Inc.
      7  * Copyright (c) 1980, 1993
      8  *	The Regents of the University of California.  All rights reserved.
      9  * All rights reserved.
     10  *
     11  * Redistribution and use in source and binary forms, with or without
     12  * modification, are permitted provided that the following conditions
     13  * are met:
     14  * 1. Redistributions of source code must retain the above copyright
     15  *    notice, this list of conditions and the following disclaimer.
     16  * 2. Redistributions in binary form must reproduce the above copyright
     17  *    notice, this list of conditions and the following disclaimer in the
     18  *    documentation and/or other materials provided with the distribution.
     19  * 3. All advertising materials mentioning features or use of this software
     20  *    must display the following acknowledgement:
     21  *	This product includes software developed by the University of
     22  *	California, Berkeley and its contributors.
     23  * 4. Neither the name of the University nor the names of its contributors
     24  *    may be used to endorse or promote products derived from this software
     25  *    without specific prior written permission.
     26  *
     27  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     28  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     29  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     30  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     31  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     32  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     33  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     34  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     35  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     36  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     37  * SUCH DAMAGE.
     38  */
     39 
     40 #if 0
     41 #ifndef lint
     42 static char sccsid[] = "@(#)io.c	8.1 (Berkeley) 6/6/93";
     43 #endif /* not lint */
     44 #endif
     45 
     46 #include <sys/cdefs.h>
     47 #ifndef lint
     48 #if defined(__NetBSD__)
     49 __RCSID("$NetBSD: io.c,v 1.26 2021/03/08 22:26:17 rillig Exp $");
     50 #elif defined(__FreeBSD__)
     51 __FBSDID("$FreeBSD: head/usr.bin/indent/io.c 334927 2018-06-10 16:44:18Z pstef $");
     52 #endif
     53 #endif
     54 
     55 #include <ctype.h>
     56 #include <err.h>
     57 #include <stdio.h>
     58 #include <stdlib.h>
     59 #include <string.h>
     60 #include <stdarg.h>
     61 
     62 #include "indent.h"
     63 
     64 int         comment_open;	/* when nonzero, dump_line() writes ".*​/" plus a newline and clears it before emitting a label or code section; set outside this file's visible code */
     65 static int  paren_target;	/* column used by compute_code_target() when lining up to parentheses; dump_line() sets it to the negated paren_indents entry of the innermost open paren level */
     66 static int pad_output(int current, int target);	/* forward declaration; defined later in this file */
     67 
     68 /*
     69  * dump_line is the routine that actually effects the printing of the new
     70  * source. It prints the label section, followed by the code section with
     71  * the appropriate nesting level, followed by any comments.
     72  */
     73 void
     74 dump_line(void)
     75 {
     76     int cur_col,
     77                 target_col = 1;
     78     static int  not_first_line;
     79 
     80     if (ps.procname[0]) {
     81 	ps.ind_level = 0;
     82 	ps.procname[0] = 0;
     83     }
     84     if (s_code == e_code && s_lab == e_lab && s_com == e_com) {
     85 	if (suppress_blanklines > 0)
     86 	    suppress_blanklines--;
     87 	else {
     88 	    ps.bl_line = true;
     89 	    n_real_blanklines++;
     90 	}
     91     }
     92     else if (!inhibit_formatting) {
     93 	suppress_blanklines = 0;
     94 	ps.bl_line = false;
     95 	if (prefix_blankline_requested && not_first_line) {
     96 	    if (opt.swallow_optional_blanklines) {
     97 		if (n_real_blanklines == 1)
     98 		    n_real_blanklines = 0;
     99 	    }
    100 	    else {
    101 		if (n_real_blanklines == 0)
    102 		    n_real_blanklines = 1;
    103 	    }
    104 	}
    105 	while (--n_real_blanklines >= 0)
    106 	    putc('\n', output);
    107 	n_real_blanklines = 0;
    108 	if (ps.ind_level == 0)
    109 	    ps.ind_stmt = 0;	/* this is a class A kludge. dont do
    110 				 * additional statement indentation if we are
    111 				 * at bracket level 0 */
    112 
    113 	if (e_lab != s_lab || e_code != s_code)
    114 	    ++code_lines;	/* keep count of lines with code */
    115 
    116 
    117 	if (e_lab != s_lab) {	/* print lab, if any */
    118 	    if (comment_open) {
    119 		comment_open = 0;
    120 		fprintf(output, ".*/\n");
    121 	    }
    122 	    while (e_lab > s_lab && (e_lab[-1] == ' ' || e_lab[-1] == '\t'))
    123 		e_lab--;
    124 	    *e_lab = '\0';
    125 	    cur_col = pad_output(1, compute_label_target());
    126 	    if (s_lab[0] == '#' && (strncmp(s_lab, "#else", 5) == 0
    127 				    || strncmp(s_lab, "#endif", 6) == 0)) {
    128 		char *s = s_lab;
    129 		if (e_lab[-1] == '\n') e_lab--;
    130 		do {
    131 		    putc(*s++, output);
    132 		} while (s < e_lab && 'a' <= *s && *s <= 'z');
    133 		while ((*s == ' ' || *s == '\t') && s < e_lab)
    134 		    s++;
    135 		if (s < e_lab)
    136 		    fprintf(output, s[0]=='/' && s[1]=='*' ? "\t%.*s" : "\t/* %.*s */",
    137 			    (int)(e_lab - s), s);
    138 	    }
    139 	    else fprintf(output, "%.*s", (int)(e_lab - s_lab), s_lab);
    140 	    cur_col = count_spaces(cur_col, s_lab);
    141 	}
    142 	else
    143 	    cur_col = 1;	/* there is no label section */
    144 
    145 	ps.pcase = false;
    146 
    147 	if (s_code != e_code) {	/* print code section, if any */
    148 	    char *p;
    149 
    150 	    if (comment_open) {
    151 		comment_open = 0;
    152 		fprintf(output, ".*/\n");
    153 	    }
    154 	    target_col = compute_code_target();
    155 	    {
    156 		int i;
    157 
    158 		for (i = 0; i < ps.p_l_follow; i++)
    159 		    if (ps.paren_indents[i] >= 0)
    160 			ps.paren_indents[i] = -(ps.paren_indents[i] + target_col);
    161 	    }
    162 	    cur_col = pad_output(cur_col, target_col);
    163 	    for (p = s_code; p < e_code; p++)
    164 		if (*p == (char) 0200)
    165 		    fprintf(output, "%d", target_col * 7);
    166 		else
    167 		    putc(*p, output);
    168 	    cur_col = count_spaces(cur_col, s_code);
    169 	}
    170 	if (s_com != e_com) {		/* print comment, if any */
    171 	    int target = ps.com_col;
    172 	    char *com_st = s_com;
    173 
    174 	    target += ps.comment_delta;
    175 	    while (*com_st == '\t')	/* consider original indentation in
    176 				     * case this is a box comment */
    177 		com_st++, target += opt.tabsize;
    178 	    while (target <= 0)
    179 		if (*com_st == ' ')
    180 		    target++, com_st++;
    181 		else if (*com_st == '\t') {
    182 		    target = opt.tabsize * (1 + (target - 1) / opt.tabsize) + 1;
    183 		    com_st++;
    184 		}
    185 		else
    186 		    target = 1;
    187 	    if (cur_col > target) {	/* if comment can't fit on this line,
    188 				     * put it on next line */
    189 		putc('\n', output);
    190 		cur_col = 1;
    191 		++ps.out_lines;
    192 	    }
    193 	    while (e_com > com_st && isspace((unsigned char)e_com[-1]))
    194 		e_com--;
    195 	    (void)pad_output(cur_col, target);
    196 	    fwrite(com_st, e_com - com_st, 1, output);
    197 	    ps.comment_delta = ps.n_comment_delta;
    198 	    ++ps.com_lines;	/* count lines with comments */
    199 	}
    200 	if (ps.use_ff)
    201 	    putc('\014', output);
    202 	else
    203 	    putc('\n', output);
    204 	++ps.out_lines;
    205 	if (ps.just_saw_decl == 1 && opt.blanklines_after_declarations) {
    206 	    prefix_blankline_requested = 1;
    207 	    ps.just_saw_decl = 0;
    208 	}
    209 	else
    210 	    prefix_blankline_requested = postfix_blankline_requested;
    211 	postfix_blankline_requested = 0;
    212     }
    213 
    214     /* keep blank lines after '//' comments */
    215     if (e_com - s_com > 1 && s_com[1] == '/')
    216 	fprintf(output, "%.*s", (int)(e_token - s_token), s_token);
    217 
    218     ps.decl_on_line = ps.in_decl;	/* if we are in the middle of a
    219 					 * declaration, remember that fact for
    220 					 * proper comment indentation */
    221     ps.ind_stmt = ps.in_stmt & ~ps.in_decl;	/* next line should be
    222 						 * indented if we have not
    223 						 * completed this stmt and if
    224 						 * we are not in the middle of
    225 						 * a declaration */
    226     ps.use_ff = false;
    227     ps.dumped_decl_indent = 0;
    228     *(e_lab = s_lab) = '\0';	/* reset buffers */
    229     *(e_code = s_code) = '\0';
    230     *(e_com = s_com = combuf + 1) = '\0';
    231     ps.ind_level = ps.i_l_follow;
    232     ps.paren_level = ps.p_l_follow;
    233     if (ps.paren_level > 0)
    234 	paren_target = -ps.paren_indents[ps.paren_level - 1];
    235     not_first_line = 1;
    236 }
    237 
    238 int
    239 compute_code_target(void)
    240 {
    241     int target_col = opt.ind_size * ps.ind_level + 1;
    242 
    243     if (ps.paren_level)
    244 	if (!opt.lineup_to_parens)
    245 	    target_col += opt.continuation_indent *
    246 		(2 * opt.continuation_indent == opt.ind_size ? 1 : ps.paren_level);
    247 	else if (opt.lineup_to_parens_always)
    248 	    target_col = paren_target;
    249 	else {
    250 	    int w;
    251 	    int t = paren_target;
    252 
    253 	    if ((w = count_spaces(t, s_code) - opt.max_col) > 0
    254 		    && count_spaces(target_col, s_code) <= opt.max_col) {
    255 		t -= w + 1;
    256 		if (t > target_col)
    257 		    target_col = t;
    258 	    }
    259 	    else
    260 		target_col = t;
    261 	}
    262     else if (ps.ind_stmt)
    263 	target_col += opt.continuation_indent;
    264     return target_col;
    265 }
    266 
    267 int
    268 compute_label_target(void)
    269 {
    270     return
    271 	ps.pcase ? (int) (case_ind * opt.ind_size) + 1
    272 	: *s_lab == '#' ? 1
    273 	: opt.ind_size * (ps.ind_level - label_offset) + 1;
    274 }
    275 
    276 
    277 /*
    278  * Copyright (C) 1976 by the Board of Trustees of the University of Illinois
    279  *
    280  * All rights reserved
    281  *
    282  *
    283  * NAME: fill_buffer
    284  *
    285  * FUNCTION: Reads one line of input into in_buffer
    286  *
    287  * HISTORY: initial coding	November 1976	D A Willcox of CAC
    288  *	    1/7/77	A Willcox of CAC	Added check for switch back to
    289  *	    partly full input buffer from temporary buffer
    290  *
    291  */
    292 void
    293 fill_buffer(void)
    294 {				/* this routine reads stuff from the input */
    295     char *p;
    296     int i;
    297     FILE *f = input;
    298 
    299     if (bp_save != NULL) {	/* there is a partly filled input buffer left */
    300 	buf_ptr = bp_save;	/* do not read anything, just switch buffers */
    301 	buf_end = be_save;
    302 	bp_save = be_save = NULL;
    303 	if (buf_ptr < buf_end)
    304 	    return;		/* only return if there is really something in
    305 				 * this buffer */
    306     }
    307     for (p = in_buffer;;) {
    308 	if (p >= in_buffer_limit) {
    309 	    int size = (in_buffer_limit - in_buffer) * 2 + 10;
    310 	    int offset = p - in_buffer;
    311 	    in_buffer = realloc(in_buffer, size);
    312 	    if (in_buffer == NULL)
    313 		errx(1, "input line too long");
    314 	    p = in_buffer + offset;
    315 	    in_buffer_limit = in_buffer + size - 2;
    316 	}
    317 	if ((i = getc(f)) == EOF) {
    318 		*p++ = ' ';
    319 		*p++ = '\n';
    320 		had_eof = true;
    321 		break;
    322 	}
    323 	if (i != '\0')
    324 	    *p++ = i;
    325 	if (i == '\n')
    326 		break;
    327     }
    328     buf_ptr = in_buffer;
    329     buf_end = p;
    330     if (p - in_buffer > 2 && p[-2] == '/' && p[-3] == '*') {
    331 	if (in_buffer[3] == 'I' && strncmp(in_buffer, "/**INDENT**", 11) == 0)
    332 	    fill_buffer();	/* flush indent error message */
    333 	else {
    334 	    int         com = 0;
    335 
    336 	    p = in_buffer;
    337 	    while (*p == ' ' || *p == '\t')
    338 		p++;
    339 	    if (*p == '/' && p[1] == '*') {
    340 		p += 2;
    341 		while (*p == ' ' || *p == '\t')
    342 		    p++;
    343 		if (p[0] == 'I' && p[1] == 'N' && p[2] == 'D' && p[3] == 'E'
    344 			&& p[4] == 'N' && p[5] == 'T') {
    345 		    p += 6;
    346 		    while (*p == ' ' || *p == '\t')
    347 			p++;
    348 		    if (*p == '*')
    349 			com = 1;
    350 		    else if (*p == 'O') {
    351 			if (*++p == 'N')
    352 			    p++, com = 1;
    353 			else if (*p == 'F' && *++p == 'F')
    354 			    p++, com = 2;
    355 		    }
    356 		    while (*p == ' ' || *p == '\t')
    357 			p++;
    358 		    if (p[0] == '*' && p[1] == '/' && p[2] == '\n' && com) {
    359 			if (s_com != e_com || s_lab != e_lab || s_code != e_code)
    360 			    dump_line();
    361 			if (!(inhibit_formatting = com - 1)) {
    362 			    n_real_blanklines = 0;
    363 			    postfix_blankline_requested = 0;
    364 			    prefix_blankline_requested = 0;
    365 			    suppress_blanklines = 1;
    366 			}
    367 		    }
    368 		}
    369 	    }
    370 	}
    371     }
    372     if (inhibit_formatting) {
    373 	p = in_buffer;
    374 	do {
    375 	    putc(*p, output);
    376 	} while (*p++ != '\n');
    377     }
    378 }
    379 
    380 /*
    381  * Copyright (C) 1976 by the Board of Trustees of the University of Illinois
    382  *
    383  * All rights reserved
    384  *
    385  *
    386  * NAME: pad_output
    387  *
    388  * FUNCTION: Writes tabs and spaces to move the current column up to the desired
    389  * position.
    390  *
    391  * ALGORITHM: Write tabs and/or blanks directly to the output stream.
    392  *
    393  * PARAMETERS: current		integer		The current column
    394  *		target		integer		The desired column
    395  *
    396  * RETURNS: Integer value of the new column.  (If current >= target, no action is
    397  * taken, and current is returned.)
    398  *
    399  * GLOBALS: None
    400  *
    401  * CALLS: putc (stdio)
    402  *
    403  * CALLED BY: dump_line
    404  *
    405  * HISTORY: initial coding	November 1976	D A Willcox of CAC
    406  *
    407  */
    408 static int
    409 pad_output(int current, int target)
    410 			        /* writes tabs and blanks (if necessary) to
    411 				 * get the current output position up to the
    412 				 * target column */
    413     /* current: the current column value */
    414     /* target: position we want it at */
    415 {
    416     int curr;			/* internal column pointer */
    417 
    418     if (current >= target)
    419 	return current;		/* line is already long enough */
    420     curr = current;
    421     if (opt.use_tabs) {
    422 	int tcur;
    423 
    424 	while ((tcur = opt.tabsize * (1 + (curr - 1) / opt.tabsize) + 1) <= target) {
    425 	    putc('\t', output);
    426 	    curr = tcur;
    427 	}
    428     }
    429     while (curr++ < target)
    430 	putc(' ', output);	/* pad with final blanks */
    431 
    432     return target;
    433 }
    434 
    435 /*
    436  * Copyright (C) 1976 by the Board of Trustees of the University of Illinois
    437  *
    438  * All rights reserved
    439  *
    440  *
    441  * NAME: count_spaces
    442  *
    443  * FUNCTION: Find out where printing of a given string will leave the current
    444  * character position on output.
    445  *
    446  * ALGORITHM: Run thru input string and add appropriate values to current
    447  * position.
    448  *
    449  * RETURNS: Integer value of position after printing "buffer" starting in column
    450  * "current".
    451  *
    452  * HISTORY: initial coding	November 1976	D A Willcox of CAC
    453  *
    454  */
    455 int
    456 count_spaces_until(int cur, char *buffer, char *end)
    457 /*
    458  * this routine figures out where the character position will be after
    459  * printing the text in buffer starting at column "current"
    460  */
    461 {
    462     char *buf;		/* used to look thru buffer */
    463 
    464     for (buf = buffer; *buf != '\0' && buf != end; ++buf) {
    465 	switch (*buf) {
    466 
    467 	case '\n':
    468 	case 014:		/* form feed */
    469 	    cur = 1;
    470 	    break;
    471 
    472 	case '\t':
    473 	    cur = opt.tabsize * (1 + (cur - 1) / opt.tabsize) + 1;
    474 	    break;
    475 
    476 	case 010:		/* backspace */
    477 	    --cur;
    478 	    break;
    479 
    480 	default:
    481 	    ++cur;
    482 	    break;
    483 	}			/* end of switch */
    484     }				/* end of for loop */
    485     return cur;
    486 }
    487 
/*
 * Column reached after printing the whole NUL-terminated `buffer',
 * starting at column `cur'.
 */
int
count_spaces(int cur, char *buffer)
{
    /* a NULL end pointer never equals the scan pointer, so only the
     * terminating NUL stops the scan */
    char *const no_end = NULL;

    return count_spaces_until(cur, buffer, no_end);
}
    493 
    494 void
    495 diag(int level, const char *msg, ...)
    496 {
    497     va_list ap;
    498     const char *s, *e;
    499 
    500     if (level)
    501 	found_err = 1;
    502 
    503     if (output == stdout) {
    504 	s = "/**INDENT** ";
    505 	e = " */";
    506     } else {
    507 	s = e = "";
    508     }
    509 
    510     va_start(ap, msg);
    511     fprintf(stderr, "%s%s@%d: ", s, level == 0 ? "Warning" : "Error", line_no);
    512     vfprintf(stderr, msg, ap);
    513     fprintf(stderr, "%s\n", e);
    514     va_end(ap);
    515 }
    516