pr_comment.c revision 1.157 1 /* $NetBSD: pr_comment.c,v 1.157 2023/06/09 07:18:52 rillig Exp $ */
2
3 /*-
4 * SPDX-License-Identifier: BSD-4-Clause
5 *
6 * Copyright (c) 1985 Sun Microsystems, Inc.
7 * Copyright (c) 1980, 1993
8 * The Regents of the University of California. All rights reserved.
9 * All rights reserved.
10 *
11 * Redistribution and use in source and binary forms, with or without
12 * modification, are permitted provided that the following conditions
13 * are met:
14 * 1. Redistributions of source code must retain the above copyright
15 * notice, this list of conditions and the following disclaimer.
16 * 2. Redistributions in binary form must reproduce the above copyright
17 * notice, this list of conditions and the following disclaimer in the
18 * documentation and/or other materials provided with the distribution.
19 * 3. All advertising materials mentioning features or use of this software
20 * must display the following acknowledgement:
21 * This product includes software developed by the University of
22 * California, Berkeley and its contributors.
23 * 4. Neither the name of the University nor the names of its contributors
24 * may be used to endorse or promote products derived from this software
25 * without specific prior written permission.
26 *
27 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
28 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
29 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
30 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
31 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
32 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
33 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
34 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
35 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
36 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
37 * SUCH DAMAGE.
38 */
39
40 #include <sys/cdefs.h>
41 __RCSID("$NetBSD: pr_comment.c,v 1.157 2023/06/09 07:18:52 rillig Exp $");
42
43 #include <string.h>
44
45 #include "indent.h"
46
47 static void
48 com_add_char(char ch)
49 {
50 buf_add_char(&com, ch);
51 }
52
53 static void
54 com_add_delim(void)
55 {
56 if (opt.star_comment_cont)
57 buf_add_chars(&com, " * ", 3);
58 }
59
60 static bool
61 fits_in_one_line(int com_ind, int max_line_length)
62 {
63 for (const char *start = inp_p, *p = start; *p != '\n'; p++) {
64 if (p[0] == '*' && p[1] == '/') {
65 while (p - inp_p >= 2
66 && ch_isblank(p[-1])
67 && ch_isblank(p[-2]))
68 p--;
69 int len = ind_add(com_ind + 3,
70 start, (size_t)(p - start));
71 len += p == start || ch_isblank(p[-1]) ? 2 : 3;
72 return len <= max_line_length;
73 }
74 }
75 return false;
76 }
77
78 static void
79 analyze_comment(bool *p_may_wrap, bool *p_delim,
80 int *p_ind, int *p_line_length)
81 {
82 bool may_wrap = true;
83 bool delim = false;
84 int ind;
85 int line_length = opt.max_line_length;
86
87 if (ps.curr_col_1 && !opt.format_col1_comments) {
88 may_wrap = false;
89 ind = 0;
90 } else {
91 if (inp_p[0] == '-' || inp_p[0] == '*' ||
92 token.s[token.len - 1] == '/' ||
93 (inp_p[0] == '\n' && !opt.format_block_comments))
94 may_wrap = false;
95 if (code.len == 0 && inp_p[strspn(inp_p, "*")] == '\n')
96 out.line_kind = lk_block_comment;
97
98 if (com.len > 0)
99 output_line();
100 if (lab.len == 0 && code.len == 0) {
101 ind = (ps.ind_level - opt.unindent_displace)
102 * opt.indent_size;
103 if (ind <= 0)
104 ind = opt.format_col1_comments ? 0 : 1;
105 line_length = opt.block_comment_max_line_length;
106 if (may_wrap && inp_p[0] == '\n')
107 delim = true;
108 if (may_wrap && opt.comment_delimiter_on_blankline)
109 delim = true;
110 } else {
111 int target_ind = code.len > 0
112 ? ind_add(compute_code_indent(), code.s, code.len)
113 : ind_add(compute_label_indent(), lab.s, lab.len);
114
115 ind = ps.decl_on_line || ps.ind_level == 0
116 ? opt.decl_comment_column - 1
117 : opt.comment_column - 1;
118 if (ind <= target_ind)
119 ind = next_tab(target_ind);
120 if (ind + 25 > line_length)
121 line_length = ind + 25;
122 }
123 }
124
125 ps.com_ind = ind;
126
127 if (!may_wrap) {
128 /* Find out how much indentation there was originally, because
129 * that much will have to be ignored by output_line. */
130 size_t len = (size_t)(inp_p - 2 - inp.s);
131 ps.n_comment_delta = -ind_add(0, inp.s, len);
132 } else {
133 ps.n_comment_delta = 0;
134 if (!(inp_p[0] == '\t' && !ch_isblank(inp_p[1])))
135 while (ch_isblank(inp_p[0]))
136 inp_p++;
137 }
138
139 *p_may_wrap = may_wrap;
140 *p_delim = delim;
141 *p_ind = ind;
142 *p_line_length = line_length;
143 }
144
145 static void
146 copy_comment_start(bool may_wrap, bool *delim, int ind, int line_length)
147 {
148 ps.comment_delta = 0;
149 com_add_char('/');
150 com_add_char(token.s[token.len - 1]); /* either '*' or '/' */
151
152 if (may_wrap) {
153 if (!ch_isblank(inp_p[0]))
154 com_add_char(' ');
155
156 if (*delim && fits_in_one_line(ind, line_length))
157 *delim = false;
158 if (*delim) {
159 output_line();
160 com_add_delim();
161 }
162 }
163 }
164
165 static void
166 copy_comment_wrap_text(int line_length, ssize_t *last_blank)
167 {
168 int now_len = ind_add(ps.com_ind, com.s, com.len);
169 for (;;) {
170 char ch = inp_next();
171 if (ch_isblank(ch))
172 *last_blank = (ssize_t)com.len;
173 com_add_char(ch);
174 now_len++;
175 if (memchr("*\n\r\b\t", inp_p[0], 6) != NULL)
176 break;
177 if (now_len >= line_length && *last_blank != -1)
178 break;
179 }
180
181 ps.next_col_1 = false;
182
183 if (now_len <= line_length)
184 return;
185 if (ch_isspace(com.s[com.len - 1]))
186 return;
187
188 if (*last_blank == -1) {
189 /* only a single word in this line */
190 output_line();
191 com_add_delim();
192 return;
193 }
194
195 const char *last_word_s = com.s + *last_blank + 1;
196 size_t last_word_len = com.len - (size_t)(*last_blank + 1);
197 com.len = (size_t)*last_blank;
198 output_line();
199 com_add_delim();
200
201 /* Assume that output_line and com_add_delim don't
202 * invalidate the "unused" part of the buffer beyond
203 * com.s + com.len. */
204 memmove(com.s + com.len, last_word_s, last_word_len);
205 com.len += last_word_len;
206 *last_blank = -1;
207 }
208
209 static bool
210 copy_comment_wrap_newline(ssize_t *last_blank)
211 {
212 *last_blank = -1;
213 if (ps.next_col_1) {
214 if (com.len == 0)
215 com_add_char(' '); /* force empty output line */
216 if (com.len > 3) {
217 output_line();
218 com_add_delim();
219 }
220 output_line();
221 com_add_delim();
222 } else {
223 ps.next_col_1 = true;
224 if (!(com.len > 0 && ch_isblank(com.s[com.len - 1])))
225 com_add_char(' ');
226 *last_blank = (int)com.len - 1;
227 }
228 ++line_no;
229
230 /* flush any blanks and/or tabs at start of next line */
231 inp_skip(); /* '\n' */
232 while (ch_isblank(inp_p[0]))
233 inp_p++;
234 if (inp_p[0] == '*' && inp_p[1] == '/')
235 return false;
236 if (inp_p[0] == '*') {
237 inp_p++;
238 while (ch_isblank(inp_p[0]))
239 inp_p++;
240 }
241
242 return true;
243 }
244
245 static void
246 copy_comment_wrap_finish(int line_length, bool delim)
247 {
248 if (delim) {
249 if (com.len > 3)
250 output_line();
251 else
252 com.len = 0;
253 com_add_char(' ');
254 } else {
255 size_t len = com.len;
256 while (ch_isblank(com.s[len - 1]))
257 len--;
258 int end_ind = ind_add(ps.com_ind, com.s, len);
259 if (end_ind + 3 > line_length)
260 output_line();
261 }
262
263 while (com.len >= 2
264 && ch_isblank(com.s[com.len - 1])
265 && ch_isblank(com.s[com.len - 2]))
266 com.len--;
267
268 inp_p += 2;
269 if (com.len > 0 && ch_isblank(com.s[com.len - 1]))
270 buf_add_chars(&com, "*/", 2);
271 else
272 buf_add_chars(&com, " */", 3);
273 }
274
275 /*
276 * Copy characters from 'inp' to 'com'. Try to keep comments from going over
277 * the maximum line length. To do that, remember where the last blank, tab, or
278 * newline was. When a line is filled, print up to the last blank and continue
279 * copying.
280 */
281 static void
282 copy_comment_wrap(int line_length, bool delim)
283 {
284 ssize_t last_blank = -1; /* index of the last blank in 'com' */
285
286 for (;;) {
287 if (inp_p[0] == '\n') {
288 if (had_eof)
289 goto unterminated_comment;
290 if (!copy_comment_wrap_newline(&last_blank))
291 goto end_of_comment;
292 } else if (inp_p[0] == '*' && inp_p[1] == '/')
293 goto end_of_comment;
294 else
295 copy_comment_wrap_text(line_length, &last_blank);
296 }
297
298 end_of_comment:
299 copy_comment_wrap_finish(line_length, delim);
300 return;
301
302 unterminated_comment:
303 diag(1, "Unterminated comment");
304 output_line();
305 }
306
307 static void
308 copy_comment_nowrap(void)
309 {
310 char kind = token.s[token.len - 1];
311
312 for (;;) {
313 if (inp_p[0] == '\n') {
314 if (kind == '/')
315 return;
316
317 if (had_eof) {
318 diag(1, "Unterminated comment");
319 output_line();
320 return;
321 }
322
323 if (com.len == 0)
324 com_add_char(' '); /* force output of an
325 * empty line */
326 output_line();
327 ++line_no;
328 inp_skip();
329 continue;
330 }
331
332 com_add_char(*inp_p++);
333 if (com.len >= 2
334 && com.s[com.len - 2] == '*'
335 && com.s[com.len - 1] == '/'
336 && kind == '*')
337 return;
338 }
339 }
340
/*
 * Scan, reformat and output a single comment, which is either a block
 * comment starting with '/' '*' or an end-of-line comment starting with '//'.
 *
 * The layout is determined first, then the opening delimiter is copied, and
 * finally the comment text is copied either with or without re-wrapping.
 */
void
process_comment(void)
{
	bool may_wrap, delim;
	int ind, line_length;

	analyze_comment(&may_wrap, &delim, &ind, &line_length);
	copy_comment_start(may_wrap, &delim, ind, line_length);

	if (!may_wrap) {
		copy_comment_nowrap();
		return;
	}
	copy_comment_wrap(line_length, delim);
}
358