fold.c revision 1.16 1 1.16 ahoka /* $NetBSD: fold.c,v 1.16 2009/07/21 01:35:02 ahoka Exp $ */
2 1.6 jtc
3 1.1 cgd /*-
4 1.6 jtc * Copyright (c) 1990, 1993
5 1.6 jtc * The Regents of the University of California. All rights reserved.
6 1.1 cgd *
7 1.1 cgd * This code is derived from software contributed to Berkeley by
8 1.1 cgd * Kevin Ruddy.
9 1.1 cgd *
10 1.1 cgd * Redistribution and use in source and binary forms, with or without
11 1.1 cgd * modification, are permitted provided that the following conditions
12 1.1 cgd * are met:
13 1.1 cgd * 1. Redistributions of source code must retain the above copyright
14 1.1 cgd * notice, this list of conditions and the following disclaimer.
15 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
16 1.1 cgd * notice, this list of conditions and the following disclaimer in the
17 1.1 cgd * documentation and/or other materials provided with the distribution.
18 1.12 agc * 3. Neither the name of the University nor the names of its contributors
19 1.1 cgd * may be used to endorse or promote products derived from this software
20 1.1 cgd * without specific prior written permission.
21 1.1 cgd *
22 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 1.1 cgd * SUCH DAMAGE.
33 1.1 cgd */
34 1.1 cgd
35 1.7 lukem #include <sys/cdefs.h>
36 1.1 cgd #ifndef lint
37 1.14 lukem __COPYRIGHT("@(#) Copyright (c) 1990, 1993\
38 1.14 lukem The Regents of the University of California. All rights reserved.");
39 1.1 cgd #endif /* not lint */
40 1.1 cgd
41 1.1 cgd #ifndef lint
42 1.6 jtc #if 0
43 1.6 jtc static char sccsid[] = "@(#)fold.c 8.1 (Berkeley) 6/6/93";
44 1.6 jtc #endif
45 1.16 ahoka __RCSID("$NetBSD: fold.c,v 1.16 2009/07/21 01:35:02 ahoka Exp $");
46 1.1 cgd #endif /* not lint */
47 1.1 cgd
48 1.16 ahoka #include <limits.h>
49 1.16 ahoka #include <locale.h>
50 1.1 cgd #include <stdio.h>
51 1.2 jtc #include <stdlib.h>
52 1.5 jtc #include <unistd.h>
53 1.16 ahoka #include <wchar.h>
54 1.4 jtc #include <err.h>
55 1.1 cgd
/* Line width main() falls back to when no width option was given. */
56 1.1 cgd #define DEFLINEWIDTH 80
57 1.1 cgd
58 1.11 mjl int main(int, char **);
59 1.11 mjl static void fold(int);
60 1.16 ahoka static int new_column_position(int, wint_t);
61 1.10 mjl static void usage(void);
62 1.7 lukem
/* Set by -b: new_column_position() counts bytes instead of columns. */
static int count_bytes = 0;
/* Set by -s: fold() breaks lines at the last space where possible. */
static int split_words = 0;
65 1.2 jtc
66 1.2 jtc int
67 1.11 mjl main(int argc, char **argv)
68 1.1 cgd {
69 1.7 lukem int ch;
70 1.1 cgd int width;
71 1.1 cgd char *p;
72 1.1 cgd
73 1.16 ahoka setlocale(LC_CTYPE, "");
74 1.16 ahoka setprogname(argv[0]);
75 1.16 ahoka
76 1.1 cgd width = -1;
77 1.4 jtc while ((ch = getopt(argc, argv, "0123456789bsw:")) != -1)
78 1.1 cgd switch (ch) {
79 1.2 jtc case 'b':
80 1.2 jtc count_bytes = 1;
81 1.2 jtc break;
82 1.2 jtc case 's':
83 1.2 jtc split_words = 1;
84 1.2 jtc break;
85 1.1 cgd case 'w':
86 1.10 mjl if ((width = atoi(optarg)) <= 0)
87 1.10 mjl errx(1, "illegal width value");
88 1.1 cgd break;
89 1.1 cgd case '0': case '1': case '2': case '3': case '4':
90 1.1 cgd case '5': case '6': case '7': case '8': case '9':
91 1.1 cgd if (width == -1) {
92 1.1 cgd p = argv[optind - 1];
93 1.1 cgd if (p[0] == '-' && p[1] == ch && !p[2])
94 1.1 cgd width = atoi(++p);
95 1.1 cgd else
96 1.1 cgd width = atoi(argv[optind] + 1);
97 1.1 cgd }
98 1.1 cgd break;
99 1.1 cgd default:
100 1.10 mjl usage();
101 1.1 cgd }
102 1.1 cgd argv += optind;
103 1.1 cgd argc -= optind;
104 1.1 cgd
105 1.1 cgd if (width == -1)
106 1.1 cgd width = DEFLINEWIDTH;
107 1.2 jtc
108 1.1 cgd if (!*argv)
109 1.1 cgd fold(width);
110 1.1 cgd else for (; *argv; ++argv)
111 1.1 cgd if (!freopen(*argv, "r", stdin)) {
112 1.4 jtc err (1, "%s", *argv);
113 1.4 jtc /* NOTREACHED */
114 1.1 cgd } else
115 1.1 cgd fold(width);
116 1.1 cgd exit(0);
117 1.1 cgd }
118 1.1 cgd
119 1.2 jtc /*
120 1.2 jtc * Fold the contents of standard input to fit within WIDTH columns
121 1.2 jtc * (or bytes) and write to standard output.
122 1.2 jtc *
123 1.2 jtc * If split_words is set, split the line at the last space character
124 1.2 jtc * on the line. This flag necessitates storing the line in a buffer
125 1.2 jtc * until the current column > width, or a newline or EOF is read.
126 1.2 jtc *
127 1.2 jtc * The buffer can grow larger than WIDTH due to backspaces and carriage
128 1.2 jtc * returns embedded in the input stream.
129 1.2 jtc */
130 1.2 jtc static void
131 1.11 mjl fold(int width)
132 1.1 cgd {
133 1.16 ahoka static wchar_t *buf = NULL;
134 1.16 ahoka wchar_t *nbuf;
135 1.2 jtc static int buf_max = 0;
136 1.16 ahoka wint_t ch;
137 1.16 ahoka int col, indx, i;
138 1.2 jtc
139 1.2 jtc col = indx = 0;
140 1.16 ahoka while ((ch = getwchar()) != WEOF) {
141 1.16 ahoka if (ch == L'\n') {
142 1.16 ahoka if (indx != 0) {
143 1.16 ahoka for (i = 0; i < indx; i++)
144 1.16 ahoka putwchar(buf[i]);
145 1.16 ahoka }
146 1.16 ahoka putwchar(L'\n');
147 1.2 jtc col = indx = 0;
148 1.2 jtc continue;
149 1.2 jtc }
150 1.2 jtc
151 1.2 jtc col = new_column_position (col, ch);
152 1.2 jtc if (col > width) {
153 1.16 ahoka int last_space;
154 1.2 jtc
155 1.8 mrg #ifdef __GNUC__
156 1.8 mrg last_space = 0; /* XXX gcc */
157 1.8 mrg #endif
158 1.2 jtc if (split_words) {
159 1.2 jtc for (i = 0, last_space = -1; i < indx; i++)
160 1.16 ahoka if (buf[i] == L' ')
161 1.8 mrg last_space = i;
162 1.2 jtc }
163 1.1 cgd
164 1.2 jtc if (split_words && last_space != -1) {
165 1.16 ahoka for (i = 0; i < last_space; i++)
166 1.16 ahoka putwchar(buf[i]);
167 1.15 ahoka
168 1.15 ahoka /* increase last_space here, so we skip trailing whitespace */
169 1.2 jtc last_space++;
170 1.16 ahoka wmemmove (buf, buf+last_space, indx-last_space);
171 1.2 jtc
172 1.2 jtc indx -= last_space;
173 1.2 jtc col = 0;
174 1.2 jtc for (i = 0; i < indx; i++) {
175 1.9 frueauf col = new_column_position (col, buf[i]);
176 1.2 jtc }
177 1.2 jtc } else {
178 1.16 ahoka for (i = 0; i < indx; i++)
179 1.16 ahoka putwchar(buf[i]);
180 1.2 jtc col = indx = 0;
181 1.2 jtc }
182 1.16 ahoka putwchar('\n');
183 1.2 jtc
184 1.2 jtc /* calculate the column position for the next line. */
185 1.2 jtc col = new_column_position (col, ch);
186 1.1 cgd }
187 1.1 cgd
188 1.2 jtc if (indx + 1 > buf_max) {
189 1.2 jtc /* Allocate buffer in LINE_MAX increments */
190 1.13 itojun if ((nbuf = realloc (buf, buf_max + 2048)) == NULL) {
191 1.7 lukem err (1, "realloc");
192 1.4 jtc /* NOTREACHED */
193 1.2 jtc }
194 1.13 itojun buf = nbuf;
195 1.13 itojun buf_max += 2048;
196 1.1 cgd }
197 1.2 jtc buf[indx++] = ch;
198 1.2 jtc }
199 1.2 jtc
200 1.16 ahoka if (indx != 0) {
201 1.16 ahoka for (i = 0; i < indx; i++)
202 1.16 ahoka putwchar(buf[i]);
203 1.16 ahoka }
204 1.2 jtc }
205 1.1 cgd
206 1.2 jtc /*
207 1.2 jtc * calculate the column position
208 1.2 jtc */
209 1.2 jtc static int
210 1.16 ahoka new_column_position (int col, wint_t ch)
211 1.2 jtc {
212 1.16 ahoka int w;
213 1.16 ahoka
214 1.2 jtc if (!count_bytes) {
215 1.1 cgd switch (ch) {
216 1.16 ahoka case L'\b':
217 1.1 cgd if (col > 0)
218 1.1 cgd --col;
219 1.1 cgd break;
220 1.16 ahoka case L'\r':
221 1.1 cgd col = 0;
222 1.1 cgd break;
223 1.16 ahoka case L'\t':
224 1.2 jtc col = (col + 8) & ~7;
225 1.1 cgd break;
226 1.1 cgd default:
227 1.16 ahoka w = wcwidth(ch);
228 1.16 ahoka if (w > 0)
229 1.16 ahoka col += w;
230 1.1 cgd break;
231 1.1 cgd }
232 1.2 jtc } else {
233 1.16 ahoka char dummy[MB_LEN_MAX];
234 1.16 ahoka
235 1.16 ahoka /* XXX: we assume stateless encoding */
236 1.16 ahoka col += wcrtomb(dummy, ch, NULL);
237 1.1 cgd }
238 1.2 jtc
239 1.2 jtc return col;
240 1.1 cgd }
241 1.10 mjl
/*
 * Write the command synopsis to standard error and exit with status 1.
 */
static void
usage(void)
{
	const char *progname = getprogname();

	(void)fprintf(stderr, "usage: %s [-bs] [-w width] [file ...]\n",
	    progname);
	exit(1);
}
249 1.10 mjl
250