process.c revision 1.52 1 1.52 christos /* $NetBSD: process.c,v 1.52 2015/03/12 12:40:41 christos Exp $ */
2 1.18 tls
3 1.1 alm /*-
4 1.40 christos * Copyright (c) 1992 Diomidis Spinellis.
5 1.19 mrg * Copyright (c) 1992, 1993, 1994
6 1.8 cgd * The Regents of the University of California. All rights reserved.
7 1.1 alm *
8 1.1 alm * This code is derived from software contributed to Berkeley by
9 1.1 alm * Diomidis Spinellis of Imperial College, University of London.
10 1.1 alm *
11 1.1 alm * Redistribution and use in source and binary forms, with or without
12 1.1 alm * modification, are permitted provided that the following conditions
13 1.1 alm * are met:
14 1.1 alm * 1. Redistributions of source code must retain the above copyright
15 1.1 alm * notice, this list of conditions and the following disclaimer.
16 1.1 alm * 2. Redistributions in binary form must reproduce the above copyright
17 1.1 alm * notice, this list of conditions and the following disclaimer in the
18 1.1 alm * documentation and/or other materials provided with the distribution.
19 1.33 agc * 3. Neither the name of the University nor the names of its contributors
20 1.33 agc * may be used to endorse or promote products derived from this software
21 1.33 agc * without specific prior written permission.
22 1.33 agc *
23 1.33 agc * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24 1.33 agc * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 1.33 agc * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 1.33 agc * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27 1.33 agc * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 1.33 agc * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 1.33 agc * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 1.33 agc * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 1.33 agc * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 1.33 agc * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 1.33 agc * SUCH DAMAGE.
34 1.33 agc */
35 1.33 agc
36 1.37 gdamore #if HAVE_NBTOOL_CONFIG_H
37 1.37 gdamore #include "nbtool_config.h"
38 1.37 gdamore #endif
39 1.37 gdamore
40 1.20 lukem #include <sys/cdefs.h>
41 1.52 christos __RCSID("$NetBSD: process.c,v 1.52 2015/03/12 12:40:41 christos Exp $");
42 1.40 christos #ifdef __FBSDID
43 1.40 christos __FBSDID("$FreeBSD: head/usr.bin/sed/process.c 192732 2009-05-25 06:45:33Z brian $");
44 1.40 christos #endif
45 1.40 christos
46 1.45 christos #if 0
47 1.45 christos static const char sccsid[] = "@(#)process.c 8.6 (Berkeley) 4/20/94";
48 1.45 christos #endif
49 1.45 christos
50 1.1 alm #include <sys/types.h>
51 1.1 alm #include <sys/stat.h>
52 1.1 alm #include <sys/ioctl.h>
53 1.1 alm #include <sys/uio.h>
54 1.1 alm
55 1.1 alm #include <ctype.h>
56 1.40 christos #include <err.h>
57 1.1 alm #include <errno.h>
58 1.1 alm #include <fcntl.h>
59 1.1 alm #include <limits.h>
60 1.1 alm #include <regex.h>
61 1.1 alm #include <stdio.h>
62 1.1 alm #include <stdlib.h>
63 1.1 alm #include <string.h>
64 1.1 alm #include <unistd.h>
65 1.40 christos #include <wchar.h>
66 1.40 christos #include <wctype.h>
67 1.1 alm
68 1.1 alm #include "defs.h"
69 1.1 alm #include "extern.h"
70 1.1 alm
71 1.40 christos static SPACE HS, PS, SS, YS;
72 1.1 alm #define pd PS.deleted
73 1.1 alm #define ps PS.space
74 1.1 alm #define psl PS.len
75 1.1 alm #define hs HS.space
76 1.1 alm #define hsl HS.len
77 1.1 alm
78 1.40 christos static __inline int applies(struct s_command *);
79 1.40 christos static void do_tr(struct s_tr *);
80 1.32 wiz static void flush_appends(void);
81 1.40 christos static void lputs(char *, size_t);
82 1.40 christos static __inline int regexec_e(regex_t *, const char *, int, int, size_t);
83 1.32 wiz static void regsub(SPACE *, char *, char *);
84 1.32 wiz static int substitute(struct s_command *);
85 1.1 alm
86 1.52 christos struct s_appends *appends; /* Array of pointers to strings to append. */
87 1.40 christos static size_t appendx; /* Index into appends array. */
88 1.40 christos size_t appendnum; /* Size of appends array. */
89 1.1 alm
90 1.1 alm static int lastaddr; /* Set by applies if last address of a range. */
91 1.1 alm static int sdone; /* If any substitutes since last line input. */
92 1.1 alm /* Iov structure for 'w' commands. */
93 1.1 alm static regex_t *defpreg;
94 1.1 alm size_t maxnsub;
95 1.52 christos regmatch_t *match;
96 1.1 alm
97 1.40 christos #define OUT() do {fwrite(ps, 1, psl, outfile); fputc('\n', outfile);} while (0)
98 1.8 cgd
99 1.52 christos void
100 1.32 wiz process(void)
101 1.1 alm {
102 1.1 alm struct s_command *cp;
103 1.1 alm SPACE tspace;
104 1.40 christos size_t oldpsl = 0;
105 1.15 mycroft char *p;
106 1.1 alm
107 1.40 christos p = NULL;
108 1.40 christos
109 1.1 alm for (linenum = 0; mf_fgets(&PS, REPLACE);) {
110 1.1 alm pd = 0;
111 1.16 mycroft top:
112 1.1 alm cp = prog;
113 1.1 alm redirect:
114 1.1 alm while (cp != NULL) {
115 1.1 alm if (!applies(cp)) {
116 1.1 alm cp = cp->next;
117 1.1 alm continue;
118 1.1 alm }
119 1.1 alm switch (cp->code) {
120 1.1 alm case '{':
121 1.1 alm cp = cp->u.c;
122 1.1 alm goto redirect;
123 1.1 alm case 'a':
124 1.40 christos if (appendx >= appendnum)
125 1.1 alm appends = xrealloc(appends,
126 1.1 alm sizeof(struct s_appends) *
127 1.40 christos (appendnum *= 2));
128 1.1 alm appends[appendx].type = AP_STRING;
129 1.1 alm appends[appendx].s = cp->t;
130 1.8 cgd appends[appendx].len = strlen(cp->t);
131 1.1 alm appendx++;
132 1.1 alm break;
133 1.1 alm case 'b':
134 1.1 alm cp = cp->u.c;
135 1.1 alm goto redirect;
136 1.1 alm case 'c':
137 1.1 alm pd = 1;
138 1.1 alm psl = 0;
139 1.40 christos if (cp->a2 == NULL || lastaddr || lastline())
140 1.40 christos (void)fprintf(outfile, "%s", cp->t);
141 1.39 uwe goto new;
142 1.1 alm case 'd':
143 1.1 alm pd = 1;
144 1.1 alm goto new;
145 1.1 alm case 'D':
146 1.1 alm if (pd)
147 1.1 alm goto new;
148 1.40 christos if (psl == 0 ||
149 1.40 christos (p = memchr(ps, '\n', psl - 1)) == NULL) {
150 1.1 alm pd = 1;
151 1.16 mycroft goto new;
152 1.28 atatat } else {
153 1.40 christos psl -= (size_t)((p + 1) - ps);
154 1.1 alm memmove(ps, p + 1, psl);
155 1.28 atatat goto top;
156 1.1 alm }
157 1.1 alm case 'g':
158 1.1 alm cspace(&PS, hs, hsl, REPLACE);
159 1.1 alm break;
160 1.1 alm case 'G':
161 1.43 christos cspace(&PS, "\n", 1, APPEND);
162 1.40 christos cspace(&PS, hs, hsl, APPEND);
163 1.1 alm break;
164 1.1 alm case 'h':
165 1.1 alm cspace(&HS, ps, psl, REPLACE);
166 1.1 alm break;
167 1.1 alm case 'H':
168 1.40 christos cspace(&HS, "\n", 1, APPEND);
169 1.40 christos cspace(&HS, ps, psl, APPEND);
170 1.1 alm break;
171 1.1 alm case 'i':
172 1.40 christos (void)fprintf(outfile, "%s", cp->t);
173 1.1 alm break;
174 1.1 alm case 'l':
175 1.40 christos lputs(ps, psl);
176 1.1 alm break;
177 1.1 alm case 'n':
178 1.1 alm if (!nflag && !pd)
179 1.40 christos OUT();
180 1.1 alm flush_appends();
181 1.14 mycroft if (!mf_fgets(&PS, REPLACE))
182 1.1 alm exit(0);
183 1.1 alm pd = 0;
184 1.1 alm break;
185 1.1 alm case 'N':
186 1.1 alm flush_appends();
187 1.40 christos cspace(&PS, "\n", 1, APPEND);
188 1.40 christos if (!mf_fgets(&PS, APPEND))
189 1.1 alm exit(0);
190 1.1 alm break;
191 1.1 alm case 'p':
192 1.1 alm if (pd)
193 1.1 alm break;
194 1.40 christos OUT();
195 1.1 alm break;
196 1.1 alm case 'P':
197 1.1 alm if (pd)
198 1.1 alm break;
199 1.15 mycroft if ((p = memchr(ps, '\n', psl - 1)) != NULL) {
200 1.15 mycroft oldpsl = psl;
201 1.40 christos psl = (size_t)(p - ps);
202 1.1 alm }
203 1.40 christos OUT();
204 1.1 alm if (p != NULL)
205 1.15 mycroft psl = oldpsl;
206 1.1 alm break;
207 1.1 alm case 'q':
208 1.1 alm if (!nflag && !pd)
209 1.40 christos OUT();
210 1.1 alm flush_appends();
211 1.1 alm exit(0);
212 1.1 alm case 'r':
213 1.40 christos if (appendx >= appendnum)
214 1.1 alm appends = xrealloc(appends,
215 1.1 alm sizeof(struct s_appends) *
216 1.40 christos (appendnum *= 2));
217 1.1 alm appends[appendx].type = AP_FILE;
218 1.1 alm appends[appendx].s = cp->t;
219 1.8 cgd appends[appendx].len = strlen(cp->t);
220 1.1 alm appendx++;
221 1.1 alm break;
222 1.1 alm case 's':
223 1.1 alm sdone |= substitute(cp);
224 1.1 alm break;
225 1.1 alm case 't':
226 1.1 alm if (sdone) {
227 1.1 alm sdone = 0;
228 1.1 alm cp = cp->u.c;
229 1.1 alm goto redirect;
230 1.1 alm }
231 1.1 alm break;
232 1.1 alm case 'w':
233 1.1 alm if (pd)
234 1.1 alm break;
235 1.1 alm if (cp->u.fd == -1 && (cp->u.fd = open(cp->t,
236 1.1 alm O_WRONLY|O_APPEND|O_CREAT|O_TRUNC,
237 1.1 alm DEFFILEMODE)) == -1)
238 1.40 christos err(1, "%s", cp->t);
239 1.40 christos if (write(cp->u.fd, ps, psl) != (ssize_t)psl ||
240 1.40 christos write(cp->u.fd, "\n", 1) != 1)
241 1.40 christos err(1, "%s", cp->t);
242 1.1 alm break;
243 1.1 alm case 'x':
244 1.40 christos /*
245 1.40 christos * If the hold space is null, make it empty
246 1.40 christos * but not null. Otherwise the pattern space
247 1.40 christos * will become null after the swap, which is
248 1.40 christos * an abnormal condition.
249 1.40 christos */
250 1.8 cgd if (hs == NULL)
251 1.40 christos cspace(&HS, "", 0, REPLACE);
252 1.1 alm tspace = PS;
253 1.1 alm PS = HS;
254 1.1 alm HS = tspace;
255 1.1 alm break;
256 1.1 alm case 'y':
257 1.40 christos if (pd || psl == 0)
258 1.1 alm break;
259 1.40 christos do_tr(cp->u.y);
260 1.1 alm break;
261 1.1 alm case ':':
262 1.1 alm case '}':
263 1.1 alm break;
264 1.1 alm case '=':
265 1.40 christos (void)fprintf(outfile, "%lu\n", linenum);
266 1.1 alm }
267 1.1 alm cp = cp->next;
268 1.1 alm } /* for all cp */
269 1.1 alm
270 1.1 alm new: if (!nflag && !pd)
271 1.40 christos OUT();
272 1.1 alm flush_appends();
273 1.1 alm } /* for all lines */
274 1.1 alm }
275 1.1 alm
/*
 * Evaluate one address against the current program state: a regular
 * expression address is matched against the pattern space, a line address
 * is compared with linenum, and any other address type is answered by
 * lastline().
 */
#define	MATCH(a)							\
	((a)->type == AT_RE						\
	    ? regexec_e((a)->u.r, ps, 0, 1, psl)			\
	    : ((a)->type == AT_LINE					\
		? linenum == (a)->u.l					\
		: lastline()))
284 1.1 alm /*
285 1.40 christos * Return TRUE if the command applies to the current line. Sets the start
286 1.40 christos * line for process ranges. Interprets the non-select (``!'') flag.
287 1.1 alm */
288 1.40 christos static __inline int
289 1.32 wiz applies(struct s_command *cp)
290 1.1 alm {
291 1.1 alm int r;
292 1.1 alm
293 1.1 alm lastaddr = 0;
294 1.1 alm if (cp->a1 == NULL && cp->a2 == NULL)
295 1.1 alm r = 1;
296 1.40 christos else if (cp->a2)
297 1.40 christos if (cp->startline > 0) {
298 1.46 christos switch (cp->a2->type) {
299 1.46 christos case AT_RELLINE:
300 1.46 christos if (linenum - cp->startline <= cp->a2->u.l)
301 1.46 christos r = 1;
302 1.46 christos else {
303 1.46 christos cp->startline = 0;
304 1.46 christos r = 0;
305 1.46 christos }
306 1.46 christos break;
307 1.46 christos default:
308 1.46 christos if (MATCH(cp->a2)) {
309 1.46 christos cp->startline = 0;
310 1.46 christos lastaddr = 1;
311 1.46 christos r = 1;
312 1.46 christos } else if (cp->a2->type == AT_LINE &&
313 1.46 christos linenum > cp->a2->u.l) {
314 1.46 christos /*
315 1.46 christos * We missed the 2nd address due to a
316 1.46 christos * branch, so just close the range and
317 1.46 christos * return false.
318 1.46 christos */
319 1.46 christos cp->startline = 0;
320 1.46 christos r = 0;
321 1.46 christos } else
322 1.46 christos r = 1;
323 1.46 christos }
324 1.36 christos } else if (cp->a1 && MATCH(cp->a1)) {
325 1.1 alm /*
326 1.1 alm * If the second address is a number less than or
327 1.1 alm * equal to the line number first selected, only
328 1.1 alm * one line shall be selected.
329 1.1 alm * -- POSIX 1003.2
330 1.40 christos * Likewise if the relative second line address is zero.
331 1.1 alm */
332 1.40 christos if ((cp->a2->type == AT_LINE &&
333 1.40 christos linenum >= cp->a2->u.l) ||
334 1.40 christos (cp->a2->type == AT_RELLINE && cp->a2->u.l == 0))
335 1.1 alm lastaddr = 1;
336 1.40 christos else {
337 1.40 christos cp->startline = linenum;
338 1.40 christos }
339 1.1 alm r = 1;
340 1.1 alm } else
341 1.1 alm r = 0;
342 1.40 christos else
343 1.1 alm r = MATCH(cp->a1);
344 1.1 alm return (cp->nonsel ? ! r : r);
345 1.1 alm }
346 1.1 alm
347 1.1 alm /*
348 1.40 christos * Reset the sed processor to its initial state.
349 1.40 christos */
350 1.52 christos void
351 1.40 christos resetstate(void)
352 1.40 christos {
353 1.40 christos struct s_command *cp;
354 1.40 christos
355 1.40 christos /*
356 1.40 christos * Reset all in-range markers.
357 1.40 christos */
358 1.40 christos for (cp = prog; cp; cp = cp->code == '{' ? cp->u.c : cp->next)
359 1.40 christos if (cp->a2)
360 1.40 christos cp->startline = 0;
361 1.40 christos
362 1.40 christos /*
363 1.40 christos * Clear out the hold space.
364 1.40 christos */
365 1.40 christos cspace(&HS, "", 0, REPLACE);
366 1.40 christos }
367 1.40 christos
368 1.40 christos /*
369 1.1 alm * substitute --
370 1.1 alm * Do substitutions in the pattern space. Currently, we build a
371 1.1 alm * copy of the new pattern space in the substitute space structure
372 1.1 alm * and then swap them.
373 1.1 alm */
374 1.1 alm static int
375 1.32 wiz substitute(struct s_command *cp)
376 1.1 alm {
377 1.1 alm SPACE tspace;
378 1.1 alm regex_t *re;
379 1.40 christos regoff_t re_off, slen;
380 1.19 mrg int lastempty, n;
381 1.1 alm char *s;
382 1.1 alm
383 1.1 alm s = ps;
384 1.1 alm re = cp->u.s->re;
385 1.1 alm if (re == NULL) {
386 1.40 christos if (defpreg != NULL && cp->u.s->maxbref > defpreg->re_nsub) {
387 1.1 alm linenum = cp->u.s->linenum;
388 1.40 christos errx(1, "%lu: %s: \\%u not defined in the RE",
389 1.40 christos linenum, fname, cp->u.s->maxbref);
390 1.1 alm }
391 1.1 alm }
392 1.8 cgd if (!regexec_e(re, s, 0, 0, psl))
393 1.1 alm return (0);
394 1.1 alm
395 1.1 alm SS.len = 0; /* Clean substitute space. */
396 1.40 christos slen = (regoff_t)psl;
397 1.1 alm n = cp->u.s->n;
398 1.12 cgd lastempty = 1;
399 1.12 cgd
400 1.1 alm switch (n) {
401 1.1 alm case 0: /* Global */
402 1.1 alm do {
403 1.12 cgd if (lastempty || match[0].rm_so != match[0].rm_eo) {
404 1.12 cgd /* Locate start of replaced string. */
405 1.12 cgd re_off = match[0].rm_so;
406 1.12 cgd /* Copy leading retained string. */
407 1.40 christos cspace(&SS, s, (size_t)re_off, APPEND);
408 1.12 cgd /* Add in regular expression. */
409 1.12 cgd regsub(&SS, s, cp->u.s->new);
410 1.12 cgd }
411 1.12 cgd
412 1.1 alm /* Move past this match. */
413 1.12 cgd if (match[0].rm_so != match[0].rm_eo) {
414 1.12 cgd s += match[0].rm_eo;
415 1.12 cgd slen -= match[0].rm_eo;
416 1.12 cgd lastempty = 0;
417 1.12 cgd } else {
418 1.40 christos if (match[0].rm_so < slen)
419 1.40 christos cspace(&SS, s + match[0].rm_so, 1,
420 1.40 christos APPEND);
421 1.12 cgd s += match[0].rm_so + 1;
422 1.12 cgd slen -= match[0].rm_so + 1;
423 1.12 cgd lastempty = 1;
424 1.12 cgd }
425 1.40 christos } while (slen >= 0 && regexec_e(re, s, REG_NOTBOL, 0, (size_t)slen));
426 1.1 alm /* Copy trailing retained string. */
427 1.12 cgd if (slen > 0)
428 1.40 christos cspace(&SS, s, (size_t)slen, APPEND);
429 1.1 alm break;
430 1.1 alm default: /* Nth occurrence */
431 1.1 alm while (--n) {
432 1.40 christos if (match[0].rm_eo == match[0].rm_so)
433 1.40 christos match[0].rm_eo = match[0].rm_so + 1;
434 1.1 alm s += match[0].rm_eo;
435 1.8 cgd slen -= match[0].rm_eo;
436 1.40 christos if (slen < 0)
437 1.40 christos return (0);
438 1.40 christos if (!regexec_e(re, s, REG_NOTBOL, 0, (size_t)slen))
439 1.1 alm return (0);
440 1.1 alm }
441 1.1 alm /* FALLTHROUGH */
442 1.1 alm case 1: /* 1st occurrence */
443 1.1 alm /* Locate start of replaced string. */
444 1.1 alm re_off = match[0].rm_so + (s - ps);
445 1.1 alm /* Copy leading retained string. */
446 1.40 christos cspace(&SS, ps, (size_t)re_off, APPEND);
447 1.1 alm /* Add in regular expression. */
448 1.1 alm regsub(&SS, s, cp->u.s->new);
449 1.1 alm /* Copy trailing retained string. */
450 1.1 alm s += match[0].rm_eo;
451 1.8 cgd slen -= match[0].rm_eo;
452 1.40 christos cspace(&SS, s, (size_t)slen, APPEND);
453 1.1 alm break;
454 1.1 alm }
455 1.1 alm
456 1.1 alm /*
457 1.1 alm * Swap the substitute space and the pattern space, and make sure
458 1.1 alm * that any leftover pointers into stdio memory get lost.
459 1.1 alm */
460 1.1 alm tspace = PS;
461 1.1 alm PS = SS;
462 1.1 alm SS = tspace;
463 1.1 alm SS.space = SS.back;
464 1.1 alm
465 1.1 alm /* Handle the 'p' flag. */
466 1.1 alm if (cp->u.s->p)
467 1.40 christos OUT();
468 1.1 alm
469 1.1 alm /* Handle the 'w' flag. */
470 1.1 alm if (cp->u.s->wfile && !pd) {
471 1.1 alm if (cp->u.s->wfd == -1 && (cp->u.s->wfd = open(cp->u.s->wfile,
472 1.1 alm O_WRONLY|O_APPEND|O_CREAT|O_TRUNC, DEFFILEMODE)) == -1)
473 1.40 christos err(1, "%s", cp->u.s->wfile);
474 1.40 christos if (write(cp->u.s->wfd, ps, psl) != (ssize_t)psl ||
475 1.40 christos write(cp->u.s->wfd, "\n", 1) != 1)
476 1.40 christos err(1, "%s", cp->u.s->wfile);
477 1.1 alm }
478 1.1 alm return (1);
479 1.1 alm }
480 1.1 alm
481 1.1 alm /*
482 1.40 christos * do_tr --
483 1.40 christos * Perform translation ('y' command) in the pattern space.
484 1.40 christos */
485 1.40 christos static void
486 1.40 christos do_tr(struct s_tr *y)
487 1.40 christos {
488 1.40 christos SPACE tmp;
489 1.40 christos char c, *p;
490 1.40 christos size_t clen, left;
491 1.40 christos size_t i;
492 1.40 christos
493 1.40 christos if (MB_CUR_MAX == 1) {
494 1.40 christos /*
495 1.40 christos * Single-byte encoding: perform in-place translation
496 1.40 christos * of the pattern space.
497 1.40 christos */
498 1.40 christos for (p = ps; p < &ps[psl]; p++)
499 1.40 christos *p = (char)y->bytetab[(u_char)*p];
500 1.40 christos } else {
501 1.40 christos /*
502 1.40 christos * Multi-byte encoding: perform translation into the
503 1.40 christos * translation space, then swap the translation and
504 1.40 christos * pattern spaces.
505 1.40 christos */
506 1.40 christos /* Clean translation space. */
507 1.40 christos YS.len = 0;
508 1.40 christos for (p = ps, left = psl; left > 0; p += clen, left -= clen) {
509 1.40 christos if ((c = (char)y->bytetab[(u_char)*p]) != '\0') {
510 1.40 christos cspace(&YS, &c, 1, APPEND);
511 1.40 christos clen = 1;
512 1.40 christos continue;
513 1.40 christos }
514 1.40 christos for (i = 0; i < y->nmultis; i++)
515 1.40 christos if (left >= y->multis[i].fromlen &&
516 1.40 christos memcmp(p, y->multis[i].from,
517 1.40 christos y->multis[i].fromlen) == 0)
518 1.40 christos break;
519 1.40 christos if (i < y->nmultis) {
520 1.40 christos cspace(&YS, y->multis[i].to,
521 1.40 christos y->multis[i].tolen, APPEND);
522 1.40 christos clen = y->multis[i].fromlen;
523 1.40 christos } else {
524 1.40 christos cspace(&YS, p, 1, APPEND);
525 1.40 christos clen = 1;
526 1.40 christos }
527 1.40 christos }
528 1.40 christos /* Swap the translation space and the pattern space. */
529 1.40 christos tmp = PS;
530 1.40 christos PS = YS;
531 1.40 christos YS = tmp;
532 1.40 christos YS.space = YS.back;
533 1.40 christos }
534 1.40 christos }
535 1.40 christos
536 1.40 christos /*
537 1.1 alm * Flush append requests. Always called before reading a line,
538 1.1 alm * therefore it also resets the substitution done (sdone) flag.
539 1.1 alm */
540 1.1 alm static void
541 1.32 wiz flush_appends(void)
542 1.1 alm {
543 1.1 alm FILE *f;
544 1.40 christos size_t count, i;
545 1.1 alm char buf[8 * 1024];
546 1.1 alm
547 1.40 christos for (i = 0; i < appendx; i++)
548 1.1 alm switch (appends[i].type) {
549 1.1 alm case AP_STRING:
550 1.40 christos fwrite(appends[i].s, sizeof(char), appends[i].len,
551 1.40 christos outfile);
552 1.1 alm break;
553 1.1 alm case AP_FILE:
554 1.1 alm /*
555 1.1 alm * Read files probably shouldn't be cached. Since
556 1.1 alm * it's not an error to read a non-existent file,
557 1.1 alm * it's possible that another program is interacting
558 1.40 christos * with the sed script through the filesystem. It
559 1.1 alm * would be truly bizarre, but possible. It's probably
560 1.1 alm * not that big a performance win, anyhow.
561 1.1 alm */
562 1.1 alm if ((f = fopen(appends[i].s, "r")) == NULL)
563 1.1 alm break;
564 1.40 christos while ((count = fread(buf, sizeof(char), sizeof(buf), f)))
565 1.40 christos (void)fwrite(buf, sizeof(char), count, outfile);
566 1.1 alm (void)fclose(f);
567 1.1 alm break;
568 1.1 alm }
569 1.40 christos if (ferror(outfile))
570 1.40 christos errx(1, "%s: %s", outfname, strerror(errno ? errno : EIO));
571 1.40 christos appendx = 0;
572 1.40 christos sdone = 0;
573 1.1 alm }
574 1.1 alm
575 1.1 alm static void
576 1.40 christos lputs(char *s, size_t len)
577 1.1 alm {
578 1.40 christos static const char escapes[] = "\\\a\b\f\r\t\v";
579 1.40 christos int c;
580 1.40 christos size_t col, width;
581 1.40 christos const char *p;
582 1.40 christos #ifdef TIOCGWINSZ
583 1.1 alm struct winsize win;
584 1.37 gdamore #endif
585 1.40 christos static size_t termwidth = (size_t)-1;
586 1.40 christos size_t clen, i;
587 1.40 christos wchar_t wc;
588 1.40 christos mbstate_t mbs;
589 1.40 christos
590 1.40 christos if (outfile != stdout)
591 1.40 christos termwidth = 60;
592 1.40 christos if (termwidth == (size_t)-1) {
593 1.40 christos if ((p = getenv("COLUMNS")) && *p != '\0')
594 1.40 christos termwidth = (size_t)atoi(p);
595 1.40 christos #ifdef TIOCGWINSZ
596 1.1 alm else if (ioctl(STDOUT_FILENO, TIOCGWINSZ, &win) == 0 &&
597 1.1 alm win.ws_col > 0)
598 1.1 alm termwidth = win.ws_col;
599 1.37 gdamore #endif
600 1.1 alm else
601 1.1 alm termwidth = 60;
602 1.23 ross }
603 1.40 christos if (termwidth == 0)
604 1.40 christos termwidth = 1;
605 1.40 christos
606 1.40 christos memset(&mbs, 0, sizeof(mbs));
607 1.40 christos col = 0;
608 1.40 christos while (len != 0) {
609 1.40 christos clen = mbrtowc(&wc, s, len, &mbs);
610 1.40 christos if (clen == 0)
611 1.40 christos clen = 1;
612 1.40 christos if (clen == (size_t)-1 || clen == (size_t)-2) {
613 1.40 christos wc = (unsigned char)*s;
614 1.40 christos clen = 1;
615 1.40 christos memset(&mbs, 0, sizeof(mbs));
616 1.1 alm }
617 1.40 christos if (wc == '\n') {
618 1.40 christos if (col + 1 >= termwidth)
619 1.40 christos fprintf(outfile, "\\\n");
620 1.40 christos fputc('$', outfile);
621 1.40 christos fputc('\n', outfile);
622 1.40 christos col = 0;
623 1.40 christos } else if (iswprint(wc)) {
624 1.40 christos width = (size_t)wcwidth(wc);
625 1.40 christos if (col + width >= termwidth) {
626 1.40 christos fprintf(outfile, "\\\n");
627 1.40 christos col = 0;
628 1.40 christos }
629 1.40 christos fwrite(s, 1, clen, outfile);
630 1.40 christos col += width;
631 1.40 christos } else if (wc != L'\0' && (c = wctob(wc)) != EOF &&
632 1.40 christos (p = strchr(escapes, c)) != NULL) {
633 1.40 christos if (col + 2 >= termwidth) {
634 1.40 christos fprintf(outfile, "\\\n");
635 1.40 christos col = 0;
636 1.40 christos }
637 1.40 christos fprintf(outfile, "\\%c", "\\abfrtv"[p - escapes]);
638 1.40 christos col += 2;
639 1.1 alm } else {
640 1.40 christos if (col + 4 * clen >= termwidth) {
641 1.40 christos fprintf(outfile, "\\\n");
642 1.40 christos col = 0;
643 1.1 alm }
644 1.40 christos for (i = 0; i < clen; i++)
645 1.40 christos fprintf(outfile, "\\%03o",
646 1.40 christos (int)(unsigned char)s[i]);
647 1.40 christos col += 4 * clen;
648 1.1 alm }
649 1.40 christos s += clen;
650 1.40 christos len -= clen;
651 1.1 alm }
652 1.40 christos if (col + 1 >= termwidth)
653 1.40 christos fprintf(outfile, "\\\n");
654 1.40 christos (void)fputc('$', outfile);
655 1.40 christos (void)fputc('\n', outfile);
656 1.40 christos if (ferror(outfile))
657 1.40 christos errx(1, "%s: %s", outfname, strerror(errno ? errno : EIO));
658 1.1 alm }
659 1.1 alm
660 1.40 christos static __inline int
661 1.40 christos regexec_e(regex_t *preg, const char *string, int eflags, int nomatch,
662 1.40 christos size_t slen)
663 1.1 alm {
664 1.1 alm int eval;
665 1.44 christos #ifndef REG_STARTEND
666 1.44 christos char *buf;
667 1.44 christos #endif
668 1.40 christos
669 1.1 alm if (preg == NULL) {
670 1.1 alm if (defpreg == NULL)
671 1.40 christos errx(1, "first RE may not be empty");
672 1.1 alm } else
673 1.1 alm defpreg = preg;
674 1.1 alm
675 1.40 christos /* Set anchors */
676 1.44 christos #ifndef REG_STARTEND
677 1.44 christos buf = xmalloc(slen + 1);
678 1.44 christos (void)memcpy(buf, string, slen);
679 1.44 christos buf[slen] = '\0';
680 1.44 christos eval = regexec(defpreg, buf,
681 1.44 christos nomatch ? 0 : maxnsub + 1, match, eflags);
682 1.44 christos free(buf);
683 1.44 christos #else
684 1.8 cgd match[0].rm_so = 0;
685 1.40 christos match[0].rm_eo = (regoff_t)slen;
686 1.1 alm eval = regexec(defpreg, string,
687 1.8 cgd nomatch ? 0 : maxnsub + 1, match, eflags | REG_STARTEND);
688 1.44 christos #endif
689 1.1 alm switch(eval) {
690 1.1 alm case 0:
691 1.1 alm return (1);
692 1.1 alm case REG_NOMATCH:
693 1.1 alm return (0);
694 1.1 alm }
695 1.40 christos errx(1, "RE error: %s", strregerror(eval, defpreg));
696 1.1 alm /* NOTREACHED */
697 1.1 alm }
698 1.1 alm
699 1.1 alm /*
700 1.1 alm * regsub - perform substitutions after a regexp match
701 1.1 alm * Based on a routine by Henry Spencer
702 1.1 alm */
703 1.1 alm static void
704 1.32 wiz regsub(SPACE *sp, char *string, char *src)
705 1.1 alm {
706 1.40 christos size_t len;
707 1.40 christos int no;
708 1.20 lukem char c, *dst;
709 1.1 alm
710 1.1 alm #define NEEDSP(reqlen) \
711 1.40 christos /* XXX What is the +1 for? */ \
712 1.34 itojun if (sp->len + (reqlen) + 1 >= sp->blen) { \
713 1.40 christos sp->blen += (reqlen) + 1024; \
714 1.40 christos sp->space = sp->back = xrealloc(sp->back, sp->blen); \
715 1.1 alm dst = sp->space + sp->len; \
716 1.1 alm }
717 1.1 alm
718 1.1 alm dst = sp->space + sp->len;
719 1.1 alm while ((c = *src++) != '\0') {
720 1.1 alm if (c == '&')
721 1.1 alm no = 0;
722 1.24 christos else if (c == '\\' && isdigit((unsigned char)*src))
723 1.1 alm no = *src++ - '0';
724 1.1 alm else
725 1.1 alm no = -1;
726 1.1 alm if (no < 0) { /* Ordinary character. */
727 1.40 christos if (c == '\\' && (*src == '\\' || *src == '&'))
728 1.40 christos c = *src++;
729 1.1 alm NEEDSP(1);
730 1.40 christos *dst++ = c;
731 1.1 alm ++sp->len;
732 1.40 christos } else if (match[no].rm_so != -1 && match[no].rm_eo != -1) {
733 1.40 christos len = (size_t)(match[no].rm_eo - match[no].rm_so);
734 1.1 alm NEEDSP(len);
735 1.1 alm memmove(dst, string + match[no].rm_so, len);
736 1.1 alm dst += len;
737 1.1 alm sp->len += len;
738 1.1 alm }
739 1.1 alm }
740 1.1 alm NEEDSP(1);
741 1.1 alm *dst = '\0';
742 1.1 alm }
743 1.1 alm
744 1.1 alm /*
745 1.40 christos * cspace --
746 1.40 christos * Concatenate space: append the source space to the destination space,
747 1.40 christos * allocating new space as necessary.
748 1.1 alm */
749 1.52 christos void
750 1.38 lukem cspace(SPACE *sp, const char *p, size_t len, enum e_spflag spflag)
751 1.1 alm {
752 1.1 alm size_t tlen;
753 1.1 alm
754 1.8 cgd /* Make sure SPACE has enough memory and ramp up quickly. */
755 1.8 cgd tlen = sp->len + len + 1;
756 1.1 alm if (tlen > sp->blen) {
757 1.40 christos sp->blen = tlen + 1024;
758 1.40 christos sp->space = sp->back = xrealloc(sp->back, sp->blen);
759 1.1 alm }
760 1.1 alm
761 1.8 cgd if (spflag == REPLACE)
762 1.1 alm sp->len = 0;
763 1.1 alm
764 1.1 alm memmove(sp->space + sp->len, p, len);
765 1.8 cgd
766 1.1 alm sp->space[sp->len += len] = '\0';
767 1.1 alm }
768 1.1 alm
769 1.1 alm /*
770 1.1 alm * Close all cached opened files and report any errors
771 1.1 alm */
772 1.52 christos void
773 1.32 wiz cfclose(struct s_command *cp, struct s_command *end)
774 1.1 alm {
775 1.1 alm
776 1.1 alm for (; cp != end; cp = cp->next)
777 1.1 alm switch(cp->code) {
778 1.1 alm case 's':
779 1.1 alm if (cp->u.s->wfd != -1 && close(cp->u.s->wfd))
780 1.40 christos err(1, "%s", cp->u.s->wfile);
781 1.1 alm cp->u.s->wfd = -1;
782 1.1 alm break;
783 1.1 alm case 'w':
784 1.1 alm if (cp->u.fd != -1 && close(cp->u.fd))
785 1.40 christos err(1, "%s", cp->t);
786 1.1 alm cp->u.fd = -1;
787 1.1 alm break;
788 1.1 alm case '{':
789 1.1 alm cfclose(cp->u.c, cp->next);
790 1.1 alm break;
791 1.1 alm }
792 1.1 alm }
793