xargs.c revision 1.16 1 /* $NetBSD: xargs.c,v 1.16 2007/04/18 15:56:07 christos Exp $ */
2
3 /*-
4 * Copyright (c) 1990, 1993
5 * The Regents of the University of California. All rights reserved.
6 *
7 * This code is derived from software contributed to Berkeley by
8 * John B. Roll Jr.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
18 * 3. Neither the name of the University nor the names of its contributors
19 * may be used to endorse or promote products derived from this software
20 * without specific prior written permission.
21 *
22 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 * SUCH DAMAGE.
33 *
34 * $xMach: xargs.c,v 1.6 2002/02/23 05:27:47 tim Exp $
35 */
36
37 #include <sys/cdefs.h>
38 #ifndef lint
39 __COPYRIGHT("@(#) Copyright (c) 1990, 1993\n\
40 The Regents of the University of California. All rights reserved.\n");
41 #if 0
42 static char sccsid[] = "@(#)xargs.c 8.1 (Berkeley) 6/6/93";
43 __FBSDID("$FreeBSD: src/usr.bin/xargs/xargs.c,v 1.62 2006/01/01 22:59:54 jmallett Exp $");
44 #endif
45 __RCSID("$NetBSD: xargs.c,v 1.16 2007/04/18 15:56:07 christos Exp $");
46 #endif /* not lint */
47
48 #include <sys/param.h>
49 #include <sys/wait.h>
50
51 #include <err.h>
52 #include <errno.h>
53 #include <fcntl.h>
54 #include <langinfo.h>
55 #include <locale.h>
56 #include <paths.h>
57 #include <regex.h>
58 #include <stdio.h>
59 #include <stdlib.h>
60 #include <string.h>
61 #include <signal.h>
62 #include <unistd.h>
63
64 #include "pathnames.h"
65
66 static void parse_input(int, char *[]);
67 static void prerun(int, char *[]);
68 static int prompt(void);
69 static void run(char **);
70 static void usage(void) __attribute__((__noreturn__));
71 void strnsubst(char **, const char *, const char *, size_t);
72 static void waitchildren(const char *, int);
73
74 static char echo[] = _PATH_ECHO;
75 static char **av, **bxp, **ep, **endxp, **xp;
76 static char *argp, *bbp, *ebp, *inpline, *p, *replstr;
77 static const char *eofstr;
78 static int count, insingle, indouble, oflag, pflag, tflag, Rflag, rval, zflag;
79 static int cnt, Iflag, jfound, Lflag, Sflag, wasquoted, xflag;
80 static int curprocs, maxprocs;
81
82 static volatile int childerr;
83
84 extern char **environ;
85
86 int
87 main(int argc, char *argv[])
88 {
89 long arg_max;
90 int ch, Jflag, nargs, nflag, nline;
91 size_t linelen;
92 char *endptr;
93
94 setprogname(argv[0]);
95
96 inpline = replstr = NULL;
97 ep = environ;
98 eofstr = "";
99 Jflag = nflag = 0;
100
101 (void)setlocale(LC_ALL, "");
102
103 /*
104 * POSIX.2 limits the exec line length to ARG_MAX - 2K. Running that
105 * caused some E2BIG errors, so it was changed to ARG_MAX - 4K. Given
106 * that the smallest argument is 2 bytes in length, this means that
107 * the number of arguments is limited to:
108 *
109 * (ARG_MAX - 4K - LENGTH(utility + arguments)) / 2.
110 *
111 * We arbitrarily limit the number of arguments to 5000. This is
112 * allowed by POSIX.2 as long as the resulting minimum exec line is
113 * at least LINE_MAX. Realloc'ing as necessary is possible, but
114 * probably not worthwhile.
115 */
116 nargs = 5000;
117 if ((arg_max = sysconf(_SC_ARG_MAX)) == -1)
118 errx(1, "sysconf(_SC_ARG_MAX) failed");
119 nline = arg_max - 4 * 1024;
120 while (*ep != NULL) {
121 /* 1 byte for each '\0' */
122 nline -= strlen(*ep++) + 1 + sizeof(*ep);
123 }
124 maxprocs = 1;
125 while ((ch = getopt(argc, argv, "0E:I:J:L:n:oP:pR:S:s:rtx")) != -1)
126 switch (ch) {
127 case 'E':
128 eofstr = optarg;
129 break;
130 case 'I':
131 Jflag = 0;
132 Iflag = 1;
133 Lflag = 1;
134 replstr = optarg;
135 break;
136 case 'J':
137 Iflag = 0;
138 Jflag = 1;
139 replstr = optarg;
140 break;
141 case 'L':
142 Lflag = atoi(optarg);
143 break;
144 case 'n':
145 nflag = 1;
146 if ((nargs = atoi(optarg)) <= 0)
147 errx(1, "illegal argument count");
148 break;
149 case 'o':
150 oflag = 1;
151 break;
152 case 'P':
153 if ((maxprocs = atoi(optarg)) <= 0)
154 errx(1, "max. processes must be >0");
155 break;
156 case 'p':
157 pflag = 1;
158 break;
159 case 'R':
160 Rflag = strtol(optarg, &endptr, 10);
161 if (*endptr != '\0')
162 errx(1, "replacements must be a number");
163 break;
164 case 'r':
165 /* GNU compatibility */
166 break;
167 case 'S':
168 Sflag = strtoul(optarg, &endptr, 10);
169 if (*endptr != '\0')
170 errx(1, "replsize must be a number");
171 break;
172 case 's':
173 nline = atoi(optarg);
174 break;
175 case 't':
176 tflag = 1;
177 break;
178 case 'x':
179 xflag = 1;
180 break;
181 case '0':
182 zflag = 1;
183 break;
184 case '?':
185 default:
186 usage();
187 }
188 argc -= optind;
189 argv += optind;
190
191 if (!Iflag && Rflag)
192 usage();
193 if (!Iflag && Sflag)
194 usage();
195 if (Iflag && !Rflag)
196 Rflag = 5;
197 if (Iflag && !Sflag)
198 Sflag = 255;
199 if (xflag && !nflag)
200 usage();
201 if (Iflag || Lflag)
202 xflag = 1;
203 if (replstr != NULL && *replstr == '\0')
204 errx(1, "replstr may not be empty");
205
206 /*
207 * Allocate pointers for the utility name, the utility arguments,
208 * the maximum arguments to be read from stdin and the trailing
209 * NULL.
210 */
211 linelen = 1 + argc + nargs + 1;
212 if ((av = bxp = malloc(linelen * sizeof(char **))) == NULL)
213 errx(1, "malloc failed");
214
215 /*
216 * Use the user's name for the utility as argv[0], just like the
217 * shell. Echo is the default. Set up pointers for the user's
218 * arguments.
219 */
220 if (*argv == NULL)
221 cnt = strlen(*bxp++ = echo);
222 else {
223 do {
224 if (Jflag && strcmp(*argv, replstr) == 0) {
225 char **avj;
226 jfound = 1;
227 argv++;
228 for (avj = argv; *avj; avj++)
229 cnt += strlen(*avj) + 1;
230 break;
231 }
232 cnt += strlen(*bxp++ = *argv) + 1;
233 } while (*++argv != NULL);
234 }
235
236 /*
237 * Set up begin/end/traversing pointers into the array. The -n
238 * count doesn't include the trailing NULL pointer, so the malloc
239 * added in an extra slot.
240 */
241 endxp = (xp = bxp) + nargs;
242
243 /*
244 * Allocate buffer space for the arguments read from stdin and the
245 * trailing NULL. Buffer space is defined as the default or specified
246 * space, minus the length of the utility name and arguments. Set up
247 * begin/end/traversing pointers into the array. The -s count does
248 * include the trailing NULL, so the malloc didn't add in an extra
249 * slot.
250 */
251 nline -= cnt;
252 if (nline <= 0)
253 errx(1, "insufficient space for command");
254
255 if ((bbp = malloc((size_t)(nline + 1))) == NULL)
256 errx(1, "malloc failed");
257 ebp = (argp = p = bbp) + nline - 1;
258 for (;;)
259 parse_input(argc, argv);
260 }
261
262 static void
263 parse_input(int argc, char *argv[])
264 {
265 int ch, foundeof;
266 char **avj;
267
268 foundeof = 0;
269
270 switch (ch = getchar()) {
271 case EOF:
272 /* No arguments since last exec. */
273 if (p == bbp) {
274 waitchildren(*argv, 1);
275 exit(rval);
276 }
277 goto arg1;
278 case ' ':
279 case '\t':
280 /* Quotes escape tabs and spaces. */
281 if (insingle || indouble || zflag)
282 goto addch;
283 goto arg2;
284 case '\0':
285 if (zflag) {
286 /*
287 * Increment 'count', so that nulls will be treated
288 * as end-of-line, as well as end-of-argument. This
289 * is needed so -0 works properly with -I and -L.
290 */
291 count++;
292 goto arg2;
293 }
294 goto addch;
295 case '\n':
296 if (zflag)
297 goto addch;
298 count++; /* Indicate end-of-line (used by -L) */
299
300 /* Quotes do not escape newlines. */
301 arg1: if (insingle || indouble)
302 errx(1, "unterminated quote");
303 arg2:
304 foundeof = *eofstr != '\0' &&
305 strncmp(argp, eofstr, (size_t)(p - argp)) == 0;
306
307 /* Do not make empty args unless they are quoted */
308 if ((argp != p || wasquoted) && !foundeof) {
309 *p++ = '\0';
310 *xp++ = argp;
311 if (Iflag) {
312 size_t curlen;
313
314 if (inpline == NULL)
315 curlen = 0;
316 else {
317 /*
318 * If this string is not zero
319 * length, append a space for
320 * separation before the next
321 * argument.
322 */
323 if ((curlen = strlen(inpline)) != 0)
324 (void)strcat(inpline, " ");
325 }
326 curlen++;
327 /*
328 * Allocate enough to hold what we will
329 * be holding in a second, and to append
330 * a space next time through, if we have
331 * to.
332 */
333 inpline = realloc(inpline, curlen + 2 +
334 strlen(argp));
335 if (inpline == NULL)
336 errx(1, "realloc failed");
337 if (curlen == 1)
338 (void)strcpy(inpline, argp);
339 else
340 (void)strcat(inpline, argp);
341 }
342 }
343
344 /*
345 * If max'd out on args or buffer, or reached EOF,
346 * run the command. If xflag and max'd out on buffer
347 * but not on args, object. Having reached the limit
348 * of input lines, as specified by -L is the same as
349 * maxing out on arguments.
350 */
351 if (xp == endxp || p > ebp || ch == EOF ||
352 (Lflag <= count && xflag) || foundeof) {
353 if (xflag && xp != endxp && p > ebp)
354 errx(1, "insufficient space for arguments");
355 if (jfound) {
356 for (avj = argv; *avj; avj++)
357 *xp++ = *avj;
358 }
359 prerun(argc, av);
360 if (ch == EOF || foundeof) {
361 waitchildren(*argv, 1);
362 exit(rval);
363 }
364 p = bbp;
365 xp = bxp;
366 count = 0;
367 }
368 argp = p;
369 wasquoted = 0;
370 break;
371 case '\'':
372 if (indouble || zflag)
373 goto addch;
374 insingle = !insingle;
375 wasquoted = 1;
376 break;
377 case '"':
378 if (insingle || zflag)
379 goto addch;
380 indouble = !indouble;
381 wasquoted = 1;
382 break;
383 case '\\':
384 if (zflag)
385 goto addch;
386 /* Backslash escapes anything, is escaped by quotes. */
387 if (!insingle && !indouble && (ch = getchar()) == EOF)
388 errx(1, "backslash at EOF");
389 /* FALLTHROUGH */
390 default:
391 addch: if (p < ebp) {
392 *p++ = ch;
393 break;
394 }
395
396 /* If only one argument, not enough buffer space. */
397 if (bxp == xp)
398 errx(1, "insufficient space for argument");
399 /* Didn't hit argument limit, so if xflag object. */
400 if (xflag)
401 errx(1, "insufficient space for arguments");
402
403 if (jfound) {
404 for (avj = argv; *avj; avj++)
405 *xp++ = *avj;
406 }
407 prerun(argc, av);
408 xp = bxp;
409 cnt = ebp - argp;
410 (void)memcpy(bbp, argp, (size_t)cnt);
411 p = (argp = bbp) + cnt;
412 *p++ = ch;
413 break;
414 }
415 }
416
417 /*
418 * Do things necessary before run()'ing, such as -I substitution,
419 * and then call run().
420 */
421 static void
422 prerun(int argc, char *argv[])
423 {
424 char **tmp, **tmp2, **avj;
425 int repls;
426
427 repls = Rflag;
428
429 if (argc == 0 || repls == 0) {
430 *xp = NULL;
431 run(argv);
432 return;
433 }
434
435 avj = argv;
436
437 /*
438 * Allocate memory to hold the argument list, and
439 * a NULL at the tail.
440 */
441 tmp = malloc((argc + 1) * sizeof(char**));
442 if (tmp == NULL)
443 errx(1, "malloc failed");
444 tmp2 = tmp;
445
446 /*
447 * Save the first argument and iterate over it, we
448 * cannot do strnsubst() to it.
449 */
450 if ((*tmp++ = strdup(*avj++)) == NULL)
451 errx(1, "strdup failed");
452
453 /*
454 * For each argument to utility, if we have not used up
455 * the number of replacements we are allowed to do, and
456 * if the argument contains at least one occurrence of
457 * replstr, call strnsubst(), else just save the string.
458 * Iterations over elements of avj and tmp are done
459 * where appropriate.
460 */
461 while (--argc) {
462 *tmp = *avj++;
463 if (repls && strstr(*tmp, replstr) != NULL) {
464 strnsubst(tmp++, replstr, inpline, (size_t)Sflag);
465 if (repls > 0)
466 repls--;
467 } else {
468 if ((*tmp = strdup(*tmp)) == NULL)
469 errx(1, "strdup failed");
470 tmp++;
471 }
472 }
473
474 /*
475 * Run it.
476 */
477 *tmp = NULL;
478 run(tmp2);
479
480 /*
481 * Walk from the tail to the head, free along the way.
482 */
483 for (; tmp2 != tmp; tmp--)
484 free(*tmp);
485 /*
486 * Now free the list itself.
487 */
488 free(tmp2);
489
490 /*
491 * Free the input line buffer, if we have one.
492 */
493 if (inpline != NULL) {
494 free(inpline);
495 inpline = NULL;
496 }
497 }
498
499 static void
500 run(char **argv)
501 {
502 int fd;
503 char **avec;
504
505 /*
506 * If the user wants to be notified of each command before it is
507 * executed, notify them. If they want the notification to be
508 * followed by a prompt, then prompt them.
509 */
510 if (tflag || pflag) {
511 (void)fprintf(stderr, "%s", *argv);
512 for (avec = argv + 1; *avec != NULL; ++avec)
513 (void)fprintf(stderr, " %s", *avec);
514 /*
515 * If the user has asked to be prompted, do so.
516 */
517 if (pflag)
518 /*
519 * If they asked not to exec, return without execution
520 * but if they asked to, go to the execution. If we
521 * could not open their tty, break the switch and drop
522 * back to -t behaviour.
523 */
524 switch (prompt()) {
525 case 0:
526 return;
527 case 1:
528 goto exec;
529 case 2:
530 break;
531 }
532 (void)fprintf(stderr, "\n");
533 (void)fflush(stderr);
534 }
535 exec:
536 childerr = 0;
537 switch (vfork()) {
538 case -1:
539 err(1, "vfork");
540 /*NOTREACHED*/
541 case 0:
542 if (oflag) {
543 if ((fd = open(_PATH_TTY, O_RDONLY)) == -1)
544 err(1, "can't open /dev/tty");
545 } else {
546 fd = open(_PATH_DEVNULL, O_RDONLY);
547 }
548 if (fd > STDIN_FILENO) {
549 if (dup2(fd, STDIN_FILENO) != 0)
550 err(1, "can't dup2 to stdin");
551 (void)close(fd);
552 }
553 (void)execvp(argv[0], argv);
554 childerr = errno;
555 _exit(1);
556 }
557 curprocs++;
558 waitchildren(*argv, 0);
559 }
560
561 static void
562 waitchildren(const char *name, int waitall)
563 {
564 pid_t pid;
565 int status;
566
567 while ((pid = waitpid(-1, &status, !waitall && curprocs < maxprocs ?
568 WNOHANG : 0)) > 0) {
569 curprocs--;
570 /* If we couldn't invoke the utility, exit. */
571 if (childerr != 0) {
572 errno = childerr;
573 err(errno == ENOENT ? 127 : 126, "%s", name);
574 }
575 /*
576 * According to POSIX, we have to exit if the utility exits
577 * with a 255 status, or is interrupted by a signal. xargs
578 * is allowed to return any exit status between 1 and 125
579 * in these cases, but we'll use 124 and 125, the same
580 * values used by GNU xargs.
581 */
582 if (WIFEXITED(status)) {
583 if (WEXITSTATUS (status) == 255) {
584 warnx ("%s exited with status 255", name);
585 exit(124);
586 } else if (WEXITSTATUS (status) != 0) {
587 rval = 123;
588 }
589 } else if (WIFSIGNALED (status)) {
590 if (WTERMSIG(status) < NSIG) {
591 warnx("%s terminated by SIG%s", name,
592 sys_signame[WTERMSIG(status)]);
593 } else {
594 warnx("%s terminated by signal %d", name,
595 WTERMSIG(status));
596 }
597 exit(125);
598 }
599 }
600 if (pid == -1 && errno != ECHILD)
601 err(1, "wait3");
602 }
603
604 /*
605 * Prompt the user about running a command.
606 */
607 static int
608 prompt(void)
609 {
610 regex_t cre;
611 size_t rsize;
612 int match;
613 char *response;
614 FILE *ttyfp;
615
616 if ((ttyfp = fopen(_PATH_TTY, "r")) == NULL)
617 return (2); /* Indicate that the TTY failed to open. */
618 (void)fprintf(stderr, "?...");
619 (void)fflush(stderr);
620 if ((response = fgetln(ttyfp, &rsize)) == NULL ||
621 regcomp(&cre, nl_langinfo(YESEXPR), REG_BASIC) != 0) {
622 (void)fclose(ttyfp);
623 return (0);
624 }
625 response[rsize - 1] = '\0';
626 match = regexec(&cre, response, 0, NULL, 0);
627 (void)fclose(ttyfp);
628 regfree(&cre);
629 return (match == 0);
630 }
631
632 static void
633 usage(void)
634 {
635 (void)fprintf(stderr,
636 "Usage: %s [-0opt] [-E eofstr] [-I replstr [-R replacements] [-S replsize]]\n"
637 " [-J replstr] [-L number] [-n number [-x]] [-P maxprocs]\n"
638 " [-s size] [utility [argument ...]]\n", getprogname());
639 exit(1);
640 }
641