join.c revision 1.29 1 1.29 lukem /* $NetBSD: join.c,v 1.29 2008/07/21 14:19:23 lukem Exp $ */
2 1.8 tls
3 1.1 glass /*-
4 1.10 tls * Copyright (c) 1991 The Regents of the University of California.
5 1.10 tls * All rights reserved.
6 1.1 glass *
7 1.1 glass * This code is derived from software contributed to Berkeley by
8 1.1 glass * Steve Hayman of Indiana University, Michiro Hikida and David
9 1.1 glass * Goodenough.
10 1.1 glass *
11 1.1 glass * Redistribution and use in source and binary forms, with or without
12 1.1 glass * modification, are permitted provided that the following conditions
13 1.1 glass * are met:
14 1.1 glass * 1. Redistributions of source code must retain the above copyright
15 1.1 glass * notice, this list of conditions and the following disclaimer.
16 1.1 glass * 2. Redistributions in binary form must reproduce the above copyright
17 1.1 glass * notice, this list of conditions and the following disclaimer in the
18 1.1 glass * documentation and/or other materials provided with the distribution.
19 1.23 agc * 3. Neither the name of the University nor the names of its contributors
20 1.1 glass * may be used to endorse or promote products derived from this software
21 1.1 glass * without specific prior written permission.
22 1.1 glass *
23 1.1 glass * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24 1.1 glass * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 1.1 glass * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 1.1 glass * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27 1.1 glass * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 1.1 glass * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 1.1 glass * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 1.1 glass * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 1.1 glass * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 1.1 glass * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 1.1 glass * SUCH DAMAGE.
34 1.1 glass */
35 1.1 glass
36 1.27 apb #if HAVE_NBTOOL_CONFIG_H
37 1.27 apb #include "nbtool_config.h"
38 1.27 apb #endif
39 1.27 apb
40 1.11 lukem #include <sys/cdefs.h>
41 1.1 glass #ifndef lint
42 1.29 lukem __COPYRIGHT("@(#) Copyright (c) 1991\
43 1.29 lukem The Regents of the University of California. All rights reserved.");
44 1.1 glass #endif /* not lint */
45 1.1 glass
46 1.1 glass #ifndef lint
47 1.11 lukem #if 0
48 1.11 lukem static char sccsid[] = "from: @(#)join.c 5.1 (Berkeley) 11/18/91";
49 1.11 lukem #else
50 1.29 lukem __RCSID("$NetBSD: join.c,v 1.29 2008/07/21 14:19:23 lukem Exp $");
51 1.11 lukem #endif
52 1.1 glass #endif /* not lint */
53 1.1 glass
54 1.1 glass #include <sys/types.h>
55 1.11 lukem #include <ctype.h>
56 1.11 lukem #include <err.h>
57 1.11 lukem #include <errno.h>
58 1.3 jtc #include <stdio.h>
59 1.1 glass #include <stdlib.h>
60 1.1 glass #include <string.h>
61 1.12 perry #include <unistd.h>
62 1.1 glass
63 1.1 glass /*
64 1.1 glass * There's a structure per input file which encapsulates the state of the
65 1.1 glass * file. We repeatedly read lines from each file until we've read in all
66 1.1 glass * the consecutive lines from the file with a common join field. Then we
67 1.1 glass * compare the set of lines with an equivalent set from the other file.
68 1.1 glass */
/*
 * One input line together with its split-out fields.  slurp() fills this
 * in; the entries of `fields' point into the `line' buffer.
 */
typedef struct {
	char	 *line;		/* NUL-terminated text of the line */
	u_long	  linealloc;	/* bytes allocated for `line' */
	char	**fields;	/* start of each field within `line' */
	u_long	  fieldcnt;	/* number of entries used in `fields' */
	u_long	  fieldalloc;	/* number of entries allocated in `fields' */
} LINE;

/*
 * A line with no fields at all.  It is handed to outfield() when an output
 * list entry refers to the file that has no line to contribute.
 */
LINE noline = { "", 0, NULL, 0, 0 };
78 1.21 jonb
79 1.1 glass typedef struct {
80 1.1 glass FILE *fp; /* file descriptor */
81 1.1 glass u_long joinf; /* join field (-1, -2, -j) */
82 1.1 glass int unpair; /* output unpairable lines (-a) */
83 1.1 glass int number; /* 1 for file 1, 2 for file 2 */
84 1.1 glass
85 1.1 glass LINE *set; /* set of lines with same field */
86 1.1 glass u_long pushback; /* line on the stack */
87 1.1 glass u_long setcnt; /* set count */
88 1.1 glass u_long setalloc; /* set allocated count */
89 1.1 glass } INPUT;
90 1.10 tls INPUT input1 = { NULL, 0, 0, 1, NULL, -1, 0, 0, },
91 1.20 jonb input2 = { NULL, 0, 0, 2, NULL, -1, 0, 0, };
92 1.1 glass
/* One entry of the -o output list: which file, and which field of it. */
typedef struct {
	u_long	fileno;		/* file number, 1 or 2 */
	u_long	fieldno;	/* zero-based field number */
} OLIST;

OLIST	*olist;			/* output field list, NULL if -o not given */
u_long	 olistcnt;		/* entries used in `olist' */
u_long	 olistalloc;		/* entries allocated in `olist' */
100 1.1 glass
/* Show lines with matched join fields; cleared by -v. */
int	 joinout = 1;

/* Non-zero once a field has been written on the current output line. */
int	 needsep;

/* Treat a run of delimiters as a single one; cleared by -t. */
int	 spans = 1;

/* Replacement string for missing fields (-e), NULL if not given. */
char	*empty;

/*
 * Input delimiter characters (-t).  The first character is also what
 * outfield() writes between output fields.
 */
char	*tabchar = " \t";
106 1.1 glass
107 1.26 perry int cmp(LINE *, u_long, LINE *, u_long);
108 1.26 perry void enomem(void);
109 1.26 perry void fieldarg(char *);
110 1.26 perry void joinlines(INPUT *, INPUT *);
111 1.26 perry int main(int, char **);
112 1.26 perry void obsolete(char **);
113 1.26 perry void outfield(LINE *, u_long);
114 1.26 perry void outoneline(INPUT *, LINE *);
115 1.26 perry void outtwoline(INPUT *, LINE *, INPUT *, LINE *);
116 1.26 perry void slurp(INPUT *);
117 1.26 perry void usage(void);
118 1.1 glass
119 1.1 glass int
120 1.26 perry main(int argc, char *argv[])
121 1.1 glass {
122 1.11 lukem INPUT *F1, *F2;
123 1.1 glass int aflag, ch, cval, vflag;
124 1.1 glass char *end;
125 1.1 glass
126 1.1 glass F1 = &input1;
127 1.1 glass F2 = &input2;
128 1.1 glass
129 1.1 glass aflag = vflag = 0;
130 1.1 glass obsolete(argv);
131 1.11 lukem while ((ch = getopt(argc, argv, "\01a:e:j:1:2:o:t:v:")) != -1) {
132 1.1 glass switch (ch) {
133 1.10 tls case '\01':
134 1.1 glass aflag = 1;
135 1.1 glass F1->unpair = F2->unpair = 1;
136 1.1 glass break;
137 1.1 glass case '1':
138 1.11 lukem if ((F1->joinf = strtol(optarg, &end, 10)) < 1) {
139 1.11 lukem warnx("-1 option field number less than 1");
140 1.11 lukem usage();
141 1.11 lukem }
142 1.11 lukem if (*end) {
143 1.11 lukem warnx("illegal field number -- %s", optarg);
144 1.11 lukem usage();
145 1.11 lukem }
146 1.1 glass --F1->joinf;
147 1.1 glass break;
148 1.1 glass case '2':
149 1.11 lukem if ((F2->joinf = strtol(optarg, &end, 10)) < 1) {
150 1.11 lukem warnx("-2 option field number less than 1");
151 1.11 lukem usage();
152 1.11 lukem }
153 1.11 lukem if (*end) {
154 1.11 lukem warnx("illegal field number -- %s", optarg);
155 1.11 lukem usage();
156 1.11 lukem }
157 1.1 glass --F2->joinf;
158 1.1 glass break;
159 1.1 glass case 'a':
160 1.1 glass aflag = 1;
161 1.1 glass switch(strtol(optarg, &end, 10)) {
162 1.1 glass case 1:
163 1.1 glass F1->unpair = 1;
164 1.1 glass break;
165 1.1 glass case 2:
166 1.1 glass F2->unpair = 1;
167 1.1 glass break;
168 1.1 glass default:
169 1.11 lukem warnx("-a option file number not 1 or 2");
170 1.11 lukem usage();
171 1.1 glass break;
172 1.1 glass }
173 1.11 lukem if (*end) {
174 1.11 lukem warnx("illegal file number -- %s", optarg);
175 1.11 lukem usage();
176 1.11 lukem }
177 1.1 glass break;
178 1.1 glass case 'e':
179 1.1 glass empty = optarg;
180 1.1 glass break;
181 1.1 glass case 'j':
182 1.1 glass if ((F1->joinf = F2->joinf =
183 1.11 lukem strtol(optarg, &end, 10)) < 1) {
184 1.11 lukem warnx("-j option field number less than 1");
185 1.11 lukem usage();
186 1.11 lukem }
187 1.11 lukem if (*end) {
188 1.11 lukem warnx("illegal field number -- %s", optarg);
189 1.11 lukem usage();
190 1.11 lukem }
191 1.1 glass --F1->joinf;
192 1.1 glass --F2->joinf;
193 1.1 glass break;
194 1.1 glass case 'o':
195 1.1 glass fieldarg(optarg);
196 1.1 glass break;
197 1.1 glass case 't':
198 1.1 glass spans = 0;
199 1.11 lukem if (strlen(tabchar = optarg) != 1) {
200 1.11 lukem warnx("illegal tab character specification");
201 1.11 lukem usage();
202 1.11 lukem }
203 1.1 glass break;
204 1.1 glass case 'v':
205 1.1 glass vflag = 1;
206 1.1 glass joinout = 0;
207 1.10 tls switch(strtol(optarg, &end, 10)) {
208 1.1 glass case 1:
209 1.1 glass F1->unpair = 1;
210 1.1 glass break;
211 1.1 glass case 2:
212 1.1 glass F2->unpair = 1;
213 1.1 glass break;
214 1.1 glass default:
215 1.11 lukem warnx("-v option file number not 1 or 2");
216 1.11 lukem usage();
217 1.1 glass break;
218 1.1 glass }
219 1.11 lukem if (*end) {
220 1.11 lukem warnx("illegal file number -- %s", optarg);
221 1.11 lukem usage();
222 1.11 lukem }
223 1.1 glass break;
224 1.1 glass case '?':
225 1.1 glass default:
226 1.1 glass usage();
227 1.1 glass }
228 1.1 glass }
229 1.1 glass argc -= optind;
230 1.1 glass argv += optind;
231 1.1 glass
232 1.1 glass if (aflag && vflag)
233 1.11 lukem errx(1, "-a and -v options mutually exclusive");
234 1.1 glass
235 1.1 glass if (argc != 2)
236 1.1 glass usage();
237 1.1 glass
238 1.1 glass /* Open the files; "-" means stdin. */
239 1.1 glass if (!strcmp(*argv, "-"))
240 1.1 glass F1->fp = stdin;
241 1.1 glass else if ((F1->fp = fopen(*argv, "r")) == NULL)
242 1.11 lukem err(1, "%s", *argv);
243 1.1 glass ++argv;
244 1.1 glass if (!strcmp(*argv, "-"))
245 1.1 glass F2->fp = stdin;
246 1.1 glass else if ((F2->fp = fopen(*argv, "r")) == NULL)
247 1.11 lukem err(1, "%s", *argv);
248 1.1 glass if (F1->fp == stdin && F2->fp == stdin)
249 1.11 lukem errx(1, "only one input file may be stdin");
250 1.1 glass
251 1.1 glass slurp(F1);
252 1.1 glass slurp(F2);
253 1.1 glass while (F1->setcnt && F2->setcnt) {
254 1.1 glass cval = cmp(F1->set, F1->joinf, F2->set, F2->joinf);
255 1.1 glass if (cval == 0) {
256 1.1 glass /* Oh joy, oh rapture, oh beauty divine! */
257 1.1 glass if (joinout)
258 1.1 glass joinlines(F1, F2);
259 1.1 glass slurp(F1);
260 1.1 glass slurp(F2);
261 1.1 glass } else if (cval < 0) {
262 1.1 glass /* File 1 takes the lead... */
263 1.1 glass if (F1->unpair)
264 1.1 glass joinlines(F1, NULL);
265 1.1 glass slurp(F1);
266 1.1 glass } else {
267 1.1 glass /* File 2 takes the lead... */
268 1.1 glass if (F2->unpair)
269 1.1 glass joinlines(F2, NULL);
270 1.1 glass slurp(F2);
271 1.1 glass }
272 1.1 glass }
273 1.1 glass
274 1.1 glass /*
275 1.1 glass * Now that one of the files is used up, optionally output any
276 1.1 glass * remaining lines from the other file.
277 1.1 glass */
278 1.1 glass if (F1->unpair)
279 1.1 glass while (F1->setcnt) {
280 1.1 glass joinlines(F1, NULL);
281 1.1 glass slurp(F1);
282 1.1 glass }
283 1.28 hubertf if (F1->fp != stdin)
284 1.28 hubertf fclose(F1->fp);
285 1.28 hubertf
286 1.1 glass if (F2->unpair)
287 1.1 glass while (F2->setcnt) {
288 1.1 glass joinlines(F2, NULL);
289 1.1 glass slurp(F2);
290 1.1 glass }
291 1.28 hubertf if (F2->fp != stdin)
292 1.28 hubertf fclose(F2->fp);
293 1.28 hubertf
294 1.28 hubertf return 0;
295 1.1 glass }
296 1.1 glass
297 1.1 glass void
298 1.26 perry slurp(INPUT *F)
299 1.1 glass {
300 1.17 mycroft LINE *lp;
301 1.10 tls LINE tmp;
302 1.24 itojun LINE *nline;
303 1.1 glass size_t len;
304 1.1 glass int cnt;
305 1.5 cgd char *bp, *fieldp;
306 1.24 itojun u_long nsize;
307 1.1 glass
308 1.1 glass /*
309 1.1 glass * Read all of the lines from an input file that have the same
310 1.1 glass * join field.
311 1.1 glass */
312 1.17 mycroft for (F->setcnt = 0;; ++F->setcnt) {
313 1.1 glass /*
314 1.1 glass * If we're out of space to hold line structures, allocate
315 1.1 glass * more. Initialize the structure so that we know that this
316 1.1 glass * is new space.
317 1.1 glass */
318 1.1 glass if (F->setcnt == F->setalloc) {
319 1.1 glass cnt = F->setalloc;
320 1.17 mycroft if (F->setalloc == 0)
321 1.24 itojun nsize = 64;
322 1.17 mycroft else
323 1.24 itojun nsize = F->setalloc << 1;
324 1.24 itojun if ((nline = realloc(F->set,
325 1.24 itojun nsize * sizeof(LINE))) == NULL)
326 1.10 tls enomem();
327 1.24 itojun F->set = nline;
328 1.24 itojun F->setalloc = nsize;
329 1.17 mycroft memset(F->set + cnt, 0,
330 1.17 mycroft (F->setalloc - cnt) * sizeof(LINE));
331 1.1 glass }
332 1.1 glass
333 1.1 glass /*
334 1.1 glass * Get any pushed back line, else get the next line. Allocate
335 1.1 glass * space as necessary. If taking the line from the stack swap
336 1.10 tls * the two structures so that we don't lose the allocated space.
337 1.10 tls * This could be avoided by doing another level of indirection,
338 1.10 tls * but it's probably okay as is.
339 1.1 glass */
340 1.1 glass lp = &F->set[F->setcnt];
341 1.10 tls if (F->pushback != -1) {
342 1.1 glass tmp = F->set[F->setcnt];
343 1.1 glass F->set[F->setcnt] = F->set[F->pushback];
344 1.1 glass F->set[F->pushback] = tmp;
345 1.10 tls F->pushback = -1;
346 1.1 glass continue;
347 1.1 glass }
348 1.6 cgd if ((bp = fgetln(F->fp, &len)) == NULL)
349 1.1 glass return;
350 1.5 cgd if (lp->linealloc <= len + 1) {
351 1.24 itojun char *n;
352 1.24 itojun
353 1.4 cgd if (lp->linealloc == 0)
354 1.24 itojun nsize = 128;
355 1.24 itojun else
356 1.24 itojun nsize = lp->linealloc;
357 1.24 itojun while (nsize <= len + 1)
358 1.24 itojun nsize <<= 1;
359 1.24 itojun if ((n = realloc(lp->line,
360 1.24 itojun nsize * sizeof(char))) == NULL)
361 1.10 tls enomem();
362 1.24 itojun lp->line = n;
363 1.24 itojun lp->linealloc = nsize;
364 1.1 glass }
365 1.16 tron memmove(lp->line, bp, len);
366 1.1 glass
367 1.5 cgd /* Replace trailing newline, if it exists. */
368 1.5 cgd if (bp[len - 1] == '\n')
369 1.5 cgd lp->line[len - 1] = '\0';
370 1.5 cgd else
371 1.5 cgd lp->line[len] = '\0';
372 1.5 cgd bp = lp->line;
373 1.5 cgd
374 1.1 glass /* Split the line into fields, allocate space as necessary. */
375 1.1 glass lp->fieldcnt = 0;
376 1.5 cgd while ((fieldp = strsep(&bp, tabchar)) != NULL) {
377 1.1 glass if (spans && *fieldp == '\0')
378 1.1 glass continue;
379 1.1 glass if (lp->fieldcnt == lp->fieldalloc) {
380 1.24 itojun char **n;
381 1.24 itojun
382 1.17 mycroft if (lp->fieldalloc == 0)
383 1.24 itojun nsize = 16;
384 1.17 mycroft else
385 1.24 itojun nsize = lp->fieldalloc << 1;
386 1.24 itojun if ((n = realloc(lp->fields,
387 1.24 itojun nsize * sizeof(char *))) == NULL)
388 1.10 tls enomem();
389 1.24 itojun lp->fields = n;
390 1.24 itojun lp->fieldalloc = nsize;
391 1.1 glass }
392 1.1 glass lp->fields[lp->fieldcnt++] = fieldp;
393 1.1 glass }
394 1.1 glass
395 1.1 glass /* See if the join field value has changed. */
396 1.17 mycroft if (F->setcnt && cmp(lp, F->joinf, lp - 1, F->joinf)) {
397 1.1 glass F->pushback = F->setcnt;
398 1.1 glass break;
399 1.1 glass }
400 1.1 glass }
401 1.1 glass }
402 1.1 glass
403 1.1 glass int
404 1.26 perry cmp(LINE *lp1, u_long fieldno1, LINE *lp2, u_long fieldno2)
405 1.1 glass {
406 1.7 mycroft
407 1.7 mycroft if (lp1->fieldcnt <= fieldno1)
408 1.18 mycroft return (lp2->fieldcnt <= fieldno2 ? 0 : 1);
409 1.7 mycroft if (lp2->fieldcnt <= fieldno2)
410 1.1 glass return (-1);
411 1.1 glass return (strcmp(lp1->fields[fieldno1], lp2->fields[fieldno2]));
412 1.1 glass }
413 1.1 glass
414 1.1 glass void
415 1.26 perry joinlines(INPUT *F1, INPUT *F2)
416 1.1 glass {
417 1.11 lukem int cnt1, cnt2;
418 1.1 glass
419 1.1 glass /*
420 1.1 glass * Output the results of a join comparison. The output may be from
421 1.1 glass * either file 1 or file 2 (in which case the first argument is the
422 1.1 glass * file from which to output) or from both.
423 1.1 glass */
424 1.1 glass if (F2 == NULL) {
425 1.1 glass for (cnt1 = 0; cnt1 < F1->setcnt; ++cnt1)
426 1.1 glass outoneline(F1, &F1->set[cnt1]);
427 1.1 glass return;
428 1.1 glass }
429 1.1 glass for (cnt1 = 0; cnt1 < F1->setcnt; ++cnt1)
430 1.1 glass for (cnt2 = 0; cnt2 < F2->setcnt; ++cnt2)
431 1.1 glass outtwoline(F1, &F1->set[cnt1], F2, &F2->set[cnt2]);
432 1.1 glass }
433 1.1 glass
434 1.1 glass void
435 1.26 perry outoneline(INPUT *F, LINE *lp)
436 1.1 glass {
437 1.11 lukem int cnt;
438 1.1 glass
439 1.1 glass /*
440 1.1 glass * Output a single line from one of the files, according to the
441 1.1 glass * join rules. This happens when we are writing unmatched single
442 1.1 glass * lines. Output empty fields in the right places.
443 1.1 glass */
444 1.1 glass if (olist)
445 1.1 glass for (cnt = 0; cnt < olistcnt; ++cnt) {
446 1.10 tls if (olist[cnt].fileno == F->number)
447 1.10 tls outfield(lp, olist[cnt].fieldno);
448 1.21 jonb else
449 1.21 jonb outfield(&noline, 1);
450 1.1 glass }
451 1.1 glass else
452 1.1 glass for (cnt = 0; cnt < lp->fieldcnt; ++cnt)
453 1.10 tls outfield(lp, cnt);
454 1.1 glass (void)printf("\n");
455 1.1 glass if (ferror(stdout))
456 1.11 lukem err(1, "stdout");
457 1.1 glass needsep = 0;
458 1.1 glass }
459 1.1 glass
460 1.1 glass void
461 1.26 perry outtwoline(INPUT *F1, LINE *lp1, INPUT *F2, LINE *lp2)
462 1.1 glass {
463 1.11 lukem int cnt;
464 1.1 glass
465 1.1 glass /* Output a pair of lines according to the join list (if any). */
466 1.15 christos if (olist) {
467 1.1 glass for (cnt = 0; cnt < olistcnt; ++cnt)
468 1.10 tls if (olist[cnt].fileno == 1)
469 1.10 tls outfield(lp1, olist[cnt].fieldno);
470 1.10 tls else /* if (olist[cnt].fileno == 2) */
471 1.10 tls outfield(lp2, olist[cnt].fieldno);
472 1.15 christos } else {
473 1.1 glass /*
474 1.1 glass * Output the join field, then the remaining fields from F1
475 1.1 glass * and F2.
476 1.1 glass */
477 1.10 tls outfield(lp1, F1->joinf);
478 1.1 glass for (cnt = 0; cnt < lp1->fieldcnt; ++cnt)
479 1.1 glass if (F1->joinf != cnt)
480 1.10 tls outfield(lp1, cnt);
481 1.1 glass for (cnt = 0; cnt < lp2->fieldcnt; ++cnt)
482 1.1 glass if (F2->joinf != cnt)
483 1.10 tls outfield(lp2, cnt);
484 1.1 glass }
485 1.1 glass (void)printf("\n");
486 1.1 glass if (ferror(stdout))
487 1.11 lukem err(1, "stdout");
488 1.1 glass needsep = 0;
489 1.1 glass }
490 1.1 glass
491 1.1 glass void
492 1.26 perry outfield(LINE *lp, u_long fieldno)
493 1.1 glass {
494 1.1 glass if (needsep++)
495 1.1 glass (void)printf("%c", *tabchar);
496 1.13 ross if (!ferror(stdout)) {
497 1.19 mycroft if (lp->fieldcnt <= fieldno) {
498 1.1 glass if (empty != NULL)
499 1.1 glass (void)printf("%s", empty);
500 1.1 glass } else {
501 1.1 glass if (*lp->fields[fieldno] == '\0')
502 1.1 glass return;
503 1.1 glass (void)printf("%s", lp->fields[fieldno]);
504 1.1 glass }
505 1.13 ross }
506 1.1 glass if (ferror(stdout))
507 1.11 lukem err(1, "stdout");
508 1.1 glass }
509 1.1 glass
510 1.1 glass /*
511 1.1 glass * Convert an output list argument "2.1, 1.3, 2.4" into an array of output
512 1.1 glass * fields.
513 1.1 glass */
514 1.1 glass void
515 1.26 perry fieldarg(char *option)
516 1.1 glass {
517 1.1 glass u_long fieldno;
518 1.1 glass char *end, *token;
519 1.24 itojun OLIST *n;
520 1.1 glass
521 1.18 mycroft while ((token = strsep(&option, ", \t")) != NULL) {
522 1.1 glass if (*token == '\0')
523 1.1 glass continue;
524 1.11 lukem if ((token[0] != '1' && token[0] != '2') || token[1] != '.')
525 1.11 lukem errx(1, "malformed -o option field");
526 1.1 glass fieldno = strtol(token + 2, &end, 10);
527 1.1 glass if (*end)
528 1.11 lukem errx(1, "malformed -o option field");
529 1.1 glass if (fieldno == 0)
530 1.11 lukem errx(1, "field numbers are 1 based");
531 1.1 glass if (olistcnt == olistalloc) {
532 1.24 itojun if ((n = realloc(olist,
533 1.24 itojun (olistalloc + 50) * sizeof(OLIST))) == NULL)
534 1.24 itojun enomem();
535 1.24 itojun olist = n;
536 1.1 glass olistalloc += 50;
537 1.1 glass }
538 1.10 tls olist[olistcnt].fileno = token[0] - '0';
539 1.1 glass olist[olistcnt].fieldno = fieldno - 1;
540 1.1 glass ++olistcnt;
541 1.1 glass }
542 1.1 glass }
543 1.1 glass
/*
 * Rewrite historic join(1) option syntax in argv, in place, into a form
 * that getopt(3) can parse.  Processing stops at the first word that
 * starts with "--".
 *
 * Only words that start with '-' are examined; other words are left
 * untouched, so a file operand whose second character happens to be 'a',
 * 'j' or 'o' is never modified.  Replacement words created for "-o" are
 * allocated with malloc() and are never freed.  Exits on an unrecognised
 * "-j" form or when memory runs out.
 */
void
obsolete(char **argv)
{
	size_t len;
	char **p, *ap, *t;

	while ((ap = *++argv) != NULL) {
		/* Return if "--". */
		if (ap[0] == '-' && ap[1] == '-')
			return;
		/* Skip anything that is not an option word. */
		if (ap[0] != '-')
			continue;
		switch (ap[1]) {
		case 'a':
			/*
			 * The original join allowed "-a", which meant the
			 * same as -a1 plus -a2.  POSIX 1003.2, Draft 11.2
			 * only specifies this as "-a 1" and "-a 2", so we
			 * have to use another option flag, one that is
			 * unlikely to ever be used or accidentally entered
			 * on the command line.  (Well, we could reallocate
			 * the argv array, but that hardly seems worthwhile.)
			 */
			if (ap[2] == '\0')
				ap[1] = '\01';
			break;
		case 'j':
			/*
			 * The original join allowed "-j[12] arg" and "-j arg".
			 * Convert the former to "-[12] arg".  Don't convert
			 * the latter since getopt(3) can handle it.
			 */
			switch (ap[2]) {
			case '1':
			case '2':
				if (ap[3] != '\0')
					errx(1, "illegal option -- %s", ap);
				ap[1] = ap[2];
				ap[2] = '\0';
				break;
			case '\0':
				break;
			default:
				errx(1, "illegal option -- %s", ap);
			}
			break;
		case 'o':
			/*
			 * The original join allowed "-o arg arg".  Convert to
			 * "-o arg -o arg".
			 */
			if (ap[2] != '\0')
				break;
			/*
			 * "-o" is the last word: there is no list at all, and
			 * argv + 2 would be past the terminating NULL.
			 */
			if (argv[1] == NULL)
				break;
			/* argv[1] is the first list; look at what follows. */
			for (p = argv + 2; *p != NULL; ++p) {
				if ((p[0][0] != '1' && p[0][0] != '2') ||
				    p[0][1] != '.')
					break;
				len = strlen(*p);
				if (len - 2 != strspn(*p + 2, "0123456789"))
					break;
				/* "-o" + the word + its terminating NUL. */
				if ((t = malloc(len + 3)) == NULL)
					enomem();
				t[0] = '-';
				t[1] = 'o';
				memmove(t + 2, *p, len + 1);
				*p = t;
			}
			/* Resume the outer scan at the word that stopped us. */
			argv = p - 1;
			break;
		default:
			break;
		}
	}
}
620 1.1 glass
/*
 * Report that memory could not be allocated and exit with status 1.
 * Never returns.
 */
void
enomem(void)
{

	errx(1, "no memory");
}
626 1.10 tls
/*
 * Write the command synopsis to stderr and exit with status 1.
 * Never returns.
 */
void
usage(void)
{
	const char *prog;

	prog = getprogname();
	(void)fprintf(stderr,
	    "usage: %s [-a fileno | -v fileno] [-e string] [-j fileno field]\n"
	    " [-o list] [-t char] [-1 field] [-2 field] file1 file2\n",
	    prog);
	exit(1);
}
636