join.c revision 1.23 1 1.23 agc /* $NetBSD: join.c,v 1.23 2003/08/07 11:14:10 agc Exp $ */
2 1.8 tls
3 1.1 glass /*-
4 1.10 tls * Copyright (c) 1991 The Regents of the University of California.
5 1.10 tls * All rights reserved.
6 1.1 glass *
7 1.1 glass * This code is derived from software contributed to Berkeley by
8 1.1 glass * Steve Hayman of Indiana University, Michiro Hikida and David
9 1.1 glass * Goodenough.
10 1.1 glass *
11 1.1 glass * Redistribution and use in source and binary forms, with or without
12 1.1 glass * modification, are permitted provided that the following conditions
13 1.1 glass * are met:
14 1.1 glass * 1. Redistributions of source code must retain the above copyright
15 1.1 glass * notice, this list of conditions and the following disclaimer.
16 1.1 glass * 2. Redistributions in binary form must reproduce the above copyright
17 1.1 glass * notice, this list of conditions and the following disclaimer in the
18 1.1 glass * documentation and/or other materials provided with the distribution.
19 1.23 agc * 3. Neither the name of the University nor the names of its contributors
20 1.1 glass * may be used to endorse or promote products derived from this software
21 1.1 glass * without specific prior written permission.
22 1.1 glass *
23 1.1 glass * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24 1.1 glass * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 1.1 glass * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 1.1 glass * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27 1.1 glass * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 1.1 glass * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 1.1 glass * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 1.1 glass * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 1.1 glass * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 1.1 glass * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 1.1 glass * SUCH DAMAGE.
34 1.1 glass */
35 1.1 glass
36 1.11 lukem #include <sys/cdefs.h>
37 1.1 glass #ifndef lint
38 1.11 lukem __COPYRIGHT(
39 1.11 lukem "@(#) Copyright (c) 1991 The Regents of the University of California.\n\
40 1.11 lukem All rights reserved.\n");
41 1.1 glass #endif /* not lint */
42 1.1 glass
43 1.1 glass #ifndef lint
44 1.11 lukem #if 0
45 1.11 lukem static char sccsid[] = "from: @(#)join.c 5.1 (Berkeley) 11/18/91";
46 1.11 lukem #else
47 1.23 agc __RCSID("$NetBSD: join.c,v 1.23 2003/08/07 11:14:10 agc Exp $");
48 1.11 lukem #endif
49 1.1 glass #endif /* not lint */
50 1.1 glass
51 1.1 glass #include <sys/types.h>
52 1.11 lukem #include <ctype.h>
53 1.11 lukem #include <err.h>
54 1.11 lukem #include <errno.h>
55 1.3 jtc #include <stdio.h>
56 1.1 glass #include <stdlib.h>
57 1.1 glass #include <string.h>
58 1.12 perry #include <unistd.h>
59 1.1 glass
60 1.1 glass /*
61 1.1 glass * There's a structure per input file which encapsulates the state of the
62 1.1 glass * file. We repeatedly read lines from each file until we've read in all
63 1.1 glass * the consecutive lines from the file with a common join field. Then we
64 1.1 glass * compare the set of lines with an equivalent set from the other file.
65 1.1 glass */
66 1.1 glass typedef struct {
67 1.1 glass char *line; /* line */
68 1.1 glass u_long linealloc; /* line allocated count */
69 1.1 glass char **fields; /* line field(s) */
70 1.1 glass u_long fieldcnt; /* line field(s) count */
71 1.1 glass u_long fieldalloc; /* line field(s) allocated count */
72 1.1 glass } LINE;
73 1.1 glass
74 1.21 jonb LINE noline = {"", 0, 0, 0, 0}; /* arg for outfield if no line to output */
75 1.21 jonb
76 1.1 glass typedef struct {
77 1.1 glass FILE *fp; /* file descriptor */
78 1.1 glass u_long joinf; /* join field (-1, -2, -j) */
79 1.1 glass int unpair; /* output unpairable lines (-a) */
80 1.1 glass int number; /* 1 for file 1, 2 for file 2 */
81 1.1 glass
82 1.1 glass LINE *set; /* set of lines with same field */
83 1.1 glass u_long pushback; /* line on the stack */
84 1.1 glass u_long setcnt; /* set count */
85 1.1 glass u_long setalloc; /* set allocated count */
86 1.1 glass } INPUT;
87 1.10 tls INPUT input1 = { NULL, 0, 0, 1, NULL, -1, 0, 0, },
88 1.20 jonb input2 = { NULL, 0, 0, 2, NULL, -1, 0, 0, };
89 1.1 glass
90 1.1 glass typedef struct {
91 1.10 tls u_long fileno; /* file number */
92 1.1 glass u_long fieldno; /* field number */
93 1.1 glass } OLIST;
94 1.1 glass OLIST *olist; /* output field list */
95 1.1 glass u_long olistcnt; /* output field list count */
96 1.1 glass u_long olistalloc; /* output field allocated count */
97 1.1 glass
int	 joinout = 1;		/* show lines with matched join fields (-v clears) */
int	 needsep;		/* a separator is needed before the next field */
int	 spans = 1;		/* span multiple delimiters (-t clears) */
char	*empty;			/* empty field replacement string (-e) */
char	*tabchar = " \t";	/* delimiter characters (-t) */
103 1.1 glass
104 1.1 glass int cmp __P((LINE *, u_long, LINE *, u_long));
105 1.10 tls void enomem __P((void));
106 1.1 glass void fieldarg __P((char *));
107 1.1 glass void joinlines __P((INPUT *, INPUT *));
108 1.11 lukem int main __P((int, char **));
109 1.1 glass void obsolete __P((char **));
110 1.10 tls void outfield __P((LINE *, u_long));
111 1.1 glass void outoneline __P((INPUT *, LINE *));
112 1.1 glass void outtwoline __P((INPUT *, LINE *, INPUT *, LINE *));
113 1.1 glass void slurp __P((INPUT *));
114 1.1 glass void usage __P((void));
115 1.1 glass
116 1.1 glass int
117 1.1 glass main(argc, argv)
118 1.1 glass int argc;
119 1.1 glass char *argv[];
120 1.1 glass {
121 1.11 lukem INPUT *F1, *F2;
122 1.1 glass int aflag, ch, cval, vflag;
123 1.1 glass char *end;
124 1.1 glass
125 1.1 glass F1 = &input1;
126 1.1 glass F2 = &input2;
127 1.1 glass
128 1.1 glass aflag = vflag = 0;
129 1.1 glass obsolete(argv);
130 1.11 lukem while ((ch = getopt(argc, argv, "\01a:e:j:1:2:o:t:v:")) != -1) {
131 1.1 glass switch (ch) {
132 1.10 tls case '\01':
133 1.1 glass aflag = 1;
134 1.1 glass F1->unpair = F2->unpair = 1;
135 1.1 glass break;
136 1.1 glass case '1':
137 1.11 lukem if ((F1->joinf = strtol(optarg, &end, 10)) < 1) {
138 1.11 lukem warnx("-1 option field number less than 1");
139 1.11 lukem usage();
140 1.11 lukem }
141 1.11 lukem if (*end) {
142 1.11 lukem warnx("illegal field number -- %s", optarg);
143 1.11 lukem usage();
144 1.11 lukem }
145 1.1 glass --F1->joinf;
146 1.1 glass break;
147 1.1 glass case '2':
148 1.11 lukem if ((F2->joinf = strtol(optarg, &end, 10)) < 1) {
149 1.11 lukem warnx("-2 option field number less than 1");
150 1.11 lukem usage();
151 1.11 lukem }
152 1.11 lukem if (*end) {
153 1.11 lukem warnx("illegal field number -- %s", optarg);
154 1.11 lukem usage();
155 1.11 lukem }
156 1.1 glass --F2->joinf;
157 1.1 glass break;
158 1.1 glass case 'a':
159 1.1 glass aflag = 1;
160 1.1 glass switch(strtol(optarg, &end, 10)) {
161 1.1 glass case 1:
162 1.1 glass F1->unpair = 1;
163 1.1 glass break;
164 1.1 glass case 2:
165 1.1 glass F2->unpair = 1;
166 1.1 glass break;
167 1.1 glass default:
168 1.11 lukem warnx("-a option file number not 1 or 2");
169 1.11 lukem usage();
170 1.1 glass break;
171 1.1 glass }
172 1.11 lukem if (*end) {
173 1.11 lukem warnx("illegal file number -- %s", optarg);
174 1.11 lukem usage();
175 1.11 lukem }
176 1.1 glass break;
177 1.1 glass case 'e':
178 1.1 glass empty = optarg;
179 1.1 glass break;
180 1.1 glass case 'j':
181 1.1 glass if ((F1->joinf = F2->joinf =
182 1.11 lukem strtol(optarg, &end, 10)) < 1) {
183 1.11 lukem warnx("-j option field number less than 1");
184 1.11 lukem usage();
185 1.11 lukem }
186 1.11 lukem if (*end) {
187 1.11 lukem warnx("illegal field number -- %s", optarg);
188 1.11 lukem usage();
189 1.11 lukem }
190 1.1 glass --F1->joinf;
191 1.1 glass --F2->joinf;
192 1.1 glass break;
193 1.1 glass case 'o':
194 1.1 glass fieldarg(optarg);
195 1.1 glass break;
196 1.1 glass case 't':
197 1.1 glass spans = 0;
198 1.11 lukem if (strlen(tabchar = optarg) != 1) {
199 1.11 lukem warnx("illegal tab character specification");
200 1.11 lukem usage();
201 1.11 lukem }
202 1.1 glass break;
203 1.1 glass case 'v':
204 1.1 glass vflag = 1;
205 1.1 glass joinout = 0;
206 1.10 tls switch(strtol(optarg, &end, 10)) {
207 1.1 glass case 1:
208 1.1 glass F1->unpair = 1;
209 1.1 glass break;
210 1.1 glass case 2:
211 1.1 glass F2->unpair = 1;
212 1.1 glass break;
213 1.1 glass default:
214 1.11 lukem warnx("-v option file number not 1 or 2");
215 1.11 lukem usage();
216 1.1 glass break;
217 1.1 glass }
218 1.11 lukem if (*end) {
219 1.11 lukem warnx("illegal file number -- %s", optarg);
220 1.11 lukem usage();
221 1.11 lukem }
222 1.1 glass break;
223 1.1 glass case '?':
224 1.1 glass default:
225 1.1 glass usage();
226 1.1 glass }
227 1.1 glass }
228 1.1 glass argc -= optind;
229 1.1 glass argv += optind;
230 1.1 glass
231 1.1 glass if (aflag && vflag)
232 1.11 lukem errx(1, "-a and -v options mutually exclusive");
233 1.1 glass
234 1.1 glass if (argc != 2)
235 1.1 glass usage();
236 1.1 glass
237 1.1 glass /* Open the files; "-" means stdin. */
238 1.1 glass if (!strcmp(*argv, "-"))
239 1.1 glass F1->fp = stdin;
240 1.1 glass else if ((F1->fp = fopen(*argv, "r")) == NULL)
241 1.11 lukem err(1, "%s", *argv);
242 1.1 glass ++argv;
243 1.1 glass if (!strcmp(*argv, "-"))
244 1.1 glass F2->fp = stdin;
245 1.1 glass else if ((F2->fp = fopen(*argv, "r")) == NULL)
246 1.11 lukem err(1, "%s", *argv);
247 1.1 glass if (F1->fp == stdin && F2->fp == stdin)
248 1.11 lukem errx(1, "only one input file may be stdin");
249 1.1 glass
250 1.1 glass slurp(F1);
251 1.1 glass slurp(F2);
252 1.1 glass while (F1->setcnt && F2->setcnt) {
253 1.1 glass cval = cmp(F1->set, F1->joinf, F2->set, F2->joinf);
254 1.1 glass if (cval == 0) {
255 1.1 glass /* Oh joy, oh rapture, oh beauty divine! */
256 1.1 glass if (joinout)
257 1.1 glass joinlines(F1, F2);
258 1.1 glass slurp(F1);
259 1.1 glass slurp(F2);
260 1.1 glass } else if (cval < 0) {
261 1.1 glass /* File 1 takes the lead... */
262 1.1 glass if (F1->unpair)
263 1.1 glass joinlines(F1, NULL);
264 1.1 glass slurp(F1);
265 1.1 glass } else {
266 1.1 glass /* File 2 takes the lead... */
267 1.1 glass if (F2->unpair)
268 1.1 glass joinlines(F2, NULL);
269 1.1 glass slurp(F2);
270 1.1 glass }
271 1.1 glass }
272 1.1 glass
273 1.1 glass /*
274 1.1 glass * Now that one of the files is used up, optionally output any
275 1.1 glass * remaining lines from the other file.
276 1.1 glass */
277 1.1 glass if (F1->unpair)
278 1.1 glass while (F1->setcnt) {
279 1.1 glass joinlines(F1, NULL);
280 1.1 glass slurp(F1);
281 1.1 glass }
282 1.1 glass if (F2->unpair)
283 1.1 glass while (F2->setcnt) {
284 1.1 glass joinlines(F2, NULL);
285 1.1 glass slurp(F2);
286 1.1 glass }
287 1.1 glass exit(0);
288 1.1 glass }
289 1.1 glass
290 1.1 glass void
291 1.1 glass slurp(F)
292 1.1 glass INPUT *F;
293 1.1 glass {
294 1.17 mycroft LINE *lp;
295 1.10 tls LINE tmp;
296 1.1 glass size_t len;
297 1.1 glass int cnt;
298 1.5 cgd char *bp, *fieldp;
299 1.1 glass
300 1.1 glass /*
301 1.1 glass * Read all of the lines from an input file that have the same
302 1.1 glass * join field.
303 1.1 glass */
304 1.17 mycroft for (F->setcnt = 0;; ++F->setcnt) {
305 1.1 glass /*
306 1.1 glass * If we're out of space to hold line structures, allocate
307 1.1 glass * more. Initialize the structure so that we know that this
308 1.1 glass * is new space.
309 1.1 glass */
310 1.1 glass if (F->setcnt == F->setalloc) {
311 1.1 glass cnt = F->setalloc;
312 1.17 mycroft if (F->setalloc == 0)
313 1.17 mycroft F->setalloc = 64;
314 1.17 mycroft else
315 1.17 mycroft F->setalloc <<= 1;
316 1.1 glass if ((F->set = realloc(F->set,
317 1.1 glass F->setalloc * sizeof(LINE))) == NULL)
318 1.10 tls enomem();
319 1.17 mycroft memset(F->set + cnt, 0,
320 1.17 mycroft (F->setalloc - cnt) * sizeof(LINE));
321 1.1 glass }
322 1.1 glass
323 1.1 glass /*
324 1.1 glass * Get any pushed back line, else get the next line. Allocate
325 1.1 glass * space as necessary. If taking the line from the stack swap
326 1.10 tls * the two structures so that we don't lose the allocated space.
327 1.10 tls * This could be avoided by doing another level of indirection,
328 1.10 tls * but it's probably okay as is.
329 1.1 glass */
330 1.1 glass lp = &F->set[F->setcnt];
331 1.10 tls if (F->pushback != -1) {
332 1.1 glass tmp = F->set[F->setcnt];
333 1.1 glass F->set[F->setcnt] = F->set[F->pushback];
334 1.1 glass F->set[F->pushback] = tmp;
335 1.10 tls F->pushback = -1;
336 1.1 glass continue;
337 1.1 glass }
338 1.6 cgd if ((bp = fgetln(F->fp, &len)) == NULL)
339 1.1 glass return;
340 1.5 cgd if (lp->linealloc <= len + 1) {
341 1.4 cgd if (lp->linealloc == 0)
342 1.4 cgd lp->linealloc = 128;
343 1.5 cgd while (lp->linealloc <= len + 1)
344 1.17 mycroft lp->linealloc <<= 1;
345 1.1 glass if ((lp->line = realloc(lp->line,
346 1.1 glass lp->linealloc * sizeof(char))) == NULL)
347 1.10 tls enomem();
348 1.1 glass }
349 1.16 tron memmove(lp->line, bp, len);
350 1.1 glass
351 1.5 cgd /* Replace trailing newline, if it exists. */
352 1.5 cgd if (bp[len - 1] == '\n')
353 1.5 cgd lp->line[len - 1] = '\0';
354 1.5 cgd else
355 1.5 cgd lp->line[len] = '\0';
356 1.5 cgd bp = lp->line;
357 1.5 cgd
358 1.1 glass /* Split the line into fields, allocate space as necessary. */
359 1.1 glass lp->fieldcnt = 0;
360 1.5 cgd while ((fieldp = strsep(&bp, tabchar)) != NULL) {
361 1.1 glass if (spans && *fieldp == '\0')
362 1.1 glass continue;
363 1.1 glass if (lp->fieldcnt == lp->fieldalloc) {
364 1.17 mycroft if (lp->fieldalloc == 0)
365 1.17 mycroft lp->fieldalloc = 16;
366 1.17 mycroft else
367 1.17 mycroft lp->fieldalloc <<= 1;
368 1.1 glass if ((lp->fields = realloc(lp->fields,
369 1.1 glass lp->fieldalloc * sizeof(char *))) == NULL)
370 1.10 tls enomem();
371 1.1 glass }
372 1.1 glass lp->fields[lp->fieldcnt++] = fieldp;
373 1.1 glass }
374 1.1 glass
375 1.1 glass /* See if the join field value has changed. */
376 1.17 mycroft if (F->setcnt && cmp(lp, F->joinf, lp - 1, F->joinf)) {
377 1.1 glass F->pushback = F->setcnt;
378 1.1 glass break;
379 1.1 glass }
380 1.1 glass }
381 1.1 glass }
382 1.1 glass
383 1.1 glass int
384 1.1 glass cmp(lp1, fieldno1, lp2, fieldno2)
385 1.1 glass LINE *lp1, *lp2;
386 1.1 glass u_long fieldno1, fieldno2;
387 1.1 glass {
388 1.7 mycroft
389 1.7 mycroft if (lp1->fieldcnt <= fieldno1)
390 1.18 mycroft return (lp2->fieldcnt <= fieldno2 ? 0 : 1);
391 1.7 mycroft if (lp2->fieldcnt <= fieldno2)
392 1.1 glass return (-1);
393 1.1 glass return (strcmp(lp1->fields[fieldno1], lp2->fields[fieldno2]));
394 1.1 glass }
395 1.1 glass
396 1.1 glass void
397 1.1 glass joinlines(F1, F2)
398 1.11 lukem INPUT *F1, *F2;
399 1.1 glass {
400 1.11 lukem int cnt1, cnt2;
401 1.1 glass
402 1.1 glass /*
403 1.1 glass * Output the results of a join comparison. The output may be from
404 1.1 glass * either file 1 or file 2 (in which case the first argument is the
405 1.1 glass * file from which to output) or from both.
406 1.1 glass */
407 1.1 glass if (F2 == NULL) {
408 1.1 glass for (cnt1 = 0; cnt1 < F1->setcnt; ++cnt1)
409 1.1 glass outoneline(F1, &F1->set[cnt1]);
410 1.1 glass return;
411 1.1 glass }
412 1.1 glass for (cnt1 = 0; cnt1 < F1->setcnt; ++cnt1)
413 1.1 glass for (cnt2 = 0; cnt2 < F2->setcnt; ++cnt2)
414 1.1 glass outtwoline(F1, &F1->set[cnt1], F2, &F2->set[cnt2]);
415 1.1 glass }
416 1.1 glass
417 1.1 glass void
418 1.1 glass outoneline(F, lp)
419 1.1 glass INPUT *F;
420 1.11 lukem LINE *lp;
421 1.1 glass {
422 1.11 lukem int cnt;
423 1.1 glass
424 1.1 glass /*
425 1.1 glass * Output a single line from one of the files, according to the
426 1.1 glass * join rules. This happens when we are writing unmatched single
427 1.1 glass * lines. Output empty fields in the right places.
428 1.1 glass */
429 1.1 glass if (olist)
430 1.1 glass for (cnt = 0; cnt < olistcnt; ++cnt) {
431 1.10 tls if (olist[cnt].fileno == F->number)
432 1.10 tls outfield(lp, olist[cnt].fieldno);
433 1.21 jonb else
434 1.21 jonb outfield(&noline, 1);
435 1.1 glass }
436 1.1 glass else
437 1.1 glass for (cnt = 0; cnt < lp->fieldcnt; ++cnt)
438 1.10 tls outfield(lp, cnt);
439 1.1 glass (void)printf("\n");
440 1.1 glass if (ferror(stdout))
441 1.11 lukem err(1, "stdout");
442 1.1 glass needsep = 0;
443 1.1 glass }
444 1.1 glass
445 1.1 glass void
446 1.1 glass outtwoline(F1, lp1, F2, lp2)
447 1.11 lukem INPUT *F1, *F2;
448 1.11 lukem LINE *lp1, *lp2;
449 1.1 glass {
450 1.11 lukem int cnt;
451 1.1 glass
452 1.1 glass /* Output a pair of lines according to the join list (if any). */
453 1.15 christos if (olist) {
454 1.1 glass for (cnt = 0; cnt < olistcnt; ++cnt)
455 1.10 tls if (olist[cnt].fileno == 1)
456 1.10 tls outfield(lp1, olist[cnt].fieldno);
457 1.10 tls else /* if (olist[cnt].fileno == 2) */
458 1.10 tls outfield(lp2, olist[cnt].fieldno);
459 1.15 christos } else {
460 1.1 glass /*
461 1.1 glass * Output the join field, then the remaining fields from F1
462 1.1 glass * and F2.
463 1.1 glass */
464 1.10 tls outfield(lp1, F1->joinf);
465 1.1 glass for (cnt = 0; cnt < lp1->fieldcnt; ++cnt)
466 1.1 glass if (F1->joinf != cnt)
467 1.10 tls outfield(lp1, cnt);
468 1.1 glass for (cnt = 0; cnt < lp2->fieldcnt; ++cnt)
469 1.1 glass if (F2->joinf != cnt)
470 1.10 tls outfield(lp2, cnt);
471 1.1 glass }
472 1.1 glass (void)printf("\n");
473 1.1 glass if (ferror(stdout))
474 1.11 lukem err(1, "stdout");
475 1.1 glass needsep = 0;
476 1.1 glass }
477 1.1 glass
478 1.1 glass void
479 1.10 tls outfield(lp, fieldno)
480 1.1 glass LINE *lp;
481 1.1 glass u_long fieldno;
482 1.1 glass {
483 1.1 glass if (needsep++)
484 1.1 glass (void)printf("%c", *tabchar);
485 1.13 ross if (!ferror(stdout)) {
486 1.19 mycroft if (lp->fieldcnt <= fieldno) {
487 1.1 glass if (empty != NULL)
488 1.1 glass (void)printf("%s", empty);
489 1.1 glass } else {
490 1.1 glass if (*lp->fields[fieldno] == '\0')
491 1.1 glass return;
492 1.1 glass (void)printf("%s", lp->fields[fieldno]);
493 1.1 glass }
494 1.13 ross }
495 1.1 glass if (ferror(stdout))
496 1.11 lukem err(1, "stdout");
497 1.1 glass }
498 1.1 glass
499 1.1 glass /*
500 1.1 glass * Convert an output list argument "2.1, 1.3, 2.4" into an array of output
501 1.1 glass * fields.
502 1.1 glass */
503 1.1 glass void
504 1.1 glass fieldarg(option)
505 1.1 glass char *option;
506 1.1 glass {
507 1.1 glass u_long fieldno;
508 1.1 glass char *end, *token;
509 1.1 glass
510 1.18 mycroft while ((token = strsep(&option, ", \t")) != NULL) {
511 1.1 glass if (*token == '\0')
512 1.1 glass continue;
513 1.11 lukem if ((token[0] != '1' && token[0] != '2') || token[1] != '.')
514 1.11 lukem errx(1, "malformed -o option field");
515 1.1 glass fieldno = strtol(token + 2, &end, 10);
516 1.1 glass if (*end)
517 1.11 lukem errx(1, "malformed -o option field");
518 1.1 glass if (fieldno == 0)
519 1.11 lukem errx(1, "field numbers are 1 based");
520 1.1 glass if (olistcnt == olistalloc) {
521 1.1 glass olistalloc += 50;
522 1.1 glass if ((olist = realloc(olist,
523 1.1 glass olistalloc * sizeof(OLIST))) == NULL)
524 1.10 tls enomem();
525 1.1 glass }
526 1.10 tls olist[olistcnt].fileno = token[0] - '0';
527 1.1 glass olist[olistcnt].fieldno = fieldno - 1;
528 1.1 glass ++olistcnt;
529 1.1 glass }
530 1.1 glass }
531 1.1 glass
/*
 * Rewrite historical option spellings in argv, in place, into forms that
 * getopt(3) can parse.  Scanning stops at the first word beginning with
 * "--"; words that do not begin with '-' are left untouched.
 */
void
obsolete(argv)
	char **argv;
{
	size_t len;
	char **p, *ap, *t;

	while ((ap = *++argv) != NULL) {
		/* Return if "--". */
		if (ap[0] == '-' && ap[1] == '-')
			return;
		/*
		 * Only option words are candidates for rewriting.  This
		 * also keeps ap[1] from being read past an empty string.
		 */
		if (ap[0] != '-')
			continue;
		switch (ap[1]) {
		case 'a':
			/*
			 * The original join allowed "-a", which meant the
			 * same as -a1 plus -a2.  getopt(3) requires an
			 * argument for -a, so a bare "-a" is turned into
			 * another option flag, one that is unlikely to ever
			 * be used or accidentally entered on the command
			 * line.  "-a 1" and "-a 2" are left alone: there the
			 * next word is the option's argument.
			 */
			if (ap[2] == '\0' && (argv[1] == NULL ||
			    (strcmp(argv[1], "1") != 0 &&
			    strcmp(argv[1], "2") != 0)))
				ap[1] = '\01';
			break;
		case 'j':
			/*
			 * The original join allowed "-j[12] arg" and "-j arg".
			 * Convert the former to "-[12] arg".  Don't convert
			 * the latter since getopt(3) can handle it.
			 */
			switch (ap[2]) {
			case '1':
			case '2':
				if (ap[3] != '\0')
					goto jbad;
				ap[1] = ap[2];
				ap[2] = '\0';
				break;
			case '\0':
				break;
			default:
jbad:				warnx("illegal option -- %s", ap);
				usage();
			}
			break;
		case 'o':
			/*
			 * The original join allowed "-o arg arg".  Convert to
			 * "-o arg -o arg".
			 */
			if (ap[2] != '\0')
				break;
			/*
			 * A trailing "-o" has no list at all; stop here so
			 * the scan below does not start beyond the end of
			 * argv.
			 */
			if (argv[1] == NULL)
				break;
			/* argv[1] is -o's own argument; look at what follows. */
			for (p = argv + 2; *p != NULL; ++p) {
				if ((p[0][0] != '1' && p[0][0] != '2') ||
				    p[0][1] != '.')
					break;
				len = strlen(*p);
				if (len - 2 != strspn(*p + 2, "0123456789"))
					break;
				/* "-o" + the word + NUL. */
				if ((t = malloc(len + 3)) == NULL)
					enomem();
				t[0] = '-';
				t[1] = 'o';
				memmove(t + 2, *p, len + 1);
				*p = t;
			}
			/* Resume the outer scan at the first word not converted. */
			argv = p - 1;
			break;
		}
	}
}
609 1.1 glass
/* Report that memory allocation failed and exit with status 1. */
void
enomem()
{

	errx(1, "no memory");
	/* NOTREACHED */
}
615 1.10 tls
/* Print the usage message on stderr and exit with status 1. */
void
usage()
{
	char *head, *tail;

	head = "usage: join [-a fileno | -v fileno ] [-e string] [-1 field] ";
	tail = "[-2 field]\n [-o list] [-t char] file1 file2";
	(void)fprintf(stderr, "%s%s\n", head, tail);
	exit(1);
}
624