sdiff.c revision 1.3 1 1.3 rillig /* $NetBSD: sdiff.c,v 1.3 2021/08/27 17:38:57 rillig Exp $ */
2 1.1 rmind /* $OpenBSD: sdiff.c,v 1.20 2006/09/19 05:52:23 otto Exp $ */
3 1.1 rmind
4 1.1 rmind /*
5 1.1 rmind * Written by Raymond Lai <ray (at) cyth.net>.
6 1.1 rmind * Public domain.
7 1.1 rmind */
8 1.1 rmind
9 1.1 rmind #include <sys/param.h>
10 1.1 rmind #include <sys/queue.h>
11 1.1 rmind #include <sys/stat.h>
12 1.1 rmind #include <sys/types.h>
13 1.1 rmind #include <sys/wait.h>
14 1.1 rmind
15 1.1 rmind #include <ctype.h>
16 1.1 rmind #include <err.h>
17 1.1 rmind #include <errno.h>
18 1.1 rmind #include <fcntl.h>
19 1.1 rmind #include <getopt.h>
20 1.1 rmind #include <limits.h>
21 1.1 rmind #include <paths.h>
22 1.1 rmind #include <stdio.h>
23 1.1 rmind #include <stdlib.h>
24 1.1 rmind #include <string.h>
25 1.1 rmind #include <unistd.h>
26 1.1 rmind #include <util.h>
27 1.1 rmind
28 1.1 rmind #include "common.h"
29 1.1 rmind #include "extern.h"
30 1.1 rmind
/* Total output width used when -w is not given. */
#define WIDTH 130
/*
 * Smallest total width accepted for -w: one character for each of the
 * two columns plus the three-character gutter between them (space,
 * divider character, space).
 */
#define WIDTH_MIN 5
37 1.1 rmind
/*
 * One row of side-by-side output waiting in the print queue.
 * Either text pointer may be NULL when that side has no line; the
 * strings are released together with the entry by freediff().
 */
struct diffline {
	SIMPLEQ_ENTRY(diffline) diffentries;	/* queue linkage */
	char	*left;		/* text for the left column, or NULL */
	char	 div;		/* divider character printed between columns */
	char	*right;		/* text for the right column, or NULL */
};
45 1.1 rmind
46 1.1 rmind static void astrcat(char **, const char *);
47 1.1 rmind static void enqueue(char *, char, char *);
48 1.1 rmind static char *mktmpcpy(const char *);
49 1.1 rmind static void freediff(struct diffline *);
50 1.1 rmind static void int_usage(void);
51 1.1 rmind static int parsecmd(FILE *, FILE *, FILE *);
52 1.1 rmind static void printa(FILE *, size_t);
53 1.1 rmind static void printc(FILE *, size_t, FILE *, size_t);
54 1.1 rmind static void printcol(const char *, size_t *, const size_t);
55 1.1 rmind static void printd(FILE *, size_t);
56 1.1 rmind static void println(const char *, const char, const char *);
57 1.1 rmind static void processq(void);
58 1.1 rmind static void prompt(const char *, const char *);
59 1.1 rmind __dead static void usage(void);
60 1.1 rmind static char *xfgets(FILE *);
61 1.1 rmind
/* Rows queued by enqueue() and drained by processq(). */
SIMPLEQ_HEAD(, diffline) diffhead = SIMPLEQ_HEAD_INITIALIZER(diffhead);

/* Output geometry, computed in main() from the -w value. */
size_t line_width;	/* width of a full line: two columns plus divider */
size_t width;		/* width of a single column */

/* Current line numbers in the two input files; main() starts both at 1. */
size_t file1ln;
size_t file2ln;

/* Option state. */
int Iflag = 0;		/* -I given: diff ignores lines matching a regexp */
int lflag;		/* -l given: print only left column for identical lines */
int sflag;		/* -s given: skip identical lines */

FILE *outfile;		/* -o target the merged result is written to, or NULL */
const char *tmpdir;	/* TMPDIR from the environment, else _PATH_TMP */
71 1.1 rmind
/*
 * Long option table for getopt_long().  Each entry maps a long name
 * onto the character handled by the option switch in main().
 *
 * "ignore-case" is provided so that -i, like every other flag that is
 * passed through to diff, has a long spelling.
 */
static struct option longopts[] = {
	{ "text",			no_argument,		NULL,	'a' },
	{ "ignore-blank-lines",		no_argument,		NULL,	'B' },
	{ "ignore-space-change",	no_argument,		NULL,	'b' },
	{ "minimal",			no_argument,		NULL,	'd' },
	{ "ignore-tab-expansion",	no_argument,		NULL,	'E' },
	{ "diff-program",		required_argument,	NULL,	'F' },
	{ "speed-large-files",		no_argument,		NULL,	'H' },
	{ "ignore-matching-lines",	required_argument,	NULL,	'I' },
	{ "ignore-case",		no_argument,		NULL,	'i' },
	{ "left-column",		no_argument,		NULL,	'l' },
	{ "output",			required_argument,	NULL,	'o' },
	{ "strip-trailing-cr",		no_argument,		NULL,	'S' },
	{ "suppress-common-lines",	no_argument,		NULL,	's' },
	{ "expand-tabs",		no_argument,		NULL,	't' },
	{ "ignore-all-space",		no_argument,		NULL,	'W' },
	{ "width",			required_argument,	NULL,	'w' },
	{ NULL,				0,			NULL,	0 }
};
90 1.1 rmind
91 1.1 rmind /*
92 1.1 rmind * Create temporary file if source_file is not a regular file.
93 1.1 rmind * Returns temporary file name if one was malloced, NULL if unnecessary.
94 1.1 rmind */
95 1.1 rmind static char *
96 1.1 rmind mktmpcpy(const char *source_file)
97 1.1 rmind {
98 1.1 rmind struct stat sb;
99 1.1 rmind ssize_t rcount;
100 1.1 rmind int ifd, ofd;
101 1.1 rmind u_char buf[BUFSIZ];
102 1.1 rmind char *target_file;
103 1.1 rmind
104 1.1 rmind /* Open input and output. */
105 1.1 rmind ifd = open(source_file, O_RDONLY, 0);
106 1.1 rmind /* File was opened successfully. */
107 1.1 rmind if (ifd != -1) {
108 1.1 rmind if (fstat(ifd, &sb) == -1)
109 1.1 rmind err(2, "error getting file status from %s", source_file);
110 1.1 rmind
111 1.1 rmind /* Regular file. */
112 1.1 rmind if (S_ISREG(sb.st_mode))
113 1.1 rmind return (NULL);
114 1.1 rmind } else {
115 1.1 rmind /* If ``-'' does not exist the user meant stdin. */
116 1.1 rmind if (errno == ENOENT && strcmp(source_file, "-") == 0)
117 1.1 rmind ifd = STDIN_FILENO;
118 1.1 rmind else
119 1.1 rmind err(2, "error opening %s", source_file);
120 1.1 rmind }
121 1.1 rmind
122 1.1 rmind /* Not a regular file, so copy input into temporary file. */
123 1.1 rmind if (asprintf(&target_file, "%s/sdiff.XXXXXXXXXX", tmpdir) == -1)
124 1.1 rmind err(2, "asprintf");
125 1.1 rmind if ((ofd = mkstemp(target_file)) == -1) {
126 1.1 rmind warn("error opening %s", target_file);
127 1.1 rmind goto FAIL;
128 1.1 rmind }
129 1.1 rmind while ((rcount = read(ifd, buf, sizeof(buf))) != -1 &&
130 1.1 rmind rcount != 0) {
131 1.1 rmind ssize_t wcount;
132 1.1 rmind
133 1.1 rmind wcount = write(ofd, buf, (size_t)rcount);
134 1.1 rmind if (-1 == wcount || rcount != wcount) {
135 1.1 rmind warn("error writing to %s", target_file);
136 1.1 rmind goto FAIL;
137 1.1 rmind }
138 1.1 rmind }
139 1.1 rmind if (rcount == -1) {
140 1.1 rmind warn("error reading from %s", source_file);
141 1.1 rmind goto FAIL;
142 1.1 rmind }
143 1.1 rmind
144 1.1 rmind close(ifd);
145 1.1 rmind close(ofd);
146 1.1 rmind
147 1.1 rmind return (target_file);
148 1.1 rmind
149 1.1 rmind FAIL:
150 1.1 rmind unlink(target_file);
151 1.1 rmind exit(2);
152 1.1 rmind }
153 1.1 rmind
154 1.1 rmind int
155 1.1 rmind main(int argc, char **argv)
156 1.1 rmind {
157 1.1 rmind FILE *diffpipe, *file1, *file2;
158 1.1 rmind size_t diffargc = 0, wflag = WIDTH;
159 1.1 rmind int ch, fd[2], status;
160 1.1 rmind pid_t pid;
161 1.1 rmind char **diffargv, *diffprog = "diff", *filename1, *filename2,
162 1.1 rmind *tmp1, *tmp2, *s1, *s2;
163 1.1 rmind
164 1.1 rmind /*
165 1.1 rmind * Process diff flags.
166 1.1 rmind */
167 1.1 rmind /*
168 1.1 rmind * Allocate memory for diff arguments and NULL.
169 1.1 rmind * Each flag has at most one argument, so doubling argc gives an
170 1.1 rmind * upper limit of how many diff args can be passed. argv[0],
171 1.1 rmind * file1, and file2 won't have arguments so doubling them will
172 1.1 rmind * waste some memory; however we need an extra space for the
173 1.1 rmind * NULL at the end, so it sort of works out.
174 1.1 rmind */
175 1.1 rmind if (!(diffargv = malloc(sizeof(char **) * argc * 2)))
176 1.1 rmind err(2, "main");
177 1.1 rmind
178 1.1 rmind /* Add first argument, the program name. */
179 1.1 rmind diffargv[diffargc++] = diffprog;
180 1.1 rmind
181 1.1 rmind while ((ch = getopt_long(argc, argv, "aBbdEHI:ilo:stWw:",
182 1.1 rmind longopts, NULL)) != -1) {
183 1.1 rmind const char *errstr;
184 1.1 rmind
185 1.1 rmind switch (ch) {
186 1.1 rmind case 'a':
187 1.1 rmind diffargv[diffargc++] = "-a";
188 1.1 rmind break;
189 1.1 rmind case 'B':
190 1.1 rmind diffargv[diffargc++] = "-B";
191 1.1 rmind break;
192 1.1 rmind case 'b':
193 1.1 rmind diffargv[diffargc++] = "-b";
194 1.1 rmind break;
195 1.1 rmind case 'd':
196 1.1 rmind diffargv[diffargc++] = "-d";
197 1.1 rmind break;
198 1.1 rmind case 'E':
199 1.1 rmind diffargv[diffargc++] = "-E";
200 1.1 rmind break;
201 1.1 rmind case 'F':
202 1.1 rmind diffargv[0] = diffprog = optarg;
203 1.1 rmind break;
204 1.1 rmind case 'H':
205 1.1 rmind diffargv[diffargc++] = "-H";
206 1.1 rmind break;
207 1.1 rmind case 'I':
208 1.1 rmind Iflag = 1;
209 1.1 rmind diffargv[diffargc++] = "-I";
210 1.1 rmind diffargv[diffargc++] = optarg;
211 1.1 rmind break;
212 1.1 rmind case 'i':
213 1.1 rmind diffargv[diffargc++] = "-i";
214 1.1 rmind break;
215 1.1 rmind case 'l':
216 1.1 rmind lflag = 1;
217 1.1 rmind break;
218 1.1 rmind case 'o':
219 1.1 rmind if ((outfile = fopen(optarg, "w")) == NULL)
220 1.1 rmind err(2, "could not open: %s", optarg);
221 1.1 rmind break;
222 1.1 rmind case 'S':
223 1.1 rmind diffargv[diffargc++] = "--strip-trailing-cr";
224 1.1 rmind break;
225 1.1 rmind case 's':
226 1.1 rmind sflag = 1;
227 1.1 rmind break;
228 1.1 rmind case 't':
229 1.1 rmind diffargv[diffargc++] = "-t";
230 1.1 rmind break;
231 1.1 rmind case 'W':
232 1.1 rmind diffargv[diffargc++] = "-w";
233 1.1 rmind break;
234 1.1 rmind case 'w':
235 1.1 rmind wflag = strtonum(optarg, WIDTH_MIN,
236 1.1 rmind INT_MAX, &errstr);
237 1.1 rmind if (errstr)
238 1.1 rmind errx(2, "width is %s: %s", errstr, optarg);
239 1.1 rmind break;
240 1.1 rmind default:
241 1.1 rmind usage();
242 1.1 rmind }
243 1.1 rmind
244 1.1 rmind }
245 1.1 rmind argc -= optind;
246 1.1 rmind argv += optind;
247 1.1 rmind
248 1.1 rmind if (argc != 2)
249 1.1 rmind usage();
250 1.1 rmind
251 1.1 rmind if ((tmpdir = getenv("TMPDIR")) == NULL)
252 1.1 rmind tmpdir = _PATH_TMP;
253 1.1 rmind
254 1.1 rmind filename1 = argv[0];
255 1.1 rmind filename2 = argv[1];
256 1.1 rmind
257 1.1 rmind /*
258 1.1 rmind * Create temporary files for diff and sdiff to share if file1
259 1.1 rmind * or file2 are not regular files. This allows sdiff and diff
260 1.1 rmind * to read the same inputs if one or both inputs are stdin.
261 1.1 rmind *
262 1.1 rmind * If any temporary files were created, their names would be
263 1.1 rmind * saved in tmp1 or tmp2. tmp1 should never equal tmp2.
264 1.1 rmind */
265 1.1 rmind tmp1 = tmp2 = NULL;
266 1.1 rmind /* file1 and file2 are the same, so copy to same temp file. */
267 1.1 rmind if (strcmp(filename1, filename2) == 0) {
268 1.1 rmind if ((tmp1 = mktmpcpy(filename1)))
269 1.1 rmind filename1 = filename2 = tmp1;
270 1.1 rmind /* Copy file1 and file2 into separate temp files. */
271 1.1 rmind } else {
272 1.1 rmind if ((tmp1 = mktmpcpy(filename1)))
273 1.1 rmind filename1 = tmp1;
274 1.1 rmind if ((tmp2 = mktmpcpy(filename2)))
275 1.1 rmind filename2 = tmp2;
276 1.1 rmind }
277 1.1 rmind
278 1.1 rmind diffargv[diffargc++] = filename1;
279 1.1 rmind diffargv[diffargc++] = filename2;
280 1.1 rmind /* Add NULL to end of array to indicate end of array. */
281 1.1 rmind diffargv[diffargc++] = NULL;
282 1.1 rmind
283 1.1 rmind /* Subtract column divider and divide by two. */
284 1.1 rmind width = (wflag - 3) / 2;
285 1.1 rmind /* Make sure line_width can fit in size_t. */
286 1.1 rmind if (width > (SIZE_T_MAX - 3) / 2)
287 1.1 rmind errx(2, "width is too large: %zu", width);
288 1.1 rmind line_width = width * 2 + 3;
289 1.1 rmind
290 1.1 rmind if (pipe(fd))
291 1.1 rmind err(2, "pipe");
292 1.1 rmind
293 1.1 rmind switch(pid = fork()) {
294 1.1 rmind case 0:
295 1.1 rmind /* child */
296 1.1 rmind /* We don't read from the pipe. */
297 1.1 rmind close(fd[0]);
298 1.1 rmind if (dup2(fd[1], STDOUT_FILENO) == -1)
299 1.1 rmind err(2, "child could not duplicate descriptor");
300 1.1 rmind /* Free unused descriptor. */
301 1.1 rmind close(fd[1]);
302 1.1 rmind
303 1.1 rmind execvp(diffprog, diffargv);
304 1.1 rmind err(2, "could not execute diff: %s", diffprog);
305 1.1 rmind case -1:
306 1.1 rmind err(2, "could not fork");
307 1.1 rmind }
308 1.1 rmind
309 1.1 rmind /* parent */
310 1.1 rmind /* We don't write to the pipe. */
311 1.1 rmind close(fd[1]);
312 1.1 rmind
313 1.1 rmind /* Open pipe to diff command. */
314 1.1 rmind if ((diffpipe = fdopen(fd[0], "r")) == NULL)
315 1.1 rmind err(2, "could not open diff pipe");
316 1.1 rmind if ((file1 = fopen(filename1, "r")) == NULL)
317 1.1 rmind err(2, "could not open %s", filename1);
318 1.1 rmind if ((file2 = fopen(filename2, "r")) == NULL)
319 1.1 rmind err(2, "could not open %s", filename2);
320 1.1 rmind
321 1.1 rmind /* Line numbers start at one. */
322 1.1 rmind file1ln = file2ln = 1;
323 1.1 rmind
324 1.1 rmind /* Read and parse diff output. */
325 1.1 rmind while (parsecmd(diffpipe, file1, file2) != EOF)
326 1.1 rmind ;
327 1.1 rmind fclose(diffpipe);
328 1.1 rmind
329 1.1 rmind /* Wait for diff to exit. */
330 1.1 rmind if (waitpid(pid, &status, 0) == -1 || !WIFEXITED(status) ||
331 1.1 rmind WEXITSTATUS(status) >= 2)
332 1.1 rmind err(2, "diff exited abnormally");
333 1.1 rmind
334 1.1 rmind /* Delete and free unneeded temporary files. */
335 1.1 rmind if (tmp1)
336 1.1 rmind if (unlink(tmp1))
337 1.1 rmind warn("error deleting %s", tmp1);
338 1.1 rmind if (tmp2)
339 1.1 rmind if (unlink(tmp2))
340 1.1 rmind warn("error deleting %s", tmp2);
341 1.1 rmind free(tmp1);
342 1.1 rmind free(tmp2);
343 1.1 rmind filename1 = filename2 = tmp1 = tmp2 = NULL;
344 1.1 rmind
345 1.1 rmind /* No more diffs, so print common lines. */
346 1.1 rmind if (lflag)
347 1.1 rmind while ((s1 = xfgets(file1)))
348 1.1 rmind enqueue(s1, ' ', NULL);
349 1.1 rmind else
350 1.1 rmind for (;;) {
351 1.1 rmind s1 = xfgets(file1);
352 1.1 rmind s2 = xfgets(file2);
353 1.1 rmind if (s1 || s2)
354 1.1 rmind enqueue(s1, ' ', s2);
355 1.1 rmind else
356 1.1 rmind break;
357 1.1 rmind }
358 1.1 rmind fclose(file1);
359 1.1 rmind fclose(file2);
360 1.1 rmind /* Process unmodified lines. */
361 1.1 rmind processq();
362 1.1 rmind
363 1.1 rmind /* Return diff exit status. */
364 1.1 rmind return (WEXITSTATUS(status));
365 1.1 rmind }
366 1.1 rmind
/*
 * Write one column of text to standard output.
 *
 * s is the text, *col the screen column the cursor is currently in and
 * col_max the first column that must not be written to.  Characters
 * are emitted until the string ends or col_max is reached, and *col is
 * advanced as output is produced.  A tab moves to the next multiple of
 * eight; a tab that would overflow the column counter or land beyond
 * col_max is not printed and ends the output.
 */
static void
printcol(const char *s, size_t *col, const size_t col_max)
{
	const char *cp = s;

	while (*cp != '\0' && *col < col_max) {
		if (*cp == '\t') {
			size_t tabstop;

			/*
			 * (size_t)-1 is the largest size_t value; stop if
			 * rounding up to the next tab stop could wrap.
			 */
			if (*col > (size_t)-1 - 8)
				return;

			/* Next multiple of eight after the current column. */
			tabstop = (*col / 8 + 1) * 8;

			/* The tab does not fit: drop it and everything after. */
			if (tabstop > col_max)
				return;
			*col = tabstop;
		} else {
			/* Every other character counts as one column. */
			*col += 1;
		}

		putchar(*cp);
		cp++;
	}
}
408 1.1 rmind
409 1.1 rmind /*
410 1.1 rmind * Prompts user to either choose between two strings or edit one, both,
411 1.1 rmind * or neither.
412 1.1 rmind */
413 1.1 rmind static void
414 1.1 rmind prompt(const char *s1, const char *s2)
415 1.1 rmind {
416 1.1 rmind char *cmd;
417 1.1 rmind
418 1.1 rmind /* Print command prompt. */
419 1.1 rmind putchar('%');
420 1.1 rmind
421 1.1 rmind /* Get user input. */
422 1.1 rmind for (; (cmd = xfgets(stdin)); free(cmd)) {
423 1.1 rmind const char *p;
424 1.1 rmind
425 1.1 rmind /* Skip leading whitespace. */
426 1.3 rillig for (p = cmd; isspace((unsigned char)(*p)); ++p)
427 1.1 rmind ;
428 1.1 rmind
429 1.1 rmind switch (*p) {
430 1.1 rmind case 'e':
431 1.1 rmind /* Skip `e'. */
432 1.1 rmind ++p;
433 1.1 rmind
434 1.1 rmind if (eparse(p, s1, s2) == -1)
435 1.1 rmind goto USAGE;
436 1.1 rmind break;
437 1.1 rmind
438 1.1 rmind case 'l':
439 1.1 rmind /* Choose left column as-is. */
440 1.1 rmind if (s1 != NULL)
441 1.1 rmind fprintf(outfile, "%s\n", s1);
442 1.1 rmind
443 1.1 rmind /* End of command parsing. */
444 1.1 rmind break;
445 1.1 rmind
446 1.1 rmind case 'q':
447 1.1 rmind goto QUIT;
448 1.1 rmind
449 1.1 rmind case 'r':
450 1.1 rmind /* Choose right column as-is. */
451 1.1 rmind if (s2 != NULL)
452 1.1 rmind fprintf(outfile, "%s\n", s2);
453 1.1 rmind
454 1.1 rmind /* End of command parsing. */
455 1.1 rmind break;
456 1.1 rmind
457 1.1 rmind case 's':
458 1.1 rmind sflag = 1;
459 1.1 rmind goto PROMPT;
460 1.1 rmind
461 1.1 rmind case 'v':
462 1.1 rmind sflag = 0;
463 1.1 rmind /* FALLTHROUGH */
464 1.1 rmind
465 1.1 rmind default:
466 1.1 rmind /* Interactive usage help. */
467 1.1 rmind USAGE:
468 1.1 rmind int_usage();
469 1.1 rmind PROMPT:
470 1.1 rmind putchar('%');
471 1.1 rmind
472 1.1 rmind /* Prompt user again. */
473 1.1 rmind continue;
474 1.1 rmind }
475 1.1 rmind
476 1.1 rmind free(cmd);
477 1.1 rmind return;
478 1.1 rmind }
479 1.1 rmind
480 1.1 rmind /*
481 1.1 rmind * If there was no error, we received an EOF from stdin, so we
482 1.1 rmind * should quit.
483 1.1 rmind */
484 1.1 rmind QUIT:
485 1.1 rmind fclose(outfile);
486 1.1 rmind exit(0);
487 1.1 rmind }
488 1.1 rmind
489 1.1 rmind /*
490 1.1 rmind * Takes two strings, separated by a column divider. NULL strings are
491 1.1 rmind * treated as empty columns. If the divider is the ` ' character, the
492 1.1 rmind * second column is not printed (-l flag). In this case, the second
493 1.1 rmind * string must be NULL. When the second column is NULL, the divider
494 1.1 rmind * does not print the trailing space following the divider character.
495 1.1 rmind *
496 1.1 rmind * Takes into account that tabs can take multiple columns.
497 1.1 rmind */
498 1.1 rmind static void
499 1.2 lukem println(const char *s1, const char divc, const char *s2)
500 1.1 rmind {
501 1.1 rmind size_t col;
502 1.1 rmind
503 1.1 rmind /* Print first column. Skips if s1 == NULL. */
504 1.1 rmind col = 0;
505 1.1 rmind if (s1) {
506 1.1 rmind /* Skip angle bracket and space. */
507 1.1 rmind printcol(s1, &col, width);
508 1.1 rmind
509 1.1 rmind }
510 1.1 rmind
511 1.1 rmind /* Only print left column. */
512 1.2 lukem if (divc == ' ' && !s2) {
513 1.1 rmind putchar('\n');
514 1.1 rmind return;
515 1.1 rmind }
516 1.1 rmind
517 1.1 rmind /* Otherwise, we pad this column up to width. */
518 1.1 rmind for (; col < width; ++col)
519 1.1 rmind putchar(' ');
520 1.1 rmind
521 1.1 rmind /*
522 1.1 rmind * Print column divider. If there is no second column, we don't
523 1.1 rmind * need to add the space for padding.
524 1.1 rmind */
525 1.1 rmind if (!s2) {
526 1.2 lukem printf(" %c\n", divc);
527 1.1 rmind return;
528 1.1 rmind }
529 1.2 lukem printf(" %c ", divc);
530 1.1 rmind col += 3;
531 1.1 rmind
532 1.1 rmind /* Skip angle bracket and space. */
533 1.1 rmind printcol(s2, &col, line_width);
534 1.1 rmind
535 1.1 rmind putchar('\n');
536 1.1 rmind }
537 1.1 rmind
/*
 * Read the next line from file through fparseln().
 *
 * Returns the string handed back by fparseln(), which the caller must
 * free, or NULL when no line could be read without the stream being
 * in an error state (end of file).  A read error terminates the
 * program with exit status 2.
 */
static char *
xfgets(FILE *file)
{
	/* All three fparseln() delimiter slots are NUL; see fparseln(3). */
	const char delim[3] = {'\0', '\0', '\0'};
	char *line;

	/* XXX - Is this necessary? */
	clearerr(file);

	line = fparseln(file, NULL, NULL, delim, 0);
	if (line == NULL && ferror(file))
		err(2, "error reading file");

	return (line);
}
561 1.1 rmind
562 1.1 rmind /*
563 1.1 rmind * Parse ed commands from diffpipe and print lines from file1 (lines
564 1.1 rmind * to change or delete) or file2 (lines to add or change).
565 1.1 rmind * Returns EOF or 0.
566 1.1 rmind */
567 1.1 rmind static int
568 1.1 rmind parsecmd(FILE *diffpipe, FILE *file1, FILE *file2)
569 1.1 rmind {
570 1.1 rmind size_t file1start, file1end, file2start, file2end, n;
571 1.1 rmind /* ed command line and pointer to characters in line */
572 1.1 rmind char *line, *p, *q;
573 1.1 rmind const char *errstr;
574 1.1 rmind char c, cmd;
575 1.1 rmind
576 1.1 rmind /* Read ed command. */
577 1.1 rmind if (!(line = xfgets(diffpipe)))
578 1.1 rmind return (EOF);
579 1.1 rmind
580 1.1 rmind p = line;
581 1.1 rmind /* Go to character after line number. */
582 1.3 rillig while (isdigit((unsigned char)(*p)))
583 1.1 rmind ++p;
584 1.1 rmind c = *p;
585 1.1 rmind *p++ = 0;
586 1.1 rmind file1start = strtonum(line, 0, INT_MAX, &errstr);
587 1.1 rmind if (errstr)
588 1.1 rmind errx(2, "file1 start is %s: %s", errstr, line);
589 1.1 rmind
590 1.1 rmind /* A range is specified for file1. */
591 1.1 rmind if (c == ',') {
592 1.1 rmind
593 1.1 rmind q = p;
594 1.1 rmind /* Go to character after file2end. */
595 1.3 rillig while (isdigit((unsigned char)(*p)))
596 1.1 rmind ++p;
597 1.1 rmind c = *p;
598 1.1 rmind *p++ = 0;
599 1.1 rmind file1end = strtonum(q, 0, INT_MAX, &errstr);
600 1.1 rmind if (errstr)
601 1.1 rmind errx(2, "file1 end is %s: %s", errstr, line);
602 1.1 rmind if (file1start > file1end)
603 1.1 rmind errx(2, "invalid line range in file1: %s", line);
604 1.1 rmind
605 1.1 rmind } else
606 1.1 rmind file1end = file1start;
607 1.1 rmind
608 1.1 rmind cmd = c;
609 1.1 rmind /* Check that cmd is valid. */
610 1.1 rmind if (!(cmd == 'a' || cmd == 'c' || cmd == 'd'))
611 1.1 rmind errx(2, "ed command not recognized: %c: %s", cmd, line);
612 1.1 rmind
613 1.1 rmind q = p;
614 1.1 rmind /* Go to character after line number. */
615 1.3 rillig while (isdigit((unsigned char)(*p)))
616 1.1 rmind ++p;
617 1.1 rmind c = *p;
618 1.1 rmind *p++ = 0;
619 1.1 rmind file2start = strtonum(q, 0, INT_MAX, &errstr);
620 1.1 rmind if (errstr)
621 1.1 rmind errx(2, "file2 start is %s: %s", errstr, line);
622 1.1 rmind
623 1.1 rmind /*
624 1.1 rmind * There should either be a comma signifying a second line
625 1.1 rmind * number or the line should just end here.
626 1.1 rmind */
627 1.1 rmind if (c != ',' && c != '\0')
628 1.1 rmind errx(2, "invalid line range in file2: %c: %s", c, line);
629 1.1 rmind
630 1.1 rmind if (c == ',') {
631 1.1 rmind
632 1.1 rmind file2end = strtonum(p, 0, INT_MAX, &errstr);
633 1.1 rmind if (errstr)
634 1.1 rmind errx(2, "file2 end is %s: %s", errstr, line);
635 1.1 rmind if (file2start >= file2end)
636 1.1 rmind errx(2, "invalid line range in file2: %s", line);
637 1.1 rmind } else
638 1.1 rmind file2end = file2start;
639 1.1 rmind
640 1.1 rmind /* Appends happen _after_ stated line. */
641 1.1 rmind if (cmd == 'a') {
642 1.1 rmind if (file1start != file1end)
643 1.1 rmind errx(2, "append cannot have a file1 range: %s",
644 1.1 rmind line);
645 1.1 rmind if (file1start == SIZE_T_MAX)
646 1.1 rmind errx(2, "file1 line range too high: %s", line);
647 1.1 rmind file1start = ++file1end;
648 1.1 rmind }
649 1.1 rmind /*
650 1.1 rmind * I'm not sure what the deal is with the line numbers for
651 1.1 rmind * deletes, though.
652 1.1 rmind */
653 1.1 rmind else if (cmd == 'd') {
654 1.1 rmind if (file2start != file2end)
655 1.1 rmind errx(2, "delete cannot have a file2 range: %s",
656 1.1 rmind line);
657 1.1 rmind if (file2start == SIZE_T_MAX)
658 1.1 rmind errx(2, "file2 line range too high: %s", line);
659 1.1 rmind file2start = ++file2end;
660 1.1 rmind }
661 1.1 rmind
662 1.1 rmind /*
663 1.1 rmind * Continue reading file1 and file2 until we reach line numbers
664 1.1 rmind * specified by diff. Should only happen with -I flag.
665 1.1 rmind */
666 1.1 rmind for (; file1ln < file1start && file2ln < file2start;
667 1.1 rmind ++file1ln, ++file2ln) {
668 1.1 rmind char *s1, *s2;
669 1.1 rmind
670 1.1 rmind if (!(s1 = xfgets(file1)))
671 1.1 rmind errx(2, "file1 shorter than expected");
672 1.1 rmind if (!(s2 = xfgets(file2)))
673 1.1 rmind errx(2, "file2 shorter than expected");
674 1.1 rmind
675 1.1 rmind /* If the -l flag was specified, print only left column. */
676 1.1 rmind if (lflag) {
677 1.1 rmind free(s2);
678 1.1 rmind /*
679 1.1 rmind * XXX - If -l and -I are both specified, all
680 1.1 rmind * unchanged or ignored lines are shown with a
681 1.1 rmind * `(' divider. This matches GNU sdiff, but I
682 1.1 rmind * believe it is a bug. Just check out:
683 1.1 rmind * gsdiff -l -I '^$' samefile samefile.
684 1.1 rmind */
685 1.1 rmind if (Iflag)
686 1.1 rmind enqueue(s1, '(', NULL);
687 1.1 rmind else
688 1.1 rmind enqueue(s1, ' ', NULL);
689 1.1 rmind } else
690 1.1 rmind enqueue(s1, ' ', s2);
691 1.1 rmind }
692 1.1 rmind /* Ignore deleted lines. */
693 1.1 rmind for (; file1ln < file1start; ++file1ln) {
694 1.1 rmind char *s;
695 1.1 rmind
696 1.1 rmind if (!(s = xfgets(file1)))
697 1.1 rmind errx(2, "file1 shorter than expected");
698 1.1 rmind
699 1.1 rmind enqueue(s, '(', NULL);
700 1.1 rmind }
701 1.1 rmind /* Ignore added lines. */
702 1.1 rmind for (; file2ln < file2start; ++file2ln) {
703 1.1 rmind char *s;
704 1.1 rmind
705 1.1 rmind if (!(s = xfgets(file2)))
706 1.1 rmind errx(2, "file2 shorter than expected");
707 1.1 rmind
708 1.1 rmind /* If -l flag was given, don't print right column. */
709 1.1 rmind if (lflag)
710 1.1 rmind free(s);
711 1.1 rmind else
712 1.1 rmind enqueue(NULL, ')', s);
713 1.1 rmind }
714 1.1 rmind
715 1.1 rmind /* Process unmodified or skipped lines. */
716 1.1 rmind processq();
717 1.1 rmind
718 1.1 rmind switch (cmd) {
719 1.1 rmind case 'a':
720 1.1 rmind printa(file2, file2end);
721 1.1 rmind n = file2end - file2start + 1;
722 1.1 rmind break;
723 1.1 rmind
724 1.1 rmind case 'c':
725 1.1 rmind printc(file1, file1end, file2, file2end);
726 1.1 rmind n = file1end - file1start + 1 + 1 + file2end - file2start + 1;
727 1.1 rmind break;
728 1.1 rmind
729 1.1 rmind case 'd':
730 1.1 rmind printd(file1, file1end);
731 1.1 rmind n = file1end - file1start + 1;
732 1.1 rmind break;
733 1.1 rmind
734 1.1 rmind default:
735 1.1 rmind errx(2, "invalid diff command: %c: %s", cmd, line);
736 1.1 rmind }
737 1.1 rmind
738 1.1 rmind /* Skip to next ed line. */
739 1.1 rmind while (n--)
740 1.1 rmind if (!xfgets(diffpipe))
741 1.1 rmind errx(2, "diff ended early");
742 1.1 rmind
743 1.1 rmind return (0);
744 1.1 rmind }
745 1.1 rmind
746 1.1 rmind /*
747 1.1 rmind * Queues up a diff line.
748 1.1 rmind */
749 1.1 rmind static void
750 1.2 lukem enqueue(char *left, char divc, char *right)
751 1.1 rmind {
752 1.1 rmind struct diffline *diffp;
753 1.1 rmind
754 1.1 rmind if (!(diffp = malloc(sizeof(struct diffline))))
755 1.1 rmind err(2, "enqueue");
756 1.1 rmind diffp->left = left;
757 1.2 lukem diffp->div = divc;
758 1.1 rmind diffp->right = right;
759 1.1 rmind SIMPLEQ_INSERT_TAIL(&diffhead, diffp, diffentries);
760 1.1 rmind }
761 1.1 rmind
762 1.1 rmind /*
763 1.1 rmind * Free a diffline structure and its elements.
764 1.1 rmind */
765 1.1 rmind static void
766 1.1 rmind freediff(struct diffline *diffp)
767 1.1 rmind {
768 1.1 rmind free(diffp->left);
769 1.1 rmind free(diffp->right);
770 1.1 rmind free(diffp);
771 1.1 rmind }
772 1.1 rmind
/*
 * Grow the heap string *s by a newline followed by `append'.
 *
 * If *s is NULL it simply becomes a copy of `append' (no newline).
 * The address and length of the string from the previous call are
 * remembered, so a run of appends to the same string does not have to
 * rescan it; the cost of such a call depends only on strlen(append)
 * plus whatever realloc() does.
 *
 * Allocation failure terminates the program with exit status 2.
 */
static void
astrcat(char **s, const char *append)
{
	/* String handled by the previous call and its length. */
	static const char *cached_str = NULL;
	static size_t cached_len = 0;
	const size_t addlen = strlen(append);
	size_t total;
	char *grown;

	/* Nothing to append to yet: start the string as a plain copy. */
	if (*s == NULL) {
		if ((grown = malloc(addlen + 1)) == NULL)
			err(2, "astrcat");
		memcpy(grown, append, addlen + 1);

		*s = grown;
		cached_str = grown;
		cached_len = addlen;
		return;
	}

	/* A different string than last time: measure it afresh. */
	if (cached_str != *s) {
		cached_len = strlen(*s);
		cached_str = *s;
	}

	/* Old text + '\n' + appended text + terminating NUL. */
	total = cached_len + 1 + addlen + 1;

	if ((grown = realloc(*s, total)) == NULL)
		err(2, "astrcat");
	*s = grown;

	/* Write the separator and the new text over the old terminator. */
	grown[cached_len] = '\n';
	memcpy(grown + cached_len + 1, append, addlen + 1);

	/* Remember the result for the next call. */
	cached_len = total - 1;
	cached_str = grown;
}
838 1.1 rmind
839 1.1 rmind /*
840 1.1 rmind * Process diff set queue, printing, prompting, and saving each diff
841 1.1 rmind * line stored in queue.
842 1.1 rmind */
843 1.1 rmind static void
844 1.1 rmind processq(void)
845 1.1 rmind {
846 1.1 rmind struct diffline *diffp;
847 1.1 rmind char divc, *left, *right;
848 1.1 rmind
849 1.1 rmind /* Don't process empty queue. */
850 1.1 rmind if (SIMPLEQ_EMPTY(&diffhead))
851 1.1 rmind return;
852 1.1 rmind
853 1.1 rmind /* Remember the divider. */
854 1.1 rmind divc = SIMPLEQ_FIRST(&diffhead)->div;
855 1.1 rmind
856 1.1 rmind left = NULL;
857 1.1 rmind right = NULL;
858 1.1 rmind /*
859 1.1 rmind * Go through set of diffs, concatenating each line in left or
860 1.1 rmind * right column into two long strings, `left' and `right'.
861 1.1 rmind */
862 1.1 rmind SIMPLEQ_FOREACH(diffp, &diffhead, diffentries) {
863 1.1 rmind /*
864 1.1 rmind * Print changed lines if -s was given,
865 1.1 rmind * print all lines if -s was not given.
866 1.1 rmind */
867 1.1 rmind if (!sflag || diffp->div == '|' || diffp->div == '<' ||
868 1.1 rmind diffp->div == '>')
869 1.1 rmind println(diffp->left, diffp->div, diffp->right);
870 1.1 rmind
871 1.1 rmind /* Append new lines to diff set. */
872 1.1 rmind if (diffp->left)
873 1.1 rmind astrcat(&left, diffp->left);
874 1.1 rmind if (diffp->right)
875 1.1 rmind astrcat(&right, diffp->right);
876 1.1 rmind }
877 1.1 rmind
878 1.1 rmind /* Empty queue and free each diff line and its elements. */
879 1.1 rmind while (!SIMPLEQ_EMPTY(&diffhead)) {
880 1.1 rmind diffp = SIMPLEQ_FIRST(&diffhead);
881 1.1 rmind SIMPLEQ_REMOVE_HEAD(&diffhead, diffentries);
882 1.1 rmind freediff(diffp);
883 1.1 rmind }
884 1.1 rmind
885 1.1 rmind /* Write to outfile, prompting user if lines are different. */
886 1.1 rmind if (outfile)
887 1.1 rmind switch (divc) {
888 1.1 rmind case ' ': case '(': case ')':
889 1.1 rmind fprintf(outfile, "%s\n", left);
890 1.1 rmind break;
891 1.1 rmind case '|': case '<': case '>':
892 1.1 rmind prompt(left, right);
893 1.1 rmind break;
894 1.1 rmind default:
895 1.1 rmind errx(2, "invalid divider: %c", divc);
896 1.1 rmind }
897 1.1 rmind
898 1.1 rmind /* Free left and right. */
899 1.1 rmind free(left);
900 1.1 rmind free(right);
901 1.1 rmind }
902 1.1 rmind
903 1.1 rmind /*
904 1.1 rmind * Print lines following an (a)ppend command.
905 1.1 rmind */
906 1.1 rmind static void
907 1.1 rmind printa(FILE *file, size_t line2)
908 1.1 rmind {
909 1.1 rmind char *line;
910 1.1 rmind
911 1.1 rmind for (; file2ln <= line2; ++file2ln) {
912 1.1 rmind if (!(line = xfgets(file)))
913 1.1 rmind errx(2, "append ended early");
914 1.1 rmind enqueue(NULL, '>', line);
915 1.1 rmind }
916 1.1 rmind
917 1.1 rmind processq();
918 1.1 rmind }
919 1.1 rmind
920 1.1 rmind /*
921 1.1 rmind * Print lines following a (c)hange command, from file1ln to file1end
922 1.1 rmind * and from file2ln to file2end.
923 1.1 rmind */
924 1.1 rmind static void
925 1.1 rmind printc(FILE *file1, size_t file1end, FILE *file2, size_t file2end)
926 1.1 rmind {
927 1.1 rmind struct fileline {
928 1.1 rmind SIMPLEQ_ENTRY(fileline) fileentries;
929 1.1 rmind char *line;
930 1.1 rmind };
931 1.1 rmind SIMPLEQ_HEAD(, fileline) delqhead = SIMPLEQ_HEAD_INITIALIZER(delqhead);
932 1.1 rmind
933 1.1 rmind /* Read lines to be deleted. */
934 1.1 rmind for (; file1ln <= file1end; ++file1ln) {
935 1.1 rmind struct fileline *linep;
936 1.1 rmind char *line1;
937 1.1 rmind
938 1.1 rmind /* Read lines from both. */
939 1.1 rmind if (!(line1 = xfgets(file1)))
940 1.1 rmind errx(2, "error reading file1 in delete in change");
941 1.1 rmind
942 1.1 rmind /* Add to delete queue. */
943 1.1 rmind if (!(linep = malloc(sizeof(struct fileline))))
944 1.1 rmind err(2, "printc");
945 1.1 rmind linep->line = line1;
946 1.1 rmind SIMPLEQ_INSERT_TAIL(&delqhead, linep, fileentries);
947 1.1 rmind }
948 1.1 rmind
949 1.1 rmind /* Process changed lines.. */
950 1.1 rmind for (; !SIMPLEQ_EMPTY(&delqhead) && file2ln <= file2end;
951 1.1 rmind ++file2ln) {
952 1.1 rmind struct fileline *del;
953 1.1 rmind char *add;
954 1.1 rmind
955 1.1 rmind /* Get add line. */
956 1.1 rmind if (!(add = xfgets(file2)))
957 1.1 rmind errx(2, "error reading add in change");
958 1.1 rmind
959 1.1 rmind del = SIMPLEQ_FIRST(&delqhead);
960 1.1 rmind enqueue(del->line, '|', add);
961 1.1 rmind SIMPLEQ_REMOVE_HEAD(&delqhead, fileentries);
962 1.1 rmind /*
963 1.1 rmind * Free fileline structure but not its elements since
964 1.1 rmind * they are queued up.
965 1.1 rmind */
966 1.1 rmind free(del);
967 1.1 rmind }
968 1.1 rmind processq();
969 1.1 rmind
970 1.1 rmind /* Process remaining lines to add. */
971 1.1 rmind for (; file2ln <= file2end; ++file2ln) {
972 1.1 rmind char *add;
973 1.1 rmind
974 1.1 rmind /* Get add line. */
975 1.1 rmind if (!(add = xfgets(file2)))
976 1.1 rmind errx(2, "error reading add in change");
977 1.1 rmind
978 1.1 rmind enqueue(NULL, '>', add);
979 1.1 rmind }
980 1.1 rmind processq();
981 1.1 rmind
982 1.1 rmind /* Process remaining lines to delete. */
983 1.1 rmind while (!SIMPLEQ_EMPTY(&delqhead)) {
984 1.1 rmind struct fileline *filep;
985 1.1 rmind
986 1.1 rmind filep = SIMPLEQ_FIRST(&delqhead);
987 1.1 rmind enqueue(filep->line, '<', NULL);
988 1.1 rmind SIMPLEQ_REMOVE_HEAD(&delqhead, fileentries);
989 1.1 rmind free(filep);
990 1.1 rmind }
991 1.1 rmind processq();
992 1.1 rmind }
993 1.1 rmind
994 1.1 rmind /*
995 1.1 rmind * Print deleted lines from file, from file1ln to file1end.
996 1.1 rmind */
997 1.1 rmind static void
998 1.1 rmind printd(FILE *file1, size_t file1end)
999 1.1 rmind {
1000 1.1 rmind char *line1;
1001 1.1 rmind
1002 1.1 rmind /* Print out lines file1ln to line2. */
1003 1.1 rmind for (; file1ln <= file1end; ++file1ln) {
1004 1.1 rmind /* XXX - Why can't this handle stdin? */
1005 1.1 rmind if (!(line1 = xfgets(file1)))
1006 1.1 rmind errx(2, "file1 ended early in delete");
1007 1.1 rmind enqueue(line1, '<', NULL);
1008 1.1 rmind }
1009 1.1 rmind processq();
1010 1.1 rmind }
1011 1.1 rmind
/*
 * Print the summary of interactive-mode commands to stdout.
 */
static void
int_usage(void)
{
	/* One command per line; puts() supplies the final newline. */
	static const char help[] =
	    "e:\tedit blank diff\n"
	    "eb:\tedit both diffs concatenated\n"
	    "el:\tedit left diff\n"
	    "er:\tedit right diff\n"
	    "l:\tchoose left diff\n"
	    "r:\tchoose right diff\n"
	    "s:\tsilent mode--don't print identical lines\n"
	    "v:\tverbose mode--print identical lines\n"
	    "q:\tquit";

	puts(help);
}
1028 1.1 rmind
/*
 * Print the command-line synopsis to stderr and exit with status 2.
 */
static void
usage(void)
{
	extern char *__progname;
	const char *prog = __progname;

	fprintf(stderr,
	    "usage: %s [-abdilstW] [-I regexp] [-o outfile] [-w width] file1 file2\n",
	    prog);
	exit(2);
}
1039