1 1.3 rillig /* $NetBSD: sdiff.c,v 1.3 2021/08/27 17:38:57 rillig Exp $ */ 2 1.1 rmind /* $OpenBSD: sdiff.c,v 1.20 2006/09/19 05:52:23 otto Exp $ */ 3 1.1 rmind 4 1.1 rmind /* 5 1.1 rmind * Written by Raymond Lai <ray (at) cyth.net>. 6 1.1 rmind * Public domain. 7 1.1 rmind */ 8 1.1 rmind 9 1.1 rmind #include <sys/param.h> 10 1.1 rmind #include <sys/queue.h> 11 1.1 rmind #include <sys/stat.h> 12 1.1 rmind #include <sys/types.h> 13 1.1 rmind #include <sys/wait.h> 14 1.1 rmind 15 1.1 rmind #include <ctype.h> 16 1.1 rmind #include <err.h> 17 1.1 rmind #include <errno.h> 18 1.1 rmind #include <fcntl.h> 19 1.1 rmind #include <getopt.h> 20 1.1 rmind #include <limits.h> 21 1.1 rmind #include <paths.h> 22 1.1 rmind #include <stdio.h> 23 1.1 rmind #include <stdlib.h> 24 1.1 rmind #include <string.h> 25 1.1 rmind #include <unistd.h> 26 1.1 rmind #include <util.h> 27 1.1 rmind 28 1.1 rmind #include "common.h" 29 1.1 rmind #include "extern.h" 30 1.1 rmind 31 1.1 rmind #define WIDTH 130 32 1.1 rmind /* 33 1.1 rmind * Each column must be at least one character wide, plus three 34 1.1 rmind * characters between the columns (space, [<|>], space). 35 1.1 rmind */ 36 1.1 rmind #define WIDTH_MIN 5 37 1.1 rmind 38 1.1 rmind /* A single diff line. */ 39 1.1 rmind struct diffline { 40 1.1 rmind SIMPLEQ_ENTRY(diffline) diffentries; 41 1.1 rmind char *left; 42 1.1 rmind char div; 43 1.1 rmind char *right; 44 1.1 rmind }; 45 1.1 rmind 46 1.1 rmind static void astrcat(char **, const char *); 47 1.1 rmind static void enqueue(char *, char, char *); 48 1.1 rmind static char *mktmpcpy(const char *); 49 1.1 rmind static void freediff(struct diffline *); 50 1.1 rmind static void int_usage(void); 51 1.1 rmind static int parsecmd(FILE *, FILE *, FILE *); 52 1.1 rmind static void printa(FILE *, size_t); 53 1.1 rmind static void printc(FILE *, size_t, FILE *, size_t); 54 1.1 rmind static void printcol(const char *, size_t *, const size_t); 55 1.1 rmind static void printd(FILE *, size_t); 56 1.1 rmind static void println(const char *, const char, const char *); 57 1.1 rmind static void processq(void); 58 1.1 rmind static void prompt(const char *, const char *); 59 1.1 rmind __dead static void usage(void); 60 1.1 rmind static char *xfgets(FILE *); 61 1.1 rmind 62 1.1 rmind SIMPLEQ_HEAD(, diffline) diffhead = SIMPLEQ_HEAD_INITIALIZER(diffhead); 63 1.1 rmind size_t line_width; /* width of a line (two columns and divider) */ 64 1.1 rmind size_t width; /* width of each column */ 65 1.1 rmind size_t file1ln, file2ln; /* line number of file1 and file2 */ 66 1.1 rmind int Iflag = 0; /* ignore sets matching regexp */ 67 1.1 rmind int lflag; /* print only left column for identical lines */ 68 1.1 rmind int sflag; /* skip identical lines */ 69 1.1 rmind FILE *outfile; /* file to save changes to */ 70 1.1 rmind const char *tmpdir; /* TMPDIR or /tmp */ 71 1.1 rmind 72 1.1 rmind static struct option longopts[] = { 73 1.1 rmind { "text", no_argument, NULL, 'a' }, 74 1.1 rmind { "ignore-blank-lines", no_argument, NULL, 'B' }, 75 1.1 rmind { "ignore-space-change", no_argument, NULL, 'b' }, 76 1.1 rmind { "minimal", no_argument, NULL, 'd' }, 77 1.1 rmind { "ignore-tab-expansion", no_argument, NULL, 'E' }, 78 1.1 rmind { "diff-program", required_argument, NULL, 'F' }, 79 1.1 rmind { "speed-large-files", no_argument, NULL, 'H' }, 80 1.1 rmind { "ignore-matching-lines", required_argument, NULL, 'I' }, 81 1.1 rmind { "left-column", no_argument, NULL, 'l' }, 82 1.1 rmind { "output", required_argument, NULL, 'o' }, 83 1.1 rmind { "strip-trailing-cr", no_argument, NULL, 'S' }, 84 1.1 rmind { "suppress-common-lines", no_argument, NULL, 's' }, 85 1.1 rmind { "expand-tabs", no_argument, NULL, 't' }, 86 1.1 rmind { "ignore-all-space", no_argument, NULL, 'W' }, 87 1.1 rmind { "width", required_argument, NULL, 'w' }, 88 1.1 rmind { NULL, 0, NULL, 0 } 89 1.1 rmind }; 90 1.1 rmind 91 1.1 rmind /* 92 1.1 rmind * Create temporary file if source_file is not a regular file. 93 1.1 rmind * Returns temporary file name if one was malloced, NULL if unnecessary. 94 1.1 rmind */ 95 1.1 rmind static char * 96 1.1 rmind mktmpcpy(const char *source_file) 97 1.1 rmind { 98 1.1 rmind struct stat sb; 99 1.1 rmind ssize_t rcount; 100 1.1 rmind int ifd, ofd; 101 1.1 rmind u_char buf[BUFSIZ]; 102 1.1 rmind char *target_file; 103 1.1 rmind 104 1.1 rmind /* Open input and output. */ 105 1.1 rmind ifd = open(source_file, O_RDONLY, 0); 106 1.1 rmind /* File was opened successfully. */ 107 1.1 rmind if (ifd != -1) { 108 1.1 rmind if (fstat(ifd, &sb) == -1) 109 1.1 rmind err(2, "error getting file status from %s", source_file); 110 1.1 rmind 111 1.1 rmind /* Regular file. */ 112 1.1 rmind if (S_ISREG(sb.st_mode)) 113 1.1 rmind return (NULL); 114 1.1 rmind } else { 115 1.1 rmind /* If ``-'' does not exist the user meant stdin. */ 116 1.1 rmind if (errno == ENOENT && strcmp(source_file, "-") == 0) 117 1.1 rmind ifd = STDIN_FILENO; 118 1.1 rmind else 119 1.1 rmind err(2, "error opening %s", source_file); 120 1.1 rmind } 121 1.1 rmind 122 1.1 rmind /* Not a regular file, so copy input into temporary file. */ 123 1.1 rmind if (asprintf(&target_file, "%s/sdiff.XXXXXXXXXX", tmpdir) == -1) 124 1.1 rmind err(2, "asprintf"); 125 1.1 rmind if ((ofd = mkstemp(target_file)) == -1) { 126 1.1 rmind warn("error opening %s", target_file); 127 1.1 rmind goto FAIL; 128 1.1 rmind } 129 1.1 rmind while ((rcount = read(ifd, buf, sizeof(buf))) != -1 && 130 1.1 rmind rcount != 0) { 131 1.1 rmind ssize_t wcount; 132 1.1 rmind 133 1.1 rmind wcount = write(ofd, buf, (size_t)rcount); 134 1.1 rmind if (-1 == wcount || rcount != wcount) { 135 1.1 rmind warn("error writing to %s", target_file); 136 1.1 rmind goto FAIL; 137 1.1 rmind } 138 1.1 rmind } 139 1.1 rmind if (rcount == -1) { 140 1.1 rmind warn("error reading from %s", source_file); 141 1.1 rmind goto FAIL; 142 1.1 rmind } 143 1.1 rmind 144 1.1 rmind close(ifd); 145 1.1 rmind close(ofd); 146 1.1 rmind 147 1.1 rmind return (target_file); 148 1.1 rmind 149 1.1 rmind FAIL: 150 1.1 rmind unlink(target_file); 151 1.1 rmind exit(2); 152 1.1 rmind } 153 1.1 rmind 154 1.1 rmind int 155 1.1 rmind main(int argc, char **argv) 156 1.1 rmind { 157 1.1 rmind FILE *diffpipe, *file1, *file2; 158 1.1 rmind size_t diffargc = 0, wflag = WIDTH; 159 1.1 rmind int ch, fd[2], status; 160 1.1 rmind pid_t pid; 161 1.1 rmind char **diffargv, *diffprog = "diff", *filename1, *filename2, 162 1.1 rmind *tmp1, *tmp2, *s1, *s2; 163 1.1 rmind 164 1.1 rmind /* 165 1.1 rmind * Process diff flags. 166 1.1 rmind */ 167 1.1 rmind /* 168 1.1 rmind * Allocate memory for diff arguments and NULL. 169 1.1 rmind * Each flag has at most one argument, so doubling argc gives an 170 1.1 rmind * upper limit of how many diff args can be passed. argv[0], 171 1.1 rmind * file1, and file2 won't have arguments so doubling them will 172 1.1 rmind * waste some memory; however we need an extra space for the 173 1.1 rmind * NULL at the end, so it sort of works out. 174 1.1 rmind */ 175 1.1 rmind if (!(diffargv = malloc(sizeof(char **) * argc * 2))) 176 1.1 rmind err(2, "main"); 177 1.1 rmind 178 1.1 rmind /* Add first argument, the program name. */ 179 1.1 rmind diffargv[diffargc++] = diffprog; 180 1.1 rmind 181 1.1 rmind while ((ch = getopt_long(argc, argv, "aBbdEHI:ilo:stWw:", 182 1.1 rmind longopts, NULL)) != -1) { 183 1.1 rmind const char *errstr; 184 1.1 rmind 185 1.1 rmind switch (ch) { 186 1.1 rmind case 'a': 187 1.1 rmind diffargv[diffargc++] = "-a"; 188 1.1 rmind break; 189 1.1 rmind case 'B': 190 1.1 rmind diffargv[diffargc++] = "-B"; 191 1.1 rmind break; 192 1.1 rmind case 'b': 193 1.1 rmind diffargv[diffargc++] = "-b"; 194 1.1 rmind break; 195 1.1 rmind case 'd': 196 1.1 rmind diffargv[diffargc++] = "-d"; 197 1.1 rmind break; 198 1.1 rmind case 'E': 199 1.1 rmind diffargv[diffargc++] = "-E"; 200 1.1 rmind break; 201 1.1 rmind case 'F': 202 1.1 rmind diffargv[0] = diffprog = optarg; 203 1.1 rmind break; 204 1.1 rmind case 'H': 205 1.1 rmind diffargv[diffargc++] = "-H"; 206 1.1 rmind break; 207 1.1 rmind case 'I': 208 1.1 rmind Iflag = 1; 209 1.1 rmind diffargv[diffargc++] = "-I"; 210 1.1 rmind diffargv[diffargc++] = optarg; 211 1.1 rmind break; 212 1.1 rmind case 'i': 213 1.1 rmind diffargv[diffargc++] = "-i"; 214 1.1 rmind break; 215 1.1 rmind case 'l': 216 1.1 rmind lflag = 1; 217 1.1 rmind break; 218 1.1 rmind case 'o': 219 1.1 rmind if ((outfile = fopen(optarg, "w")) == NULL) 220 1.1 rmind err(2, "could not open: %s", optarg); 221 1.1 rmind break; 222 1.1 rmind case 'S': 223 1.1 rmind diffargv[diffargc++] = "--strip-trailing-cr"; 224 1.1 rmind break; 225 1.1 rmind case 's': 226 1.1 rmind sflag = 1; 227 1.1 rmind break; 228 1.1 rmind case 't': 229 1.1 rmind diffargv[diffargc++] = "-t"; 230 1.1 rmind break; 231 1.1 rmind case 'W': 232 1.1 rmind diffargv[diffargc++] = "-w"; 233 1.1 rmind break; 234 1.1 rmind case 'w': 235 1.1 rmind wflag = strtonum(optarg, WIDTH_MIN, 236 1.1 rmind INT_MAX, &errstr); 237 1.1 rmind if (errstr) 238 1.1 rmind errx(2, "width is %s: %s", errstr, optarg); 239 1.1 rmind break; 240 1.1 rmind default: 241 1.1 rmind usage(); 242 1.1 rmind } 243 1.1 rmind 244 1.1 rmind } 245 1.1 rmind argc -= optind; 246 1.1 rmind argv += optind; 247 1.1 rmind 248 1.1 rmind if (argc != 2) 249 1.1 rmind usage(); 250 1.1 rmind 251 1.1 rmind if ((tmpdir = getenv("TMPDIR")) == NULL) 252 1.1 rmind tmpdir = _PATH_TMP; 253 1.1 rmind 254 1.1 rmind filename1 = argv[0]; 255 1.1 rmind filename2 = argv[1]; 256 1.1 rmind 257 1.1 rmind /* 258 1.1 rmind * Create temporary files for diff and sdiff to share if file1 259 1.1 rmind * or file2 are not regular files. This allows sdiff and diff 260 1.1 rmind * to read the same inputs if one or both inputs are stdin. 261 1.1 rmind * 262 1.1 rmind * If any temporary files were created, their names would be 263 1.1 rmind * saved in tmp1 or tmp2. tmp1 should never equal tmp2. 264 1.1 rmind */ 265 1.1 rmind tmp1 = tmp2 = NULL; 266 1.1 rmind /* file1 and file2 are the same, so copy to same temp file. */ 267 1.1 rmind if (strcmp(filename1, filename2) == 0) { 268 1.1 rmind if ((tmp1 = mktmpcpy(filename1))) 269 1.1 rmind filename1 = filename2 = tmp1; 270 1.1 rmind /* Copy file1 and file2 into separate temp files. */ 271 1.1 rmind } else { 272 1.1 rmind if ((tmp1 = mktmpcpy(filename1))) 273 1.1 rmind filename1 = tmp1; 274 1.1 rmind if ((tmp2 = mktmpcpy(filename2))) 275 1.1 rmind filename2 = tmp2; 276 1.1 rmind } 277 1.1 rmind 278 1.1 rmind diffargv[diffargc++] = filename1; 279 1.1 rmind diffargv[diffargc++] = filename2; 280 1.1 rmind /* Add NULL to end of array to indicate end of array. */ 281 1.1 rmind diffargv[diffargc++] = NULL; 282 1.1 rmind 283 1.1 rmind /* Subtract column divider and divide by two. */ 284 1.1 rmind width = (wflag - 3) / 2; 285 1.1 rmind /* Make sure line_width can fit in size_t. */ 286 1.1 rmind if (width > (SIZE_T_MAX - 3) / 2) 287 1.1 rmind errx(2, "width is too large: %zu", width); 288 1.1 rmind line_width = width * 2 + 3; 289 1.1 rmind 290 1.1 rmind if (pipe(fd)) 291 1.1 rmind err(2, "pipe"); 292 1.1 rmind 293 1.1 rmind switch(pid = fork()) { 294 1.1 rmind case 0: 295 1.1 rmind /* child */ 296 1.1 rmind /* We don't read from the pipe. */ 297 1.1 rmind close(fd[0]); 298 1.1 rmind if (dup2(fd[1], STDOUT_FILENO) == -1) 299 1.1 rmind err(2, "child could not duplicate descriptor"); 300 1.1 rmind /* Free unused descriptor. */ 301 1.1 rmind close(fd[1]); 302 1.1 rmind 303 1.1 rmind execvp(diffprog, diffargv); 304 1.1 rmind err(2, "could not execute diff: %s", diffprog); 305 1.1 rmind case -1: 306 1.1 rmind err(2, "could not fork"); 307 1.1 rmind } 308 1.1 rmind 309 1.1 rmind /* parent */ 310 1.1 rmind /* We don't write to the pipe. */ 311 1.1 rmind close(fd[1]); 312 1.1 rmind 313 1.1 rmind /* Open pipe to diff command. */ 314 1.1 rmind if ((diffpipe = fdopen(fd[0], "r")) == NULL) 315 1.1 rmind err(2, "could not open diff pipe"); 316 1.1 rmind if ((file1 = fopen(filename1, "r")) == NULL) 317 1.1 rmind err(2, "could not open %s", filename1); 318 1.1 rmind if ((file2 = fopen(filename2, "r")) == NULL) 319 1.1 rmind err(2, "could not open %s", filename2); 320 1.1 rmind 321 1.1 rmind /* Line numbers start at one. */ 322 1.1 rmind file1ln = file2ln = 1; 323 1.1 rmind 324 1.1 rmind /* Read and parse diff output. */ 325 1.1 rmind while (parsecmd(diffpipe, file1, file2) != EOF) 326 1.1 rmind ; 327 1.1 rmind fclose(diffpipe); 328 1.1 rmind 329 1.1 rmind /* Wait for diff to exit. */ 330 1.1 rmind if (waitpid(pid, &status, 0) == -1 || !WIFEXITED(status) || 331 1.1 rmind WEXITSTATUS(status) >= 2) 332 1.1 rmind err(2, "diff exited abnormally"); 333 1.1 rmind 334 1.1 rmind /* Delete and free unneeded temporary files. */ 335 1.1 rmind if (tmp1) 336 1.1 rmind if (unlink(tmp1)) 337 1.1 rmind warn("error deleting %s", tmp1); 338 1.1 rmind if (tmp2) 339 1.1 rmind if (unlink(tmp2)) 340 1.1 rmind warn("error deleting %s", tmp2); 341 1.1 rmind free(tmp1); 342 1.1 rmind free(tmp2); 343 1.1 rmind filename1 = filename2 = tmp1 = tmp2 = NULL; 344 1.1 rmind 345 1.1 rmind /* No more diffs, so print common lines. */ 346 1.1 rmind if (lflag) 347 1.1 rmind while ((s1 = xfgets(file1))) 348 1.1 rmind enqueue(s1, ' ', NULL); 349 1.1 rmind else 350 1.1 rmind for (;;) { 351 1.1 rmind s1 = xfgets(file1); 352 1.1 rmind s2 = xfgets(file2); 353 1.1 rmind if (s1 || s2) 354 1.1 rmind enqueue(s1, ' ', s2); 355 1.1 rmind else 356 1.1 rmind break; 357 1.1 rmind } 358 1.1 rmind fclose(file1); 359 1.1 rmind fclose(file2); 360 1.1 rmind /* Process unmodified lines. */ 361 1.1 rmind processq(); 362 1.1 rmind 363 1.1 rmind /* Return diff exit status. */ 364 1.1 rmind return (WEXITSTATUS(status)); 365 1.1 rmind } 366 1.1 rmind 367 1.1 rmind /* 368 1.1 rmind * Prints an individual column (left or right), taking into account 369 1.1 rmind * that tabs are variable-width. Takes a string, the current column 370 1.1 rmind * the cursor is on the screen, and the maximum value of the column. 371 1.1 rmind * The column value is updated as we go along. 372 1.1 rmind */ 373 1.1 rmind static void 374 1.1 rmind printcol(const char *s, size_t *col, const size_t col_max) 375 1.1 rmind { 376 1.1 rmind 377 1.1 rmind for (; *s && *col < col_max; ++s) { 378 1.1 rmind size_t new_col; 379 1.1 rmind 380 1.1 rmind switch (*s) { 381 1.1 rmind case '\t': 382 1.1 rmind /* 383 1.1 rmind * If rounding to next multiple of eight causes 384 1.1 rmind * an integer overflow, just return. 385 1.1 rmind */ 386 1.1 rmind if (*col > SIZE_T_MAX - 8) 387 1.1 rmind return; 388 1.1 rmind 389 1.1 rmind /* Round to next multiple of eight. */ 390 1.1 rmind new_col = (*col / 8 + 1) * 8; 391 1.1 rmind 392 1.1 rmind /* 393 1.1 rmind * If printing the tab goes past the column 394 1.1 rmind * width, don't print it and just quit. 395 1.1 rmind */ 396 1.1 rmind if (new_col > col_max) 397 1.1 rmind return; 398 1.1 rmind *col = new_col; 399 1.1 rmind break; 400 1.1 rmind 401 1.1 rmind default: 402 1.1 rmind ++(*col); 403 1.1 rmind } 404 1.1 rmind 405 1.1 rmind putchar(*s); 406 1.1 rmind } 407 1.1 rmind } 408 1.1 rmind 409 1.1 rmind /* 410 1.1 rmind * Prompts user to either choose between two strings or edit one, both, 411 1.1 rmind * or neither. 412 1.1 rmind */ 413 1.1 rmind static void 414 1.1 rmind prompt(const char *s1, const char *s2) 415 1.1 rmind { 416 1.1 rmind char *cmd; 417 1.1 rmind 418 1.1 rmind /* Print command prompt. */ 419 1.1 rmind putchar('%'); 420 1.1 rmind 421 1.1 rmind /* Get user input. */ 422 1.1 rmind for (; (cmd = xfgets(stdin)); free(cmd)) { 423 1.1 rmind const char *p; 424 1.1 rmind 425 1.1 rmind /* Skip leading whitespace. */ 426 1.3 rillig for (p = cmd; isspace((unsigned char)(*p)); ++p) 427 1.1 rmind ; 428 1.1 rmind 429 1.1 rmind switch (*p) { 430 1.1 rmind case 'e': 431 1.1 rmind /* Skip `e'. */ 432 1.1 rmind ++p; 433 1.1 rmind 434 1.1 rmind if (eparse(p, s1, s2) == -1) 435 1.1 rmind goto USAGE; 436 1.1 rmind break; 437 1.1 rmind 438 1.1 rmind case 'l': 439 1.1 rmind /* Choose left column as-is. */ 440 1.1 rmind if (s1 != NULL) 441 1.1 rmind fprintf(outfile, "%s\n", s1); 442 1.1 rmind 443 1.1 rmind /* End of command parsing. */ 444 1.1 rmind break; 445 1.1 rmind 446 1.1 rmind case 'q': 447 1.1 rmind goto QUIT; 448 1.1 rmind 449 1.1 rmind case 'r': 450 1.1 rmind /* Choose right column as-is. */ 451 1.1 rmind if (s2 != NULL) 452 1.1 rmind fprintf(outfile, "%s\n", s2); 453 1.1 rmind 454 1.1 rmind /* End of command parsing. */ 455 1.1 rmind break; 456 1.1 rmind 457 1.1 rmind case 's': 458 1.1 rmind sflag = 1; 459 1.1 rmind goto PROMPT; 460 1.1 rmind 461 1.1 rmind case 'v': 462 1.1 rmind sflag = 0; 463 1.1 rmind /* FALLTHROUGH */ 464 1.1 rmind 465 1.1 rmind default: 466 1.1 rmind /* Interactive usage help. */ 467 1.1 rmind USAGE: 468 1.1 rmind int_usage(); 469 1.1 rmind PROMPT: 470 1.1 rmind putchar('%'); 471 1.1 rmind 472 1.1 rmind /* Prompt user again. */ 473 1.1 rmind continue; 474 1.1 rmind } 475 1.1 rmind 476 1.1 rmind free(cmd); 477 1.1 rmind return; 478 1.1 rmind } 479 1.1 rmind 480 1.1 rmind /* 481 1.1 rmind * If there was no error, we received an EOF from stdin, so we 482 1.1 rmind * should quit. 483 1.1 rmind */ 484 1.1 rmind QUIT: 485 1.1 rmind fclose(outfile); 486 1.1 rmind exit(0); 487 1.1 rmind } 488 1.1 rmind 489 1.1 rmind /* 490 1.1 rmind * Takes two strings, separated by a column divider. NULL strings are 491 1.1 rmind * treated as empty columns. If the divider is the ` ' character, the 492 1.1 rmind * second column is not printed (-l flag). In this case, the second 493 1.1 rmind * string must be NULL. When the second column is NULL, the divider 494 1.1 rmind * does not print the trailing space following the divider character. 495 1.1 rmind * 496 1.1 rmind * Takes into account that tabs can take multiple columns. 497 1.1 rmind */ 498 1.1 rmind static void 499 1.2 lukem println(const char *s1, const char divc, const char *s2) 500 1.1 rmind { 501 1.1 rmind size_t col; 502 1.1 rmind 503 1.1 rmind /* Print first column. Skips if s1 == NULL. */ 504 1.1 rmind col = 0; 505 1.1 rmind if (s1) { 506 1.1 rmind /* Skip angle bracket and space. */ 507 1.1 rmind printcol(s1, &col, width); 508 1.1 rmind 509 1.1 rmind } 510 1.1 rmind 511 1.1 rmind /* Only print left column. */ 512 1.2 lukem if (divc == ' ' && !s2) { 513 1.1 rmind putchar('\n'); 514 1.1 rmind return; 515 1.1 rmind } 516 1.1 rmind 517 1.1 rmind /* Otherwise, we pad this column up to width. */ 518 1.1 rmind for (; col < width; ++col) 519 1.1 rmind putchar(' '); 520 1.1 rmind 521 1.1 rmind /* 522 1.1 rmind * Print column divider. If there is no second column, we don't 523 1.1 rmind * need to add the space for padding. 524 1.1 rmind */ 525 1.1 rmind if (!s2) { 526 1.2 lukem printf(" %c\n", divc); 527 1.1 rmind return; 528 1.1 rmind } 529 1.2 lukem printf(" %c ", divc); 530 1.1 rmind col += 3; 531 1.1 rmind 532 1.1 rmind /* Skip angle bracket and space. */ 533 1.1 rmind printcol(s2, &col, line_width); 534 1.1 rmind 535 1.1 rmind putchar('\n'); 536 1.1 rmind } 537 1.1 rmind 538 1.1 rmind /* 539 1.1 rmind * Reads a line from file and returns as a string. If EOF is reached, 540 1.1 rmind * NULL is returned. The returned string must be freed afterwards. 541 1.1 rmind */ 542 1.1 rmind static char * 543 1.1 rmind xfgets(FILE *file) 544 1.1 rmind { 545 1.1 rmind const char delim[3] = {'\0', '\0', '\0'}; 546 1.1 rmind char *s; 547 1.1 rmind 548 1.1 rmind /* XXX - Is this necessary? */ 549 1.1 rmind clearerr(file); 550 1.1 rmind 551 1.1 rmind if (!(s = fparseln(file, NULL, NULL, delim, 0)) && 552 1.1 rmind ferror(file)) 553 1.1 rmind err(2, "error reading file"); 554 1.1 rmind 555 1.1 rmind if (!s) { 556 1.1 rmind return (NULL); 557 1.1 rmind } 558 1.1 rmind 559 1.1 rmind return (s); 560 1.1 rmind } 561 1.1 rmind 562 1.1 rmind /* 563 1.1 rmind * Parse ed commands from diffpipe and print lines from file1 (lines 564 1.1 rmind * to change or delete) or file2 (lines to add or change). 565 1.1 rmind * Returns EOF or 0. 566 1.1 rmind */ 567 1.1 rmind static int 568 1.1 rmind parsecmd(FILE *diffpipe, FILE *file1, FILE *file2) 569 1.1 rmind { 570 1.1 rmind size_t file1start, file1end, file2start, file2end, n; 571 1.1 rmind /* ed command line and pointer to characters in line */ 572 1.1 rmind char *line, *p, *q; 573 1.1 rmind const char *errstr; 574 1.1 rmind char c, cmd; 575 1.1 rmind 576 1.1 rmind /* Read ed command. */ 577 1.1 rmind if (!(line = xfgets(diffpipe))) 578 1.1 rmind return (EOF); 579 1.1 rmind 580 1.1 rmind p = line; 581 1.1 rmind /* Go to character after line number. */ 582 1.3 rillig while (isdigit((unsigned char)(*p))) 583 1.1 rmind ++p; 584 1.1 rmind c = *p; 585 1.1 rmind *p++ = 0; 586 1.1 rmind file1start = strtonum(line, 0, INT_MAX, &errstr); 587 1.1 rmind if (errstr) 588 1.1 rmind errx(2, "file1 start is %s: %s", errstr, line); 589 1.1 rmind 590 1.1 rmind /* A range is specified for file1. */ 591 1.1 rmind if (c == ',') { 592 1.1 rmind 593 1.1 rmind q = p; 594 1.1 rmind /* Go to character after file2end. */ 595 1.3 rillig while (isdigit((unsigned char)(*p))) 596 1.1 rmind ++p; 597 1.1 rmind c = *p; 598 1.1 rmind *p++ = 0; 599 1.1 rmind file1end = strtonum(q, 0, INT_MAX, &errstr); 600 1.1 rmind if (errstr) 601 1.1 rmind errx(2, "file1 end is %s: %s", errstr, line); 602 1.1 rmind if (file1start > file1end) 603 1.1 rmind errx(2, "invalid line range in file1: %s", line); 604 1.1 rmind 605 1.1 rmind } else 606 1.1 rmind file1end = file1start; 607 1.1 rmind 608 1.1 rmind cmd = c; 609 1.1 rmind /* Check that cmd is valid. */ 610 1.1 rmind if (!(cmd == 'a' || cmd == 'c' || cmd == 'd')) 611 1.1 rmind errx(2, "ed command not recognized: %c: %s", cmd, line); 612 1.1 rmind 613 1.1 rmind q = p; 614 1.1 rmind /* Go to character after line number. */ 615 1.3 rillig while (isdigit((unsigned char)(*p))) 616 1.1 rmind ++p; 617 1.1 rmind c = *p; 618 1.1 rmind *p++ = 0; 619 1.1 rmind file2start = strtonum(q, 0, INT_MAX, &errstr); 620 1.1 rmind if (errstr) 621 1.1 rmind errx(2, "file2 start is %s: %s", errstr, line); 622 1.1 rmind 623 1.1 rmind /* 624 1.1 rmind * There should either be a comma signifying a second line 625 1.1 rmind * number or the line should just end here. 626 1.1 rmind */ 627 1.1 rmind if (c != ',' && c != '\0') 628 1.1 rmind errx(2, "invalid line range in file2: %c: %s", c, line); 629 1.1 rmind 630 1.1 rmind if (c == ',') { 631 1.1 rmind 632 1.1 rmind file2end = strtonum(p, 0, INT_MAX, &errstr); 633 1.1 rmind if (errstr) 634 1.1 rmind errx(2, "file2 end is %s: %s", errstr, line); 635 1.1 rmind if (file2start >= file2end) 636 1.1 rmind errx(2, "invalid line range in file2: %s", line); 637 1.1 rmind } else 638 1.1 rmind file2end = file2start; 639 1.1 rmind 640 1.1 rmind /* Appends happen _after_ stated line. */ 641 1.1 rmind if (cmd == 'a') { 642 1.1 rmind if (file1start != file1end) 643 1.1 rmind errx(2, "append cannot have a file1 range: %s", 644 1.1 rmind line); 645 1.1 rmind if (file1start == SIZE_T_MAX) 646 1.1 rmind errx(2, "file1 line range too high: %s", line); 647 1.1 rmind file1start = ++file1end; 648 1.1 rmind } 649 1.1 rmind /* 650 1.1 rmind * I'm not sure what the deal is with the line numbers for 651 1.1 rmind * deletes, though. 652 1.1 rmind */ 653 1.1 rmind else if (cmd == 'd') { 654 1.1 rmind if (file2start != file2end) 655 1.1 rmind errx(2, "delete cannot have a file2 range: %s", 656 1.1 rmind line); 657 1.1 rmind if (file2start == SIZE_T_MAX) 658 1.1 rmind errx(2, "file2 line range too high: %s", line); 659 1.1 rmind file2start = ++file2end; 660 1.1 rmind } 661 1.1 rmind 662 1.1 rmind /* 663 1.1 rmind * Continue reading file1 and file2 until we reach line numbers 664 1.1 rmind * specified by diff. Should only happen with -I flag. 665 1.1 rmind */ 666 1.1 rmind for (; file1ln < file1start && file2ln < file2start; 667 1.1 rmind ++file1ln, ++file2ln) { 668 1.1 rmind char *s1, *s2; 669 1.1 rmind 670 1.1 rmind if (!(s1 = xfgets(file1))) 671 1.1 rmind errx(2, "file1 shorter than expected"); 672 1.1 rmind if (!(s2 = xfgets(file2))) 673 1.1 rmind errx(2, "file2 shorter than expected"); 674 1.1 rmind 675 1.1 rmind /* If the -l flag was specified, print only left column. */ 676 1.1 rmind if (lflag) { 677 1.1 rmind free(s2); 678 1.1 rmind /* 679 1.1 rmind * XXX - If -l and -I are both specified, all 680 1.1 rmind * unchanged or ignored lines are shown with a 681 1.1 rmind * `(' divider. This matches GNU sdiff, but I 682 1.1 rmind * believe it is a bug. Just check out: 683 1.1 rmind * gsdiff -l -I '^$' samefile samefile. 684 1.1 rmind */ 685 1.1 rmind if (Iflag) 686 1.1 rmind enqueue(s1, '(', NULL); 687 1.1 rmind else 688 1.1 rmind enqueue(s1, ' ', NULL); 689 1.1 rmind } else 690 1.1 rmind enqueue(s1, ' ', s2); 691 1.1 rmind } 692 1.1 rmind /* Ignore deleted lines. */ 693 1.1 rmind for (; file1ln < file1start; ++file1ln) { 694 1.1 rmind char *s; 695 1.1 rmind 696 1.1 rmind if (!(s = xfgets(file1))) 697 1.1 rmind errx(2, "file1 shorter than expected"); 698 1.1 rmind 699 1.1 rmind enqueue(s, '(', NULL); 700 1.1 rmind } 701 1.1 rmind /* Ignore added lines. */ 702 1.1 rmind for (; file2ln < file2start; ++file2ln) { 703 1.1 rmind char *s; 704 1.1 rmind 705 1.1 rmind if (!(s = xfgets(file2))) 706 1.1 rmind errx(2, "file2 shorter than expected"); 707 1.1 rmind 708 1.1 rmind /* If -l flag was given, don't print right column. */ 709 1.1 rmind if (lflag) 710 1.1 rmind free(s); 711 1.1 rmind else 712 1.1 rmind enqueue(NULL, ')', s); 713 1.1 rmind } 714 1.1 rmind 715 1.1 rmind /* Process unmodified or skipped lines. */ 716 1.1 rmind processq(); 717 1.1 rmind 718 1.1 rmind switch (cmd) { 719 1.1 rmind case 'a': 720 1.1 rmind printa(file2, file2end); 721 1.1 rmind n = file2end - file2start + 1; 722 1.1 rmind break; 723 1.1 rmind 724 1.1 rmind case 'c': 725 1.1 rmind printc(file1, file1end, file2, file2end); 726 1.1 rmind n = file1end - file1start + 1 + 1 + file2end - file2start + 1; 727 1.1 rmind break; 728 1.1 rmind 729 1.1 rmind case 'd': 730 1.1 rmind printd(file1, file1end); 731 1.1 rmind n = file1end - file1start + 1; 732 1.1 rmind break; 733 1.1 rmind 734 1.1 rmind default: 735 1.1 rmind errx(2, "invalid diff command: %c: %s", cmd, line); 736 1.1 rmind } 737 1.1 rmind 738 1.1 rmind /* Skip to next ed line. */ 739 1.1 rmind while (n--) 740 1.1 rmind if (!xfgets(diffpipe)) 741 1.1 rmind errx(2, "diff ended early"); 742 1.1 rmind 743 1.1 rmind return (0); 744 1.1 rmind } 745 1.1 rmind 746 1.1 rmind /* 747 1.1 rmind * Queues up a diff line. 748 1.1 rmind */ 749 1.1 rmind static void 750 1.2 lukem enqueue(char *left, char divc, char *right) 751 1.1 rmind { 752 1.1 rmind struct diffline *diffp; 753 1.1 rmind 754 1.1 rmind if (!(diffp = malloc(sizeof(struct diffline)))) 755 1.1 rmind err(2, "enqueue"); 756 1.1 rmind diffp->left = left; 757 1.2 lukem diffp->div = divc; 758 1.1 rmind diffp->right = right; 759 1.1 rmind SIMPLEQ_INSERT_TAIL(&diffhead, diffp, diffentries); 760 1.1 rmind } 761 1.1 rmind 762 1.1 rmind /* 763 1.1 rmind * Free a diffline structure and its elements. 764 1.1 rmind */ 765 1.1 rmind static void 766 1.1 rmind freediff(struct diffline *diffp) 767 1.1 rmind { 768 1.1 rmind free(diffp->left); 769 1.1 rmind free(diffp->right); 770 1.1 rmind free(diffp); 771 1.1 rmind } 772 1.1 rmind 773 1.1 rmind /* 774 1.1 rmind * Append second string into first. Repeated appends to the same string 775 1.1 rmind * are cached, making this an O(n) function, where n = strlen(append). 776 1.1 rmind */ 777 1.1 rmind static void 778 1.1 rmind astrcat(char **s, const char *append) 779 1.1 rmind { 780 1.1 rmind /* Length of string in previous run. */ 781 1.1 rmind static size_t offset = 0; 782 1.1 rmind size_t newsiz; 783 1.1 rmind /* 784 1.1 rmind * String from previous run. Compared to *s to see if we are 785 1.1 rmind * dealing with the same string. If so, we can use offset. 786 1.1 rmind */ 787 1.1 rmind static const char *oldstr = NULL; 788 1.1 rmind char *newstr; 789 1.1 rmind 790 1.1 rmind 791 1.1 rmind /* 792 1.1 rmind * First string is NULL, so just copy append. 793 1.1 rmind */ 794 1.1 rmind if (!*s) { 795 1.1 rmind if (!(*s = strdup(append))) 796 1.1 rmind err(2, "astrcat"); 797 1.1 rmind 798 1.1 rmind /* Keep track of string. */ 799 1.1 rmind offset = strlen(*s); 800 1.1 rmind oldstr = *s; 801 1.1 rmind 802 1.1 rmind return; 803 1.1 rmind } 804 1.1 rmind 805 1.1 rmind /* 806 1.1 rmind * *s is a string so concatenate. 807 1.1 rmind */ 808 1.1 rmind 809 1.1 rmind /* Did we process the same string in the last run? */ 810 1.1 rmind /* 811 1.1 rmind * If this is a different string from the one we just processed 812 1.1 rmind * cache new string. 813 1.1 rmind */ 814 1.1 rmind if (oldstr != *s) { 815 1.1 rmind offset = strlen(*s); 816 1.1 rmind oldstr = *s; 817 1.1 rmind } 818 1.1 rmind 819 1.1 rmind /* Size = strlen(*s) + \n + strlen(append) + '\0'. */ 820 1.1 rmind newsiz = offset + 1 + strlen(append) + 1; 821 1.1 rmind 822 1.1 rmind /* Resize *s to fit new string. */ 823 1.1 rmind newstr = realloc(*s, newsiz); 824 1.1 rmind if (newstr == NULL) 825 1.1 rmind err(2, "astrcat"); 826 1.1 rmind *s = newstr; 827 1.1 rmind 828 1.1 rmind /* *s + offset should be end of string. */ 829 1.1 rmind /* Concatenate. */ 830 1.1 rmind strlcpy(*s + offset, "\n", newsiz - offset); 831 1.1 rmind strlcat(*s + offset, append, newsiz - offset); 832 1.1 rmind 833 1.1 rmind /* New string length should be exactly newsiz - 1 characters. */ 834 1.1 rmind /* Store generated string's values. */ 835 1.1 rmind offset = newsiz - 1; 836 1.1 rmind oldstr = *s; 837 1.1 rmind } 838 1.1 rmind 839 1.1 rmind /* 840 1.1 rmind * Process diff set queue, printing, prompting, and saving each diff 841 1.1 rmind * line stored in queue. 842 1.1 rmind */ 843 1.1 rmind static void 844 1.1 rmind processq(void) 845 1.1 rmind { 846 1.1 rmind struct diffline *diffp; 847 1.1 rmind char divc, *left, *right; 848 1.1 rmind 849 1.1 rmind /* Don't process empty queue. */ 850 1.1 rmind if (SIMPLEQ_EMPTY(&diffhead)) 851 1.1 rmind return; 852 1.1 rmind 853 1.1 rmind /* Remember the divider. */ 854 1.1 rmind divc = SIMPLEQ_FIRST(&diffhead)->div; 855 1.1 rmind 856 1.1 rmind left = NULL; 857 1.1 rmind right = NULL; 858 1.1 rmind /* 859 1.1 rmind * Go through set of diffs, concatenating each line in left or 860 1.1 rmind * right column into two long strings, `left' and `right'. 861 1.1 rmind */ 862 1.1 rmind SIMPLEQ_FOREACH(diffp, &diffhead, diffentries) { 863 1.1 rmind /* 864 1.1 rmind * Print changed lines if -s was given, 865 1.1 rmind * print all lines if -s was not given. 866 1.1 rmind */ 867 1.1 rmind if (!sflag || diffp->div == '|' || diffp->div == '<' || 868 1.1 rmind diffp->div == '>') 869 1.1 rmind println(diffp->left, diffp->div, diffp->right); 870 1.1 rmind 871 1.1 rmind /* Append new lines to diff set. */ 872 1.1 rmind if (diffp->left) 873 1.1 rmind astrcat(&left, diffp->left); 874 1.1 rmind if (diffp->right) 875 1.1 rmind astrcat(&right, diffp->right); 876 1.1 rmind } 877 1.1 rmind 878 1.1 rmind /* Empty queue and free each diff line and its elements. */ 879 1.1 rmind while (!SIMPLEQ_EMPTY(&diffhead)) { 880 1.1 rmind diffp = SIMPLEQ_FIRST(&diffhead); 881 1.1 rmind SIMPLEQ_REMOVE_HEAD(&diffhead, diffentries); 882 1.1 rmind freediff(diffp); 883 1.1 rmind } 884 1.1 rmind 885 1.1 rmind /* Write to outfile, prompting user if lines are different. */ 886 1.1 rmind if (outfile) 887 1.1 rmind switch (divc) { 888 1.1 rmind case ' ': case '(': case ')': 889 1.1 rmind fprintf(outfile, "%s\n", left); 890 1.1 rmind break; 891 1.1 rmind case '|': case '<': case '>': 892 1.1 rmind prompt(left, right); 893 1.1 rmind break; 894 1.1 rmind default: 895 1.1 rmind errx(2, "invalid divider: %c", divc); 896 1.1 rmind } 897 1.1 rmind 898 1.1 rmind /* Free left and right. */ 899 1.1 rmind free(left); 900 1.1 rmind free(right); 901 1.1 rmind } 902 1.1 rmind 903 1.1 rmind /* 904 1.1 rmind * Print lines following an (a)ppend command. 905 1.1 rmind */ 906 1.1 rmind static void 907 1.1 rmind printa(FILE *file, size_t line2) 908 1.1 rmind { 909 1.1 rmind char *line; 910 1.1 rmind 911 1.1 rmind for (; file2ln <= line2; ++file2ln) { 912 1.1 rmind if (!(line = xfgets(file))) 913 1.1 rmind errx(2, "append ended early"); 914 1.1 rmind enqueue(NULL, '>', line); 915 1.1 rmind } 916 1.1 rmind 917 1.1 rmind processq(); 918 1.1 rmind } 919 1.1 rmind 920 1.1 rmind /* 921 1.1 rmind * Print lines following a (c)hange command, from file1ln to file1end 922 1.1 rmind * and from file2ln to file2end. 923 1.1 rmind */ 924 1.1 rmind static void 925 1.1 rmind printc(FILE *file1, size_t file1end, FILE *file2, size_t file2end) 926 1.1 rmind { 927 1.1 rmind struct fileline { 928 1.1 rmind SIMPLEQ_ENTRY(fileline) fileentries; 929 1.1 rmind char *line; 930 1.1 rmind }; 931 1.1 rmind SIMPLEQ_HEAD(, fileline) delqhead = SIMPLEQ_HEAD_INITIALIZER(delqhead); 932 1.1 rmind 933 1.1 rmind /* Read lines to be deleted. */ 934 1.1 rmind for (; file1ln <= file1end; ++file1ln) { 935 1.1 rmind struct fileline *linep; 936 1.1 rmind char *line1; 937 1.1 rmind 938 1.1 rmind /* Read lines from both. */ 939 1.1 rmind if (!(line1 = xfgets(file1))) 940 1.1 rmind errx(2, "error reading file1 in delete in change"); 941 1.1 rmind 942 1.1 rmind /* Add to delete queue. */ 943 1.1 rmind if (!(linep = malloc(sizeof(struct fileline)))) 944 1.1 rmind err(2, "printc"); 945 1.1 rmind linep->line = line1; 946 1.1 rmind SIMPLEQ_INSERT_TAIL(&delqhead, linep, fileentries); 947 1.1 rmind } 948 1.1 rmind 949 1.1 rmind /* Process changed lines.. */ 950 1.1 rmind for (; !SIMPLEQ_EMPTY(&delqhead) && file2ln <= file2end; 951 1.1 rmind ++file2ln) { 952 1.1 rmind struct fileline *del; 953 1.1 rmind char *add; 954 1.1 rmind 955 1.1 rmind /* Get add line. */ 956 1.1 rmind if (!(add = xfgets(file2))) 957 1.1 rmind errx(2, "error reading add in change"); 958 1.1 rmind 959 1.1 rmind del = SIMPLEQ_FIRST(&delqhead); 960 1.1 rmind enqueue(del->line, '|', add); 961 1.1 rmind SIMPLEQ_REMOVE_HEAD(&delqhead, fileentries); 962 1.1 rmind /* 963 1.1 rmind * Free fileline structure but not its elements since 964 1.1 rmind * they are queued up. 965 1.1 rmind */ 966 1.1 rmind free(del); 967 1.1 rmind } 968 1.1 rmind processq(); 969 1.1 rmind 970 1.1 rmind /* Process remaining lines to add. */ 971 1.1 rmind for (; file2ln <= file2end; ++file2ln) { 972 1.1 rmind char *add; 973 1.1 rmind 974 1.1 rmind /* Get add line. */ 975 1.1 rmind if (!(add = xfgets(file2))) 976 1.1 rmind errx(2, "error reading add in change"); 977 1.1 rmind 978 1.1 rmind enqueue(NULL, '>', add); 979 1.1 rmind } 980 1.1 rmind processq(); 981 1.1 rmind 982 1.1 rmind /* Process remaining lines to delete. */ 983 1.1 rmind while (!SIMPLEQ_EMPTY(&delqhead)) { 984 1.1 rmind struct fileline *filep; 985 1.1 rmind 986 1.1 rmind filep = SIMPLEQ_FIRST(&delqhead); 987 1.1 rmind enqueue(filep->line, '<', NULL); 988 1.1 rmind SIMPLEQ_REMOVE_HEAD(&delqhead, fileentries); 989 1.1 rmind free(filep); 990 1.1 rmind } 991 1.1 rmind processq(); 992 1.1 rmind } 993 1.1 rmind 994 1.1 rmind /* 995 1.1 rmind * Print deleted lines from file, from file1ln to file1end. 996 1.1 rmind */ 997 1.1 rmind static void 998 1.1 rmind printd(FILE *file1, size_t file1end) 999 1.1 rmind { 1000 1.1 rmind char *line1; 1001 1.1 rmind 1002 1.1 rmind /* Print out lines file1ln to line2. */ 1003 1.1 rmind for (; file1ln <= file1end; ++file1ln) { 1004 1.1 rmind /* XXX - Why can't this handle stdin? */ 1005 1.1 rmind if (!(line1 = xfgets(file1))) 1006 1.1 rmind errx(2, "file1 ended early in delete"); 1007 1.1 rmind enqueue(line1, '<', NULL); 1008 1.1 rmind } 1009 1.1 rmind processq(); 1010 1.1 rmind } 1011 1.1 rmind 1012 1.1 rmind /* 1013 1.1 rmind * Interactive mode usage. 1014 1.1 rmind */ 1015 1.1 rmind static void 1016 1.1 rmind int_usage(void) 1017 1.1 rmind { 1018 1.1 rmind puts("e:\tedit blank diff\n" 1019 1.1 rmind "eb:\tedit both diffs concatenated\n" 1020 1.1 rmind "el:\tedit left diff\n" 1021 1.1 rmind "er:\tedit right diff\n" 1022 1.1 rmind "l:\tchoose left diff\n" 1023 1.1 rmind "r:\tchoose right diff\n" 1024 1.1 rmind "s:\tsilent mode--don't print identical lines\n" 1025 1.1 rmind "v:\tverbose mode--print identical lines\n" 1026 1.1 rmind "q:\tquit"); 1027 1.1 rmind } 1028 1.1 rmind 1029 1.1 rmind static void 1030 1.1 rmind usage(void) 1031 1.1 rmind { 1032 1.1 rmind extern char *__progname; 1033 1.1 rmind 1034 1.1 rmind fprintf(stderr, 1035 1.1 rmind "usage: %s [-abdilstW] [-I regexp] [-o outfile] [-w width] file1 file2\n", 1036 1.1 rmind __progname); 1037 1.1 rmind exit(2); 1038 1.1 rmind } 1039