Home | History | Annotate | Line # | Download | only in nl
nl.c revision 1.9
      1  1.9   lukem /*	$NetBSD: nl.c,v 1.9 2008/07/21 14:19:24 lukem Exp $	*/
      2  1.1  kleink 
      3  1.1  kleink /*-
      4  1.1  kleink  * Copyright (c) 1999 The NetBSD Foundation, Inc.
      5  1.1  kleink  * All rights reserved.
      6  1.1  kleink  *
      7  1.1  kleink  * This code is derived from software contributed to The NetBSD Foundation
      8  1.1  kleink  * by Klaus Klein.
      9  1.1  kleink  *
     10  1.1  kleink  * Redistribution and use in source and binary forms, with or without
     11  1.1  kleink  * modification, are permitted provided that the following conditions
     12  1.1  kleink  * are met:
     13  1.1  kleink  * 1. Redistributions of source code must retain the above copyright
     14  1.1  kleink  *    notice, this list of conditions and the following disclaimer.
     15  1.1  kleink  * 2. Redistributions in binary form must reproduce the above copyright
     16  1.1  kleink  *    notice, this list of conditions and the following disclaimer in the
     17  1.1  kleink  *    documentation and/or other materials provided with the distribution.
     18  1.1  kleink  *
     19  1.1  kleink  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20  1.1  kleink  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21  1.1  kleink  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22  1.1  kleink  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23  1.1  kleink  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24  1.1  kleink  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25  1.1  kleink  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26  1.1  kleink  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27  1.1  kleink  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28  1.1  kleink  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29  1.1  kleink  * POSSIBILITY OF SUCH DAMAGE.
     30  1.1  kleink  */
     31  1.1  kleink 
     32  1.1  kleink #include <sys/cdefs.h>
     33  1.1  kleink #ifndef lint
     34  1.9   lukem __COPYRIGHT("@(#) Copyright (c) 1999\
     35  1.1  kleink  The NetBSD Foundation, Inc.  All rights reserved.");
     36  1.9   lukem __RCSID("$NetBSD: nl.c,v 1.9 2008/07/21 14:19:24 lukem Exp $");
     37  1.1  kleink #endif
     38  1.1  kleink 
     39  1.1  kleink #include <errno.h>
     40  1.1  kleink #include <limits.h>
     41  1.1  kleink #include <locale.h>
     42  1.1  kleink #include <regex.h>
     43  1.1  kleink #include <stdio.h>
     44  1.1  kleink #include <stdlib.h>
     45  1.6    matt #include <string.h>
     46  1.1  kleink #include <unistd.h>
     47  1.1  kleink 
/*
 * Selects which lines of a logical page section receive a line number.
 */
typedef enum {
	number_all = 0,		/* every line is numbered */
	number_nonempty,	/* only lines that are not empty are numbered */
	number_none,		/* no line is numbered */
	number_regex		/* only lines matching a regular expression */
} numbering_type;
     54  1.1  kleink 
     55  1.1  kleink struct numbering_property {
     56  1.1  kleink 	const char * const	name;		/* for diagnostics */
     57  1.1  kleink 	numbering_type		type;		/* numbering type */
     58  1.1  kleink 	regex_t			expr;		/* for type == number_regex */
     59  1.1  kleink };
     60  1.1  kleink 
/*
 * printf() conversions for the line number.  Each takes the field width
 * (an int, consumed by `*') followed by the number itself.
 */
#define FORMAT_LN	"%-*d"	/* flush left, no leading zeros */
#define FORMAT_RN	"%*d"	/* flush right, no leading zeros */
#define FORMAT_RZ	"%0*d"	/* flush right, padded with leading zeros */
     65  1.1  kleink 
/*
 * Logical page sections.  The values double as indices into
 * numbering_properties[] and as the number of delimiter pairs, minus one,
 * that introduce the section in the input.
 */
#define FOOTER		0
#define BODY		1
#define HEADER		2
#define NP_LAST		HEADER	/* highest valid section index */
     70  1.1  kleink 
     71  1.1  kleink static struct numbering_property numbering_properties[NP_LAST + 1] = {
     72  1.1  kleink 	{ "footer",	number_none	},
     73  1.1  kleink 	{ "body",	number_nonempty	},
     74  1.1  kleink 	{ "header",	number_none	}
     75  1.1  kleink };
     76  1.1  kleink 
/* Larger of two values; note that each argument may be evaluated twice. */
#define max(a, b)	((b) < (a) ? (a) : (b))
     78  1.1  kleink 
/*
 * Upper bound on the number of characters in the decimal representation of
 * a (signed) int, not counting the terminating NUL; formula courtesy of
 * tzcode.  302/1000 approximates log10(2) from above and is applied to the
 * number of value bits; the constant 2 allows for the truncating division
 * and for a minus sign.
 */
#define INT_STRLEN_MAXIMUM \
	(((sizeof(int) * CHAR_BIT) - 1) * 302 / 1000 + 2)
     85  1.1  kleink 
/*
 * Forward declarations.  Plain ANSI prototypes are used instead of the
 * obsolete BSD __P() wrapper so that the file does not depend on
 * <sys/cdefs.h> providing that macro.
 */
static void	filter(void);
int		main(int, char *[]);
static void	parse_numbering(const char *, int);
static void	usage(void);
     90  1.1  kleink 
     91  1.1  kleink /*
     92  1.1  kleink  * Pointer to dynamically allocated input line buffer, and its size.
     93  1.1  kleink  */
     94  1.1  kleink static char *buffer;
     95  1.1  kleink static size_t buffersize;
     96  1.1  kleink 
     97  1.1  kleink /*
     98  1.1  kleink  * Dynamically allocated buffer suitable for string representation of ints.
     99  1.1  kleink  */
    100  1.1  kleink static char *intbuffer;
    101  1.1  kleink 
    102  1.1  kleink /*
    103  1.1  kleink  * Configurable parameters.
    104  1.1  kleink  */
    105  1.1  kleink /* delimiter characters that indicate the start of a logical page section */
    106  1.1  kleink static char delim[2] = { '\\', ':' };
    107  1.1  kleink 
    108  1.1  kleink /* line numbering format */
    109  1.1  kleink static const char *format = FORMAT_RN;
    110  1.1  kleink 
    111  1.1  kleink /* increment value used to number logical page lines */
    112  1.1  kleink static int incr = 1;
    113  1.1  kleink 
    114  1.1  kleink /* number of adjacent blank lines to be considered (and numbered) as one */
    115  1.1  kleink static unsigned int nblank = 1;
    116  1.1  kleink 
    117  1.1  kleink /* whether to restart numbering at logical page delimiters */
    118  1.1  kleink static int restart = 1;
    119  1.1  kleink 
    120  1.1  kleink /* characters used in separating the line number and the corrsp. text line */
    121  1.1  kleink static const char *sep = "\t";
    122  1.1  kleink 
    123  1.1  kleink /* initial value used to number logical page lines */
    124  1.1  kleink static int startnum = 1;
    125  1.1  kleink 
    126  1.1  kleink /* number of characters to be used for the line number */
    127  1.1  kleink /* should be unsigned but required signed by `*' precision conversion */
    128  1.1  kleink static int width = 6;
    129  1.1  kleink 
    130  1.1  kleink 
    131  1.1  kleink int
    132  1.1  kleink main(argc, argv)
    133  1.1  kleink 	int argc;
    134  1.1  kleink 	char *argv[];
    135  1.1  kleink {
    136  1.1  kleink 	int c;
    137  1.3  kleink 	long val;
    138  1.3  kleink 	unsigned long uval;
    139  1.1  kleink 	char *ep;
    140  1.1  kleink 	size_t intbuffersize;
    141  1.1  kleink 
    142  1.1  kleink 	(void)setlocale(LC_ALL, "");
    143  1.1  kleink 
    144  1.1  kleink 	/*
    145  1.1  kleink 	 * Note: this implementation strictly conforms to the XBD Utility
    146  1.1  kleink 	 * Syntax Guidelines and does not permit the optional `file' operand
    147  1.1  kleink 	 * to be intermingled with the options, which is defined in the
    148  1.1  kleink 	 * XCU specification (Issue 5) but declared an obsolescent feature that
    149  1.1  kleink 	 * will be removed from a future issue.  It shouldn't matter, though.
    150  1.1  kleink 	 */
    151  1.1  kleink 	while ((c = getopt(argc, argv, "pb:d:f:h:i:l:n:s:v:w:")) != -1) {
    152  1.1  kleink 		switch (c) {
    153  1.1  kleink 		case 'p':
    154  1.1  kleink 			restart = 0;
    155  1.1  kleink 			break;
    156  1.1  kleink 		case 'b':
    157  1.1  kleink 			parse_numbering(optarg, BODY);
    158  1.1  kleink 			break;
    159  1.1  kleink 		case 'd':
    160  1.1  kleink 			if (optarg[0] != '\0')
    161  1.1  kleink 				delim[0] = optarg[0];
    162  1.1  kleink 			if (optarg[1] != '\0')
    163  1.1  kleink 				delim[1] = optarg[1];
    164  1.1  kleink 			/* at most two delimiter characters */
    165  1.1  kleink 			if (optarg[2] != '\0') {
    166  1.1  kleink 				(void)fprintf(stderr,
    167  1.1  kleink 				    "nl: invalid delim argument -- %s\n",
    168  1.1  kleink 				    optarg);
    169  1.1  kleink 				exit(EXIT_FAILURE);
    170  1.1  kleink 				/* NOTREACHED */
    171  1.1  kleink 			}
    172  1.1  kleink 			break;
    173  1.1  kleink 		case 'f':
    174  1.1  kleink 			parse_numbering(optarg, FOOTER);
    175  1.1  kleink 			break;
    176  1.1  kleink 		case 'h':
    177  1.1  kleink 			parse_numbering(optarg, HEADER);
    178  1.1  kleink 			break;
    179  1.1  kleink 		case 'i':
    180  1.1  kleink 			errno = 0;
    181  1.1  kleink 			val = strtol(optarg, &ep, 10);
    182  1.1  kleink 			if ((ep != NULL && *ep != '\0') ||
    183  1.1  kleink 			 ((val == LONG_MIN || val == LONG_MAX) && errno != 0)) {
    184  1.1  kleink 				(void)fprintf(stderr,
    185  1.1  kleink 				    "invalid incr argument -- %s\n", optarg);
    186  1.1  kleink 				exit(EXIT_FAILURE);
    187  1.1  kleink 			}
    188  1.1  kleink 			incr = (int)val;
    189  1.1  kleink 			break;
    190  1.1  kleink 		case 'l':
    191  1.1  kleink 			errno = 0;
    192  1.1  kleink 			uval = strtoul(optarg, &ep, 10);
    193  1.1  kleink 			if ((ep != NULL && *ep != '\0') ||
    194  1.1  kleink 			    (uval == ULONG_MAX && errno != 0)) {
    195  1.1  kleink 				(void)fprintf(stderr,
    196  1.1  kleink 				    "invalid num argument -- %s\n", optarg);
    197  1.1  kleink 				exit(EXIT_FAILURE);
    198  1.1  kleink 			}
    199  1.1  kleink 			nblank = (unsigned int)uval;
    200  1.1  kleink 			break;
    201  1.1  kleink 		case 'n':
    202  1.1  kleink 			if (strcmp(optarg, "ln") == 0) {
    203  1.1  kleink 				format = FORMAT_LN;
    204  1.1  kleink 			} else if (strcmp(optarg, "rn") == 0) {
    205  1.1  kleink 				format = FORMAT_RN;
    206  1.1  kleink 			} else if (strcmp(optarg, "rz") == 0) {
    207  1.1  kleink 				format = FORMAT_RZ;
    208  1.1  kleink 			} else {
    209  1.1  kleink 				(void)fprintf(stderr,
    210  1.1  kleink 				    "nl: illegal format -- %s\n", optarg);
    211  1.1  kleink 				exit(EXIT_FAILURE);
    212  1.1  kleink 			}
    213  1.1  kleink 			break;
    214  1.1  kleink 		case 's':
    215  1.1  kleink 			sep = optarg;
    216  1.1  kleink 			break;
    217  1.1  kleink 		case 'v':
    218  1.1  kleink 			errno = 0;
    219  1.1  kleink 			val = strtol(optarg, &ep, 10);
    220  1.1  kleink 			if ((ep != NULL && *ep != '\0') ||
    221  1.1  kleink 			 ((val == LONG_MIN || val == LONG_MAX) && errno != 0)) {
    222  1.1  kleink 				(void)fprintf(stderr,
    223  1.1  kleink 				    "invalid startnum value -- %s\n", optarg);
    224  1.1  kleink 				exit(EXIT_FAILURE);
    225  1.1  kleink 			}
    226  1.1  kleink 			startnum = (int)val;
    227  1.1  kleink 			break;
    228  1.1  kleink 		case 'w':
    229  1.1  kleink 			errno = 0;
    230  1.1  kleink 			val = strtol(optarg, &ep, 10);
    231  1.1  kleink 			if ((ep != NULL && *ep != '\0') ||
    232  1.1  kleink 			 ((val == LONG_MIN || val == LONG_MAX) && errno != 0)) {
    233  1.1  kleink 				(void)fprintf(stderr,
    234  1.1  kleink 				    "invalid width value -- %s\n", optarg);
    235  1.1  kleink 				exit(EXIT_FAILURE);
    236  1.1  kleink 			}
    237  1.1  kleink 			width = (int)val;
    238  1.1  kleink 			if (!(width > 0)) {
    239  1.1  kleink 				(void)fprintf(stderr,
    240  1.1  kleink 				    "nl: width argument must be > 0 -- %d\n",
    241  1.1  kleink 				    width);
    242  1.1  kleink 				 exit(EXIT_FAILURE);
    243  1.1  kleink 			}
    244  1.1  kleink 			break;
    245  1.1  kleink 		case '?':
    246  1.1  kleink 		default:
    247  1.1  kleink 			usage();
    248  1.1  kleink 			/* NOTREACHED */
    249  1.1  kleink 		}
    250  1.1  kleink 	}
    251  1.1  kleink 	argc -= optind;
    252  1.1  kleink 	argv += optind;
    253  1.1  kleink 
    254  1.1  kleink 	switch (argc) {
    255  1.1  kleink 	case 0:
    256  1.1  kleink 		break;
    257  1.1  kleink 	case 1:
    258  1.1  kleink 		if (freopen(argv[0], "r", stdin) == NULL) {
    259  1.1  kleink 			perror(argv[0]);
    260  1.1  kleink 			exit(EXIT_FAILURE);
    261  1.1  kleink 		}
    262  1.1  kleink 		break;
    263  1.1  kleink 	default:
    264  1.1  kleink 		usage();
    265  1.1  kleink 		/* NOTREACHED */
    266  1.1  kleink 	}
    267  1.1  kleink 
    268  1.1  kleink 	/* Determine the maximum input line length to operate on. */
    269  1.1  kleink 	if ((val = sysconf(_SC_LINE_MAX)) == -1) /* ignore errno */
    270  1.1  kleink 		val = LINE_MAX;
    271  1.1  kleink 	/* Allocate sufficient buffer space (including the terminating NUL). */
    272  1.1  kleink 	buffersize = (size_t)val + 1;
    273  1.1  kleink 	if ((buffer = malloc(buffersize)) == NULL) {
    274  1.1  kleink 		perror("cannot allocate input line buffer");
    275  1.1  kleink 		exit(EXIT_FAILURE);
    276  1.1  kleink 	}
    277  1.1  kleink 
    278  1.1  kleink 	/* Allocate a buffer suitable for preformatting line number. */
    279  1.1  kleink 	intbuffersize = max(INT_STRLEN_MAXIMUM, width) + 1;	/* NUL */
    280  1.1  kleink 	if ((intbuffer = malloc(intbuffersize)) == NULL) {
    281  1.1  kleink 		perror("cannot allocate preformatting buffer");
    282  1.1  kleink 		exit(EXIT_FAILURE);
    283  1.1  kleink 	}
    284  1.1  kleink 
    285  1.1  kleink 	/* Do the work. */
    286  1.1  kleink 	filter();
    287  1.1  kleink 
    288  1.1  kleink 	exit(EXIT_SUCCESS);
    289  1.1  kleink 	/* NOTREACHED */
    290  1.1  kleink }
    291  1.1  kleink 
    292  1.1  kleink static void
    293  1.1  kleink filter()
    294  1.1  kleink {
    295  1.1  kleink 	int line;		/* logical line number */
    296  1.1  kleink 	int section;		/* logical page section */
    297  1.1  kleink 	unsigned int adjblank;	/* adjacent blank lines */
    298  1.1  kleink 	int consumed;		/* intbuffer measurement */
    299  1.1  kleink 	int donumber, idx;
    300  1.1  kleink 
    301  1.1  kleink 	adjblank = 0;
    302  1.1  kleink 	line = startnum;
    303  1.1  kleink 	section = BODY;
    304  1.2  kleink #ifdef __GNUC__
    305  1.7     mrg 	donumber = 0;	/* avoid bogus `uninitialized' warning */
    306  1.2  kleink #endif
    307  1.1  kleink 
    308  1.1  kleink 	while (fgets(buffer, (int)buffersize, stdin) != NULL) {
    309  1.1  kleink 		for (idx = FOOTER; idx <= NP_LAST; idx++) {
    310  1.1  kleink 			/* Does it look like a delimiter? */
    311  1.1  kleink 			if (buffer[2 * idx + 0] == delim[0] &&
    312  1.1  kleink 			    buffer[2 * idx + 1] == delim[1]) {
    313  1.1  kleink 				/* Was this the whole line? */
    314  1.1  kleink 				if (buffer[2 * idx + 2] == '\n') {
    315  1.1  kleink 					section = idx;
    316  1.1  kleink 					adjblank = 0;
    317  1.1  kleink 					if (restart)
    318  1.1  kleink 						line = startnum;
    319  1.1  kleink 					goto nextline;
    320  1.1  kleink 				}
    321  1.1  kleink 			} else {
    322  1.1  kleink 				break;
    323  1.1  kleink 			}
    324  1.1  kleink 		}
    325  1.1  kleink 
    326  1.1  kleink 		switch (numbering_properties[section].type) {
    327  1.1  kleink 		case number_all:
    328  1.1  kleink 			/*
    329  1.1  kleink 			 * Doing this for number_all only is disputable, but
    330  1.1  kleink 			 * the standard expresses an explicit dependency on
    331  1.1  kleink 			 * `-b a' etc.
    332  1.1  kleink 			 */
    333  1.1  kleink 			if (buffer[0] == '\n' && ++adjblank < nblank)
    334  1.1  kleink 				donumber = 0;
    335  1.1  kleink 			else
    336  1.1  kleink 				donumber = 1, adjblank = 0;
    337  1.1  kleink 			break;
    338  1.1  kleink 		case number_nonempty:
    339  1.1  kleink 			donumber = (buffer[0] != '\n');
    340  1.1  kleink 			break;
    341  1.1  kleink 		case number_none:
    342  1.1  kleink 			donumber = 0;
    343  1.1  kleink 			break;
    344  1.1  kleink 		case number_regex:
    345  1.1  kleink 			donumber =
    346  1.1  kleink 			    (regexec(&numbering_properties[section].expr,
    347  1.1  kleink 			    buffer, 0, NULL, 0) == 0);
    348  1.1  kleink 			break;
    349  1.1  kleink 		}
    350  1.1  kleink 
    351  1.1  kleink 		if (donumber) {
    352  1.1  kleink 			/* Note: sprintf() is safe here. */
    353  1.1  kleink 			consumed = sprintf(intbuffer, format, width, line);
    354  1.1  kleink 			(void)printf("%s",
    355  1.1  kleink 			    intbuffer + max(0, consumed - width));
    356  1.1  kleink 			line += incr;
    357  1.1  kleink 		} else {
    358  1.1  kleink 			(void)printf("%*s", width, "");
    359  1.1  kleink 		}
    360  1.1  kleink 		(void)printf("%s%s", sep, buffer);
    361  1.1  kleink 
    362  1.1  kleink 		if (ferror(stdout)) {
    363  1.1  kleink 			perror("output error");
    364  1.1  kleink 			exit(EXIT_FAILURE);
    365  1.1  kleink 		}
    366  1.1  kleink nextline:
    367  1.1  kleink 		;
    368  1.1  kleink 	}
    369  1.1  kleink 
    370  1.1  kleink 	if (ferror(stdin)) {
    371  1.1  kleink 		perror("input error");
    372  1.1  kleink 		exit(EXIT_FAILURE);
    373  1.1  kleink 	}
    374  1.1  kleink }
    375  1.1  kleink 
    376  1.1  kleink /*
    377  1.1  kleink  * Various support functions.
    378  1.1  kleink  */
    379  1.1  kleink 
    380  1.1  kleink static void
    381  1.1  kleink parse_numbering(argstr, section)
    382  1.1  kleink 	const char *argstr;
    383  1.1  kleink 	int section;
    384  1.1  kleink {
    385  1.1  kleink 	int error;
    386  1.5  kleink 	char errorbuf[NL_TEXTMAX];
    387  1.1  kleink 
    388  1.1  kleink 	switch (argstr[0]) {
    389  1.1  kleink 	case 'a':
    390  1.1  kleink 		numbering_properties[section].type = number_all;
    391  1.1  kleink 		break;
    392  1.1  kleink 	case 'n':
    393  1.1  kleink 		numbering_properties[section].type = number_none;
    394  1.1  kleink 		break;
    395  1.1  kleink 	case 't':
    396  1.1  kleink 		numbering_properties[section].type = number_nonempty;
    397  1.1  kleink 		break;
    398  1.1  kleink 	case 'p':
    399  1.1  kleink 		/* If there was a previous expression, throw it away. */
    400  1.1  kleink 		if (numbering_properties[section].type == number_regex)
    401  1.1  kleink 			regfree(&numbering_properties[section].expr);
    402  1.1  kleink 		else
    403  1.1  kleink 			numbering_properties[section].type = number_regex;
    404  1.1  kleink 
    405  1.1  kleink 		/* Compile/validate the supplied regular expression. */
    406  1.1  kleink 		if ((error = regcomp(&numbering_properties[section].expr,
    407  1.1  kleink 		    &argstr[1], REG_NEWLINE|REG_NOSUB)) != 0) {
    408  1.1  kleink 			(void)regerror(error,
    409  1.1  kleink 			    &numbering_properties[section].expr,
    410  1.1  kleink 			    errorbuf, sizeof (errorbuf));
    411  1.1  kleink 			(void)fprintf(stderr,
    412  1.1  kleink 			    "nl: %s expr: %s -- %s\n",
    413  1.1  kleink 			    numbering_properties[section].name, errorbuf,
    414  1.1  kleink 			    &argstr[1]);
    415  1.1  kleink 			exit(EXIT_FAILURE);
    416  1.1  kleink 		}
    417  1.1  kleink 		break;
    418  1.1  kleink 	default:
    419  1.1  kleink 		(void)fprintf(stderr,
    420  1.1  kleink 		    "nl: illegal %s line numbering type -- %s\n",
    421  1.1  kleink 		    numbering_properties[section].name, argstr);
    422  1.1  kleink 		exit(EXIT_FAILURE);
    423  1.1  kleink 	}
    424  1.1  kleink }
    425  1.1  kleink 
/*
 * Write the command synopsis to stderr and terminate the program with
 * EXIT_FAILURE.
 */
static void
usage(void)
{
	static const char synopsis[] =
	    "usage: nl [-p] [-b type] [-d delim] [-f type] "
	    "[-h type] [-i incr] [-l num]\n"
	    "\t[-n format] [-s sep] [-v startnum] [-w width] "
	    "[file]\n";

	(void)fputs(synopsis, stderr);
	exit(EXIT_FAILURE);
}
    435