uniq.c revision 1.3 1 1.1 cgd /*
2 1.1 cgd * Copyright (c) 1989 The Regents of the University of California.
3 1.1 cgd * All rights reserved.
4 1.1 cgd *
5 1.1 cgd * This code is derived from software contributed to Berkeley by
6 1.1 cgd * Case Larsen.
7 1.1 cgd *
8 1.1 cgd * Redistribution and use in source and binary forms, with or without
9 1.1 cgd * modification, are permitted provided that the following conditions
10 1.1 cgd * are met:
11 1.1 cgd * 1. Redistributions of source code must retain the above copyright
12 1.1 cgd * notice, this list of conditions and the following disclaimer.
13 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
14 1.1 cgd * notice, this list of conditions and the following disclaimer in the
15 1.1 cgd * documentation and/or other materials provided with the distribution.
16 1.1 cgd * 3. All advertising materials mentioning features or use of this software
17 1.1 cgd * must display the following acknowledgement:
18 1.1 cgd * This product includes software developed by the University of
19 1.1 cgd * California, Berkeley and its contributors.
20 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
21 1.1 cgd * may be used to endorse or promote products derived from this software
22 1.1 cgd * without specific prior written permission.
23 1.1 cgd *
24 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
25 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
26 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
27 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
28 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
29 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
30 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
31 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
32 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
33 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
34 1.1 cgd * SUCH DAMAGE.
35 1.1 cgd */
36 1.1 cgd
/*
 * Identification strings.  Neither is defined when `lint' is defined.
 * copyright has external linkage; sccsid is private to this file.
 */
#ifndef lint
char copyright[] =
"@(#) Copyright (c) 1989 The Regents of the University of California.\n\
All rights reserved.\n";

static char sccsid[] = "@(#)uniq.c 5.2 (Berkeley) 6/1/90";
#endif /* not lint */
46 1.1 cgd
47 1.1 cgd #include <stdio.h>
48 1.1 cgd #include <ctype.h>
49 1.1 cgd
/*
 * Output-mode flags, set to 1 by the -c, -d and -u options.  When none of
 * them is given, main() turns on both dflag and uflag.
 */
int cflag;
int dflag;
int uflag;

int numchars;		/* value parsed from a +n argument; used by skip() */
int numfields;		/* value parsed from a -n argument; used by skip() */
int repeats;		/* lines so far that matched the held line */

/* Size of each line buffer passed to fgets(). */
#define MAXLINELEN (2048 + 1)
54 1.1 cgd
55 1.1 cgd main (argc,argv)
56 1.1 cgd int argc;
57 1.1 cgd char **argv;
58 1.1 cgd {
59 1.1 cgd extern int optind;
60 1.1 cgd FILE *ifp, *ofp, *file();
61 1.1 cgd int ch;
62 1.1 cgd register char *t1, *t2;
63 1.1 cgd char *prevline, *thisline, *malloc(), *skip();
64 1.1 cgd
65 1.1 cgd while ((ch = getopt(argc, argv, "-cdu123456789")) != EOF)
66 1.1 cgd switch (ch) {
67 1.1 cgd case '-':
68 1.1 cgd --optind;
69 1.1 cgd goto done;
70 1.1 cgd case 'c':
71 1.1 cgd cflag = 1;
72 1.1 cgd break;
73 1.1 cgd case 'd':
74 1.1 cgd dflag = 1;
75 1.1 cgd break;
76 1.1 cgd case 'u':
77 1.1 cgd uflag = 1;
78 1.1 cgd break;
79 1.1 cgd /*
80 1.1 cgd * since -n is a valid option that could be picked up by
81 1.1 cgd * getopt, but is better handled by the +n and -n code, we
82 1.1 cgd * break out.
83 1.1 cgd */
84 1.1 cgd case '1': case '2': case '3': case '4':
85 1.1 cgd case '5': case '6': case '7': case '8': case '9':
86 1.1 cgd --optind;
87 1.1 cgd goto done;
88 1.1 cgd case '?':
89 1.1 cgd default:
90 1.1 cgd usage();
91 1.1 cgd }
92 1.1 cgd
93 1.1 cgd done: argc -= optind;
94 1.1 cgd argv +=optind;
95 1.1 cgd
96 1.1 cgd /* if no flags are set, default is -d -u */
97 1.1 cgd if (cflag) {
98 1.1 cgd if (dflag || uflag)
99 1.1 cgd usage();
100 1.1 cgd } else if (!dflag && !uflag)
101 1.1 cgd dflag = uflag = 1;
102 1.1 cgd
103 1.1 cgd /* because of the +, getopt is messed up */
104 1.2 mycroft for (; *argv && (**argv == '+' || **argv == '-'); ++argv, --argc)
105 1.1 cgd switch (**argv) {
106 1.1 cgd case '+':
107 1.1 cgd if ((numchars = atoi(*argv + 1)) < 0)
108 1.1 cgd goto negerr;
109 1.1 cgd break;
110 1.1 cgd case '-':
111 1.1 cgd if ((numfields = atoi(*argv + 1)) < 0) {
112 1.1 cgd negerr: (void)fprintf(stderr,
113 1.1 cgd "uniq: negative field/char skip value.\n");
114 1.1 cgd usage();
115 1.1 cgd }
116 1.1 cgd break;
117 1.1 cgd }
118 1.1 cgd
119 1.1 cgd switch(argc) {
120 1.1 cgd case 0:
121 1.1 cgd ifp = stdin;
122 1.1 cgd ofp = stdout;
123 1.1 cgd break;
124 1.1 cgd case 1:
125 1.1 cgd ifp = file(argv[0], "r");
126 1.1 cgd ofp = stdout;
127 1.1 cgd break;
128 1.1 cgd case 2:
129 1.1 cgd ifp = file(argv[0], "r");
130 1.1 cgd ofp = file(argv[1], "w");
131 1.1 cgd break;
132 1.1 cgd default:
133 1.1 cgd usage();
134 1.1 cgd }
135 1.1 cgd
136 1.1 cgd prevline = malloc(MAXLINELEN);
137 1.1 cgd thisline = malloc(MAXLINELEN);
138 1.3 deraadt if (!fgets(prevline, MAXLINELEN, ifp))
139 1.3 deraadt exit(0);
140 1.1 cgd
141 1.1 cgd while (fgets(thisline, MAXLINELEN, ifp)) {
142 1.1 cgd /* if requested get the chosen fields + character offsets */
143 1.1 cgd if (numfields || numchars) {
144 1.1 cgd t1 = skip(thisline);
145 1.1 cgd t2 = skip(prevline);
146 1.1 cgd } else {
147 1.1 cgd t1 = thisline;
148 1.1 cgd t2 = prevline;
149 1.1 cgd }
150 1.1 cgd
151 1.1 cgd /* if different, print; set previous to new value */
152 1.1 cgd if (strcmp(t1, t2)) {
153 1.1 cgd show(ofp, prevline);
154 1.1 cgd t1 = prevline;
155 1.1 cgd prevline = thisline;
156 1.1 cgd thisline = t1;
157 1.1 cgd repeats = 0;
158 1.1 cgd }
159 1.1 cgd else
160 1.1 cgd ++repeats;
161 1.1 cgd }
162 1.1 cgd show(ofp, prevline);
163 1.1 cgd exit(0);
164 1.1 cgd }
165 1.1 cgd
166 1.1 cgd /*
167 1.1 cgd * show --
168 1.1 cgd * output a line depending on the flags and number of repetitions
169 1.1 cgd * of the line.
170 1.1 cgd */
171 1.1 cgd show(ofp, str)
172 1.1 cgd FILE *ofp;
173 1.1 cgd char *str;
174 1.1 cgd {
175 1.1 cgd if (cflag)
176 1.1 cgd (void)fprintf(ofp, "%4d %s", repeats + 1, str);
177 1.1 cgd if (dflag && repeats || uflag && !repeats)
178 1.1 cgd (void)fprintf(ofp, "%s", str);
179 1.1 cgd }
180 1.1 cgd
181 1.1 cgd char *
182 1.1 cgd skip(str)
183 1.1 cgd register char *str;
184 1.1 cgd {
185 1.1 cgd register int infield, nchars, nfields;
186 1.1 cgd
187 1.1 cgd for (nfields = numfields, infield = 0; nfields && *str; ++str)
188 1.1 cgd if (isspace(*str)) {
189 1.1 cgd if (infield) {
190 1.1 cgd infield = 0;
191 1.1 cgd --nfields;
192 1.1 cgd }
193 1.1 cgd } else if (!infield)
194 1.1 cgd infield = 1;
195 1.1 cgd for (nchars = numchars; nchars-- && *str; ++str);
196 1.1 cgd return(str);
197 1.1 cgd }
198 1.1 cgd
/*
 * file --
 *	Open `name' with fopen() mode `mode' and return the stream.  If the
 *	open fails, report it on stderr and exit with status 1; the caller
 *	never sees a null pointer.
 */
FILE *
file(name, mode)
	char *name, *mode;
{
	FILE *stream;

	stream = fopen(name, mode);
	if (stream)
		return(stream);

	(void)fprintf(stderr, "uniq: can't open %s.\n", name);
	exit(1);
	/* NOTREACHED */
}
211 1.1 cgd
/*
 * usage --
 *	Print the command synopsis on stderr and exit with status 1.
 */
usage()
{
	static char synopsis[] =
	    "usage: uniq [-c | -du] [- #fields] [+ #chars] [input [output]]\n";

	(void)fputs(synopsis, stderr);
	exit(1);
	/* NOTREACHED */
}
218