tr.c revision 1.1 1 1.1 cgd /*
2 1.1 cgd * Copyright (c) 1988 The Regents of the University of California.
3 1.1 cgd * All rights reserved.
4 1.1 cgd *
5 1.1 cgd * Redistribution and use in source and binary forms, with or without
6 1.1 cgd * modification, are permitted provided that the following conditions
7 1.1 cgd * are met:
8 1.1 cgd * 1. Redistributions of source code must retain the above copyright
9 1.1 cgd * notice, this list of conditions and the following disclaimer.
10 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
11 1.1 cgd * notice, this list of conditions and the following disclaimer in the
12 1.1 cgd * documentation and/or other materials provided with the distribution.
13 1.1 cgd * 3. All advertising materials mentioning features or use of this software
14 1.1 cgd * must display the following acknowledgement:
15 1.1 cgd * This product includes software developed by the University of
16 1.1 cgd * California, Berkeley and its contributors.
17 1.1 cgd * 4. Neither the name of the University nor the names of its contributors
18 1.1 cgd * may be used to endorse or promote products derived from this software
19 1.1 cgd * without specific prior written permission.
20 1.1 cgd *
21 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
22 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
25 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
26 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
27 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
28 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
29 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31 1.1 cgd * SUCH DAMAGE.
32 1.1 cgd */
33 1.1 cgd
#ifndef lint
/*
 * Identification strings compiled into the object file.  Both are left
 * out when `lint' is defined.
 */
char copyright[] =
	"@(#) Copyright (c) 1988 The Regents of the University of California.\n"
	"All rights reserved.\n";

static char sccsid[] = "@(#)tr.c 4.7 (Berkeley) 7/23/90";
#endif /* not lint */
43 1.1 cgd
#include <sys/types.h>

#include <ctype.h>
#include <stdio.h>
#include <stdlib.h>
#include <unistd.h>
47 1.1 cgd
/*
 * Sizes and sentinels shared by the translation tables and the string
 * scanner.
 */
enum {
	NCHARS = 256,	/* number of entries in a per-character table */
	OOBCH = 257	/* out of band value: not a valid table index */
};
50 1.1 cgd
/*
 * Scanner state for one command-line string; next() steps through it one
 * expanded character at a time.
 */
typedef struct {
	char *str;		/* unread remainder of the argument */
	int lastch;		/* character most recently produced */
	int endrange;		/* final character of the range being expanded */
	enum {
		NORM,		/* reading characters straight from str */
		INRANGE,	/* stepping through a range toward endrange */
		EOS		/* str has been used up */
	} state;
} STR;
56 1.1 cgd
57 1.1 cgd main(argc, argv)
58 1.1 cgd int argc;
59 1.1 cgd char **argv;
60 1.1 cgd {
61 1.1 cgd extern int optind;
62 1.1 cgd STR s1, s2;
63 1.1 cgd register int ch, indx, lastch;
64 1.1 cgd int cflag, dflag, sflag;
65 1.1 cgd u_char *tp, tab[NCHARS], squeeze[NCHARS];
66 1.1 cgd
67 1.1 cgd cflag = dflag = sflag = 0;
68 1.1 cgd while ((ch = getopt(argc, argv, "cds")) != EOF)
69 1.1 cgd switch((char)ch) {
70 1.1 cgd case 'c':
71 1.1 cgd cflag = 1;
72 1.1 cgd break;
73 1.1 cgd case 'd':
74 1.1 cgd dflag = 1;
75 1.1 cgd break;
76 1.1 cgd case 's':
77 1.1 cgd sflag = 1;
78 1.1 cgd break;
79 1.1 cgd case '?':
80 1.1 cgd default:
81 1.1 cgd fprintf(stderr,
82 1.1 cgd "usage: tr [-cds] [string1 [string2]]\n");
83 1.1 cgd exit(1);
84 1.1 cgd }
85 1.1 cgd argc -= optind;
86 1.1 cgd argv += optind;
87 1.1 cgd
88 1.1 cgd /*
89 1.1 cgd * the original tr was amazingly tolerant of the command line.
90 1.1 cgd * Neither -c or -s have any effect unless there are two strings.
91 1.1 cgd * Extra arguments are silently ignored. Bag this noise, they
92 1.1 cgd * should all be errors.
93 1.1 cgd */
94 1.1 cgd if (argc < 2 && !dflag) {
95 1.1 cgd while ((ch = getchar()) != EOF)
96 1.1 cgd putchar(ch);
97 1.1 cgd exit(0);
98 1.1 cgd }
99 1.1 cgd
100 1.1 cgd bzero(tab, NCHARS);
101 1.1 cgd if (sflag) {
102 1.1 cgd s1.str = argv[1];
103 1.1 cgd s1.state = NORM;
104 1.1 cgd s1.lastch = OOBCH;
105 1.1 cgd while (next(&s1))
106 1.1 cgd squeeze[s1.lastch] = 1;
107 1.1 cgd }
108 1.1 cgd if (dflag) {
109 1.1 cgd s1.str = argv[0];
110 1.1 cgd s1.state = NORM;
111 1.1 cgd s1.lastch = OOBCH;
112 1.1 cgd while (next(&s1))
113 1.1 cgd tab[s1.lastch] = 1;
114 1.1 cgd if (cflag)
115 1.1 cgd for (tp = tab, indx = 0; indx < NCHARS; ++tp, ++indx)
116 1.1 cgd *tp = !*tp;
117 1.1 cgd if (sflag)
118 1.1 cgd for (lastch = OOBCH; (ch = getchar()) != EOF;) {
119 1.1 cgd if (tab[ch] || (squeeze[ch] && lastch == ch))
120 1.1 cgd continue;
121 1.1 cgd lastch = ch;
122 1.1 cgd putchar(ch);
123 1.1 cgd }
124 1.1 cgd else
125 1.1 cgd while ((ch = getchar()) != EOF)
126 1.1 cgd if (!tab[ch])
127 1.1 cgd putchar(ch);
128 1.1 cgd } else {
129 1.1 cgd s1.str = argv[0];
130 1.1 cgd s2.str = argv[1];
131 1.1 cgd s1.state = s2.state = NORM;
132 1.1 cgd s1.lastch = s2.lastch = OOBCH;
133 1.1 cgd if (cflag) {
134 1.1 cgd /*
135 1.1 cgd * if cflag is set, tr just pretends it only got one
136 1.1 cgd * character in string2. As reasonable as anything
137 1.1 cgd * else. Should really be an error.
138 1.1 cgd */
139 1.1 cgd while (next(&s2));
140 1.1 cgd lastch = s2.lastch;
141 1.1 cgd for (tp = tab, indx = 0; indx < NCHARS; ++tp, ++indx)
142 1.1 cgd *tp = lastch;
143 1.1 cgd while (next(&s1))
144 1.1 cgd tab[s1.lastch] = s1.lastch;
145 1.1 cgd } else {
146 1.1 cgd for (tp = tab, indx = 0; indx < NCHARS; ++tp, ++indx)
147 1.1 cgd *tp = indx;
148 1.1 cgd while (next(&s1)) {
149 1.1 cgd (void)next(&s2);
150 1.1 cgd tab[s1.lastch] = s2.lastch;
151 1.1 cgd }
152 1.1 cgd }
153 1.1 cgd if (sflag)
154 1.1 cgd for (lastch = OOBCH; (ch = getchar()) != EOF;) {
155 1.1 cgd ch = tab[ch];
156 1.1 cgd if (squeeze[ch] && lastch == ch)
157 1.1 cgd continue;
158 1.1 cgd lastch = ch;
159 1.1 cgd putchar(ch);
160 1.1 cgd }
161 1.1 cgd else
162 1.1 cgd while ((ch = getchar()) != EOF)
163 1.1 cgd putchar((int)tab[ch]);
164 1.1 cgd }
165 1.1 cgd exit(0);
166 1.1 cgd }
167 1.1 cgd
168 1.1 cgd next(s)
169 1.1 cgd register STR *s;
170 1.1 cgd {
171 1.1 cgd register int ch;
172 1.1 cgd
173 1.1 cgd if (s->state == EOS)
174 1.1 cgd return(0);
175 1.1 cgd if (s->state == INRANGE) {
176 1.1 cgd if (++s->lastch == s->endrange)
177 1.1 cgd s->state = NORM;
178 1.1 cgd return(1);
179 1.1 cgd }
180 1.1 cgd if (!(ch = *s->str++)) {
181 1.1 cgd s->state = EOS;
182 1.1 cgd return(0);
183 1.1 cgd }
184 1.1 cgd if (ch == '\\') { /* \### */
185 1.1 cgd s->lastch = tran(s);
186 1.1 cgd return(1);
187 1.1 cgd }
188 1.1 cgd if (ch == '-') { /* ranges */
189 1.1 cgd if (s->lastch == OOBCH) /* "-a" */
190 1.1 cgd goto fail2;
191 1.1 cgd if (!(ch = *s->str++)) /* "a-" */
192 1.1 cgd goto fail1;
193 1.1 cgd if (ch == '\\') /* \### */
194 1.1 cgd ch = tran(s);
195 1.1 cgd if (s->lastch > ch) { /* "z-a" */
196 1.1 cgd fail1: --s->str;
197 1.1 cgd fail2: s->lastch = '-';
198 1.1 cgd return(1);
199 1.1 cgd }
200 1.1 cgd if (s->lastch == ch) /* "a-a" */
201 1.1 cgd return(next(s));
202 1.1 cgd s->state = INRANGE; /* "a-z" */
203 1.1 cgd s->endrange = ch;
204 1.1 cgd return(1);
205 1.1 cgd }
206 1.1 cgd s->lastch = ch;
207 1.1 cgd return(1);
208 1.1 cgd }
209 1.1 cgd
210 1.1 cgd /*
211 1.1 cgd * Translate \-escapes. Up to 3 octal digits => char; no digits => literal.
212 1.1 cgd * Unadorned backslash "\" is like \000.
213 1.1 cgd */
214 1.1 cgd tran(s)
215 1.1 cgd register STR *s;
216 1.1 cgd {
217 1.1 cgd register int ch, cnt = 0, val = 0;
218 1.1 cgd
219 1.1 cgd for (;;) {
220 1.1 cgd ch = *s->str++;
221 1.1 cgd if (!isascii(ch) || !isdigit(ch) || ++cnt > 3)
222 1.1 cgd break;
223 1.1 cgd val = val * 8 + ch - '0';
224 1.1 cgd }
225 1.1 cgd if (cnt || ch == 0)
226 1.1 cgd s->str--;
227 1.1 cgd return (cnt ? val : ch);
228 1.1 cgd }
229