pat_rep.c revision 1.27 1 1.27 christos /* $NetBSD: pat_rep.c,v 1.27 2007/05/04 21:19:36 christos Exp $ */
2 1.4 cgd
3 1.1 jtc /*-
4 1.20 agc * Copyright (c) 1992 Keith Muller.
5 1.1 jtc * Copyright (c) 1992, 1993
6 1.1 jtc * The Regents of the University of California. All rights reserved.
7 1.1 jtc *
8 1.1 jtc * This code is derived from software contributed to Berkeley by
9 1.1 jtc * Keith Muller of the University of California, San Diego.
10 1.1 jtc *
11 1.1 jtc * Redistribution and use in source and binary forms, with or without
12 1.1 jtc * modification, are permitted provided that the following conditions
13 1.1 jtc * are met:
14 1.1 jtc * 1. Redistributions of source code must retain the above copyright
15 1.1 jtc * notice, this list of conditions and the following disclaimer.
16 1.1 jtc * 2. Redistributions in binary form must reproduce the above copyright
17 1.1 jtc * notice, this list of conditions and the following disclaimer in the
18 1.1 jtc * documentation and/or other materials provided with the distribution.
19 1.19 agc * 3. Neither the name of the University nor the names of its contributors
20 1.19 agc * may be used to endorse or promote products derived from this software
21 1.19 agc * without specific prior written permission.
22 1.19 agc *
23 1.19 agc * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
24 1.19 agc * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
25 1.19 agc * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26 1.19 agc * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
27 1.19 agc * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
28 1.19 agc * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
29 1.19 agc * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
30 1.19 agc * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
31 1.19 agc * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
32 1.19 agc * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
33 1.19 agc * SUCH DAMAGE.
34 1.19 agc */
35 1.19 agc
36 1.21 lukem #if HAVE_NBTOOL_CONFIG_H
37 1.21 lukem #include "nbtool_config.h"
38 1.21 lukem #endif
39 1.21 lukem
40 1.7 christos #include <sys/cdefs.h>
41 1.21 lukem #if !defined(lint)
42 1.4 cgd #if 0
43 1.4 cgd static char sccsid[] = "@(#)pat_rep.c 8.2 (Berkeley) 4/18/94";
44 1.4 cgd #else
45 1.27 christos __RCSID("$NetBSD: pat_rep.c,v 1.27 2007/05/04 21:19:36 christos Exp $");
46 1.4 cgd #endif
47 1.1 jtc #endif /* not lint */
48 1.1 jtc
49 1.1 jtc #include <sys/types.h>
50 1.1 jtc #include <sys/time.h>
51 1.1 jtc #include <sys/stat.h>
52 1.1 jtc #include <sys/param.h>
53 1.1 jtc #include <stdio.h>
54 1.1 jtc #include <ctype.h>
55 1.1 jtc #include <string.h>
56 1.1 jtc #include <unistd.h>
57 1.1 jtc #include <stdlib.h>
58 1.1 jtc #include "pax.h"
59 1.1 jtc #include "pat_rep.h"
60 1.1 jtc #include "extern.h"
61 1.1 jtc
62 1.1 jtc /*
63 1.1 jtc * routines to handle pattern matching, name modification (regular expression
64 1.1 jtc * substitution and interactive renames), and destination name modification for
65 1.1 jtc * copy (-rw). Both file name and link names are adjusted as required in these
66 1.1 jtc * routines.
67 1.1 jtc */
68 1.1 jtc
69 1.1 jtc #define MAXSUBEXP 10 /* max subexpressions, DO NOT CHANGE */
70 1.1 jtc static PATTERN *pathead = NULL; /* file pattern match list head */
71 1.1 jtc static PATTERN *pattail = NULL; /* file pattern match list tail */
72 1.1 jtc static REPLACE *rephead = NULL; /* replacement string list head */
73 1.1 jtc static REPLACE *reptail = NULL; /* replacement string list tail */
74 1.1 jtc
75 1.14 christos static int rep_name(char *, size_t, int *, int);
76 1.12 lukem static int tty_rename(ARCHD *);
77 1.12 lukem static int fix_path(char *, int *, char *, int);
78 1.12 lukem static int fn_match(char *, char *, char **);
79 1.12 lukem static char * range_match(char *, int);
80 1.15 christos static int checkdotdot(const char *);
81 1.1 jtc #ifdef NET2_REGEX
82 1.12 lukem static int resub(regexp *, char *, char *, char *);
83 1.1 jtc #else
84 1.12 lukem static int resub(regex_t *, regmatch_t *, char *, char *, char *, char *);
85 1.1 jtc #endif
86 1.1 jtc
87 1.1 jtc /*
88 1.1 jtc * rep_add()
89 1.1 jtc * parses the -s replacement string; compiles the regular expression
90 1.25 snj * and stores the compiled value and its replacement string together in
91 1.1 jtc * replacement string list. Input to this function is of the form:
92 1.11 itohy * /old/new/pg
93 1.1 jtc * The first char in the string specifies the delimiter used by this
94 1.1 jtc * replacement string. "Old" is a regular expression in "ed" format which
95 1.1 jtc * is compiled by regcomp() and is applied to filenames. "new" is the
96 1.1 jtc * substitution string; p and g are options flags for printing and global
97 1.1 jtc * replacement (over the single filename)
98 1.1 jtc * Return:
99 1.1 jtc * 0 if a proper replacement string and regular expression was added to
100 1.1 jtc * the list of replacement patterns; -1 otherwise.
101 1.1 jtc */
102 1.1 jtc
103 1.1 jtc int
104 1.5 tls rep_add(char *str)
105 1.1 jtc {
106 1.5 tls char *pt1;
107 1.5 tls char *pt2;
108 1.5 tls REPLACE *rep;
109 1.22 dsl #ifdef NET2_REGEX
110 1.22 dsl static const char rebuf[] = "Error";
111 1.22 dsl #else
112 1.5 tls int res;
113 1.1 jtc char rebuf[BUFSIZ];
114 1.12 lukem #endif
115 1.1 jtc
116 1.1 jtc /*
117 1.1 jtc * throw out the bad parameters
118 1.1 jtc */
119 1.1 jtc if ((str == NULL) || (*str == '\0')) {
120 1.7 christos tty_warn(1, "Empty replacement string");
121 1.24 dsl return -1;
122 1.1 jtc }
123 1.1 jtc
124 1.1 jtc /*
125 1.1 jtc * first character in the string specifies what the delimiter is for
126 1.14 christos * this expression.
127 1.1 jtc */
128 1.14 christos for (pt1 = str+1; *pt1; pt1++) {
129 1.14 christos if (*pt1 == '\\') {
130 1.14 christos pt1++;
131 1.14 christos continue;
132 1.14 christos }
133 1.14 christos if (*pt1 == *str)
134 1.14 christos break;
135 1.14 christos }
136 1.22 dsl if (*pt1 == 0) {
137 1.7 christos tty_warn(1, "Invalid replacement string %s", str);
138 1.24 dsl return -1;
139 1.1 jtc }
140 1.1 jtc
141 1.1 jtc /*
142 1.1 jtc * allocate space for the node that handles this replacement pattern
143 1.1 jtc * and split out the regular expression and try to compile it
144 1.1 jtc */
145 1.1 jtc if ((rep = (REPLACE *)malloc(sizeof(REPLACE))) == NULL) {
146 1.7 christos tty_warn(1, "Unable to allocate memory for replacement string");
147 1.24 dsl return -1;
148 1.1 jtc }
149 1.1 jtc
150 1.1 jtc *pt1 = '\0';
151 1.12 lukem #ifdef NET2_REGEX
152 1.1 jtc if ((rep->rcmp = regcomp(str+1)) == NULL) {
153 1.12 lukem #else
154 1.1 jtc if ((res = regcomp(&(rep->rcmp), str+1, 0)) != 0) {
155 1.1 jtc regerror(res, &(rep->rcmp), rebuf, sizeof(rebuf));
156 1.22 dsl #endif
157 1.7 christos tty_warn(1, "%s while compiling regular expression %s", rebuf,
158 1.7 christos str);
159 1.1 jtc (void)free((char *)rep);
160 1.24 dsl return -1;
161 1.1 jtc }
162 1.1 jtc
163 1.1 jtc /*
164 1.1 jtc * put the delimiter back in case we need an error message and
165 1.1 jtc * locate the delimiter at the end of the replacement string
166 1.1 jtc * we then point the node at the new substitution string
167 1.1 jtc */
168 1.1 jtc *pt1++ = *str;
169 1.14 christos for (pt2 = pt1; *pt2; pt2++) {
170 1.14 christos if (*pt2 == '\\') {
171 1.14 christos pt2++;
172 1.14 christos continue;
173 1.14 christos }
174 1.14 christos if (*pt2 == *str)
175 1.14 christos break;
176 1.14 christos }
177 1.22 dsl if (*pt2 == 0) {
178 1.14 christos #ifdef NET2_REGEX
179 1.14 christos (void)free((char *)rep->rcmp);
180 1.14 christos #else
181 1.14 christos regfree(&(rep->rcmp));
182 1.14 christos #endif
183 1.14 christos (void)free((char *)rep);
184 1.14 christos tty_warn(1, "Invalid replacement string %s", str);
185 1.24 dsl return -1;
186 1.14 christos }
187 1.14 christos
188 1.14 christos *pt2 = '\0';
189 1.17 rafal
190 1.18 wiz /* Make sure to dup replacement, who knows where it came from! */
191 1.17 rafal if ((rep->nstr = strdup(pt1)) == NULL) {
192 1.17 rafal #ifdef NET2_REGEX
193 1.17 rafal (void)free((char *)rep->rcmp);
194 1.17 rafal #else
195 1.17 rafal regfree(&(rep->rcmp));
196 1.17 rafal #endif
197 1.17 rafal (void)free((char *)rep);
198 1.17 rafal tty_warn(1, "Unable to allocate memory for replacement string");
199 1.24 dsl return -1;
200 1.17 rafal }
201 1.17 rafal
202 1.1 jtc pt1 = pt2++;
203 1.1 jtc rep->flgs = 0;
204 1.1 jtc
205 1.1 jtc /*
206 1.1 jtc * set the options if any
207 1.1 jtc */
208 1.1 jtc while (*pt2 != '\0') {
209 1.1 jtc switch(*pt2) {
210 1.1 jtc case 'g':
211 1.1 jtc case 'G':
212 1.1 jtc rep->flgs |= GLOB;
213 1.1 jtc break;
214 1.1 jtc case 'p':
215 1.1 jtc case 'P':
216 1.1 jtc rep->flgs |= PRNT;
217 1.1 jtc break;
218 1.27 christos case 's':
219 1.27 christos case 'S':
220 1.27 christos rep->flgs |= SYML;
221 1.27 christos break;
222 1.1 jtc default:
223 1.12 lukem #ifdef NET2_REGEX
224 1.1 jtc (void)free((char *)rep->rcmp);
225 1.12 lukem #else
226 1.1 jtc regfree(&(rep->rcmp));
227 1.12 lukem #endif
228 1.1 jtc (void)free((char *)rep);
229 1.1 jtc *pt1 = *str;
230 1.7 christos tty_warn(1, "Invalid replacement string option %s",
231 1.7 christos str);
232 1.24 dsl return -1;
233 1.1 jtc }
234 1.1 jtc ++pt2;
235 1.1 jtc }
236 1.1 jtc
237 1.1 jtc /*
238 1.1 jtc * all done, link it in at the end
239 1.1 jtc */
240 1.1 jtc rep->fow = NULL;
241 1.1 jtc if (rephead == NULL) {
242 1.1 jtc reptail = rephead = rep;
243 1.24 dsl return 0;
244 1.1 jtc }
245 1.1 jtc reptail->fow = rep;
246 1.1 jtc reptail = rep;
247 1.24 dsl return 0;
248 1.1 jtc }
249 1.1 jtc
250 1.1 jtc /*
251 1.1 jtc * pat_add()
252 1.1 jtc * add a pattern match to the pattern match list. Pattern matches are used
253 1.1 jtc * to select which archive members are extracted. (They appear as
254 1.1 jtc * arguments to pax in the list and read modes). If no patterns are
255 1.1 jtc * supplied to pax, all members in the archive will be selected (and the
256 1.1 jtc * pattern match list is empty).
257 1.10 is *
258 1.1 jtc * Return:
259 1.1 jtc * 0 if the pattern was added to the list, -1 otherwise
260 1.1 jtc */
261 1.1 jtc
262 1.1 jtc int
263 1.14 christos pat_add(char *str, char *chdn)
264 1.1 jtc {
265 1.5 tls PATTERN *pt;
266 1.1 jtc
267 1.1 jtc /*
268 1.1 jtc * throw out the junk
269 1.1 jtc */
270 1.1 jtc if ((str == NULL) || (*str == '\0')) {
271 1.7 christos tty_warn(1, "Empty pattern string");
272 1.24 dsl return -1;
273 1.1 jtc }
274 1.1 jtc
275 1.1 jtc /*
276 1.1 jtc * allocate space for the pattern and store the pattern. the pattern is
277 1.1 jtc * part of argv so do not bother to copy it, just point at it. Add the
278 1.1 jtc * node to the end of the pattern list
279 1.1 jtc */
280 1.1 jtc if ((pt = (PATTERN *)malloc(sizeof(PATTERN))) == NULL) {
281 1.7 christos tty_warn(1, "Unable to allocate memory for pattern string");
282 1.24 dsl return -1;
283 1.1 jtc }
284 1.1 jtc
285 1.1 jtc pt->pstr = str;
286 1.1 jtc pt->pend = NULL;
287 1.1 jtc pt->plen = strlen(str);
288 1.1 jtc pt->fow = NULL;
289 1.14 christos pt->flgs = 0;
290 1.14 christos pt->chdname = chdn;
291 1.1 jtc if (pathead == NULL) {
292 1.1 jtc pattail = pathead = pt;
293 1.24 dsl return 0;
294 1.1 jtc }
295 1.1 jtc pattail->fow = pt;
296 1.1 jtc pattail = pt;
297 1.24 dsl return 0;
298 1.1 jtc }
299 1.1 jtc
300 1.1 jtc /*
301 1.1 jtc * pat_chk()
302 1.1 jtc * complain if any the user supplied pattern did not result in a match to
303 1.1 jtc * a selected archive member.
304 1.1 jtc */
305 1.1 jtc
306 1.1 jtc void
307 1.1 jtc pat_chk(void)
308 1.1 jtc {
309 1.5 tls PATTERN *pt;
310 1.5 tls int wban = 0;
311 1.1 jtc
312 1.1 jtc /*
313 1.1 jtc * walk down the list checking the flags to make sure MTCH was set,
314 1.1 jtc * if not complain
315 1.1 jtc */
316 1.1 jtc for (pt = pathead; pt != NULL; pt = pt->fow) {
317 1.14 christos if (pt->flgs & MTCH)
318 1.1 jtc continue;
319 1.1 jtc if (!wban) {
320 1.7 christos tty_warn(1, "WARNING! These patterns were not matched:");
321 1.1 jtc ++wban;
322 1.1 jtc }
323 1.1 jtc (void)fprintf(stderr, "%s\n", pt->pstr);
324 1.1 jtc }
325 1.1 jtc }
326 1.1 jtc
327 1.1 jtc /*
328 1.1 jtc * pat_sel()
329 1.1 jtc * the archive member which matches a pattern was selected. Mark the
330 1.1 jtc * pattern as having selected an archive member. arcn->pat points at the
331 1.1 jtc * pattern that was matched. arcn->pat is set in pat_match()
332 1.1 jtc *
333 1.1 jtc * NOTE: When the -c option is used, we are called when there was no match
334 1.1 jtc * by pat_match() (that means we did match before the inverted sense of
335 1.18 wiz * the logic). Now this seems really strange at first, but with -c we
336 1.26 msaitoh * need to keep track of those patterns that cause an archive member to
337 1.26 msaitoh * NOT be selected (it found an archive member with a specified pattern)
338 1.1 jtc * Return:
339 1.1 jtc * 0 if the pattern pointed at by arcn->pat was tagged as creating a
340 1.1 jtc * match, -1 otherwise.
341 1.1 jtc */
342 1.1 jtc
343 1.1 jtc int
344 1.5 tls pat_sel(ARCHD *arcn)
345 1.1 jtc {
346 1.5 tls PATTERN *pt;
347 1.5 tls PATTERN **ppt;
348 1.5 tls int len;
349 1.1 jtc
350 1.1 jtc /*
351 1.1 jtc * if no patterns just return
352 1.1 jtc */
353 1.1 jtc if ((pathead == NULL) || ((pt = arcn->pat) == NULL))
354 1.24 dsl return 0;
355 1.1 jtc
356 1.1 jtc /*
357 1.1 jtc * when we are NOT limited to a single match per pattern mark the
358 1.1 jtc * pattern and return
359 1.1 jtc */
360 1.1 jtc if (!nflag) {
361 1.1 jtc pt->flgs |= MTCH;
362 1.24 dsl return 0;
363 1.1 jtc }
364 1.1 jtc
365 1.1 jtc /*
366 1.1 jtc * we reach this point only when we allow a single selected match per
367 1.11 itohy * pattern, if the pattern matches a directory and we do not have -d
368 1.1 jtc * (dflag) we are done with this pattern. We may also be handed a file
369 1.1 jtc * in the subtree of a directory. in that case when we are operating
370 1.1 jtc * with -d, this pattern was already selected and we are done
371 1.1 jtc */
372 1.1 jtc if (pt->flgs & DIR_MTCH)
373 1.24 dsl return 0;
374 1.1 jtc
375 1.1 jtc if (!dflag && ((pt->pend != NULL) || (arcn->type == PAX_DIR))) {
376 1.1 jtc /*
377 1.1 jtc * ok we matched a directory and we are allowing
378 1.1 jtc * subtree matches but because of the -n only its children will
379 1.1 jtc * match. This is tagged as a DIR_MTCH type.
380 1.1 jtc * WATCH IT, the code assumes that pt->pend points
381 1.1 jtc * into arcn->name and arcn->name has not been modified.
382 1.1 jtc * If not we will have a big mess. Yup this is another kludge
383 1.1 jtc */
384 1.1 jtc
385 1.1 jtc /*
386 1.1 jtc * if this was a prefix match, remove trailing part of path
387 1.1 jtc * so we can copy it. Future matches will be exact prefix match
388 1.1 jtc */
389 1.1 jtc if (pt->pend != NULL)
390 1.1 jtc *pt->pend = '\0';
391 1.11 itohy
392 1.1 jtc if ((pt->pstr = strdup(arcn->name)) == NULL) {
393 1.7 christos tty_warn(1, "Pattern select out of memory");
394 1.1 jtc if (pt->pend != NULL)
395 1.1 jtc *pt->pend = '/';
396 1.1 jtc pt->pend = NULL;
397 1.24 dsl return -1;
398 1.1 jtc }
399 1.1 jtc
400 1.1 jtc /*
401 1.1 jtc * put the trailing / back in the source string
402 1.1 jtc */
403 1.1 jtc if (pt->pend != NULL) {
404 1.1 jtc *pt->pend = '/';
405 1.1 jtc pt->pend = NULL;
406 1.1 jtc }
407 1.1 jtc pt->plen = strlen(pt->pstr);
408 1.1 jtc
409 1.1 jtc /*
410 1.1 jtc * strip off any trailing /, this should really never happen
411 1.1 jtc */
412 1.1 jtc len = pt->plen - 1;
413 1.1 jtc if (*(pt->pstr + len) == '/') {
414 1.1 jtc *(pt->pstr + len) = '\0';
415 1.1 jtc pt->plen = len;
416 1.11 itohy }
417 1.1 jtc pt->flgs = DIR_MTCH | MTCH;
418 1.1 jtc arcn->pat = pt;
419 1.24 dsl return 0;
420 1.1 jtc }
421 1.1 jtc
422 1.1 jtc /*
423 1.1 jtc * we are then done with this pattern, so we delete it from the list
424 1.1 jtc * because it can never be used for another match.
425 1.1 jtc * Seems kind of strange to do for a -c, but the pax spec is really
426 1.18 wiz * vague on the interaction of -c, -n, and -d. We assume that when -c
427 1.1 jtc * and the pattern rejects a member (i.e. it matched it) it is done.
428 1.1 jtc * In effect we place the order of the flags as having -c last.
429 1.1 jtc */
430 1.1 jtc pt = pathead;
431 1.1 jtc ppt = &pathead;
432 1.1 jtc while ((pt != NULL) && (pt != arcn->pat)) {
433 1.1 jtc ppt = &(pt->fow);
434 1.1 jtc pt = pt->fow;
435 1.1 jtc }
436 1.1 jtc
437 1.1 jtc if (pt == NULL) {
438 1.1 jtc /*
439 1.1 jtc * should never happen....
440 1.1 jtc */
441 1.26 msaitoh tty_warn(1, "Pattern list inconsistent");
442 1.24 dsl return -1;
443 1.1 jtc }
444 1.1 jtc *ppt = pt->fow;
445 1.1 jtc (void)free((char *)pt);
446 1.1 jtc arcn->pat = NULL;
447 1.24 dsl return 0;
448 1.1 jtc }
449 1.1 jtc
450 1.1 jtc /*
451 1.1 jtc * pat_match()
452 1.1 jtc * see if this archive member matches any supplied pattern, if a match
453 1.1 jtc * is found, arcn->pat is set to point at the potential pattern. Later if
454 1.1 jtc * this archive member is "selected" we process and mark the pattern as
455 1.1 jtc * one which matched a selected archive member (see pat_sel())
456 1.1 jtc * Return:
457 1.11 itohy * 0 if this archive member should be processed, 1 if it should be
458 1.1 jtc * skipped and -1 if we are done with all patterns (and pax should quit
459 1.1 jtc * looking for more members)
460 1.1 jtc */
461 1.1 jtc
462 1.1 jtc int
463 1.5 tls pat_match(ARCHD *arcn)
464 1.1 jtc {
465 1.5 tls PATTERN *pt;
466 1.1 jtc
467 1.1 jtc arcn->pat = NULL;
468 1.1 jtc
469 1.1 jtc /*
470 1.1 jtc * if there are no more patterns and we have -n (and not -c) we are
471 1.1 jtc * done. otherwise with no patterns to match, matches all
472 1.1 jtc */
473 1.1 jtc if (pathead == NULL) {
474 1.1 jtc if (nflag && !cflag)
475 1.24 dsl return -1;
476 1.24 dsl return 0;
477 1.1 jtc }
478 1.1 jtc
479 1.1 jtc /*
480 1.1 jtc * have to search down the list one at a time looking for a match.
481 1.1 jtc */
482 1.1 jtc pt = pathead;
483 1.1 jtc while (pt != NULL) {
484 1.1 jtc /*
485 1.1 jtc * check for a file name match unless we have DIR_MTCH set in
486 1.1 jtc * this pattern then we want a prefix match
487 1.1 jtc */
488 1.1 jtc if (pt->flgs & DIR_MTCH) {
489 1.1 jtc /*
490 1.1 jtc * this pattern was matched before to a directory
491 1.1 jtc * as we must have -n set for this (but not -d). We can
492 1.1 jtc * only match CHILDREN of that directory so we must use
493 1.1 jtc * an exact prefix match (no wildcards).
494 1.1 jtc */
495 1.1 jtc if ((arcn->name[pt->plen] == '/') &&
496 1.1 jtc (strncmp(pt->pstr, arcn->name, pt->plen) == 0))
497 1.1 jtc break;
498 1.1 jtc } else if (fn_match(pt->pstr, arcn->name, &pt->pend) == 0)
499 1.1 jtc break;
500 1.1 jtc pt = pt->fow;
501 1.1 jtc }
502 1.1 jtc
503 1.1 jtc /*
504 1.1 jtc * return the result, remember that cflag (-c) inverts the sense of a
505 1.1 jtc * match
506 1.1 jtc */
507 1.1 jtc if (pt == NULL)
508 1.24 dsl return cflag ? 0 : 1;
509 1.1 jtc
510 1.1 jtc /*
511 1.1 jtc * we had a match, now when we invert the sense (-c) we reject this
512 1.1 jtc * member. However we have to tag the pattern a being successful, (in a
513 1.26 msaitoh * match, not in selecting an archive member) so we call pat_sel()
514 1.26 msaitoh * here.
515 1.1 jtc */
516 1.1 jtc arcn->pat = pt;
517 1.1 jtc if (!cflag)
518 1.24 dsl return 0;
519 1.1 jtc
520 1.1 jtc if (pat_sel(arcn) < 0)
521 1.24 dsl return -1;
522 1.1 jtc arcn->pat = NULL;
523 1.24 dsl return 1;
524 1.1 jtc }
525 1.1 jtc
526 1.1 jtc /*
527 1.1 jtc * fn_match()
528 1.1 jtc * Return:
529 1.11 itohy * 0 if this archive member should be processed, 1 if it should be
530 1.1 jtc * skipped and -1 if we are done with all patterns (and pax should quit
531 1.1 jtc * looking for more members)
532 1.1 jtc * Note: *pend may be changed to show where the prefix ends.
533 1.1 jtc */
534 1.1 jtc
535 1.1 jtc static int
536 1.5 tls fn_match(char *pattern, char *string, char **pend)
537 1.1 jtc {
538 1.5 tls char c;
539 1.1 jtc char test;
540 1.1 jtc
541 1.1 jtc *pend = NULL;
542 1.1 jtc for (;;) {
543 1.1 jtc switch (c = *pattern++) {
544 1.1 jtc case '\0':
545 1.1 jtc /*
546 1.1 jtc * Ok we found an exact match
547 1.1 jtc */
548 1.1 jtc if (*string == '\0')
549 1.24 dsl return 0;
550 1.1 jtc
551 1.1 jtc /*
552 1.1 jtc * Check if it is a prefix match
553 1.1 jtc */
554 1.1 jtc if ((dflag == 1) || (*string != '/'))
555 1.24 dsl return -1;
556 1.1 jtc
557 1.1 jtc /*
558 1.1 jtc * It is a prefix match, remember where the trailing
559 1.1 jtc * / is located
560 1.1 jtc */
561 1.1 jtc *pend = string;
562 1.24 dsl return 0;
563 1.1 jtc case '?':
564 1.1 jtc if ((test = *string++) == '\0')
565 1.1 jtc return (-1);
566 1.1 jtc break;
567 1.1 jtc case '*':
568 1.1 jtc c = *pattern;
569 1.1 jtc /*
570 1.11 itohy * Collapse multiple *'s.
571 1.1 jtc */
572 1.1 jtc while (c == '*')
573 1.1 jtc c = *++pattern;
574 1.1 jtc
575 1.1 jtc /*
576 1.1 jtc * Optimized hack for pattern with a * at the end
577 1.1 jtc */
578 1.1 jtc if (c == '\0')
579 1.1 jtc return (0);
580 1.1 jtc
581 1.1 jtc /*
582 1.1 jtc * General case, use recursion.
583 1.1 jtc */
584 1.1 jtc while ((test = *string) != '\0') {
585 1.1 jtc if (!fn_match(pattern, string, pend))
586 1.1 jtc return (0);
587 1.1 jtc ++string;
588 1.1 jtc }
589 1.1 jtc return (-1);
590 1.1 jtc case '[':
591 1.1 jtc /*
592 1.1 jtc * range match
593 1.1 jtc */
594 1.1 jtc if (((test = *string++) == '\0') ||
595 1.1 jtc ((pattern = range_match(pattern, test)) == NULL))
596 1.1 jtc return (-1);
597 1.1 jtc break;
598 1.1 jtc case '\\':
599 1.1 jtc default:
600 1.1 jtc if (c != *string++)
601 1.1 jtc return (-1);
602 1.1 jtc break;
603 1.1 jtc }
604 1.1 jtc }
605 1.1 jtc /* NOTREACHED */
606 1.1 jtc }
607 1.1 jtc
/*
 * range_match()
 *	match the character test against a bracket expression. pattern points
 *	just past the opening `['. A leading `!' negates the expression.
 *	"x-y" stands for every character from x to y inclusive, unless the
 *	`-' is directly followed by `]' or by the end of the pattern, in
 *	which case it is an ordinary character.
 * Return:
 *	pointer just past the closing `]' if test is accepted, NULL if it is
 *	rejected or if the expression has no closing `]'
 */

static char *
range_match(char *pattern, int test)
{
	int negate = 0;
	int found = 0;
	char lo;
	char hi;

	if (*pattern == '!') {
		negate = 1;
		++pattern;
	}

	for (;;) {
		lo = *pattern++;
		if (lo == ']')
			break;

		/*
		 * Illegal pattern
		 */
		if (lo == '\0')
			return (NULL);

		if (pattern[0] == '-') {
			hi = pattern[1];
			if ((hi != '\0') && (hi != ']')) {
				if ((lo <= test) && (test <= hi))
					found = 1;
				pattern += 2;
				continue;
			}
		}
		if (lo == test)
			found = 1;
	}
	return ((found != negate) ? pattern : NULL);
}
636 1.1 jtc
637 1.1 jtc /*
638 1.1 jtc * mod_name()
639 1.1 jtc * modify a selected file name. first attempt to apply replacement string
640 1.1 jtc * expressions, then apply interactive file rename. We apply replacement
641 1.1 jtc * string expressions to both filenames and file links (if we didn't the
642 1.1 jtc * links would point to the wrong place, and we could never be able to
643 1.1 jtc * move an archive that has a file link in it). When we rename files
644 1.1 jtc * interactively, we store that mapping (old name to user input name) so
645 1.1 jtc * if we spot any file links to the old file name in the future, we will
646 1.1 jtc * know exactly how to fix the file link.
647 1.1 jtc * Return:
648 1.11 itohy * 0 continue to process file, 1 skip this file, -1 pax is finished
649 1.1 jtc */
650 1.1 jtc
651 1.1 jtc int
652 1.27 christos mod_name(ARCHD *arcn, int flags)
653 1.1 jtc {
654 1.5 tls int res = 0;
655 1.1 jtc
656 1.15 christos if (secure) {
657 1.15 christos if (checkdotdot(arcn->name)) {
658 1.15 christos tty_warn(0, "Ignoring file containing `..' (%s)",
659 1.15 christos arcn->name);
660 1.15 christos return 1;
661 1.15 christos }
662 1.16 christos #ifdef notdef
663 1.15 christos if (checkdotdot(arcn->ln_name)) {
664 1.15 christos tty_warn(0, "Ignoring link containing `..' (%s)",
665 1.15 christos arcn->ln_name);
666 1.15 christos return 1;
667 1.15 christos }
668 1.16 christos #endif
669 1.15 christos }
670 1.15 christos
671 1.14 christos /*
672 1.1 jtc * IMPORTANT: We have a problem. what do we do with symlinks?
673 1.1 jtc * Modifying a hard link name makes sense, as we know the file it
674 1.1 jtc * points at should have been seen already in the archive (and if it
675 1.1 jtc * wasn't seen because of a read error or a bad archive, we lose
676 1.1 jtc * anyway). But there are no such requirements for symlinks. On one
677 1.1 jtc * hand the symlink that refers to a file in the archive will have to
678 1.1 jtc * be modified to so it will still work at its new location in the
679 1.1 jtc * file system. On the other hand a symlink that points elsewhere (and
680 1.1 jtc * should continue to do so) should not be modified. There is clearly
681 1.1 jtc * no perfect solution here. So we handle them like hardlinks. Clearly
682 1.1 jtc * a replacement made by the interactive rename mapping is very likely
683 1.1 jtc * to be correct since it applies to a single file and is an exact
684 1.1 jtc * match. The regular expression replacements are a little harder to
685 1.1 jtc * justify though. We claim that the symlink name is only likely
686 1.1 jtc * to be replaced when it points within the file tree being moved and
687 1.1 jtc * in that case it should be modified. what we really need to do is to
688 1.1 jtc * call an oracle here. :)
689 1.1 jtc */
690 1.1 jtc if (rephead != NULL) {
691 1.27 christos flags |= (flags & RENM) ? PRNT : 0;
692 1.1 jtc /*
693 1.1 jtc * we have replacement strings, modify the name and the link
694 1.1 jtc * name if any.
695 1.1 jtc */
696 1.14 christos if ((res = rep_name(arcn->name, sizeof(arcn->name),
697 1.27 christos &(arcn->nlen), flags)) != 0)
698 1.24 dsl return res;
699 1.1 jtc
700 1.1 jtc if (((arcn->type == PAX_SLK) || (arcn->type == PAX_HLK) ||
701 1.1 jtc (arcn->type == PAX_HRG)) &&
702 1.27 christos ((res = rep_name(arcn->ln_name,
703 1.27 christos sizeof(arcn->ln_name), &(arcn->ln_nlen),
704 1.27 christos flags | (arcn->type == PAX_SLK ? SYML : 0))) != 0))
705 1.24 dsl return res;
706 1.1 jtc }
707 1.1 jtc
708 1.1 jtc if (iflag) {
709 1.1 jtc /*
710 1.1 jtc * perform interactive file rename, then map the link if any
711 1.1 jtc */
712 1.1 jtc if ((res = tty_rename(arcn)) != 0)
713 1.24 dsl return res;
714 1.1 jtc if ((arcn->type == PAX_SLK) || (arcn->type == PAX_HLK) ||
715 1.1 jtc (arcn->type == PAX_HRG))
716 1.14 christos sub_name(arcn->ln_name, &(arcn->ln_nlen), sizeof(arcn->ln_name));
717 1.1 jtc }
718 1.23 jmc
719 1.23 jmc /*
720 1.23 jmc * Strip off leading '/' if appropriate.
721 1.23 jmc * Currently, this option is only set for the tar format.
722 1.23 jmc */
723 1.23 jmc if (rmleadslash && arcn->name[0] == '/') {
724 1.23 jmc if (arcn->name[1] == '\0') {
725 1.23 jmc arcn->name[0] = '.';
726 1.23 jmc } else {
727 1.23 jmc (void)memmove(arcn->name, &arcn->name[1],
728 1.23 jmc strlen(arcn->name));
729 1.23 jmc arcn->nlen--;
730 1.23 jmc }
731 1.23 jmc if (rmleadslash < 2) {
732 1.23 jmc rmleadslash = 2;
733 1.23 jmc tty_warn(0, "Removing leading / from absolute path names in the archive");
734 1.23 jmc }
735 1.23 jmc }
736 1.23 jmc if (rmleadslash && arcn->ln_name[0] == '/' &&
737 1.23 jmc (arcn->type == PAX_HLK || arcn->type == PAX_HRG)) {
738 1.23 jmc if (arcn->ln_name[1] == '\0') {
739 1.23 jmc arcn->ln_name[0] = '.';
740 1.23 jmc } else {
741 1.23 jmc (void)memmove(arcn->ln_name, &arcn->ln_name[1],
742 1.23 jmc strlen(arcn->ln_name));
743 1.23 jmc arcn->ln_nlen--;
744 1.23 jmc }
745 1.23 jmc if (rmleadslash < 2) {
746 1.23 jmc rmleadslash = 2;
747 1.23 jmc tty_warn(0, "Removing leading / from absolute path names in the archive");
748 1.23 jmc }
749 1.23 jmc }
750 1.23 jmc
751 1.24 dsl return res;
752 1.1 jtc }
753 1.1 jtc
754 1.1 jtc /*
755 1.1 jtc * tty_rename()
756 1.1 jtc * Prompt the user for a replacement file name. A "." keeps the old name,
757 1.1 jtc * a empty line skips the file, and an EOF on reading the tty, will cause
758 1.1 jtc * pax to stop processing and exit. Otherwise the file name input, replaces
759 1.1 jtc * the old one.
760 1.1 jtc * Return:
761 1.1 jtc * 0 process this file, 1 skip this file, -1 we need to exit pax
762 1.1 jtc */
763 1.1 jtc
764 1.1 jtc static int
765 1.5 tls tty_rename(ARCHD *arcn)
766 1.1 jtc {
767 1.1 jtc char tmpname[PAXPATHLEN+2];
768 1.1 jtc int res;
769 1.1 jtc
770 1.1 jtc /*
771 1.1 jtc * prompt user for the replacement name for a file, keep trying until
772 1.1 jtc * we get some reasonable input. Archives may have more than one file
773 1.1 jtc * on them with the same name (from updates etc). We print verbose info
774 1.1 jtc * on the file so the user knows what is up.
775 1.1 jtc */
776 1.1 jtc tty_prnt("\nATTENTION: %s interactive file rename operation.\n", argv0);
777 1.1 jtc
778 1.1 jtc for (;;) {
779 1.1 jtc ls_tty(arcn);
780 1.1 jtc tty_prnt("Input new name, or a \".\" to keep the old name, ");
781 1.1 jtc tty_prnt("or a \"return\" to skip this file.\n");
782 1.1 jtc tty_prnt("Input > ");
783 1.1 jtc if (tty_read(tmpname, sizeof(tmpname)) < 0)
784 1.24 dsl return -1;
785 1.1 jtc if (strcmp(tmpname, "..") == 0) {
786 1.1 jtc tty_prnt("Try again, illegal file name: ..\n");
787 1.1 jtc continue;
788 1.1 jtc }
789 1.1 jtc if (strlen(tmpname) > PAXPATHLEN) {
790 1.1 jtc tty_prnt("Try again, file name too long\n");
791 1.1 jtc continue;
792 1.1 jtc }
793 1.1 jtc break;
794 1.1 jtc }
795 1.1 jtc
796 1.1 jtc /*
797 1.1 jtc * empty file name, skips this file. a "." leaves it alone
798 1.1 jtc */
799 1.1 jtc if (tmpname[0] == '\0') {
800 1.1 jtc tty_prnt("Skipping file.\n");
801 1.24 dsl return 1;
802 1.1 jtc }
803 1.1 jtc if ((tmpname[0] == '.') && (tmpname[1] == '\0')) {
804 1.1 jtc tty_prnt("Processing continues, name unchanged.\n");
805 1.24 dsl return 0;
806 1.1 jtc }
807 1.1 jtc
808 1.1 jtc /*
809 1.1 jtc * ok the name changed. We may run into links that point at this
810 1.1 jtc * file later. we have to remember where the user sent the file
811 1.1 jtc * in order to repair any links.
812 1.1 jtc */
813 1.1 jtc tty_prnt("Processing continues, name changed to: %s\n", tmpname);
814 1.1 jtc res = add_name(arcn->name, arcn->nlen, tmpname);
815 1.14 christos arcn->nlen = strlcpy(arcn->name, tmpname, sizeof(arcn->name));
816 1.1 jtc if (res < 0)
817 1.24 dsl return -1;
818 1.24 dsl return 0;
819 1.1 jtc }
820 1.1 jtc
821 1.1 jtc /*
822 1.1 jtc * set_dest()
823 1.1 jtc * fix up the file name and the link name (if any) so this file will land
824 1.1 jtc * in the destination directory (used during copy() -rw).
825 1.1 jtc * Return:
826 1.1 jtc * 0 if ok, -1 if failure (name too long)
827 1.1 jtc */
828 1.1 jtc
829 1.1 jtc int
830 1.5 tls set_dest(ARCHD *arcn, char *dest_dir, int dir_len)
831 1.1 jtc {
832 1.1 jtc if (fix_path(arcn->name, &(arcn->nlen), dest_dir, dir_len) < 0)
833 1.24 dsl return -1;
834 1.1 jtc
835 1.1 jtc /*
836 1.1 jtc * It is really hard to deal with symlinks here, we cannot be sure
837 1.1 jtc * if the name they point was moved (or will be moved). It is best to
838 1.1 jtc * leave them alone.
839 1.1 jtc */
840 1.1 jtc if ((arcn->type != PAX_HLK) && (arcn->type != PAX_HRG))
841 1.24 dsl return 0;
842 1.1 jtc
843 1.1 jtc if (fix_path(arcn->ln_name, &(arcn->ln_nlen), dest_dir, dir_len) < 0)
844 1.24 dsl return -1;
845 1.24 dsl return 0;
846 1.1 jtc }
847 1.1 jtc
848 1.1 jtc /*
849 1.1 jtc * fix_path
850 1.1 jtc * concatenate dir_name and or_name and store the result in or_name (if
851 1.1 jtc * it fits). This is one ugly function.
852 1.1 jtc * Return:
853 1.1 jtc * 0 if ok, -1 if the final name is too long
854 1.1 jtc */
855 1.1 jtc
856 1.1 jtc static int
857 1.1 jtc fix_path( char *or_name, int *or_len, char *dir_name, int dir_len)
858 1.1 jtc {
859 1.5 tls char *src;
860 1.5 tls char *dest;
861 1.5 tls char *start;
862 1.1 jtc int len;
863 1.1 jtc
864 1.1 jtc /*
865 1.1 jtc * we shift the or_name to the right enough to tack in the dir_name
866 1.1 jtc * at the front. We make sure we have enough space for it all before
867 1.1 jtc * we start. since dest always ends in a slash, we skip of or_name
868 1.1 jtc * if it also starts with one.
869 1.1 jtc */
870 1.1 jtc start = or_name;
871 1.1 jtc src = start + *or_len;
872 1.1 jtc dest = src + dir_len;
873 1.1 jtc if (*start == '/') {
874 1.1 jtc ++start;
875 1.1 jtc --dest;
876 1.1 jtc }
877 1.1 jtc if ((len = dest - or_name) > PAXPATHLEN) {
878 1.7 christos tty_warn(1, "File name %s/%s, too long", dir_name, start);
879 1.24 dsl return -1;
880 1.1 jtc }
881 1.1 jtc *or_len = len;
882 1.1 jtc
883 1.1 jtc /*
884 1.11 itohy * enough space, shift
885 1.1 jtc */
886 1.1 jtc while (src >= start)
887 1.1 jtc *dest-- = *src--;
888 1.1 jtc src = dir_name + dir_len - 1;
889 1.1 jtc
890 1.1 jtc /*
891 1.1 jtc * splice in the destination directory name
892 1.1 jtc */
893 1.1 jtc while (src >= dir_name)
894 1.1 jtc *dest-- = *src--;
895 1.1 jtc
896 1.1 jtc *(or_name + len) = '\0';
897 1.24 dsl return 0;
898 1.1 jtc }
899 1.1 jtc
900 1.1 jtc /*
901 1.1 jtc * rep_name()
902 1.1 jtc * walk down the list of replacement strings applying each one in order.
903 1.1 jtc * when we find one with a successful substitution, we modify the name
904 1.1 jtc * as specified. if required, we print the results. if the resulting name
905 1.1 jtc * is empty, we will skip this archive member. We use the regexp(3)
906 1.1 jtc * routines (regexp() ought to win a prize as having the most cryptic
907 1.1 jtc * library function manual page).
908 1.1 jtc * --Parameters--
909 1.1 jtc * name is the file name we are going to apply the regular expressions to
910 1.1 jtc * (and may be modified)
911 1.14 christos * namelen the size of the name buffer.
912 1.1 jtc * nlen is the length of this name (and is modified to hold the length of
913 1.1 jtc * the final string).
914 1.1 jtc * prnt is a flag that says whether to print the final result.
915 1.1 jtc * Return:
916 1.1 jtc * 0 if substitution was successful, 1 if we are to skip the file (the name
917 1.1 jtc * ended up empty)
918 1.1 jtc */
919 1.1 jtc
920 1.1 jtc static int
921 1.27 christos rep_name(char *name, size_t namelen, int *nlen, int flags)
922 1.1 jtc {
923 1.5 tls REPLACE *pt;
924 1.5 tls char *inpt;
925 1.5 tls char *outpt;
926 1.5 tls char *endpt;
927 1.5 tls char *rpt;
928 1.5 tls int found = 0;
929 1.5 tls int res;
930 1.12 lukem #ifndef NET2_REGEX
931 1.1 jtc regmatch_t pm[MAXSUBEXP];
932 1.12 lukem #endif
933 1.1 jtc char nname[PAXPATHLEN+1]; /* final result of all replacements */
934 1.1 jtc char buf1[PAXPATHLEN+1]; /* where we work on the name */
935 1.1 jtc
936 1.1 jtc /*
937 1.1 jtc * copy the name into buf1, where we will work on it. We need to keep
938 1.1 jtc * the orig string around so we can print out the result of the final
939 1.1 jtc * replacement. We build up the final result in nname. inpt points at
940 1.1 jtc * the string we apply the regular expression to. prnt is used to
941 1.1 jtc * suppress printing when we handle replacements on the link field
942 1.1 jtc * (the user already saw that substitution go by)
943 1.1 jtc */
944 1.1 jtc pt = rephead;
945 1.1 jtc (void)strcpy(buf1, name);
946 1.1 jtc inpt = buf1;
947 1.1 jtc outpt = nname;
948 1.1 jtc endpt = outpt + PAXPATHLEN;
949 1.1 jtc
950 1.1 jtc /*
951 1.1 jtc * try each replacement string in order
952 1.1 jtc */
953 1.1 jtc while (pt != NULL) {
954 1.1 jtc do {
955 1.27 christos if ((flags & SYML) && (pt->flgs & SYML))
956 1.27 christos continue;
957 1.1 jtc /*
958 1.1 jtc * check for a successful substitution, if not go to
959 1.1 jtc * the next pattern, or cleanup if we were global
960 1.1 jtc */
961 1.12 lukem #ifdef NET2_REGEX
962 1.1 jtc if (regexec(pt->rcmp, inpt) == 0)
963 1.12 lukem #else
964 1.1 jtc if (regexec(&(pt->rcmp), inpt, MAXSUBEXP, pm, 0) != 0)
965 1.12 lukem #endif
966 1.1 jtc break;
967 1.1 jtc
968 1.1 jtc /*
969 1.1 jtc * ok we found one. We have three parts, the prefix
970 1.1 jtc * which did not match, the section that did and the
971 1.1 jtc * tail (that also did not match). Copy the prefix to
972 1.1 jtc * the final output buffer (watching to make sure we
973 1.1 jtc * do not create a string too long).
974 1.1 jtc */
975 1.1 jtc found = 1;
976 1.12 lukem #ifdef NET2_REGEX
977 1.1 jtc rpt = pt->rcmp->startp[0];
978 1.12 lukem #else
979 1.1 jtc rpt = inpt + pm[0].rm_so;
980 1.12 lukem #endif
981 1.1 jtc
982 1.1 jtc while ((inpt < rpt) && (outpt < endpt))
983 1.1 jtc *outpt++ = *inpt++;
984 1.1 jtc if (outpt == endpt)
985 1.1 jtc break;
986 1.1 jtc
987 1.1 jtc /*
988 1.1 jtc * for the second part (which matched the regular
989 1.1 jtc * expression) apply the substitution using the
990 1.1 jtc * replacement string and place it the prefix in the
991 1.1 jtc * final output. If we have problems, skip it.
992 1.1 jtc */
993 1.12 lukem if ((res =
994 1.12 lukem #ifdef NET2_REGEX
995 1.12 lukem resub(pt->rcmp,pt->nstr,outpt,endpt)
996 1.12 lukem #else
997 1.12 lukem resub(&(pt->rcmp),pm,pt->nstr,inpt, outpt,endpt)
998 1.12 lukem #endif
999 1.12 lukem ) < 0) {
1000 1.27 christos if (flags & PRNT)
1001 1.7 christos tty_warn(1, "Replacement name error %s",
1002 1.1 jtc name);
1003 1.24 dsl return 1;
1004 1.1 jtc }
1005 1.1 jtc outpt += res;
1006 1.1 jtc
1007 1.1 jtc /*
1008 1.1 jtc * we set up to look again starting at the first
1009 1.1 jtc * character in the tail (of the input string right
1010 1.1 jtc * after the last character matched by the regular
1011 1.1 jtc * expression (inpt always points at the first char in
1012 1.1 jtc * the string to process). If we are not doing a global
1013 1.1 jtc * substitution, we will use inpt to copy the tail to
1014 1.1 jtc * the final result. Make sure we do not overrun the
1015 1.1 jtc * output buffer
1016 1.1 jtc */
1017 1.12 lukem #ifdef NET2_REGEX
1018 1.1 jtc inpt = pt->rcmp->endp[0];
1019 1.12 lukem #else
1020 1.6 mycroft inpt += pm[0].rm_eo - pm[0].rm_so;
1021 1.12 lukem #endif
1022 1.1 jtc
1023 1.1 jtc if ((outpt == endpt) || (*inpt == '\0'))
1024 1.1 jtc break;
1025 1.1 jtc
1026 1.1 jtc /*
1027 1.1 jtc * if the user wants global we keep trying to
1028 1.1 jtc * substitute until it fails, then we are done.
1029 1.1 jtc */
1030 1.1 jtc } while (pt->flgs & GLOB);
1031 1.1 jtc
1032 1.11 itohy if (found)
1033 1.1 jtc break;
1034 1.1 jtc
1035 1.1 jtc /*
1036 1.1 jtc * a successful substitution did NOT occur, try the next one
1037 1.1 jtc */
1038 1.1 jtc pt = pt->fow;
1039 1.1 jtc }
1040 1.1 jtc
1041 1.1 jtc if (found) {
1042 1.1 jtc /*
1043 1.1 jtc * we had a substitution, copy the last tail piece (if there is
1044 1.1 jtc * room) to the final result
1045 1.1 jtc */
1046 1.1 jtc while ((outpt < endpt) && (*inpt != '\0'))
1047 1.1 jtc *outpt++ = *inpt++;
1048 1.1 jtc
1049 1.1 jtc *outpt = '\0';
1050 1.1 jtc if ((outpt == endpt) && (*inpt != '\0')) {
1051 1.27 christos if (flags & PRNT)
1052 1.7 christos tty_warn(1,"Replacement name too long %s >> %s",
1053 1.1 jtc name, nname);
1054 1.24 dsl return 1;
1055 1.11 itohy }
1056 1.1 jtc
1057 1.1 jtc /*
1058 1.1 jtc * inform the user of the result if wanted
1059 1.1 jtc */
1060 1.27 christos if ((flags & PRNT) && (pt->flgs & PRNT)) {
1061 1.1 jtc if (*nname == '\0')
1062 1.1 jtc (void)fprintf(stderr,"%s >> <empty string>\n",
1063 1.1 jtc name);
1064 1.11 itohy else
1065 1.1 jtc (void)fprintf(stderr,"%s >> %s\n", name, nname);
1066 1.1 jtc }
1067 1.1 jtc
1068 1.1 jtc /*
1069 1.1 jtc * if empty inform the caller this file is to be skipped
1070 1.1 jtc * otherwise copy the new name over the orig name and return
1071 1.1 jtc */
1072 1.11 itohy if (*nname == '\0')
1073 1.24 dsl return 1;
1074 1.27 christos if (flags & RENM)
1075 1.27 christos *nlen = strlcpy(name, nname, namelen);
1076 1.1 jtc }
1077 1.24 dsl return 0;
1078 1.15 christos }
1079 1.15 christos
1080 1.15 christos
/*
 * checkdotdot()
 *	Report whether any path component of name is exactly "..".
 * Return:
 *	1 if name is "..", starts with "../", contains "/../" or ends in
 *	"/..", otherwise 0
 */
static int
checkdotdot(const char *name)
{
	size_t nlen = strlen(name);

	/* leading component: ".." on its own or followed by a slash */
	if (strncmp(name, "..", 2) == 0 &&
	    (name[2] == '\0' || name[2] == '/'))
		return 1;

	/* interior component */
	if (strstr(name, "/../") != NULL)
		return 1;

	/* trailing component: the name ends in "/.." */
	if (nlen >= 3 && strcmp(name + nlen - 3, "/..") == 0)
		return 1;

	return 0;
}
1108 1.1 jtc
1109 1.1 jtc #ifdef NET2_REGEX
1110 1.1 jtc /*
1111 1.1 jtc * resub()
1112 1.1 jtc * apply the replacement to the matched expression. expand out the old
1113 1.11 itohy * style ed(1) subexpression expansion.
1114 1.1 jtc * Return:
1115 1.1 jtc * -1 if error, or the number of characters added to the destination.
1116 1.1 jtc */
1117 1.1 jtc
1118 1.1 jtc static int
1119 1.5 tls resub(regexp *prog, char *src, char *dest, char *destend)
1120 1.1 jtc {
1121 1.5 tls char *spt;
1122 1.5 tls char *dpt;
1123 1.5 tls char c;
1124 1.5 tls int no;
1125 1.5 tls int len;
1126 1.1 jtc
1127 1.1 jtc spt = src;
1128 1.1 jtc dpt = dest;
1129 1.1 jtc while ((dpt < destend) && ((c = *spt++) != '\0')) {
1130 1.1 jtc if (c == '&')
1131 1.1 jtc no = 0;
1132 1.1 jtc else if ((c == '\\') && (*spt >= '0') && (*spt <= '9'))
1133 1.1 jtc no = *spt++ - '0';
1134 1.1 jtc else {
1135 1.11 itohy if ((c == '\\') && ((*spt == '\\') || (*spt == '&')))
1136 1.11 itohy c = *spt++;
1137 1.11 itohy *dpt++ = c;
1138 1.1 jtc continue;
1139 1.1 jtc }
1140 1.11 itohy if ((prog->startp[no] == NULL) || (prog->endp[no] == NULL) ||
1141 1.1 jtc ((len = prog->endp[no] - prog->startp[no]) <= 0))
1142 1.1 jtc continue;
1143 1.1 jtc
1144 1.1 jtc /*
1145 1.1 jtc * copy the subexpression to the destination.
1146 1.1 jtc * fail if we run out of space or the match string is damaged
1147 1.1 jtc */
1148 1.1 jtc if (len > (destend - dpt))
1149 1.14 christos return (-1);
1150 1.14 christos strncpy(dpt, prog->startp[no], len);
1151 1.1 jtc dpt += len;
1152 1.1 jtc }
1153 1.24 dsl return dpt - dest;
1154 1.1 jtc }
1155 1.1 jtc
1156 1.1 jtc #else
1157 1.1 jtc
/*
 * resub()
 *	expand the replacement string src into dest, using the match recorded
 *	in pm. '&' stands for the whole match and "\1" .. "\9" for the
 *	corresponding subexpression (old style ed(1) expansion); "\\" and
 *	"\&" give a literal backslash and ampersand. Output stops once dest
 *	reaches destend. No terminating NUL is written.
 * --Parameters--
 *	rp is the compiled expression (only its subexpression count is used)
 *	pm holds the match offsets
 *	src is the replacement string
 *	txt is the string the offsets in pm are applied to
 *	dest, destend delimit the output space
 * Return:
 *	-1 if src names a subexpression the pattern does not have or a
 *	subexpression does not fit in the space left, otherwise the number of
 *	characters added to the destination.
 */

static int
resub(regex_t *rp, regmatch_t *pm, char *src, char *txt, char *dest,
	char *destend)
{
	char *rd = src;		/* next replacement character to read */
	char *wr = dest;	/* next output position */
	char ch;
	regmatch_t *mp;
	int idx;
	int sublen;
	int nsub;

	nsub = rp->re_nsub;
	for (;;) {
		if (wr >= destend)
			break;
		if ((ch = *rd++) == '\0')
			break;

		/*
		 * decide whether this is a reference to (part of) the match
		 * or an ordinary replacement character
		 */
		if (ch == '&') {
			mp = pm;
		} else if ((ch == '\\') && (*rd >= '1') && (*rd <= '9')) {
			/*
			 * make sure there is a subexpression as specified
			 */
			idx = *rd++ - '0';
			if (idx > nsub)
				return -1;
			mp = pm + idx;
		} else {
			/*
			 * ordinary character; an escaped backslash or
			 * ampersand loses its escape
			 */
			if ((ch == '\\') && ((*rd == '\\') || (*rd == '&')))
				ch = *rd++;
			*wr++ = ch;
			continue;
		}

		/*
		 * a subexpression that did not take part in the match, or
		 * that matched nothing, adds nothing
		 */
		if ((mp->rm_so < 0) || (mp->rm_eo < 0))
			continue;
		sublen = mp->rm_eo - mp->rm_so;
		if (sublen <= 0)
			continue;

		/*
		 * copy the subexpression to the destination.
		 * fail if we run out of space
		 */
		if (sublen > (destend - wr))
			return -1;
		strncpy(wr, txt + mp->rm_so, sublen);
		wr += sublen;
	}
	return wr - dest;
}
1222 1.1 jtc #endif
1223