glob.c revision 1.18.2.1 1 1.18.2.1 riz /* $NetBSD: glob.c,v 1.18.2.1 2010/08/05 01:43:20 riz Exp $ */
2 1.5 cgd
3 1.1 cgd /*
4 1.12 christos * Copyright (c) 1989, 1993
5 1.12 christos * The Regents of the University of California. All rights reserved.
6 1.12 christos *
7 1.12 christos * This code is derived from software contributed to Berkeley by
8 1.12 christos * Guido van Rossum.
9 1.12 christos *
10 1.12 christos * Redistribution and use in source and binary forms, with or without
11 1.12 christos * modification, are permitted provided that the following conditions
12 1.12 christos * are met:
13 1.12 christos * 1. Redistributions of source code must retain the above copyright
14 1.12 christos * notice, this list of conditions and the following disclaimer.
15 1.12 christos * 2. Redistributions in binary form must reproduce the above copyright
16 1.12 christos * notice, this list of conditions and the following disclaimer in the
17 1.12 christos * documentation and/or other materials provided with the distribution.
18 1.12 christos * 3. Neither the name of the University nor the names of its contributors
19 1.12 christos * may be used to endorse or promote products derived from this software
20 1.12 christos * without specific prior written permission.
21 1.12 christos *
22 1.12 christos * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23 1.12 christos * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24 1.12 christos * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25 1.12 christos * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26 1.12 christos * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27 1.12 christos * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28 1.12 christos * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29 1.12 christos * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30 1.12 christos * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31 1.12 christos * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32 1.12 christos * SUCH DAMAGE.
33 1.1 cgd */
34 1.1 cgd
35 1.12 christos #include <sys/cdefs.h>
36 1.12 christos #if defined(LIBC_SCCS) && !defined(lint)
37 1.12 christos #if 0
38 1.12 christos static char sccsid[] = "@(#)glob.c 8.3 (Berkeley) 10/13/93";
39 1.12 christos #else
40 1.18.2.1 riz __RCSID("$NetBSD: glob.c,v 1.18.2.1 2010/08/05 01:43:20 riz Exp $");
41 1.12 christos #endif
42 1.12 christos #endif /* LIBC_SCCS and not lint */
43 1.1 cgd
44 1.12 christos /*
45 1.12 christos * glob(3) -- a superset of the one defined in POSIX 1003.2.
46 1.12 christos *
47 1.12 christos * The [!...] convention to negate a range is supported (SysV, Posix, ksh).
48 1.12 christos *
49 1.12 christos * Optional extra services, controlled by flags not defined by POSIX:
50 1.12 christos *
51 1.12 christos * GLOB_MAGCHAR:
52 1.12 christos * Set in gl_flags if pattern contained a globbing character.
53 1.12 christos * GLOB_NOMAGIC:
54 1.12 christos * Same as GLOB_NOCHECK, but it will only append pattern if it did
55 1.12 christos * not contain any magic characters. [Used in csh style globbing]
56 1.12 christos * GLOB_ALTDIRFUNC:
57 1.12 christos * Use alternately specified directory access functions.
58 1.12 christos * GLOB_TILDE:
59 1.12 christos * expand ~user/foo to the /home/dir/of/user/foo
60 1.12 christos * GLOB_BRACE:
61 1.12 christos * expand {1,2}{a,b} to 1a 1b 2a 2b
62 1.12 christos * gl_matchc:
63 1.12 christos * Number of matches in the current invocation of glob.
64 1.12 christos */
65 1.12 christos
66 1.12 christos #include "namespace.h"
67 1.12 christos #include <sys/param.h>
68 1.12 christos #include <sys/stat.h>
69 1.12 christos
70 1.12 christos #include <assert.h>
71 1.12 christos #include <ctype.h>
72 1.12 christos #include <dirent.h>
73 1.12 christos #include <errno.h>
74 1.12 christos #include <glob.h>
75 1.12 christos #include <pwd.h>
76 1.12 christos #include <stdio.h>
77 1.12 christos #include <stdlib.h>
78 1.12 christos #include <string.h>
79 1.12 christos #include <unistd.h>
80 1.12 christos
81 1.12 christos #ifdef HAVE_NBTOOL_CONFIG_H
82 1.12 christos #define NO_GETPW_R
83 1.12 christos #endif
84 1.12 christos
/*
 * Resource caps enforced only when the caller sets GLOB_LIMIT:
 *   GLOB_LIMIT_MALLOC   compared in globextend() against the size of the
 *                       path vector plus the accumulated path lengths
 *   GLOB_LIMIT_STAT     compared in glob2() against the count of paths
 *                       for which g_lstat() succeeded
 *   GLOB_LIMIT_READDIR  compared in glob3() against the count of directory
 *                       entries examined
 */
85 1.18.2.1 riz #define GLOB_LIMIT_MALLOC 65536
86 1.18.2.1 riz #define GLOB_LIMIT_STAT 128
87 1.18.2.1 riz #define GLOB_LIMIT_READDIR 16384
88 1.18.2.1 riz
/* Slots of the size_t limit[] counter array that glob() passes down. */
89 1.18.2.1 riz #define GLOB_INDEX_MALLOC 0
90 1.18.2.1 riz #define GLOB_INDEX_STAT 1
91 1.18.2.1 riz #define GLOB_INDEX_READDIR 2
92 1.18.2.1 riz
93 1.12 christos /*
94 1.12 christos * XXX: For NetBSD 1.4.x compatibility. (kill me l8r)
95 1.12 christos */
96 1.12 christos #ifndef _DIAGASSERT
97 1.12 christos #define _DIAGASSERT(a)
98 1.12 christos #endif
99 1.12 christos
100 1.12 christos #define DOLLAR '$'
101 1.12 christos #define DOT '.'
102 1.12 christos #define EOS '\0'
103 1.12 christos #define LBRACKET '['
104 1.12 christos #define NOT '!'
105 1.12 christos #define QUESTION '?'
106 1.12 christos #define QUOTE '\\'
107 1.12 christos #define RANGE '-'
108 1.12 christos #define RBRACKET ']'
109 1.12 christos #define SEP '/'
110 1.12 christos #define STAR '*'
111 1.12 christos #define TILDE '~'
112 1.12 christos #define UNDERSCORE '_'
113 1.12 christos #define LBRACE '{'
114 1.12 christos #define RBRACE '}'
115 1.12 christos #define SLASH '/'
116 1.12 christos #define COMMA ','
117 1.12 christos
/*
 * Internal pattern representation.  Patterns are held as arrays of Char;
 * flag bits are OR-ed onto a character:
 *   M_QUOTE    set by META() and tested by ismeta(): the element is a
 *              compiled meta character (M_ALL, M_ONE, M_SET, ...)
 *   M_PROTECT  set by glob() on a character that followed a backslash
 *   M_ASCII    mask applied by CHAR() to obtain the plain character
 */
118 1.15 christos #ifndef USE_8BIT_CHARS
119 1.12 christos
/* Default: 16-bit Char, flag bits live above the low byte. */
120 1.12 christos #define M_QUOTE 0x8000
121 1.12 christos #define M_PROTECT 0x4000
122 1.12 christos #define M_MASK 0xffff
123 1.12 christos #define M_ASCII 0x00ff
124 1.12 christos
125 1.12 christos typedef u_short Char;
126 1.12 christos
127 1.12 christos #else
128 1.12 christos
/* USE_8BIT_CHARS: Char is a plain char and the flags take its top two bits. */
129 1.15 christos #define M_QUOTE (Char)0x80
130 1.15 christos #define M_PROTECT (Char)0x40
131 1.15 christos #define M_MASK (Char)0xff
132 1.15 christos #define M_ASCII (Char)0x7f
133 1.12 christos
134 1.12 christos typedef char Char;
135 1.12 christos
136 1.12 christos #endif
137 1.12 christos
138 1.12 christos
/* CHAR() strips everything outside M_ASCII; META() tags a character as meta. */
139 1.12 christos #define CHAR(c) ((Char)((c)&M_ASCII))
140 1.12 christos #define META(c) ((Char)((c)|M_QUOTE))
/* Compiled forms of '*', ']', '!', '?', '-' and '[' as emitted by glob0(). */
141 1.12 christos #define M_ALL META('*')
142 1.12 christos #define M_END META(']')
143 1.12 christos #define M_NOT META('!')
144 1.12 christos #define M_ONE META('?')
145 1.12 christos #define M_RNG META('-')
146 1.12 christos #define M_SET META('[')
/* Non-zero when the M_QUOTE bit is set on c. */
147 1.12 christos #define ismeta(c) (((c)&M_QUOTE) != 0)
148 1.12 christos
149 1.12 christos
150 1.18 christos static int compare(const void *, const void *);
151 1.18 christos static int g_Ctoc(const Char *, char *, size_t);
152 1.18 christos static int g_lstat(Char *, __gl_stat_t *, glob_t *);
153 1.18 christos static DIR *g_opendir(Char *, glob_t *);
154 1.18 christos static Char *g_strchr(const Char *, int);
155 1.18 christos static int g_stat(Char *, __gl_stat_t *, glob_t *);
156 1.18.2.1 riz static int glob0(const Char *, glob_t *, size_t *);
157 1.18 christos static int glob1(Char *, glob_t *, size_t *);
158 1.18 christos static int glob2(Char *, Char *, Char *, Char *, glob_t *,
159 1.18 christos size_t *);
160 1.18 christos static int glob3(Char *, Char *, Char *, Char *, Char *, glob_t *,
161 1.18 christos size_t *);
162 1.18 christos static int globextend(const Char *, glob_t *, size_t *);
163 1.18 christos static const Char *globtilde(const Char *, Char *, size_t, glob_t *);
164 1.18.2.1 riz static int globexp1(const Char *, glob_t *, size_t *);
165 1.18.2.1 riz static int globexp2(const Char *, const Char *, glob_t *, int *,
166 1.18.2.1 riz size_t *);
167 1.18 christos static int match(Char *, Char *, Char *);
168 1.12 christos #ifdef DEBUG
169 1.18 christos static void qprintf(const char *, Char *);
170 1.12 christos #endif
171 1.12 christos
172 1.12 christos int
173 1.18 christos glob(const char *pattern, int flags, int (*errfunc)(const char *, int),
174 1.18 christos glob_t *pglob)
175 1.12 christos {
176 1.12 christos const u_char *patnext;
177 1.12 christos int c;
178 1.12 christos Char *bufnext, *bufend, patbuf[MAXPATHLEN+1];
179 1.18.2.1 riz /* 0 = malloc(), 1 = stat(), 2 = readdir() */
180 1.18.2.1 riz size_t limit[] = { 0, 0, 0 };
181 1.12 christos
182 1.12 christos _DIAGASSERT(pattern != NULL);
183 1.12 christos
184 1.12 christos patnext = (const u_char *) pattern;
185 1.12 christos if (!(flags & GLOB_APPEND)) {
186 1.12 christos pglob->gl_pathc = 0;
187 1.12 christos pglob->gl_pathv = NULL;
188 1.12 christos if (!(flags & GLOB_DOOFFS))
189 1.12 christos pglob->gl_offs = 0;
190 1.12 christos }
191 1.12 christos pglob->gl_flags = flags & ~GLOB_MAGCHAR;
192 1.12 christos pglob->gl_errfunc = errfunc;
193 1.12 christos pglob->gl_matchc = 0;
194 1.12 christos
195 1.12 christos bufnext = patbuf;
196 1.12 christos bufend = bufnext + MAXPATHLEN;
197 1.12 christos if (flags & GLOB_NOESCAPE) {
198 1.12 christos while (bufnext < bufend && (c = *patnext++) != EOS)
199 1.12 christos *bufnext++ = c;
200 1.12 christos } else {
201 1.12 christos /* Protect the quoted characters. */
202 1.12 christos while (bufnext < bufend && (c = *patnext++) != EOS)
203 1.12 christos if (c == QUOTE) {
204 1.12 christos if ((c = *patnext++) == EOS) {
205 1.12 christos c = QUOTE;
206 1.12 christos --patnext;
207 1.12 christos }
208 1.12 christos *bufnext++ = c | M_PROTECT;
209 1.12 christos }
210 1.12 christos else
211 1.12 christos *bufnext++ = c;
212 1.12 christos }
213 1.12 christos *bufnext = EOS;
214 1.12 christos
215 1.12 christos if (flags & GLOB_BRACE)
216 1.18.2.1 riz return globexp1(patbuf, pglob, limit);
217 1.12 christos else
218 1.18.2.1 riz return glob0(patbuf, pglob, limit);
219 1.12 christos }
220 1.12 christos
221 1.12 christos /*
222 1.12 christos * Expand recursively a glob {} pattern. When there is no more expansion
223 1.12 christos * invoke the standard globbing routine to glob the rest of the magic
224 1.12 christos * characters
225 1.12 christos */
226 1.12 christos static int
227 1.18.2.1 riz globexp1(const Char *pattern, glob_t *pglob, size_t *limit)
228 1.12 christos {
229 1.12 christos const Char* ptr = pattern;
230 1.12 christos int rv;
231 1.12 christos
232 1.12 christos _DIAGASSERT(pattern != NULL);
233 1.12 christos _DIAGASSERT(pglob != NULL);
234 1.12 christos
235 1.12 christos /* Protect a single {}, for find(1), like csh */
236 1.12 christos if (pattern[0] == LBRACE && pattern[1] == RBRACE && pattern[2] == EOS)
237 1.18.2.1 riz return glob0(pattern, pglob, limit);
238 1.12 christos
239 1.12 christos while ((ptr = (const Char *) g_strchr(ptr, LBRACE)) != NULL)
240 1.18.2.1 riz if (!globexp2(ptr, pattern, pglob, &rv, limit))
241 1.12 christos return rv;
242 1.12 christos
243 1.18.2.1 riz return glob0(pattern, pglob, limit);
244 1.12 christos }
245 1.12 christos
246 1.12 christos
247 1.12 christos /*
248 1.12 christos * Recursive brace globbing helper. Tries to expand a single brace.
249 1.12 christos * If it succeeds then it invokes globexp1 with the new pattern.
250 1.12 christos * If it fails then it tries to glob the rest of the pattern and returns.
251 1.12 christos */
252 1.12 christos static int
253 1.18.2.1 riz globexp2(const Char *ptr, const Char *pattern, glob_t *pglob, int *rv,
254 1.18.2.1 riz size_t *limit)
255 1.12 christos {
256 1.12 christos int i;
257 1.12 christos Char *lm, *ls;
258 1.12 christos const Char *pe, *pm, *pl;
259 1.12 christos Char patbuf[MAXPATHLEN + 1];
260 1.12 christos
261 1.12 christos _DIAGASSERT(ptr != NULL);
262 1.12 christos _DIAGASSERT(pattern != NULL);
263 1.12 christos _DIAGASSERT(pglob != NULL);
264 1.12 christos _DIAGASSERT(rv != NULL);
265 1.12 christos
266 1.12 christos /* copy part up to the brace */
267 1.12 christos for (lm = patbuf, pm = pattern; pm != ptr; *lm++ = *pm++)
268 1.12 christos continue;
269 1.12 christos ls = lm;
270 1.12 christos
271 1.12 christos /* Find the balanced brace */
272 1.12 christos for (i = 0, pe = ++ptr; *pe; pe++)
273 1.12 christos if (*pe == LBRACKET) {
274 1.12 christos /* Ignore everything between [] */
275 1.12 christos for (pm = pe++; *pe != RBRACKET && *pe != EOS; pe++)
276 1.12 christos continue;
277 1.12 christos if (*pe == EOS) {
278 1.12 christos /*
279 1.12 christos * We could not find a matching RBRACKET.
280 1.12 christos * Ignore and just look for RBRACE
281 1.12 christos */
282 1.12 christos pe = pm;
283 1.12 christos }
284 1.12 christos }
285 1.12 christos else if (*pe == LBRACE)
286 1.12 christos i++;
287 1.12 christos else if (*pe == RBRACE) {
288 1.12 christos if (i == 0)
289 1.12 christos break;
290 1.12 christos i--;
291 1.12 christos }
292 1.12 christos
293 1.12 christos /* Non matching braces; just glob the pattern */
294 1.12 christos if (i != 0 || *pe == EOS) {
295 1.12 christos /*
296 1.12 christos * we use `pattern', not `patbuf' here so that that
297 1.12 christos * unbalanced braces are passed to the match
298 1.12 christos */
299 1.18.2.1 riz *rv = glob0(pattern, pglob, limit);
300 1.12 christos return 0;
301 1.12 christos }
302 1.12 christos
303 1.12 christos for (i = 0, pl = pm = ptr; pm <= pe; pm++) {
304 1.12 christos switch (*pm) {
305 1.12 christos case LBRACKET:
306 1.12 christos /* Ignore everything between [] */
307 1.12 christos for (pl = pm++; *pm != RBRACKET && *pm != EOS; pm++)
308 1.12 christos continue;
309 1.12 christos if (*pm == EOS) {
310 1.12 christos /*
311 1.12 christos * We could not find a matching RBRACKET.
312 1.12 christos * Ignore and just look for RBRACE
313 1.12 christos */
314 1.12 christos pm = pl;
315 1.12 christos }
316 1.12 christos break;
317 1.12 christos
318 1.12 christos case LBRACE:
319 1.12 christos i++;
320 1.12 christos break;
321 1.12 christos
322 1.12 christos case RBRACE:
323 1.12 christos if (i) {
324 1.12 christos i--;
325 1.12 christos break;
326 1.12 christos }
327 1.12 christos /* FALLTHROUGH */
328 1.12 christos case COMMA:
329 1.12 christos if (i && *pm == COMMA)
330 1.12 christos break;
331 1.12 christos else {
332 1.12 christos /* Append the current string */
333 1.12 christos for (lm = ls; (pl < pm); *lm++ = *pl++)
334 1.12 christos continue;
335 1.12 christos /*
336 1.12 christos * Append the rest of the pattern after the
337 1.12 christos * closing brace
338 1.12 christos */
339 1.12 christos for (pl = pe + 1; (*lm++ = *pl++) != EOS;)
340 1.12 christos continue;
341 1.12 christos
342 1.12 christos /* Expand the current pattern */
343 1.12 christos #ifdef DEBUG
344 1.12 christos qprintf("globexp2:", patbuf);
345 1.12 christos #endif
346 1.18.2.1 riz *rv = globexp1(patbuf, pglob, limit);
347 1.12 christos
348 1.12 christos /* move after the comma, to the next string */
349 1.12 christos pl = pm + 1;
350 1.12 christos }
351 1.12 christos break;
352 1.12 christos
353 1.12 christos default:
354 1.12 christos break;
355 1.12 christos }
356 1.12 christos }
357 1.12 christos *rv = 0;
358 1.12 christos return 0;
359 1.12 christos }
360 1.12 christos
361 1.12 christos
362 1.12 christos
363 1.12 christos /*
364 1.12 christos * expand tilde from the passwd file.
365 1.12 christos */
366 1.12 christos static const Char *
367 1.18 christos globtilde(const Char *pattern, Char *patbuf, size_t patsize, glob_t *pglob)
368 1.12 christos {
369 1.12 christos struct passwd *pwd;
370 1.12 christos const char *h;
371 1.12 christos const Char *p;
372 1.12 christos Char *b;
373 1.12 christos char *d;
374 1.12 christos Char *pend = &patbuf[patsize / sizeof(Char)];
375 1.12 christos #ifndef NO_GETPW_R
376 1.12 christos struct passwd pwres;
377 1.12 christos char pwbuf[1024];
378 1.12 christos #endif
379 1.12 christos
380 1.12 christos pend--;
381 1.12 christos
382 1.12 christos _DIAGASSERT(pattern != NULL);
383 1.12 christos _DIAGASSERT(patbuf != NULL);
384 1.12 christos _DIAGASSERT(pglob != NULL);
385 1.12 christos
386 1.12 christos if (*pattern != TILDE || !(pglob->gl_flags & GLOB_TILDE))
387 1.12 christos return pattern;
388 1.12 christos
389 1.12 christos /* Copy up to the end of the string or / */
390 1.12 christos for (p = pattern + 1, d = (char *)(void *)patbuf;
391 1.12 christos d < (char *)(void *)pend && *p && *p != SLASH;
392 1.12 christos *d++ = *p++)
393 1.12 christos continue;
394 1.12 christos
395 1.12 christos if (d == (char *)(void *)pend)
396 1.12 christos return NULL;
397 1.12 christos
398 1.12 christos *d = EOS;
399 1.12 christos d = (char *)(void *)patbuf;
400 1.12 christos
401 1.12 christos if (*d == EOS) {
402 1.12 christos /*
403 1.12 christos * handle a plain ~ or ~/ by expanding $HOME
404 1.12 christos * first and then trying the password file
405 1.12 christos */
406 1.12 christos if ((h = getenv("HOME")) == NULL) {
407 1.12 christos #ifdef NO_GETPW_R
408 1.12 christos if ((pwd = getpwuid(getuid())) == NULL)
409 1.12 christos #else
410 1.12 christos if (getpwuid_r(getuid(), &pwres, pwbuf, sizeof(pwbuf),
411 1.12 christos &pwd) != 0 || pwd == NULL)
412 1.12 christos #endif
413 1.12 christos return pattern;
414 1.12 christos else
415 1.12 christos h = pwd->pw_dir;
416 1.12 christos }
417 1.12 christos }
418 1.12 christos else {
419 1.12 christos /*
420 1.12 christos * Expand a ~user
421 1.12 christos */
422 1.12 christos #ifdef NO_GETPW_R
423 1.12 christos if ((pwd = getpwnam(d)) == NULL)
424 1.12 christos #else
425 1.12 christos if (getpwnam_r(d, &pwres, pwbuf, sizeof(pwbuf), &pwd) != 0 ||
426 1.12 christos pwd == NULL)
427 1.12 christos #endif
428 1.12 christos return pattern;
429 1.12 christos else
430 1.12 christos h = pwd->pw_dir;
431 1.12 christos }
432 1.12 christos
433 1.12 christos /* Copy the home directory */
434 1.12 christos for (b = patbuf; b < pend && *h; *b++ = *h++)
435 1.12 christos continue;
436 1.12 christos
437 1.12 christos if (b == pend)
438 1.12 christos return NULL;
439 1.12 christos
440 1.12 christos /* Append the rest of the pattern */
441 1.12 christos while (b < pend && (*b++ = *p++) != EOS)
442 1.12 christos continue;
443 1.12 christos
444 1.12 christos if (b == pend)
445 1.12 christos return NULL;
446 1.12 christos
447 1.12 christos return patbuf;
448 1.12 christos }
449 1.12 christos
450 1.12 christos
451 1.12 christos /*
452 1.12 christos * The main glob() routine: compiles the pattern (optionally processing
453 1.12 christos * quotes), calls glob1() to do the real pattern matching, and finally
454 1.12 christos * sorts the list (unless unsorted operation is requested). Returns 0
455 1.12 christos * if things went well, nonzero if errors occurred. It is not an error
456 1.12 christos * to find no matches.
457 1.12 christos */
458 1.12 christos static int
459 1.18.2.1 riz glob0(const Char *pattern, glob_t *pglob, size_t *limit)
460 1.12 christos {
461 1.12 christos const Char *qpatnext;
462 1.16 christos int c, error;
463 1.16 christos __gl_size_t oldpathc;
464 1.12 christos Char *bufnext, patbuf[MAXPATHLEN+1];
465 1.12 christos
466 1.12 christos _DIAGASSERT(pattern != NULL);
467 1.12 christos _DIAGASSERT(pglob != NULL);
468 1.12 christos
469 1.12 christos if ((qpatnext = globtilde(pattern, patbuf, sizeof(patbuf),
470 1.12 christos pglob)) == NULL)
471 1.12 christos return GLOB_ABEND;
472 1.12 christos oldpathc = pglob->gl_pathc;
473 1.12 christos bufnext = patbuf;
474 1.12 christos
475 1.12 christos /* We don't need to check for buffer overflow any more. */
476 1.12 christos while ((c = *qpatnext++) != EOS) {
477 1.12 christos switch (c) {
478 1.12 christos case LBRACKET:
479 1.12 christos c = *qpatnext;
480 1.12 christos if (c == NOT)
481 1.12 christos ++qpatnext;
482 1.12 christos if (*qpatnext == EOS ||
483 1.12 christos g_strchr(qpatnext+1, RBRACKET) == NULL) {
484 1.12 christos *bufnext++ = LBRACKET;
485 1.12 christos if (c == NOT)
486 1.12 christos --qpatnext;
487 1.12 christos break;
488 1.12 christos }
489 1.12 christos *bufnext++ = M_SET;
490 1.12 christos if (c == NOT)
491 1.12 christos *bufnext++ = M_NOT;
492 1.12 christos c = *qpatnext++;
493 1.12 christos do {
494 1.12 christos *bufnext++ = CHAR(c);
495 1.12 christos if (*qpatnext == RANGE &&
496 1.12 christos (c = qpatnext[1]) != RBRACKET) {
497 1.12 christos *bufnext++ = M_RNG;
498 1.12 christos *bufnext++ = CHAR(c);
499 1.12 christos qpatnext += 2;
500 1.12 christos }
501 1.12 christos } while ((c = *qpatnext++) != RBRACKET);
502 1.12 christos pglob->gl_flags |= GLOB_MAGCHAR;
503 1.12 christos *bufnext++ = M_END;
504 1.12 christos break;
505 1.12 christos case QUESTION:
506 1.12 christos pglob->gl_flags |= GLOB_MAGCHAR;
507 1.12 christos *bufnext++ = M_ONE;
508 1.12 christos break;
509 1.12 christos case STAR:
510 1.12 christos pglob->gl_flags |= GLOB_MAGCHAR;
511 1.12 christos /* collapse adjacent stars to one,
512 1.12 christos * to avoid exponential behavior
513 1.12 christos */
514 1.12 christos if (bufnext == patbuf || bufnext[-1] != M_ALL)
515 1.12 christos *bufnext++ = M_ALL;
516 1.12 christos break;
517 1.12 christos default:
518 1.12 christos *bufnext++ = CHAR(c);
519 1.12 christos break;
520 1.12 christos }
521 1.12 christos }
522 1.12 christos *bufnext = EOS;
523 1.12 christos #ifdef DEBUG
524 1.12 christos qprintf("glob0:", patbuf);
525 1.12 christos #endif
526 1.12 christos
527 1.18.2.1 riz if ((error = glob1(patbuf, pglob, limit)) != 0)
528 1.18 christos return error;
529 1.12 christos
530 1.12 christos if (pglob->gl_pathc == oldpathc) {
531 1.12 christos /*
532 1.12 christos * If there was no match we are going to append the pattern
533 1.12 christos * if GLOB_NOCHECK was specified or if GLOB_NOMAGIC was
534 1.12 christos * specified and the pattern did not contain any magic
535 1.12 christos * characters GLOB_NOMAGIC is there just for compatibility
536 1.12 christos * with csh.
537 1.12 christos */
538 1.12 christos if ((pglob->gl_flags & GLOB_NOCHECK) ||
539 1.12 christos ((pglob->gl_flags & (GLOB_NOMAGIC|GLOB_MAGCHAR))
540 1.12 christos == GLOB_NOMAGIC)) {
541 1.18.2.1 riz return globextend(pattern, pglob, limit);
542 1.12 christos } else {
543 1.18 christos return GLOB_NOMATCH;
544 1.12 christos }
545 1.12 christos } else if (!(pglob->gl_flags & GLOB_NOSORT)) {
546 1.12 christos qsort(pglob->gl_pathv + pglob->gl_offs + oldpathc,
547 1.12 christos (size_t)pglob->gl_pathc - oldpathc, sizeof(char *),
548 1.12 christos compare);
549 1.12 christos }
550 1.12 christos
551 1.18 christos return 0;
552 1.12 christos }
553 1.12 christos
/*
 * qsort() callback used by glob0(): both arguments point at elements of
 * the path vector (i.e. at `char *' values) and the strings they refer to
 * are ordered with strcoll().
 */
static int
compare(const void *p, const void *q)
{
	const char * const *lhs = p;
	const char * const *rhs = q;

	_DIAGASSERT(p != NULL);
	_DIAGASSERT(q != NULL);

	return strcoll(*lhs, *rhs);
}
563 1.12 christos
564 1.12 christos static int
565 1.18 christos glob1(Char *pattern, glob_t *pglob, size_t *limit)
566 1.12 christos {
567 1.12 christos Char pathbuf[MAXPATHLEN+1];
568 1.12 christos
569 1.12 christos _DIAGASSERT(pattern != NULL);
570 1.12 christos _DIAGASSERT(pglob != NULL);
571 1.12 christos
572 1.12 christos /* A null pathname is invalid -- POSIX 1003.1 sect. 2.4. */
573 1.12 christos if (*pattern == EOS)
574 1.18 christos return 0;
575 1.12 christos /*
576 1.12 christos * we save one character so that we can use ptr >= limit,
577 1.12 christos * in the general case when we are appending non nul chars only.
578 1.12 christos */
579 1.18 christos return glob2(pathbuf, pathbuf,
580 1.18 christos pathbuf + (sizeof(pathbuf) / sizeof(*pathbuf)) - 1, pattern,
581 1.18 christos pglob, limit);
582 1.12 christos }
583 1.12 christos
584 1.12 christos /*
585 1.12 christos * The functions glob2 and glob3 are mutually recursive; there is one level
586 1.12 christos * of recursion for each segment in the pattern that contains one or more
587 1.12 christos * meta characters.
588 1.12 christos */
589 1.12 christos static int
590 1.18 christos glob2(Char *pathbuf, Char *pathend, Char *pathlim, Char *pattern, glob_t *pglob,
591 1.18 christos size_t *limit)
592 1.12 christos {
593 1.12 christos __gl_stat_t sb;
594 1.12 christos Char *p, *q;
595 1.12 christos int anymeta;
596 1.12 christos
597 1.12 christos _DIAGASSERT(pathbuf != NULL);
598 1.12 christos _DIAGASSERT(pathend != NULL);
599 1.12 christos _DIAGASSERT(pattern != NULL);
600 1.12 christos _DIAGASSERT(pglob != NULL);
601 1.12 christos
602 1.12 christos /*
603 1.12 christos * Loop over pattern segments until end of pattern or until
604 1.12 christos * segment with meta character found.
605 1.12 christos */
606 1.12 christos for (anymeta = 0;;) {
607 1.12 christos if (*pattern == EOS) { /* End of pattern? */
608 1.12 christos *pathend = EOS;
609 1.12 christos if (g_lstat(pathbuf, &sb, pglob))
610 1.18 christos return 0;
611 1.12 christos
612 1.18.2.1 riz if ((pglob->gl_flags & GLOB_LIMIT) &&
613 1.18.2.1 riz limit[GLOB_INDEX_STAT]++ >= GLOB_LIMIT_STAT) {
614 1.18.2.1 riz errno = 0;
615 1.18.2.1 riz *pathend++ = SEP;
616 1.18.2.1 riz *pathend = EOS;
617 1.18.2.1 riz return GLOB_NOSPACE;
618 1.18.2.1 riz }
619 1.12 christos if (((pglob->gl_flags & GLOB_MARK) &&
620 1.12 christos pathend[-1] != SEP) && (S_ISDIR(sb.st_mode) ||
621 1.12 christos (S_ISLNK(sb.st_mode) &&
622 1.12 christos (g_stat(pathbuf, &sb, pglob) == 0) &&
623 1.12 christos S_ISDIR(sb.st_mode)))) {
624 1.12 christos if (pathend >= pathlim)
625 1.18 christos return GLOB_ABORTED;
626 1.12 christos *pathend++ = SEP;
627 1.12 christos *pathend = EOS;
628 1.12 christos }
629 1.12 christos ++pglob->gl_matchc;
630 1.18 christos return globextend(pathbuf, pglob, limit);
631 1.12 christos }
632 1.12 christos
633 1.12 christos /* Find end of next segment, copy tentatively to pathend. */
634 1.12 christos q = pathend;
635 1.12 christos p = pattern;
636 1.12 christos while (*p != EOS && *p != SEP) {
637 1.12 christos if (ismeta(*p))
638 1.12 christos anymeta = 1;
639 1.12 christos if (q >= pathlim)
640 1.12 christos return GLOB_ABORTED;
641 1.12 christos *q++ = *p++;
642 1.12 christos }
643 1.12 christos
644 1.12 christos if (!anymeta) { /* No expansion, do next segment. */
645 1.12 christos pathend = q;
646 1.12 christos pattern = p;
647 1.12 christos while (*pattern == SEP) {
648 1.12 christos if (pathend >= pathlim)
649 1.12 christos return GLOB_ABORTED;
650 1.12 christos *pathend++ = *pattern++;
651 1.12 christos }
652 1.12 christos } else /* Need expansion, recurse. */
653 1.18 christos return glob3(pathbuf, pathend, pathlim, pattern, p,
654 1.18 christos pglob, limit);
655 1.12 christos }
656 1.12 christos /* NOTREACHED */
657 1.12 christos }
658 1.12 christos
659 1.12 christos static int
660 1.18 christos glob3(Char *pathbuf, Char *pathend, Char *pathlim, Char *pattern,
661 1.18 christos Char *restpattern, glob_t *pglob, size_t *limit)
662 1.12 christos {
663 1.12 christos struct dirent *dp;
664 1.12 christos DIR *dirp;
665 1.12 christos int error;
666 1.12 christos char buf[MAXPATHLEN];
667 1.12 christos
668 1.12 christos /*
669 1.12 christos * The readdirfunc declaration can't be prototyped, because it is
670 1.12 christos * assigned, below, to two functions which are prototyped in glob.h
671 1.12 christos * and dirent.h as taking pointers to differently typed opaque
672 1.12 christos * structures.
673 1.12 christos */
674 1.18 christos struct dirent *(*readdirfunc)(void *);
675 1.12 christos
676 1.12 christos _DIAGASSERT(pathbuf != NULL);
677 1.12 christos _DIAGASSERT(pathend != NULL);
678 1.12 christos _DIAGASSERT(pattern != NULL);
679 1.12 christos _DIAGASSERT(restpattern != NULL);
680 1.12 christos _DIAGASSERT(pglob != NULL);
681 1.12 christos
682 1.12 christos *pathend = EOS;
683 1.12 christos errno = 0;
684 1.12 christos
685 1.12 christos if ((dirp = g_opendir(pathbuf, pglob)) == NULL) {
686 1.12 christos if (pglob->gl_errfunc) {
687 1.12 christos if (g_Ctoc(pathbuf, buf, sizeof(buf)))
688 1.18 christos return GLOB_ABORTED;
689 1.12 christos if (pglob->gl_errfunc(buf, errno) ||
690 1.12 christos pglob->gl_flags & GLOB_ERR)
691 1.18 christos return GLOB_ABORTED;
692 1.12 christos }
693 1.12 christos /*
694 1.12 christos * Posix/XOpen: glob should return when it encounters a
695 1.12 christos * directory that it cannot open or read
696 1.12 christos * XXX: Should we ignore ENOTDIR and ENOENT though?
697 1.12 christos * I think that Posix had in mind EPERM...
698 1.12 christos */
699 1.12 christos if (pglob->gl_flags & GLOB_ERR)
700 1.18 christos return GLOB_ABORTED;
701 1.12 christos
702 1.18 christos return 0;
703 1.12 christos }
704 1.12 christos
705 1.12 christos error = 0;
706 1.12 christos
707 1.12 christos /* Search directory for matching names. */
708 1.12 christos if (pglob->gl_flags & GLOB_ALTDIRFUNC)
709 1.12 christos readdirfunc = pglob->gl_readdir;
710 1.12 christos else
711 1.12 christos readdirfunc = (struct dirent *(*)__P((void *))) readdir;
712 1.12 christos while ((dp = (*readdirfunc)(dirp)) != NULL) {
713 1.12 christos u_char *sc;
714 1.12 christos Char *dc;
715 1.12 christos
716 1.12 christos /* Initial DOT must be matched literally. */
717 1.12 christos if (dp->d_name[0] == DOT && *pattern != DOT)
718 1.12 christos continue;
719 1.12 christos /*
720 1.12 christos * The resulting string contains EOS, so we can
721 1.12 christos * use the pathlim character, if it is the nul
722 1.12 christos */
723 1.12 christos for (sc = (u_char *) dp->d_name, dc = pathend;
724 1.12 christos dc <= pathlim && (*dc++ = *sc++) != EOS;)
725 1.12 christos continue;
726 1.12 christos
727 1.18.2.1 riz if ((pglob->gl_flags & GLOB_LIMIT) &&
728 1.18.2.1 riz limit[GLOB_INDEX_READDIR]++ >= GLOB_LIMIT_READDIR) {
729 1.18.2.1 riz errno = 0;
730 1.18.2.1 riz *pathend++ = SEP;
731 1.18.2.1 riz *pathend = EOS;
732 1.18.2.1 riz return GLOB_NOSPACE;
733 1.18.2.1 riz }
734 1.18.2.1 riz
735 1.12 christos /*
736 1.12 christos * Have we filled the buffer without seeing EOS?
737 1.12 christos */
738 1.12 christos if (dc > pathlim && *pathlim != EOS) {
739 1.12 christos /*
740 1.12 christos * Abort when requested by caller, otherwise
741 1.12 christos * reset pathend back to last SEP and continue
742 1.12 christos * with next dir entry.
743 1.12 christos */
744 1.12 christos if (pglob->gl_flags & GLOB_ERR) {
745 1.12 christos error = GLOB_ABORTED;
746 1.12 christos break;
747 1.12 christos }
748 1.12 christos else {
749 1.12 christos *pathend = EOS;
750 1.12 christos continue;
751 1.12 christos }
752 1.12 christos }
753 1.12 christos
754 1.12 christos if (!match(pathend, pattern, restpattern)) {
755 1.12 christos *pathend = EOS;
756 1.12 christos continue;
757 1.12 christos }
758 1.18.2.1 riz error = glob2(pathbuf, --dc, pathlim, restpattern, pglob,
759 1.18.2.1 riz limit);
760 1.12 christos if (error)
761 1.12 christos break;
762 1.12 christos }
763 1.12 christos
764 1.12 christos if (pglob->gl_flags & GLOB_ALTDIRFUNC)
765 1.12 christos (*pglob->gl_closedir)(dirp);
766 1.12 christos else
767 1.12 christos closedir(dirp);
768 1.12 christos
769 1.12 christos /*
770 1.12 christos * Again Posix X/Open issue with regards to error handling.
771 1.12 christos */
772 1.12 christos if ((error || errno) && (pglob->gl_flags & GLOB_ERR))
773 1.18 christos return GLOB_ABORTED;
774 1.12 christos
775 1.18 christos return error;
776 1.12 christos }
777 1.12 christos
778 1.12 christos
779 1.12 christos /*
780 1.17 christos * Extend the gl_pathv member of a glob_t structure to accommodate a new item,
781 1.12 christos * add the new item, and update gl_pathc.
782 1.12 christos *
783 1.12 christos * This assumes the BSD realloc, which only copies the block when its size
784 1.12 christos * crosses a power-of-two boundary; for v7 realloc, this would cause quadratic
785 1.12 christos * behavior.
786 1.12 christos *
787 1.12 christos * Return 0 if new item added, error code if memory couldn't be allocated.
788 1.12 christos *
789 1.12 christos * Invariant of the glob_t structure:
790 1.12 christos * Either gl_pathc is zero and gl_pathv is NULL; or gl_pathc > 0 and
791 1.12 christos * gl_pathv points to (gl_offs + gl_pathc + 1) items.
792 1.12 christos */
793 1.12 christos static int
794 1.18 christos globextend(const Char *path, glob_t *pglob, size_t *limit)
795 1.12 christos {
796 1.12 christos char **pathv;
797 1.16 christos size_t i, newsize, len;
798 1.12 christos char *copy;
799 1.12 christos const Char *p;
800 1.12 christos
801 1.12 christos _DIAGASSERT(path != NULL);
802 1.12 christos _DIAGASSERT(pglob != NULL);
803 1.12 christos
804 1.12 christos newsize = sizeof(*pathv) * (2 + pglob->gl_pathc + pglob->gl_offs);
805 1.12 christos pathv = pglob->gl_pathv ? realloc(pglob->gl_pathv, newsize) :
806 1.12 christos malloc(newsize);
807 1.12 christos if (pathv == NULL)
808 1.18 christos return GLOB_NOSPACE;
809 1.12 christos
810 1.12 christos if (pglob->gl_pathv == NULL && pglob->gl_offs > 0) {
811 1.12 christos /* first time around -- clear initial gl_offs items */
812 1.12 christos pathv += pglob->gl_offs;
813 1.16 christos for (i = pglob->gl_offs + 1; --i > 0; )
814 1.12 christos *--pathv = NULL;
815 1.12 christos }
816 1.12 christos pglob->gl_pathv = pathv;
817 1.12 christos
818 1.12 christos for (p = path; *p++;)
819 1.12 christos continue;
820 1.12 christos len = (size_t)(p - path);
821 1.18.2.1 riz limit[GLOB_INDEX_MALLOC] += len;
822 1.12 christos if ((copy = malloc(len)) != NULL) {
823 1.12 christos if (g_Ctoc(path, copy, len)) {
824 1.12 christos free(copy);
825 1.18 christos return GLOB_ABORTED;
826 1.12 christos }
827 1.12 christos pathv[pglob->gl_offs + pglob->gl_pathc++] = copy;
828 1.12 christos }
829 1.12 christos pathv[pglob->gl_offs + pglob->gl_pathc] = NULL;
830 1.12 christos
831 1.18.2.1 riz if ((pglob->gl_flags & GLOB_LIMIT) &&
832 1.18.2.1 riz (newsize + limit[GLOB_INDEX_MALLOC]) >= GLOB_LIMIT_MALLOC) {
833 1.12 christos errno = 0;
834 1.18 christos return GLOB_NOSPACE;
835 1.12 christos }
836 1.12 christos
837 1.18 christos return copy == NULL ? GLOB_NOSPACE : 0;
838 1.12 christos }
839 1.12 christos
840 1.12 christos
841 1.12 christos /*
842 1.12 christos * pattern matching function for filenames. Each occurrence of the *
843 1.12 christos * pattern causes a recursion level.
844 1.12 christos */
845 1.12 christos static int
846 1.18 christos match(Char *name, Char *pat, Char *patend)
847 1.12 christos {
848 1.12 christos int ok, negate_range;
849 1.12 christos Char c, k;
850 1.12 christos
851 1.12 christos _DIAGASSERT(name != NULL);
852 1.12 christos _DIAGASSERT(pat != NULL);
853 1.12 christos _DIAGASSERT(patend != NULL);
854 1.12 christos
855 1.12 christos while (pat < patend) {
856 1.12 christos c = *pat++;
857 1.12 christos switch (c & M_MASK) {
858 1.12 christos case M_ALL:
859 1.12 christos if (pat == patend)
860 1.18 christos return 1;
861 1.12 christos do
862 1.12 christos if (match(name, pat, patend))
863 1.18 christos return 1;
864 1.12 christos while (*name++ != EOS);
865 1.18 christos return 0;
866 1.12 christos case M_ONE:
867 1.12 christos if (*name++ == EOS)
868 1.18 christos return 0;
869 1.12 christos break;
870 1.12 christos case M_SET:
871 1.12 christos ok = 0;
872 1.12 christos if ((k = *name++) == EOS)
873 1.18 christos return 0;
874 1.12 christos if ((negate_range = ((*pat & M_MASK) == M_NOT)) != EOS)
875 1.12 christos ++pat;
876 1.12 christos while (((c = *pat++) & M_MASK) != M_END)
877 1.12 christos if ((*pat & M_MASK) == M_RNG) {
878 1.12 christos if (c <= k && k <= pat[1])
879 1.12 christos ok = 1;
880 1.12 christos pat += 2;
881 1.12 christos } else if (c == k)
882 1.12 christos ok = 1;
883 1.12 christos if (ok == negate_range)
884 1.18 christos return 0;
885 1.12 christos break;
886 1.12 christos default:
887 1.12 christos if (*name++ != c)
888 1.18 christos return 0;
889 1.12 christos break;
890 1.12 christos }
891 1.12 christos }
892 1.18 christos return *name == EOS;
893 1.12 christos }
894 1.12 christos
/*
 * Free allocated data belonging to a glob_t structure: the gl_pathc strings
 * stored after the first gl_offs slots of gl_pathv, then the vector itself.
 * On return gl_pathv is NULL and gl_pathc is 0.  A structure whose gl_pathv
 * is already NULL is left untouched.
 */
void
globfree(glob_t *pglob)
{
	size_t idx;
	char **first;

	_DIAGASSERT(pglob != NULL);

	if (pglob->gl_pathv == NULL)
		return;

	first = pglob->gl_pathv + pglob->gl_offs;
	/* free(NULL) is a no-op, so empty slots need no special casing */
	for (idx = 0; idx < pglob->gl_pathc; idx++)
		free(first[idx]);

	free(pglob->gl_pathv);
	pglob->gl_pathv = NULL;
	pglob->gl_pathc = 0;
}
914 1.12 christos
915 1.12 christos static DIR *
916 1.18 christos g_opendir(Char *str, glob_t *pglob)
917 1.12 christos {
918 1.12 christos char buf[MAXPATHLEN];
919 1.12 christos
920 1.12 christos _DIAGASSERT(str != NULL);
921 1.12 christos _DIAGASSERT(pglob != NULL);
922 1.12 christos
923 1.12 christos if (!*str)
924 1.12 christos (void)strlcpy(buf, ".", sizeof(buf));
925 1.12 christos else {
926 1.12 christos if (g_Ctoc(str, buf, sizeof(buf)))
927 1.12 christos return NULL;
928 1.12 christos }
929 1.12 christos
930 1.12 christos if (pglob->gl_flags & GLOB_ALTDIRFUNC)
931 1.18 christos return (*pglob->gl_opendir)(buf);
932 1.12 christos
933 1.18 christos return opendir(buf);
934 1.12 christos }
935 1.12 christos
936 1.12 christos static int
937 1.18 christos g_lstat(Char *fn, __gl_stat_t *sb, glob_t *pglob)
938 1.12 christos {
939 1.12 christos char buf[MAXPATHLEN];
940 1.12 christos
941 1.12 christos _DIAGASSERT(fn != NULL);
942 1.12 christos _DIAGASSERT(sb != NULL);
943 1.12 christos _DIAGASSERT(pglob != NULL);
944 1.12 christos
945 1.12 christos if (g_Ctoc(fn, buf, sizeof(buf)))
946 1.12 christos return -1;
947 1.12 christos if (pglob->gl_flags & GLOB_ALTDIRFUNC)
948 1.18 christos return (*pglob->gl_lstat)(buf, sb);
949 1.18 christos return lstat(buf, sb);
950 1.12 christos }
951 1.12 christos
952 1.12 christos static int
953 1.18 christos g_stat(Char *fn, __gl_stat_t *sb, glob_t *pglob)
954 1.12 christos {
955 1.12 christos char buf[MAXPATHLEN];
956 1.12 christos
957 1.12 christos _DIAGASSERT(fn != NULL);
958 1.12 christos _DIAGASSERT(sb != NULL);
959 1.12 christos _DIAGASSERT(pglob != NULL);
960 1.12 christos
961 1.12 christos if (g_Ctoc(fn, buf, sizeof(buf)))
962 1.12 christos return -1;
963 1.12 christos if (pglob->gl_flags & GLOB_ALTDIRFUNC)
964 1.18 christos return (*pglob->gl_stat)(buf, sb);
965 1.18 christos return stat(buf, sb);
966 1.12 christos }
967 1.12 christos
968 1.12 christos static Char *
969 1.18 christos g_strchr(const Char *str, int ch)
970 1.12 christos {
971 1.12 christos
972 1.12 christos _DIAGASSERT(str != NULL);
973 1.12 christos
974 1.12 christos do {
975 1.12 christos if (*str == ch)
976 1.14 christos return __UNCONST(str);
977 1.12 christos } while (*str++);
978 1.12 christos return NULL;
979 1.12 christos }
980 1.12 christos
981 1.12 christos static int
982 1.18 christos g_Ctoc(const Char *str, char *buf, size_t len)
983 1.12 christos {
984 1.12 christos char *dc;
985 1.12 christos
986 1.12 christos _DIAGASSERT(str != NULL);
987 1.12 christos _DIAGASSERT(buf != NULL);
988 1.12 christos
989 1.12 christos if (len == 0)
990 1.12 christos return 1;
991 1.12 christos
992 1.12 christos for (dc = buf; len && (*dc++ = *str++) != EOS; len--)
993 1.12 christos continue;
994 1.12 christos
995 1.12 christos return len == 0;
996 1.12 christos }
997 1.12 christos
#ifdef DEBUG
/*
 * Debugging aid: print the label str followed by ':' and then three lines
 * describing the Char string s, one output column per element:
 *	1. the element passed through CHAR();
 *	2. '"' where M_PROTECT is set in the element, otherwise a blank;
 *	3. '_' where ismeta() is true for the element, otherwise a blank.
 */
static void
qprintf(const char *str, Char *s)
{
	Char *cp;
	int mark;

	_DIAGASSERT(str != NULL);
	_DIAGASSERT(s != NULL);

	(void)printf("%s:\n", str);

	cp = s;
	while (*cp) {
		(void)printf("%c", CHAR(*cp));
		cp++;
	}
	(void)printf("\n");

	cp = s;
	while (*cp) {
		mark = (*cp & M_PROTECT) ? '"' : ' ';
		(void)printf("%c", mark);
		cp++;
	}
	(void)printf("\n");

	cp = s;
	while (*cp) {
		mark = ismeta(*cp) ? '_' : ' ';
		(void)printf("%c", mark);
		cp++;
	}
	(void)printf("\n");
}
#endif
1019