regexp.c revision 1.12 1 1.12 matt /* $NetBSD: regexp.c,v 1.12 2012/03/20 20:34:59 matt Exp $ */
2 1.3 jtc
3 1.1 cgd /*
4 1.3 jtc * Copyright (c) 1980, 1993
5 1.3 jtc * The Regents of the University of California. All rights reserved.
6 1.3 jtc *
7 1.1 cgd *
8 1.1 cgd * Redistribution and use in source and binary forms, with or without
9 1.1 cgd * modification, are permitted provided that the following conditions
10 1.1 cgd * are met:
11 1.1 cgd * 1. Redistributions of source code must retain the above copyright
12 1.1 cgd * notice, this list of conditions and the following disclaimer.
13 1.1 cgd * 2. Redistributions in binary form must reproduce the above copyright
14 1.1 cgd * notice, this list of conditions and the following disclaimer in the
15 1.1 cgd * documentation and/or other materials provided with the distribution.
16 1.7 agc * 3. Neither the name of the University nor the names of its contributors
17 1.1 cgd * may be used to endorse or promote products derived from this software
18 1.1 cgd * without specific prior written permission.
19 1.1 cgd *
20 1.1 cgd * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
21 1.1 cgd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22 1.1 cgd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23 1.1 cgd * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
24 1.1 cgd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25 1.1 cgd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26 1.1 cgd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27 1.1 cgd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28 1.1 cgd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29 1.1 cgd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30 1.1 cgd * SUCH DAMAGE.
31 1.1 cgd */
32 1.1 cgd
33 1.4 lukem #include <sys/cdefs.h>
34 1.1 cgd #ifndef lint
35 1.11 lukem __COPYRIGHT("@(#) Copyright (c) 1980, 1993\
36 1.11 lukem The Regents of the University of California. All rights reserved.");
37 1.3 jtc #endif /* not lint */
38 1.3 jtc
39 1.3 jtc #ifndef lint
40 1.3 jtc #if 0
41 1.3 jtc static char sccsid[] = "@(#)regexp.c 8.1 (Berkeley) 6/6/93";
42 1.3 jtc #endif
43 1.12 matt __RCSID("$NetBSD: regexp.c,v 1.12 2012/03/20 20:34:59 matt Exp $");
44 1.1 cgd #endif /* not lint */
45 1.1 cgd
46 1.10 christos #include <assert.h>
47 1.1 cgd #include <ctype.h>
48 1.3 jtc #include <stdlib.h>
49 1.3 jtc #include <string.h>
50 1.3 jtc #include "extern.h"
51 1.1 cgd
52 1.1 cgd #define FALSE 0
53 1.3 jtc #define TRUE !(FALSE)
54 1.1 cgd #define NIL 0
55 1.1 cgd
56 1.3 jtc static void expconv __P((void));
57 1.3 jtc
58 1.5 christos boolean x_escaped; /* true if we are currently x_escaped */
59 1.5 christos char *x_start; /* start of string */
60 1.3 jtc boolean l_onecase; /* true if upper and lower equivalent */
61 1.1 cgd
62 1.8 dsl #define makelower(c) (isupper((unsigned char)(c)) ? tolower((unsigned char)(c)) : (c))
63 1.1 cgd
64 1.1 cgd /* STRNCMP - like strncmp except that we convert the
65 1.1 cgd * first string to lower case before comparing
66 1.1 cgd * if l_onecase is set.
67 1.1 cgd */
68 1.1 cgd
69 1.3 jtc int
70 1.12 matt STRNCMP(char *s1, char *s2, int len)
71 1.1 cgd {
72 1.1 cgd if (l_onecase) {
73 1.1 cgd do
74 1.1 cgd if (*s2 - makelower(*s1))
75 1.1 cgd return (*s2 - makelower(*s1));
76 1.1 cgd else {
77 1.1 cgd s2++;
78 1.1 cgd s1++;
79 1.1 cgd }
80 1.1 cgd while (--len);
81 1.1 cgd } else {
82 1.1 cgd do
83 1.1 cgd if (*s2 - *s1)
84 1.1 cgd return (*s2 - *s1);
85 1.1 cgd else {
86 1.1 cgd s2++;
87 1.1 cgd s1++;
88 1.1 cgd }
89 1.1 cgd while (--len);
90 1.1 cgd }
91 1.1 cgd return(0);
92 1.1 cgd }
93 1.1 cgd
/*
 * Internal ("converted") form of an irregular expression.
 *
 * convexp() turns the textual expression into a sequence of blocks that
 * ends with a zero byte.  Every block begins with a descriptor byte in
 * which one of STR, META or OPER says what kind of block it is.  The
 * descriptor may also carry OPT when the block is optional and ALT when
 * an alternative follows it.
 *
 *	string     := descriptor (STR)
 *		      character count
 *		      the characters
 *
 *	meta symbol := descriptor (META)
 *		      symbol: 'a', 'd', 'e', 'p', '^', '$' or ')'
 *
 *	operation  := descriptor (OPER)
 *		      symbol: '|' or '('
 *		      character count, used as an offset from the first
 *		      byte of the block
 *
 * Counts and offsets occupy a single char each.
 */

/*
 * Handy macros for accessing parts of match blocks.  A is a pointer to
 * the descriptor byte of the block.  Every use of the argument is
 * parenthesized so that compound expressions can be passed safely; the
 * argument may still be evaluated more than once.
 */
#define MSYM(A)		(*((A) + 1))	/* symbol in a meta symbol block */
#define MNEXT(A)	((A) + 2)	/* first byte after a meta symbol block */

#define OSYM(A)		(*((A) + 1))	/* symbol in an operation block */
#define OCNT(A)		(*((A) + 2))	/* character count */
#define ONEXT(A)	((A) + 3)	/* first byte after the operation block */
#define OPTR(A)		((A) + *((A) + 2)) /* place pointed to by the operator */

#define SCNT(A)		(*((A) + 1))	/* byte count of a string */
#define SSTR(A)		((A) + 2)	/* address of the string */
#define SNEXT(A)	((A) + 2 + *((A) + 1)) /* first byte after the string */

/*
 * Bit flags in the descriptor.
 */
#define OPT	1
#define STR	2
#define META	4
#define ALT	8
#define OPER	16

static char *ccre;	/* current position in the converted expression */
static char *ure;	/* current position in the unconverted expression */
148 1.1 cgd
149 1.1 cgd char *
150 1.12 matt convexp(char *re) /* unconverted irregular expression */
151 1.1 cgd {
152 1.4 lukem char *cre; /* pointer to converted regular expression */
153 1.1 cgd
154 1.1 cgd /* allocate room for the converted expression */
155 1.1 cgd if (re == NIL)
156 1.1 cgd return (NIL);
157 1.1 cgd if (*re == '\0')
158 1.1 cgd return (NIL);
159 1.6 itojun cre = malloc(4 * strlen(re) + 3);
160 1.1 cgd ccre = cre;
161 1.1 cgd ure = re;
162 1.1 cgd
163 1.1 cgd /* start the conversion with a \a */
164 1.1 cgd *cre = META | OPT;
165 1.1 cgd MSYM(cre) = 'a';
166 1.1 cgd ccre = MNEXT(cre);
167 1.1 cgd
168 1.1 cgd /* start the conversion (its recursive) */
169 1.6 itojun expconv();
170 1.1 cgd *ccre = 0;
171 1.1 cgd return (cre);
172 1.1 cgd }
173 1.1 cgd
174 1.3 jtc static void
175 1.12 matt expconv(void)
176 1.1 cgd {
177 1.4 lukem char *cs; /* pointer to current symbol in converted exp */
178 1.4 lukem char c; /* character being processed */
179 1.4 lukem char *acs; /* pinter to last alternate */
180 1.4 lukem int temp;
181 1.1 cgd
182 1.1 cgd /* let the conversion begin */
183 1.1 cgd acs = NIL;
184 1.1 cgd cs = NIL;
185 1.1 cgd while (*ure != NIL) {
186 1.1 cgd switch (c = *ure++) {
187 1.1 cgd
188 1.1 cgd case '\\':
189 1.1 cgd switch (c = *ure++) {
190 1.1 cgd
191 1.1 cgd /* escaped characters are just characters */
192 1.1 cgd default:
193 1.1 cgd if (cs == NIL || (*cs & STR) == 0) {
194 1.1 cgd cs = ccre;
195 1.1 cgd *cs = STR;
196 1.1 cgd SCNT(cs) = 1;
197 1.1 cgd ccre += 2;
198 1.1 cgd } else
199 1.1 cgd SCNT(cs)++;
200 1.1 cgd *ccre++ = c;
201 1.1 cgd break;
202 1.1 cgd
203 1.1 cgd /* normal(?) metacharacters */
204 1.1 cgd case 'a':
205 1.1 cgd case 'd':
206 1.1 cgd case 'e':
207 1.1 cgd case 'p':
208 1.1 cgd if (acs != NIL && acs != cs) {
209 1.1 cgd do {
210 1.1 cgd temp = OCNT(acs);
211 1.1 cgd OCNT(acs) = ccre - acs;
212 1.1 cgd acs -= temp;
213 1.1 cgd } while (temp != 0);
214 1.1 cgd acs = NIL;
215 1.1 cgd }
216 1.1 cgd cs = ccre;
217 1.1 cgd *cs = META;
218 1.1 cgd MSYM(cs) = c;
219 1.1 cgd ccre = MNEXT(cs);
220 1.1 cgd break;
221 1.1 cgd }
222 1.1 cgd break;
223 1.1 cgd
224 1.1 cgd /* just put the symbol in */
225 1.1 cgd case '^':
226 1.1 cgd case '$':
227 1.1 cgd if (acs != NIL && acs != cs) {
228 1.1 cgd do {
229 1.1 cgd temp = OCNT(acs);
230 1.1 cgd OCNT(acs) = ccre - acs;
231 1.1 cgd acs -= temp;
232 1.1 cgd } while (temp != 0);
233 1.1 cgd acs = NIL;
234 1.1 cgd }
235 1.1 cgd cs = ccre;
236 1.1 cgd *cs = META;
237 1.1 cgd MSYM(cs) = c;
238 1.1 cgd ccre = MNEXT(cs);
239 1.1 cgd break;
240 1.1 cgd
241 1.1 cgd /* mark the last match sequence as optional */
242 1.1 cgd case '?':
243 1.1 cgd if (cs)
244 1.1 cgd *cs = *cs | OPT;
245 1.1 cgd break;
246 1.1 cgd
247 1.1 cgd /* recurse and define a subexpression */
248 1.1 cgd case '(':
249 1.1 cgd if (acs != NIL && acs != cs) {
250 1.1 cgd do {
251 1.1 cgd temp = OCNT(acs);
252 1.1 cgd OCNT(acs) = ccre - acs;
253 1.1 cgd acs -= temp;
254 1.1 cgd } while (temp != 0);
255 1.1 cgd acs = NIL;
256 1.1 cgd }
257 1.1 cgd cs = ccre;
258 1.1 cgd *cs = OPER;
259 1.1 cgd OSYM(cs) = '(';
260 1.1 cgd ccre = ONEXT(cs);
261 1.6 itojun expconv();
262 1.1 cgd OCNT(cs) = ccre - cs; /* offset to next symbol */
263 1.1 cgd break;
264 1.1 cgd
265 1.3 jtc /* reurn from a recursion */
266 1.1 cgd case ')':
267 1.1 cgd if (acs != NIL) {
268 1.1 cgd do {
269 1.1 cgd temp = OCNT(acs);
270 1.1 cgd OCNT(acs) = ccre - acs;
271 1.1 cgd acs -= temp;
272 1.1 cgd } while (temp != 0);
273 1.1 cgd acs = NIL;
274 1.1 cgd }
275 1.1 cgd cs = ccre;
276 1.1 cgd *cs = META;
277 1.1 cgd MSYM(cs) = c;
278 1.1 cgd ccre = MNEXT(cs);
279 1.1 cgd return;
280 1.1 cgd
281 1.1 cgd /* mark the last match sequence as having an alternate */
282 1.1 cgd /* the third byte will contain an offset to jump over the */
283 1.1 cgd /* alternate match in case the first did not fail */
284 1.1 cgd case '|':
285 1.1 cgd if (acs != NIL && acs != cs)
286 1.1 cgd OCNT(ccre) = ccre - acs; /* make a back pointer */
287 1.1 cgd else
288 1.1 cgd OCNT(ccre) = 0;
289 1.9 christos assert(cs != NULL);
290 1.1 cgd *cs |= ALT;
291 1.1 cgd cs = ccre;
292 1.1 cgd *cs = OPER;
293 1.1 cgd OSYM(cs) = '|';
294 1.1 cgd ccre = ONEXT(cs);
295 1.1 cgd acs = cs; /* remember that the pointer is to be filles */
296 1.1 cgd break;
297 1.1 cgd
298 1.1 cgd /* if its not a metasymbol just build a scharacter string */
299 1.1 cgd default:
300 1.1 cgd if (cs == NIL || (*cs & STR) == 0) {
301 1.1 cgd cs = ccre;
302 1.1 cgd *cs = STR;
303 1.1 cgd SCNT(cs) = 1;
304 1.1 cgd ccre = SSTR(cs);
305 1.1 cgd } else
306 1.1 cgd SCNT(cs)++;
307 1.1 cgd *ccre++ = c;
308 1.1 cgd break;
309 1.1 cgd }
310 1.1 cgd }
311 1.1 cgd if (acs != NIL) {
312 1.1 cgd do {
313 1.1 cgd temp = OCNT(acs);
314 1.1 cgd OCNT(acs) = ccre - acs;
315 1.1 cgd acs -= temp;
316 1.1 cgd } while (temp != 0);
317 1.1 cgd acs = NIL;
318 1.1 cgd }
319 1.1 cgd return;
320 1.1 cgd }
321 1.1 cgd /* end of convertre */
322 1.1 cgd
323 1.1 cgd
324 1.1 cgd /*
325 1.1 cgd * The following routine recognises an irregular expresion
326 1.1 cgd * with the following special characters:
327 1.1 cgd *
328 1.1 cgd * \? - means last match was optional
329 1.1 cgd * \a - matches any number of characters
330 1.1 cgd * \d - matches any number of spaces and tabs
331 1.1 cgd * \p - matches any number of alphanumeric
332 1.1 cgd * characters. The
333 1.1 cgd * characters matched will be copied into
334 1.1 cgd * the area pointed to by 'name'.
335 1.1 cgd * \| - alternation
336 1.1 cgd * \( \) - grouping used mostly for alternation and
337 1.1 cgd * optionality
338 1.1 cgd *
339 1.1 cgd * The irregular expression must be translated to internal form
340 1.1 cgd * prior to calling this routine
341 1.1 cgd *
342 1.1 cgd * The value returned is the pointer to the first non \a
343 1.1 cgd * character matched.
344 1.1 cgd */
345 1.1 cgd
346 1.1 cgd char *
347 1.12 matt expmatch(
348 1.12 matt char *s, /* string to check for a match in */
349 1.12 matt char *re, /* a converted irregular expression */
350 1.12 matt char *mstring) /* where to put whatever matches a \p */
351 1.1 cgd {
352 1.4 lukem char *cs; /* the current symbol */
353 1.4 lukem char *ptr,*s1; /* temporary pointer */
354 1.4 lukem boolean matched; /* a temporary boolean */
355 1.1 cgd
356 1.1 cgd /* initial conditions */
357 1.1 cgd if (re == NIL)
358 1.1 cgd return (NIL);
359 1.1 cgd cs = re;
360 1.1 cgd matched = FALSE;
361 1.1 cgd
362 1.1 cgd /* loop till expression string is exhausted (or at least pretty tired) */
363 1.1 cgd while (*cs) {
364 1.1 cgd switch (*cs & (OPER | STR | META)) {
365 1.1 cgd
366 1.1 cgd /* try to match a string */
367 1.1 cgd case STR:
368 1.1 cgd matched = !STRNCMP (s, SSTR(cs), SCNT(cs));
369 1.1 cgd if (matched) {
370 1.1 cgd
371 1.1 cgd /* hoorah it matches */
372 1.1 cgd s += SCNT(cs);
373 1.1 cgd cs = SNEXT(cs);
374 1.1 cgd } else if (*cs & ALT) {
375 1.1 cgd
376 1.1 cgd /* alternation, skip to next expression */
377 1.1 cgd cs = SNEXT(cs);
378 1.1 cgd } else if (*cs & OPT) {
379 1.1 cgd
380 1.1 cgd /* the match is optional */
381 1.1 cgd cs = SNEXT(cs);
382 1.1 cgd matched = 1; /* indicate a successful match */
383 1.1 cgd } else {
384 1.1 cgd
385 1.1 cgd /* no match, error return */
386 1.1 cgd return (NIL);
387 1.1 cgd }
388 1.1 cgd break;
389 1.1 cgd
390 1.1 cgd /* an operator, do something fancy */
391 1.1 cgd case OPER:
392 1.1 cgd switch (OSYM(cs)) {
393 1.1 cgd
394 1.1 cgd /* this is an alternation */
395 1.1 cgd case '|':
396 1.1 cgd if (matched)
397 1.1 cgd
398 1.1 cgd /* last thing in the alternation was a match, skip ahead */
399 1.1 cgd cs = OPTR(cs);
400 1.1 cgd else
401 1.1 cgd
402 1.1 cgd /* no match, keep trying */
403 1.1 cgd cs = ONEXT(cs);
404 1.1 cgd break;
405 1.1 cgd
406 1.1 cgd /* this is a grouping, recurse */
407 1.1 cgd case '(':
408 1.6 itojun ptr = expmatch(s, ONEXT(cs), mstring);
409 1.1 cgd if (ptr != NIL) {
410 1.1 cgd
411 1.1 cgd /* the subexpression matched */
412 1.1 cgd matched = 1;
413 1.1 cgd s = ptr;
414 1.1 cgd } else if (*cs & ALT) {
415 1.1 cgd
416 1.1 cgd /* alternation, skip to next expression */
417 1.1 cgd matched = 0;
418 1.1 cgd } else if (*cs & OPT) {
419 1.1 cgd
420 1.1 cgd /* the match is optional */
421 1.1 cgd matched = 1; /* indicate a successful match */
422 1.1 cgd } else {
423 1.1 cgd
424 1.1 cgd /* no match, error return */
425 1.1 cgd return (NIL);
426 1.1 cgd }
427 1.1 cgd cs = OPTR(cs);
428 1.1 cgd break;
429 1.1 cgd }
430 1.1 cgd break;
431 1.1 cgd
432 1.1 cgd /* try to match a metasymbol */
433 1.1 cgd case META:
434 1.1 cgd switch (MSYM(cs)) {
435 1.1 cgd
436 1.1 cgd /* try to match anything and remember what was matched */
437 1.1 cgd case 'p':
438 1.1 cgd /*
439 1.1 cgd * This is really the same as trying the match the
440 1.1 cgd * remaining parts of the expression to any subset
441 1.1 cgd * of the string.
442 1.1 cgd */
443 1.1 cgd s1 = s;
444 1.1 cgd do {
445 1.6 itojun ptr = expmatch(s1, MNEXT(cs), mstring);
446 1.1 cgd if (ptr != NIL && s1 != s) {
447 1.1 cgd
448 1.1 cgd /* we have a match, remember the match */
449 1.6 itojun strncpy(mstring, s, s1 - s);
450 1.1 cgd mstring[s1 - s] = '\0';
451 1.1 cgd return (ptr);
452 1.1 cgd } else if (ptr != NIL && (*cs & OPT)) {
453 1.1 cgd
454 1.1 cgd /* it was aoptional so no match is ok */
455 1.1 cgd return (ptr);
456 1.1 cgd } else if (ptr != NIL) {
457 1.1 cgd
458 1.1 cgd /* not optional and we still matched */
459 1.1 cgd return (NIL);
460 1.1 cgd }
461 1.5 christos if (!isalnum((unsigned char)*s1) && *s1 != '_')
462 1.1 cgd return (NIL);
463 1.1 cgd if (*s1 == '\\')
464 1.5 christos x_escaped = x_escaped ? FALSE : TRUE;
465 1.1 cgd else
466 1.5 christos x_escaped = FALSE;
467 1.1 cgd } while (*s1++);
468 1.1 cgd return (NIL);
469 1.1 cgd
470 1.1 cgd /* try to match anything */
471 1.1 cgd case 'a':
472 1.1 cgd /*
473 1.1 cgd * This is really the same as trying the match the
474 1.1 cgd * remaining parts of the expression to any subset
475 1.1 cgd * of the string.
476 1.1 cgd */
477 1.1 cgd s1 = s;
478 1.1 cgd do {
479 1.6 itojun ptr = expmatch(s1, MNEXT(cs), mstring);
480 1.1 cgd if (ptr != NIL && s1 != s) {
481 1.1 cgd
482 1.1 cgd /* we have a match */
483 1.1 cgd return (ptr);
484 1.1 cgd } else if (ptr != NIL && (*cs & OPT)) {
485 1.1 cgd
486 1.1 cgd /* it was aoptional so no match is ok */
487 1.1 cgd return (ptr);
488 1.1 cgd } else if (ptr != NIL) {
489 1.1 cgd
490 1.1 cgd /* not optional and we still matched */
491 1.1 cgd return (NIL);
492 1.1 cgd }
493 1.1 cgd if (*s1 == '\\')
494 1.5 christos x_escaped = x_escaped ? FALSE : TRUE;
495 1.1 cgd else
496 1.5 christos x_escaped = FALSE;
497 1.1 cgd } while (*s1++);
498 1.1 cgd return (NIL);
499 1.1 cgd
500 1.5 christos /* fail if we are currently x_escaped */
501 1.1 cgd case 'e':
502 1.5 christos if (x_escaped)
503 1.1 cgd return(NIL);
504 1.1 cgd cs = MNEXT(cs);
505 1.1 cgd break;
506 1.1 cgd
507 1.1 cgd /* match any number of tabs and spaces */
508 1.1 cgd case 'd':
509 1.1 cgd ptr = s;
510 1.1 cgd while (*s == ' ' || *s == '\t')
511 1.1 cgd s++;
512 1.5 christos if (s != ptr || s == x_start) {
513 1.1 cgd
514 1.1 cgd /* match, be happy */
515 1.1 cgd matched = 1;
516 1.1 cgd cs = MNEXT(cs);
517 1.1 cgd } else if (*s == '\n' || *s == '\0') {
518 1.1 cgd
519 1.1 cgd /* match, be happy */
520 1.1 cgd matched = 1;
521 1.1 cgd cs = MNEXT(cs);
522 1.1 cgd } else if (*cs & ALT) {
523 1.1 cgd
524 1.1 cgd /* try the next part */
525 1.1 cgd matched = 0;
526 1.1 cgd cs = MNEXT(cs);
527 1.1 cgd } else if (*cs & OPT) {
528 1.1 cgd
529 1.1 cgd /* doesn't matter */
530 1.1 cgd matched = 1;
531 1.1 cgd cs = MNEXT(cs);
532 1.1 cgd } else
533 1.1 cgd
534 1.1 cgd /* no match, error return */
535 1.1 cgd return (NIL);
536 1.1 cgd break;
537 1.1 cgd
538 1.1 cgd /* check for end of line */
539 1.1 cgd case '$':
540 1.1 cgd if (*s == '\0' || *s == '\n') {
541 1.1 cgd
542 1.1 cgd /* match, be happy */
543 1.1 cgd s++;
544 1.1 cgd matched = 1;
545 1.1 cgd cs = MNEXT(cs);
546 1.1 cgd } else if (*cs & ALT) {
547 1.1 cgd
548 1.1 cgd /* try the next part */
549 1.1 cgd matched = 0;
550 1.1 cgd cs = MNEXT(cs);
551 1.1 cgd } else if (*cs & OPT) {
552 1.1 cgd
553 1.1 cgd /* doesn't matter */
554 1.1 cgd matched = 1;
555 1.1 cgd cs = MNEXT(cs);
556 1.1 cgd } else
557 1.1 cgd
558 1.1 cgd /* no match, error return */
559 1.1 cgd return (NIL);
560 1.1 cgd break;
561 1.1 cgd
562 1.1 cgd /* check for start of line */
563 1.1 cgd case '^':
564 1.5 christos if (s == x_start) {
565 1.1 cgd
566 1.1 cgd /* match, be happy */
567 1.1 cgd matched = 1;
568 1.1 cgd cs = MNEXT(cs);
569 1.1 cgd } else if (*cs & ALT) {
570 1.1 cgd
571 1.1 cgd /* try the next part */
572 1.1 cgd matched = 0;
573 1.1 cgd cs = MNEXT(cs);
574 1.1 cgd } else if (*cs & OPT) {
575 1.1 cgd
576 1.1 cgd /* doesn't matter */
577 1.1 cgd matched = 1;
578 1.1 cgd cs = MNEXT(cs);
579 1.1 cgd } else
580 1.1 cgd
581 1.1 cgd /* no match, error return */
582 1.1 cgd return (NIL);
583 1.1 cgd break;
584 1.1 cgd
585 1.1 cgd /* end of a subexpression, return success */
586 1.1 cgd case ')':
587 1.1 cgd return (s);
588 1.1 cgd }
589 1.1 cgd break;
590 1.1 cgd }
591 1.1 cgd }
592 1.1 cgd return (s);
593 1.1 cgd }
594