Home | History | Annotate | Line # | Download | only in vgrind
regexp.c revision 1.1.1.1
      1      1.1  cgd /*
      2  1.1.1.1  jtc  * Copyright (c) 1980, 1993
      3  1.1.1.1  jtc  *	The Regents of the University of California.  All rights reserved.
      4  1.1.1.1  jtc  *
      5      1.1  cgd  *
      6      1.1  cgd  * Redistribution and use in source and binary forms, with or without
      7      1.1  cgd  * modification, are permitted provided that the following conditions
      8      1.1  cgd  * are met:
      9      1.1  cgd  * 1. Redistributions of source code must retain the above copyright
     10      1.1  cgd  *    notice, this list of conditions and the following disclaimer.
     11      1.1  cgd  * 2. Redistributions in binary form must reproduce the above copyright
     12      1.1  cgd  *    notice, this list of conditions and the following disclaimer in the
     13      1.1  cgd  *    documentation and/or other materials provided with the distribution.
     14      1.1  cgd  * 3. All advertising materials mentioning features or use of this software
     15      1.1  cgd  *    must display the following acknowledgement:
     16      1.1  cgd  *	This product includes software developed by the University of
     17      1.1  cgd  *	California, Berkeley and its contributors.
     18      1.1  cgd  * 4. Neither the name of the University nor the names of its contributors
     19      1.1  cgd  *    may be used to endorse or promote products derived from this software
     20      1.1  cgd  *    without specific prior written permission.
     21      1.1  cgd  *
     22      1.1  cgd  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     23      1.1  cgd  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     24      1.1  cgd  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     25      1.1  cgd  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     26      1.1  cgd  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     27      1.1  cgd  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     28      1.1  cgd  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     29      1.1  cgd  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     30      1.1  cgd  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     31      1.1  cgd  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     32      1.1  cgd  * SUCH DAMAGE.
     33      1.1  cgd  */
     34      1.1  cgd 
#ifndef lint
/*
 * Identification strings embedded in the object file.  The "@(#)" prefix
 * is the marker that what(1) searches for.  Both are compiled out when
 * lint is defined.
 */
static char copyright[] =
	"@(#) Copyright (c) 1980, 1993\n"
	"\tThe Regents of the University of California.  All rights reserved.\n";
static char sccsid[] = "@(#)regexp.c\t8.1 (Berkeley) 6/6/93";
#endif /* not lint */
     44      1.1  cgd 
     45      1.1  cgd #include <ctype.h>
     46  1.1.1.1  jtc #include <stdlib.h>
     47  1.1.1.1  jtc #include <string.h>
     48  1.1.1.1  jtc #include "extern.h"
     49      1.1  cgd 
/*
 * Local truth values and the "nothing" value.  NIL is a plain 0 on purpose:
 * this file uses it both as a null pointer and as the NUL character when
 * testing for end of string, so it must not be turned into a pointer-typed
 * constant.
 */
#define FALSE	0
#define TRUE	(!(FALSE))	/* parenthesized so it expands as one operand */
#define NIL	0
     53      1.1  cgd 
/* recursive worker called by convexp(); defined further down */
static void	expconv __P((void));

/*
 * State shared with the callers of expmatch().  None of these is given a
 * starting value in this file other than the implicit zero.
 */
boolean	 _escaped;	/* true if we are currently _escaped; toggled by
			 * expmatch() as \a steps over backslashes and
			 * tested by \e */
char	*_start;	/* start of string; expmatch() compares against it
			 * for ^ and \d -- presumably set by the caller,
			 * it is never assigned here */
boolean	 l_onecase;	/* true if upper and lower equivalent (read by
			 * STRNCMP) */
     59      1.1  cgd 
/*
 * makelower - lower-case equivalent of c if c is an upper-case letter,
 * otherwise c itself.  The <ctype.h> routines are only defined for EOF and
 * values representable as unsigned char, so the argument is converted
 * before being classified; a plain char with the high bit set would
 * otherwise be passed as a negative int.  The argument is evaluated more
 * than once, so it must have no side effects.
 */
#define makelower(c) \
	(isupper((unsigned char)(c)) ? tolower((unsigned char)(c)) : (c))
     61      1.1  cgd 
     62      1.1  cgd /*  STRNCMP -	like strncmp except that we convert the
     63      1.1  cgd  *	 	first string to lower case before comparing
     64      1.1  cgd  *		if l_onecase is set.
     65      1.1  cgd  */
     66      1.1  cgd 
     67  1.1.1.1  jtc int
     68      1.1  cgd STRNCMP(s1, s2, len)
     69      1.1  cgd 	register char *s1,*s2;
     70      1.1  cgd 	register int len;
     71      1.1  cgd {
     72      1.1  cgd 	if (l_onecase) {
     73      1.1  cgd 	    do
     74      1.1  cgd 		if (*s2 - makelower(*s1))
     75      1.1  cgd 			return (*s2 - makelower(*s1));
     76      1.1  cgd 		else {
     77      1.1  cgd 			s2++;
     78      1.1  cgd 			s1++;
     79      1.1  cgd 		}
     80      1.1  cgd 	    while (--len);
     81      1.1  cgd 	} else {
     82      1.1  cgd 	    do
     83      1.1  cgd 		if (*s2 - *s1)
     84      1.1  cgd 			return (*s2 - *s1);
     85      1.1  cgd 		else {
     86      1.1  cgd 			s2++;
     87      1.1  cgd 			s1++;
     88      1.1  cgd 		}
     89      1.1  cgd 	    while (--len);
     90      1.1  cgd 	}
     91      1.1  cgd 	return(0);
     92      1.1  cgd }
     93      1.1  cgd 
/*	The following routine converts an irregular expression to
 *	internal format.
 *
 *	Either meta symbols (\a \d or \p) or character strings or
 *	operations (alternation or parenthesizing) can be
 *	specified.  Each starts with a descriptor byte.  The descriptor
 *	byte has STR set for strings, META set for meta symbols
 *	and OPER set for operations.
 *	The descriptor byte can also have the OPT bit set if the object
 *	defined is optional.  Also ALT can be set to indicate an alternation.
 *
 *	For metasymbols the byte following the descriptor byte identifies
 *	the meta symbol (containing an ascii 'a', 'd', 'p', '|', or '(').  For
 *	strings the byte after the descriptor is a character count for
 *	the string:
 *
 *		meta symbols := descriptor
 *				symbol
 *
 *		strings :=	descriptor
 *				character count
 *				the string
 *
 *		operations :=	descriptor
 *				symbol
 *				character count
 */
    121      1.1  cgd 
/*
 *  handy macros for accessing parts of match blocks
 *
 *  A is a char pointer to the descriptor byte of a block.  Every use of
 *  the argument is parenthesized so that an expression argument (for
 *  example "cond ? p : q") is offset as a whole.
 */
#define MSYM(A) (*((A)+1))	/* symbol in a meta symbol block */
#define MNEXT(A) ((A)+2)	/* character following a metasymbol block */

#define OSYM(A) (*((A)+1))	/* symbol in an operation block */
#define OCNT(A) (*((A)+2))	/* character count */
#define ONEXT(A) ((A)+3)	/* next character after the operation */
#define OPTR(A) ((A)+*((A)+2))	/* place pointed to by the operator */

#define SCNT(A) (*((A)+1))	/* byte count of a string */
#define SSTR(A) ((A)+2)		/* address of the string */
#define SNEXT(A) ((A)+2+*((A)+1)) /* character following the string */

/*
 *  bit flags in the descriptor
 */
#define OPT 1		/* block is optional */
#define STR 2		/* block is a literal string */
#define META 4		/* block is a meta symbol */
#define ALT 8		/* block is followed by an alternative */
#define OPER 16		/* block is an operation: '(' or '|' */

static char *ccre;	/* pointer to current position in converted exp */
static char *ure;	/* pointer to current position in unconverted exp */
    148      1.1  cgd 
    149      1.1  cgd char *
    150      1.1  cgd convexp(re)
    151      1.1  cgd     char *re;		/* unconverted irregular expression */
    152      1.1  cgd {
    153      1.1  cgd     register char *cre;		/* pointer to converted regular expression */
    154      1.1  cgd 
    155      1.1  cgd     /* allocate room for the converted expression */
    156      1.1  cgd     if (re == NIL)
    157      1.1  cgd 	return (NIL);
    158      1.1  cgd     if (*re == '\0')
    159      1.1  cgd 	return (NIL);
    160      1.1  cgd     cre = malloc (4 * strlen(re) + 3);
    161      1.1  cgd     ccre = cre;
    162      1.1  cgd     ure = re;
    163      1.1  cgd 
    164      1.1  cgd     /* start the conversion with a \a */
    165      1.1  cgd     *cre = META | OPT;
    166      1.1  cgd     MSYM(cre) = 'a';
    167      1.1  cgd     ccre = MNEXT(cre);
    168      1.1  cgd 
    169      1.1  cgd     /* start the conversion (its recursive) */
    170      1.1  cgd     expconv ();
    171      1.1  cgd     *ccre = 0;
    172      1.1  cgd     return (cre);
    173      1.1  cgd }
    174      1.1  cgd 
    175  1.1.1.1  jtc static void
    176      1.1  cgd expconv()
    177      1.1  cgd {
    178      1.1  cgd     register char *cs;		/* pointer to current symbol in converted exp */
    179      1.1  cgd     register char c;		/* character being processed */
    180      1.1  cgd     register char *acs;		/* pinter to last alternate */
    181      1.1  cgd     register int temp;
    182      1.1  cgd 
    183      1.1  cgd     /* let the conversion begin */
    184      1.1  cgd     acs = NIL;
    185      1.1  cgd     cs = NIL;
    186      1.1  cgd     while (*ure != NIL) {
    187      1.1  cgd 	switch (c = *ure++) {
    188      1.1  cgd 
    189      1.1  cgd 	case '\\':
    190      1.1  cgd 	    switch (c = *ure++) {
    191      1.1  cgd 
    192      1.1  cgd 	    /* escaped characters are just characters */
    193      1.1  cgd 	    default:
    194      1.1  cgd 		if (cs == NIL || (*cs & STR) == 0) {
    195      1.1  cgd 		    cs = ccre;
    196      1.1  cgd 		    *cs = STR;
    197      1.1  cgd 		    SCNT(cs) = 1;
    198      1.1  cgd 		    ccre += 2;
    199      1.1  cgd 		} else
    200      1.1  cgd 		    SCNT(cs)++;
    201      1.1  cgd 		*ccre++ = c;
    202      1.1  cgd 		break;
    203      1.1  cgd 
    204      1.1  cgd 	    /* normal(?) metacharacters */
    205      1.1  cgd 	    case 'a':
    206      1.1  cgd 	    case 'd':
    207      1.1  cgd 	    case 'e':
    208      1.1  cgd 	    case 'p':
    209      1.1  cgd 		if (acs != NIL && acs != cs) {
    210      1.1  cgd 		    do {
    211      1.1  cgd 			temp = OCNT(acs);
    212      1.1  cgd 			OCNT(acs) = ccre - acs;
    213      1.1  cgd 			acs -= temp;
    214      1.1  cgd 		    } while (temp != 0);
    215      1.1  cgd 		    acs = NIL;
    216      1.1  cgd 		}
    217      1.1  cgd 		cs = ccre;
    218      1.1  cgd 		*cs = META;
    219      1.1  cgd 		MSYM(cs) = c;
    220      1.1  cgd 		ccre = MNEXT(cs);
    221      1.1  cgd 		break;
    222      1.1  cgd 	    }
    223      1.1  cgd 	    break;
    224      1.1  cgd 
    225      1.1  cgd 	/* just put the symbol in */
    226      1.1  cgd 	case '^':
    227      1.1  cgd 	case '$':
    228      1.1  cgd 	    if (acs != NIL && acs != cs) {
    229      1.1  cgd 		do {
    230      1.1  cgd 		    temp = OCNT(acs);
    231      1.1  cgd 		    OCNT(acs) = ccre - acs;
    232      1.1  cgd 		    acs -= temp;
    233      1.1  cgd 		} while (temp != 0);
    234      1.1  cgd 		acs = NIL;
    235      1.1  cgd 	    }
    236      1.1  cgd 	    cs = ccre;
    237      1.1  cgd 	    *cs = META;
    238      1.1  cgd 	    MSYM(cs) = c;
    239      1.1  cgd 	    ccre = MNEXT(cs);
    240      1.1  cgd 	    break;
    241      1.1  cgd 
    242      1.1  cgd 	/* mark the last match sequence as optional */
    243      1.1  cgd 	case '?':
    244      1.1  cgd 	    if (cs)
    245      1.1  cgd 	    	*cs = *cs | OPT;
    246      1.1  cgd 	    break;
    247      1.1  cgd 
    248      1.1  cgd 	/* recurse and define a subexpression */
    249      1.1  cgd 	case '(':
    250      1.1  cgd 	    if (acs != NIL && acs != cs) {
    251      1.1  cgd 		do {
    252      1.1  cgd 		    temp = OCNT(acs);
    253      1.1  cgd 		    OCNT(acs) = ccre - acs;
    254      1.1  cgd 		    acs -= temp;
    255      1.1  cgd 		} while (temp != 0);
    256      1.1  cgd 		acs = NIL;
    257      1.1  cgd 	    }
    258      1.1  cgd 	    cs = ccre;
    259      1.1  cgd 	    *cs = OPER;
    260      1.1  cgd 	    OSYM(cs) = '(';
    261      1.1  cgd 	    ccre = ONEXT(cs);
    262      1.1  cgd 	    expconv ();
    263      1.1  cgd 	    OCNT(cs) = ccre - cs;		/* offset to next symbol */
    264      1.1  cgd 	    break;
    265      1.1  cgd 
    266  1.1.1.1  jtc 	/* reurn from a recursion */
    267      1.1  cgd 	case ')':
    268      1.1  cgd 	    if (acs != NIL) {
    269      1.1  cgd 		do {
    270      1.1  cgd 		    temp = OCNT(acs);
    271      1.1  cgd 		    OCNT(acs) = ccre - acs;
    272      1.1  cgd 		    acs -= temp;
    273      1.1  cgd 		} while (temp != 0);
    274      1.1  cgd 		acs = NIL;
    275      1.1  cgd 	    }
    276      1.1  cgd 	    cs = ccre;
    277      1.1  cgd 	    *cs = META;
    278      1.1  cgd 	    MSYM(cs) = c;
    279      1.1  cgd 	    ccre = MNEXT(cs);
    280      1.1  cgd 	    return;
    281      1.1  cgd 
    282      1.1  cgd 	/* mark the last match sequence as having an alternate */
    283      1.1  cgd 	/* the third byte will contain an offset to jump over the */
    284      1.1  cgd 	/* alternate match in case the first did not fail */
    285      1.1  cgd 	case '|':
    286      1.1  cgd 	    if (acs != NIL && acs != cs)
    287      1.1  cgd 		OCNT(ccre) = ccre - acs;	/* make a back pointer */
    288      1.1  cgd 	    else
    289      1.1  cgd 		OCNT(ccre) = 0;
    290      1.1  cgd 	    *cs |= ALT;
    291      1.1  cgd 	    cs = ccre;
    292      1.1  cgd 	    *cs = OPER;
    293      1.1  cgd 	    OSYM(cs) = '|';
    294      1.1  cgd 	    ccre = ONEXT(cs);
    295      1.1  cgd 	    acs = cs;	/* remember that the pointer is to be filles */
    296      1.1  cgd 	    break;
    297      1.1  cgd 
    298      1.1  cgd 	/* if its not a metasymbol just build a scharacter string */
    299      1.1  cgd 	default:
    300      1.1  cgd 	    if (cs == NIL || (*cs & STR) == 0) {
    301      1.1  cgd 		cs = ccre;
    302      1.1  cgd 		*cs = STR;
    303      1.1  cgd 		SCNT(cs) = 1;
    304      1.1  cgd 		ccre = SSTR(cs);
    305      1.1  cgd 	    } else
    306      1.1  cgd 		SCNT(cs)++;
    307      1.1  cgd 	    *ccre++ = c;
    308      1.1  cgd 	    break;
    309      1.1  cgd 	}
    310      1.1  cgd     }
    311      1.1  cgd     if (acs != NIL) {
    312      1.1  cgd 	do {
    313      1.1  cgd 	    temp = OCNT(acs);
    314      1.1  cgd 	    OCNT(acs) = ccre - acs;
    315      1.1  cgd 	    acs -= temp;
    316      1.1  cgd 	} while (temp != 0);
    317      1.1  cgd 	acs = NIL;
    318      1.1  cgd     }
    319      1.1  cgd     return;
    320      1.1  cgd }
    321      1.1  cgd /* end of convertre */
    322      1.1  cgd 
    323      1.1  cgd 
    324      1.1  cgd /*
    325      1.1  cgd  *	The following routine recognises an irregular expresion
    326      1.1  cgd  *	with the following special characters:
    327      1.1  cgd  *
    328      1.1  cgd  *		\?	-	means last match was optional
    329      1.1  cgd  *		\a	-	matches any number of characters
    330      1.1  cgd  *		\d	-	matches any number of spaces and tabs
    331      1.1  cgd  *		\p	-	matches any number of alphanumeric
    332      1.1  cgd  *				characters. The
    333      1.1  cgd  *				characters matched will be copied into
    334      1.1  cgd  *				the area pointed to by 'name'.
    335      1.1  cgd  *		\|	-	alternation
    336      1.1  cgd  *		\( \)	-	grouping used mostly for alternation and
    337      1.1  cgd  *				optionality
    338      1.1  cgd  *
    339      1.1  cgd  *	The irregular expression must be translated to internal form
    340      1.1  cgd  *	prior to calling this routine
    341      1.1  cgd  *
    342      1.1  cgd  *	The value returned is the pointer to the first non \a
    343      1.1  cgd  *	character matched.
    344      1.1  cgd  */
    345      1.1  cgd 
    346      1.1  cgd char *
    347      1.1  cgd expmatch (s, re, mstring)
    348      1.1  cgd     register char *s;		/* string to check for a match in */
    349      1.1  cgd     register char *re;		/* a converted irregular expression */
    350      1.1  cgd     register char *mstring;	/* where to put whatever matches a \p */
    351      1.1  cgd {
    352      1.1  cgd     register char *cs;		/* the current symbol */
    353      1.1  cgd     register char *ptr,*s1;	/* temporary pointer */
    354      1.1  cgd     boolean matched;		/* a temporary boolean */
    355      1.1  cgd 
    356      1.1  cgd     /* initial conditions */
    357      1.1  cgd     if (re == NIL)
    358      1.1  cgd 	return (NIL);
    359      1.1  cgd     cs = re;
    360      1.1  cgd     matched = FALSE;
    361      1.1  cgd 
    362      1.1  cgd     /* loop till expression string is exhausted (or at least pretty tired) */
    363      1.1  cgd     while (*cs) {
    364      1.1  cgd 	switch (*cs & (OPER | STR | META)) {
    365      1.1  cgd 
    366      1.1  cgd 	/* try to match a string */
    367      1.1  cgd 	case STR:
    368      1.1  cgd 	    matched = !STRNCMP (s, SSTR(cs), SCNT(cs));
    369      1.1  cgd 	    if (matched) {
    370      1.1  cgd 
    371      1.1  cgd 		/* hoorah it matches */
    372      1.1  cgd 		s += SCNT(cs);
    373      1.1  cgd 		cs = SNEXT(cs);
    374      1.1  cgd 	    } else if (*cs & ALT) {
    375      1.1  cgd 
    376      1.1  cgd 		/* alternation, skip to next expression */
    377      1.1  cgd 		cs = SNEXT(cs);
    378      1.1  cgd 	    } else if (*cs & OPT) {
    379      1.1  cgd 
    380      1.1  cgd 		/* the match is optional */
    381      1.1  cgd 		cs = SNEXT(cs);
    382      1.1  cgd 		matched = 1;		/* indicate a successful match */
    383      1.1  cgd 	    } else {
    384      1.1  cgd 
    385      1.1  cgd 		/* no match, error return */
    386      1.1  cgd 		return (NIL);
    387      1.1  cgd 	    }
    388      1.1  cgd 	    break;
    389      1.1  cgd 
    390      1.1  cgd 	/* an operator, do something fancy */
    391      1.1  cgd 	case OPER:
    392      1.1  cgd 	    switch (OSYM(cs)) {
    393      1.1  cgd 
    394      1.1  cgd 	    /* this is an alternation */
    395      1.1  cgd 	    case '|':
    396      1.1  cgd 		if (matched)
    397      1.1  cgd 
    398      1.1  cgd 		    /* last thing in the alternation was a match, skip ahead */
    399      1.1  cgd 		    cs = OPTR(cs);
    400      1.1  cgd 		else
    401      1.1  cgd 
    402      1.1  cgd 		    /* no match, keep trying */
    403      1.1  cgd 		    cs = ONEXT(cs);
    404      1.1  cgd 		break;
    405      1.1  cgd 
    406      1.1  cgd 	    /* this is a grouping, recurse */
    407      1.1  cgd 	    case '(':
    408      1.1  cgd 		ptr = expmatch (s, ONEXT(cs), mstring);
    409      1.1  cgd 		if (ptr != NIL) {
    410      1.1  cgd 
    411      1.1  cgd 		    /* the subexpression matched */
    412      1.1  cgd 		    matched = 1;
    413      1.1  cgd 		    s = ptr;
    414      1.1  cgd 		} else if (*cs & ALT) {
    415      1.1  cgd 
    416      1.1  cgd 		    /* alternation, skip to next expression */
    417      1.1  cgd 		    matched = 0;
    418      1.1  cgd 		} else if (*cs & OPT) {
    419      1.1  cgd 
    420      1.1  cgd 		    /* the match is optional */
    421      1.1  cgd 		    matched = 1;	/* indicate a successful match */
    422      1.1  cgd 		} else {
    423      1.1  cgd 
    424      1.1  cgd 		    /* no match, error return */
    425      1.1  cgd 		    return (NIL);
    426      1.1  cgd 		}
    427      1.1  cgd 		cs = OPTR(cs);
    428      1.1  cgd 		break;
    429      1.1  cgd 	    }
    430      1.1  cgd 	    break;
    431      1.1  cgd 
    432      1.1  cgd 	/* try to match a metasymbol */
    433      1.1  cgd 	case META:
    434      1.1  cgd 	    switch (MSYM(cs)) {
    435      1.1  cgd 
    436      1.1  cgd 	    /* try to match anything and remember what was matched */
    437      1.1  cgd 	    case 'p':
    438      1.1  cgd 		/*
    439      1.1  cgd 		 *  This is really the same as trying the match the
    440      1.1  cgd 		 *  remaining parts of the expression to any subset
    441      1.1  cgd 		 *  of the string.
    442      1.1  cgd 		 */
    443      1.1  cgd 		s1 = s;
    444      1.1  cgd 		do {
    445      1.1  cgd 		    ptr = expmatch (s1, MNEXT(cs), mstring);
    446      1.1  cgd 		    if (ptr != NIL && s1 != s) {
    447      1.1  cgd 
    448      1.1  cgd 			/* we have a match, remember the match */
    449      1.1  cgd 			strncpy (mstring, s, s1 - s);
    450      1.1  cgd 			mstring[s1 - s] = '\0';
    451      1.1  cgd 			return (ptr);
    452      1.1  cgd 		    } else if (ptr != NIL && (*cs & OPT)) {
    453      1.1  cgd 
    454      1.1  cgd 			/* it was aoptional so no match is ok */
    455      1.1  cgd 			return (ptr);
    456      1.1  cgd 		    } else if (ptr != NIL) {
    457      1.1  cgd 
    458      1.1  cgd 			/* not optional and we still matched */
    459      1.1  cgd 			return (NIL);
    460      1.1  cgd 		    }
    461      1.1  cgd 		    if (!isalnum(*s1) && *s1 != '_')
    462      1.1  cgd 			return (NIL);
    463      1.1  cgd 		    if (*s1 == '\\')
    464      1.1  cgd 			_escaped = _escaped ? FALSE : TRUE;
    465      1.1  cgd 		    else
    466      1.1  cgd 			_escaped = FALSE;
    467      1.1  cgd 		} while (*s1++);
    468      1.1  cgd 		return (NIL);
    469      1.1  cgd 
    470      1.1  cgd 	    /* try to match anything */
    471      1.1  cgd 	    case 'a':
    472      1.1  cgd 		/*
    473      1.1  cgd 		 *  This is really the same as trying the match the
    474      1.1  cgd 		 *  remaining parts of the expression to any subset
    475      1.1  cgd 		 *  of the string.
    476      1.1  cgd 		 */
    477      1.1  cgd 		s1 = s;
    478      1.1  cgd 		do {
    479      1.1  cgd 		    ptr = expmatch (s1, MNEXT(cs), mstring);
    480      1.1  cgd 		    if (ptr != NIL && s1 != s) {
    481      1.1  cgd 
    482      1.1  cgd 			/* we have a match */
    483      1.1  cgd 			return (ptr);
    484      1.1  cgd 		    } else if (ptr != NIL && (*cs & OPT)) {
    485      1.1  cgd 
    486      1.1  cgd 			/* it was aoptional so no match is ok */
    487      1.1  cgd 			return (ptr);
    488      1.1  cgd 		    } else if (ptr != NIL) {
    489      1.1  cgd 
    490      1.1  cgd 			/* not optional and we still matched */
    491      1.1  cgd 			return (NIL);
    492      1.1  cgd 		    }
    493      1.1  cgd 		    if (*s1 == '\\')
    494      1.1  cgd 			_escaped = _escaped ? FALSE : TRUE;
    495      1.1  cgd 		    else
    496      1.1  cgd 			_escaped = FALSE;
    497      1.1  cgd 		} while (*s1++);
    498      1.1  cgd 		return (NIL);
    499      1.1  cgd 
    500      1.1  cgd 	    /* fail if we are currently _escaped */
    501      1.1  cgd 	    case 'e':
    502      1.1  cgd 		if (_escaped)
    503      1.1  cgd 		    return(NIL);
    504      1.1  cgd 		cs = MNEXT(cs);
    505      1.1  cgd 		break;
    506      1.1  cgd 
    507      1.1  cgd 	    /* match any number of tabs and spaces */
    508      1.1  cgd 	    case 'd':
    509      1.1  cgd 		ptr = s;
    510      1.1  cgd 		while (*s == ' ' || *s == '\t')
    511      1.1  cgd 		    s++;
    512      1.1  cgd 		if (s != ptr || s == _start) {
    513      1.1  cgd 
    514      1.1  cgd 		    /* match, be happy */
    515      1.1  cgd 		    matched = 1;
    516      1.1  cgd 		    cs = MNEXT(cs);
    517      1.1  cgd 		} else if (*s == '\n' || *s == '\0') {
    518      1.1  cgd 
    519      1.1  cgd 		    /* match, be happy */
    520      1.1  cgd 		    matched = 1;
    521      1.1  cgd 		    cs = MNEXT(cs);
    522      1.1  cgd 		} else if (*cs & ALT) {
    523      1.1  cgd 
    524      1.1  cgd 		    /* try the next part */
    525      1.1  cgd 		    matched = 0;
    526      1.1  cgd 		    cs = MNEXT(cs);
    527      1.1  cgd 		} else if (*cs & OPT) {
    528      1.1  cgd 
    529      1.1  cgd 		    /* doesn't matter */
    530      1.1  cgd 		    matched = 1;
    531      1.1  cgd 		    cs = MNEXT(cs);
    532      1.1  cgd 		} else
    533      1.1  cgd 
    534      1.1  cgd 		    /* no match, error return */
    535      1.1  cgd 		    return (NIL);
    536      1.1  cgd 		break;
    537      1.1  cgd 
    538      1.1  cgd 	    /* check for end of line */
    539      1.1  cgd 	    case '$':
    540      1.1  cgd 		if (*s == '\0' || *s == '\n') {
    541      1.1  cgd 
    542      1.1  cgd 		    /* match, be happy */
    543      1.1  cgd 		    s++;
    544      1.1  cgd 		    matched = 1;
    545      1.1  cgd 		    cs = MNEXT(cs);
    546      1.1  cgd 		} else if (*cs & ALT) {
    547      1.1  cgd 
    548      1.1  cgd 		    /* try the next part */
    549      1.1  cgd 		    matched = 0;
    550      1.1  cgd 		    cs = MNEXT(cs);
    551      1.1  cgd 		} else if (*cs & OPT) {
    552      1.1  cgd 
    553      1.1  cgd 		    /* doesn't matter */
    554      1.1  cgd 		    matched = 1;
    555      1.1  cgd 		    cs = MNEXT(cs);
    556      1.1  cgd 		} else
    557      1.1  cgd 
    558      1.1  cgd 		    /* no match, error return */
    559      1.1  cgd 		    return (NIL);
    560      1.1  cgd 		break;
    561      1.1  cgd 
    562      1.1  cgd 	    /* check for start of line */
    563      1.1  cgd 	    case '^':
    564      1.1  cgd 		if (s == _start) {
    565      1.1  cgd 
    566      1.1  cgd 		    /* match, be happy */
    567      1.1  cgd 		    matched = 1;
    568      1.1  cgd 		    cs = MNEXT(cs);
    569      1.1  cgd 		} else if (*cs & ALT) {
    570      1.1  cgd 
    571      1.1  cgd 		    /* try the next part */
    572      1.1  cgd 		    matched = 0;
    573      1.1  cgd 		    cs = MNEXT(cs);
    574      1.1  cgd 		} else if (*cs & OPT) {
    575      1.1  cgd 
    576      1.1  cgd 		    /* doesn't matter */
    577      1.1  cgd 		    matched = 1;
    578      1.1  cgd 		    cs = MNEXT(cs);
    579      1.1  cgd 		} else
    580      1.1  cgd 
    581      1.1  cgd 		    /* no match, error return */
    582      1.1  cgd 		    return (NIL);
    583      1.1  cgd 		break;
    584      1.1  cgd 
    585      1.1  cgd 	    /* end of a subexpression, return success */
    586      1.1  cgd 	    case ')':
    587      1.1  cgd 		return (s);
    588      1.1  cgd 	    }
    589      1.1  cgd 	    break;
    590      1.1  cgd 	}
    591      1.1  cgd     }
    592      1.1  cgd     return (s);
    593      1.1  cgd }
    594