Home | History | Annotate | Line # | Download | only in make
dir.c revision 1.87
      1 /*	$NetBSD: dir.c,v 1.87 2020/08/10 19:53:19 rillig Exp $	*/
      2 
      3 /*
      4  * Copyright (c) 1988, 1989, 1990 The Regents of the University of California.
      5  * All rights reserved.
      6  *
      7  * This code is derived from software contributed to Berkeley by
      8  * Adam de Boor.
      9  *
     10  * Redistribution and use in source and binary forms, with or without
     11  * modification, are permitted provided that the following conditions
     12  * are met:
     13  * 1. Redistributions of source code must retain the above copyright
     14  *    notice, this list of conditions and the following disclaimer.
     15  * 2. Redistributions in binary form must reproduce the above copyright
     16  *    notice, this list of conditions and the following disclaimer in the
     17  *    documentation and/or other materials provided with the distribution.
     18  * 3. Neither the name of the University nor the names of its contributors
     19  *    may be used to endorse or promote products derived from this software
     20  *    without specific prior written permission.
     21  *
     22  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     23  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     24  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     25  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     26  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     27  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     28  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     29  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     30  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     31  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     32  * SUCH DAMAGE.
     33  */
     34 
     35 /*
     36  * Copyright (c) 1988, 1989 by Adam de Boor
     37  * Copyright (c) 1989 by Berkeley Softworks
     38  * All rights reserved.
     39  *
     40  * This code is derived from software contributed to Berkeley by
     41  * Adam de Boor.
     42  *
     43  * Redistribution and use in source and binary forms, with or without
     44  * modification, are permitted provided that the following conditions
     45  * are met:
     46  * 1. Redistributions of source code must retain the above copyright
     47  *    notice, this list of conditions and the following disclaimer.
     48  * 2. Redistributions in binary form must reproduce the above copyright
     49  *    notice, this list of conditions and the following disclaimer in the
     50  *    documentation and/or other materials provided with the distribution.
     51  * 3. All advertising materials mentioning features or use of this software
     52  *    must display the following acknowledgement:
     53  *	This product includes software developed by the University of
     54  *	California, Berkeley and its contributors.
     55  * 4. Neither the name of the University nor the names of its contributors
     56  *    may be used to endorse or promote products derived from this software
     57  *    without specific prior written permission.
     58  *
     59  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
     60  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     61  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     62  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
     63  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
     64  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
     65  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
     66  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
     67  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     68  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     69  * SUCH DAMAGE.
     70  */
     71 
     72 #ifndef MAKE_NATIVE
     73 static char rcsid[] = "$NetBSD: dir.c,v 1.87 2020/08/10 19:53:19 rillig Exp $";
     74 #else
     75 #include <sys/cdefs.h>
     76 #ifndef lint
     77 #if 0
     78 static char sccsid[] = "@(#)dir.c	8.2 (Berkeley) 1/2/94";
     79 #else
     80 __RCSID("$NetBSD: dir.c,v 1.87 2020/08/10 19:53:19 rillig Exp $");
     81 #endif
     82 #endif /* not lint */
     83 #endif
     84 
     85 /*-
     86  * dir.c --
     87  *	Directory searching using wildcards and/or normal names...
     88  *	Used both for source wildcarding in the Makefile and for finding
     89  *	implicit sources.
     90  *
     91  * The interface for this module is:
     92  *	Dir_Init  	    Initialize the module.
     93  *
     94  *	Dir_InitCur	    Set the cur Path.
     95  *
     96  *	Dir_InitDot	    Set the dot Path.
     97  *
     98  *	Dir_End  	    Cleanup the module.
     99  *
    100  *	Dir_SetPATH	    Set ${.PATH} to reflect state of dirSearchPath.
    101  *
    102  *	Dir_HasWildcards    Returns TRUE if the name given it needs to
    103  *	    	  	    be wildcard-expanded.
    104  *
    105  *	Dir_Expand	    Given a pattern and a path, return a Lst of names
    106  *	    	  	    which match the pattern on the search path.
    107  *
    108  *	Dir_FindFile	    Searches for a file on a given search path.
    109  *	    	  	    If it exists, the entire path is returned.
    110  *	    	  	    Otherwise NULL is returned.
    111  *
    112  *	Dir_FindHereOrAbove Search for a path in the current directory and
    113  *			    then all the directories above it in turn until
    114  *			    the path is found or we reach the root ("/").
    115  *
    116  *	Dir_MTime 	    Return the modification time of a node. The file
    117  *	    	  	    is searched for along the default search path.
    118  *	    	  	    The path and mtime fields of the node are filled
    119  *	    	  	    in.
    120  *
    121  *	Dir_AddDir	    Add a directory to a search path.
    122  *
    123  *	Dir_MakeFlags	    Given a search path and a command flag, create
    124  *	    	  	    a string with each of the directories in the path
    125  *	    	  	    preceded by the command flag and all of them
    126  *	    	  	    separated by a space.
    127  *
    128  *	Dir_Destroy	    Destroy an element of a search path. Frees up all
    129  *	    	  	    things that can be freed for the element as long
    130  *	    	  	    as the element is no longer referenced by any other
    131  *	    	  	    search path.
    132  *	Dir_ClearPath	    Resets a search path to the empty list.
    133  *
    134  * For debugging:
    135  *	Dir_PrintDirectories	Print stats about the directory cache.
    136  */
    137 
    138 #include <sys/types.h>
    139 #include <sys/stat.h>
    140 
    141 #include <dirent.h>
    142 #include <errno.h>
    143 #include <stdio.h>
    144 
    145 #include "make.h"
    146 #include "hash.h"
    147 #include "dir.h"
    148 #include "job.h"
    149 
    150 /*
    151  *	A search path consists of a Lst of Path structures. A Path structure
    152  *	has in it the name of the directory and a hash table of all the files
    153  *	in the directory. This is used to cut down on the number of system
    154  *	calls necessary to find implicit dependents and their like. Since
    155  *	these searches are made before any actions are taken, we need not
    156  *	worry about the directory changing due to creation commands. If this
    157  *	hampers the style of some makefiles, they must be changed.
    158  *
    159  *	A list of all previously-read directories is kept in the
    160  *	openDirectories Lst. This list is checked first before a directory
    161  *	is opened.
    162  *
    163  *	The need for the caching of whole directories is brought about by
    164  *	the multi-level transformation code in suff.c, which tends to search
    165  *	for far more files than regular make does. In the initial
    166  *	implementation, the amount of time spent performing "stat" calls was
    167  *	truly astronomical. The problem with hashing at the start is,
    168  *	of course, that pmake doesn't then detect changes to these directories
    169  *	during the course of the make. Three possibilities suggest themselves:
    170  *
    171  *	    1) just use stat to test for a file's existence. As mentioned
    172  *	       above, this is very inefficient due to the number of checks
    173  *	       engendered by the multi-level transformation code.
    174  *	    2) use readdir() and company to search the directories, keeping
    175  *	       them open between checks. I have tried this and while it
    176  *	       didn't slow down the process too much, it could severely
    177  *	       affect the amount of parallelism available as each directory
    178  *	       open would take another file descriptor out of play for
    179  *	       handling I/O for another job. Given that it is only recently
    180  *	       that UNIX OS's have taken to allowing more than 20 or 32
    181  *	       file descriptors for a process, this doesn't seem acceptable
    182  *	       to me.
    183  *	    3) record the mtime of the directory in the Path structure and
    184  *	       verify the directory hasn't changed since the contents were
    185  *	       hashed. This will catch the creation or deletion of files,
    186  *	       but not the updating of files. However, since it is the
    187  *	       creation and deletion that is the problem, this could be
    188  *	       a good thing to do. Unfortunately, if the directory (say ".")
    189  *	       were fairly large and changed fairly frequently, the constant
    190  *	       rehashing could seriously degrade performance. It might be
    191  *	       good in such cases to keep track of the number of rehashes
    192  *	       and if the number goes over a (small) limit, resort to using
    193  *	       stat in its place.
    194  *
    195  *	An additional thing to consider is that pmake is used primarily
    196  *	to create C programs and until recently pcc-based compilers refused
    197  *	to allow you to specify where the resulting object file should be
    198  *	placed. This forced all objects to be created in the current
    199  *	directory. This isn't meant as a full excuse, just an explanation of
    200  *	some of the reasons for the caching used here.
    201  *
    202  *	One more note: the location of a target's file is only performed
    203  *	on the downward traversal of the graph and then only for terminal
    204  *	nodes in the graph. This could be construed as wrong in some cases,
    205  *	but prevents inadvertent modification of files when the "installed"
    206  *	directory for a file is provided in the search path.
    207  *
    208  *	Another data structure maintained by this module is an mtime
    209  *	cache used when the searching of cached directories fails to find
    210  *	a file. In the past, Dir_FindFile would simply perform an access()
    211  *	call in such a case to determine if the file could be found using
    212  *	just the name given. When this hit, however, all that was gained
    213  *	was the knowledge that the file existed. Given that an access() is
    214  *	essentially a stat() without the copyout() call, and that the same
    215  *	filesystem overhead would have to be incurred in Dir_MTime, it made
    216  *	sense to replace the access() with a stat() and record the mtime
    217  *	in a cache for when Dir_MTime was actually called.
    218  */
    219 
Lst dirSearchPath;		/* main search path */

static Lst openDirectories;	/* the list of all open directories */

/*
 * Variables for gathering statistics on the efficiency of the hashing
 * mechanism.
 */
static int hits;		/* Found in directory cache */
static int misses;		/* Sad, but not evil misses */
static int nearmisses;		/* Found under search path */
static int bigmisses;		/* Sought by itself */

static Path *dot;		/* contents of current directory; set by
				 * Dir_InitDot() */
static Path *cur;		/* contents of current directory, if not dot;
				 * set by Dir_InitCur() */
static Path *dotLast;		/* a fake path entry (named ".DOTLAST")
				 * indicating we need to look for . last */

/* Results of doing a last-resort stat in Dir_FindFile -- if we have to go to
 * the system to find the file, we might as well have its mtime on record.
 * This table backs cached_stat().
 *
 * XXX: If this is done way early, there's a chance other rules will have
 * already updated the file, in which case we'll update it again. Generally,
 * there won't be two rules to update a single file, so this should be ok,
 * but... */
static Hash_Table mtimes;

static Hash_Table lmtimes;	/* same as mtimes but for lstat; backs
				 * cached_lstat() */

/* Forward declarations of the file-local helpers. */
static int DirFindName(const void *, const void *);
static int DirMatchFiles(const char *, Path *, Lst);
static void DirExpandCurly(const char *, const char *, Lst, Lst);
static void DirExpandInt(const char *, Lst, Lst);
static int DirPrintWord(void *, void *);
static int DirPrintDir(void *, void *);
static char *DirLookup(Path *, const char *, const char *, Boolean);
static char *DirLookupSubdir(Path *, const char *);
static char *DirFindDot(Boolean, const char *, const char *);
static char *DirLookupAbs(Path *, const char *, const char *);
    259 
    260 
/*
 * We use stat(2) a lot, so cache the results.
 * The modification time and the mode are all we care about.
 *
 * One cache_st is hung off the clientPtr of each entry in the stat caches.
 * A time of 0 means "nothing cached for this kind of call yet"; a real
 * mtime of 0 is stored as 1 by cached_stats() to keep that distinction.
 */
struct cache_st {
    time_t lmtime;		/* lstat */
    time_t mtime;		/* stat */
    mode_t mode;		/* st_mode of the most recent system call */
};

/* minimize changes below */
/* Flag bits for the 'flags' argument of cached_stats(). */
#define CST_LSTAT 1		/* use lstat(2) and the lmtime slot */
#define CST_UPDATE 2		/* skip the cached value, ask the system */
    274 
    275 static int
    276 cached_stats(Hash_Table *htp, const char *pathname, struct stat *st, int flags)
    277 {
    278     Hash_Entry *entry;
    279     struct cache_st *cst;
    280     int rc;
    281 
    282     if (!pathname || !pathname[0])
    283 	return -1;
    284 
    285     entry = Hash_FindEntry(htp, pathname);
    286 
    287     if (entry && (flags & CST_UPDATE) == 0) {
    288 	cst = entry->clientPtr;
    289 
    290 	memset(st, 0, sizeof(*st));
    291 	st->st_mode = cst->mode;
    292 	st->st_mtime = (flags & CST_LSTAT) ? cst->lmtime : cst->mtime;
    293 	if (st->st_mtime) {
    294 	    if (DEBUG(DIR)) {
    295 		fprintf(debug_file, "Using cached time %s for %s\n",
    296 			Targ_FmtTime(st->st_mtime), pathname);
    297 	    }
    298 	    return 0;
    299 	}
    300     }
    301 
    302     rc = (flags & CST_LSTAT) ? lstat(pathname, st) : stat(pathname, st);
    303     if (rc == -1)
    304 	return -1;
    305 
    306     if (st->st_mtime == 0)
    307 	st->st_mtime = 1;	/* avoid confusion with missing file */
    308 
    309     if (!entry)
    310 	entry = Hash_CreateEntry(htp, pathname, NULL);
    311     if (!entry->clientPtr) {
    312 	entry->clientPtr = bmake_malloc(sizeof(*cst));
    313 	memset(entry->clientPtr, 0, sizeof(*cst));
    314     }
    315     cst = entry->clientPtr;
    316     if ((flags & CST_LSTAT)) {
    317 	cst->lmtime = st->st_mtime;
    318     } else {
    319 	cst->mtime = st->st_mtime;
    320     }
    321     cst->mode = st->st_mode;
    322     if (DEBUG(DIR)) {
    323 	fprintf(debug_file, "   Caching %s for %s\n",
    324 		Targ_FmtTime(st->st_mtime), pathname);
    325     }
    326 
    327     return 0;
    328 }
    329 
    330 int
    331 cached_stat(const char *pathname, void *st)
    332 {
    333     return cached_stats(&mtimes, pathname, st, 0);
    334 }
    335 
    336 int
    337 cached_lstat(const char *pathname, void *st)
    338 {
    339     return cached_stats(&lmtimes, pathname, st, CST_LSTAT);
    340 }
    341 
    342 /*-
    343  *-----------------------------------------------------------------------
    344  * Dir_Init --
    345  *	initialize things for this module
    346  *
    347  * Results:
    348  *	none
    349  *
    350  * Side Effects:
    351  *	some directories may be opened.
    352  *-----------------------------------------------------------------------
    353  */
    354 void
    355 Dir_Init(const char *cdname)
    356 {
    357     if (!cdname) {
    358 	dirSearchPath = Lst_Init(FALSE);
    359 	openDirectories = Lst_Init(FALSE);
    360 	Hash_InitTable(&mtimes, 0);
    361 	Hash_InitTable(&lmtimes, 0);
    362 	return;
    363     }
    364     Dir_InitCur(cdname);
    365 
    366     dotLast = bmake_malloc(sizeof(Path));
    367     dotLast->refCount = 1;
    368     dotLast->hits = 0;
    369     dotLast->name = bmake_strdup(".DOTLAST");
    370     Hash_InitTable(&dotLast->files, -1);
    371 }
    372 
    373 /*
    374  * Called by Dir_Init() and whenever .CURDIR is assigned to.
    375  */
    376 void
    377 Dir_InitCur(const char *cdname)
    378 {
    379     Path *p;
    380 
    381     if (cdname != NULL) {
    382 	/*
    383 	 * Our build directory is not the same as our source directory.
    384 	 * Keep this one around too.
    385 	 */
    386 	if ((p = Dir_AddDir(NULL, cdname))) {
    387 	    p->refCount += 1;
    388 	    if (cur && cur != p) {
    389 		/*
    390 		 * We've been here before, cleanup.
    391 		 */
    392 		cur->refCount -= 1;
    393 		Dir_Destroy(cur);
    394 	    }
    395 	    cur = p;
    396 	}
    397     }
    398 }
    399 
    400 /*-
    401  *-----------------------------------------------------------------------
    402  * Dir_InitDot --
    403  *	(re)initialize "dot" (current/object directory) path hash
    404  *
    405  * Results:
    406  *	none
    407  *
    408  * Side Effects:
    409  *	some directories may be opened.
    410  *-----------------------------------------------------------------------
    411  */
    412 void
    413 Dir_InitDot(void)
    414 {
    415     if (dot != NULL) {
    416 	LstNode ln;
    417 
    418 	/* Remove old entry from openDirectories, but do not destroy. */
    419 	ln = Lst_Member(openDirectories, dot);
    420 	(void)Lst_Remove(openDirectories, ln);
    421     }
    422 
    423     dot = Dir_AddDir(NULL, ".");
    424 
    425     if (dot == NULL) {
    426 	Error("Cannot open `.' (%s)", strerror(errno));
    427 	exit(1);
    428     }
    429 
    430     /*
    431      * We always need to have dot around, so we increment its reference count
    432      * to make sure it's not destroyed.
    433      */
    434     dot->refCount += 1;
    435     Dir_SetPATH();		/* initialize */
    436 }
    437 
/*-
 *-----------------------------------------------------------------------
 * Dir_End --
 *	Clean up this module. All work is compiled in only when CLEANUP
 *	is defined; otherwise the function does nothing.
 *
 *	The extra references held on "cur", "dot" and ".DOTLAST" are
 *	dropped and the entries destroyed, both directory lists are
 *	cleared and destroyed, and BOTH stat caches set up by Dir_Init()
 *	(mtimes and lmtimes) are deleted.
 *
 * Results:
 *	none
 *
 * Side Effects:
 *	none
 *-----------------------------------------------------------------------
 */
void
Dir_End(void)
{
#ifdef CLEANUP
    if (cur) {
	cur->refCount -= 1;
	Dir_Destroy(cur);
    }
    dot->refCount -= 1;
    dotLast->refCount -= 1;
    Dir_Destroy(dotLast);
    Dir_Destroy(dot);
    Dir_ClearPath(dirSearchPath);
    Lst_Destroy(dirSearchPath, NULL);
    Dir_ClearPath(openDirectories);
    Lst_Destroy(openDirectories, NULL);
    Hash_DeleteTable(&mtimes);
    /* lmtimes is initialized alongside mtimes; release it as well. */
    Hash_DeleteTable(&lmtimes);
#endif
}
    469 
    470 /*
    471  * We want ${.PATH} to indicate the order in which we will actually
    472  * search, so we rebuild it after any .PATH: target.
    473  * This is the simplest way to deal with the effect of .DOTLAST.
    474  */
    475 void
    476 Dir_SetPATH(void)
    477 {
    478     LstNode ln;			/* a list element */
    479     Path *p;
    480     Boolean hasLastDot = FALSE;	/* true we should search dot last */
    481 
    482     Var_Delete(".PATH", VAR_GLOBAL);
    483 
    484     if (Lst_Open(dirSearchPath) == SUCCESS) {
    485 	if ((ln = Lst_First(dirSearchPath)) != NULL) {
    486 	    p = (Path *)Lst_Datum(ln);
    487 	    if (p == dotLast) {
    488 		hasLastDot = TRUE;
    489 		Var_Append(".PATH", dotLast->name, VAR_GLOBAL);
    490 	    }
    491 	}
    492 
    493 	if (!hasLastDot) {
    494 	    if (dot)
    495 		Var_Append(".PATH", dot->name, VAR_GLOBAL);
    496 	    if (cur)
    497 		Var_Append(".PATH", cur->name, VAR_GLOBAL);
    498 	}
    499 
    500 	while ((ln = Lst_Next(dirSearchPath)) != NULL) {
    501 	    p = (Path *)Lst_Datum(ln);
    502 	    if (p == dotLast)
    503 		continue;
    504 	    if (p == dot && hasLastDot)
    505 		continue;
    506 	    Var_Append(".PATH", p->name, VAR_GLOBAL);
    507 	}
    508 
    509 	if (hasLastDot) {
    510 	    if (dot)
    511 		Var_Append(".PATH", dot->name, VAR_GLOBAL);
    512 	    if (cur)
    513 		Var_Append(".PATH", cur->name, VAR_GLOBAL);
    514 	}
    515 	Lst_Close(dirSearchPath);
    516     }
    517 }
    518 
    519 /*-
    520  *-----------------------------------------------------------------------
    521  * DirFindName --
    522  *	See if the Path structure describes the same directory as the
    523  *	given one by comparing their names. Called from Dir_AddDir via
    524  *	Lst_Find when searching the list of open directories.
    525  *
    526  * Input:
    527  *	p		Current name
    528  *	dname		Desired name
    529  *
    530  * Results:
    531  *	0 if it is the same. Non-zero otherwise
    532  *
    533  * Side Effects:
    534  *	None
    535  *-----------------------------------------------------------------------
    536  */
    537 static int
    538 DirFindName(const void *p, const void *dname)
    539 {
    540     return strcmp(((const Path *)p)->name, dname);
    541 }
    542 
    543 /*-
    544  *-----------------------------------------------------------------------
    545  * Dir_HasWildcards  --
    546  *	see if the given name has any wildcard characters in it
    547  *	be careful not to expand unmatching brackets or braces.
    548  *	XXX: This code is not 100% correct. ([^]] fails etc.)
    549  *	I really don't think that make(1) should be expanding
    550  *	patterns, because then you have to set a mechanism for
    551  *	escaping the expansion!
    552  *
    553  * Input:
    554  *	name		name to check
    555  *
    556  * Results:
    557  *	returns TRUE if the word should be expanded, FALSE otherwise
    558  *
    559  * Side Effects:
    560  *	none
    561  *-----------------------------------------------------------------------
    562  */
    563 Boolean
    564 Dir_HasWildcards(char *name)
    565 {
    566     char *cp;
    567     int wild = 0, brace = 0, bracket = 0;
    568 
    569     for (cp = name; *cp; cp++) {
    570 	switch (*cp) {
    571 	case '{':
    572 	    brace++;
    573 	    wild = 1;
    574 	    break;
    575 	case '}':
    576 	    brace--;
    577 	    break;
    578 	case '[':
    579 	    bracket++;
    580 	    wild = 1;
    581 	    break;
    582 	case ']':
    583 	    bracket--;
    584 	    break;
    585 	case '?':
    586 	case '*':
    587 	    wild = 1;
    588 	    break;
    589 	default:
    590 	    break;
    591 	}
    592     }
    593     return wild && bracket == 0 && brace == 0;
    594 }
    595 
    596 /*-
    597  *-----------------------------------------------------------------------
    598  * DirMatchFiles --
    599  * 	Given a pattern and a Path structure, see if any files
    600  *	match the pattern and add their names to the 'expansions' list if
    601  *	any do. This is incomplete -- it doesn't take care of patterns like
    602  *	src / *src / *.c properly (just *.c on any of the directories), but it
    603  *	will do for now.
    604  *
    605  * Input:
    606  *	pattern		Pattern to look for
    607  *	p		Directory to search
    608  *	expansion	Place to store the results
    609  *
    610  * Results:
    611  *	Always returns 0
    612  *
    613  * Side Effects:
    614  *	File names are added to the expansions lst. The directory will be
    615  *	fully hashed when this is done.
    616  *-----------------------------------------------------------------------
    617  */
    618 static int
    619 DirMatchFiles(const char *pattern, Path *p, Lst expansions)
    620 {
    621     Hash_Search search;		/* Index into the directory's table */
    622     Hash_Entry *entry;		/* Current entry in the table */
    623     Boolean isDot;		/* TRUE if the directory being searched is . */
    624 
    625     isDot = (*p->name == '.' && p->name[1] == '\0');
    626 
    627     for (entry = Hash_EnumFirst(&p->files, &search);
    628 	 entry != NULL;
    629 	 entry = Hash_EnumNext(&search))
    630     {
    631 	/*
    632 	 * See if the file matches the given pattern. Note we follow the UNIX
    633 	 * convention that dot files will only be found if the pattern
    634 	 * begins with a dot (note also that as a side effect of the hashing
    635 	 * scheme, .* won't match . or .. since they aren't hashed).
    636 	 */
    637 	if (Str_Match(entry->name, pattern) &&
    638 	    ((entry->name[0] != '.') ||
    639 	     (pattern[0] == '.')))
    640 	{
    641 	    (void)Lst_AtEnd(expansions,
    642 			    (isDot ? bmake_strdup(entry->name) :
    643 			     str_concat3(p->name, "/", entry->name)));
    644 	}
    645     }
    646     return 0;
    647 }
    648 
/*
 * Find the '}' that closes the brace group whose contents start at p,
 * skipping over nested {...} groups. Returns a pointer to that '}', or
 * to the terminating '\0' if the group is never closed.
 */
static const char *
closing_brace(const char *p)
{
    int depth = 0;

    for (; *p != '\0'; p++) {
	if (*p == '{') {
	    depth++;
	} else if (*p == '}') {
	    if (depth == 0)
		break;
	    depth--;
	}
    }
    return p;
}
    662 
/*
 * Find the end of the brace-group piece starting at p: the first ',' or
 * '}' that is not inside a nested {...} group. Returns a pointer to that
 * character, or to the terminating '\0' if there is none.
 */
static const char *
separator_comma(const char *p)
{
    int depth = 0;

    for (; *p != '\0'; p++) {
	if (depth == 0 && (*p == ',' || *p == '}'))
	    break;
	if (*p == '{')
	    depth++;
	else if (*p == '}')
	    depth--;
    }
    return p;
}
    676 
    677 static Boolean
    678 contains_wildcard(const char *p)
    679 {
    680     for (; *p != '\0'; p++) {
    681 	switch (*p) {
    682 	case '*':
    683 	case '?':
    684 	case '{':
    685 	case '[':
    686 	    return TRUE;
    687 	}
    688     }
    689     return FALSE;
    690 }
    691 
/*
 * Join three byte ranges, given as pointer plus length, into one freshly
 * allocated NUL-terminated string. The inputs need not be NUL-terminated.
 * The result comes from bmake_malloc(); DirExpandCurly() releases it
 * with free() or hands it to a list.
 */
static char *
concat3(const char *a, size_t a_len, const char *b, size_t b_len,
	const char *c, size_t c_len)
{
    char *result = bmake_malloc(a_len + b_len + c_len + 1);
    char *out = result;

    memcpy(out, a, a_len);
    out += a_len;
    memcpy(out, b, b_len);
    out += b_len;
    memcpy(out, c, c_len);
    out += c_len;
    *out = '\0';

    return result;
}
    704 
    705 /*-
    706  *-----------------------------------------------------------------------
    707  * DirExpandCurly --
    708  *	Expand curly braces like the C shell. Does this recursively.
    709  *	Note the special case: if after the piece of the curly brace is
    710  *	done there are no wildcard characters in the result, the result is
    711  *	placed on the list WITHOUT CHECKING FOR ITS EXISTENCE.
    712  *
    713  * Input:
    714  *	word		Entire word to expand
    715  *	brace		First curly brace in it
    716  *	path		Search path to use
    717  *	expansions	Place to store the expansions
    718  *
    719  * Results:
    720  *	None.
    721  *
    722  * Side Effects:
    723  *	The given list is filled with the expansions...
    724  *
    725  *-----------------------------------------------------------------------
    726  */
    727 static void
    728 DirExpandCurly(const char *word, const char *brace, Lst path, Lst expansions)
    729 {
    730     /* Split the word into prefix '{' middle '}' suffix. */
    731 
    732     const char *middle = brace + 1;
    733     const char *middle_end = closing_brace(middle);
    734     size_t middle_len = (size_t)(middle_end - middle);
    735     const char *prefix;
    736     size_t prefix_len;
    737     const char *suffix;
    738     size_t suffix_len;
    739     const char *piece;
    740 
    741     if (DEBUG(DIR)) {
    742 	fprintf(debug_file, "%s: word=\"%s\" middle=\"%.*s\"\n",
    743 		__func__, word, (int)middle_len, middle);
    744     }
    745 
    746     if (*middle_end == '\0') {
    747 	Error("Unterminated {} clause \"%s\"", middle);
    748 	return;
    749     }
    750 
    751     prefix = word;
    752     prefix_len = (size_t)(brace - prefix);
    753     suffix = middle_end + 1;
    754     suffix_len = strlen(suffix);
    755 
    756     /* Split the middle into pieces, separated by commas. */
    757 
    758     piece = middle;
    759     while (piece < middle_end + 1) {
    760 	const char *piece_end = separator_comma(piece);
    761 	size_t piece_len = (size_t)(piece_end - piece);
    762 
    763 	char *file = concat3(prefix, prefix_len, piece, piece_len,
    764 			     suffix, suffix_len);
    765 
    766 	if (DEBUG(DIR)) {
    767 	    fprintf(debug_file, "%s: \"%.*s\" + \"%.*s\" + \"%s\" = \"%s\"\n",
    768 		    __func__, (int)prefix_len, prefix, (int)piece_len, piece,
    769 		    suffix, file);
    770 	}
    771 
    772 	if (contains_wildcard(file)) {
    773 	    Dir_Expand(file, path, expansions);
    774 	    free(file);
    775 	} else {
    776 	    (void)Lst_AtEnd(expansions, file);
    777 	}
    778 
    779 	piece = piece_end + 1;	/* skip over the comma or closing brace */
    780     }
    781 }
    782 
    783 
    784 /*-
    785  *-----------------------------------------------------------------------
    786  * DirExpandInt --
    787  *	Internal expand routine. Passes through the directories in the
    788  *	path one by one, calling DirMatchFiles for each. NOTE: This still
    789  *	doesn't handle patterns in directories...
    790  *
    791  * Input:
    792  *	word		Word to expand
    793  *	path		Path on which to look
    794  *	expansions	Place to store the result
    795  *
    796  * Results:
    797  *	None.
    798  *
    799  * Side Effects:
    800  *	Things are added to the expansions list.
    801  *
    802  *-----------------------------------------------------------------------
    803  */
    804 static void
    805 DirExpandInt(const char *word, Lst path, Lst expansions)
    806 {
    807     LstNode ln;			/* Current node */
    808     Path *p;			/* Directory in the node */
    809 
    810     if (Lst_Open(path) == SUCCESS) {
    811 	while ((ln = Lst_Next(path)) != NULL) {
    812 	    p = (Path *)Lst_Datum(ln);
    813 	    DirMatchFiles(word, p, expansions);
    814 	}
    815 	Lst_Close(path);
    816     }
    817 }
    818 
    819 /*-
    820  *-----------------------------------------------------------------------
    821  * DirPrintWord --
    822  *	Print a word in the list of expansions. Callback for Dir_Expand
    823  *	when DEBUG(DIR), via Lst_ForEach.
    824  *
    825  * Results:
    826  *	=== 0
    827  *
    828  * Side Effects:
    829  *	The passed word is printed, followed by a space.
    830  *
    831  *-----------------------------------------------------------------------
    832  */
    833 static int
    834 DirPrintWord(void *word, void *dummy MAKE_ATTR_UNUSED)
    835 {
    836     fprintf(debug_file, "%s ", (char *)word);
    837 
    838     return 0;
    839 }
    840 
    841 /*-
    842  *-----------------------------------------------------------------------
    843  * Dir_Expand  --
    844  *	Expand the given word into a list of words by globbing it looking
    845  *	in the directories on the given search path.
    846  *
    847  * Input:
    848  *	word		the word to expand
    849  *	path		the list of directories in which to find the
    850  *			resulting files
    851  *	expansions	the list on which to place the results
    852  *
    853  * Results:
    854  *	A list of words consisting of the files which exist along the search
    855  *	path matching the given pattern.
    856  *
    857  * Side Effects:
    858  *	Directories may be opened. Who knows?
    859  *	Undefined behavior if the word is really in read-only memory.
    860  *-----------------------------------------------------------------------
    861  */
    862 void
    863 Dir_Expand(const char *word, Lst path, Lst expansions)
    864 {
    865     const char *cp;
    866 
    867     if (DEBUG(DIR)) {
    868 	fprintf(debug_file, "Expanding \"%s\"... ", word);
    869     }
    870 
    871     cp = strchr(word, '{');
    872     if (cp) {
    873 	DirExpandCurly(word, cp, path, expansions);
    874     } else {
    875 	cp = strchr(word, '/');
    876 	if (cp) {
    877 	    /*
    878 	     * The thing has a directory component -- find the first wildcard
    879 	     * in the string.
    880 	     */
    881 	    for (cp = word; *cp; cp++) {
    882 		if (*cp == '?' || *cp == '[' || *cp == '*' || *cp == '{') {
    883 		    break;
    884 		}
    885 	    }
    886 	    if (*cp == '{') {
    887 		/*
    888 		 * This one will be fun.
    889 		 */
    890 		DirExpandCurly(word, cp, path, expansions);
    891 		return;
    892 	    } else if (*cp != '\0') {
    893 		/*
    894 		 * Back up to the start of the component
    895 		 */
    896 		char *dirpath;
    897 
    898 		while (cp > word && *cp != '/') {
    899 		    cp--;
    900 		}
    901 		if (cp != word) {
    902 		    char sc;
    903 		    /*
    904 		     * If the glob isn't in the first component, try and find
    905 		     * all the components up to the one with a wildcard.
    906 		     */
    907 		    sc = cp[1];
    908 		    ((char *)UNCONST(cp))[1] = '\0';
    909 		    dirpath = Dir_FindFile(word, path);
    910 		    ((char *)UNCONST(cp))[1] = sc;
    911 		    /*
    912 		     * dirpath is null if can't find the leading component
    913 		     * XXX: Dir_FindFile won't find internal components.
    914 		     * i.e. if the path contains ../Etc/Object and we're
    915 		     * looking for Etc, it won't be found. Ah well.
    916 		     * Probably not important.
    917 		     */
    918 		    if (dirpath != NULL) {
    919 			char *dp = &dirpath[strlen(dirpath) - 1];
    920 			if (*dp == '/')
    921 			    *dp = '\0';
    922 			path = Lst_Init(FALSE);
    923 			(void)Dir_AddDir(path, dirpath);
    924 			DirExpandInt(cp + 1, path, expansions);
    925 			Lst_Destroy(path, NULL);
    926 		    }
    927 		} else {
    928 		    /*
    929 		     * Start the search from the local directory
    930 		     */
    931 		    DirExpandInt(word, path, expansions);
    932 		}
    933 	    } else {
    934 		/*
    935 		 * Return the file -- this should never happen.
    936 		 */
    937 		DirExpandInt(word, path, expansions);
    938 	    }
    939 	} else {
    940 	    /*
    941 	     * First the files in dot
    942 	     */
    943 	    DirMatchFiles(word, dot, expansions);
    944 
    945 	    /*
    946 	     * Then the files in every other directory on the path.
    947 	     */
    948 	    DirExpandInt(word, path, expansions);
    949 	}
    950     }
    951     if (DEBUG(DIR)) {
    952 	Lst_ForEach(expansions, DirPrintWord, NULL);
    953 	fprintf(debug_file, "\n");
    954     }
    955 }
    956 
    957 /*-
    958  *-----------------------------------------------------------------------
    959  * DirLookup  --
    960  *	Find if the file with the given name exists in the given path.
    961  *
    962  * Results:
    963  *	The path to the file or NULL. This path is guaranteed to be in a
    964  *	different part of memory than name and so may be safely free'd.
    965  *
    966  * Side Effects:
    967  *	None.
    968  *-----------------------------------------------------------------------
    969  */
    970 static char *
    971 DirLookup(Path *p, const char *name MAKE_ATTR_UNUSED, const char *cp,
    972 	  Boolean hasSlash MAKE_ATTR_UNUSED)
    973 {
    974     char *file;			/* the current filename to check */
    975 
    976     if (DEBUG(DIR)) {
    977 	fprintf(debug_file, "   %s ...\n", p->name);
    978     }
    979 
    980     if (Hash_FindEntry(&p->files, cp) == NULL)
    981 	return NULL;
    982 
    983     file = str_concat3(p->name, "/", cp);
    984     if (DEBUG(DIR)) {
    985 	fprintf(debug_file, "   returning %s\n", file);
    986     }
    987     p->hits += 1;
    988     hits += 1;
    989     return file;
    990 }
    991 
    992 
    993 /*-
    994  *-----------------------------------------------------------------------
    995  * DirLookupSubdir  --
    996  *	Find if the file with the given name exists in the given path.
    997  *
    998  * Results:
    999  *	The path to the file or NULL. This path is guaranteed to be in a
   1000  *	different part of memory than name and so may be safely free'd.
   1001  *
   1002  * Side Effects:
   1003  *	If the file is found, it is added in the modification times hash
   1004  *	table.
   1005  *-----------------------------------------------------------------------
   1006  */
   1007 static char *
   1008 DirLookupSubdir(Path *p, const char *name)
   1009 {
   1010     struct stat stb;		/* Buffer for stat, if necessary */
   1011     char *file;			/* the current filename to check */
   1012 
   1013     if (p != dot) {
   1014 	file = str_concat3(p->name, "/", name);
   1015     } else {
   1016 	/*
   1017 	 * Checking in dot -- DON'T put a leading ./ on the thing.
   1018 	 */
   1019 	file = bmake_strdup(name);
   1020     }
   1021 
   1022     if (DEBUG(DIR)) {
   1023 	fprintf(debug_file, "checking %s ...\n", file);
   1024     }
   1025 
   1026     if (cached_stat(file, &stb) == 0) {
   1027 	nearmisses += 1;
   1028 	return file;
   1029     }
   1030     free(file);
   1031     return NULL;
   1032 }
   1033 
   1034 /*-
   1035  *-----------------------------------------------------------------------
   1036  * DirLookupAbs  --
   1037  *	Find if the file with the given name exists in the given path.
   1038  *
   1039  * Results:
   1040  *	The path to the file, the empty string or NULL. If the file is
   1041  *	the empty string, the search should be terminated.
   1042  *	This path is guaranteed to be in a different part of memory
   1043  *	than name and so may be safely free'd.
   1044  *
   1045  * Side Effects:
   1046  *	None.
   1047  *-----------------------------------------------------------------------
   1048  */
   1049 static char *
   1050 DirLookupAbs(Path *p, const char *name, const char *cp)
   1051 {
   1052     char *p1;			/* pointer into p->name */
   1053     const char *p2;		/* pointer into name */
   1054 
   1055     if (DEBUG(DIR)) {
   1056 	fprintf(debug_file, "   %s ...\n", p->name);
   1057     }
   1058 
   1059     /*
   1060      * If the file has a leading path component and that component
   1061      * exactly matches the entire name of the current search
   1062      * directory, we can attempt another cache lookup. And if we don't
   1063      * have a hit, we can safely assume the file does not exist at all.
   1064      */
   1065     for (p1 = p->name, p2 = name; *p1 && *p1 == *p2; p1++, p2++) {
   1066 	continue;
   1067     }
   1068     if (*p1 != '\0' || p2 != cp - 1) {
   1069 	return NULL;
   1070     }
   1071 
   1072     if (Hash_FindEntry(&p->files, cp) == NULL) {
   1073 	if (DEBUG(DIR)) {
   1074 	    fprintf(debug_file, "   must be here but isn't -- returning\n");
   1075 	}
   1076 	/* Return empty string: terminates search */
   1077 	return bmake_strdup("");
   1078     }
   1079 
   1080     p->hits += 1;
   1081     hits += 1;
   1082     if (DEBUG(DIR)) {
   1083 	fprintf(debug_file, "   returning %s\n", name);
   1084     }
   1085     return bmake_strdup(name);
   1086 }
   1087 
   1088 /*-
   1089  *-----------------------------------------------------------------------
   1090  * DirFindDot  --
   1091  *	Find the file given on "." or curdir
   1092  *
   1093  * Results:
   1094  *	The path to the file or NULL. This path is guaranteed to be in a
   1095  *	different part of memory than name and so may be safely free'd.
   1096  *
   1097  * Side Effects:
   1098  *	Hit counts change
   1099  *-----------------------------------------------------------------------
   1100  */
   1101 static char *
   1102 DirFindDot(Boolean hasSlash MAKE_ATTR_UNUSED, const char *name, const char *cp)
   1103 {
   1104 
   1105     if (Hash_FindEntry(&dot->files, cp) != NULL) {
   1106 	if (DEBUG(DIR)) {
   1107 	    fprintf(debug_file, "   in '.'\n");
   1108 	}
   1109 	hits += 1;
   1110 	dot->hits += 1;
   1111 	return bmake_strdup(name);
   1112     }
   1113     if (cur && Hash_FindEntry(&cur->files, cp) != NULL) {
   1114 	if (DEBUG(DIR)) {
   1115 	    fprintf(debug_file, "   in ${.CURDIR} = %s\n", cur->name);
   1116 	}
   1117 	hits += 1;
   1118 	cur->hits += 1;
   1119 	return str_concat3(cur->name, "/", cp);
   1120     }
   1121 
   1122     return NULL;
   1123 }
   1124 
/*-
 *-----------------------------------------------------------------------
 * Dir_FindFile  --
 *	Find the file with the given name along the given search path.
 *
 *	The search runs in up to three phases:
 *	1. If name has no directory part, or that part is exactly "./",
 *	   the cached contents of dot/cur and of every directory on the
 *	   path are consulted for the final component.
 *	2. If name contains a slash: relative names are probed below
 *	   dot, cur and each path member (DirLookupSubdir); absolute
 *	   names are matched against the directories themselves
 *	   (DirLookupAbs).
 *	3. As a last resort the name itself is checked via cached_stat.
 *
 * Input:
 *	name		the file to find
 *	path		the Lst of directories to search
 *
 * Results:
 *	The path to the file or NULL. This path is guaranteed to be in a
 *	different part of memory than name and so may be safely free'd.
 *
 * Side Effects:
 *	The statistics counters misses and bigmisses are updated here;
 *	the lookup helpers update the hit counters.
 *	The search path itself is not modified: the code that used to
 *	append the directory of a found file to the path is disabled
 *	(see the "notdef" section at the end of the function).
 *-----------------------------------------------------------------------
 */
char *
Dir_FindFile(const char *name, Lst path)
{
    LstNode ln;			/* a list element */
    char *file;			/* the current filename to check */
    Path *p;			/* current path member */
    const char *cp;		/* Terminal name of file */
    Boolean hasLastDot = FALSE;	/* true we should search dot last */
    Boolean hasSlash;		/* true if 'name' contains a / */
    struct stat stb;		/* Buffer for stat, if necessary */
    const char *trailing_dot = ".";

    /*
     * Find the final component of the name and note whether it has a
     * slash in it (the name, I mean)
     */
    cp = strrchr(name, '/');
    if (cp) {
	hasSlash = TRUE;
	cp += 1;
    } else {
	hasSlash = FALSE;
	cp = name;
    }

    if (DEBUG(DIR)) {
	fprintf(debug_file, "Searching for %s ...", name);
    }

    /*
     * The list stays open from here until the Lst_Close calls of
     * phase one; every return in between has to close it first.
     */
    if (Lst_Open(path) == FAILURE) {
	if (DEBUG(DIR)) {
	    fprintf(debug_file, "couldn't open path, file not found\n");
	}
	misses += 1;
	return NULL;
    }

    /*
     * The magic dotLast entry is only recognized as the first element
     * of the path; it requests that dot and cur be searched after the
     * other directories instead of before them.
     */
    if ((ln = Lst_First(path)) != NULL) {
	p = (Path *)Lst_Datum(ln);
	if (p == dotLast) {
	    hasLastDot = TRUE;
	    if (DEBUG(DIR))
		fprintf(debug_file, "[dot last]...");
	}
    }
    if (DEBUG(DIR)) {
	fprintf(debug_file, "\n");
    }

    /*
     * If there's no leading directory components or if the leading
     * directory component is exactly `./', consult the cached contents
     * of each of the directories on the search path.
     */
    if (!hasSlash || (cp - name == 2 && *name == '.')) {
	/*
	 * We look through all the directories on the path seeking one which
	 * contains the final component of the given name.  If such a beast
	 * is found, we concatenate the directory name and the final
	 * component and return the resulting string. If we don't find any
	 * such thing, we go on to phase two...
	 *
	 * No matter what, we always look for the file in the current
	 * directory before anywhere else (unless we found the magic
	 * DOTLAST path, in which case we search it last) and we *do not*
	 * add the ./ to it if it exists.
	 * This is so there are no conflicts between what the user
	 * specifies (fish.c) and what pmake finds (./fish.c).
	 */
	if (!hasLastDot && (file = DirFindDot(hasSlash, name, cp)) != NULL) {
	    Lst_Close(path);
	    return file;
	}

	while ((ln = Lst_Next(path)) != NULL) {
	    p = (Path *)Lst_Datum(ln);
	    if (p == dotLast)
		continue;
	    if ((file = DirLookup(p, name, cp, hasSlash)) != NULL) {
		Lst_Close(path);
		return file;
	    }
	}

	if (hasLastDot && (file = DirFindDot(hasSlash, name, cp)) != NULL) {
	    Lst_Close(path);
	    return file;
	}
    }
    Lst_Close(path);

    /*
     * We didn't find the file on any directory in the search path.
     * If the name doesn't contain a slash, that means it doesn't exist.
     * If it *does* contain a slash, however, there is still hope: it
     * could be in a subdirectory of one of the members of the search
     * path. (eg. /usr/include and sys/types.h. The above search would
     * fail to turn up types.h in /usr/include, but it *is* in
     * /usr/include/sys/types.h).
     * [ This no longer applies: If we find such a beast, we assume there
     * will be more (what else can we assume?) and add all but the last
     * component of the resulting name onto the search path (at the
     * end).]
     * This phase is only performed if the file is *not* absolute.
     */
    if (!hasSlash) {
	if (DEBUG(DIR)) {
	    fprintf(debug_file, "   failed.\n");
	}
	misses += 1;
	return NULL;
    }

    if (*cp == '\0') {
	/* we were given a trailing "/" */
	/*
	 * From here on cp no longer points into name.
	 * NOTE(review): DirLookupAbs compares a pointer into name
	 * against cp - 1; with cp set to trailing_dot that comparison
	 * cannot succeed -- confirm that this is intended.
	 */
	cp = trailing_dot;
    }

    if (name[0] != '/') {
	/* set once name has been probed relative to dot */
	Boolean checkedDot = FALSE;

	if (DEBUG(DIR)) {
	    fprintf(debug_file, "   Trying subdirectories...\n");
	}

	if (!hasLastDot) {
	    if (dot) {
		checkedDot = TRUE;
		if ((file = DirLookupSubdir(dot, name)) != NULL)
		    return file;
	    }
	    if (cur && (file = DirLookupSubdir(cur, name)) != NULL)
		return file;
	}

	(void)Lst_Open(path);
	while ((ln = Lst_Next(path)) != NULL) {
	    p = (Path *)Lst_Datum(ln);
	    if (p == dotLast)
		continue;
	    if (p == dot) {
		/* do not probe dot a second time */
		if (checkedDot)
		    continue;
		checkedDot = TRUE;
	    }
	    if ((file = DirLookupSubdir(p, name)) != NULL) {
		Lst_Close(path);
		return file;
	    }
	}
	Lst_Close(path);

	if (hasLastDot) {
	    if (dot && !checkedDot) {
		checkedDot = TRUE;
		if ((file = DirLookupSubdir(dot, name)) != NULL)
		    return file;
	    }
	    if (cur && (file = DirLookupSubdir(cur, name)) != NULL)
		return file;
	}

	if (checkedDot) {
	    /*
	     * Already checked by the given name, since . was in the path,
	     * so no point in proceeding...
	     */
	    if (DEBUG(DIR)) {
		fprintf(debug_file, "   Checked . already, returning NULL\n");
	    }
	    return NULL;
	}

    } else { /* name[0] == '/' */

	/*
	 * For absolute names, compare directory path prefix against the
	 * the directory path of each member on the search path for an exact
	 * match. If we have an exact match on any member of the search path,
	 * use the cached contents of that member to lookup the final file
	 * component. If that lookup fails we can safely assume that the
	 * file does not exist at all.  This is signified by DirLookupAbs()
	 * returning an empty string.
	 */
	if (DEBUG(DIR)) {
	    fprintf(debug_file, "   Trying exact path matches...\n");
	}

	if (!hasLastDot && cur &&
	    ((file = DirLookupAbs(cur, name, cp)) != NULL)) {
	    /* the empty string means "cannot exist": give up */
	    if (file[0] == '\0') {
		free(file);
		return NULL;
	    }
	    return file;
	}

	(void)Lst_Open(path);
	while ((ln = Lst_Next(path)) != NULL) {
	    p = (Path *)Lst_Datum(ln);
	    if (p == dotLast)
		continue;
	    if ((file = DirLookupAbs(p, name, cp)) != NULL) {
		Lst_Close(path);
		if (file[0] == '\0') {
		    free(file);
		    return NULL;
		}
		return file;
	    }
	}
	Lst_Close(path);

	if (hasLastDot && cur &&
	    ((file = DirLookupAbs(cur, name, cp)) != NULL)) {
	    if (file[0] == '\0') {
		free(file);
		return NULL;
	    }
	    return file;
	}
    }

    /*
     * Didn't find it that way, either. Sigh. Phase 3. Add its directory
     * onto the search path in any case, just in case, then look for the
     * thing in the hash table. If we find it, grand. We return a new
     * copy of the name. Otherwise we sadly return a NULL pointer. Sigh.
     * Note that if the directory holding the file doesn't exist, this will
     * do an extra search of the final directory on the path. Unless something
     * weird happens, this search won't succeed and life will be groovy.
     *
     * Sigh. We cannot add the directory onto the search path because
     * of this amusing case:
     * $(INSTALLDIR)/$(FILE): $(FILE)
     *
     * $(FILE) exists in $(INSTALLDIR) but not in the current one.
     * When searching for $(FILE), we will find it in $(INSTALLDIR)
     * b/c we added it here. This is not good...
     */
#ifdef notdef
    /*
     * Disabled variant that adds the directory to the search path; it
     * is kept for reference only and is not compiled.
     */
    if (cp == traling_dot) {
	cp = strrchr(name, '/');
	cp += 1;
    }
    cp[-1] = '\0';
    (void)Dir_AddDir(path, name);
    cp[-1] = '/';

    bigmisses += 1;
    ln = Lst_Last(path);
    if (ln == NULL) {
	return NULL;
    } else {
	p = (Path *)Lst_Datum(ln);
    }

    if (Hash_FindEntry(&p->files, cp) != NULL) {
	return bmake_strdup(name);
    } else {
	return NULL;
    }
#else /* !notdef */
    /*
     * Active variant: check the name exactly as given, via cached_stat.
     */
    if (DEBUG(DIR)) {
	fprintf(debug_file, "   Looking for \"%s\" ...\n", name);
    }

    bigmisses += 1;
    if (cached_stat(name, &stb) == 0) {
	return bmake_strdup(name);
    }

    if (DEBUG(DIR)) {
	fprintf(debug_file, "   failed. Returning NULL\n");
    }
    return NULL;
#endif /* notdef */
}
   1425 
   1426 
   1427 /*-
   1428  *-----------------------------------------------------------------------
   1429  * Dir_FindHereOrAbove  --
   1430  *	search for a path starting at a given directory and then working
   1431  *	our way up towards the root.
   1432  *
   1433  * Input:
   1434  *	here		starting directory
   1435  *	search_path	the path we are looking for
   1436  *	result		the result of a successful search is placed here
   1437  *	rlen		the length of the result buffer
   1438  *			(typically MAXPATHLEN + 1)
   1439  *
   1440  * Results:
   1441  *	0 on failure, 1 on success [in which case the found path is put
   1442  *	in the result buffer].
   1443  *
   1444  * Side Effects:
   1445  *-----------------------------------------------------------------------
   1446  */
   1447 int
   1448 Dir_FindHereOrAbove(char *here, char *search_path, char *result, int rlen)
   1449 {
   1450     struct stat st;
   1451     char dirbase[MAXPATHLEN + 1], *db_end;
   1452     char try[MAXPATHLEN + 1], *try_end;
   1453 
   1454     /* copy out our starting point */
   1455     snprintf(dirbase, sizeof(dirbase), "%s", here);
   1456     db_end = dirbase + strlen(dirbase);
   1457 
   1458     /* loop until we determine a result */
   1459     while (1) {
   1460 
   1461 	/* try and stat(2) it ... */
   1462 	snprintf(try, sizeof(try), "%s/%s", dirbase, search_path);
   1463 	if (cached_stat(try, &st) != -1) {
   1464 	    /*
   1465 	     * success!  if we found a file, chop off
   1466 	     * the filename so we return a directory.
   1467 	     */
   1468 	    if ((st.st_mode & S_IFMT) != S_IFDIR) {
   1469 		try_end = try + strlen(try);
   1470 		while (try_end > try && *try_end != '/')
   1471 		    try_end--;
   1472 		if (try_end > try)
   1473 		    *try_end = 0;	/* chop! */
   1474 	    }
   1475 
   1476 	    /*
   1477 	     * done!
   1478 	     */
   1479 	    snprintf(result, rlen, "%s", try);
   1480 	    return 1;
   1481 	}
   1482 
   1483 	/*
   1484 	 * nope, we didn't find it.  if we used up dirbase we've
   1485 	 * reached the root and failed.
   1486 	 */
   1487 	if (db_end == dirbase)
   1488 	    break;		/* failed! */
   1489 
   1490 	/*
   1491 	 * truncate dirbase from the end to move up a dir
   1492 	 */
   1493 	while (db_end > dirbase && *db_end != '/')
   1494 	    db_end--;
   1495 	*db_end = 0;		/* chop! */
   1496 
   1497     } /* while (1) */
   1498 
   1499     /*
   1500      * we failed...
   1501      */
   1502     return 0;
   1503 }
   1504 
   1505 /*-
   1506  *-----------------------------------------------------------------------
   1507  * Dir_MTime  --
   1508  *	Find the modification time of the file described by gn along the
   1509  *	search path dirSearchPath.
   1510  *
   1511  * Input:
   1512  *	gn		the file whose modification time is desired
   1513  *
   1514  * Results:
   1515  *	The modification time or 0 if it doesn't exist
   1516  *
   1517  * Side Effects:
   1518  *	The modification time is placed in the node's mtime slot.
   1519  *	If the node didn't have a path entry before, and Dir_FindFile
   1520  *	found one for it, the full name is placed in the path slot.
   1521  *-----------------------------------------------------------------------
   1522  */
   1523 int
   1524 Dir_MTime(GNode *gn, Boolean recheck)
   1525 {
   1526     char *fullName;		/* the full pathname of name */
   1527     struct stat stb;		/* buffer for finding the mod time */
   1528 
   1529     if (gn->type & OP_ARCHV) {
   1530 	return Arch_MTime(gn);
   1531     } else if (gn->type & OP_PHONY) {
   1532 	gn->mtime = 0;
   1533 	return 0;
   1534     } else if (gn->path == NULL) {
   1535 	if (gn->type & OP_NOPATH)
   1536 	    fullName = NULL;
   1537 	else {
   1538 	    fullName = Dir_FindFile(gn->name, Suff_FindPath(gn));
   1539 	    if (fullName == NULL && gn->flags & FROM_DEPEND &&
   1540 		!Lst_IsEmpty(gn->iParents)) {
   1541 		char *cp;
   1542 
   1543 		cp = strrchr(gn->name, '/');
   1544 		if (cp) {
   1545 		    /*
   1546 		     * This is an implied source, and it may have moved,
   1547 		     * see if we can find it via the current .PATH
   1548 		     */
   1549 		    cp++;
   1550 
   1551 		    fullName = Dir_FindFile(cp, Suff_FindPath(gn));
   1552 		    if (fullName) {
   1553 			/*
   1554 			 * Put the found file in gn->path
   1555 			 * so that we give that to the compiler.
   1556 			 */
   1557 			gn->path = bmake_strdup(fullName);
   1558 			if (!Job_RunTarget(".STALE", gn->fname))
   1559 			    fprintf(stdout,
   1560 				    "%s: %s, %d: ignoring stale %s for %s, "
   1561 				    "found %s\n", progname, gn->fname,
   1562 				    gn->lineno,
   1563 				    makeDependfile, gn->name, fullName);
   1564 		    }
   1565 		}
   1566 	    }
   1567 	    if (DEBUG(DIR))
   1568 		fprintf(debug_file, "Found '%s' as '%s'\n",
   1569 			gn->name, fullName ? fullName : "(not found)");
   1570 	}
   1571     } else {
   1572 	fullName = gn->path;
   1573     }
   1574 
   1575     if (fullName == NULL) {
   1576 	fullName = bmake_strdup(gn->name);
   1577     }
   1578 
   1579     if (cached_stats(&mtimes, fullName, &stb, recheck ? CST_UPDATE : 0) < 0) {
   1580 	if (gn->type & OP_MEMBER) {
   1581 	    if (fullName != gn->path)
   1582 		free(fullName);
   1583 	    return Arch_MemMTime(gn);
   1584 	} else {
   1585 	    stb.st_mtime = 0;
   1586 	}
   1587     }
   1588 
   1589     if (fullName && gn->path == NULL) {
   1590 	gn->path = fullName;
   1591     }
   1592 
   1593     gn->mtime = stb.st_mtime;
   1594     return gn->mtime;
   1595 }
   1596 
   1597 /*-
   1598  *-----------------------------------------------------------------------
   1599  * Dir_AddDir --
   1600  *	Add the given name to the end of the given path. The order of
   1601  *	the arguments is backwards so ParseDoDependency can do a
   1602  *	Lst_ForEach of its list of paths...
   1603  *
   1604  * Input:
   1605  *	path		the path to which the directory should be
   1606  *			added
   1607  *	name		the name of the directory to add
   1608  *
   1609  * Results:
   1610  *	none
   1611  *
   1612  * Side Effects:
   1613  *	A structure is added to the list and the directory is
   1614  *	read and hashed.
   1615  *-----------------------------------------------------------------------
   1616  */
   1617 Path *
   1618 Dir_AddDir(Lst path, const char *name)
   1619 {
   1620     LstNode ln = NULL;		/* node in case Path structure is found */
   1621     Path *p = NULL;		/* pointer to new Path structure */
   1622     DIR *d;			/* for reading directory */
   1623     struct dirent *dp;		/* entry in directory */
   1624 
   1625     if (strcmp(name, ".DOTLAST") == 0) {
   1626 	ln = Lst_Find(path, name, DirFindName);
   1627 	if (ln != NULL)
   1628 	    return (Path *)Lst_Datum(ln);
   1629 	else {
   1630 	    dotLast->refCount += 1;
   1631 	    (void)Lst_AtFront(path, dotLast);
   1632 	}
   1633     }
   1634 
   1635     if (path)
   1636 	ln = Lst_Find(openDirectories, name, DirFindName);
   1637     if (ln != NULL) {
   1638 	p = (Path *)Lst_Datum(ln);
   1639 	if (path && Lst_Member(path, p) == NULL) {
   1640 	    p->refCount += 1;
   1641 	    (void)Lst_AtEnd(path, p);
   1642 	}
   1643     } else {
   1644 	if (DEBUG(DIR)) {
   1645 	    fprintf(debug_file, "Caching %s ...", name);
   1646 	}
   1647 
   1648 	if ((d = opendir(name)) != NULL) {
   1649 	    p = bmake_malloc(sizeof(Path));
   1650 	    p->name = bmake_strdup(name);
   1651 	    p->hits = 0;
   1652 	    p->refCount = 1;
   1653 	    Hash_InitTable(&p->files, -1);
   1654 
   1655 	    while ((dp = readdir(d)) != NULL) {
   1656 #if defined(sun) && defined(d_ino) /* d_ino is a sunos4 #define for d_fileno */
   1657 		/*
   1658 		 * The sun directory library doesn't check for a 0 inode
   1659 		 * (0-inode slots just take up space), so we have to do
   1660 		 * it ourselves.
   1661 		 */
   1662 		if (dp->d_fileno == 0) {
   1663 		    continue;
   1664 		}
   1665 #endif /* sun && d_ino */
   1666 		(void)Hash_CreateEntry(&p->files, dp->d_name, NULL);
   1667 	    }
   1668 	    (void)closedir(d);
   1669 	    (void)Lst_AtEnd(openDirectories, p);
   1670 	    if (path != NULL)
   1671 		(void)Lst_AtEnd(path, p);
   1672 	}
   1673 	if (DEBUG(DIR)) {
   1674 	    fprintf(debug_file, "done\n");
   1675 	}
   1676     }
   1677     return p;
   1678 }
   1679 
   1680 /*-
   1681  *-----------------------------------------------------------------------
   1682  * Dir_CopyDir --
   1683  *	Callback function for duplicating a search path via Lst_Duplicate.
   1684  *	Ups the reference count for the directory.
   1685  *
   1686  * Results:
   1687  *	Returns the Path it was given.
   1688  *
   1689  * Side Effects:
   1690  *	The refCount of the path is incremented.
   1691  *
   1692  *-----------------------------------------------------------------------
   1693  */
   1694 void *
   1695 Dir_CopyDir(void *p)
   1696 {
   1697     ((Path *)p)->refCount += 1;
   1698 
   1699     return p;
   1700 }
   1701 
   1702 /*-
   1703  *-----------------------------------------------------------------------
   1704  * Dir_MakeFlags --
   1705  *	Make a string by taking all the directories in the given search
   1706  *	path and preceding them by the given flag. Used by the suffix
   1707  *	module to create variables for compilers based on suffix search
   1708  *	paths.
   1709  *
   1710  * Input:
   1711  *	flag		flag which should precede each directory
   1712  *	path		list of directories
   1713  *
   1714  * Results:
   1715  *	The string mentioned above. Note that there is no space between
   1716  *	the given flag and each directory. The empty string is returned if
   1717  *	Things don't go well.
   1718  *
   1719  * Side Effects:
   1720  *	None
   1721  *-----------------------------------------------------------------------
   1722  */
   1723 char *
   1724 Dir_MakeFlags(const char *flag, Lst path)
   1725 {
   1726     char *str;			/* the string which will be returned */
   1727     char *s1, *s2;		/* the current directory preceded by 'flag' */
   1728     LstNode ln;			/* the node of the current directory */
   1729     Path *p;			/* the structure describing the current
   1730 				 * directory */
   1731 
   1732     str = bmake_strdup("");
   1733 
   1734     if (Lst_Open(path) == SUCCESS) {
   1735 	while ((ln = Lst_Next(path)) != NULL) {
   1736 	    p = (Path *)Lst_Datum(ln);
   1737 	    s2 = str_concat2(flag, p->name);
   1738 	    str = str_concat3(s1 = str, " ", s2);
   1739 	    free(s1);
   1740 	    free(s2);
   1741 	}
   1742 	Lst_Close(path);
   1743     }
   1744 
   1745     return str;
   1746 }
   1747 
   1748 /*-
   1749  *-----------------------------------------------------------------------
   1750  * Dir_Destroy --
   1751  *	Nuke a directory descriptor, if possible. Callback procedure
   1752  *	for the suffixes module when destroying a search path.
   1753  *
   1754  * Input:
   1755  *	pp		The directory descriptor to nuke
   1756  *
   1757  * Results:
   1758  *	None.
   1759  *
   1760  * Side Effects:
   1761  *	If no other path references this directory (refCount == 0),
   1762  *	the Path and all its data are freed.
   1763  *
   1764  *-----------------------------------------------------------------------
   1765  */
   1766 void
   1767 Dir_Destroy(void *pp)
   1768 {
   1769     Path *p = (Path *)pp;
   1770     p->refCount -= 1;
   1771 
   1772     if (p->refCount == 0) {
   1773 	LstNode ln;
   1774 
   1775 	ln = Lst_Member(openDirectories, p);
   1776 	(void)Lst_Remove(openDirectories, ln);
   1777 
   1778 	Hash_DeleteTable(&p->files);
   1779 	free(p->name);
   1780 	free(p);
   1781     }
   1782 }
   1783 
   1784 /*-
   1785  *-----------------------------------------------------------------------
   1786  * Dir_ClearPath --
   1787  *	Clear out all elements of the given search path. This is different
   1788  *	from destroying the list, notice.
   1789  *
   1790  * Input:
   1791  *	path		Path to clear
   1792  *
   1793  * Results:
   1794  *	None.
   1795  *
   1796  * Side Effects:
   1797  *	The path is set to the empty list.
   1798  *
   1799  *-----------------------------------------------------------------------
   1800  */
   1801 void
   1802 Dir_ClearPath(Lst path)
   1803 {
   1804     Path *p;
   1805     while (!Lst_IsEmpty(path)) {
   1806 	p = (Path *)Lst_DeQueue(path);
   1807 	Dir_Destroy(p);
   1808     }
   1809 }
   1810 
   1811 
   1812 /*-
   1813  *-----------------------------------------------------------------------
   1814  * Dir_Concat --
   1815  *	Concatenate two paths, adding the second to the end of the first.
   1816  *	Makes sure to avoid duplicates.
   1817  *
   1818  * Input:
   1819  *	path1		Dest
   1820  *	path2		Source
   1821  *
   1822  * Results:
   1823  *	None
   1824  *
   1825  * Side Effects:
   1826  *	Reference counts for added dirs are upped.
   1827  *
   1828  *-----------------------------------------------------------------------
   1829  */
   1830 void
   1831 Dir_Concat(Lst path1, Lst path2)
   1832 {
   1833     LstNode ln;
   1834     Path *p;
   1835 
   1836     for (ln = Lst_First(path2); ln != NULL; ln = Lst_Succ(ln)) {
   1837 	p = (Path *)Lst_Datum(ln);
   1838 	if (Lst_Member(path1, p) == NULL) {
   1839 	    p->refCount += 1;
   1840 	    (void)Lst_AtEnd(path1, p);
   1841 	}
   1842     }
   1843 }
   1844 
   1845 /********** DEBUG INFO **********/
   1846 void
   1847 Dir_PrintDirectories(void)
   1848 {
   1849     LstNode ln;
   1850     Path *p;
   1851 
   1852     fprintf(debug_file, "#*** Directory Cache:\n");
   1853     fprintf(debug_file,
   1854 	    "# Stats: %d hits %d misses %d near misses %d losers (%d%%)\n",
   1855 	    hits, misses, nearmisses, bigmisses,
   1856 	    (hits + bigmisses + nearmisses ?
   1857 	     hits * 100 / (hits + bigmisses + nearmisses) : 0));
   1858     fprintf(debug_file, "# %-20s referenced\thits\n", "directory");
   1859     if (Lst_Open(openDirectories) == SUCCESS) {
   1860 	while ((ln = Lst_Next(openDirectories)) != NULL) {
   1861 	    p = (Path *)Lst_Datum(ln);
   1862 	    fprintf(debug_file, "# %-20s %10d\t%4d\n", p->name, p->refCount,
   1863 		    p->hits);
   1864 	}
   1865 	Lst_Close(openDirectories);
   1866     }
   1867 }
   1868 
   1869 static int
   1870 DirPrintDir(void *p, void *dummy MAKE_ATTR_UNUSED)
   1871 {
   1872     fprintf(debug_file, "%s ", ((Path *)p)->name);
   1873     return 0;
   1874 }
   1875 
   1876 void
   1877 Dir_PrintPath(Lst path)
   1878 {
   1879     Lst_ForEach(path, DirPrintDir, NULL);
   1880 }
   1881