Home | History | Annotate | Line # | Download | only in makewhatis
makewhatis.c revision 1.21
      1 /*	$NetBSD: makewhatis.c,v 1.21 2002/01/31 22:43:41 tv Exp $	*/
      2 
      3 /*-
      4  * Copyright (c) 1999 The NetBSD Foundation, Inc.
      5  * All rights reserved.
      6  *
      7  * This code is derived from software contributed to The NetBSD Foundation
      8  * by Matthias Scheler.
      9  *
     10  * Redistribution and use in source and binary forms, with or without
     11  * modification, are permitted provided that the following conditions
     12  * are met:
     13  * 1. Redistributions of source code must retain the above copyright
     14  *    notice, this list of conditions and the following disclaimer.
     15  * 2. Redistributions in binary form must reproduce the above copyright
     16  *    notice, this list of conditions and the following disclaimer in the
     17  *    documentation and/or other materials provided with the distribution.
     18  * 3. All advertising materials mentioning features or use of this software
     19  *    must display the following acknowledgement:
     20  *	This product includes software developed by the NetBSD
     21  *	Foundation, Inc. and its contributors.
     22  * 4. Neither the name of The NetBSD Foundation nor the names of its
     23  *    contributors may be used to endorse or promote products derived
     24  *    from this software without specific prior written permission.
     25  *
     26  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     27  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     28  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     29  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     30  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     31  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     32  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     33  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     34  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     35  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     36  * POSSIBILITY OF SUCH DAMAGE.
     37  */
     38 
     39 #include <sys/cdefs.h>
     40 #if defined(__COPYRIGHT) && !defined(lint)
     41 __COPYRIGHT("@(#) Copyright (c) 1999 The NetBSD Foundation, Inc.\n\
     42 	All rights reserved.\n");
     43 #endif /* not lint */
     44 
     45 #if defined(__RCSID) && !defined(lint)
     46 __RCSID("$NetBSD: makewhatis.c,v 1.21 2002/01/31 22:43:41 tv Exp $");
     47 #endif /* not lint */
     48 
     49 #if HAVE_CONFIG_H
     50 #include "config.h"
     51 #endif
     52 
     53 #include <sys/types.h>
     54 #include <sys/param.h>
     55 #include <sys/stat.h>
     56 #include <sys/wait.h>
     57 
     58 #include <ctype.h>
     59 #include <err.h>
     60 #include <errno.h>
     61 #include <fcntl.h>
     62 #include <fts.h>
     63 #include <locale.h>
     64 #include <paths.h>
     65 #include <signal.h>
     66 #include <stdio.h>
     67 #include <stdlib.h>
     68 #include <string.h>
     69 #include <unistd.h>
     70 #include <zlib.h>
     71 
/*
 * Node of the binary search tree of manual page files.  The tree is
 * keyed on the inode number.  The path name is stored inline: the code
 * creating a node allocates extra room behind mp_name for the string.
 */
typedef struct manpagestruct manpage;
struct manpagestruct {
	manpage	*mp_left;	/* nodes with a smaller inode number */
	manpage	*mp_right;	/* nodes with a larger inode number */
	ino_t	 mp_inode;	/* inode number of the file (tree key) */
	char	 mp_name[1];	/* path name, NUL-terminated */
};
     78 
/*
 * Node of the binary search tree of whatis entries.  Entries are ordered
 * by strcmp() on wi_data.
 */
typedef struct whatisstruct whatis;
struct whatisstruct {
	whatis	*wi_left;	/* entries sorting before wi_data */
	whatis	*wi_right;	/* entries sorting after wi_data */
	char	*wi_data;	/* text of the entry */
};
     84 
     85 int	 main(int, char **);
     86 char	*findwhitespace(char *);
     87 char	*strmove(char *,char *);
     88 char	*GetS(gzFile, char *, size_t);
     89 int	 manpagesection(char *);
     90 char	*createsectionstring(char *);
     91 void	 addmanpage(manpage **, ino_t, char *);
     92 void	 addwhatis(whatis **, char *);
     93 char	*replacestring(char *, char *, char *);
     94 void	 catpreprocess(char *);
     95 char	*parsecatpage(gzFile *);
     96 int	 manpreprocess(char *);
     97 char	*nroff(gzFile *);
     98 char	*parsemanpage(gzFile *, int);
     99 char	*getwhatisdata(char *);
    100 void	 processmanpages(manpage **,whatis **);
    101 void	 dumpwhatis(FILE *, whatis *);
    102 void	*emalloc(size_t);
    103 char	*estrdup(const char *);
    104 
/* Manual hierarchy scanned when no directory is given on the command line. */
char *default_manpath[] = {
	"/usr/share/man",
	NULL
};

/*
 * Characters accepted after a '.' in a file name as a section suffix.
 * The position of a character in this string is the section index.
 */
char sectionext[] = "0123456789ln";

/* Name of the database file that gets written. */
char whatisdb[] = "whatis.db";
    112 
    113 int
    114 main(int argc, char **argv)
    115 {
    116 	char	**manpath;
    117 	FTS	*fts;
    118 	FTSENT	*fe;
    119 	manpage *source;
    120 	whatis	*dest;
    121 	FILE	*out;
    122 
    123 	(void)setlocale(LC_ALL, "");
    124 
    125 	manpath = (argc < 2) ? default_manpath : &argv[1];
    126 
    127 	if ((fts = fts_open(manpath, FTS_LOGICAL, NULL)) == NULL)
    128 		err(EXIT_FAILURE, "Cannot open `%s'", *manpath);
    129 
    130 	source = NULL;
    131 	while ((fe = fts_read(fts)) != NULL) {
    132 		switch (fe->fts_info) {
    133 		case FTS_F:
    134 			if (manpagesection(fe->fts_path) >= 0)
    135 				addmanpage(&source, fe->fts_statp->st_ino,
    136 				    fe->fts_path);
    137 			/*FALLTHROUGH*/
    138 		case FTS_D:
    139 		case FTS_DC:
    140 		case FTS_DEFAULT:
    141 		case FTS_DP:
    142 		case FTS_SLNONE:
    143 			break;
    144 		default:
    145 			errno = fe->fts_errno;
    146 			err(EXIT_FAILURE, "Error reading `%s'", fe->fts_path);
    147 		}
    148 	}
    149 
    150 	(void)fts_close(fts);
    151 
    152 	dest = NULL;
    153 	processmanpages(&source, &dest);
    154 
    155 	if (chdir(manpath[0]) == -1)
    156 		err(EXIT_FAILURE, "Cannot change dir to `%s'", manpath[0]);
    157 
    158 	(void)unlink(whatisdb);
    159 	if ((out = fopen(whatisdb, "w")) == NULL)
    160 		err(EXIT_FAILURE, "Cannot open `%s'", whatisdb);
    161 
    162 	dumpwhatis(out, dest);
    163 	if (fchmod(fileno(out), S_IRUSR|S_IRGRP|S_IROTH) == -1)
    164 		err(EXIT_FAILURE, "Cannot chmod `%s'", whatisdb);
    165 	if (fclose(out) != 0)
    166 		err(EXIT_FAILURE, "Cannot close `%s'", whatisdb);
    167 
    168 	return EXIT_SUCCESS;
    169 }
    170 
/*
 * Return a pointer to the first whitespace character in str, or NULL
 * when the string contains none.
 */
char *
findwhitespace(char *str)
{
	for (; *str != '\0'; str++) {
		if (isspace((unsigned char)*str))
			return str;
	}

	return NULL;
}
    182 
/*
 * Copy the NUL-terminated string src to dest; the two regions may
 * overlap.  Returns dest.
 */
char *
strmove(char *dest, char *src)
{
	size_t	nbytes;

	nbytes = strlen(src) + 1;	/* include the terminator */
	return memmove(dest, src, nbytes);
}
    188 
    189 char *
    190 GetS(gzFile in, char *buffer, size_t length)
    191 {
    192 	char	*ptr;
    193 
    194 	if (((ptr = gzgets(in, buffer, (int)length)) != NULL) && (*ptr == '\0'))
    195 		ptr = NULL;
    196 
    197 	return ptr;
    198 }
    199 
    200 int
    201 manpagesection(char *name)
    202 {
    203 	char	*ptr;
    204 
    205 	if ((ptr = strrchr(name, '/')) != NULL)
    206 		ptr++;
    207 	else
    208 		ptr = name;
    209 
    210 	while ((ptr = strchr(ptr, '.')) != NULL) {
    211 		int section;
    212 
    213 		ptr++;
    214 		section=0;
    215 		while (sectionext[section] != '\0')
    216 			if (sectionext[section] == *ptr)
    217 				return section;
    218 			else
    219 				section++;
    220 	}
    221 
    222 	return -1;
    223 }
    224 
/*
 * Build the string " (<section_id>) - " in freshly allocated memory.
 * The caller owns the result and must free() it.
 */
char *
createsectionstring(char *section_id)
{
	static const char open[] = " (";
	static const char close[] = ") - ";
	size_t	 idlen;
	char	*result;

	idlen = strlen(section_id);
	/* 2 bytes prefix + id + 4 bytes suffix + terminator */
	result = emalloc(idlen + 7);

	(void)memcpy(result, open, 2);
	(void)memcpy(result + 2, section_id, idlen);
	(void)memcpy(result + 2 + idlen, close, sizeof(close));

	return result;
}
    234 
    235 void
    236 addmanpage(manpage **tree,ino_t inode,char *name)
    237 {
    238 	manpage *mp;
    239 
    240 	while ((mp = *tree) != NULL) {
    241 		if (mp->mp_inode == inode)
    242 			return;
    243 		tree = inode < mp->mp_inode ? &mp->mp_left : &mp->mp_right;
    244 	}
    245 
    246 	mp = emalloc(sizeof(manpage) + strlen(name));
    247 	mp->mp_left = NULL;
    248 	mp->mp_right = NULL;
    249 	mp->mp_inode = inode;
    250 	(void)strcpy(mp->mp_name, name);
    251 	*tree = mp;
    252 }
    253 
    254 void
    255 addwhatis(whatis **tree, char *data)
    256 {
    257 	whatis *wi;
    258 	int result;
    259 
    260 	while (isspace((unsigned char)*data))
    261 		data++;
    262 
    263 	if (*data == '/') {
    264 		char *ptr;
    265 
    266 		ptr = ++data;
    267 		while ((*ptr != '\0') && !isspace((unsigned char)*ptr))
    268 			if (*ptr++ == '/')
    269 				data = ptr;
    270 	}
    271 
    272 	while ((wi = *tree) != NULL) {
    273 		result = strcmp(data, wi->wi_data);
    274 		if (result == 0) return;
    275 		tree = result < 0 ? &wi->wi_left : &wi->wi_right;
    276 	}
    277 
    278 	wi = emalloc(sizeof(whatis) + strlen(data));
    279 
    280 	wi->wi_left = NULL;
    281 	wi->wi_right = NULL;
    282 	wi->wi_data = data;
    283 	*tree = wi;
    284 }
    285 
/*
 * Clean up a line of a formatted (cat) page in place:
 *  - leading and trailing whitespace is removed,
 *  - every other run of whitespace becomes a single blank,
 *  - a character followed by a backspace is dropped together with the
 *    backspace (overstrike sequences used for bold/underline).
 */
void
catpreprocess(char *from)
{
	char	*out;

	out = from;
	while (isspace((unsigned char)*from))
		from++;

	while (*from != '\0') {
		if (isspace((unsigned char)*from)) {
			do {
				from++;
			} while (isspace((unsigned char)*from));
			/* No blank for whitespace at the end of the line. */
			if (*from != '\0')
				*out++ = ' ';
			continue;
		}

		if (from[1] == '\10') {
			from += 2;
			continue;
		}

		*out++ = *from++;
	}

	*out = '\0';
}
    307 
/*
 * Return a newly allocated copy of string in which the first occurrence
 * of old is replaced by new.  When new is NULL or old does not occur, a
 * plain copy of string is returned.  The caller frees the result.
 */
char *
replacestring(char *string, char *old, char *new)
{
	char	*hit, *tail, *result;
	size_t	 prefix, newlen, taillen;

	if (new == NULL || (hit = strstr(string, old)) == NULL)
		return estrdup(string);

	prefix = hit - string;
	newlen = strlen(new);
	tail = hit + strlen(old);
	taillen = strlen(tail);

	result = emalloc(prefix + newlen + taillen + 1);
	(void)memcpy(result, string, prefix);
	(void)memcpy(result + prefix, new, newlen);
	(void)memcpy(result + prefix + newlen, tail, taillen + 1);

	return result;
}
    334 
    335 char *
    336 parsecatpage(gzFile *in)
    337 {
    338 	char	 buffer[8192];
    339 	char	*section, *ptr, *last;
    340 	size_t	 size;
    341 
    342 	do {
    343 		if (GetS(in, buffer, sizeof(buffer)) == NULL)
    344 			return NULL;
    345 	}
    346 	while (buffer[0] == '\n');
    347 
    348 	section = NULL;
    349 	if ((ptr = strchr(buffer, '(')) != NULL) {
    350 		if ((last = strchr(ptr + 1, ')')) !=NULL) {
    351 			size_t	length;
    352 
    353 			length = last - ptr + 1;
    354 			section = emalloc(length + 5);
    355 			*section = ' ';
    356 			(void) memcpy(section + 1, ptr, length);
    357 			(void) strcpy(section + 1 + length, " - ");
    358 		}
    359 	}
    360 
    361 	for (;;) {
    362 		if (GetS(in, buffer, sizeof(buffer)) == NULL) {
    363 			free(section);
    364 			return NULL;
    365 		}
    366 		catpreprocess(buffer);
    367 		if (strncmp(buffer, "NAME", 4) == 0)
    368 			break;
    369 	}
    370 
    371 	ptr = last = buffer;
    372 	size = sizeof(buffer) - 1;
    373 	while ((size > 0) && (GetS(in, ptr, size) != NULL)) {
    374 		int	 length;
    375 
    376 		catpreprocess(ptr);
    377 
    378 		length = strlen(ptr);
    379 		if (length == 0) {
    380 			*last = '\0';
    381 
    382 			ptr = replacestring(buffer, " - ", section);
    383 			free(section);
    384 			return ptr;
    385 		}
    386 		if ((length > 1) && (ptr[length - 1] == '-') &&
    387 		    isalpha(ptr[length - 2]))
    388 			last = &ptr[--length];
    389 		else {
    390 			last = &ptr[length++];
    391 			*last = ' ';
    392 		}
    393 
    394 		ptr += length;
    395 		size -= length;
    396 	}
    397 
    398 	free(section);
    399 
    400 	return NULL;
    401 }
    402 
/*
 * Simplify one line of manual page source in place.
 *
 * Returns 1, leaving the line untouched, if it is a roff comment
 * (optional whitespace followed by .\").  Otherwise returns 0 after:
 *  - dropping leading/trailing whitespace and squeezing inner runs of
 *    whitespace into one blank (no blank is emitted before a ','),
 *  - removing double quotes,
 *  - removing backslash escapes: "\-" becomes "-", "\f" and "\s" are
 *    removed together with their argument, any other escape loses the
 *    backslash and the character following it,
 *  - rewriting ".Xr name sect [trail]" into "name(sect)[trail]".
 */
int
manpreprocess(char *line)
{
	char	*from, *to;

	to = from = line;
	while (isspace((unsigned char)*from))
		from++;
	if (strncmp(from, ".\\\"", 3) == 0)
		return 1;

	while (*from != '\0') {
		if (isspace((unsigned char)*from)) {
			while (isspace((unsigned char)*++from))
				continue;
			if ((*from != '\0') && (*from != ','))
				*to++ = ' ';
		} else if (*from == '\\') {
			switch (*++from) {
			case '\0':
			case '-':
				/* "\-" keeps the '-', copied next round. */
				break;
			case 'f':
			case 's': {
				int	font = (*from == 'f');

				from++;
				if (font && (*from == '(')) {
					/* \f(XX: two-character font name */
					from++;
					if (*from != '\0')
						from++;
					if (*from != '\0')
						from++;
					break;
				}
				if (font && isalpha((unsigned char)*from)) {
					/*
					 * \fB, \fI, \fP ...: drop the font
					 * letter, which would otherwise end
					 * up in the output text.
					 */
					from++;
					break;
				}
				/* Numeric argument with optional sign. */
				if ((*from == '+') || (*from == '-'))
					from++;
				while (isdigit((unsigned char)*from))
					from++;
				break;
			}
			default:
				from++;
			}
		} else if (*from == '"') {
			from++;
		} else {
			*to++ = *from++;
		}
	}

	*to = '\0';

	if (strncasecmp(line, ".Xr", 3) == 0) {
		char	*sect;

		from = line + 3;
		if (isspace((unsigned char)*from))
			from++;

		if ((sect = findwhitespace(from)) != NULL) {
			size_t	length;
			char	*trail;

			/* Split into name, section and optional trailer. */
			*sect++ = '\0';
			if ((trail = findwhitespace(sect)) != NULL)
				*trail++ = '\0';

			/*
			 * Reassemble at the start of the line.  The result
			 * is shorter than the input, so every piece only
			 * moves towards the front.
			 */
			length = strlen(from);
			(void) memmove(line, from, length);
			line[length++] = '(';
			to = &line[length];
			length = strlen(sect);
			(void) memmove(to, sect, length);
			if (trail == NULL) {
				(void) strcpy(&to[length], ")");
			} else {
				to += length;
				*to++ = ')';
				length = strlen(trail);
				(void) memmove(to, trail, length + 1);
			}
		}
	}

	return 0;
}
    476 
    477 char *
    478 nroff(gzFile *in)
    479 {
    480 	char tempname[MAXPATHLEN], buffer[65536], *data;
    481 	int tempfd, bytes, pipefd[2], status;
    482 	static int devnull = -1;
    483 	pid_t child;
    484 
    485 	if (gzrewind(in) < 0)
    486 		err(EXIT_FAILURE, "Cannot rewind pipe");
    487 
    488 	if ((devnull < 0) &&
    489 	    ((devnull = open(_PATH_DEVNULL, O_WRONLY, 0)) < 0))
    490 		err(EXIT_FAILURE, "Cannot open `/dev/null'");
    491 
    492 	(void)strcpy(tempname, _PATH_TMP "makewhatis.XXXXXX");
    493 	if ((tempfd = mkstemp(tempname)) == -1)
    494 		err(EXIT_FAILURE, "Cannot create temp file");
    495 
    496 	while ((bytes = gzread(in, buffer, sizeof(buffer))) > 0)
    497 		if (write(tempfd, buffer, (size_t)bytes) != bytes) {
    498 			bytes = -1;
    499 			break;
    500 		}
    501 
    502 	if (bytes < 0) {
    503 		(void)close(tempfd);
    504 		(void)unlink(tempname);
    505 		err(EXIT_FAILURE, "Read from pipe failed");
    506 	}
    507 	if (lseek(tempfd, (off_t)0, SEEK_SET) == (off_t)-1) {
    508 		(void)close(tempfd);
    509 		(void)unlink(tempname);
    510 		err(EXIT_FAILURE, "Cannot rewind temp file");
    511 	}
    512 	if (pipe(pipefd) == -1) {
    513 		(void)close(tempfd);
    514 		(void)unlink(tempname);
    515 		err(EXIT_FAILURE, "Cannot create pipe");
    516 	}
    517 
    518 	switch (child = vfork()) {
    519 	case -1:
    520 		(void)close(pipefd[1]);
    521 		(void)close(pipefd[0]);
    522 		(void)close(tempfd);
    523 		(void)unlink(tempname);
    524 		err(EXIT_FAILURE, "Fork failed");
    525 		/* NOTREACHED */
    526 	case 0:
    527 		(void)close(pipefd[0]);
    528 		if (tempfd != STDIN_FILENO) {
    529 			(void)dup2(tempfd, STDIN_FILENO);
    530 			(void)close(tempfd);
    531 		}
    532 		if (pipefd[1] != STDOUT_FILENO) {
    533 			(void)dup2(pipefd[1], STDOUT_FILENO);
    534 			(void)close(pipefd[1]);
    535 		}
    536 		if (devnull != STDERR_FILENO) {
    537 			(void)dup2(devnull, STDERR_FILENO);
    538 			(void)close(devnull);
    539 		}
    540 		(void)execlp("nroff", "nroff", "-S", "-man", NULL);
    541 		_exit(EXIT_FAILURE);
    542 		/*NOTREACHED*/
    543 	default:
    544 		(void)close(pipefd[1]);
    545 		(void)close(tempfd);
    546 		break;
    547 	}
    548 
    549 	if ((in = gzdopen(pipefd[0], "r")) == NULL) {
    550 		if (errno == 0)
    551 			errno = ENOMEM;
    552 		(void)close(pipefd[0]);
    553 		(void)kill(child, SIGTERM);
    554 		while (waitpid(child, NULL, 0) != child);
    555 		(void)unlink(tempname);
    556 		err(EXIT_FAILURE, "Cannot read from pipe");
    557 	}
    558 
    559 	data = parsecatpage(in);
    560 	while (gzread(in, buffer, sizeof(buffer)) > 0);
    561 	(void)gzclose(in);
    562 
    563 	while (waitpid(child, &status, 0) != child);
    564 	if ((data != NULL) &&
    565 	    !(WIFEXITED(status) && (WEXITSTATUS(status) == 0))) {
    566 		free(data);
    567 		errx(EXIT_FAILURE, "nroff exited with %d status",
    568 		    WEXITSTATUS(status));
    569 	}
    570 
    571 	(void)unlink(tempname);
    572 	return data;
    573 }
    574 
    575 char *
    576 parsemanpage(gzFile *in, int defaultsection)
    577 {
    578 	char	*section, buffer[8192], *ptr;
    579 
    580 	section = NULL;
    581 	do {
    582 		if (GetS(in, buffer, sizeof(buffer) - 1) == NULL) {
    583 			free(section);
    584 			return NULL;
    585 		}
    586 		if (manpreprocess(buffer))
    587 			continue;
    588 		if (strncasecmp(buffer, ".Dt", 3) == 0) {
    589 			char	*end;
    590 
    591 			ptr = &buffer[3];
    592 			if (isspace((unsigned char)*ptr))
    593 				ptr++;
    594 			if ((ptr = findwhitespace(ptr)) == NULL)
    595 				continue;
    596 
    597 			if ((end = findwhitespace(++ptr)) != NULL)
    598 				*end = '\0';
    599 
    600 			free(section);
    601 			section = createsectionstring(ptr);
    602 		}
    603 		else if (strncasecmp(buffer, ".TH", 3) == 0) {
    604 			ptr = &buffer[3];
    605 			while (isspace((unsigned char)*ptr))
    606 				ptr++;
    607 			if ((ptr = findwhitespace(ptr)) != NULL) {
    608 				char *next;
    609 
    610 				while (isspace((unsigned char)*ptr))
    611 					ptr++;
    612 				if ((next = findwhitespace(ptr)) != NULL)
    613 					*next = '\0';
    614 				free(section);
    615 				section = createsectionstring(ptr);
    616 			}
    617 		}
    618 		else if (strncasecmp(buffer, ".Ds", 3) == 0) {
    619 			free(section);
    620 			return NULL;
    621 		}
    622 	} while (strncasecmp(buffer, ".Sh NAME", 8) != 0);
    623 
    624 	do {
    625 		if (GetS(in, buffer, sizeof(buffer) - 1) == NULL) {
    626 			free(section);
    627 			return NULL;
    628 		}
    629 	} while (manpreprocess(buffer));
    630 
    631 	if (strncasecmp(buffer, ".Nm", 3) == 0) {
    632 		size_t	length, offset;
    633 
    634 		ptr = &buffer[3];
    635 		while (isspace((unsigned char)*ptr))
    636 			ptr++;
    637 
    638 		length = strlen(ptr);
    639 		if ((length > 1) && (ptr[length - 1] == ',') &&
    640 		    isspace((unsigned char)ptr[length - 2])) {
    641 			ptr[--length] = '\0';
    642 			ptr[length - 1] = ',';
    643 		}
    644 		(void) memmove(buffer, ptr, length + 1);
    645 
    646 		offset = length + 3;
    647 		ptr = &buffer[offset];
    648 		for (;;) {
    649 			size_t	 more;
    650 
    651 			if ((sizeof(buffer) == offset) ||
    652 			    (GetS(in, ptr, sizeof(buffer) - offset)
    653 			       == NULL)) {
    654 				free(section);
    655 				return NULL;
    656 			}
    657 			if (manpreprocess(ptr))
    658 				continue;
    659 
    660 			if (strncasecmp(ptr, ".Nm", 3) != 0) break;
    661 
    662 			ptr += 3;
    663 			if (isspace((unsigned char)*ptr))
    664 				ptr++;
    665 
    666 			buffer[length++] = ' ';
    667 			more = strlen(ptr);
    668 			if ((more > 1) && (ptr[more - 1] == ',') &&
    669 			    isspace((unsigned char)ptr[more - 2])) {
    670 				ptr[--more] = '\0';
    671 				ptr[more - 1] = ',';
    672 			}
    673 
    674 			(void) memmove(&buffer[length], ptr, more + 1);
    675 			length += more;
    676 			offset = length + 3;
    677 
    678 			ptr = &buffer[offset];
    679 		}
    680 
    681 		if (strncasecmp(ptr, ".Nd", 3) == 0) {
    682 			(void) strcpy(&buffer[length], " -");
    683 
    684 			while (strncasecmp(ptr, ".Sh", 3) != 0) {
    685 				int	 more;
    686 
    687 				if (*ptr == '.') {
    688 					char	*space;
    689 
    690 					if (strncasecmp(ptr, ".Nd", 3) != 0) {
    691 						free(section);
    692 						return NULL;
    693 					}
    694 					space = findwhitespace(ptr);
    695 					if (space == NULL)
    696 						ptr = "";
    697 					else {
    698 						space++;
    699 						(void) strmove(ptr, space);
    700 					}
    701 				}
    702 
    703 				if (*ptr != '\0') {
    704 					buffer[offset - 1] = ' ';
    705 					more = strlen(ptr) + 1;
    706 					offset += more;
    707 				}
    708 				ptr = &buffer[offset];
    709 				if ((sizeof(buffer) == offset) ||
    710 				    (GetS(in, ptr, sizeof(buffer) - offset)
    711 					== NULL)) {
    712 					free(section);
    713 					return NULL;
    714 				}
    715 				if (manpreprocess(ptr))
    716 					*ptr = '\0';
    717 			}
    718 		}
    719 	}
    720 	else {
    721 		int	 offset;
    722 
    723 		if (*buffer == '.') {
    724 			char	*space;
    725 
    726 			if ((space = findwhitespace(&buffer[1])) == NULL) {
    727 				free(section);
    728 				return NULL;
    729 			}
    730 			space++;
    731 			(void) strmove(buffer, space);
    732 		}
    733 
    734 		offset = strlen(buffer) + 1;
    735 		for (;;) {
    736 			int	 more;
    737 
    738 			ptr = &buffer[offset];
    739 			if ((sizeof(buffer) == offset) ||
    740 			    (GetS(in, ptr, sizeof(buffer) - offset)
    741 				== NULL)) {
    742 				free(section);
    743 				return NULL;
    744 			}
    745 			if (manpreprocess(ptr) || (*ptr == '\0'))
    746 				continue;
    747 
    748 			if ((strncasecmp(ptr, ".Sh", 3) == 0) ||
    749 			    (strncasecmp(ptr, ".Ss", 3) == 0))
    750 				break;
    751 
    752 			if (*ptr == '.') {
    753 				char	*space;
    754 
    755 				if ((space = findwhitespace(ptr)) == NULL) {
    756 					continue;
    757 				}
    758 
    759 				space++;
    760 				(void) memmove(ptr, space, strlen(space) + 1);
    761 			}
    762 
    763 			buffer[offset - 1] = ' ';
    764 			more = strlen(ptr);
    765 			if ((more > 1) && (ptr[more - 1] == ',') &&
    766 			    isspace((unsigned char)ptr[more - 2])) {
    767 				ptr[more - 1] = '\0';
    768 				ptr[more - 2] = ',';
    769 			}
    770 			else more++;
    771 			offset += more;
    772 		}
    773 	}
    774 
    775 	if (section == NULL) {
    776 		char sectionbuffer[24];
    777 
    778 		(void) sprintf(sectionbuffer, " (%c) - ",
    779 			sectionext[defaultsection]);
    780 		ptr = replacestring(buffer, " - ", sectionbuffer);
    781 	}
    782 	else {
    783 		ptr = replacestring(buffer, " - ", section);
    784 		free(section);
    785 	}
    786 	return ptr;
    787 }
    788 
    789 char *
    790 getwhatisdata(char *name)
    791 {
    792 	gzFile	*in;
    793 	char	*data;
    794 	int	 section;
    795 
    796 	if ((in = gzopen(name, "r")) == NULL) {
    797 		if (errno == 0)
    798 			errno = ENOMEM;
    799 		err(EXIT_FAILURE, "Cannot open `%s'", name);
    800 		/* NOTREACHED */
    801 	}
    802 
    803 	section = manpagesection(name);
    804 	if (section == 0)
    805 		data = parsecatpage(in);
    806 	else {
    807 		data = parsemanpage(in, section);
    808 		if (data == NULL)
    809 			data = nroff(in);
    810 	}
    811 
    812 	(void) gzclose(in);
    813 	return data;
    814 }
    815 
    816 void
    817 processmanpages(manpage **source, whatis **dest)
    818 {
    819 	manpage *mp;
    820 
    821 	mp = *source;
    822 	*source = NULL;
    823 
    824 	while (mp != NULL) {
    825 		manpage *obsolete;
    826 		char *data;
    827 
    828 		if (mp->mp_left != NULL)
    829 			processmanpages(&mp->mp_left,dest);
    830 
    831 		if ((data = getwhatisdata(mp->mp_name)) != NULL)
    832 			addwhatis(dest,data);
    833 
    834 		obsolete = mp;
    835 		mp = mp->mp_right;
    836 		free(obsolete);
    837 	}
    838 }
    839 
    840 void
    841 dumpwhatis(FILE *out, whatis *tree)
    842 {
    843 	while (tree != NULL) {
    844 		if (tree->wi_left)
    845 			dumpwhatis(out, tree->wi_left);
    846 
    847 		if ((fputs(tree->wi_data, out) == EOF) ||
    848 		    (fputc('\n', out) == EOF))
    849 			err(EXIT_FAILURE, "Write failed");
    850 
    851 		tree = tree->wi_right;
    852 	}
    853 }
    854 
/*
 * malloc() wrapper that never returns NULL: the program is terminated
 * with an error message when the allocation fails.
 */
void *
emalloc(size_t len)
{
	void	*mem;

	mem = malloc(len);
	if (mem == NULL)
		err(EXIT_FAILURE, "malloc %lu failed", (unsigned long)len);

	return mem;
}
    863 
    864 char *
    865 estrdup(const char *str)
    866 {
    867 	char *ptr;
    868 	if ((ptr = strdup(str)) == NULL)
    869 		err(EXIT_FAILURE, "strdup failed");
    870 	return ptr;
    871 }
    872