Home | History | Annotate | Line # | Download | only in httpd
bozohttpd.c revision 1.35
      1 /*	$NetBSD: bozohttpd.c,v 1.35 2013/06/27 10:01:31 martin Exp $	*/
      2 
      3 /*	$eterna: bozohttpd.c,v 1.178 2011/11/18 09:21:15 mrg Exp $	*/
      4 
      5 /*
      6  * Copyright (c) 1997-2011 Matthew R. Green
      7  * All rights reserved.
      8  *
      9  * Redistribution and use in source and binary forms, with or without
     10  * modification, are permitted provided that the following conditions
     11  * are met:
     12  * 1. Redistributions of source code must retain the above copyright
     13  *    notice, this list of conditions and the following disclaimer.
     14  * 2. Redistributions in binary form must reproduce the above copyright
     15  *    notice, this list of conditions and the following disclaimer and
     16  *    dedication in the documentation and/or other materials provided
     17  *    with the distribution.
     18  *
     19  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
     20  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
     21  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
     22  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
     23  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
     24  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
     25  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
     26  * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
     27  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
     28  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     29  * SUCH DAMAGE.
     30  *
     31  */
     32 
     33 /* this program is dedicated to the Great God of Processed Cheese */
     34 
     35 /*
     36  * bozohttpd.c:  minimal httpd; provides only these features:
     37  *	- HTTP/0.9 (by virtue of ..)
     38  *	- HTTP/1.0
     39  *	- HTTP/1.1
     40  *	- CGI/1.1 this will only be provided for "system" scripts
     41  *	- automatic "missing trailing slash" redirections
     42  *	- configurable translation of /~user/ to ~user/public_html,
     43  *	  however, this does not include cgi-bin support
     44  *	- access lists via libwrap via inetd/tcpd
     45  *	- virtual hosting
     46  *	- note that we do not even pretend to understand MIME, but
     47  *	  rely only on the HTTP specification
     48  *	- ipv6 support
     49  *	- automatic `index.html' generation
     50  *	- configurable server name
     51  *	- directory index generation
     52  *	- daemon mode (lacks libwrap support)
     53  *	- .htpasswd support
     54  */
     55 
     56 /*
     57  * requirements for minimal http/1.1 (at least, as documented in
     58  * <draft-ietf-http-v11-spec-rev-06> which expired may 18, 1999):
     59  *
     60  *	- 14.15: content-encoding handling. [1]
     61  *
     62  *	- 14.16: content-length handling.  this is only a SHOULD header
     63  *	  thus we could just not send it ever.  [1]
     64  *
     65  *	- 14.17: content-type handling. [1]
     66  *
     67  *	- 14.25/28: if-{,un}modified-since handling.  maybe do this, but
     68  *	  i really don't want to have to parse 3 different date formats
     69  *
     70  * [1] need to revisit to ensure proper behaviour
     71  *
     72  * and the following is a list of features that we do not need
     73  * to have due to other limits, or are too lazy.  there are more
     74  * of these than are listed, but these are of particular note,
     75  * and could perhaps be implemented.
     76  *
     77  *	- 3.5/3.6: content/transfer codings.  probably can ignore
     78  *	  this?  we "SHOULD"n't.  but 4.4 says we should ignore a
     79  *	  `content-length' header upon receipt of a `transfer-encoding'
     80  *	  header.
     81  *
     82  *	- 5.1.1: request methods.  only MUST support GET and HEAD,
     83  *	  but there are new ones besides POST that are currently
     84  *	  supported: OPTIONS PUT DELETE TRACE and CONNECT, plus
     85  *	  extensions not yet known?
     86  *
     87  * 	- 10.1: we can ignore informational status codes
     88  *
     89  *	- 10.3.3/10.3.4/10.3.8:  just use '302' codes always.
     90  *
     91  *	- 14.1/14.2/14.3/14.27: we do not support Accept: headers..
     92  *	  just ignore them and send the request anyway.  they are
     93  *	  only SHOULD.
     94  *
     95  *	- 14.5/14.16/14.35: we don't do ranges.  from section 14.35.2
     96  *	  `A server MAY ignore the Range header'.  but it might be nice.
     97  *	  since 20080301 we support simple range headers.
     98  *
     99  *	- 14.9: we aren't a cache.
    100  *
    101  *	- 14.15: content-md5 would be nice...
    102  *
    103  *	- 14.24/14.26/14.27: be nice to support this...
    104  *
    105  *	- 14.44: not sure about this Vary: header.  ignore it for now.
    106  */
    107 
    108 #ifndef INDEX_HTML
    109 #define INDEX_HTML		"index.html"
    110 #endif
    111 #ifndef SERVER_SOFTWARE
    112 #define SERVER_SOFTWARE		"bozohttpd/20111118"
    113 #endif
    114 #ifndef DIRECT_ACCESS_FILE
    115 #define DIRECT_ACCESS_FILE	".bzdirect"
    116 #endif
    117 #ifndef REDIRECT_FILE
    118 #define REDIRECT_FILE		".bzredirect"
    119 #endif
    120 #ifndef ABSREDIRECT_FILE
    121 #define ABSREDIRECT_FILE	".bzabsredirect"
    122 #endif
    123 #ifndef PUBLIC_HTML
    124 #define PUBLIC_HTML		"public_html"
    125 #endif
    126 
    127 #ifndef USE_ARG
    128 #define USE_ARG(x)	/*LINTED*/(void)&(x)
    129 #endif
    130 
    131 /*
    132  * And so it begins ..
    133  */
    134 
    135 #include <sys/param.h>
    136 #include <sys/socket.h>
    137 #include <sys/time.h>
    138 #include <sys/mman.h>
    139 
    140 #include <arpa/inet.h>
    141 
    142 #include <ctype.h>
    143 #include <dirent.h>
    144 #include <errno.h>
    145 #include <fcntl.h>
    146 #include <netdb.h>
    147 #include <pwd.h>
    148 #include <grp.h>
    149 #include <signal.h>
    150 #include <stdarg.h>
    151 #include <stdlib.h>
    152 #include <string.h>
    153 #include <syslog.h>
    154 #include <time.h>
    155 #include <unistd.h>
    156 
    157 #include "bozohttpd.h"
    158 
    159 #ifndef MAX_WAIT_TIME
    160 #define	MAX_WAIT_TIME	60	/* hang around for 60 seconds max */
    161 #endif
    162 
    163 /* variables and functions */
    164 #ifndef LOG_FTP
    165 #define LOG_FTP LOG_DAEMON
    166 #endif
    167 
    168 volatile sig_atomic_t	alarmhit;
    169 
    170 /*
    171  * check there's enough space in the prefs and names arrays.
    172  */
    173 static int
    174 size_arrays(bozoprefs_t *bozoprefs, unsigned needed)
    175 {
    176 	char	**temp;
    177 
    178 	if (bozoprefs->size == 0) {
    179 		/* only get here first time around */
    180 		bozoprefs->size = needed;
    181 		if ((bozoprefs->name = calloc(sizeof(char *), needed)) == NULL) {
    182 			(void) fprintf(stderr, "size_arrays: bad alloc\n");
    183 			return 0;
    184 		}
    185 		if ((bozoprefs->value = calloc(sizeof(char *), needed)) == NULL) {
    186 			free(bozoprefs->name);
    187 			(void) fprintf(stderr, "size_arrays: bad alloc\n");
    188 			return 0;
    189 		}
    190 	} else if (bozoprefs->c == bozoprefs->size) {
    191 		/* only uses 'needed' when filled array */
    192 		bozoprefs->size += needed;
    193 		temp = realloc(bozoprefs->name, sizeof(char *) * needed);
    194 		if (temp == NULL) {
    195 			(void) fprintf(stderr, "size_arrays: bad alloc\n");
    196 			return 0;
    197 		}
    198 		bozoprefs->name = temp;
    199 		temp = realloc(bozoprefs->value, sizeof(char *) * needed);
    200 		if (temp == NULL) {
    201 			(void) fprintf(stderr, "size_arrays: bad alloc\n");
    202 			return 0;
    203 		}
    204 		bozoprefs->value = temp;
    205 	}
    206 	return 1;
    207 }
    208 
    209 static int
    210 findvar(bozoprefs_t *bozoprefs, const char *name)
    211 {
    212 	unsigned	i;
    213 
    214 	for (i = 0 ; i < bozoprefs->c && strcmp(bozoprefs->name[i], name) != 0; i++)
    215 		;
    216 	return (i == bozoprefs->c) ? -1 : (int)i;
    217 }
    218 
    219 int
    220 bozo_set_pref(bozoprefs_t *bozoprefs, const char *name, const char *value)
    221 {
    222 	int	i;
    223 
    224 	if ((i = findvar(bozoprefs, name)) < 0) {
    225 		/* add the element to the array */
    226 		if (size_arrays(bozoprefs, bozoprefs->size + 15)) {
    227 			bozoprefs->name[i = bozoprefs->c++] = strdup(name);
    228 		}
    229 	} else {
    230 		/* replace the element in the array */
    231 		if (bozoprefs->value[i]) {
    232 			free(bozoprefs->value[i]);
    233 			bozoprefs->value[i] = NULL;
    234 		}
    235 	}
    236 	/* sanity checks for range of values go here */
    237 	bozoprefs->value[i] = strdup(value);
    238 	return 1;
    239 }
    240 
    241 /*
    242  * get a variable's value, or NULL
    243  */
    244 char *
    245 bozo_get_pref(bozoprefs_t *bozoprefs, const char *name)
    246 {
    247 	int	i;
    248 
    249 	return ((i = findvar(bozoprefs, name)) < 0) ? NULL :
    250 			bozoprefs->value[i];
    251 }
    252 
/*
 * format the current time as an HTTP date (always GMT), eg
 * "Sun, 06 Nov 1994 08:49:37 GMT", into the caller's buffer `date' of
 * `datelen' bytes.
 *
 * returns `date'.  if the time cannot be converted or the buffer is too
 * small for the formatted date, `date' is set to the empty string
 * rather than being left with indeterminate contents.
 */
char *
bozo_http_date(char *date, size_t datelen)
{
	struct	tm *tm;
	time_t	now;

	/* nowhere to write even a terminator */
	if (date == NULL || datelen == 0)
		return date;

	/* Sun, 06 Nov 1994 08:49:37 GMT */
	now = time(NULL);
	tm = gmtime(&now);	/* HTTP/1.1 spec rev 06 sez GMT only */
	if (tm == NULL ||
	    strftime(date, datelen, "%a, %d %b %Y %H:%M:%S GMT", tm) == 0)
		date[0] = '\0';	/* strftime() gives no guarantees on failure */
	return date;
}
    265 
    266 /*
    267  * convert "in" into the three parts of a request (first line).
    268  * we allocate into file and query, but return pointers into
    269  * "in" for proto and method.
    270  */
    271 static void
    272 parse_request(bozohttpd_t *httpd, char *in, char **method, char **file,
    273 		char **query, char **proto)
    274 {
    275 	ssize_t	len;
    276 	char	*val;
    277 
    278 	USE_ARG(httpd);
    279 	debug((httpd, DEBUG_EXPLODING, "parse in: %s", in));
    280 	*method = *file = *query = *proto = NULL;
    281 
    282 	len = (ssize_t)strlen(in);
    283 	val = bozostrnsep(&in, " \t\n\r", &len);
    284 	if (len < 1 || val == NULL)
    285 		return;
    286 	*method = val;
    287 
    288 	while (*in == ' ' || *in == '\t')
    289 		in++;
    290 	val = bozostrnsep(&in, " \t\n\r", &len);
    291 	if (len < 1) {
    292 		if (len == 0)
    293 			*file = val;
    294 		else
    295 			*file = in;
    296 	} else {
    297 		*file = val;
    298 
    299 		*query = strchr(*file, '?');
    300 		if (*query)
    301 			*(*query)++ = '\0';
    302 
    303 		if (in) {
    304 			while (*in && (*in == ' ' || *in == '\t'))
    305 				in++;
    306 			if (*in)
    307 				*proto = in;
    308 		}
    309 	}
    310 
    311 	/* allocate private copies */
    312 	*file = bozostrdup(httpd, *file);
    313 	if (*query)
    314 		*query = bozostrdup(httpd, *query);
    315 
    316 	debug((httpd, DEBUG_FAT,
    317 		"url: method: \"%s\" file: \"%s\" query: \"%s\" proto: \"%s\"",
    318 		*method, *file, *query, *proto));
    319 }
    320 
    321 /*
    322  * cleanup a bozo_httpreq_t after use
    323  */
    324 void
    325 bozo_clean_request(bozo_httpreq_t *request)
    326 {
    327 	struct bozoheaders *hdr, *ohdr = NULL;
    328 
    329 	if (request == NULL)
    330 		return;
    331 
    332 	/* If SSL enabled cleanup SSL structure. */
    333 	bozo_ssl_destroy(request->hr_httpd);
    334 
    335 	/* clean up request */
    336 #define MF(x)	if (request->x) free(request->x)
    337 	MF(hr_remotehost);
    338 	MF(hr_remoteaddr);
    339 	MF(hr_serverport);
    340 	MF(hr_virthostname);
    341 	MF(hr_file);
    342 	MF(hr_oldfile);
    343 	MF(hr_query);
    344 #undef MF
    345 	bozo_auth_cleanup(request);
    346 	for (hdr = SIMPLEQ_FIRST(&request->hr_headers); hdr;
    347 	    hdr = SIMPLEQ_NEXT(hdr, h_next)) {
    348 		free(hdr->h_value);
    349 		free(hdr->h_header);
    350 		if (ohdr)
    351 			free(ohdr);
    352 		ohdr = hdr;
    353 	}
    354 	if (ohdr)
    355 		free(ohdr);
    356 
    357 	free(request);
    358 }
    359 
    360 /*
    361  * send a HTTP/1.1 408 response if we timeout.
    362  */
    363 /* ARGSUSED */
    364 static void
    365 alarmer(int sig)
    366 {
    367 	alarmhit = 1;
    368 }
    369 
    370 /*
    371  * add or merge this header (val: str) into the requests list
    372  */
    373 static bozoheaders_t *
    374 addmerge_header(bozo_httpreq_t *request, char *val,
    375 		char *str, ssize_t len)
    376 {
    377 	struct	bozoheaders *hdr;
    378 
    379 	USE_ARG(len);
    380 	/* do we exist already? */
    381 	SIMPLEQ_FOREACH(hdr, &request->hr_headers, h_next) {
    382 		if (strcasecmp(val, hdr->h_header) == 0)
    383 			break;
    384 	}
    385 
    386 	if (hdr) {
    387 		/* yup, merge it in */
    388 		char *nval;
    389 
    390 		if (asprintf(&nval, "%s, %s", hdr->h_value, str) == -1) {
    391 			(void)bozo_http_error(request->hr_httpd, 500, NULL,
    392 			     "memory allocation failure");
    393 			return NULL;
    394 		}
    395 		free(hdr->h_value);
    396 		hdr->h_value = nval;
    397 	} else {
    398 		/* nope, create a new one */
    399 
    400 		hdr = bozomalloc(request->hr_httpd, sizeof *hdr);
    401 		hdr->h_header = bozostrdup(request->hr_httpd, val);
    402 		if (str && *str)
    403 			hdr->h_value = bozostrdup(request->hr_httpd, str);
    404 		else
    405 			hdr->h_value = bozostrdup(request->hr_httpd, " ");
    406 
    407 		SIMPLEQ_INSERT_TAIL(&request->hr_headers, hdr, h_next);
    408 		request->hr_nheaders++;
    409 	}
    410 
    411 	return hdr;
    412 }
    413 
    414 /*
    415  * as the prototype string is not constant (eg, "HTTP/1.1" is equivalent
    416  * to "HTTP/001.01"), we MUST parse this.
    417  */
    418 static int
    419 process_proto(bozo_httpreq_t *request, const char *proto)
    420 {
    421 	char	majorstr[16], *minorstr;
    422 	int	majorint, minorint;
    423 
    424 	if (proto == NULL) {
    425 got_proto_09:
    426 		request->hr_proto = request->hr_httpd->consts.http_09;
    427 		debug((request->hr_httpd, DEBUG_FAT, "request %s is http/0.9",
    428 			request->hr_file));
    429 		return 0;
    430 	}
    431 
    432 	if (strncasecmp(proto, "HTTP/", 5) != 0)
    433 		goto bad;
    434 	strncpy(majorstr, proto + 5, sizeof majorstr);
    435 	majorstr[sizeof(majorstr)-1] = 0;
    436 	minorstr = strchr(majorstr, '.');
    437 	if (minorstr == NULL)
    438 		goto bad;
    439 	*minorstr++ = 0;
    440 
    441 	majorint = atoi(majorstr);
    442 	minorint = atoi(minorstr);
    443 
    444 	switch (majorint) {
    445 	case 0:
    446 		if (minorint != 9)
    447 			break;
    448 		goto got_proto_09;
    449 	case 1:
    450 		if (minorint == 0)
    451 			request->hr_proto = request->hr_httpd->consts.http_10;
    452 		else if (minorint == 1)
    453 			request->hr_proto = request->hr_httpd->consts.http_11;
    454 		else
    455 			break;
    456 
    457 		debug((request->hr_httpd, DEBUG_FAT, "request %s is %s",
    458 		    request->hr_file, request->hr_proto));
    459 		SIMPLEQ_INIT(&request->hr_headers);
    460 		request->hr_nheaders = 0;
    461 		return 0;
    462 	}
    463 bad:
    464 	return bozo_http_error(request->hr_httpd, 404, NULL, "unknown prototype");
    465 }
    466 
    467 /*
    468  * process each type of HTTP method, setting this HTTP requests
    469  # method type.
    470  */
    471 static struct method_map {
    472 	const char *name;
    473 	int	type;
    474 } method_map[] = {
    475 	{ "GET", 	HTTP_GET, },
    476 	{ "POST",	HTTP_POST, },
    477 	{ "HEAD",	HTTP_HEAD, },
    478 #if 0	/* other non-required http/1.1 methods */
    479 	{ "OPTIONS",	HTTP_OPTIONS, },
    480 	{ "PUT",	HTTP_PUT, },
    481 	{ "DELETE",	HTTP_DELETE, },
    482 	{ "TRACE",	HTTP_TRACE, },
    483 	{ "CONNECT",	HTTP_CONNECT, },
    484 #endif
    485 	{ NULL,		0, },
    486 };
    487 
    488 static int
    489 process_method(bozo_httpreq_t *request, const char *method)
    490 {
    491 	struct	method_map *mmp;
    492 
    493 	if (request->hr_proto == request->hr_httpd->consts.http_11)
    494 		request->hr_allow = "GET, HEAD, POST";
    495 
    496 	for (mmp = method_map; mmp->name; mmp++)
    497 		if (strcasecmp(method, mmp->name) == 0) {
    498 			request->hr_method = mmp->type;
    499 			request->hr_methodstr = mmp->name;
    500 			return 0;
    501 		}
    502 
    503 	return bozo_http_error(request->hr_httpd, 404, request, "unknown method");
    504 }
    505 
    506 /*
    507  * This function reads a http request from stdin, returning a pointer to a
    508  * bozo_httpreq_t structure, describing the request.
    509  */
    510 bozo_httpreq_t *
    511 bozo_read_request(bozohttpd_t *httpd)
    512 {
    513 	struct	sigaction	sa;
    514 	char	*str, *val, *method, *file, *proto, *query;
    515 	char	*host, *addr, *port;
    516 	char	bufport[10];
    517 	char	hbuf[NI_MAXHOST], abuf[NI_MAXHOST];
    518 	struct	sockaddr_storage ss;
    519 	ssize_t	len;
    520 	int	line = 0;
    521 	socklen_t slen;
    522 	bozo_httpreq_t *request;
    523 
    524 	/*
    525 	 * if we're in daemon mode, bozo_daemon_fork() will return here twice
    526 	 * for each call.  once in the child, returning 0, and once in the
    527 	 * parent, returning 1.  for each child, then we can setup SSL, and
    528 	 * the parent can signal the caller there was no request to process
    529 	 * and it will wait for another.
    530 	 */
    531 	if (bozo_daemon_fork(httpd))
    532 		return NULL;
    533 	bozo_ssl_accept(httpd);
    534 
    535 	request = bozomalloc(httpd, sizeof(*request));
    536 	memset(request, 0, sizeof(*request));
    537 	request->hr_httpd = httpd;
    538 	request->hr_allow = request->hr_host = NULL;
    539 	request->hr_content_type = request->hr_content_length = NULL;
    540 	request->hr_range = NULL;
    541 	request->hr_last_byte_pos = -1;
    542 	request->hr_if_modified_since = NULL;
    543 	request->hr_virthostname = NULL;
    544 	request->hr_file = NULL;
    545 	request->hr_oldfile = NULL;
    546 
    547 	slen = sizeof(ss);
    548 	if (getpeername(0, (struct sockaddr *)(void *)&ss, &slen) < 0)
    549 		host = addr = NULL;
    550 	else {
    551 		if (getnameinfo((struct sockaddr *)(void *)&ss, slen,
    552 		    abuf, sizeof abuf, NULL, 0, NI_NUMERICHOST) == 0)
    553 			addr = abuf;
    554 		else
    555 			addr = NULL;
    556 		if (httpd->numeric == 0 &&
    557 		    getnameinfo((struct sockaddr *)(void *)&ss, slen,
    558 				hbuf, sizeof hbuf, NULL, 0, 0) == 0)
    559 			host = hbuf;
    560 		else
    561 			host = NULL;
    562 	}
    563 	if (host != NULL)
    564 		request->hr_remotehost = bozostrdup(request->hr_httpd, host);
    565 	if (addr != NULL)
    566 		request->hr_remoteaddr = bozostrdup(request->hr_httpd, addr);
    567 	slen = sizeof(ss);
    568 
    569 	/*
    570 	 * Override the bound port from the request value, so it works even
    571 	 * if passed through a proxy that doesn't rewrite the port.
    572 	 */
    573 	if (httpd->bindport) {
    574 		if (strcmp(httpd->bindport, "80") != 0)
    575 			port = httpd->bindport;
    576 		else
    577 			port = NULL;
    578 	} else {
    579 		if (getsockname(0, (struct sockaddr *)(void *)&ss, &slen) < 0)
    580 			port = NULL;
    581 		else {
    582 			if (getnameinfo((struct sockaddr *)(void *)&ss, slen, NULL, 0,
    583 					bufport, sizeof bufport, NI_NUMERICSERV) == 0)
    584 				port = bufport;
    585 			else
    586 				port = NULL;
    587 		}
    588 	}
    589 	if (port != NULL)
    590 		request->hr_serverport = bozostrdup(request->hr_httpd, port);
    591 
    592 	/*
    593 	 * setup a timer to make sure the request is not hung
    594 	 */
    595 	sa.sa_handler = alarmer;
    596 	sigemptyset(&sa.sa_mask);
    597 	sigaddset(&sa.sa_mask, SIGALRM);
    598 	sa.sa_flags = 0;
    599 	sigaction(SIGALRM, &sa, NULL);	/* XXX */
    600 
    601 	alarm(MAX_WAIT_TIME);
    602 	while ((str = bozodgetln(httpd, STDIN_FILENO, &len, bozo_read)) != NULL) {
    603 		alarm(0);
    604 		if (alarmhit) {
    605 			(void)bozo_http_error(httpd, 408, NULL,
    606 					"request timed out");
    607 			goto cleanup;
    608 		}
    609 		line++;
    610 
    611 		if (line == 1) {
    612 
    613 			if (len < 1) {
    614 				(void)bozo_http_error(httpd, 404, NULL,
    615 						"null method");
    616 				goto cleanup;
    617 			}
    618 
    619 			bozo_warn(httpd, "got request ``%s'' from host %s to port %s",
    620 				str,
    621 				host ? host : addr ? addr : "<local>",
    622 				port ? port : "<stdin>");
    623 
    624 			/* we allocate return space in file and query only */
    625 			parse_request(httpd, str, &method, &file, &query, &proto);
    626 			request->hr_file = file;
    627 			request->hr_query = query;
    628 			if (method == NULL) {
    629 				(void)bozo_http_error(httpd, 404, NULL,
    630 						"null method");
    631 				goto cleanup;
    632 			}
    633 			if (file == NULL) {
    634 				(void)bozo_http_error(httpd, 404, NULL,
    635 						"null file");
    636 				goto cleanup;
    637 			}
    638 
    639 			/*
    640 			 * note that we parse the proto first, so that we
    641 			 * can more properly parse the method and the url.
    642 			 */
    643 
    644 			if (process_proto(request, proto) ||
    645 			    process_method(request, method)) {
    646 				goto cleanup;
    647 			}
    648 
    649 			debug((httpd, DEBUG_FAT, "got file \"%s\" query \"%s\"",
    650 			    request->hr_file,
    651 			    request->hr_query ? request->hr_query : "<none>"));
    652 
    653 			/* http/0.9 has no header processing */
    654 			if (request->hr_proto == httpd->consts.http_09)
    655 				break;
    656 		} else {		/* incoming headers */
    657 			bozoheaders_t *hdr;
    658 
    659 			if (*str == '\0')
    660 				break;
    661 
    662 			val = bozostrnsep(&str, ":", &len);
    663 			debug((httpd, DEBUG_EXPLODING,
    664 			    "read_req2: after bozostrnsep: str ``%s'' val ``%s''",
    665 			    str, val));
    666 			if (val == NULL || len == -1) {
    667 				(void)bozo_http_error(httpd, 404, request,
    668 						"no header");
    669 				goto cleanup;
    670 			}
    671 			while (*str == ' ' || *str == '\t')
    672 				len--, str++;
    673 			while (*val == ' ' || *val == '\t')
    674 				val++;
    675 
    676 			if (bozo_auth_check_headers(request, val, str, len))
    677 				goto next_header;
    678 
    679 			hdr = addmerge_header(request, val, str, len);
    680 
    681 			if (strcasecmp(hdr->h_header, "content-type") == 0)
    682 				request->hr_content_type = hdr->h_value;
    683 			else if (strcasecmp(hdr->h_header, "content-length") == 0)
    684 				request->hr_content_length = hdr->h_value;
    685 			else if (strcasecmp(hdr->h_header, "host") == 0)
    686 				request->hr_host = hdr->h_value;
    687 			/* HTTP/1.1 rev06 draft spec: 14.20 */
    688 			else if (strcasecmp(hdr->h_header, "expect") == 0) {
    689 				(void)bozo_http_error(httpd, 417, request,
    690 						"we don't support Expect:");
    691 				goto cleanup;
    692 			}
    693 			else if (strcasecmp(hdr->h_header, "referrer") == 0 ||
    694 			         strcasecmp(hdr->h_header, "referer") == 0)
    695 				request->hr_referrer = hdr->h_value;
    696 			else if (strcasecmp(hdr->h_header, "range") == 0)
    697 				request->hr_range = hdr->h_value;
    698 			else if (strcasecmp(hdr->h_header,
    699 					"if-modified-since") == 0)
    700 				request->hr_if_modified_since = hdr->h_value;
    701 			else if (strcasecmp(hdr->h_header,
    702 					"accept-encoding") == 0)
    703 				request->hr_accept_encoding = hdr->h_value;
    704 
    705 			debug((httpd, DEBUG_FAT, "adding header %s: %s",
    706 			    hdr->h_header, hdr->h_value));
    707 		}
    708 next_header:
    709 		alarm(MAX_WAIT_TIME);
    710 	}
    711 
    712 	/* now, clear it all out */
    713 	alarm(0);
    714 	signal(SIGALRM, SIG_DFL);
    715 
    716 	/* RFC1945, 8.3 */
    717 	if (request->hr_method == HTTP_POST &&
    718 	    request->hr_content_length == NULL) {
    719 		(void)bozo_http_error(httpd, 400, request,
    720 				"missing content length");
    721 		goto cleanup;
    722 	}
    723 
    724 	/* HTTP/1.1 draft rev-06, 14.23 & 19.6.1.1 */
    725 	if (request->hr_proto == httpd->consts.http_11 &&
    726 	    request->hr_host == NULL) {
    727 		(void)bozo_http_error(httpd, 400, request,
    728 				"missing Host header");
    729 		goto cleanup;
    730 	}
    731 
    732 	if (request->hr_range != NULL) {
    733 		debug((httpd, DEBUG_FAT, "hr_range: %s", request->hr_range));
    734 		/* support only simple ranges %d- and %d-%d */
    735 		if (strchr(request->hr_range, ',') == NULL) {
    736 			const char *rstart, *dash;
    737 
    738 			rstart = strchr(request->hr_range, '=');
    739 			if (rstart != NULL) {
    740 				rstart++;
    741 				dash = strchr(rstart, '-');
    742 				if (dash != NULL && dash != rstart) {
    743 					dash++;
    744 					request->hr_have_range = 1;
    745 					request->hr_first_byte_pos =
    746 					    strtoll(rstart, NULL, 10);
    747 					if (request->hr_first_byte_pos < 0)
    748 						request->hr_first_byte_pos = 0;
    749 					if (*dash != '\0') {
    750 						request->hr_last_byte_pos =
    751 						    strtoll(dash, NULL, 10);
    752 						if (request->hr_last_byte_pos < 0)
    753 							request->hr_last_byte_pos = -1;
    754 					}
    755 				}
    756 			}
    757 		}
    758 	}
    759 
    760 	debug((httpd, DEBUG_FAT, "bozo_read_request returns url %s in request",
    761 	       request->hr_file));
    762 	return request;
    763 
    764 cleanup:
    765 	bozo_clean_request(request);
    766 
    767 	return NULL;
    768 }
    769 
    770 static int
    771 mmap_and_write_part(bozohttpd_t *httpd, int fd, off_t first_byte_pos, size_t sz)
    772 {
    773 	size_t mappedsz, wroffset;
    774 	off_t mappedoffset;
    775 	char *addr;
    776 	void *mappedaddr;
    777 
    778 	/*
    779 	 * we need to ensure that both the size *and* offset arguments to
    780 	 * mmap() are page-aligned.  our formala for this is:
    781 	 *
    782 	 *    input offset: first_byte_pos
    783 	 *    input size: sz
    784 	 *
    785 	 *    mapped offset = page align truncate (input offset)
    786 	 *    mapped size   =
    787 	 *        page align extend (input offset - mapped offset + input size)
    788 	 *    write offset  = input offset - mapped offset
    789 	 *
    790 	 * we use the write offset in all writes
    791 	 */
    792 	mappedoffset = first_byte_pos & ~(httpd->page_size - 1);
    793 	mappedsz = (size_t)
    794 		(first_byte_pos - mappedoffset + sz + httpd->page_size - 1) &
    795 		~(httpd->page_size - 1);
    796 	wroffset = (size_t)(first_byte_pos - mappedoffset);
    797 
    798 	addr = mmap(0, mappedsz, PROT_READ, MAP_SHARED, fd, mappedoffset);
    799 	if (addr == (char *)-1) {
    800 		bozo_warn(httpd, "mmap failed: %s", strerror(errno));
    801 		return -1;
    802 	}
    803 	mappedaddr = addr;
    804 
    805 #ifdef MADV_SEQUENTIAL
    806 	(void)madvise(addr, sz, MADV_SEQUENTIAL);
    807 #endif
    808 	while (sz > BOZO_WRSZ) {
    809 		if (bozo_write(httpd, STDOUT_FILENO, addr + wroffset,
    810 				BOZO_WRSZ) != BOZO_WRSZ) {
    811 			bozo_warn(httpd, "write failed: %s", strerror(errno));
    812 			goto out;
    813 		}
    814 		debug((httpd, DEBUG_OBESE, "wrote %d bytes", BOZO_WRSZ));
    815 		sz -= BOZO_WRSZ;
    816 		addr += BOZO_WRSZ;
    817 	}
    818 	if (sz && (size_t)bozo_write(httpd, STDOUT_FILENO, addr + wroffset,
    819 				sz) != sz) {
    820 		bozo_warn(httpd, "final write failed: %s", strerror(errno));
    821 		goto out;
    822 	}
    823 	debug((httpd, DEBUG_OBESE, "wrote %d bytes", (int)sz));
    824  out:
    825 	if (munmap(mappedaddr, mappedsz) < 0) {
    826 		bozo_warn(httpd, "munmap failed");
    827 		return -1;
    828 	}
    829 
    830 	return 0;
    831 }
    832 
/*
 * parse the HTTP date string `val' and store it in *timestamp as
 * seconds since the epoch, interpreting the broken-down time as UTC.
 *
 * three layouts are tried in turn, eg:
 *	Sun, 06 Nov 1994 08:49:37 GMT
 *	Sun, 06-Nov-94 08:49:37 GMT
 *	Sun Nov  6 08:49:37 1994
 *
 * returns 1 on success.  returns 0, leaving *timestamp untouched, if
 * `val' is NULL, matches none of the layouts, or has anything after
 * the date.
 */
static int
parse_http_date(const char *val, time_t *timestamp)
{
	static const char *const formats[] = {
		"%a, %d %b %Y %T GMT",
		"%a, %d-%b-%y %T GMT",
		"%a %b %d %T %Y",
	};
	const char *remainder = NULL;
	struct tm tm;
	size_t i;

	if (val == NULL)
		return 0;

	for (i = 0; i < sizeof(formats) / sizeof(formats[0]); i++) {
		/*
		 * strptime() only fills in the fields its format names, so
		 * start every attempt from a clean struct.
		 */
		memset(&tm, 0, sizeof(tm));
		remainder = strptime(val, formats[i], &tm);
		if (remainder != NULL)
			break;
	}

	if (remainder == NULL)
		return 0; /* Invalid HTTP date format */

	if (*remainder)
		return 0; /* No trailing garbage */

	*timestamp = timegm(&tm);
	return 1;
}
    850 
    851 /*
    852  * given an url, encode it ala rfc 3986.  ie, escape ? and friends.
    853  * note that this function returns a static buffer, and thus needs
    854  * to be updated for any sort of parallel processing.
    855  */
    856 char *
    857 escape_rfc3986(bozohttpd_t *httpd, const char *url)
    858 {
    859 	static char *buf;
    860 	static size_t buflen = 0;
    861 	size_t len;
    862 	const char *s;
    863 	char *d;
    864 
    865 	len = strlen(url);
    866 	if (buflen < len * 3 + 1) {
    867 		buflen = len * 3 + 1;
    868 		buf = bozorealloc(httpd, buf, buflen);
    869 	}
    870 
    871 	if (url == NULL) {
    872 		buf[0] = 0;
    873 		return buf;
    874 	}
    875 
    876 	for (len = 0, s = url, d = buf; *s;) {
    877 		if (*s & 0x80)
    878 			goto encode_it;
    879 		switch (*s) {
    880 		case ':':
    881 		case '/':
    882 		case '?':
    883 		case '#':
    884 		case '[':
    885 		case ']':
    886 		case '@':
    887 		case '!':
    888 		case '$':
    889 		case '&':
    890 		case '\'':
    891 		case '(':
    892 		case ')':
    893 		case '*':
    894 		case '+':
    895 		case ',':
    896 		case ';':
    897 		case '=':
    898 		case '%':
    899 		encode_it:
    900 			snprintf(d, 4, "%%%2X", *s++);
    901 			d += 3;
    902 			len += 3;
    903 			break;
    904 		default:
    905 			*d++ = *s++;
    906 			len++;
    907 			break;
    908 		}
    909 	}
    910 	buf[len] = 0;
    911 
    912 	return buf;
    913 }
    914 
    915 /*
    916  * checks to see if this request has a valid .bzdirect file.  returns
    917  * 0 on failure and 1 on success.
    918  */
    919 static int
    920 check_direct_access(bozo_httpreq_t *request)
    921 {
    922 	FILE *fp;
    923 	struct stat sb;
    924 	char dir[MAXPATHLEN], dirfile[MAXPATHLEN], *basename;
    925 
    926 	snprintf(dir, sizeof(dir), "%s", request->hr_file + 1);
    927 	debug((request->hr_httpd, DEBUG_FAT, "check_bzredirect: dir %s", dir));
    928 	basename = strrchr(dir, '/');
    929 
    930 	if ((!basename || basename[1] != '\0') &&
    931 	    lstat(dir, &sb) == 0 && S_ISDIR(sb.st_mode))
    932 		/* nothing */;
    933 	else if (basename == NULL)
    934 		strcpy(dir, ".");
    935 	else {
    936 		*basename++ = '\0';
    937 		bozo_check_special_files(request, basename);
    938 	}
    939 
    940 	snprintf(dirfile, sizeof(dirfile), "%s/%s", dir, DIRECT_ACCESS_FILE);
    941 	if (stat(dirfile, &sb) < 0 ||
    942 	    (fp = fopen(dirfile, "r")) == NULL)
    943 		return 0;
    944 	fclose(fp);
    945 	return 1;
    946 }
    947 
    948 /*
    949  * do automatic redirection -- if there are query parameters for the URL
    950  * we will tack these on to the new (redirected) URL.
    951  */
    952 static void
    953 handle_redirect(bozo_httpreq_t *request,
    954 		const char *url, int absolute)
    955 {
    956 	bozohttpd_t *httpd = request->hr_httpd;
    957 	char *urlbuf;
    958 	char portbuf[20];
    959 	const char *hostname = BOZOHOST(httpd, request);
    960 	int query = 0;
    961 
    962 	if (url == NULL) {
    963 		if (asprintf(&urlbuf, "/%s/", request->hr_file) < 0)
    964 			bozo_err(httpd, 1, "asprintf");
    965 		url = urlbuf;
    966 	} else
    967 		urlbuf = NULL;
    968 	url = escape_rfc3986(request->hr_httpd, url);
    969 
    970 	if (request->hr_query && strlen(request->hr_query))
    971 		query = 1;
    972 
    973 	if (request->hr_serverport && strcmp(request->hr_serverport, "80") != 0)
    974 		snprintf(portbuf, sizeof(portbuf), ":%s",
    975 		    request->hr_serverport);
    976 	else
    977 		portbuf[0] = '\0';
    978 	bozo_warn(httpd, "redirecting %s%s%s", hostname, portbuf, url);
    979 	debug((httpd, DEBUG_FAT, "redirecting %s", url));
    980 	bozo_printf(httpd, "%s 301 Document Moved\r\n", request->hr_proto);
    981 	if (request->hr_proto != httpd->consts.http_09)
    982 		bozo_print_header(request, NULL, "text/html", NULL);
    983 	if (request->hr_proto != httpd->consts.http_09) {
    984 		bozo_printf(httpd, "Location: http://");
    985 		if (absolute == 0)
    986 			bozo_printf(httpd, "%s%s", hostname, portbuf);
    987 		if (query) {
    988 			bozo_printf(httpd, "%s?%s\r\n", url, request->hr_query);
    989 		} else {
    990 			bozo_printf(httpd, "%s\r\n", url);
    991 		}
    992 	}
    993 	bozo_printf(httpd, "\r\n");
    994 	if (request->hr_method == HTTP_HEAD)
    995 		goto head;
    996 	bozo_printf(httpd, "<html><head><title>Document Moved</title></head>\n");
    997 	bozo_printf(httpd, "<body><h1>Document Moved</h1>\n");
    998 	bozo_printf(httpd, "This document had moved <a href=\"http://");
    999 	if (query) {
   1000 		if (absolute)
   1001 			bozo_printf(httpd, "%s?%s", url, request->hr_query);
   1002 		else
   1003 			bozo_printf(httpd, "%s%s%s?%s", hostname,
   1004 				    portbuf, url, request->hr_query);
   1005 	} else {
   1006 		if (absolute)
   1007 			bozo_printf(httpd, "%s", url);
   1008 		else
   1009 			bozo_printf(httpd, "%s%s%s", hostname,
   1010 				    portbuf, url);
   1011 	}
   1012 	bozo_printf(httpd, "\">here</a>\n");
   1013 	bozo_printf(httpd, "</body></html>\n");
   1014 head:
   1015 	bozo_flush(httpd, stdout);
   1016 	if (urlbuf)
   1017 		free(urlbuf);
   1018 }
   1019 
   1020 /*
   1021  * deal with virtual host names; we do this:
   1022  *	if we have a virtual path root (httpd->virtbase), and we are given a
   1023  *	virtual host spec (Host: ho.st or http://ho.st/), see if this
   1024  *	directory exists under httpd->virtbase.  if it does, use this as the
   1025  #	new slashdir.
   1026  */
   1027 static int
   1028 check_virtual(bozo_httpreq_t *request)
   1029 {
   1030 	bozohttpd_t *httpd = request->hr_httpd;
   1031 	char *file = request->hr_file, *s;
   1032 	size_t len;
   1033 
   1034 	if (!httpd->virtbase)
   1035 		goto use_slashdir;
   1036 
   1037 	/*
   1038 	 * convert http://virtual.host/ to request->hr_host
   1039 	 */
   1040 	debug((httpd, DEBUG_OBESE, "checking for http:// virtual host in ``%s''",
   1041 			file));
   1042 	if (strncasecmp(file, "http://", 7) == 0) {
   1043 		/* we would do virtual hosting here? */
   1044 		file += 7;
   1045 		s = strchr(file, '/');
   1046 		/* HTTP/1.1 draft rev-06, 5.2: URI takes precedence over Host: */
   1047 		request->hr_host = file;
   1048 		request->hr_file = bozostrdup(request->hr_httpd, s ? s : "/");
   1049 		debug((httpd, DEBUG_OBESE, "got host ``%s'' file is now ``%s''",
   1050 		    request->hr_host, request->hr_file));
   1051 	} else if (!request->hr_host)
   1052 		goto use_slashdir;
   1053 
   1054 	/*
   1055 	 * ok, we have a virtual host, use scandir(3) to find a case
   1056 	 * insensitive match for the virtual host we are asked for.
   1057 	 * note that if the virtual host is the same as the master,
   1058 	 * we don't need to do anything special.
   1059 	 */
   1060 	len = strlen(request->hr_host);
   1061 	debug((httpd, DEBUG_OBESE,
   1062 	    "check_virtual: checking host `%s' under httpd->virtbase `%s' "
   1063 	    "for file `%s'",
   1064 	    request->hr_host, httpd->virtbase, request->hr_file));
   1065 	if (strncasecmp(httpd->virthostname, request->hr_host, len) != 0) {
   1066 		s = 0;
   1067 		DIR *dirp;
   1068 		struct dirent *d;
   1069 
   1070 		if ((dirp = opendir(httpd->virtbase)) != NULL) {
   1071 			while ((d = readdir(dirp)) != NULL) {
   1072 				if (strcmp(d->d_name, ".") == 0 ||
   1073 				    strcmp(d->d_name, "..") == 0) {
   1074 					continue;
   1075 				}
   1076 				debug((httpd, DEBUG_OBESE, "looking at dir``%s''",
   1077 			 	   d->d_name));
   1078 				if (strncasecmp(d->d_name, request->hr_host,
   1079 				    len) == 0) {
   1080 					/* found it, punch it */
   1081 					debug((httpd, DEBUG_OBESE, "found it punch it"));
   1082 					request->hr_virthostname =
   1083 					    bozostrdup(httpd,d->d_name);
   1084 					if (asprintf(&s, "%s/%s", httpd->virtbase,
   1085 					    request->hr_virthostname) < 0)
   1086 						bozo_err(httpd, 1, "asprintf");
   1087 					break;
   1088 				}
   1089 			}
   1090 			closedir(dirp);
   1091 		}
   1092 		else {
   1093 			debug((httpd, DEBUG_FAT, "opendir %s failed: %s",
   1094 			    httpd->virtbase, strerror(errno)));
   1095 		}
   1096 		if (s == 0) {
   1097 			if (httpd->unknown_slash)
   1098 				goto use_slashdir;
   1099 			return bozo_http_error(httpd, 404, request,
   1100 						"unknown URL");
   1101 		}
   1102 	} else
   1103 use_slashdir:
   1104 		s = httpd->slashdir;
   1105 
   1106 	/*
   1107 	 * ok, nailed the correct slashdir, chdir to it
   1108 	 */
   1109 	if (chdir(s) < 0)
   1110 		return bozo_http_error(httpd, 404, request,
   1111 					"can't chdir to slashdir");
   1112 	return 0;
   1113 }
   1114 
   1115 /*
   1116  * checks to see if this request has a valid .bzredirect file.  returns
   1117  * 0 on failure and 1 on success.
   1118  */
   1119 static void
   1120 check_bzredirect(bozo_httpreq_t *request)
   1121 {
   1122 	struct stat sb;
   1123 	char dir[MAXPATHLEN], redir[MAXPATHLEN], redirpath[MAXPATHLEN + 1];
   1124 	char *basename, *finalredir;
   1125 	int rv, absolute;
   1126 
   1127 	/*
   1128 	 * if this pathname is really a directory, but doesn't end in /,
   1129 	 * use it as the directory to look for the redir file.
   1130 	 */
   1131 	snprintf(dir, sizeof(dir), "%s", request->hr_file + 1);
   1132 	debug((request->hr_httpd, DEBUG_FAT, "check_bzredirect: dir %s", dir));
   1133 	basename = strrchr(dir, '/');
   1134 
   1135 	if ((!basename || basename[1] != '\0') &&
   1136 	    lstat(dir, &sb) == 0 && S_ISDIR(sb.st_mode))
   1137 		/* nothing */;
   1138 	else if (basename == NULL)
   1139 		strcpy(dir, ".");
   1140 	else {
   1141 		*basename++ = '\0';
   1142 		bozo_check_special_files(request, basename);
   1143 	}
   1144 
   1145 	snprintf(redir, sizeof(redir), "%s/%s", dir, REDIRECT_FILE);
   1146 	if (lstat(redir, &sb) == 0) {
   1147 		if (!S_ISLNK(sb.st_mode))
   1148 			return;
   1149 		absolute = 0;
   1150 	} else {
   1151 		snprintf(redir, sizeof(redir), "%s/%s", dir, ABSREDIRECT_FILE);
   1152 		if (lstat(redir, &sb) < 0 || !S_ISLNK(sb.st_mode))
   1153 			return;
   1154 		absolute = 1;
   1155 	}
   1156 	debug((request->hr_httpd, DEBUG_FAT,
   1157 	       "check_bzredirect: calling readlink"));
   1158 	rv = readlink(redir, redirpath, sizeof redirpath - 1);
   1159 	if (rv == -1 || rv == 0) {
   1160 		debug((request->hr_httpd, DEBUG_FAT, "readlink failed"));
   1161 		return;
   1162 	}
   1163 	redirpath[rv] = '\0';
   1164 	debug((request->hr_httpd, DEBUG_FAT,
   1165 	       "readlink returned \"%s\"", redirpath));
   1166 
   1167 	/* now we have the link pointer, redirect to the real place */
   1168 	if (absolute)
   1169 		finalredir = redirpath;
   1170 	else
   1171 		snprintf(finalredir = redir, sizeof(redir), "/%s/%s", dir,
   1172 			 redirpath);
   1173 
   1174 	debug((request->hr_httpd, DEBUG_FAT,
   1175 	       "check_bzredirect: new redir %s", finalredir));
   1176 	handle_redirect(request, finalredir, absolute);
   1177 }
   1178 
   1179 /* this fixes the %HH hack that RFC2396 requires.  */
   1180 static void
   1181 fix_url_percent(bozo_httpreq_t *request)
   1182 {
   1183 	bozohttpd_t *httpd = request->hr_httpd;
   1184 	char	*s, *t, buf[3], *url;
   1185 	char	*end;	/* if end is not-zero, we don't translate beyond that */
   1186 
   1187 	url = request->hr_file;
   1188 
   1189 	end = url + strlen(url);
   1190 
   1191 	/* fast forward to the first % */
   1192 	if ((s = strchr(url, '%')) == NULL)
   1193 		return;
   1194 
   1195 	t = s;
   1196 	do {
   1197 		if (end && s >= end) {
   1198 			debug((httpd, DEBUG_EXPLODING,
   1199 				"fu_%%: past end, filling out.."));
   1200 			while (*s)
   1201 				*t++ = *s++;
   1202 			break;
   1203 		}
   1204 		debug((httpd, DEBUG_EXPLODING,
   1205 			"fu_%%: got s == %%, s[1]s[2] == %c%c",
   1206 			s[1], s[2]));
   1207 		if (s[1] == '\0' || s[2] == '\0') {
   1208 			(void)bozo_http_error(httpd, 400, request,
   1209 			    "percent hack missing two chars afterwards");
   1210 			goto copy_rest;
   1211 		}
   1212 		if (s[1] == '0' && s[2] == '0') {
   1213 			(void)bozo_http_error(httpd, 404, request,
   1214 					"percent hack was %00");
   1215 			goto copy_rest;
   1216 		}
   1217 		if (s[1] == '2' && s[2] == 'f') {
   1218 			(void)bozo_http_error(httpd, 404, request,
   1219 					"percent hack was %2f (/)");
   1220 			goto copy_rest;
   1221 		}
   1222 
   1223 		buf[0] = *++s;
   1224 		buf[1] = *++s;
   1225 		buf[2] = '\0';
   1226 		s++;
   1227 		*t = (char)strtol(buf, NULL, 16);
   1228 		debug((httpd, DEBUG_EXPLODING,
   1229 				"fu_%%: strtol put '%02x' into *t", *t));
   1230 		if (*t++ == '\0') {
   1231 			(void)bozo_http_error(httpd, 400, request,
   1232 					"percent hack got a 0 back");
   1233 			goto copy_rest;
   1234 		}
   1235 
   1236 		while (*s && *s != '%') {
   1237 			if (end && s >= end)
   1238 				break;
   1239 			*t++ = *s++;
   1240 		}
   1241 	} while (*s);
   1242 copy_rest:
   1243 	while (*s) {
   1244 		if (s >= end)
   1245 			break;
   1246 		*t++ = *s++;
   1247 	}
   1248 	*t = '\0';
   1249 	debug((httpd, DEBUG_FAT, "fix_url_percent returns %s in url",
   1250 			request->hr_file));
   1251 }
   1252 
   1253 /*
   1254  * transform_request does this:
   1255  *	- ``expand'' %20 crapola
   1256  *	- punt if it doesn't start with /
   1257  *	- check httpd->untrustedref / referrer
   1258  *	- look for "http://myname/" and deal with it.
   1259  *	- maybe call bozo_process_cgi()
   1260  *	- check for ~user and call bozo_user_transform() if so
   1261  *	- if the length > 1, check for trailing slash.  if so,
   1262  *	  add the index.html file
   1263  *	- if the length is 1, return the index.html file
   1264  *	- disallow anything ending up with a file starting
   1265  *	  at "/" or having ".." in it.
   1266  *	- anything else is a really weird internal error
   1267  *	- returns malloced file to serve, if unhandled
   1268  */
   1269 static int
   1270 transform_request(bozo_httpreq_t *request, int *isindex)
   1271 {
   1272 	bozohttpd_t *httpd = request->hr_httpd;
   1273 	char	*file, *newfile = NULL;
   1274 	size_t	len;
   1275 	const char *hostname = BOZOHOST(httpd, request);
   1276 
   1277 	file = NULL;
   1278 	*isindex = 0;
   1279 	debug((httpd, DEBUG_FAT, "tf_req: file %s", request->hr_file));
   1280 	fix_url_percent(request);
   1281 	if (check_virtual(request)) {
   1282 		goto bad_done;
   1283 	}
   1284 	file = request->hr_file;
   1285 
   1286 	if (file[0] != '/') {
   1287 		(void)bozo_http_error(httpd, 404, request, "unknown URL");
   1288 		goto bad_done;
   1289 	}
   1290 
   1291 	check_bzredirect(request);
   1292 
   1293 	if (httpd->untrustedref) {
   1294 		int to_indexhtml = 0;
   1295 
   1296 #define TOP_PAGE(x)	(strcmp((x), "/") == 0 || \
   1297 			 strcmp((x) + 1, httpd->index_html) == 0 || \
   1298 			 strcmp((x) + 1, "favicon.ico") == 0)
   1299 
   1300 		debug((httpd, DEBUG_EXPLODING, "checking httpd->untrustedref"));
   1301 		/*
   1302 		 * first check that this path isn't allowed via .bzdirect file,
   1303 		 * and then check referrer; make sure that people come via the
   1304 		 * real name... otherwise if we aren't looking at / or
   1305 		 * /index.html, redirect...  we also special case favicon.ico.
   1306 		 */
   1307 		if (check_direct_access(request))
   1308 			/* nothing */;
   1309 		else if (request->hr_referrer) {
   1310 			const char *r = request->hr_referrer;
   1311 
   1312 			debug((httpd, DEBUG_FAT,
   1313 				"checking referrer \"%s\" vs virthostname %s",
   1314 				r, hostname));
   1315 			if (strncmp(r, "http://", 7) != 0 ||
   1316 			    (strncasecmp(r + 7, hostname,
   1317 			    		 strlen(hostname)) != 0 &&
   1318 			     !TOP_PAGE(file)))
   1319 				to_indexhtml = 1;
   1320 		} else {
   1321 			const char *h = request->hr_host;
   1322 
   1323 			debug((httpd, DEBUG_FAT, "url has no referrer at all"));
   1324 			/* if there's no referrer, let / or /index.html past */
   1325 			if (!TOP_PAGE(file) ||
   1326 			    (h && strncasecmp(h, hostname,
   1327 			    		strlen(hostname)) != 0))
   1328 				to_indexhtml = 1;
   1329 		}
   1330 
   1331 		if (to_indexhtml) {
   1332 			char *slashindexhtml;
   1333 
   1334 			if (asprintf(&slashindexhtml, "/%s",
   1335 					httpd->index_html) < 0)
   1336 				bozo_err(httpd, 1, "asprintf");
   1337 			debug((httpd, DEBUG_FAT,
   1338 				"httpd->untrustedref: redirecting %s to %s",
   1339 				file, slashindexhtml));
   1340 			handle_redirect(request, slashindexhtml, 0);
   1341 			free(slashindexhtml);
   1342 			return 0;
   1343 		}
   1344 	}
   1345 
   1346 	len = strlen(file);
   1347 	if (/*CONSTCOND*/0) {
   1348 #ifndef NO_USER_SUPPORT
   1349 	} else if (len > 1 && httpd->enable_users && file[1] == '~') {
   1350 		if (file[2] == '\0') {
   1351 			(void)bozo_http_error(httpd, 404, request,
   1352 						"missing username");
   1353 			goto bad_done;
   1354 		}
   1355 		if (strchr(file + 2, '/') == NULL) {
   1356 			handle_redirect(request, NULL, 0);
   1357 			return 0;
   1358 		}
   1359 		debug((httpd, DEBUG_FAT, "calling bozo_user_transform"));
   1360 
   1361 		return bozo_user_transform(request, isindex);
   1362 #endif /* NO_USER_SUPPORT */
   1363 	} else if (len > 1) {
   1364 		debug((httpd, DEBUG_FAT, "file[len-1] == %c", file[len-1]));
   1365 		if (file[len-1] == '/') {	/* append index.html */
   1366 			*isindex = 1;
   1367 			debug((httpd, DEBUG_FAT, "appending index.html"));
   1368 			newfile = bozomalloc(httpd,
   1369 					len + strlen(httpd->index_html) + 1);
   1370 			strcpy(newfile, file + 1);
   1371 			strcat(newfile, httpd->index_html);
   1372 		} else
   1373 			newfile = bozostrdup(request->hr_httpd, file + 1);
   1374 	} else if (len == 1) {
   1375 		debug((httpd, DEBUG_EXPLODING, "tf_req: len == 1"));
   1376 		newfile = bozostrdup(request->hr_httpd, httpd->index_html);
   1377 		*isindex = 1;
   1378 	} else {	/* len == 0 ? */
   1379 		(void)bozo_http_error(httpd, 500, request,
   1380 					"request->hr_file is nul?");
   1381 		goto bad_done;
   1382 	}
   1383 
   1384 	if (newfile == NULL) {
   1385 		(void)bozo_http_error(httpd, 500, request, "internal failure");
   1386 		goto bad_done;
   1387 	}
   1388 
   1389 	/*
   1390 	 * look for "http://myname/" and deal with it as necessary.
   1391 	 */
   1392 
   1393 	/*
   1394 	 * stop traversing outside our domain
   1395 	 *
   1396 	 * XXX true security only comes from our parent using chroot(2)
   1397 	 * before execve(2)'ing us.  or our own built in chroot(2) support.
   1398 	 */
   1399 	if (*newfile == '/' || strcmp(newfile, "..") == 0 ||
   1400 	    strstr(newfile, "/..") || strstr(newfile, "../")) {
   1401 		(void)bozo_http_error(httpd, 403, request, "illegal request");
   1402 		goto bad_done;
   1403 	}
   1404 
   1405 	if (bozo_auth_check(request, newfile))
   1406 		goto bad_done;
   1407 
   1408 	if (strlen(newfile)) {
   1409 		request->hr_oldfile = request->hr_file;
   1410 		request->hr_file = newfile;
   1411 	}
   1412 
   1413 	if (bozo_process_cgi(request))
   1414 		return 0;
   1415 
   1416 	debug((httpd, DEBUG_FAT, "transform_request set: %s", newfile));
   1417 	return 1;
   1418 bad_done:
   1419 	debug((httpd, DEBUG_FAT, "transform_request returning: 0"));
   1420 	if (newfile)
   1421 		free(newfile);
   1422 	return 0;
   1423 }
   1424 
   1425 /*
   1426  * can_gzip checks if the request supports and prefers gzip encoding.
   1427  *
   1428  * XXX: we do not consider the associated q with gzip in making our
   1429  *      decision which is broken.
   1430  */
   1431 
   1432 static int
   1433 can_gzip(bozo_httpreq_t *request)
   1434 {
   1435 	const char	*pos;
   1436 	const char	*tmp;
   1437 	size_t		 len;
   1438 
   1439 	/* First we decide if the request can be gzipped at all. */
   1440 
   1441 	/* not if we already are encoded... */
   1442 	tmp = bozo_content_encoding(request, request->hr_file);
   1443 	if (tmp && *tmp)
   1444 		return 0;
   1445 
   1446 	/* not if we are not asking for the whole file... */
   1447 	if (request->hr_last_byte_pos != -1 || request->hr_have_range)
   1448 		return 0;
   1449 
   1450 	/* Then we determine if gzip is on the cards. */
   1451 
   1452 	for (pos = request->hr_accept_encoding; pos && *pos; pos += len) {
   1453 		while (*pos == ' ')
   1454 			pos++;
   1455 
   1456 		len = strcspn(pos, ";,");
   1457 
   1458 		if ((len == 4 && strncasecmp("gzip", pos, 4) == 0) ||
   1459 		    (len == 6 && strncasecmp("x-gzip", pos, 6) == 0))
   1460 			return 1;
   1461 
   1462 		if (pos[len] == ';')
   1463 			len += strcspn(&pos[len], ",");
   1464 
   1465 		if (pos[len])
   1466 			len++;
   1467 	}
   1468 
   1469 	return 0;
   1470 }
   1471 
   1472 /*
   1473  * bozo_process_request does the following:
   1474  *	- check the request is valid
   1475  *	- process cgi-bin if necessary
   1476  *	- transform a filename if necesarry
   1477  *	- return the HTTP request
   1478  */
   1479 void
   1480 bozo_process_request(bozo_httpreq_t *request)
   1481 {
   1482 	bozohttpd_t *httpd = request->hr_httpd;
   1483 	struct	stat sb;
   1484 	time_t timestamp;
   1485 	char	*file;
   1486 	const char *type, *encoding;
   1487 	int	fd, isindex;
   1488 
   1489 	/*
   1490 	 * note that transform_request chdir()'s if required.  also note
   1491 	 * that cgi is handed here.  if transform_request() returns 0
   1492 	 * then the request has been handled already.
   1493 	 */
   1494 	if (transform_request(request, &isindex) == 0)
   1495 		return;
   1496 
   1497 	fd = -1;
   1498 	encoding = NULL;
   1499 	if (can_gzip(request)) {
   1500 		asprintf(&file, "%s.gz", request->hr_file);
   1501 		fd = open(file, O_RDONLY);
   1502 		if (fd >= 0)
   1503 			encoding = "gzip";
   1504 		free(file);
   1505 	}
   1506 
   1507 	file = request->hr_file;
   1508 
   1509 	if (fd < 0)
   1510 		fd = open(file, O_RDONLY);
   1511 
   1512 	if (fd < 0) {
   1513 		debug((httpd, DEBUG_FAT, "open failed: %s", strerror(errno)));
   1514 		if (errno == EPERM)
   1515 			(void)bozo_http_error(httpd, 403, request,
   1516 						"no permission to open file");
   1517 		else if (errno == ENOENT) {
   1518 			if (!bozo_dir_index(request, file, isindex))
   1519 				(void)bozo_http_error(httpd, 404, request,
   1520 							"no file");
   1521 		} else
   1522 			(void)bozo_http_error(httpd, 500, request, "open file");
   1523 		goto cleanup_nofd;
   1524 	}
   1525 	if (fstat(fd, &sb) < 0) {
   1526 		(void)bozo_http_error(httpd, 500, request, "can't fstat");
   1527 		goto cleanup;
   1528 	}
   1529 	if (S_ISDIR(sb.st_mode)) {
   1530 		handle_redirect(request, NULL, 0);
   1531 		goto cleanup;
   1532 	}
   1533 
   1534 	if (request->hr_if_modified_since &&
   1535 	    parse_http_date(request->hr_if_modified_since, &timestamp) &&
   1536 	    timestamp >= sb.st_mtime) {
   1537 		/* XXX ignore subsecond of timestamp */
   1538 		bozo_printf(httpd, "%s 304 Not Modified\r\n",
   1539 				request->hr_proto);
   1540 		bozo_printf(httpd, "\r\n");
   1541 		bozo_flush(httpd, stdout);
   1542 		goto cleanup;
   1543 	}
   1544 
   1545 	/* validate requested range */
   1546 	if (request->hr_last_byte_pos == -1 ||
   1547 	    request->hr_last_byte_pos >= sb.st_size)
   1548 		request->hr_last_byte_pos = sb.st_size - 1;
   1549 	if (request->hr_have_range &&
   1550 	    request->hr_first_byte_pos > request->hr_last_byte_pos) {
   1551 		request->hr_have_range = 0;	/* punt */
   1552 		request->hr_first_byte_pos = 0;
   1553 		request->hr_last_byte_pos = sb.st_size - 1;
   1554 	}
   1555 	debug((httpd, DEBUG_FAT, "have_range %d first_pos %lld last_pos %lld",
   1556 	    request->hr_have_range,
   1557 	    (long long)request->hr_first_byte_pos,
   1558 	    (long long)request->hr_last_byte_pos));
   1559 	if (request->hr_have_range)
   1560 		bozo_printf(httpd, "%s 206 Partial Content\r\n",
   1561 				request->hr_proto);
   1562 	else
   1563 		bozo_printf(httpd, "%s 200 OK\r\n", request->hr_proto);
   1564 
   1565 	if (request->hr_proto != httpd->consts.http_09) {
   1566 		type = bozo_content_type(request, file);
   1567 		if (!encoding)
   1568 			encoding = bozo_content_encoding(request, file);
   1569 
   1570 		bozo_print_header(request, &sb, type, encoding);
   1571 		bozo_printf(httpd, "\r\n");
   1572 	}
   1573 	bozo_flush(httpd, stdout);
   1574 
   1575 	if (request->hr_method != HTTP_HEAD) {
   1576 		off_t szleft, cur_byte_pos;
   1577 
   1578 		szleft =
   1579 		     request->hr_last_byte_pos - request->hr_first_byte_pos + 1;
   1580 		cur_byte_pos = request->hr_first_byte_pos;
   1581 
   1582  retry:
   1583 		while (szleft) {
   1584 			size_t sz;
   1585 
   1586 			/* This should take care of the first unaligned chunk */
   1587 			if ((cur_byte_pos & (httpd->page_size - 1)) != 0)
   1588 				sz = (size_t)(cur_byte_pos & ~httpd->page_size);
   1589 			if ((off_t)httpd->mmapsz < szleft)
   1590 				sz = httpd->mmapsz;
   1591 			else
   1592 				sz = (size_t)szleft;
   1593 			if (mmap_and_write_part(httpd, fd, cur_byte_pos, sz)) {
   1594 				if (errno == ENOMEM) {
   1595 					httpd->mmapsz /= 2;
   1596 					if (httpd->mmapsz >= httpd->page_size)
   1597 						goto retry;
   1598 				}
   1599 				goto cleanup;
   1600 			}
   1601 			cur_byte_pos += sz;
   1602 			szleft -= sz;
   1603 		}
   1604 	}
   1605  cleanup:
   1606 	close(fd);
   1607  cleanup_nofd:
   1608 	close(STDIN_FILENO);
   1609 	close(STDOUT_FILENO);
   1610 	/*close(STDERR_FILENO);*/
   1611 }
   1612 
   1613 /* make sure we're not trying to access special files */
   1614 int
   1615 bozo_check_special_files(bozo_httpreq_t *request, const char *name)
   1616 {
   1617 	bozohttpd_t *httpd = request->hr_httpd;
   1618 
   1619 	/* ensure basename(name) != special files */
   1620 	if (strcmp(name, DIRECT_ACCESS_FILE) == 0)
   1621 		return bozo_http_error(httpd, 403, request,
   1622 		    "no permission to open direct access file");
   1623 	if (strcmp(name, REDIRECT_FILE) == 0)
   1624 		return bozo_http_error(httpd, 403, request,
   1625 		    "no permission to open redirect file");
   1626 	if (strcmp(name, ABSREDIRECT_FILE) == 0)
   1627 		return bozo_http_error(httpd, 403, request,
   1628 		    "no permission to open redirect file");
   1629 	return bozo_auth_check_special_files(request, name);
   1630 }
   1631 
   1632 /* generic header printing routine */
   1633 void
   1634 bozo_print_header(bozo_httpreq_t *request,
   1635 		struct stat *sbp, const char *type, const char *encoding)
   1636 {
   1637 	bozohttpd_t *httpd = request->hr_httpd;
   1638 	off_t len;
   1639 	char	date[40];
   1640 
   1641 	bozo_printf(httpd, "Date: %s\r\n", bozo_http_date(date, sizeof(date)));
   1642 	bozo_printf(httpd, "Server: %s\r\n", httpd->server_software);
   1643 	bozo_printf(httpd, "Accept-Ranges: bytes\r\n");
   1644 	if (sbp) {
   1645 		char filedate[40];
   1646 		struct	tm *tm;
   1647 
   1648 		tm = gmtime(&sbp->st_mtime);
   1649 		strftime(filedate, sizeof filedate,
   1650 		    "%a, %d %b %Y %H:%M:%S GMT", tm);
   1651 		bozo_printf(httpd, "Last-Modified: %s\r\n", filedate);
   1652 	}
   1653 	if (type && *type)
   1654 		bozo_printf(httpd, "Content-Type: %s\r\n", type);
   1655 	if (encoding && *encoding)
   1656 		bozo_printf(httpd, "Content-Encoding: %s\r\n", encoding);
   1657 	if (sbp) {
   1658 		if (request->hr_have_range) {
   1659 			len = request->hr_last_byte_pos -
   1660 					request->hr_first_byte_pos +1;
   1661 			bozo_printf(httpd,
   1662 				"Content-Range: bytes %qd-%qd/%qd\r\n",
   1663 				(long long) request->hr_first_byte_pos,
   1664 				(long long) request->hr_last_byte_pos,
   1665 				(long long) sbp->st_size);
   1666 		} else
   1667 			len = sbp->st_size;
   1668 		bozo_printf(httpd, "Content-Length: %qd\r\n", (long long)len);
   1669 	}
   1670 	if (request && request->hr_proto == httpd->consts.http_11)
   1671 		bozo_printf(httpd, "Connection: close\r\n");
   1672 	bozo_flush(httpd, stdout);
   1673 }
   1674 
   1675 #ifndef NO_DEBUG
   1676 void
   1677 debug__(bozohttpd_t *httpd, int level, const char *fmt, ...)
   1678 {
   1679 	va_list	ap;
   1680 	int savederrno;
   1681 
   1682 	/* only log if the level is low enough */
   1683 	if (httpd->debug < level)
   1684 		return;
   1685 
   1686 	savederrno = errno;
   1687 	va_start(ap, fmt);
   1688 	if (httpd->logstderr) {
   1689 		vfprintf(stderr, fmt, ap);
   1690 		fputs("\n", stderr);
   1691 	} else
   1692 		vsyslog(LOG_DEBUG, fmt, ap);
   1693 	va_end(ap);
   1694 	errno = savederrno;
   1695 }
   1696 #endif /* NO_DEBUG */
   1697 
   1698 /* these are like warn() and err(), except for syslog not stderr */
   1699 void
   1700 bozo_warn(bozohttpd_t *httpd, const char *fmt, ...)
   1701 {
   1702 	va_list ap;
   1703 
   1704 	va_start(ap, fmt);
   1705 	if (httpd->logstderr || isatty(STDERR_FILENO)) {
   1706 		//fputs("warning: ", stderr);
   1707 		vfprintf(stderr, fmt, ap);
   1708 		fputs("\n", stderr);
   1709 	} else
   1710 		vsyslog(LOG_INFO, fmt, ap);
   1711 	va_end(ap);
   1712 }
   1713 
   1714 void
   1715 bozo_err(bozohttpd_t *httpd, int code, const char *fmt, ...)
   1716 {
   1717 	va_list ap;
   1718 
   1719 	va_start(ap, fmt);
   1720 	if (httpd->logstderr || isatty(STDERR_FILENO)) {
   1721 		//fputs("error: ", stderr);
   1722 		vfprintf(stderr, fmt, ap);
   1723 		fputs("\n", stderr);
   1724 	} else
   1725 		vsyslog(LOG_ERR, fmt, ap);
   1726 	va_end(ap);
   1727 	exit(code);
   1728 }
   1729 
   1730 /* this escape HTML tags */
   1731 static void
   1732 escape_html(bozo_httpreq_t *request)
   1733 {
   1734 	int	i, j;
   1735 	char	*url = request->hr_file, *tmp;
   1736 
   1737 	for (i = 0, j = 0; url[i]; i++) {
   1738 		switch (url[i]) {
   1739 		case '<':
   1740 		case '>':
   1741 			j += 4;
   1742 			break;
   1743 		case '&':
   1744 			j += 5;
   1745 			break;
   1746 		}
   1747 	}
   1748 
   1749 	if (j == 0)
   1750 		return;
   1751 
   1752 	if ((tmp = (char *) malloc(strlen(url) + j)) == 0)
   1753 		/*
   1754 		 * ouch, but we are only called from an error context, and
   1755 		 * most paths here come from malloc(3) failures anyway...
   1756 		 * we could completely punt and just exit, but isn't returning
   1757 		 * an not-quite-correct error better than nothing at all?
   1758 		 */
   1759 		return;
   1760 
   1761 	for (i = 0, j = 0; url[i]; i++) {
   1762 		switch (url[i]) {
   1763 		case '<':
   1764 			memcpy(tmp + j, "&lt;", 4);
   1765 			j += 4;
   1766 			break;
   1767 		case '>':
   1768 			memcpy(tmp + j, "&gt;", 4);
   1769 			j += 4;
   1770 			break;
   1771 		case '&':
   1772 			memcpy(tmp + j, "&amp;", 5);
   1773 			j += 5;
   1774 			break;
   1775 		default:
   1776 			tmp[j++] = url[i];
   1777 		}
   1778 	}
   1779 	tmp[j] = 0;
   1780 
   1781 	free(request->hr_file);
   1782 	request->hr_file = tmp;
   1783 }
   1784 
/*
 * the HTTP error codes we know about, each with a short message (the
 * code and its name) and a long message (a sentence for the reader).
 * the entry with a code of 0 ends the table.
 */
static struct errors_map {
	int	code;			/* HTTP return code */
	const char *shortmsg;		/* short version of message */
	const char *longmsg;		/* long version of message */
} errors_map[] = {
	{ .code = 400, .shortmsg = "400 Bad Request",
	  .longmsg = "The request was not valid", },
	{ .code = 401, .shortmsg = "401 Unauthorized",
	  .longmsg = "No authorization", },
	{ .code = 403, .shortmsg = "403 Forbidden",
	  .longmsg = "Access to this item has been denied", },
	{ .code = 404, .shortmsg = "404 Not Found",
	  .longmsg = "This item has not been found", },
	{ .code = 408, .shortmsg = "408 Request Timeout",
	  .longmsg = "This request took too long", },
	{ .code = 417, .shortmsg = "417 Expectation Failed",
	  .longmsg = "Expectations not available", },
	{ .code = 500, .shortmsg = "500 Internal Error",
	  .longmsg = "An error occured on the server", },
	{ .code = 501, .shortmsg = "501 Not Implemented",
	  .longmsg = "This request is not available", },
	{ .code = 0, .shortmsg = NULL, .longmsg = NULL, },
};

/* what the lookups below give back for a code that is not in the table */
static const char *help = "DANGER! WILL ROBINSON! DANGER!";
   1803 
   1804 static const char *
   1805 http_errors_short(int code)
   1806 {
   1807 	struct errors_map *ep;
   1808 
   1809 	for (ep = errors_map; ep->code; ep++)
   1810 		if (ep->code == code)
   1811 			return (ep->shortmsg);
   1812 	return (help);
   1813 }
   1814 
   1815 static const char *
   1816 http_errors_long(int code)
   1817 {
   1818 	struct errors_map *ep;
   1819 
   1820 	for (ep = errors_map; ep->code; ep++)
   1821 		if (ep->code == code)
   1822 			return (ep->longmsg);
   1823 	return (help);
   1824 }
   1825 
   1826 /* the follow functions and variables are used in handling HTTP errors */
   1827 /* ARGSUSED */
   1828 int
   1829 bozo_http_error(bozohttpd_t *httpd, int code, bozo_httpreq_t *request,
   1830 		const char *msg)
   1831 {
   1832 	char portbuf[20];
   1833 	const char *header = http_errors_short(code);
   1834 	const char *reason = http_errors_long(code);
   1835 	const char *proto = (request && request->hr_proto) ?
   1836 				request->hr_proto : httpd->consts.http_11;
   1837 	const char *hostname = BOZOHOST(httpd, request);
   1838 	int	size;
   1839 
   1840 	debug((httpd, DEBUG_FAT, "bozo_http_error %d: %s", code, msg));
   1841 	if (header == NULL || reason == NULL) {
   1842 		bozo_err(httpd, 1,
   1843 			"bozo_http_error() failed (short = %p, long = %p)",
   1844 			header, reason);
   1845 		return code;
   1846 	}
   1847 
   1848 	if (request && request->hr_serverport &&
   1849 	    strcmp(request->hr_serverport, "80") != 0)
   1850 		snprintf(portbuf, sizeof(portbuf), ":%s",
   1851 				request->hr_serverport);
   1852 	else
   1853 		portbuf[0] = '\0';
   1854 
   1855 	if (request && request->hr_file) {
   1856 		escape_html(request);
   1857 		size = snprintf(httpd->errorbuf, BUFSIZ,
   1858 		    "<html><head><title>%s</title></head>\n"
   1859 		    "<body><h1>%s</h1>\n"
   1860 		    "%s: <pre>%s</pre>\n"
   1861  		    "<hr><address><a href=\"http://%s%s/\">%s%s</a></address>\n"
   1862 		    "</body></html>\n",
   1863 		    header, header, request->hr_file, reason,
   1864 		    hostname, portbuf, hostname, portbuf);
   1865 		if (size >= (int)BUFSIZ) {
   1866 			bozo_warn(httpd,
   1867 				"bozo_http_error buffer too small, truncated");
   1868 			size = (int)BUFSIZ;
   1869 		}
   1870 	} else
   1871 		size = 0;
   1872 
   1873 	bozo_printf(httpd, "%s %s\r\n", proto, header);
   1874 	if (request)
   1875 		bozo_auth_check_401(request, code);
   1876 
   1877 	bozo_printf(httpd, "Content-Type: text/html\r\n");
   1878 	bozo_printf(httpd, "Content-Length: %d\r\n", size);
   1879 	bozo_printf(httpd, "Server: %s\r\n", httpd->server_software);
   1880 	if (request && request->hr_allow)
   1881 		bozo_printf(httpd, "Allow: %s\r\n", request->hr_allow);
   1882 	bozo_printf(httpd, "\r\n");
   1883 	if (size)
   1884 		bozo_printf(httpd, "%s", httpd->errorbuf);
   1885 	bozo_flush(httpd, stdout);
   1886 
   1887 	return code;
   1888 }
   1889 
   1890 /* Below are various modified libc functions */
   1891 
/*
 * length-limited flavour of strsep(3).  scans *strp for the first
 * character that is in `delim' (the terminating nul always counts as
 * a delimiter), overwrites it with a nul, advances *strp past it (or
 * sets *strp to NULL when the end of the string was reached) and
 * returns the start of the token.
 *
 * when `lenp' is not NULL, *lenp is decremented once per character
 * examined; if it reaches -1 before a delimiter has been found, NULL is
 * returned and *strp is left as it was.  the caller must therefore pass
 * in the correct remaining length.  returns NULL if *strp is NULL.
 */
char *
bozostrnsep(char **strp, const char *delim, ssize_t *lenp)
{
	char		*start, *cur;
	const char	*d;
	int		 ch;

	start = *strp;
	if (start == NULL)
		return NULL;

	cur = start;
	for (;;) {
		/* account for the character we are about to look at */
		if (lenp != NULL) {
			*lenp -= 1;
			if (*lenp == -1)
				return NULL;
		}
		ch = *cur++;

		/* walk the delimiter set, its terminating nul included */
		for (d = delim; ; d++) {
			if (*d == ch) {
				if (ch == '\0')
					cur = NULL;
				else
					cur[-1] = '\0';
				*strp = cur;
				return start;
			}
			if (*d == '\0')
				break;
		}
	}
	/* NOTREACHED */
}
   1925 
   1926 /*
   1927  * inspired by fgetln(3), but works for fd's.  should work identically
   1928  * except it, however, does *not* return the newline, and it does nul
   1929  * terminate the string.
   1930  */
   1931 char *
   1932 bozodgetln(bozohttpd_t *httpd, int fd, ssize_t *lenp,
   1933 	ssize_t (*readfn)(bozohttpd_t *, int, void *, size_t))
   1934 {
   1935 	ssize_t	len;
   1936 	int	got_cr = 0;
   1937 	char	c, *nbuffer;
   1938 
   1939 	/* initialise */
   1940 	if (httpd->getln_buflen == 0) {
   1941 		/* should be plenty for most requests */
   1942 		httpd->getln_buflen = 128;
   1943 		httpd->getln_buffer = malloc((size_t)httpd->getln_buflen);
   1944 		if (httpd->getln_buffer == NULL) {
   1945 			httpd->getln_buflen = 0;
   1946 			return NULL;
   1947 		}
   1948 	}
   1949 	len = 0;
   1950 
   1951 	/*
   1952 	 * we *have* to read one byte at a time, to not break cgi
   1953 	 * programs (for we pass stdin off to them).  could fix this
   1954 	 * by becoming a fd-passing program instead of just exec'ing
   1955 	 * the program
   1956 	 *
   1957 	 * the above is no longer true, we are the fd-passing
   1958 	 * program already.
   1959 	 */
   1960 	for (; readfn(httpd, fd, &c, 1) == 1; ) {
   1961 		debug((httpd, DEBUG_EXPLODING, "bozodgetln read %c", c));
   1962 
   1963 		if (len >= httpd->getln_buflen - 1) {
   1964 			httpd->getln_buflen *= 2;
   1965 			debug((httpd, DEBUG_EXPLODING, "bozodgetln: "
   1966 				"reallocating buffer to buflen %zu",
   1967 				httpd->getln_buflen));
   1968 			nbuffer = bozorealloc(httpd, httpd->getln_buffer,
   1969 				(size_t)httpd->getln_buflen);
   1970 			httpd->getln_buffer = nbuffer;
   1971 		}
   1972 
   1973 		httpd->getln_buffer[len++] = c;
   1974 		if (c == '\r') {
   1975 			got_cr = 1;
   1976 			continue;
   1977 		} else if (c == '\n') {
   1978 			/*
   1979 			 * HTTP/1.1 spec says to ignore CR and treat
   1980 			 * LF as the real line terminator.  even though
   1981 			 * the same spec defines CRLF as the line
   1982 			 * terminator, it is recommended in section 19.3
   1983 			 * to do the LF trick for tolerance.
   1984 			 */
   1985 			if (got_cr)
   1986 				len -= 2;
   1987 			else
   1988 				len -= 1;
   1989 			break;
   1990 		}
   1991 
   1992 	}
   1993 	httpd->getln_buffer[len] = '\0';
   1994 	debug((httpd, DEBUG_OBESE, "bozodgetln returns: ``%s'' with len %zd",
   1995 	       httpd->getln_buffer, len));
   1996 	*lenp = len;
   1997 	return httpd->getln_buffer;
   1998 }
   1999 
   2000 void *
   2001 bozorealloc(bozohttpd_t *httpd, void *ptr, size_t size)
   2002 {
   2003 	void	*p;
   2004 
   2005 	p = realloc(ptr, size);
   2006 	if (p == NULL) {
   2007 		(void)bozo_http_error(httpd, 500, NULL,
   2008 				"memory allocation failure");
   2009 		exit(1);
   2010 	}
   2011 	return (p);
   2012 }
   2013 
   2014 void *
   2015 bozomalloc(bozohttpd_t *httpd, size_t size)
   2016 {
   2017 	void	*p;
   2018 
   2019 	p = malloc(size);
   2020 	if (p == NULL) {
   2021 		(void)bozo_http_error(httpd, 500, NULL,
   2022 				"memory allocation failure");
   2023 		exit(1);
   2024 	}
   2025 	return (p);
   2026 }
   2027 
   2028 char *
   2029 bozostrdup(bozohttpd_t *httpd, const char *str)
   2030 {
   2031 	char	*p;
   2032 
   2033 	p = strdup(str);
   2034 	if (p == NULL) {
   2035 		(void)bozo_http_error(httpd, 500, NULL,
   2036 					"memory allocation failure");
   2037 		exit(1);
   2038 	}
   2039 	return (p);
   2040 }
   2041 
   2042 /* set default values in bozohttpd_t struct */
   2043 int
   2044 bozo_init_httpd(bozohttpd_t *httpd)
   2045 {
   2046 	/* make sure everything is clean */
   2047 	(void) memset(httpd, 0x0, sizeof(*httpd));
   2048 
   2049 	/* constants */
   2050 	httpd->consts.http_09 = "HTTP/0.9";
   2051 	httpd->consts.http_10 = "HTTP/1.0";
   2052 	httpd->consts.http_11 = "HTTP/1.1";
   2053 	httpd->consts.text_plain = "text/plain";
   2054 
   2055 	/* mmap region size */
   2056 	httpd->mmapsz = BOZO_MMAPSZ;
   2057 
   2058 	/* error buffer for bozo_http_error() */
   2059 	if ((httpd->errorbuf = malloc(BUFSIZ)) == NULL) {
   2060 		(void) fprintf(stderr,
   2061 			"bozohttpd: memory_allocation failure\n");
   2062 		return 0;
   2063 	}
   2064 	return 1;
   2065 }
   2066 
   2067 /* set default values in bozoprefs_t struct */
   2068 int
   2069 bozo_init_prefs(bozoprefs_t *prefs)
   2070 {
   2071 	/* make sure everything is clean */
   2072 	(void) memset(prefs, 0x0, sizeof(*prefs));
   2073 
   2074 	/* set up default values */
   2075 	bozo_set_pref(prefs, "server software", SERVER_SOFTWARE);
   2076 	bozo_set_pref(prefs, "index.html", INDEX_HTML);
   2077 	bozo_set_pref(prefs, "public_html", PUBLIC_HTML);
   2078 
   2079 	return 1;
   2080 }
   2081 
   2082 /* set default values */
   2083 int
   2084 bozo_set_defaults(bozohttpd_t *httpd, bozoprefs_t *prefs)
   2085 {
   2086 	return bozo_init_httpd(httpd) && bozo_init_prefs(prefs);
   2087 }
   2088 
   2089 /* set the virtual host name, port and root */
   2090 int
   2091 bozo_setup(bozohttpd_t *httpd, bozoprefs_t *prefs, const char *vhost,
   2092 		const char *root)
   2093 {
   2094 	struct passwd	 *pw;
   2095 	extern char	**environ;
   2096 	static char	 *cleanenv[1] = { NULL };
   2097 	uid_t		  uid;
   2098 	char		 *chrootdir;
   2099 	char		 *username;
   2100 	char		 *portnum;
   2101 	char		 *cp;
   2102 	int		  dirtyenv;
   2103 
   2104 	dirtyenv = 0;
   2105 
   2106 	if (vhost == NULL) {
   2107 		httpd->virthostname = bozomalloc(httpd, MAXHOSTNAMELEN+1);
   2108 		/* XXX we do not check for FQDN here */
   2109 		if (gethostname(httpd->virthostname, MAXHOSTNAMELEN+1) < 0)
   2110 			bozo_err(httpd, 1, "gethostname");
   2111 		httpd->virthostname[MAXHOSTNAMELEN] = '\0';
   2112 	} else {
   2113 		httpd->virthostname = strdup(vhost);
   2114 	}
   2115 	httpd->slashdir = strdup(root);
   2116 	if ((portnum = bozo_get_pref(prefs, "port number")) != NULL) {
   2117 		httpd->bindport = strdup(portnum);
   2118 	}
   2119 
   2120 	/* go over preferences now */
   2121 	if ((cp = bozo_get_pref(prefs, "numeric")) != NULL &&
   2122 	    strcmp(cp, "true") == 0) {
   2123 		httpd->numeric = 1;
   2124 	}
   2125 	if ((cp = bozo_get_pref(prefs, "trusted referal")) != NULL &&
   2126 	    strcmp(cp, "true") == 0) {
   2127 		httpd->untrustedref = 1;
   2128 	}
   2129 	if ((cp = bozo_get_pref(prefs, "log to stderr")) != NULL &&
   2130 	    strcmp(cp, "true") == 0) {
   2131 		httpd->logstderr = 1;
   2132 	}
   2133 	if ((cp = bozo_get_pref(prefs, "bind address")) != NULL) {
   2134 		httpd->bindaddress = strdup(cp);
   2135 	}
   2136 	if ((cp = bozo_get_pref(prefs, "background")) != NULL) {
   2137 		httpd->background = atoi(cp);
   2138 	}
   2139 	if ((cp = bozo_get_pref(prefs, "foreground")) != NULL &&
   2140 	    strcmp(cp, "true") == 0) {
   2141 		httpd->foreground = 1;
   2142 	}
   2143 	if ((cp = bozo_get_pref(prefs, "pid file")) != NULL) {
   2144 		httpd->pidfile = strdup(cp);
   2145 	}
   2146 	if ((cp = bozo_get_pref(prefs, "unknown slash")) != NULL &&
   2147 	    strcmp(cp, "true") == 0) {
   2148 		httpd->unknown_slash = 1;
   2149 	}
   2150 	if ((cp = bozo_get_pref(prefs, "virtual base")) != NULL) {
   2151 		httpd->virtbase = strdup(cp);
   2152 	}
   2153 	if ((cp = bozo_get_pref(prefs, "enable users")) != NULL &&
   2154 	    strcmp(cp, "true") == 0) {
   2155 		httpd->enable_users = 1;
   2156 	}
   2157 	if ((cp = bozo_get_pref(prefs, "dirty environment")) != NULL &&
   2158 	    strcmp(cp, "true") == 0) {
   2159 		dirtyenv = 1;
   2160 	}
   2161 	if ((cp = bozo_get_pref(prefs, "hide dots")) != NULL &&
   2162 	    strcmp(cp, "true") == 0) {
   2163 		httpd->hide_dots = 1;
   2164 	}
   2165 	if ((cp = bozo_get_pref(prefs, "directory indexing")) != NULL &&
   2166 	    strcmp(cp, "true") == 0) {
   2167 		httpd->dir_indexing = 1;
   2168 	}
   2169 	if ((cp = bozo_get_pref(prefs, "public_html")) != NULL) {
   2170 		httpd->public_html = strdup(cp);
   2171 	}
   2172 	httpd->server_software =
   2173 			strdup(bozo_get_pref(prefs, "server software"));
   2174 	httpd->index_html = strdup(bozo_get_pref(prefs, "index.html"));
   2175 
   2176 	/*
   2177 	 * initialise ssl and daemon mode if necessary.
   2178 	 */
   2179 	bozo_ssl_init(httpd);
   2180 	bozo_daemon_init(httpd);
   2181 
   2182 	if ((username = bozo_get_pref(prefs, "username")) == NULL) {
   2183 		if ((pw = getpwuid(uid = 0)) == NULL)
   2184 			bozo_err(httpd, 1, "getpwuid(0): %s", strerror(errno));
   2185 		httpd->username = strdup(pw->pw_name);
   2186 	} else {
   2187 		httpd->username = strdup(username);
   2188 		if ((pw = getpwnam(httpd->username)) == NULL)
   2189 			bozo_err(httpd, 1, "getpwnam(%s): %s", httpd->username,
   2190 					strerror(errno));
   2191 		if (initgroups(pw->pw_name, pw->pw_gid) == -1)
   2192 			bozo_err(httpd, 1, "initgroups: %s", strerror(errno));
   2193 		if (setgid(pw->pw_gid) == -1)
   2194 			bozo_err(httpd, 1, "setgid(%u): %s", pw->pw_gid,
   2195 					strerror(errno));
   2196 		uid = pw->pw_uid;
   2197 	}
   2198 	/*
   2199 	 * handle chroot.
   2200 	 */
   2201 	if ((chrootdir = bozo_get_pref(prefs, "chroot dir")) != NULL) {
   2202 		httpd->rootdir = strdup(chrootdir);
   2203 		if (chdir(httpd->rootdir) == -1)
   2204 			bozo_err(httpd, 1, "chdir(%s): %s", httpd->rootdir,
   2205 				strerror(errno));
   2206 		if (chroot(httpd->rootdir) == -1)
   2207 			bozo_err(httpd, 1, "chroot(%s): %s", httpd->rootdir,
   2208 				strerror(errno));
   2209 	}
   2210 
   2211 	if (username != NULL)
   2212 		if (setuid(uid) == -1)
   2213 			bozo_err(httpd, 1, "setuid(%d): %s", uid,
   2214 					strerror(errno));
   2215 
   2216 	/*
   2217 	 * prevent info leakage between different compartments.
   2218 	 * some PATH values in the environment would be invalided
   2219 	 * by chroot. cross-user settings might result in undesirable
   2220 	 * effects.
   2221 	 */
   2222 	if ((chrootdir != NULL || username != NULL) && !dirtyenv)
   2223 		environ = cleanenv;
   2224 
   2225 #ifdef _SC_PAGESIZE
   2226 	httpd->page_size = (long)sysconf(_SC_PAGESIZE);
   2227 #else
   2228 	httpd->page_size = 4096;
   2229 #endif
   2230 	debug((httpd, DEBUG_OBESE, "myname is %s, slashdir is %s",
   2231 			httpd->virthostname, httpd->slashdir));
   2232 
   2233 	return 1;
   2234 }
   2235