bozohttpd.c revision 1.42 1 /* $NetBSD: bozohttpd.c,v 1.42 2013/10/12 07:49:40 mbalmer Exp $ */
2
3 /* $eterna: bozohttpd.c,v 1.178 2011/11/18 09:21:15 mrg Exp $ */
4
5 /*
6 * Copyright (c) 1997-2013 Matthew R. Green
7 * All rights reserved.
8 *
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
11 * are met:
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer and
16 * dedication in the documentation and/or other materials provided
17 * with the distribution.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
20 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
21 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
22 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
23 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
24 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
25 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
26 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
27 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 * SUCH DAMAGE.
30 *
31 */
32
33 /* this program is dedicated to the Great God of Processed Cheese */
34
35 /*
36 * bozohttpd.c: minimal httpd; provides only these features:
37 * - HTTP/0.9 (by virtue of ..)
38 * - HTTP/1.0
39 * - HTTP/1.1
40 * - CGI/1.1 this will only be provided for "system" scripts
41 * - automatic "missing trailing slash" redirections
42 * - configurable translation of /~user/ to ~user/public_html,
43 * however, this does not include cgi-bin support
44 * - access lists via libwrap via inetd/tcpd
45 * - virtual hosting
46 * - note that we do not even pretend to understand MIME, but
47 * rely only on the HTTP specification
48 * - ipv6 support
49 * - automatic `index.html' generation
50 * - configurable server name
51 * - directory index generation
52 * - daemon mode (lacks libwrap support)
53 * - .htpasswd support
54 */
55
56 /*
57 * requirements for minimal http/1.1 (at least, as documented in
58 * <draft-ietf-http-v11-spec-rev-06> which expired may 18, 1999):
59 *
60 * - 14.15: content-encoding handling. [1]
61 *
62 * - 14.16: content-length handling. this is only a SHOULD header
63 * thus we could just not send it ever. [1]
64 *
65 * - 14.17: content-type handling. [1]
66 *
67 * - 14.25/28: if-{,un}modified-since handling. maybe do this, but
68 * i really don't want to have to parse 3 different date formats
69 *
70 * [1] need to revisit to ensure proper behaviour
71 *
72 * and the following is a list of features that we do not need
73 * to have due to other limits, or are too lazy. there are more
74 * of these than are listed, but these are of particular note,
75 * and could perhaps be implemented.
76 *
77 * - 3.5/3.6: content/transfer codings. probably can ignore
78 * this? we "SHOULD"n't. but 4.4 says we should ignore a
79 * `content-length' header upon receipt of a `transfer-encoding'
80 * header.
81 *
82 * - 5.1.1: request methods. only MUST support GET and HEAD,
83 * but there are new ones besides POST that are currently
84 * supported: OPTIONS PUT DELETE TRACE and CONNECT, plus
85 * extensions not yet known?
86 *
87 * - 10.1: we can ignore informational status codes
88 *
89 * - 10.3.3/10.3.4/10.3.8: just use '302' codes always.
90 *
91 * - 14.1/14.2/14.3/14.27: we do not support Accept: headers..
92 * just ignore them and send the request anyway. they are
93 * only SHOULD.
94 *
95 * - 14.5/14.16/14.35: we don't do ranges. from section 14.35.2
96 * `A server MAY ignore the Range header'. but it might be nice.
97 * since 20080301 we support simple range headers.
98 *
99 * - 14.9: we aren't a cache.
100 *
101 * - 14.15: content-md5 would be nice...
102 *
103 * - 14.24/14.26/14.27: be nice to support this...
104 *
105 * - 14.44: not sure about this Vary: header. ignore it for now.
106 */
107
/*
 * compile-time defaults.  each of these is only defined here when the
 * build has not already supplied its own value.
 */
#if !defined(INDEX_HTML)
#define INDEX_HTML		"index.html"
#endif

#if !defined(SERVER_SOFTWARE)
#define SERVER_SOFTWARE		"bozohttpd/20130711"
#endif

#if !defined(DIRECT_ACCESS_FILE)
#define DIRECT_ACCESS_FILE	".bzdirect"
#endif

#if !defined(REDIRECT_FILE)
#define REDIRECT_FILE		".bzredirect"
#endif

#if !defined(ABSREDIRECT_FILE)
#define ABSREDIRECT_FILE	".bzabsredirect"
#endif

#if !defined(PUBLIC_HTML)
#define PUBLIC_HTML		"public_html"
#endif
126
/*
 * reference an argument without doing anything with it, so that lint
 * and the compiler do not complain about it being unused.
 */
#if !defined(USE_ARG)
#define USE_ARG(x)	/*LINTED*/(void)&(x)
#endif
130
131 /*
132 * And so it begins ..
133 */
134
135 #include <sys/param.h>
136 #include <sys/socket.h>
137 #include <sys/time.h>
138 #include <sys/mman.h>
139
140 #include <arpa/inet.h>
141
142 #include <ctype.h>
143 #include <dirent.h>
144 #include <errno.h>
145 #include <fcntl.h>
146 #include <netdb.h>
147 #include <pwd.h>
148 #include <grp.h>
149 #include <signal.h>
150 #include <stdarg.h>
151 #include <stdlib.h>
152 #include <string.h>
153 #include <syslog.h>
154 #include <time.h>
155 #include <unistd.h>
156
157 #include "bozohttpd.h"
158
#if !defined(MAX_WAIT_TIME)
#define MAX_WAIT_TIME	60	/* hang around for 60 seconds max */
#endif

/* variables and functions */
#if !defined(LOG_FTP)
#define LOG_FTP		LOG_DAEMON
#endif

/* set to 1 by the SIGALRM handler, checked while reading a request */
volatile sig_atomic_t	alarmhit;
169
170 /*
171 * check there's enough space in the prefs and names arrays.
172 */
173 static int
174 size_arrays(bozoprefs_t *bozoprefs, unsigned needed)
175 {
176 char **temp;
177
178 if (bozoprefs->size == 0) {
179 /* only get here first time around */
180 bozoprefs->size = needed;
181 if ((bozoprefs->name = calloc(sizeof(char *), needed)) == NULL) {
182 (void) fprintf(stderr, "size_arrays: bad alloc\n");
183 return 0;
184 }
185 if ((bozoprefs->value = calloc(sizeof(char *), needed)) == NULL) {
186 free(bozoprefs->name);
187 (void) fprintf(stderr, "size_arrays: bad alloc\n");
188 return 0;
189 }
190 } else if (bozoprefs->c == bozoprefs->size) {
191 /* only uses 'needed' when filled array */
192 bozoprefs->size += needed;
193 temp = realloc(bozoprefs->name, sizeof(char *) * needed);
194 if (temp == NULL) {
195 (void) fprintf(stderr, "size_arrays: bad alloc\n");
196 return 0;
197 }
198 bozoprefs->name = temp;
199 temp = realloc(bozoprefs->value, sizeof(char *) * needed);
200 if (temp == NULL) {
201 (void) fprintf(stderr, "size_arrays: bad alloc\n");
202 return 0;
203 }
204 bozoprefs->value = temp;
205 }
206 return 1;
207 }
208
209 static int
210 findvar(bozoprefs_t *bozoprefs, const char *name)
211 {
212 unsigned i;
213
214 for (i = 0 ; i < bozoprefs->c && strcmp(bozoprefs->name[i], name) != 0; i++)
215 ;
216 return (i == bozoprefs->c) ? -1 : (int)i;
217 }
218
219 int
220 bozo_set_pref(bozoprefs_t *bozoprefs, const char *name, const char *value)
221 {
222 int i;
223
224 if ((i = findvar(bozoprefs, name)) < 0) {
225 /* add the element to the array */
226 if (size_arrays(bozoprefs, bozoprefs->size + 15)) {
227 bozoprefs->name[i = bozoprefs->c++] = strdup(name);
228 }
229 } else {
230 /* replace the element in the array */
231 if (bozoprefs->value[i]) {
232 free(bozoprefs->value[i]);
233 bozoprefs->value[i] = NULL;
234 }
235 }
236 /* sanity checks for range of values go here */
237 bozoprefs->value[i] = strdup(value);
238 return 1;
239 }
240
241 /*
242 * get a variable's value, or NULL
243 */
244 char *
245 bozo_get_pref(bozoprefs_t *bozoprefs, const char *name)
246 {
247 int i;
248
249 return ((i = findvar(bozoprefs, name)) < 0) ? NULL :
250 bozoprefs->value[i];
251 }
252
/*
 * format the current time as an HTTP date, eg
 *	Sun, 06 Nov 1994 08:49:37 GMT
 * into the caller's buffer `date' of `datelen' bytes, and return `date'.
 *
 * if the time can not be converted, or the buffer is too small for the
 * whole date, `date' is set to the empty string (when datelen > 0)
 * instead of being left with indeterminate contents.
 */
char *
bozo_http_date(char *date, size_t datelen)
{
	struct tm *tm;
	time_t now;

	now = time(NULL);
	tm = gmtime(&now);	/* HTTP/1.1 spec rev 06 sez GMT only */
	if (tm == NULL ||
	    strftime(date, datelen, "%a, %d %b %Y %H:%M:%S GMT", tm) == 0) {
		/* strftime() leaves the buffer undefined when it returns 0 */
		if (datelen > 0)
			date[0] = '\0';
	}
	return date;
}
265
266 /*
267 * convert "in" into the three parts of a request (first line).
268 * we allocate into file and query, but return pointers into
269 * "in" for proto and method.
270 */
271 static void
272 parse_request(bozohttpd_t *httpd, char *in, char **method, char **file,
273 char **query, char **proto)
274 {
275 ssize_t len;
276 char *val;
277
278 USE_ARG(httpd);
279 debug((httpd, DEBUG_EXPLODING, "parse in: %s", in));
280 *method = *file = *query = *proto = NULL;
281
282 len = (ssize_t)strlen(in);
283 val = bozostrnsep(&in, " \t\n\r", &len);
284 if (len < 1 || val == NULL)
285 return;
286 *method = val;
287
288 while (*in == ' ' || *in == '\t')
289 in++;
290 val = bozostrnsep(&in, " \t\n\r", &len);
291 if (len < 1) {
292 if (len == 0)
293 *file = val;
294 else
295 *file = in;
296 } else {
297 *file = val;
298
299 *query = strchr(*file, '?');
300 if (*query)
301 *(*query)++ = '\0';
302
303 if (in) {
304 while (*in && (*in == ' ' || *in == '\t'))
305 in++;
306 if (*in)
307 *proto = in;
308 }
309 }
310
311 /* allocate private copies */
312 *file = bozostrdup(httpd, *file);
313 if (*query)
314 *query = bozostrdup(httpd, *query);
315
316 debug((httpd, DEBUG_FAT,
317 "url: method: \"%s\" file: \"%s\" query: \"%s\" proto: \"%s\"",
318 *method, *file, *query, *proto));
319 }
320
321 /*
322 * cleanup a bozo_httpreq_t after use
323 */
324 void
325 bozo_clean_request(bozo_httpreq_t *request)
326 {
327 struct bozoheaders *hdr, *ohdr = NULL;
328
329 if (request == NULL)
330 return;
331
332 /* If SSL enabled cleanup SSL structure. */
333 bozo_ssl_destroy(request->hr_httpd);
334
335 /* clean up request */
336 #define MF(x) if (request->x) free(request->x)
337 MF(hr_remotehost);
338 MF(hr_remoteaddr);
339 MF(hr_serverport);
340 MF(hr_virthostname);
341 MF(hr_file);
342 MF(hr_oldfile);
343 MF(hr_query);
344 #undef MF
345 bozo_auth_cleanup(request);
346 for (hdr = SIMPLEQ_FIRST(&request->hr_headers); hdr;
347 hdr = SIMPLEQ_NEXT(hdr, h_next)) {
348 free(hdr->h_value);
349 free(hdr->h_header);
350 if (ohdr)
351 free(ohdr);
352 ohdr = hdr;
353 }
354 if (ohdr)
355 free(ohdr);
356
357 free(request);
358 }
359
360 /*
361 * send a HTTP/1.1 408 response if we timeout.
362 */
363 /* ARGSUSED */
364 static void
365 alarmer(int sig)
366 {
367 alarmhit = 1;
368 }
369
370 /*
371 * add or merge this header (val: str) into the requests list
372 */
373 static bozoheaders_t *
374 addmerge_header(bozo_httpreq_t *request, char *val,
375 char *str, ssize_t len)
376 {
377 struct bozoheaders *hdr;
378
379 USE_ARG(len);
380 /* do we exist already? */
381 SIMPLEQ_FOREACH(hdr, &request->hr_headers, h_next) {
382 if (strcasecmp(val, hdr->h_header) == 0)
383 break;
384 }
385
386 if (hdr) {
387 /* yup, merge it in */
388 char *nval;
389
390 if (asprintf(&nval, "%s, %s", hdr->h_value, str) == -1) {
391 (void)bozo_http_error(request->hr_httpd, 500, NULL,
392 "memory allocation failure");
393 return NULL;
394 }
395 free(hdr->h_value);
396 hdr->h_value = nval;
397 } else {
398 /* nope, create a new one */
399
400 hdr = bozomalloc(request->hr_httpd, sizeof *hdr);
401 hdr->h_header = bozostrdup(request->hr_httpd, val);
402 if (str && *str)
403 hdr->h_value = bozostrdup(request->hr_httpd, str);
404 else
405 hdr->h_value = bozostrdup(request->hr_httpd, " ");
406
407 SIMPLEQ_INSERT_TAIL(&request->hr_headers, hdr, h_next);
408 request->hr_nheaders++;
409 }
410
411 return hdr;
412 }
413
414 /*
415 * as the prototype string is not constant (eg, "HTTP/1.1" is equivalent
416 * to "HTTP/001.01"), we MUST parse this.
417 */
418 static int
419 process_proto(bozo_httpreq_t *request, const char *proto)
420 {
421 char majorstr[16], *minorstr;
422 int majorint, minorint;
423
424 if (proto == NULL) {
425 got_proto_09:
426 request->hr_proto = request->hr_httpd->consts.http_09;
427 debug((request->hr_httpd, DEBUG_FAT, "request %s is http/0.9",
428 request->hr_file));
429 return 0;
430 }
431
432 if (strncasecmp(proto, "HTTP/", 5) != 0)
433 goto bad;
434 strncpy(majorstr, proto + 5, sizeof majorstr);
435 majorstr[sizeof(majorstr)-1] = 0;
436 minorstr = strchr(majorstr, '.');
437 if (minorstr == NULL)
438 goto bad;
439 *minorstr++ = 0;
440
441 majorint = atoi(majorstr);
442 minorint = atoi(minorstr);
443
444 switch (majorint) {
445 case 0:
446 if (minorint != 9)
447 break;
448 goto got_proto_09;
449 case 1:
450 if (minorint == 0)
451 request->hr_proto = request->hr_httpd->consts.http_10;
452 else if (minorint == 1)
453 request->hr_proto = request->hr_httpd->consts.http_11;
454 else
455 break;
456
457 debug((request->hr_httpd, DEBUG_FAT, "request %s is %s",
458 request->hr_file, request->hr_proto));
459 SIMPLEQ_INIT(&request->hr_headers);
460 request->hr_nheaders = 0;
461 return 0;
462 }
463 bad:
464 return bozo_http_error(request->hr_httpd, 404, NULL, "unknown prototype");
465 }
466
467 /*
468 * process each type of HTTP method, setting this HTTP requests
469 # method type.
470 */
471 static struct method_map {
472 const char *name;
473 int type;
474 } method_map[] = {
475 { "GET", HTTP_GET, },
476 { "POST", HTTP_POST, },
477 { "HEAD", HTTP_HEAD, },
478 #if 0 /* other non-required http/1.1 methods */
479 { "OPTIONS", HTTP_OPTIONS, },
480 { "PUT", HTTP_PUT, },
481 { "DELETE", HTTP_DELETE, },
482 { "TRACE", HTTP_TRACE, },
483 { "CONNECT", HTTP_CONNECT, },
484 #endif
485 { NULL, 0, },
486 };
487
488 static int
489 process_method(bozo_httpreq_t *request, const char *method)
490 {
491 struct method_map *mmp;
492
493 if (request->hr_proto == request->hr_httpd->consts.http_11)
494 request->hr_allow = "GET, HEAD, POST";
495
496 for (mmp = method_map; mmp->name; mmp++)
497 if (strcasecmp(method, mmp->name) == 0) {
498 request->hr_method = mmp->type;
499 request->hr_methodstr = mmp->name;
500 return 0;
501 }
502
503 return bozo_http_error(request->hr_httpd, 404, request, "unknown method");
504 }
505
506 /*
507 * This function reads a http request from stdin, returning a pointer to a
508 * bozo_httpreq_t structure, describing the request.
509 */
510 bozo_httpreq_t *
511 bozo_read_request(bozohttpd_t *httpd)
512 {
513 struct sigaction sa;
514 char *str, *val, *method, *file, *proto, *query;
515 char *host, *addr, *port;
516 char bufport[10];
517 char hbuf[NI_MAXHOST], abuf[NI_MAXHOST];
518 struct sockaddr_storage ss;
519 ssize_t len;
520 int line = 0;
521 socklen_t slen;
522 bozo_httpreq_t *request;
523
524 /*
525 * if we're in daemon mode, bozo_daemon_fork() will return here twice
526 * for each call. once in the child, returning 0, and once in the
527 * parent, returning 1. for each child, then we can setup SSL, and
528 * the parent can signal the caller there was no request to process
529 * and it will wait for another.
530 */
531 if (bozo_daemon_fork(httpd))
532 return NULL;
533 bozo_ssl_accept(httpd);
534
535 request = bozomalloc(httpd, sizeof(*request));
536 memset(request, 0, sizeof(*request));
537 request->hr_httpd = httpd;
538 request->hr_allow = request->hr_host = NULL;
539 request->hr_content_type = request->hr_content_length = NULL;
540 request->hr_range = NULL;
541 request->hr_last_byte_pos = -1;
542 request->hr_if_modified_since = NULL;
543 request->hr_virthostname = NULL;
544 request->hr_file = NULL;
545 request->hr_oldfile = NULL;
546
547 slen = sizeof(ss);
548 if (getpeername(0, (struct sockaddr *)(void *)&ss, &slen) < 0)
549 host = addr = NULL;
550 else {
551 if (getnameinfo((struct sockaddr *)(void *)&ss, slen,
552 abuf, sizeof abuf, NULL, 0, NI_NUMERICHOST) == 0)
553 addr = abuf;
554 else
555 addr = NULL;
556 if (httpd->numeric == 0 &&
557 getnameinfo((struct sockaddr *)(void *)&ss, slen,
558 hbuf, sizeof hbuf, NULL, 0, 0) == 0)
559 host = hbuf;
560 else
561 host = NULL;
562 }
563 if (host != NULL)
564 request->hr_remotehost = bozostrdup(request->hr_httpd, host);
565 if (addr != NULL)
566 request->hr_remoteaddr = bozostrdup(request->hr_httpd, addr);
567 slen = sizeof(ss);
568
569 /*
570 * Override the bound port from the request value, so it works even
571 * if passed through a proxy that doesn't rewrite the port.
572 */
573 if (httpd->bindport) {
574 if (strcmp(httpd->bindport, "80") != 0)
575 port = httpd->bindport;
576 else
577 port = NULL;
578 } else {
579 if (getsockname(0, (struct sockaddr *)(void *)&ss, &slen) < 0)
580 port = NULL;
581 else {
582 if (getnameinfo((struct sockaddr *)(void *)&ss, slen, NULL, 0,
583 bufport, sizeof bufport, NI_NUMERICSERV) == 0)
584 port = bufport;
585 else
586 port = NULL;
587 }
588 }
589 if (port != NULL)
590 request->hr_serverport = bozostrdup(request->hr_httpd, port);
591
592 /*
593 * setup a timer to make sure the request is not hung
594 */
595 sa.sa_handler = alarmer;
596 sigemptyset(&sa.sa_mask);
597 sigaddset(&sa.sa_mask, SIGALRM);
598 sa.sa_flags = 0;
599 sigaction(SIGALRM, &sa, NULL); /* XXX */
600
601 alarm(MAX_WAIT_TIME);
602 while ((str = bozodgetln(httpd, STDIN_FILENO, &len, bozo_read)) != NULL) {
603 alarm(0);
604 if (alarmhit) {
605 (void)bozo_http_error(httpd, 408, NULL,
606 "request timed out");
607 goto cleanup;
608 }
609 line++;
610
611 if (line == 1) {
612
613 if (len < 1) {
614 (void)bozo_http_error(httpd, 404, NULL,
615 "null method");
616 goto cleanup;
617 }
618
619 bozo_warn(httpd, "got request ``%s'' from host %s to port %s",
620 str,
621 host ? host : addr ? addr : "<local>",
622 port ? port : "<stdin>");
623
624 /* we allocate return space in file and query only */
625 parse_request(httpd, str, &method, &file, &query, &proto);
626 request->hr_file = file;
627 request->hr_query = query;
628 if (method == NULL) {
629 (void)bozo_http_error(httpd, 404, NULL,
630 "null method");
631 goto cleanup;
632 }
633 if (file == NULL) {
634 (void)bozo_http_error(httpd, 404, NULL,
635 "null file");
636 goto cleanup;
637 }
638
639 /*
640 * note that we parse the proto first, so that we
641 * can more properly parse the method and the url.
642 */
643
644 if (process_proto(request, proto) ||
645 process_method(request, method)) {
646 goto cleanup;
647 }
648
649 debug((httpd, DEBUG_FAT, "got file \"%s\" query \"%s\"",
650 request->hr_file,
651 request->hr_query ? request->hr_query : "<none>"));
652
653 /* http/0.9 has no header processing */
654 if (request->hr_proto == httpd->consts.http_09)
655 break;
656 } else { /* incoming headers */
657 bozoheaders_t *hdr;
658
659 if (*str == '\0')
660 break;
661
662 val = bozostrnsep(&str, ":", &len);
663 debug((httpd, DEBUG_EXPLODING,
664 "read_req2: after bozostrnsep: str ``%s'' val ``%s''",
665 str, val));
666 if (val == NULL || len == -1) {
667 (void)bozo_http_error(httpd, 404, request,
668 "no header");
669 goto cleanup;
670 }
671 while (*str == ' ' || *str == '\t')
672 len--, str++;
673 while (*val == ' ' || *val == '\t')
674 val++;
675
676 if (bozo_auth_check_headers(request, val, str, len))
677 goto next_header;
678
679 hdr = addmerge_header(request, val, str, len);
680
681 if (strcasecmp(hdr->h_header, "content-type") == 0)
682 request->hr_content_type = hdr->h_value;
683 else if (strcasecmp(hdr->h_header, "content-length") == 0)
684 request->hr_content_length = hdr->h_value;
685 else if (strcasecmp(hdr->h_header, "host") == 0)
686 request->hr_host = hdr->h_value;
687 /* HTTP/1.1 rev06 draft spec: 14.20 */
688 else if (strcasecmp(hdr->h_header, "expect") == 0) {
689 (void)bozo_http_error(httpd, 417, request,
690 "we don't support Expect:");
691 goto cleanup;
692 }
693 else if (strcasecmp(hdr->h_header, "referrer") == 0 ||
694 strcasecmp(hdr->h_header, "referer") == 0)
695 request->hr_referrer = hdr->h_value;
696 else if (strcasecmp(hdr->h_header, "range") == 0)
697 request->hr_range = hdr->h_value;
698 else if (strcasecmp(hdr->h_header,
699 "if-modified-since") == 0)
700 request->hr_if_modified_since = hdr->h_value;
701 else if (strcasecmp(hdr->h_header,
702 "accept-encoding") == 0)
703 request->hr_accept_encoding = hdr->h_value;
704
705 debug((httpd, DEBUG_FAT, "adding header %s: %s",
706 hdr->h_header, hdr->h_value));
707 }
708 next_header:
709 alarm(MAX_WAIT_TIME);
710 }
711
712 /* now, clear it all out */
713 alarm(0);
714 signal(SIGALRM, SIG_DFL);
715
716 /* RFC1945, 8.3 */
717 if (request->hr_method == HTTP_POST &&
718 request->hr_content_length == NULL) {
719 (void)bozo_http_error(httpd, 400, request,
720 "missing content length");
721 goto cleanup;
722 }
723
724 /* HTTP/1.1 draft rev-06, 14.23 & 19.6.1.1 */
725 if (request->hr_proto == httpd->consts.http_11 &&
726 request->hr_host == NULL) {
727 (void)bozo_http_error(httpd, 400, request,
728 "missing Host header");
729 goto cleanup;
730 }
731
732 if (request->hr_range != NULL) {
733 debug((httpd, DEBUG_FAT, "hr_range: %s", request->hr_range));
734 /* support only simple ranges %d- and %d-%d */
735 if (strchr(request->hr_range, ',') == NULL) {
736 const char *rstart, *dash;
737
738 rstart = strchr(request->hr_range, '=');
739 if (rstart != NULL) {
740 rstart++;
741 dash = strchr(rstart, '-');
742 if (dash != NULL && dash != rstart) {
743 dash++;
744 request->hr_have_range = 1;
745 request->hr_first_byte_pos =
746 strtoll(rstart, NULL, 10);
747 if (request->hr_first_byte_pos < 0)
748 request->hr_first_byte_pos = 0;
749 if (*dash != '\0') {
750 request->hr_last_byte_pos =
751 strtoll(dash, NULL, 10);
752 if (request->hr_last_byte_pos < 0)
753 request->hr_last_byte_pos = -1;
754 }
755 }
756 }
757 }
758 }
759
760 debug((httpd, DEBUG_FAT, "bozo_read_request returns url %s in request",
761 request->hr_file));
762 return request;
763
764 cleanup:
765 bozo_clean_request(request);
766
767 return NULL;
768 }
769
770 static int
771 mmap_and_write_part(bozohttpd_t *httpd, int fd, off_t first_byte_pos, size_t sz)
772 {
773 size_t mappedsz, wroffset;
774 off_t mappedoffset;
775 char *addr;
776 void *mappedaddr;
777
778 /*
779 * we need to ensure that both the size *and* offset arguments to
780 * mmap() are page-aligned. our formala for this is:
781 *
782 * input offset: first_byte_pos
783 * input size: sz
784 *
785 * mapped offset = page align truncate (input offset)
786 * mapped size =
787 * page align extend (input offset - mapped offset + input size)
788 * write offset = input offset - mapped offset
789 *
790 * we use the write offset in all writes
791 */
792 mappedoffset = first_byte_pos & ~(httpd->page_size - 1);
793 mappedsz = (size_t)
794 (first_byte_pos - mappedoffset + sz + httpd->page_size - 1) &
795 ~(httpd->page_size - 1);
796 wroffset = (size_t)(first_byte_pos - mappedoffset);
797
798 addr = mmap(0, mappedsz, PROT_READ, MAP_SHARED, fd, mappedoffset);
799 if (addr == (char *)-1) {
800 bozo_warn(httpd, "mmap failed: %s", strerror(errno));
801 return -1;
802 }
803 mappedaddr = addr;
804
805 #ifdef MADV_SEQUENTIAL
806 (void)madvise(addr, sz, MADV_SEQUENTIAL);
807 #endif
808 while (sz > BOZO_WRSZ) {
809 if (bozo_write(httpd, STDOUT_FILENO, addr + wroffset,
810 BOZO_WRSZ) != BOZO_WRSZ) {
811 bozo_warn(httpd, "write failed: %s", strerror(errno));
812 goto out;
813 }
814 debug((httpd, DEBUG_OBESE, "wrote %d bytes", BOZO_WRSZ));
815 sz -= BOZO_WRSZ;
816 addr += BOZO_WRSZ;
817 }
818 if (sz && (size_t)bozo_write(httpd, STDOUT_FILENO, addr + wroffset,
819 sz) != sz) {
820 bozo_warn(httpd, "final write failed: %s", strerror(errno));
821 goto out;
822 }
823 debug((httpd, DEBUG_OBESE, "wrote %d bytes", (int)sz));
824 out:
825 if (munmap(mappedaddr, mappedsz) < 0) {
826 bozo_warn(httpd, "munmap failed");
827 return -1;
828 }
829
830 return 0;
831 }
832
/*
 * parse an HTTP date in any of the three formats tried below, storing
 * the result in *timestamp.
 *
 * returns 1 on success.  returns 0, leaving *timestamp alone, if `val'
 * matches none of the formats or has anything following the date.
 */
static int
parse_http_date(const char *val, time_t *timestamp)
{
	static const char *const formats[] = {
		"%a, %d %b %Y %T GMT",
		"%a, %d-%b-%y %T GMT",
		"%a %b %d %T %Y",
	};
	struct tm tm;
	char *rest = NULL;
	size_t i;

	/* the first format that parses wins */
	for (i = 0; rest == NULL && i < sizeof(formats) / sizeof(formats[0]);
	    i++)
		rest = strptime(val, formats[i], &tm);

	if (rest == NULL)
		return 0;	/* Invalid HTTP date format */
	if (*rest != '\0')
		return 0;	/* No trailing garbage */

	*timestamp = timegm(&tm);
	return 1;
}
850
851 /*
852 * given an url, encode it ala rfc 3986. ie, escape ? and friends.
853 * note that this function returns a static buffer, and thus needs
854 * to be updated for any sort of parallel processing.
855 */
856 char *
857 bozo_escape_rfc3986(bozohttpd_t *httpd, const char *url)
858 {
859 static char *buf;
860 static size_t buflen = 0;
861 size_t len;
862 const char *s;
863 char *d;
864
865 len = strlen(url);
866 if (buflen < len * 3 + 1) {
867 buflen = len * 3 + 1;
868 buf = bozorealloc(httpd, buf, buflen);
869 }
870
871 if (url == NULL) {
872 buf[0] = 0;
873 return buf;
874 }
875
876 for (len = 0, s = url, d = buf; *s;) {
877 if (*s & 0x80)
878 goto encode_it;
879 switch (*s) {
880 case ':':
881 case '/':
882 case '?':
883 case '#':
884 case '[':
885 case ']':
886 case '@':
887 case '!':
888 case '$':
889 case '&':
890 case '\'':
891 case '(':
892 case ')':
893 case '*':
894 case '+':
895 case ',':
896 case ';':
897 case '=':
898 case '%':
899 encode_it:
900 snprintf(d, 4, "%%%2X", *s++);
901 d += 3;
902 len += 3;
903 break;
904 default:
905 *d++ = *s++;
906 len++;
907 break;
908 }
909 }
910 buf[len] = 0;
911
912 return buf;
913 }
914
915 /*
916 * checks to see if this request has a valid .bzdirect file. returns
917 * 0 on failure and 1 on success.
918 */
919 static int
920 check_direct_access(bozo_httpreq_t *request)
921 {
922 FILE *fp;
923 struct stat sb;
924 char dir[MAXPATHLEN], dirfile[MAXPATHLEN], *basename;
925
926 snprintf(dir, sizeof(dir), "%s", request->hr_file + 1);
927 debug((request->hr_httpd, DEBUG_FAT, "check_direct_access: dir %s", dir));
928 basename = strrchr(dir, '/');
929
930 if ((!basename || basename[1] != '\0') &&
931 lstat(dir, &sb) == 0 && S_ISDIR(sb.st_mode))
932 /* nothing */;
933 else if (basename == NULL)
934 strcpy(dir, ".");
935 else {
936 *basename++ = '\0';
937 bozo_check_special_files(request, basename);
938 }
939
940 snprintf(dirfile, sizeof(dirfile), "%s/%s", dir, DIRECT_ACCESS_FILE);
941 if (stat(dirfile, &sb) < 0 ||
942 (fp = fopen(dirfile, "r")) == NULL)
943 return 0;
944 fclose(fp);
945 return 1;
946 }
947
948 /*
949 * do automatic redirection -- if there are query parameters for the URL
950 * we will tack these on to the new (redirected) URL.
951 */
952 static void
953 handle_redirect(bozo_httpreq_t *request,
954 const char *url, int absolute)
955 {
956 bozohttpd_t *httpd = request->hr_httpd;
957 char *urlbuf;
958 char portbuf[20];
959 const char *hostname = BOZOHOST(httpd, request);
960 int query = 0;
961
962 if (url == NULL) {
963 if (asprintf(&urlbuf, "/%s/", request->hr_file) < 0)
964 bozo_err(httpd, 1, "asprintf");
965 url = urlbuf;
966 } else
967 urlbuf = NULL;
968 url = bozo_escape_rfc3986(request->hr_httpd, url);
969
970 if (request->hr_query && strlen(request->hr_query))
971 query = 1;
972
973 if (request->hr_serverport && strcmp(request->hr_serverport, "80") != 0)
974 snprintf(portbuf, sizeof(portbuf), ":%s",
975 request->hr_serverport);
976 else
977 portbuf[0] = '\0';
978 if (absolute)
979 bozo_warn(httpd, "redirecting %s", url);
980 else
981 bozo_warn(httpd, "redirecting %s%s%s", hostname, portbuf, url);
982 debug((httpd, DEBUG_FAT, "redirecting %s", url));
983 bozo_printf(httpd, "%s 301 Document Moved\r\n", request->hr_proto);
984 if (request->hr_proto != httpd->consts.http_09)
985 bozo_print_header(request, NULL, "text/html", NULL);
986 if (request->hr_proto != httpd->consts.http_09) {
987 bozo_printf(httpd, "Location: http://");
988 if (absolute == 0)
989 bozo_printf(httpd, "%s%s", hostname, portbuf);
990 if (query) {
991 bozo_printf(httpd, "%s?%s\r\n", url, request->hr_query);
992 } else {
993 bozo_printf(httpd, "%s\r\n", url);
994 }
995 }
996 bozo_printf(httpd, "\r\n");
997 if (request->hr_method == HTTP_HEAD)
998 goto head;
999 bozo_printf(httpd, "<html><head><title>Document Moved</title></head>\n");
1000 bozo_printf(httpd, "<body><h1>Document Moved</h1>\n");
1001 bozo_printf(httpd, "This document had moved <a href=\"http://");
1002 if (query) {
1003 if (absolute)
1004 bozo_printf(httpd, "%s?%s", url, request->hr_query);
1005 else
1006 bozo_printf(httpd, "%s%s%s?%s", hostname,
1007 portbuf, url, request->hr_query);
1008 } else {
1009 if (absolute)
1010 bozo_printf(httpd, "%s", url);
1011 else
1012 bozo_printf(httpd, "%s%s%s", hostname,
1013 portbuf, url);
1014 }
1015 bozo_printf(httpd, "\">here</a>\n");
1016 bozo_printf(httpd, "</body></html>\n");
1017 head:
1018 bozo_flush(httpd, stdout);
1019 if (urlbuf)
1020 free(urlbuf);
1021 }
1022
1023 /*
1024 * deal with virtual host names; we do this:
1025 * if we have a virtual path root (httpd->virtbase), and we are given a
1026 * virtual host spec (Host: ho.st or http://ho.st/), see if this
1027 * directory exists under httpd->virtbase. if it does, use this as the
1028 # new slashdir.
1029 */
1030 static int
1031 check_virtual(bozo_httpreq_t *request)
1032 {
1033 bozohttpd_t *httpd = request->hr_httpd;
1034 char *file = request->hr_file, *s;
1035 size_t len;
1036
1037 if (!httpd->virtbase)
1038 goto use_slashdir;
1039
1040 /*
1041 * convert http://virtual.host/ to request->hr_host
1042 */
1043 debug((httpd, DEBUG_OBESE, "checking for http:// virtual host in ``%s''",
1044 file));
1045 if (strncasecmp(file, "http://", 7) == 0) {
1046 /* we would do virtual hosting here? */
1047 file += 7;
1048 s = strchr(file, '/');
1049 /* HTTP/1.1 draft rev-06, 5.2: URI takes precedence over Host: */
1050 request->hr_host = file;
1051 request->hr_file = bozostrdup(request->hr_httpd, s ? s : "/");
1052 debug((httpd, DEBUG_OBESE, "got host ``%s'' file is now ``%s''",
1053 request->hr_host, request->hr_file));
1054 } else if (!request->hr_host)
1055 goto use_slashdir;
1056
1057 /*
1058 * ok, we have a virtual host, use scandir(3) to find a case
1059 * insensitive match for the virtual host we are asked for.
1060 * note that if the virtual host is the same as the master,
1061 * we don't need to do anything special.
1062 */
1063 len = strlen(request->hr_host);
1064 debug((httpd, DEBUG_OBESE,
1065 "check_virtual: checking host `%s' under httpd->virtbase `%s' "
1066 "for file `%s'",
1067 request->hr_host, httpd->virtbase, request->hr_file));
1068 if (strncasecmp(httpd->virthostname, request->hr_host, len) != 0) {
1069 s = 0;
1070 DIR *dirp;
1071 struct dirent *d;
1072
1073 if ((dirp = opendir(httpd->virtbase)) != NULL) {
1074 while ((d = readdir(dirp)) != NULL) {
1075 if (strcmp(d->d_name, ".") == 0 ||
1076 strcmp(d->d_name, "..") == 0) {
1077 continue;
1078 }
1079 debug((httpd, DEBUG_OBESE, "looking at dir``%s''",
1080 d->d_name));
1081 if (strncasecmp(d->d_name, request->hr_host,
1082 len) == 0) {
1083 /* found it, punch it */
1084 debug((httpd, DEBUG_OBESE, "found it punch it"));
1085 request->hr_virthostname =
1086 bozostrdup(httpd, d->d_name);
1087 if (asprintf(&s, "%s/%s", httpd->virtbase,
1088 request->hr_virthostname) < 0)
1089 bozo_err(httpd, 1, "asprintf");
1090 break;
1091 }
1092 }
1093 closedir(dirp);
1094 }
1095 else {
1096 debug((httpd, DEBUG_FAT, "opendir %s failed: %s",
1097 httpd->virtbase, strerror(errno)));
1098 }
1099 if (s == 0) {
1100 if (httpd->unknown_slash)
1101 goto use_slashdir;
1102 return bozo_http_error(httpd, 404, request,
1103 "unknown URL");
1104 }
1105 } else
1106 use_slashdir:
1107 s = httpd->slashdir;
1108
1109 /*
1110 * ok, nailed the correct slashdir, chdir to it
1111 */
1112 if (chdir(s) < 0)
1113 return bozo_http_error(httpd, 404, request,
1114 "can't chdir to slashdir");
1115 return 0;
1116 }
1117
1118 /*
1119 * checks to see if this request has a valid .bzredirect file. returns
1120 * 0 when no redirection happend, or 1 when handle_redirect() has been
1121 * called.
1122 */
1123 static int
1124 check_bzredirect(bozo_httpreq_t *request)
1125 {
1126 struct stat sb;
1127 char dir[MAXPATHLEN], redir[MAXPATHLEN], redirpath[MAXPATHLEN + 1],
1128 path[MAXPATHLEN];
1129 char *basename, *finalredir;
1130 int rv, absolute;
1131
1132 /*
1133 * if this pathname is really a directory, but doesn't end in /,
1134 * use it as the directory to look for the redir file.
1135 */
1136 snprintf(dir, sizeof(dir), "%s", request->hr_file + 1);
1137 debug((request->hr_httpd, DEBUG_FAT, "check_bzredirect: dir %s", dir));
1138 basename = strrchr(dir, '/');
1139
1140 if ((!basename || basename[1] != '\0') &&
1141 lstat(dir, &sb) == 0 && S_ISDIR(sb.st_mode))
1142 /* nothing */;
1143 else if (basename == NULL)
1144 strcpy(dir, ".");
1145 else {
1146 *basename++ = '\0';
1147 bozo_check_special_files(request, basename);
1148 }
1149
1150 snprintf(redir, sizeof(redir), "%s/%s", dir, REDIRECT_FILE);
1151 if (lstat(redir, &sb) == 0) {
1152 if (!S_ISLNK(sb.st_mode))
1153 return 0;
1154 absolute = 0;
1155 } else {
1156 snprintf(redir, sizeof(redir), "%s/%s", dir, ABSREDIRECT_FILE);
1157 if (lstat(redir, &sb) < 0 || !S_ISLNK(sb.st_mode))
1158 return 0;
1159 absolute = 1;
1160 }
1161 debug((request->hr_httpd, DEBUG_FAT,
1162 "check_bzredirect: calling readlink"));
1163 rv = readlink(redir, redirpath, sizeof redirpath - 1);
1164 if (rv == -1 || rv == 0) {
1165 debug((request->hr_httpd, DEBUG_FAT, "readlink failed"));
1166 return 0;
1167 }
1168 redirpath[rv] = '\0';
1169 debug((request->hr_httpd, DEBUG_FAT,
1170 "readlink returned \"%s\"", redirpath));
1171
1172 /* check if we need authentication */
1173 snprintf(path, sizeof(path), "%s/", dir);
1174 if (bozo_auth_check(request, path))
1175 return 1;
1176
1177 /* now we have the link pointer, redirect to the real place */
1178 if (absolute)
1179 finalredir = redirpath;
1180 else
1181 snprintf(finalredir = redir, sizeof(redir), "/%s/%s", dir,
1182 redirpath);
1183
1184 debug((request->hr_httpd, DEBUG_FAT,
1185 "check_bzredirect: new redir %s", finalredir));
1186 handle_redirect(request, finalredir, absolute);
1187 return 1;
1188 }
1189
1190 /* this fixes the %HH hack that RFC2396 requires. */
1191 static void
1192 fix_url_percent(bozo_httpreq_t *request)
1193 {
1194 bozohttpd_t *httpd = request->hr_httpd;
1195 char *s, *t, buf[3], *url;
1196 char *end; /* if end is not-zero, we don't translate beyond that */
1197
1198 url = request->hr_file;
1199
1200 end = url + strlen(url);
1201
1202 /* fast forward to the first % */
1203 if ((s = strchr(url, '%')) == NULL)
1204 return;
1205
1206 t = s;
1207 do {
1208 if (end && s >= end) {
1209 debug((httpd, DEBUG_EXPLODING,
1210 "fu_%%: past end, filling out.."));
1211 while (*s)
1212 *t++ = *s++;
1213 break;
1214 }
1215 debug((httpd, DEBUG_EXPLODING,
1216 "fu_%%: got s == %%, s[1]s[2] == %c%c",
1217 s[1], s[2]));
1218 if (s[1] == '\0' || s[2] == '\0') {
1219 (void)bozo_http_error(httpd, 400, request,
1220 "percent hack missing two chars afterwards");
1221 goto copy_rest;
1222 }
1223 if (s[1] == '0' && s[2] == '0') {
1224 (void)bozo_http_error(httpd, 404, request,
1225 "percent hack was %00");
1226 goto copy_rest;
1227 }
1228 if (s[1] == '2' && s[2] == 'f') {
1229 (void)bozo_http_error(httpd, 404, request,
1230 "percent hack was %2f (/)");
1231 goto copy_rest;
1232 }
1233
1234 buf[0] = *++s;
1235 buf[1] = *++s;
1236 buf[2] = '\0';
1237 s++;
1238 *t = (char)strtol(buf, NULL, 16);
1239 debug((httpd, DEBUG_EXPLODING,
1240 "fu_%%: strtol put '%02x' into *t", *t));
1241 if (*t++ == '\0') {
1242 (void)bozo_http_error(httpd, 400, request,
1243 "percent hack got a 0 back");
1244 goto copy_rest;
1245 }
1246
1247 while (*s && *s != '%') {
1248 if (end && s >= end)
1249 break;
1250 *t++ = *s++;
1251 }
1252 } while (*s);
1253 copy_rest:
1254 while (*s) {
1255 if (s >= end)
1256 break;
1257 *t++ = *s++;
1258 }
1259 *t = '\0';
1260 debug((httpd, DEBUG_FAT, "fix_url_percent returns %s in url",
1261 request->hr_file));
1262 }
1263
1264 /*
1265 * transform_request does this:
1266 * - ``expand'' %20 crapola
1267 * - punt if it doesn't start with /
1268 * - check httpd->untrustedref / referrer
1269 * - look for "http://myname/" and deal with it.
1270 * - maybe call bozo_process_cgi()
1271 * - check for ~user and call bozo_user_transform() if so
1272 * - if the length > 1, check for trailing slash. if so,
1273 * add the index.html file
1274 * - if the length is 1, return the index.html file
1275 * - disallow anything ending up with a file starting
1276 * at "/" or having ".." in it.
1277 * - anything else is a really weird internal error
1278 * - returns malloced file to serve, if unhandled
1279 */
1280 static int
1281 transform_request(bozo_httpreq_t *request, int *isindex)
1282 {
1283 bozohttpd_t *httpd = request->hr_httpd;
1284 char *file, *newfile = NULL;
1285 size_t len;
1286 const char *hostname = BOZOHOST(httpd, request);
1287
1288 file = NULL;
1289 *isindex = 0;
1290 debug((httpd, DEBUG_FAT, "tf_req: file %s", request->hr_file));
1291 fix_url_percent(request);
1292 if (check_virtual(request)) {
1293 goto bad_done;
1294 }
1295 file = request->hr_file;
1296
1297 if (file[0] != '/') {
1298 (void)bozo_http_error(httpd, 404, request, "unknown URL");
1299 goto bad_done;
1300 }
1301
1302 if (check_bzredirect(request))
1303 return 0;
1304
1305 if (httpd->untrustedref) {
1306 int to_indexhtml = 0;
1307
1308 #define TOP_PAGE(x) (strcmp((x), "/") == 0 || \
1309 strcmp((x) + 1, httpd->index_html) == 0 || \
1310 strcmp((x) + 1, "favicon.ico") == 0)
1311
1312 debug((httpd, DEBUG_EXPLODING, "checking httpd->untrustedref"));
1313 /*
1314 * first check that this path isn't allowed via .bzdirect file,
1315 * and then check referrer; make sure that people come via the
1316 * real name... otherwise if we aren't looking at / or
1317 * /index.html, redirect... we also special case favicon.ico.
1318 */
1319 if (check_direct_access(request))
1320 /* nothing */;
1321 else if (request->hr_referrer) {
1322 const char *r = request->hr_referrer;
1323
1324 debug((httpd, DEBUG_FAT,
1325 "checking referrer \"%s\" vs virthostname %s",
1326 r, hostname));
1327 if (strncmp(r, "http://", 7) != 0 ||
1328 (strncasecmp(r + 7, hostname,
1329 strlen(hostname)) != 0 &&
1330 !TOP_PAGE(file)))
1331 to_indexhtml = 1;
1332 } else {
1333 const char *h = request->hr_host;
1334
1335 debug((httpd, DEBUG_FAT, "url has no referrer at all"));
1336 /* if there's no referrer, let / or /index.html past */
1337 if (!TOP_PAGE(file) ||
1338 (h && strncasecmp(h, hostname,
1339 strlen(hostname)) != 0))
1340 to_indexhtml = 1;
1341 }
1342
1343 if (to_indexhtml) {
1344 char *slashindexhtml;
1345
1346 if (asprintf(&slashindexhtml, "/%s",
1347 httpd->index_html) < 0)
1348 bozo_err(httpd, 1, "asprintf");
1349 debug((httpd, DEBUG_FAT,
1350 "httpd->untrustedref: redirecting %s to %s",
1351 file, slashindexhtml));
1352 handle_redirect(request, slashindexhtml, 0);
1353 free(slashindexhtml);
1354 return 0;
1355 }
1356 }
1357
1358 len = strlen(file);
1359 if (/*CONSTCOND*/0) {
1360 #ifndef NO_USER_SUPPORT
1361 } else if (len > 1 && httpd->enable_users && file[1] == '~') {
1362 if (file[2] == '\0') {
1363 (void)bozo_http_error(httpd, 404, request,
1364 "missing username");
1365 goto bad_done;
1366 }
1367 if (strchr(file + 2, '/') == NULL) {
1368 handle_redirect(request, NULL, 0);
1369 return 0;
1370 }
1371 debug((httpd, DEBUG_FAT, "calling bozo_user_transform"));
1372
1373 return bozo_user_transform(request, isindex);
1374 #endif /* NO_USER_SUPPORT */
1375 } else if (len > 1) {
1376 debug((httpd, DEBUG_FAT, "file[len-1] == %c", file[len-1]));
1377 if (file[len-1] == '/') { /* append index.html */
1378 *isindex = 1;
1379 debug((httpd, DEBUG_FAT, "appending index.html"));
1380 newfile = bozomalloc(httpd,
1381 len + strlen(httpd->index_html) + 1);
1382 strcpy(newfile, file + 1);
1383 strcat(newfile, httpd->index_html);
1384 } else
1385 newfile = bozostrdup(request->hr_httpd, file + 1);
1386 } else if (len == 1) {
1387 debug((httpd, DEBUG_EXPLODING, "tf_req: len == 1"));
1388 newfile = bozostrdup(request->hr_httpd, httpd->index_html);
1389 *isindex = 1;
1390 } else { /* len == 0 ? */
1391 (void)bozo_http_error(httpd, 500, request,
1392 "request->hr_file is nul?");
1393 goto bad_done;
1394 }
1395
1396 if (newfile == NULL) {
1397 (void)bozo_http_error(httpd, 500, request, "internal failure");
1398 goto bad_done;
1399 }
1400
1401 /*
1402 * look for "http://myname/" and deal with it as necessary.
1403 */
1404
1405 /*
1406 * stop traversing outside our domain
1407 *
1408 * XXX true security only comes from our parent using chroot(2)
1409 * before execve(2)'ing us. or our own built in chroot(2) support.
1410 */
1411 if (*newfile == '/' || strcmp(newfile, "..") == 0 ||
1412 strstr(newfile, "/..") || strstr(newfile, "../")) {
1413 (void)bozo_http_error(httpd, 403, request, "illegal request");
1414 goto bad_done;
1415 }
1416
1417 if (bozo_auth_check(request, newfile))
1418 goto bad_done;
1419
1420 if (strlen(newfile)) {
1421 request->hr_oldfile = request->hr_file;
1422 request->hr_file = newfile;
1423 }
1424
1425 if (bozo_process_cgi(request))
1426 return 0;
1427
1428 debug((httpd, DEBUG_FAT, "transform_request set: %s", newfile));
1429 return 1;
1430 bad_done:
1431 debug((httpd, DEBUG_FAT, "transform_request returning: 0"));
1432 if (newfile)
1433 free(newfile);
1434 return 0;
1435 }
1436
1437 /*
1438 * can_gzip checks if the request supports and prefers gzip encoding.
1439 *
1440 * XXX: we do not consider the associated q with gzip in making our
1441 * decision which is broken.
1442 */
1443
1444 static int
1445 can_gzip(bozo_httpreq_t *request)
1446 {
1447 const char *pos;
1448 const char *tmp;
1449 size_t len;
1450
1451 /* First we decide if the request can be gzipped at all. */
1452
1453 /* not if we already are encoded... */
1454 tmp = bozo_content_encoding(request, request->hr_file);
1455 if (tmp && *tmp)
1456 return 0;
1457
1458 /* not if we are not asking for the whole file... */
1459 if (request->hr_last_byte_pos != -1 || request->hr_have_range)
1460 return 0;
1461
1462 /* Then we determine if gzip is on the cards. */
1463
1464 for (pos = request->hr_accept_encoding; pos && *pos; pos += len) {
1465 while (*pos == ' ')
1466 pos++;
1467
1468 len = strcspn(pos, ";,");
1469
1470 if ((len == 4 && strncasecmp("gzip", pos, 4) == 0) ||
1471 (len == 6 && strncasecmp("x-gzip", pos, 6) == 0))
1472 return 1;
1473
1474 if (pos[len] == ';')
1475 len += strcspn(&pos[len], ",");
1476
1477 if (pos[len])
1478 len++;
1479 }
1480
1481 return 0;
1482 }
1483
1484 /*
1485 * bozo_process_request does the following:
1486 * - check the request is valid
1487 * - process cgi-bin if necessary
1488 * - transform a filename if necesarry
1489 * - return the HTTP request
1490 */
1491 void
1492 bozo_process_request(bozo_httpreq_t *request)
1493 {
1494 bozohttpd_t *httpd = request->hr_httpd;
1495 struct stat sb;
1496 time_t timestamp;
1497 char *file;
1498 const char *type, *encoding;
1499 int fd, isindex;
1500
1501 /*
1502 * note that transform_request chdir()'s if required. also note
1503 * that cgi is handed here. if transform_request() returns 0
1504 * then the request has been handled already.
1505 */
1506 if (transform_request(request, &isindex) == 0)
1507 return;
1508
1509 fd = -1;
1510 encoding = NULL;
1511 if (can_gzip(request)) {
1512 asprintf(&file, "%s.gz", request->hr_file);
1513 fd = open(file, O_RDONLY);
1514 if (fd >= 0)
1515 encoding = "gzip";
1516 free(file);
1517 }
1518
1519 file = request->hr_file;
1520
1521 if (fd < 0)
1522 fd = open(file, O_RDONLY);
1523
1524 if (fd < 0) {
1525 debug((httpd, DEBUG_FAT, "open failed: %s", strerror(errno)));
1526 if (errno == EPERM)
1527 (void)bozo_http_error(httpd, 403, request,
1528 "no permission to open file");
1529 else if (errno == ENOENT) {
1530 if (!bozo_dir_index(request, file, isindex))
1531 (void)bozo_http_error(httpd, 404, request,
1532 "no file");
1533 } else
1534 (void)bozo_http_error(httpd, 500, request, "open file");
1535 goto cleanup_nofd;
1536 }
1537 if (fstat(fd, &sb) < 0) {
1538 (void)bozo_http_error(httpd, 500, request, "can't fstat");
1539 goto cleanup;
1540 }
1541 if (S_ISDIR(sb.st_mode)) {
1542 handle_redirect(request, NULL, 0);
1543 goto cleanup;
1544 }
1545
1546 if (request->hr_if_modified_since &&
1547 parse_http_date(request->hr_if_modified_since, ×tamp) &&
1548 timestamp >= sb.st_mtime) {
1549 /* XXX ignore subsecond of timestamp */
1550 bozo_printf(httpd, "%s 304 Not Modified\r\n",
1551 request->hr_proto);
1552 bozo_printf(httpd, "\r\n");
1553 bozo_flush(httpd, stdout);
1554 goto cleanup;
1555 }
1556
1557 /* validate requested range */
1558 if (request->hr_last_byte_pos == -1 ||
1559 request->hr_last_byte_pos >= sb.st_size)
1560 request->hr_last_byte_pos = sb.st_size - 1;
1561 if (request->hr_have_range &&
1562 request->hr_first_byte_pos > request->hr_last_byte_pos) {
1563 request->hr_have_range = 0; /* punt */
1564 request->hr_first_byte_pos = 0;
1565 request->hr_last_byte_pos = sb.st_size - 1;
1566 }
1567 debug((httpd, DEBUG_FAT, "have_range %d first_pos %lld last_pos %lld",
1568 request->hr_have_range,
1569 (long long)request->hr_first_byte_pos,
1570 (long long)request->hr_last_byte_pos));
1571 if (request->hr_have_range)
1572 bozo_printf(httpd, "%s 206 Partial Content\r\n",
1573 request->hr_proto);
1574 else
1575 bozo_printf(httpd, "%s 200 OK\r\n", request->hr_proto);
1576
1577 if (request->hr_proto != httpd->consts.http_09) {
1578 type = bozo_content_type(request, file);
1579 if (!encoding)
1580 encoding = bozo_content_encoding(request, file);
1581
1582 bozo_print_header(request, &sb, type, encoding);
1583 bozo_printf(httpd, "\r\n");
1584 }
1585 bozo_flush(httpd, stdout);
1586
1587 if (request->hr_method != HTTP_HEAD) {
1588 off_t szleft, cur_byte_pos;
1589
1590 szleft =
1591 request->hr_last_byte_pos - request->hr_first_byte_pos + 1;
1592 cur_byte_pos = request->hr_first_byte_pos;
1593
1594 retry:
1595 while (szleft) {
1596 size_t sz;
1597
1598 /* This should take care of the first unaligned chunk */
1599 if ((cur_byte_pos & (httpd->page_size - 1)) != 0)
1600 sz = (size_t)(cur_byte_pos & ~httpd->page_size);
1601 if ((off_t)httpd->mmapsz < szleft)
1602 sz = httpd->mmapsz;
1603 else
1604 sz = (size_t)szleft;
1605 if (mmap_and_write_part(httpd, fd, cur_byte_pos, sz)) {
1606 if (errno == ENOMEM) {
1607 httpd->mmapsz /= 2;
1608 if (httpd->mmapsz >= httpd->page_size)
1609 goto retry;
1610 }
1611 goto cleanup;
1612 }
1613 cur_byte_pos += sz;
1614 szleft -= sz;
1615 }
1616 }
1617 cleanup:
1618 close(fd);
1619 cleanup_nofd:
1620 close(STDIN_FILENO);
1621 close(STDOUT_FILENO);
1622 /*close(STDERR_FILENO);*/
1623 }
1624
1625 /* make sure we're not trying to access special files */
1626 int
1627 bozo_check_special_files(bozo_httpreq_t *request, const char *name)
1628 {
1629 bozohttpd_t *httpd = request->hr_httpd;
1630
1631 /* ensure basename(name) != special files */
1632 if (strcmp(name, DIRECT_ACCESS_FILE) == 0)
1633 return bozo_http_error(httpd, 403, request,
1634 "no permission to open direct access file");
1635 if (strcmp(name, REDIRECT_FILE) == 0)
1636 return bozo_http_error(httpd, 403, request,
1637 "no permission to open redirect file");
1638 if (strcmp(name, ABSREDIRECT_FILE) == 0)
1639 return bozo_http_error(httpd, 403, request,
1640 "no permission to open redirect file");
1641 return bozo_auth_check_special_files(request, name);
1642 }
1643
1644 /* generic header printing routine */
1645 void
1646 bozo_print_header(bozo_httpreq_t *request,
1647 struct stat *sbp, const char *type, const char *encoding)
1648 {
1649 bozohttpd_t *httpd = request->hr_httpd;
1650 off_t len;
1651 char date[40];
1652
1653 bozo_printf(httpd, "Date: %s\r\n", bozo_http_date(date, sizeof(date)));
1654 bozo_printf(httpd, "Server: %s\r\n", httpd->server_software);
1655 bozo_printf(httpd, "Accept-Ranges: bytes\r\n");
1656 if (sbp) {
1657 char filedate[40];
1658 struct tm *tm;
1659
1660 tm = gmtime(&sbp->st_mtime);
1661 strftime(filedate, sizeof filedate,
1662 "%a, %d %b %Y %H:%M:%S GMT", tm);
1663 bozo_printf(httpd, "Last-Modified: %s\r\n", filedate);
1664 }
1665 if (type && *type)
1666 bozo_printf(httpd, "Content-Type: %s\r\n", type);
1667 if (encoding && *encoding)
1668 bozo_printf(httpd, "Content-Encoding: %s\r\n", encoding);
1669 if (sbp) {
1670 if (request->hr_have_range) {
1671 len = request->hr_last_byte_pos -
1672 request->hr_first_byte_pos +1;
1673 bozo_printf(httpd,
1674 "Content-Range: bytes %qd-%qd/%qd\r\n",
1675 (long long) request->hr_first_byte_pos,
1676 (long long) request->hr_last_byte_pos,
1677 (long long) sbp->st_size);
1678 } else
1679 len = sbp->st_size;
1680 bozo_printf(httpd, "Content-Length: %qd\r\n", (long long)len);
1681 }
1682 if (request && request->hr_proto == httpd->consts.http_11)
1683 bozo_printf(httpd, "Connection: close\r\n");
1684 bozo_flush(httpd, stdout);
1685 }
1686
1687 #ifndef NO_DEBUG
1688 void
1689 debug__(bozohttpd_t *httpd, int level, const char *fmt, ...)
1690 {
1691 va_list ap;
1692 int savederrno;
1693
1694 /* only log if the level is low enough */
1695 if (httpd->debug < level)
1696 return;
1697
1698 savederrno = errno;
1699 va_start(ap, fmt);
1700 if (httpd->logstderr) {
1701 vfprintf(stderr, fmt, ap);
1702 fputs("\n", stderr);
1703 } else
1704 vsyslog(LOG_DEBUG, fmt, ap);
1705 va_end(ap);
1706 errno = savederrno;
1707 }
1708 #endif /* NO_DEBUG */
1709
1710 /* these are like warn() and err(), except for syslog not stderr */
1711 void
1712 bozo_warn(bozohttpd_t *httpd, const char *fmt, ...)
1713 {
1714 va_list ap;
1715
1716 va_start(ap, fmt);
1717 if (httpd->logstderr || isatty(STDERR_FILENO)) {
1718 //fputs("warning: ", stderr);
1719 vfprintf(stderr, fmt, ap);
1720 fputs("\n", stderr);
1721 } else
1722 vsyslog(LOG_INFO, fmt, ap);
1723 va_end(ap);
1724 }
1725
1726 void
1727 bozo_err(bozohttpd_t *httpd, int code, const char *fmt, ...)
1728 {
1729 va_list ap;
1730
1731 va_start(ap, fmt);
1732 if (httpd->logstderr || isatty(STDERR_FILENO)) {
1733 //fputs("error: ", stderr);
1734 vfprintf(stderr, fmt, ap);
1735 fputs("\n", stderr);
1736 } else
1737 vsyslog(LOG_ERR, fmt, ap);
1738 va_end(ap);
1739 exit(code);
1740 }
1741
1742 /*
1743 * this escapes HTML tags. returns allocated escaped
1744 * string if needed, or NULL on allocation failure or
1745 * lack of escape need.
1746 * call with NULL httpd in error paths, to avoid recursive
1747 * malloc failure. call with valid httpd in normal paths
1748 * to get automatic allocation failure handling.
1749 */
1750 char *
1751 bozo_escape_html(bozohttpd_t *httpd, const char *url)
1752 {
1753 int i, j;
1754 char *tmp;
1755 size_t len;
1756
1757 for (i = 0, j = 0; url[i]; i++) {
1758 switch (url[i]) {
1759 case '<':
1760 case '>':
1761 j += 4;
1762 break;
1763 case '&':
1764 j += 5;
1765 break;
1766 }
1767 }
1768
1769 if (j == 0)
1770 return NULL;
1771
1772 /*
1773 * we need to handle being called from different
1774 * pathnames.
1775 */
1776 len = strlen(url) + j;
1777 if (httpd)
1778 tmp = bozomalloc(httpd, len);
1779 else if ((tmp = malloc(len)) == 0)
1780 return NULL;
1781
1782 for (i = 0, j = 0; url[i]; i++) {
1783 switch (url[i]) {
1784 case '<':
1785 memcpy(tmp + j, "<", 4);
1786 j += 4;
1787 break;
1788 case '>':
1789 memcpy(tmp + j, ">", 4);
1790 j += 4;
1791 break;
1792 case '&':
1793 memcpy(tmp + j, "&", 5);
1794 j += 5;
1795 break;
1796 default:
1797 tmp[j++] = url[i];
1798 }
1799 }
1800 tmp[j] = 0;
1801
1802 return tmp;
1803 }
1804
/*
 * map between an HTTP error code and its short (status line) and
 * long (explanatory) message.  the entry with code 0 ends the table.
 */
static struct errors_map {
	int	code;			/* HTTP return code */
	const char *shortmsg;		/* short version of message */
	const char *longmsg;		/* long version of message */
} errors_map[] = {
	{ 400, "400 Bad Request",
	       "The request was not valid", },
	{ 401, "401 Unauthorized",
	       "No authorization", },
	{ 403, "403 Forbidden",
	       "Access to this item has been denied", },
	{ 404, "404 Not Found",
	       "This item has not been found", },
	{ 408, "408 Request Timeout",
	       "This request took too long", },
	{ 417, "417 Expectation Failed",
	       "Expectations not available", },
	{ 500, "500 Internal Error",
	       "An error occured on the server", },
	{ 501, "501 Not Implemented",
	       "This request is not available", },
	{ 0,   NULL, NULL, },
};

/* what we say about a code that is not in the table */
static const char *help = "DANGER! WILL ROBINSON! DANGER!";

/* finds the table entry for `code', or NULL when there is none */
static struct errors_map *
errors_map_find(int code)
{
	struct errors_map *entry = errors_map;

	while (entry->code != 0) {
		if (entry->code == code)
			return entry;
		entry++;
	}
	return NULL;
}

/* returns the short message for `code', or `help' for unknown codes */
static const char *
http_errors_short(int code)
{
	struct errors_map *entry = errors_map_find(code);

	return entry != NULL ? entry->shortmsg : help;
}

/* returns the long message for `code', or `help' for unknown codes */
static const char *
http_errors_long(int code)
{
	struct errors_map *entry = errors_map_find(code);

	return entry != NULL ? entry->longmsg : help;
}
1845
1846 /* the follow functions and variables are used in handling HTTP errors */
1847 /* ARGSUSED */
1848 int
1849 bozo_http_error(bozohttpd_t *httpd, int code, bozo_httpreq_t *request,
1850 const char *msg)
1851 {
1852 char portbuf[20];
1853 const char *header = http_errors_short(code);
1854 const char *reason = http_errors_long(code);
1855 const char *proto = (request && request->hr_proto) ?
1856 request->hr_proto : httpd->consts.http_11;
1857 const char *hostname = BOZOHOST(httpd, request);
1858 int size;
1859
1860 debug((httpd, DEBUG_FAT, "bozo_http_error %d: %s", code, msg));
1861 if (header == NULL || reason == NULL) {
1862 bozo_err(httpd, 1,
1863 "bozo_http_error() failed (short = %p, long = %p)",
1864 header, reason);
1865 return code;
1866 }
1867
1868 if (request && request->hr_serverport &&
1869 strcmp(request->hr_serverport, "80") != 0)
1870 snprintf(portbuf, sizeof(portbuf), ":%s",
1871 request->hr_serverport);
1872 else
1873 portbuf[0] = '\0';
1874
1875 if (request && request->hr_file) {
1876 char *file = NULL;
1877
1878 /* bozo_escape_html() failure here is just too bad. */
1879 file = bozo_escape_html(NULL, request->hr_file);
1880 if (file == NULL)
1881 file = request->hr_file;
1882 size = snprintf(httpd->errorbuf, BUFSIZ,
1883 "<html><head><title>%s</title></head>\n"
1884 "<body><h1>%s</h1>\n"
1885 "%s: <pre>%s</pre>\n"
1886 "<hr><address><a href=\"http://%s%s/\">%s%s</a></address>\n"
1887 "</body></html>\n",
1888 header, header, file, reason,
1889 hostname, portbuf, hostname, portbuf);
1890 if (size >= (int)BUFSIZ) {
1891 bozo_warn(httpd,
1892 "bozo_http_error buffer too small, truncated");
1893 size = (int)BUFSIZ;
1894 }
1895 } else
1896 size = 0;
1897
1898 bozo_printf(httpd, "%s %s\r\n", proto, header);
1899 if (request)
1900 bozo_auth_check_401(request, code);
1901
1902 bozo_printf(httpd, "Content-Type: text/html\r\n");
1903 bozo_printf(httpd, "Content-Length: %d\r\n", size);
1904 bozo_printf(httpd, "Server: %s\r\n", httpd->server_software);
1905 if (request && request->hr_allow)
1906 bozo_printf(httpd, "Allow: %s\r\n", request->hr_allow);
1907 bozo_printf(httpd, "\r\n");
1908 if (size)
1909 bozo_printf(httpd, "%s", httpd->errorbuf);
1910 bozo_flush(httpd, stdout);
1911
1912 return code;
1913 }
1914
1915 /* Below are various modified libc functions */
1916
/*
 * strsep() with a limit on the number of characters examined.  every
 * character looked at, including a terminating nul, first decrements
 * *lenp; when that makes *lenp reach -1 the string ran out before a
 * delimiter was found, and NULL is returned with *strp untouched.
 * otherwise this behaves like strsep(): the token is nul terminated
 * in place and *strp moves past the delimiter, or becomes NULL when
 * the token was ended by the end of the string.  no limit applies
 * when lenp is NULL.  Note that the length must be correctly passed
 * in.
 */
char *
bozostrnsep(char **strp, const char *delim, ssize_t	*lenp)
{
	char	*token = *strp;
	char	*cursor;
	int	ch;

	if (token == NULL)
		return NULL;

	for (cursor = token;; ) {
		if (lenp != NULL && --(*lenp) == -1)
			return NULL;

		ch = *cursor++;
		/* strchr() also matches the nul that ends delim */
		if (strchr(delim, ch) == NULL)
			continue;

		if (ch == '\0')
			cursor = NULL;		/* no more tokens */
		else
			cursor[-1] = '\0';	/* cut at the delimiter */
		*strp = cursor;
		return token;
	}
	/* NOTREACHED */
}
1950
1951 /*
1952 * inspired by fgetln(3), but works for fd's. should work identically
1953 * except it, however, does *not* return the newline, and it does nul
1954 * terminate the string.
1955 */
1956 char *
1957 bozodgetln(bozohttpd_t *httpd, int fd, ssize_t *lenp,
1958 ssize_t (*readfn)(bozohttpd_t *, int, void *, size_t))
1959 {
1960 ssize_t len;
1961 int got_cr = 0;
1962 char c, *nbuffer;
1963
1964 /* initialise */
1965 if (httpd->getln_buflen == 0) {
1966 /* should be plenty for most requests */
1967 httpd->getln_buflen = 128;
1968 httpd->getln_buffer = malloc((size_t)httpd->getln_buflen);
1969 if (httpd->getln_buffer == NULL) {
1970 httpd->getln_buflen = 0;
1971 return NULL;
1972 }
1973 }
1974 len = 0;
1975
1976 /*
1977 * we *have* to read one byte at a time, to not break cgi
1978 * programs (for we pass stdin off to them). could fix this
1979 * by becoming a fd-passing program instead of just exec'ing
1980 * the program
1981 *
1982 * the above is no longer true, we are the fd-passing
1983 * program already.
1984 */
1985 for (; readfn(httpd, fd, &c, 1) == 1; ) {
1986 debug((httpd, DEBUG_EXPLODING, "bozodgetln read %c", c));
1987
1988 if (len >= httpd->getln_buflen - 1) {
1989 httpd->getln_buflen *= 2;
1990 debug((httpd, DEBUG_EXPLODING, "bozodgetln: "
1991 "reallocating buffer to buflen %zu",
1992 httpd->getln_buflen));
1993 nbuffer = bozorealloc(httpd, httpd->getln_buffer,
1994 (size_t)httpd->getln_buflen);
1995 httpd->getln_buffer = nbuffer;
1996 }
1997
1998 httpd->getln_buffer[len++] = c;
1999 if (c == '\r') {
2000 got_cr = 1;
2001 continue;
2002 } else if (c == '\n') {
2003 /*
2004 * HTTP/1.1 spec says to ignore CR and treat
2005 * LF as the real line terminator. even though
2006 * the same spec defines CRLF as the line
2007 * terminator, it is recommended in section 19.3
2008 * to do the LF trick for tolerance.
2009 */
2010 if (got_cr)
2011 len -= 2;
2012 else
2013 len -= 1;
2014 break;
2015 }
2016
2017 }
2018 httpd->getln_buffer[len] = '\0';
2019 debug((httpd, DEBUG_OBESE, "bozodgetln returns: ``%s'' with len %zd",
2020 httpd->getln_buffer, len));
2021 *lenp = len;
2022 return httpd->getln_buffer;
2023 }
2024
2025 void *
2026 bozorealloc(bozohttpd_t *httpd, void *ptr, size_t size)
2027 {
2028 void *p;
2029
2030 p = realloc(ptr, size);
2031 if (p == NULL) {
2032 (void)bozo_http_error(httpd, 500, NULL,
2033 "memory allocation failure");
2034 exit(1);
2035 }
2036 return (p);
2037 }
2038
2039 void *
2040 bozomalloc(bozohttpd_t *httpd, size_t size)
2041 {
2042 void *p;
2043
2044 p = malloc(size);
2045 if (p == NULL) {
2046 (void)bozo_http_error(httpd, 500, NULL,
2047 "memory allocation failure");
2048 exit(1);
2049 }
2050 return (p);
2051 }
2052
2053 char *
2054 bozostrdup(bozohttpd_t *httpd, const char *str)
2055 {
2056 char *p;
2057
2058 p = strdup(str);
2059 if (p == NULL) {
2060 (void)bozo_http_error(httpd, 500, NULL,
2061 "memory allocation failure");
2062 exit(1);
2063 }
2064 return (p);
2065 }
2066
2067 /* set default values in bozohttpd_t struct */
2068 int
2069 bozo_init_httpd(bozohttpd_t *httpd)
2070 {
2071 /* make sure everything is clean */
2072 (void) memset(httpd, 0x0, sizeof(*httpd));
2073
2074 /* constants */
2075 httpd->consts.http_09 = "HTTP/0.9";
2076 httpd->consts.http_10 = "HTTP/1.0";
2077 httpd->consts.http_11 = "HTTP/1.1";
2078 httpd->consts.text_plain = "text/plain";
2079
2080 /* mmap region size */
2081 httpd->mmapsz = BOZO_MMAPSZ;
2082
2083 /* error buffer for bozo_http_error() */
2084 if ((httpd->errorbuf = malloc(BUFSIZ)) == NULL) {
2085 (void) fprintf(stderr,
2086 "bozohttpd: memory_allocation failure\n");
2087 return 0;
2088 }
2089 return 1;
2090 }
2091
2092 /* set default values in bozoprefs_t struct */
2093 int
2094 bozo_init_prefs(bozoprefs_t *prefs)
2095 {
2096 /* make sure everything is clean */
2097 (void) memset(prefs, 0x0, sizeof(*prefs));
2098
2099 /* set up default values */
2100 bozo_set_pref(prefs, "server software", SERVER_SOFTWARE);
2101 bozo_set_pref(prefs, "index.html", INDEX_HTML);
2102 bozo_set_pref(prefs, "public_html", PUBLIC_HTML);
2103
2104 return 1;
2105 }
2106
2107 /* set default values */
2108 int
2109 bozo_set_defaults(bozohttpd_t *httpd, bozoprefs_t *prefs)
2110 {
2111 return bozo_init_httpd(httpd) && bozo_init_prefs(prefs);
2112 }
2113
2114 /* set the virtual host name, port and root */
2115 int
2116 bozo_setup(bozohttpd_t *httpd, bozoprefs_t *prefs, const char *vhost,
2117 const char *root)
2118 {
2119 struct passwd *pw;
2120 extern char **environ;
2121 static char *cleanenv[1] = { NULL };
2122 uid_t uid;
2123 char *chrootdir;
2124 char *username;
2125 char *portnum;
2126 char *cp;
2127 int dirtyenv;
2128
2129 dirtyenv = 0;
2130
2131 if (vhost == NULL) {
2132 httpd->virthostname = bozomalloc(httpd, MAXHOSTNAMELEN+1);
2133 /* XXX we do not check for FQDN here */
2134 if (gethostname(httpd->virthostname, MAXHOSTNAMELEN+1) < 0)
2135 bozo_err(httpd, 1, "gethostname");
2136 httpd->virthostname[MAXHOSTNAMELEN] = '\0';
2137 } else {
2138 httpd->virthostname = strdup(vhost);
2139 }
2140 httpd->slashdir = strdup(root);
2141 if ((portnum = bozo_get_pref(prefs, "port number")) != NULL) {
2142 httpd->bindport = strdup(portnum);
2143 }
2144
2145 /* go over preferences now */
2146 if ((cp = bozo_get_pref(prefs, "numeric")) != NULL &&
2147 strcmp(cp, "true") == 0) {
2148 httpd->numeric = 1;
2149 }
2150 if ((cp = bozo_get_pref(prefs, "trusted referal")) != NULL &&
2151 strcmp(cp, "true") == 0) {
2152 httpd->untrustedref = 1;
2153 }
2154 if ((cp = bozo_get_pref(prefs, "log to stderr")) != NULL &&
2155 strcmp(cp, "true") == 0) {
2156 httpd->logstderr = 1;
2157 }
2158 if ((cp = bozo_get_pref(prefs, "bind address")) != NULL) {
2159 httpd->bindaddress = strdup(cp);
2160 }
2161 if ((cp = bozo_get_pref(prefs, "background")) != NULL) {
2162 httpd->background = atoi(cp);
2163 }
2164 if ((cp = bozo_get_pref(prefs, "foreground")) != NULL &&
2165 strcmp(cp, "true") == 0) {
2166 httpd->foreground = 1;
2167 }
2168 if ((cp = bozo_get_pref(prefs, "pid file")) != NULL) {
2169 httpd->pidfile = strdup(cp);
2170 }
2171 if ((cp = bozo_get_pref(prefs, "unknown slash")) != NULL &&
2172 strcmp(cp, "true") == 0) {
2173 httpd->unknown_slash = 1;
2174 }
2175 if ((cp = bozo_get_pref(prefs, "virtual base")) != NULL) {
2176 httpd->virtbase = strdup(cp);
2177 }
2178 if ((cp = bozo_get_pref(prefs, "enable users")) != NULL &&
2179 strcmp(cp, "true") == 0) {
2180 httpd->enable_users = 1;
2181 }
2182 if ((cp = bozo_get_pref(prefs, "dirty environment")) != NULL &&
2183 strcmp(cp, "true") == 0) {
2184 dirtyenv = 1;
2185 }
2186 if ((cp = bozo_get_pref(prefs, "hide dots")) != NULL &&
2187 strcmp(cp, "true") == 0) {
2188 httpd->hide_dots = 1;
2189 }
2190 if ((cp = bozo_get_pref(prefs, "directory indexing")) != NULL &&
2191 strcmp(cp, "true") == 0) {
2192 httpd->dir_indexing = 1;
2193 }
2194 if ((cp = bozo_get_pref(prefs, "public_html")) != NULL) {
2195 httpd->public_html = strdup(cp);
2196 }
2197 httpd->server_software =
2198 strdup(bozo_get_pref(prefs, "server software"));
2199 httpd->index_html = strdup(bozo_get_pref(prefs, "index.html"));
2200
2201 /*
2202 * initialise ssl and daemon mode if necessary.
2203 */
2204 bozo_ssl_init(httpd);
2205 bozo_daemon_init(httpd);
2206
2207 if ((username = bozo_get_pref(prefs, "username")) == NULL) {
2208 if ((pw = getpwuid(uid = 0)) == NULL)
2209 bozo_err(httpd, 1, "getpwuid(0): %s", strerror(errno));
2210 httpd->username = strdup(pw->pw_name);
2211 } else {
2212 httpd->username = strdup(username);
2213 if ((pw = getpwnam(httpd->username)) == NULL)
2214 bozo_err(httpd, 1, "getpwnam(%s): %s", httpd->username,
2215 strerror(errno));
2216 if (initgroups(pw->pw_name, pw->pw_gid) == -1)
2217 bozo_err(httpd, 1, "initgroups: %s", strerror(errno));
2218 if (setgid(pw->pw_gid) == -1)
2219 bozo_err(httpd, 1, "setgid(%u): %s", pw->pw_gid,
2220 strerror(errno));
2221 uid = pw->pw_uid;
2222 }
2223 /*
2224 * handle chroot.
2225 */
2226 if ((chrootdir = bozo_get_pref(prefs, "chroot dir")) != NULL) {
2227 httpd->rootdir = strdup(chrootdir);
2228 if (chdir(httpd->rootdir) == -1)
2229 bozo_err(httpd, 1, "chdir(%s): %s", httpd->rootdir,
2230 strerror(errno));
2231 if (chroot(httpd->rootdir) == -1)
2232 bozo_err(httpd, 1, "chroot(%s): %s", httpd->rootdir,
2233 strerror(errno));
2234 }
2235
2236 if (username != NULL)
2237 if (setuid(uid) == -1)
2238 bozo_err(httpd, 1, "setuid(%d): %s", uid,
2239 strerror(errno));
2240
2241 /*
2242 * prevent info leakage between different compartments.
2243 * some PATH values in the environment would be invalided
2244 * by chroot. cross-user settings might result in undesirable
2245 * effects.
2246 */
2247 if ((chrootdir != NULL || username != NULL) && !dirtyenv)
2248 environ = cleanenv;
2249
2250 #ifdef _SC_PAGESIZE
2251 httpd->page_size = (long)sysconf(_SC_PAGESIZE);
2252 #else
2253 httpd->page_size = 4096;
2254 #endif
2255 debug((httpd, DEBUG_OBESE, "myname is %s, slashdir is %s",
2256 httpd->virthostname, httpd->slashdir));
2257
2258 return 1;
2259 }
2260