bozohttpd.c revision 1.3 1 /* $NetBSD: bozohttpd.c,v 1.3 2007/10/17 18:48:00 tls Exp $ */
2
3 /* $eterna: bozohttpd.c,v 1.137 2006/05/17 08:37:36 mrg Exp $ */
4
5 /*
6 * Copyright (c) 1997-2006 Matthew R. Green
7 * All rights reserved.
8 *
9 * Redistribution and use in source and binary forms, with or without
10 * modification, are permitted provided that the following conditions
11 * are met:
12 * 1. Redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer.
14 * 2. Redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer and
16 * dedication in the documentation and/or other materials provided
17 * with the distribution.
18 * 3. The name of the author may not be used to endorse or promote products
19 * derived from this software without specific prior written permission.
20 *
21 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
22 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
23 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
24 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
25 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
26 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
27 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
28 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
29 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
30 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31 * SUCH DAMAGE.
32 *
33 */
34
35 /* this program is dedicated to the Great God of Processed Cheese */
36
37 /*
38 * bozohttpd.c: minimal httpd; provides only these features:
39 * - HTTP/0.9 (by virtue of ..)
40 * - HTTP/1.0
41 * - HTTP/1.1
42 * - CGI/1.1 this will only be provided for "system" scripts
43 * - automatic "missing trailing slash" redirections
44 * - configurable translation of /~user/ to ~user/public_html,
45 * however, this does not include cgi-bin support
46 * - access lists via libwrap via inetd/tcpd
47 * - virtual hosting
48 * - note that we do not even pretend to understand MIME, but
49 * rely only on the HTTP specification
50 * - ipv6 support
51 * - automatic `index.html' generation
52 * - configurable server name
53 * - directory index generation
54 * - daemon mode (lacks libwrap support)
55 * - .htpasswd support
56 */
57
58 /*
59 * requirements for minimal http/1.1 (at least, as documented in
60 * <draft-ietf-http-v11-spec-rev-06> which expired may 18, 1999):
61 *
62 * - 14.15: content-encoding handling. [1]
63 *
64 * - 14.16: content-length handling. this is only a SHOULD header
65 * thus we could just not send it ever. [1]
66 *
67 * - 14.17: content-type handling. [1]
68 *
69 * - 14.25/28: if-{,un}modified-since handling. maybe do this, but
70 * i really don't want to have to parse 3 different date formats
71 *
72 * [1] need to revisit to ensure proper behaviour
73 *
74 * and the following is a list of features that we do not need
75 * to have due to other limits, or are too lazy. there are more
76 * of these than are listed, but these are of particular note,
77 * and could perhaps be implemented.
78 *
79 * - 3.5/3.6: content/transfer codings. probably can ignore
80 * this? we "SHOULD"n't. but 4.4 says we should ignore a
81 * `content-length' header upon receipt of a `transfer-encoding'
82 * header.
83 *
84 * - 5.1.1: request methods. only MUST support GET and HEAD,
85 * but there are new ones besides POST that are currently
86 * supported: OPTIONS PUT DELETE TRACE and CONNECT, plus
87 * extensions not yet known?
88 *
89 * - 10.1: we can ignore informational status codes
90 *
91 * - 10.3.3/10.3.4/10.3.8: just use '302' codes always.
92 *
93 * - 14.1/14.2/14.3/14.27: we do not support Accept: headers..
94 * just ignore them and send the request anyway. they are
95 * only SHOULD.
96 *
97 * - 14.5/14.16/14.35: we don't do ranges. from section 14.35.2
98 * `A server MAY ignore the Range header'. but it might be nice.
99 *
100 * - 14.9: we aren't a cache.
101 *
102 * - 14.15: content-md5 would be nice...
103 *
104 * - 14.24/14.26/14.27: be nice to support this...
105 *
106 * - 14.44: not sure about this Vary: header. ignore it for now.
107 */
108
109 #ifndef INDEX_HTML
110 #define INDEX_HTML "index.html"
111 #endif
112 #ifndef SERVER_SOFTWARE
113 #define SERVER_SOFTWARE "bozohttpd/20060517"
114 #endif
115 #ifndef DIRECT_ACCESS_FILE
116 #define DIRECT_ACCESS_FILE ".bzdirect"
117 #endif
118 #ifndef REDIRECT_FILE
119 #define REDIRECT_FILE ".bzredirect"
120 #endif
121 #ifndef ABSREDIRECT_FILE
122 #define ABSREDIRECT_FILE ".bzabsredirect"
123 #endif
124
125 /*
126 * And so it begins ..
127 */
128
129 #include <sys/param.h>
130 #include <sys/socket.h>
131 #include <sys/time.h>
132 #include <sys/mman.h>
133
134 #include <arpa/inet.h>
135
136 #include <ctype.h>
137 #include <dirent.h>
138 #include <errno.h>
139 #include <fcntl.h>
140 #include <netdb.h>
141 #include <pwd.h>
142 #include <grp.h>
143 #include <signal.h>
144 #include <stdarg.h>
145 #include <stdlib.h>
146 #include <string.h>
147 #include <syslog.h>
148 #include <time.h>
149 #include <unistd.h>
150
151 #ifndef __attribute__
152 #define __attribute__(x)
153 #endif /* __attribute__ */
154
155 #include "bozohttpd.h"
156
157 #ifndef MAX_WAIT_TIME
158 #define MAX_WAIT_TIME 60 /* hang around for 60 seconds max */
159 #endif
160
161 /* variables and functions */
162
163 int bflag; /* background; drop into daemon mode */
164 int fflag; /* keep daemon mode in foreground */
165 static int eflag; /* don't clean environ; -t/-U only */
166 const char *Iflag = "http";/* bind port; default "http" */
167 int Iflag_set;
168 int dflag = 0; /* debugging level */
169 char *myname; /* my name */
170
171 #ifndef LOG_FTP
172 #define LOG_FTP LOG_DAEMON
173 #endif
174
175 static char *tflag; /* root directory */
176 static char *Uflag; /* user name to switch to */
177 static int Vflag; /* unknown vhosts go to normal slashdir */
178 static int nflag; /* avoid gethostby*() */
179 static int rflag; /* make sure referrer = me unless url = / */
180 static int sflag; /* log to stderr even if it is not a TTY */
181 static char *vpath; /* virtual directory base */
182
183 char *slashdir; /* www slash directory */
184
185 const char *server_software = SERVER_SOFTWARE;
186 const char *index_html = INDEX_HTML;
187 const char http_09[] = "HTTP/0.9";
188 const char http_10[] = "HTTP/1.0";
189 const char http_11[] = "HTTP/1.1";
190 const char text_plain[] = "text/plain";
191
192 static void usage(void);
193 static void alarmer(int);
194 volatile sig_atomic_t alarmhit;
195
196 static void parse_request(char *, char **, char **, char **);
197 static http_req *read_request(void);
198 static struct headers *addmerge_header(http_req *request, char *val,
199 char *str, ssize_t len);
200 static void process_request(http_req *);
201 static int check_direct_access(http_req *request);
202 static char *transform_request(http_req *, int *);
203 static void handle_redirect(http_req *, const char *, int);
204
205 static void check_virtual(http_req *);
206 static void check_bzredirect(http_req *);
207 static void fix_url_percent(http_req *);
208 static void process_method(http_req *, const char *);
209 static void process_proto(http_req *, const char *);
210 static void escape_html(http_req *);
211
212 static const char *http_errors_short(int);
213 static const char *http_errors_long(int);
214
215
216 void *bozomalloc(size_t);
217 void *bozorealloc(void *, size_t);
218 char *bozostrdup(const char *);
219
220 /* bozotic io */
221 int (*bozoprintf)(const char *, ...) = printf;
222 ssize_t (*bozoread)(int, void *, size_t) = read;
223 ssize_t (*bozowrite)(int, const void *, size_t) = write;
224 int (*bozoflush)(FILE *) = fflush;
225
226 char *progname;
227
228 int main(int, char **);
229
230 static void
231 usage(void)
232 {
233 warning("usage: %s [options] slashdir [myname]", progname);
234 warning("options:");
235 #ifdef DEBUG
236 warning(" -d\t\t\tenable debug support");
237 #endif
238 warning(" -s\t\t\talways log to stderr");
239 #ifndef NO_USER_SUPPORT
240 warning(" -u\t\t\tenable ~user/public_html support");
241 warning(" -p dir\t\tchange `public_html' directory name]");
242 #endif
243 #ifndef NO_DYNAMIC_CONTENT
244 warning(" -M arg t c c11\tadd this mime extenstion");
245 #endif
246 #ifndef NO_CGIBIN_SUPPORT
247 #ifndef NO_DYNAMIC_CONTENT
248 warning(" -C arg prog\t\tadd this CGI handler");
249 #endif
250 warning(" -c cgibin\t\tenable cgi-bin support in this directory");
251 #endif
252 #ifndef NO_DAEMON_MODE
253 warning(" -b\t\t\tbackground and go into daemon mode");
254 warning(" -f\t\t\tkeep daemon mode in the foreground");
255 warning(" -i address\t\tbind on this address (daemon mode only)");
256 warning(" -I port\t\tbind on this port (daemon mode only)");
257 #endif
258 warning(" -S version\t\tset server version string");
259 warning(" -t dir\t\tchroot to `dir'");
260 warning(" -U username\t\tchange user to `user'");
261 warning(" -e\t\t\tdon't clean the environment (-t and -U only)");
262 warning(" -v virtualroot\tenable virtual host support in this directory");
263 warning(" -r\t\t\tmake sure sub-pages come from this host via referrer");
264 #ifndef NO_DIRINDEX_SUPPORT
265 warning(" -X\t\t\tenable automatic directory index support");
266 warning(" -H\t\t\thide files starting with a period (.) in index mode");
267 #endif
268 warning(" -x index\t\tchange default `index.html' file name");
269 #ifndef NO_SSL_SUPPORT
270 warning(" -Z cert privkey\tspecify path to server certificate and private key file\n"
271 "\t\t\tin pem format and enable bozohttpd in SSL mode");
272 #endif /* NO_SSL_SUPPORT */
273 error(1, "%s failed to start", progname);
274 }
275
276 int
277 main(int argc, char **argv)
278 {
279 http_req *http_request;
280 extern char **environ;
281 char *cleanenv[1];
282 uid_t uid;
283 int c;
284
285 uid = 0; /* XXX gcc */
286
287 if ((progname = strrchr(argv[0], '/')) != NULL)
288 progname++;
289 else
290 progname = argv[0];
291
292 openlog(progname, LOG_PID|LOG_NDELAY, LOG_FTP);
293
294 while ((c = getopt(argc, argv,
295 "C:HI:M:S:U:VXZ:bc:defhi:np:rst:uv:x:z:")) != -1) {
296 switch(c) {
297
298 case 'M':
299 #ifndef NO_DYNAMIC_CONTENT
300 /* make sure there's four arguments */
301 if (argc - optind < 3)
302 usage();
303 add_content_map_mime(optarg, argv[optind],
304 argv[optind+1], argv[optind+2]);
305 optind += 3;
306 break;
307 #else
308 error(1, "dynmic mime content support is not enabled");
309 /* NOTREACHED */
310 #endif /* NO_DYNAMIC_CONTENT */
311
312 case 'n':
313 nflag = 1;
314 break;
315
316 case 'r':
317 rflag = 1;
318 break;
319
320 case 's':
321 sflag = 1;
322 break;
323
324 case 'S':
325 server_software = optarg;
326 break;
327 case 'Z':
328 #ifndef NO_SSL_SUPPORT
329 /* make sure there's two arguments */
330 if (argc - optind < 1)
331 usage();
332 ssl_set_opts(optarg, argv[optind++]);
333 break;
334 #else
335 error(1, "ssl support is not enabled");
336 /* NOT REACHED */
337 #endif /* NO_SSL_SUPPORT */
338 case 'U':
339 Uflag = optarg;
340 break;
341
342 case 'V':
343 Vflag = 1;
344 break;
345
346 case 'v':
347 vpath = optarg;
348 break;
349
350 case 'x':
351 index_html = optarg;
352 break;
353
354 #ifndef NO_DAEMON_MODE
355 case 'b':
356 bflag = 1;
357 break;
358
359 case 'e':
360 eflag = 1;
361 break;
362
363 case 'f':
364 fflag = 1;
365 break;
366
367 case 'i':
368 iflag = optarg;
369 break;
370
371 case 'I':
372 Iflag_set = 1;
373 Iflag = optarg;
374 break;
375 #else /* NO_DAEMON_MODE */
376 case 'b':
377 case 'i':
378 case 'I':
379 error(1, "Daemon mode is not enabled");
380 /* NOTREACHED */
381 #endif /* NO_DAEMON_MODE */
382
383 #ifndef NO_CGIBIN_SUPPORT
384 case 'c':
385 set_cgibin(optarg);
386 break;
387
388 case 'C':
389 #ifndef NO_DYNAMIC_CONTENT
390 /* make sure there's two arguments */
391 if (argc - optind < 1)
392 usage();
393 add_content_map_cgi(optarg, argv[optind++]);
394 break;
395 #else
396 error(1, "dynmic CGI handler support is not enabled");
397 /* NOTREACHED */
398 #endif /* NO_DYNAMIC_CONTENT */
399
400 #else
401 case 'c':
402 case 'C':
403 error(1, "CGI is not enabled");
404 /* NOTREACHED */
405 #endif /* NO_CGIBIN_SUPPORT */
406
407 case 'd':
408 dflag++;
409 #ifndef DEBUG
410 if (dflag == 1)
411 warning("Debugging is not enabled");
412 #endif /* !DEBUG */
413 break;
414
415 #ifndef NO_USER_SUPPORT
416 case 'p':
417 public_html = optarg;
418 break;
419
420 case 't':
421 tflag = optarg;
422 break;
423
424 case 'u':
425 uflag = 1;
426 break;
427 #else
428 case 'u':
429 case 'p':
430 error(1, "User support is not enabled");
431 /* NOTREACHED */
432 #endif /* NO_USER_SUPPORT */
433
434 #ifndef NO_DIRINDEX_SUPPORT
435 case 'H':
436 Hflag = 1;
437 break;
438
439 case 'X':
440 Xflag = 1;
441 break;
442
443 #else
444 case 'H':
445 case 'X':
446 error(1, "directory indexing is not enabled");
447 /* NOTREACHED */
448 #endif /* NO_DIRINDEX_SUPPORT */
449
450 default:
451 usage();
452 /* NOTREACHED */
453 }
454 }
455 argc -= optind;
456 argv += optind;
457
458 if (argc == 1) {
459 myname = bozomalloc(MAXHOSTNAMELEN+1);
460 /* XXX we do not check for FQDN here */
461 if (gethostname(myname, MAXHOSTNAMELEN+1) < 0)
462 error(1, "gethostname");
463 myname[MAXHOSTNAMELEN] = '\0';
464 } else if (argc == 2)
465 myname = argv[1];
466 else
467 usage();
468
469 slashdir = argv[0];
470 debug((DEBUG_OBESE, "myname is %s, slashdir is %s", myname, slashdir));
471
472 /*
473 * initialise ssl and daemon mode if necessary.
474 */
475 ssl_init();
476 daemon_init();
477
478 /*
479 * prevent info leakage between different compartments.
480 * some PATH values in the environment would be invalided
481 * by chroot. cross-user settings might result in undesirable
482 * effects.
483 */
484 if ((tflag != NULL || Uflag != NULL) && !eflag) {
485 cleanenv[0] = NULL;
486 environ = cleanenv;
487 }
488
489 /*
490 * look up user/group information.
491 */
492 if (Uflag != NULL) {
493 struct passwd *pw;
494
495 if ((pw = getpwnam(Uflag)) == NULL)
496 error(1, "getpwnam(%s): %s", Uflag, strerror(errno));
497 if (initgroups(pw->pw_name, pw->pw_gid) == -1)
498 error(1, "initgroups: %s", strerror(errno));
499 if (setgid(pw->pw_gid) == -1)
500 error(1, "setgid(%u): %s", pw->pw_gid, strerror(errno));
501 uid = pw->pw_uid;
502 }
503
504 /*
505 * handle chroot.
506 */
507 if (tflag != NULL) {
508 if (chdir(tflag) == -1)
509 error(1, "chdir(%s): %s", tflag, strerror(errno));
510 if (chroot(tflag) == -1)
511 error(1, "chroot(%s): %s", tflag, strerror(errno));
512 }
513
514 if (Uflag != NULL)
515 if (setuid(uid) == -1)
516 error(1, "setuid(%d): %s", uid, strerror(errno));
517
518 /*
519 * be sane, don't start serving up files from a
520 * hierarchy we don't have permission to get to.
521 */
522 if (tflag != NULL)
523 if (chdir("/") == -1)
524 error(1, "chdir /: %s", strerror(errno));
525
526 /*
527 * read and process the HTTP request.
528 */
529 do {
530 http_request = read_request();
531 if (http_request) {
532 process_request(http_request);
533 return (0);
534 }
535 } while (bflag);
536
537 return (0);
538 }
539
/*
 * http_date: format the current time as an HTTP date, e.g.
 * "Sun, 06 Nov 1994 08:49:37 GMT".
 *
 * returns a pointer to a static buffer that is overwritten by the next
 * call.  if the time cannot be converted or formatted the buffer holds
 * an empty string rather than indeterminate contents.
 */
char *
http_date(void)
{
	static char date[40];
	struct tm *tm;
	time_t now;

	/* Sun, 06 Nov 1994 08:49:37 GMT */
	now = time(NULL);
	tm = gmtime(&now);	/* HTTP/1.1 spec rev 06 sez GMT only */
	if (tm == NULL ||
	    strftime(date, sizeof date, "%a, %d %b %Y %H:%M:%S GMT", tm) == 0)
		date[0] = '\0';
	return date;
}
553
/*
 * parse_request: carve the request line "in" into its three parts.
 *
 * "in" is tokenised in place with strnsep() (defined elsewhere) using
 * blanks, tabs, CR and LF as separators.  on return *method, *url and
 * *proto either point into "in" or are NULL when that part was not
 * found.
 */
static void
parse_request(char *in, char **method, char **url, char **proto)
{
	ssize_t remaining;
	char *tok;

	/* nothing found yet */
	*proto = NULL;
	*url = NULL;
	*method = NULL;

	remaining = (ssize_t)strlen(in);

	/* first token is the method */
	tok = strnsep(&in, " \t\n\r", &remaining);
	if (tok == NULL || remaining < 1)
		return;
	*method = tok;

	/* skip the blanks between method and url */
	for (; *in == ' ' || *in == '\t'; in++)
		continue;

	/* second token is the url; it may be the last thing on the line */
	tok = strnsep(&in, " \t\n\r", &remaining);
	if (remaining < 1) {
		*url = (remaining == 0) ? tok : in;
		return;
	}
	*url = tok;

	/* whatever follows the url, minus leading blanks, is the protocol */
	if (in == NULL)
		return;
	for (; *in == ' ' || *in == '\t'; in++)
		continue;
	if (*in != '\0')
		*proto = in;
}
588
589 /*
590 * send a HTTP/1.1 408 response if we timeout.
591 */
592 /* ARGSUSED */
593 static void
594 alarmer(int sig)
595 {
596 alarmhit = 1;
597 }
598
599 /*
600 * This function reads a http request from stdin, returning a pointer to a
601 * http_req structure, describing the request.
602 */
603 static http_req *
604 read_request(void)
605 {
606 struct sigaction sa;
607 char *str, *val, *method, *url, *proto;
608 char *host, *addr, *port;
609 char bufport[10];
610 char hbuf[NI_MAXHOST], abuf[NI_MAXHOST];
611 struct sockaddr_storage ss;
612 ssize_t len;
613 int line = 0;
614 socklen_t slen;
615 http_req *request;
616
617 /*
618 * if we're in daemon mode, daemon_fork() will return here once
619 * for each child, then we can setup SSL.
620 */
621 daemon_fork();
622 ssl_accept();
623
624 request = bozomalloc(sizeof *request);
625 memset(request, 0, sizeof *request);
626 request->hr_allow = request->hr_host = NULL;
627 request->hr_content_type = request->hr_content_length = NULL;
628
629 slen = sizeof(ss);
630 if (getpeername(0, (struct sockaddr *)&ss, &slen) < 0)
631 host = addr = NULL;
632 else {
633 if (getnameinfo((struct sockaddr *)&ss, slen,
634 abuf, sizeof abuf, NULL, 0, NI_NUMERICHOST) == 0)
635 addr = abuf;
636 else
637 addr = NULL;
638 if (nflag == 0 && getnameinfo((struct sockaddr *)&ss, slen,
639 hbuf, sizeof hbuf, NULL, 0, 0) == 0)
640 host = hbuf;
641 else
642 host = NULL;
643 }
644 if (host != NULL)
645 request->hr_remotehost = bozostrdup(host);
646 if (addr != NULL)
647 request->hr_remoteaddr = bozostrdup(addr);
648 slen = sizeof(ss);
649 if (getsockname(0, (struct sockaddr *)&ss, &slen) < 0)
650 port = NULL;
651 else {
652 if (getnameinfo((struct sockaddr *)&ss, slen, NULL, 0,
653 bufport, sizeof bufport, NI_NUMERICSERV) == 0)
654 port = bufport;
655 else
656 port = NULL;
657 }
658 if (port != NULL)
659 request->hr_serverport = bozostrdup(port);
660
661 /*
662 * setup a timer to make sure the request is not hung
663 */
664 sa.sa_handler = alarmer;
665 sigemptyset(&sa.sa_mask);
666 sigaddset(&sa.sa_mask, SIGALRM);
667 sa.sa_flags = 0;
668 sigaction(SIGALRM, &sa, NULL); /* XXX */
669
670 alarm(MAX_WAIT_TIME);
671 while ((str = dgetln(STDIN_FILENO, &len, bozoread)) != NULL) {
672 alarm(0);
673 if (alarmhit)
674 http_error(408, NULL, "request timed out");
675 line++;
676
677 if (line == 1) {
678 str = bozostrdup(str); /* we use this copy */
679
680 if (len < 1)
681 http_error(404, NULL, "null method");
682 warning("got request ``%s'' from host %s to port %s",
683 str,
684 host ? host : addr ? addr : "<local>",
685 port ? port : "<stdin>");
686 debug((DEBUG_FAT, "read_req, getting request: ``%s''",
687 str));
688
689 parse_request(str, &method, &url, &proto);
690 if (method == NULL)
691 http_error(404, NULL, "null method");
692 if (url == NULL)
693 http_error(404, NULL, "null url");
694
695 /*
696 * note that we parse the proto first, so that we
697 * can more properly parse the method and the url.
698 */
699 request->hr_url = url;
700 process_proto(request, proto);
701 process_method(request, method);
702
703 /* http/0.9 has no header processing */
704 if (request->hr_proto == http_09)
705 break;
706 } else { /* incoming headers */
707 struct headers *hdr;
708
709 if (*str == '\0')
710 break;
711
712 val = strnsep(&str, ":", &len);
713 debug((DEBUG_EXPLODING,
714 "read_req2: after strnsep: str ``%s'' val ``%s''",
715 str, val));
716 if (val == NULL || len == -1)
717 http_error(404, request, "no header");
718 while (*str == ' ' || *str == '\t')
719 len--, str++;
720
721 if (auth_check_headers(request, val, str, len))
722 goto next_header;
723
724 hdr = addmerge_header(request, val, str, len);
725
726 if (strcasecmp(hdr->h_header, "content-type") == 0)
727 request->hr_content_type = hdr->h_value;
728 else if (strcasecmp(hdr->h_header, "content-length") == 0)
729 request->hr_content_length = hdr->h_value;
730 else if (strcasecmp(hdr->h_header, "host") == 0)
731 request->hr_host = hdr->h_value;
732 /* HTTP/1.1 rev06 draft spec: 14.20 */
733 else if (strcasecmp(hdr->h_header, "expect") == 0)
734 http_error(417, request, "we don't support Expect:");
735 else if (strcasecmp(hdr->h_header, "referrer") == 0 ||
736 strcasecmp(hdr->h_header, "referer") == 0)
737 request->hr_referrer = hdr->h_value;
738
739 debug((DEBUG_FAT, "adding header %s: %s",
740 hdr->h_header, hdr->h_value));
741 }
742 next_header:
743 alarm(MAX_WAIT_TIME);
744 }
745
746 /* now, clear it all out */
747 alarm(0);
748 signal(SIGALRM, SIG_DFL);
749
750 /* RFC1945, 8.3 */
751 if (request->hr_method == HTTP_POST && request->hr_content_length == NULL)
752 http_error(400, request, "missing content length");
753
754 /* HTTP/1.1 draft rev-06, 14.23 & 19.6.1.1 */
755 if (request->hr_proto == http_11 && request->hr_host == NULL)
756 http_error(400, request, "missing Host header");
757
758 debug((DEBUG_FAT, "read_request returns url %s in request", request->hr_url));
759 return (request);
760 }
761
762 /*
763 * add or merge this header (val: str) into the requests list
764 */
765 static struct headers *
766 addmerge_header(http_req *request, char *val, char *str, ssize_t len)
767 {
768 struct headers *hdr;
769 static char space[2] = { ' ', 0 };
770
771 /* do we exist already? */
772 SIMPLEQ_FOREACH(hdr, &request->hr_headers, h_next) {
773 if (strcasecmp(val, hdr->h_header) == 0)
774 break;
775 }
776
777 if (hdr) {
778 /* yup, merge it in */
779 if (hdr->h_value == space)
780 hdr->h_value = bozostrdup(str);
781 else {
782 char *nval;
783
784 if (asprintf(&nval, "%s, %s", hdr->h_value, str) == -1)
785 http_error(500, NULL,
786 "memory allocation failure");
787 free(hdr->h_value);
788 hdr->h_value = nval;
789 }
790 } else {
791 /* nope, create a new one */
792
793 hdr = bozomalloc(sizeof *hdr);
794 hdr->h_header = bozostrdup(val);
795 if (str && *str)
796 hdr->h_value = bozostrdup(str);
797 else
798 hdr->h_value = space;
799
800 SIMPLEQ_INSERT_TAIL(&request->hr_headers, hdr, h_next);
801 request->hr_nheaders++;
802 }
803
804 return hdr;
805 }
806
807 /*
808 * process_request does the following:
809 * - check the request is valid
810 * - process cgi-bin if necessary
811 * - transform a filename if necesarry
812 * - return the HTTP request
813 */
814 static void
815 process_request(http_req *request)
816 {
817 struct stat sb;
818 char *file;
819 const char *type, *encoding;
820 int fd, isindex;
821
822 /*
823 * note that transform_request chdir()'s if required. also note
824 * that cgi is handed here, and a cgi request will never return
825 * back here.
826 */
827 file = transform_request(request, &isindex);
828 if (file == NULL)
829 http_error(404, request, "empty file after transform");
830
831 fd = open(file, O_RDONLY);
832 if (fd < 0) {
833 debug((DEBUG_FAT, "open failed: %s", strerror(errno)));
834 if (errno == EPERM)
835 http_error(403, request, "no permission to open file");
836 else if (errno == ENOENT) {
837 if (directory_index(request, file, isindex))
838 return;
839 http_error(404, request, "no file");
840 } else
841 http_error(500, request, "open file");
842 }
843 if (fstat(fd, &sb) < 0)
844 http_error(500, request, "can't fstat");
845 if (S_ISDIR(sb.st_mode))
846 handle_redirect(request, NULL, 0);
847 /* NOTREACHED */
848 /* XXX RFC1945 10.9 If-Modified-Since (http code 304) */
849
850 bozoprintf("%s 200 OK\r\n", request->hr_proto);
851
852 if (request->hr_proto != http_09) {
853 type = content_type(request, file);
854 encoding = content_encoding(request, file);
855
856 print_header(request, &sb, type, encoding);
857 bozoprintf("\r\n");
858 }
859 bozoflush(stdout);
860
861 if (request->hr_method != HTTP_HEAD) {
862 char *addr;
863 void *oaddr;
864 off_t sz = sb.st_size;
865
866 oaddr = addr = mmap(0, (size_t)sz, PROT_READ,
867 MAP_SHARED, fd, 0);
868 if (addr == (char *)-1)
869 error(1, "mmap failed: %s", strerror(errno));
870
871 #ifdef MADV_SEQUENTIAL
872 madvise(addr, sz, MADV_SEQUENTIAL);
873 #endif
874 while (sz > WRSZ) {
875 if (bozowrite(STDOUT_FILENO, addr, WRSZ) != WRSZ)
876 error(1, "write failed: %s", strerror(errno));
877 sz -= WRSZ;
878 addr += WRSZ;
879 }
880 if (sz && bozowrite(STDOUT_FILENO, addr, sz) != sz)
881 error(1, "final write failed: %s", strerror(errno));
882 if (munmap(oaddr, (size_t)sb.st_size) < 0)
883 warning("munmap failed");
884 }
885 /* If SSL enabled cleanup SSL structure. */
886 ssl_destroy();
887 close(fd);
888 free(file);
889 }
890
891 /*
892 * deal with virtual host names; we do this:
893 * if we have a virtual path root (vpath), and we are given a
894 * virtual host spec (Host: ho.st or http://ho.st/), see if this
895 * directory exists under vpath. if it does, use this as the
896 # new slashdir.
897 */
898 static void
899 check_virtual(http_req *request)
900 {
901 char *url = request->hr_url, *s;
902 struct dirent **list;
903 size_t len;
904 int i;
905
906 if (!vpath)
907 goto use_slashdir;
908
909 /*
910 * convert http://virtual.host/ to request->hr_host
911 */
912 debug((DEBUG_OBESE, "checking for http:// virtual host in ``%s''", url));
913 if (strncasecmp(url, "http://", 7) == 0) {
914 /* we would do virtual hosting here? */
915 url += 7;
916 s = strchr(url, '/');
917 /* HTTP/1.1 draft rev-06, 5.2: URI takes precedence over Host: */
918 request->hr_host = url;
919 request->hr_url = bozostrdup(s ? s : "/");
920 debug((DEBUG_OBESE, "got host ``%s'' url is now ``%s''",
921 request->hr_host, request->hr_url));
922 } else if (!request->hr_host)
923 goto use_slashdir;
924
925
926 /*
927 * ok, we have a virtual host, use scandir(3) to find a case
928 * insensitive match for the virtual host we are asked for.
929 * note that if the virtual host is the same as the master,
930 * we don't need to do anything special.
931 */
932 len = strlen(request->hr_host);
933 debug((DEBUG_OBESE,
934 "check_virtual: checking host `%s' under vpath `%s' for url `%s'",
935 request->hr_host, vpath, request->hr_url));
936 if (strncasecmp(myname, request->hr_host, len) != 0) {
937 s = 0;
938 for (i = scandir(vpath, &list, 0, 0); i--; list++) {
939 debug((DEBUG_OBESE, "looking at dir``%s''",
940 (*list)->d_name));
941 if (strncasecmp((*list)->d_name, request->hr_host,
942 len) == 0) {
943 /* found it, punch it */
944 myname = (*list)->d_name;
945 if (asprintf(&s, "%s/%s", vpath, myname) < 0)
946 error(1, "asprintf");
947 break;
948 }
949 }
950 if (s == 0) {
951 if (Vflag)
952 goto use_slashdir;
953 http_error(404, request, "unknown URL");
954 }
955 } else
956 use_slashdir:
957 s = slashdir;
958
959 /*
960 * ok, nailed the correct slashdir, chdir to it
961 */
962 if (chdir(s) < 0)
963 error(1, "can't chdir %s: %s", s, strerror(errno));
964 }
965
966 /* make sure we're not trying to access special files */
967 void
968 check_special_files(http_req *request, const char *name)
969 {
970 /* ensure basename(name) != special files */
971 if (strcmp(name, DIRECT_ACCESS_FILE) == 0)
972 http_error(403, request,
973 "no permission to open direct access file");
974 if (strcmp(name, REDIRECT_FILE) == 0)
975 http_error(403, request,
976 "no permission to open redirect file");
977 if (strcmp(name, ABSREDIRECT_FILE) == 0)
978 http_error(403, request,
979 "no permission to open redirect file");
980 auth_check_special_files(request, name);
981 }
982
983 /*
984 * checks to see if this request has a valid .bzredirect file. returns
985 * 0 on failure and 1 on success.
986 */
987 static void
988 check_bzredirect(http_req *request)
989 {
990 struct stat sb;
991 char dir[MAXPATHLEN], redir[MAXPATHLEN], redirpath[MAXPATHLEN + 1];
992 char *basename, *finalredir;
993 int rv, absolute;
994
995 /*
996 * if this pathname is really a directory, but doesn't end in /,
997 * use it as the directory to look for the redir file.
998 */
999 snprintf(dir, sizeof(dir), "%s", request->hr_url + 1);
1000 debug((DEBUG_FAT, "check_bzredirect: dir %s", dir));
1001 basename = strrchr(dir, '/');
1002
1003 if ((!basename || basename[1] != '\0') &&
1004 lstat(dir, &sb) == 0 && S_ISDIR(sb.st_mode))
1005 /* nothing */;
1006 else if (basename == NULL)
1007 strcpy(dir, ".");
1008 else {
1009 *basename++ = '\0';
1010 check_special_files(request, basename);
1011 }
1012
1013 snprintf(redir, sizeof(redir), "%s/%s", dir, REDIRECT_FILE);
1014 if (lstat(redir, &sb) == 0) {
1015 if (S_ISLNK(sb.st_mode) == 0)
1016 return;
1017 absolute = 0;
1018 } else {
1019 snprintf(redir, sizeof(redir), "%s/%s", dir, ABSREDIRECT_FILE);
1020 if (lstat(redir, &sb) < 0 || S_ISLNK(sb.st_mode) == 0)
1021 return;
1022 absolute = 1;
1023 }
1024 debug((DEBUG_FAT, "check_bzredirect: calling readlink"));
1025 rv = readlink(redir, redirpath, sizeof redirpath - 1);
1026 if (rv == -1 || rv == 0) {
1027 debug((DEBUG_FAT, "readlink failed"));
1028 return;
1029 }
1030 redirpath[rv] = '\0';
1031 debug((DEBUG_FAT, "readlink returned \"%s\"", redirpath));
1032
1033 /* now we have the link pointer, redirect to the real place */
1034 if (absolute)
1035 finalredir = redirpath;
1036 else
1037 snprintf(finalredir = redir, sizeof(redir), "/%s/%s", dir,
1038 redirpath);
1039
1040 debug((DEBUG_FAT, "check_bzredirect: new redir %s", finalredir));
1041 handle_redirect(request, finalredir, absolute);
1042 }
1043
1044 /*
1045 * checks to see if this request has a valid .bzdirect file. returns
1046 * 0 on failure and 1 on success.
1047 */
1048 static int
1049 check_direct_access(http_req *request)
1050 {
1051 FILE *fp;
1052 struct stat sb;
1053 char dir[MAXPATHLEN], dirfile[MAXPATHLEN], *basename;
1054
1055 snprintf(dir, sizeof(dir), "%s", request->hr_url + 1);
1056 debug((DEBUG_FAT, "check_bzredirect: dir %s", dir));
1057 basename = strrchr(dir, '/');
1058
1059 if ((!basename || basename[1] != '\0') &&
1060 lstat(dir, &sb) == 0 && S_ISDIR(sb.st_mode))
1061 /* nothing */;
1062 else if (basename == NULL)
1063 strcpy(dir, ".");
1064 else {
1065 *basename++ = '\0';
1066 check_special_files(request, basename);
1067 }
1068
1069 snprintf(dirfile, sizeof(dirfile), "%s/%s", dir, DIRECT_ACCESS_FILE);
1070 if (stat(dirfile, &sb) < 0 ||
1071 (fp = fopen(dirfile, "r")) == NULL)
1072 return 0;
1073 fclose(fp);
1074 return 1;
1075 }
1076
1077 /*
1078 * transform_request does this:
1079 * - ``expand'' %20 crapola
1080 * - punt if it doesn't start with /
1081 * - check rflag / referrer
1082 * - look for "http://myname/" and deal with it.
1083 * - maybe call process_cgi()
1084 * - check for ~user and call user_transform() if so
1085 * - if the length > 1, check for trailing slash. if so,
1086 * add the index.html file
1087 * - if the length is 1, return the index.html file
1088 * - disallow anything ending up with a file starting
1089 * at "/" or having ".." in it.
1090 * - anything else is a really weird internal error
1091 */
1092 static char *
1093 transform_request(http_req *request, int *isindex)
1094 {
1095 char *file;
1096 char *url;
1097 size_t len;
1098
1099 file = NULL;
1100 *isindex = 0;
1101 debug((DEBUG_FAT, "tf_req: url %s", request->hr_url));
1102 fix_url_percent(request);
1103 check_virtual(request);
1104 url = request->hr_url;
1105
1106 if (url[0] != '/')
1107 http_error(404, request, "unknown URL");
1108
1109 check_bzredirect(request);
1110
1111 if (rflag) {
1112 int to_indexhtml = 0;
1113
1114 #define TOP_PAGE(x) (strcmp((x), "/") == 0 || \
1115 strcmp((x) + 1, index_html) == 0 || \
1116 strcmp((x) + 1, "favicon.ico") == 0)
1117
1118 debug((DEBUG_EXPLODING, "checking rflag"));
1119 /*
1120 * first check that this path isn't allowed via .bzdirect file,
1121 * and then check referrer; make sure that people come via the
1122 * real name... otherwise if we aren't looking at / or
1123 * /index.html, redirect... we also special case favicon.ico.
1124 */
1125 if (check_direct_access(request))
1126 /* nothing */;
1127 else if (request->hr_referrer) {
1128 const char *r = request->hr_referrer;
1129
1130 debug((DEBUG_FAT,
1131 "checking referrer \"%s\" vs myname %s", r, myname));
1132 if (strncmp(r, "http://", 7) != 0 ||
1133 (strncasecmp(r + 7, myname, strlen(myname)) != 0 &&
1134 !TOP_PAGE(url)))
1135 to_indexhtml = 1;
1136 } else {
1137 const char *h = request->hr_host;
1138
1139 debug((DEBUG_FAT, "url has no referrer at all"));
1140 /* if there's no referrer, let / or /index.html past */
1141 if (!TOP_PAGE(url) ||
1142 (h && strncasecmp(h, myname, strlen(myname)) != 0))
1143 to_indexhtml = 1;
1144 }
1145
1146 if (to_indexhtml) {
1147 char *slashindexhtml;
1148
1149 if (asprintf(&slashindexhtml, "/%s", index_html) < 0)
1150 error(1, "asprintf");
1151 debug((DEBUG_FAT, "rflag: redirecting %s to %s", url, slashindexhtml));
1152 handle_redirect(request, slashindexhtml, 0);
1153 /* NOTREACHED */
1154 }
1155 }
1156
1157 process_cgi(request);
1158
1159 len = strlen(url);
1160 if (0) {
1161 #ifndef NO_USER_SUPPORT
1162 } else if (len > 1 && uflag && url[1] == '~') {
1163 if (url[2] == '\0')
1164 http_error(404, request, "missing username");
1165 if (strchr(url + 2, '/') == NULL)
1166 handle_redirect(request, NULL, 0);
1167 /* NOTREACHED */
1168 debug((DEBUG_FAT, "calling user_transform"));
1169 return (user_transform(request, isindex));
1170 #endif /* NO_USER_SUPPORT */
1171 } else if (len > 1) {
1172 debug((DEBUG_FAT, "url[len-1] == %c", url[len-1]));
1173 if (url[len-1] == '/') { /* append index.html */
1174 *isindex = 1;
1175 debug((DEBUG_FAT, "appending index.html"));
1176 file = bozomalloc(len + strlen(index_html) + 1);
1177 strcpy(file, url + 1);
1178 strcat(file, index_html);
1179 } else
1180 file = bozostrdup(url + 1);
1181 } else if (len == 1) {
1182 debug((DEBUG_EXPLODING, "tf_req: len == 1"));
1183 file = bozostrdup(index_html);
1184 *isindex = 1;
1185 } else /* len == 0 ? */
1186 http_error(500, request, "request->hr_url is nul?");
1187
1188 if (file == NULL)
1189 http_error(500, request, "internal failure");
1190
1191 /*
1192 * look for "http://myname/" and deal with it as necessary.
1193 */
1194
1195 /*
1196 * stop traversing outside our domain
1197 *
1198 * XXX true security only comes from our parent using chroot(2)
1199 * before execve(2)'ing us. or our own built in chroot(2) support.
1200 */
1201 if (*file == '/' || strcmp(file, "..") == 0 ||
1202 strstr(file, "/..") || strstr(file, "../"))
1203 http_error(403, request, "illegal request");
1204
1205 auth_check(request, file);
1206
1207 debug((DEBUG_FAT, "transform_request returned: %s", file));
1208 return (file);
1209 }
1210
1211 /*
1212 * do automatic redirection
1213 */
1214 static void
1215 handle_redirect(http_req *request, const char *url, int absolute)
1216 {
1217 char *urlbuf;
1218 char portbuf[20];
1219
1220 if (url == NULL) {
1221 if (asprintf(&urlbuf, "%s/", request->hr_url) < 0)
1222 error(1, "asprintf");
1223 url = urlbuf;
1224 }
1225 if (request->hr_serverport && strcmp(request->hr_serverport, "80") != 0)
1226 snprintf(portbuf, sizeof(portbuf), ":%s",
1227 request->hr_serverport);
1228 else
1229 portbuf[0] = '\0';
1230 warning("redirecting %s%s%s", myname, portbuf, url);
1231 debug((DEBUG_FAT, "redirecting %s", url));
1232 bozoprintf("%s 301 Document Moved\r\n", request->hr_proto);
1233 if (request->hr_proto != http_09)
1234 print_header(request, NULL, "text/html", NULL);
1235 if (request->hr_proto != http_09) {
1236 bozoprintf("Location: http://");
1237 if (absolute == 0)
1238 bozoprintf("%s%s", myname, portbuf);
1239 bozoprintf("%s\r\n", url);
1240 }
1241 bozoprintf("\r\n");
1242 if (request->hr_method == HTTP_HEAD)
1243 goto head;
1244 bozoprintf("<html><head><title>Document Moved</title></head>\n");
1245 bozoprintf("<body><h1>Document Moved</h1>\n");
1246 bozoprintf("This document had moved <a href=\"http://");
1247 if (absolute)
1248 bozoprintf("%s", url);
1249 else
1250 bozoprintf("%s%s%s", myname, portbuf, url);
1251 bozoprintf("\">here</a>\n");
1252 bozoprintf("</body></html>\n");
1253 head:
1254 bozoflush(stdout);
1255 exit(0);
1256 }
1257
1258 /* generic header printing routine */
1259 void
1260 print_header(http_req *request, struct stat *sbp, const char *type,
1261 const char *encoding)
1262 {
1263 bozoprintf("Date: %s\r\n", http_date());
1264 bozoprintf("Server: %s\r\n", server_software);
1265 if (sbp) {
1266 char filedate[40];
1267 struct tm *tm;
1268
1269 tm = gmtime(&sbp->st_mtime);
1270 strftime(filedate, sizeof filedate,
1271 "%a, %d %b %Y %H:%M:%S GMT", tm);
1272 bozoprintf("Last-Modified: %s\r\n", filedate);
1273 }
1274 if (type && *type)
1275 bozoprintf("Content-Type: %s\r\n", type);
1276 if (encoding && *encoding)
1277 bozoprintf("Content-Encoding: %s\r\n", encoding);
1278 if (sbp)
1279 bozoprintf("Content-Length: %qd\r\n", (long long)sbp->st_size);
1280 if (request && request->hr_proto == http_11)
1281 bozoprintf("Connection: close\r\n");
1282 bozoflush(stdout);
1283 }
1284
1285 /* this escape HTML tags */
1286 static void
1287 escape_html(http_req *request)
1288 {
1289 int i, j;
1290 char *url = request->hr_url, *tmp;
1291
1292 for (i = 0, j = 0; url[i]; i++) {
1293 switch (url[i]) {
1294 case '<':
1295 case '>':
1296 j += 4;
1297 break;
1298 case '&':
1299 j += 5;
1300 break;
1301 }
1302 }
1303
1304 if (j == 0)
1305 return;
1306
1307 if ((tmp = (char *) malloc(strlen(url) + j)) == 0)
1308 /*
1309 * ouch, but we are only called from an error context, and
1310 * most paths here come from malloc(3) failures anyway...
1311 * we could completely punt and just exit, but isn't returning
1312 * an not-quite-correct error better than nothing at all?
1313 */
1314 return;
1315
1316 for (i = 0, j = 0; url[i]; i++) {
1317 switch (url[i]) {
1318 case '<':
1319 memcpy(tmp + j, "<", 4);
1320 j += 4;
1321 break;
1322 case '>':
1323 memcpy(tmp + j, ">", 4);
1324 j += 4;
1325 break;
1326 case '&':
1327 memcpy(tmp + j, "&", 5);
1328 j += 5;
1329 break;
1330 default:
1331 tmp[j++] = url[i];
1332 }
1333 }
1334 tmp[j] = 0;
1335
1336 /*
1337 * XXX original "url" is a substring of an allocation, so we
1338 * can't touch it. so, ignore it and replace the request.
1339 */
1340 request->hr_url = tmp;
1341 }
1342
1343 /* this fixes the %HH hack that RFC2396 requires. */
1344 static void
1345 fix_url_percent(http_req *request)
1346 {
1347 char *s, *t, buf[3], *url;
1348 char *end; /* if end is not-zero, we don't translate beyond that */
1349
1350 url = request->hr_url;
1351
1352 /* make sure we don't translate *too* much */
1353 end = strchr(request->hr_url, '?');
1354
1355 /* fast forward to the first % */
1356 if ((s = strchr(url, '%')) == NULL)
1357 return;
1358
1359 t = s;
1360 do {
1361 if (end && s >= end) {
1362 debug((DEBUG_EXPLODING, "fu_%%: past end, filling out.."));
1363 while (*s)
1364 *t++ = *s++;
1365 break;
1366 }
1367 debug((DEBUG_EXPLODING, "fu_%%: got s == %%, s[1]s[2] == %c%c",
1368 s[1], s[2]));
1369 if (s[1] == '\0' || s[2] == '\0')
1370 http_error(400, request,
1371 "percent hack missing two chars afterwards");
1372 if (s[1] == '0' && s[2] == '0')
1373 http_error(404, request, "percent hack was %00");
1374 if (s[1] == '2' && s[2] == 'f')
1375 http_error(404, request, "percent hack was %2f (/)");
1376
1377 buf[0] = *++s;
1378 buf[1] = *++s;
1379 buf[2] = '\0';
1380 s++;
1381 *t = (char)strtol(buf, NULL, 16);
1382 debug((DEBUG_EXPLODING, "fu_%%: strtol put %c into *t", *t));
1383 if (*t++ == '\0')
1384 http_error(400, request, "percent hack got a 0 back");
1385
1386 while (*s && *s != '%') {
1387 if (s >= end)
1388 break;
1389 *t++ = *s++;
1390 }
1391 } while (*s);
1392 *t = '\0';
1393 debug((DEBUG_FAT, "fix_url_percent returns %s in url", request->hr_url));
1394 }
1395
1396 /*
1397 * process each type of HTTP method, setting this HTTP requests
1398 # method type.
1399 */
1400 static struct method_map {
1401 const char *name;
1402 int type;
1403 } method_map[] = {
1404 { "GET", HTTP_GET, },
1405 { "POST", HTTP_POST, },
1406 { "HEAD", HTTP_HEAD, },
1407 #if 0 /* other non-required http/1.1 methods */
1408 { "OPTIONS", HTTP_OPTIONS, },
1409 { "PUT", HTTP_PUT, },
1410 { "DELETE", HTTP_DELETE, },
1411 { "TRACE", HTTP_TRACE, },
1412 { "CONNECT", HTTP_CONNECT, },
1413 #endif
1414 { NULL, 0, },
1415 };
1416
1417 static void
1418 process_method(http_req *request, const char *method)
1419 {
1420 struct method_map *mmp;
1421
1422 for (mmp = method_map; mmp->name; mmp++)
1423 if (strcasecmp(method, mmp->name) == 0) {
1424 request->hr_method = mmp->type;
1425 request->hr_methodstr = mmp->name;
1426 return;
1427 }
1428
1429 if (request->hr_proto == http_11)
1430 request->hr_allow = "GET, HEAD, POST";
1431 http_error(404, request, "unknown method");
1432 }
1433
1434 /*
1435 * as the prototype string is not constant (eg, "HTTP/1.1" is equivalent
1436 * to "HTTP/001.01"), we MUST parse this.
1437 */
1438 static void
1439 process_proto(http_req *request, const char *proto)
1440 {
1441 char majorstr[16], *minorstr;
1442 int majorint, minorint;
1443
1444 if (proto == NULL) {
1445 got_proto_09:
1446 request->hr_proto = http_09;
1447 debug((DEBUG_FAT, "request %s is http/0.9", request->hr_url));
1448 return;
1449 }
1450
1451 if (strncasecmp(proto, "HTTP/", 5) != 0)
1452 goto bad;
1453 strncpy(majorstr, proto + 5, sizeof majorstr);
1454 majorstr[sizeof(majorstr)-1] = 0;
1455 minorstr = strchr(majorstr, '.');
1456 if (minorstr == NULL)
1457 goto bad;
1458 *minorstr++ = 0;
1459
1460 majorint = atoi(majorstr);
1461 minorint = atoi(minorstr);
1462
1463 switch (majorint) {
1464 case 0:
1465 if (minorint != 9)
1466 break;
1467 goto got_proto_09;
1468 case 1:
1469 if (minorint == 0)
1470 request->hr_proto = http_10;
1471 else if (minorint == 1)
1472 request->hr_proto = http_11;
1473 else
1474 break;
1475
1476 debug((DEBUG_FAT, "request %s is %s", request->hr_url,
1477 request->hr_proto));
1478 SIMPLEQ_INIT(&request->hr_headers);
1479 request->hr_nheaders = 0;
1480 return;
1481 }
1482 bad:
1483 http_error(404, NULL, "unknown prototype");
1484 }
1485
#ifdef DEBUG
/*
 * emit a debug message if its level does not exceed dflag.  with sflag
 * set the message goes to stderr followed by a newline, otherwise to
 * syslog at LOG_DEBUG.  errno is preserved across the call.
 */
void
debug__(int level, const char *fmt, ...)
{
	va_list	args;
	int	errno_save;

	/* only log if the level is low enough */
	if (level > dflag)
		return;

	errno_save = errno;
	va_start(args, fmt);
	if (!sflag) {
		vsyslog(LOG_DEBUG, fmt, args);
	} else {
		vfprintf(stderr, fmt, args);
		fputc('\n', stderr);
	}
	va_end(args);
	errno = errno_save;
}
#endif /* DEBUG */
1508
1509 /* these are like warn() and err(), except for syslog not stderr */
1510 void
1511 warning(const char *fmt, ...)
1512 {
1513 va_list ap;
1514
1515 va_start(ap, fmt);
1516 if (sflag || isatty(STDERR_FILENO)) {
1517 vfprintf(stderr, fmt, ap);
1518 fputs("\n", stderr);
1519 } else
1520 vsyslog(LOG_INFO, fmt, ap);
1521 va_end(ap);
1522 }
1523
1524 void
1525 error(int code, const char *fmt, ...)
1526 {
1527 va_list ap;
1528
1529 va_start(ap, fmt);
1530 if (sflag || isatty(STDERR_FILENO)) {
1531 vfprintf(stderr, fmt, ap);
1532 fputs("\n", stderr);
1533 } else
1534 vsyslog(LOG_ERR, fmt, ap);
1535 va_end(ap);
1536 exit(code);
1537 }
1538
1539 /* the follow functions and variables are used in handling HTTP errors */
1540 /* ARGSUSED */
1541 void
1542 http_error(int code, http_req *request, const char *msg)
1543 {
1544 static char buf[BUFSIZ];
1545 char portbuf[20];
1546 const char *header = http_errors_short(code);
1547 const char *reason = http_errors_long(code);
1548 const char *proto = (request && request->hr_proto) ? request->hr_proto : http_11;
1549 int size;
1550
1551 debug((DEBUG_FAT, "http_error %d: %s", code, msg));
1552 if (header == NULL || reason == NULL)
1553 error(1, "http_error() failed (short = %p, long = %p)",
1554 header, reason);
1555
1556 if (request && request->hr_serverport && strcmp(request->hr_serverport, "80") != 0)
1557 snprintf(portbuf, sizeof(portbuf), ":%s", request->hr_serverport);
1558 else
1559 portbuf[0] = '\0';
1560
1561 if (request && request->hr_url) {
1562 escape_html(request);
1563 size = snprintf(buf, sizeof buf,
1564 "<html><head><title>%s</title></head>\n"
1565 "<body><h1>%s</h1>\n"
1566 "%s: <pre>%s</pre>\n"
1567 "<hr><address><a href=\"http://%s%s/\">%s%s</a></address>\n"
1568 "</body></html>\n",
1569 header, header, request->hr_url, reason,
1570 myname, portbuf, myname, portbuf);
1571 if (size >= sizeof buf)
1572 warning("http_error buffer too small, truncated");
1573 } else
1574 size = 0;
1575
1576 bozoprintf("%s %s\r\n", proto, header);
1577 auth_check_401(request, code);
1578
1579 bozoprintf("Content-Type: text/html\r\n");
1580 bozoprintf("Content-Length: %d\r\n", size);
1581 bozoprintf("Server: %s\r\n", server_software);
1582 if (request && request->hr_allow)
1583 bozoprintf("Allow: %s\r\n", request->hr_allow);
1584 bozoprintf("\r\n");
1585 if (size)
1586 bozoprintf("%s", buf);
1587 bozoflush(stdout);
1588
1589 exit(1);
1590 }
1591
/*
 * map from an HTTP status code to the short message (used on the
 * status line) and the long message (used in the error page body).
 * the table ends at the entry whose code is 0.
 */
static struct errors_map {
	int		 code;		/* HTTP return code */
	const char	*shortmsg;	/* short version of message */
	const char	*longmsg;	/* long version of message */
} errors_map[] = {
	{ 400,	"400 Bad Request",	"The request was not valid" },
	{ 401,	"401 Unauthorized",	"No authorization" },
	{ 403,	"403 Forbidden",	"Access to this item has been denied" },
	{ 404,	"404 Not Found",	"This item has not been found" },
	{ 408,	"408 Request Timeout",	"This request took too long" },
	{ 417,	"417 Expectation Failed", "Expectations not available" },
	{ 500,	"500 Internal Error",	"An error occured on the server" },
	{ 501,	"501 Not Implemented",	"This request is not available" },
	{ 0,	NULL,			NULL },
};

/* returned by both lookups below for a code that is not in the table */
static const char *help = "DANGER! WILL ROBINSON! DANGER!";

/* find the table entry for code, or NULL if the table has none */
static const struct errors_map *
errors_map_find(int code)
{
	size_t	i;

	for (i = 0; errors_map[i].code != 0; i++) {
		if (errors_map[i].code == code)
			return (&errors_map[i]);
	}
	return (NULL);
}

/* short message for an HTTP status code, or the help string */
static const char *
http_errors_short(int code)
{
	const struct errors_map *hit = errors_map_find(code);

	if (hit == NULL)
		return (help);
	return (hit->shortmsg);
}

/* long message for an HTTP status code, or the help string */
static const char *
http_errors_long(int code)
{
	const struct errors_map *hit = errors_map_find(code);

	if (hit == NULL)
		return (help);
	return (hit->longmsg);
}
1632
1633 /* Below are various modified libc functions */
1634
/*
 * a length-limited strsep(3).  *lenp must hold the number of bytes
 * available at *strp; it is decremented for every byte examined.  if
 * the bytes run out before a delimiter is found, NULL is returned with
 * *lenp left at -1 and *strp unchanged.  otherwise this behaves like
 * strsep: the delimiter is overwritten with a nul, *strp is advanced
 * past it (or set to NULL if the token ended at the string's own nul),
 * and the start of the token is returned.  lenp may be NULL, in which
 * case no limit applies.
 */
char *
strnsep(char **strp, const char *delim, ssize_t *lenp)
{
	char		*start, *cur;
	const char	*d;

	start = *strp;
	if (start == NULL)
		return (NULL);

	for (cur = start; ; cur++) {
		if (lenp != NULL) {
			*lenp -= 1;
			if (*lenp == -1)
				return (NULL);
		}

		/*
		 * compare *cur with every byte of delim, including its
		 * terminating nul, so that the end of the string also
		 * ends the token.
		 */
		for (d = delim; ; d++) {
			if (*d == *cur) {
				if (*cur == '\0') {
					*strp = NULL;
				} else {
					*cur = '\0';
					*strp = cur + 1;
				}
				return (start);
			}
			if (*d == '\0')
				break;
		}
	}
	/* NOTREACHED */
}
1668
1669 /*
1670 * inspired by fgetln(3), but works for fd's. should work identically
1671 * except it, however, does *not* return the newline, and it does nul
1672 * terminate the string.
1673 */
1674 char *
1675 dgetln(int fd, ssize_t *lenp, ssize_t (*readfn)(int, void *, size_t))
1676 {
1677 static char *buffer;
1678 static ssize_t buflen = 0;
1679 ssize_t len;
1680 int got_cr = 0;
1681 char c, *nbuffer;
1682
1683 /* initialise */
1684 if (buflen == 0) {
1685 buflen = 128; /* should be plenty for most requests */
1686 buffer = malloc(buflen);
1687 if (buffer == NULL) {
1688 buflen = 0;
1689 return NULL;
1690 }
1691 }
1692 len = 0;
1693
1694 /*
1695 * we *have* to read one byte at a time, to not break cgi
1696 * programs (for we pass stdin off to them). could fix this
1697 * by becoming a fd-passing program instead of just exec'ing
1698 * the program
1699 */
1700 for (; readfn(fd, &c, 1) == 1; ) {
1701 debug((DEBUG_EXPLODING, "dgetln read %c", c));
1702
1703 if (len >= buflen - 1) {
1704 buflen *= 2;
1705 debug((DEBUG_EXPLODING,
1706 "dgetln: reallocating buffer to buflen %d", buflen));
1707 nbuffer = realloc(buffer, buflen);
1708 if (nbuffer == NULL) {
1709 free(buffer);
1710 buflen = 0;
1711 buffer = NULL;
1712 return NULL;
1713 }
1714 buffer = nbuffer;
1715 }
1716
1717 buffer[len++] = c;
1718 if (c == '\r') {
1719 got_cr = 1;
1720 continue;
1721 } else if (c == '\n') {
1722 /*
1723 * HTTP/1.1 spec says to ignore CR and treat
1724 * LF as the real line terminator. even though
1725 * the same spec defines CRLF as the line
1726 * terminator, it is recommended in section 19.3
1727 * to do the LF trick for tolerance.
1728 */
1729 if (got_cr)
1730 len -= 2;
1731 else
1732 len -= 1;
1733 break;
1734 }
1735
1736 }
1737 buffer[len] = '\0';
1738 debug((DEBUG_OBESE, "dgetln returns: ``%s'' with len %d", buffer, len));
1739 *lenp = len;
1740 return (buffer);
1741 }
1742
/*
 * realloc(3) wrapper: a failed allocation is reported to the client
 * through http_error() with a 500 status.
 */
void *
bozorealloc(void *ptr, size_t size)
{
	void	*mem = realloc(ptr, size);

	if (mem != NULL)
		return (mem);

	http_error(500, NULL, "memory allocation failure");
	return (NULL);
}
1753
/*
 * malloc(3) wrapper: a failed allocation is reported to the client
 * through http_error() with a 500 status.
 */
void *
bozomalloc(size_t size)
{
	void	*mem = malloc(size);

	if (mem != NULL)
		return (mem);

	http_error(500, NULL, "memory allocation failure");
	return (NULL);
}
1764
/*
 * strdup(3) wrapper: a failed allocation is reported to the client
 * through http_error() with a 500 status.
 */
char *
bozostrdup(const char *str)
{
	char	*copy = strdup(str);

	if (copy != NULL)
		return (copy);

	http_error(500, NULL, "memory allocation failure");
	return (NULL);
}
1775