bozohttpd.c revision 1.80 1 1.80 mrg /* $NetBSD: bozohttpd.c,v 1.80 2016/04/15 17:57:21 mrg Exp $ */
2 1.3 tls
3 1.30 mrg /* $eterna: bozohttpd.c,v 1.178 2011/11/18 09:21:15 mrg Exp $ */
4 1.1 tls
5 1.1 tls /*
6 1.63 mrg * Copyright (c) 1997-2015 Matthew R. Green
7 1.1 tls * All rights reserved.
8 1.1 tls *
9 1.1 tls * Redistribution and use in source and binary forms, with or without
10 1.1 tls * modification, are permitted provided that the following conditions
11 1.1 tls * are met:
12 1.1 tls * 1. Redistributions of source code must retain the above copyright
13 1.1 tls * notice, this list of conditions and the following disclaimer.
14 1.1 tls * 2. Redistributions in binary form must reproduce the above copyright
15 1.1 tls * notice, this list of conditions and the following disclaimer and
16 1.1 tls * dedication in the documentation and/or other materials provided
17 1.1 tls * with the distribution.
18 1.1 tls *
19 1.1 tls * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
20 1.1 tls * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
21 1.1 tls * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
22 1.1 tls * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
23 1.1 tls * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
24 1.1 tls * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
25 1.1 tls * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
26 1.1 tls * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
27 1.1 tls * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 1.1 tls * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 1.1 tls * SUCH DAMAGE.
30 1.1 tls *
31 1.1 tls */
32 1.1 tls
33 1.1 tls /* this program is dedicated to the Great God of Processed Cheese */
34 1.1 tls
35 1.1 tls /*
36 1.1 tls * bozohttpd.c: minimal httpd; provides only these features:
37 1.1 tls * - HTTP/0.9 (by virtue of ..)
38 1.1 tls * - HTTP/1.0
39 1.1 tls * - HTTP/1.1
40 1.1 tls * - CGI/1.1 this will only be provided for "system" scripts
41 1.1 tls * - automatic "missing trailing slash" redirections
42 1.1 tls * - configurable translation of /~user/ to ~user/public_html,
43 1.1 tls * however, this does not include cgi-bin support
44 1.1 tls * - access lists via libwrap via inetd/tcpd
45 1.1 tls * - virtual hosting
46 1.1 tls * - note that we do not even pretend to understand MIME, but
47 1.1 tls * rely only on the HTTP specification
48 1.1 tls * - ipv6 support
49 1.1 tls * - automatic `index.html' generation
50 1.1 tls * - configurable server name
51 1.1 tls * - directory index generation
52 1.1 tls * - daemon mode (lacks libwrap support)
53 1.1 tls * - .htpasswd support
54 1.1 tls */
55 1.1 tls
56 1.1 tls /*
57 1.1 tls * requirements for minimal http/1.1 (at least, as documented in
58 1.48 mrg * RFC 2616 (HTTP/1.1)):
59 1.1 tls *
60 1.48 mrg * - 14.11: content-encoding handling. [1]
61 1.1 tls *
62 1.48 mrg * - 14.13: content-length handling. this is only a SHOULD header
63 1.1 tls * thus we could just not send it ever. [1]
64 1.1 tls *
65 1.1 tls * - 14.17: content-type handling. [1]
66 1.1 tls *
67 1.48 mrg * - 14.28: if-unmodified-since handling. if-modified-since is
68 1.48 mrg * already done, so this one shouldn't be too hard.
69 1.1 tls *
70 1.1 tls * [1] need to revisit to ensure proper behaviour
71 1.1 tls *
72 1.1 tls * and the following is a list of features that we do not need
73 1.1 tls * to have due to other limits, or are too lazy. there are more
74 1.1 tls * of these than are listed, but these are of particular note,
75 1.1 tls * and could perhaps be implemented.
76 1.1 tls *
77 1.1 tls * - 3.5/3.6: content/transfer codings. probably can ignore
78 1.1 tls * this? we "SHOULD"n't. but 4.4 says we should ignore a
79 1.1 tls * `content-length' header upon receipt of a `transfer-encoding'
80 1.1 tls * header.
81 1.1 tls *
82 1.1 tls * - 5.1.1: request methods. only MUST support GET and HEAD,
83 1.1 tls * but there are new ones besides POST that are currently
84 1.1 tls * supported: OPTIONS PUT DELETE TRACE and CONNECT, plus
85 1.1 tls * extensions not yet known?
86 1.1 tls *
87 1.1 tls * - 10.1: we can ignore informational status codes
88 1.1 tls *
89 1.1 tls * - 10.3.3/10.3.4/10.3.8: just use '302' codes always.
90 1.1 tls *
91 1.48 mrg * - 14.1/14.2/14.3/14.27: we do not support Accept: headers.
92 1.1 tls * just ignore them and send the request anyway. they are
93 1.1 tls * only SHOULD.
94 1.1 tls *
95 1.48 mrg * - 14.5/14.16/14.35: only support simple ranges: %d- and %d-%d
96 1.48 mrg * would be nice to support more.
97 1.1 tls *
98 1.1 tls * - 14.9: we aren't a cache.
99 1.1 tls *
100 1.48 mrg * - 14.15: content-md5 would be nice.
101 1.42 mbalmer *
102 1.48 mrg * - 14.24/14.26/14.27: if-match, if-none-match, if-range. be
103 1.48 mrg * nice to support this.
104 1.1 tls *
105 1.48 mrg * - 14.44: Vary: seems unneeded. ignore it for now.
106 1.1 tls */
107 1.1 tls
/*
 * compile-time defaults.  each one may be overridden from the build
 * command line, hence the #ifndef guards.
 */

/* default value for the index file name */
#ifndef INDEX_HTML
#define INDEX_HTML		"index.html"
#endif
/* default software identification string */
#ifndef SERVER_SOFTWARE
#define SERVER_SOFTWARE		"bozohttpd/20160415"
#endif
/* names of the special per-directory control files */
#ifndef DIRECT_ACCESS_FILE
#define DIRECT_ACCESS_FILE	".bzdirect"
#endif
#ifndef REDIRECT_FILE
#define REDIRECT_FILE		".bzredirect"
#endif
#ifndef ABSREDIRECT_FILE
#define ABSREDIRECT_FILE	".bzabsredirect"
#endif
/* directory name used for the /~user/ translation */
#ifndef PUBLIC_HTML
#define PUBLIC_HTML		"public_html"
#endif

/* reference an otherwise unused argument so lint and compilers stay quiet */
#ifndef USE_ARG
#define USE_ARG(x)	/*LINTED*/(void)&(x)
#endif
130 1.1 tls
131 1.1 tls /*
132 1.1 tls * And so it begins ..
133 1.1 tls */
134 1.1 tls
135 1.1 tls #include <sys/param.h>
136 1.1 tls #include <sys/socket.h>
137 1.1 tls #include <sys/time.h>
138 1.1 tls #include <sys/mman.h>
139 1.1 tls
140 1.1 tls #include <arpa/inet.h>
141 1.1 tls
142 1.1 tls #include <ctype.h>
143 1.1 tls #include <dirent.h>
144 1.1 tls #include <errno.h>
145 1.1 tls #include <fcntl.h>
146 1.1 tls #include <netdb.h>
147 1.1 tls #include <pwd.h>
148 1.1 tls #include <grp.h>
149 1.1 tls #include <signal.h>
150 1.1 tls #include <stdarg.h>
151 1.1 tls #include <stdlib.h>
152 1.1 tls #include <string.h>
153 1.1 tls #include <syslog.h>
154 1.1 tls #include <time.h>
155 1.1 tls #include <unistd.h>
156 1.1 tls
157 1.1 tls #include "bozohttpd.h"
158 1.1 tls
/* seconds the request reader arms alarm() with while waiting for input */
#ifndef MAX_WAIT_TIME
#define	MAX_WAIT_TIME	60	/* hang around for 60 seconds max */
#endif

/* variables and functions */

/* fall back to LOG_DAEMON where <syslog.h> does not provide LOG_FTP */
#ifndef LOG_FTP
#define LOG_FTP	LOG_DAEMON
#endif

/* set to 1 by the SIGALRM handler; polled by the request reader */
volatile sig_atomic_t	alarmhit;
169 1.1 tls
170 1.16 mrg /*
171 1.16 mrg * check there's enough space in the prefs and names arrays.
172 1.16 mrg */
173 1.16 mrg static int
174 1.73 mrg size_arrays(bozoprefs_t *bozoprefs, size_t needed)
175 1.16 mrg {
176 1.16 mrg char **temp;
177 1.1 tls
178 1.16 mrg if (bozoprefs->size == 0) {
179 1.16 mrg /* only get here first time around */
180 1.73 mrg bozoprefs->name = calloc(sizeof(char *), needed);
181 1.73 mrg if (bozoprefs->name == NULL)
182 1.16 mrg return 0;
183 1.73 mrg bozoprefs->value = calloc(sizeof(char *), needed);
184 1.73 mrg if (bozoprefs->value == NULL) {
185 1.16 mrg free(bozoprefs->name);
186 1.16 mrg return 0;
187 1.16 mrg }
188 1.73 mrg bozoprefs->size = needed;
189 1.73 mrg } else if (bozoprefs->count == bozoprefs->size) {
190 1.16 mrg /* only uses 'needed' when filled array */
191 1.16 mrg temp = realloc(bozoprefs->name, sizeof(char *) * needed);
192 1.73 mrg if (temp == NULL)
193 1.16 mrg return 0;
194 1.16 mrg bozoprefs->name = temp;
195 1.16 mrg temp = realloc(bozoprefs->value, sizeof(char *) * needed);
196 1.73 mrg if (temp == NULL)
197 1.16 mrg return 0;
198 1.16 mrg bozoprefs->value = temp;
199 1.73 mrg bozoprefs->size += needed;
200 1.16 mrg }
201 1.16 mrg return 1;
202 1.16 mrg }
203 1.1 tls
204 1.73 mrg static ssize_t
205 1.16 mrg findvar(bozoprefs_t *bozoprefs, const char *name)
206 1.16 mrg {
207 1.73 mrg size_t i;
208 1.1 tls
209 1.73 mrg for (i = 0; i < bozoprefs->count; i++)
210 1.73 mrg if (strcmp(bozoprefs->name[i], name) == 0)
211 1.73 mrg return (ssize_t)i;
212 1.73 mrg return -1;
213 1.1 tls }
214 1.1 tls
215 1.1 tls int
216 1.73 mrg bozo_set_pref(bozohttpd_t *httpd, bozoprefs_t *bozoprefs,
217 1.73 mrg const char *name, const char *value)
218 1.1 tls {
219 1.73 mrg ssize_t i;
220 1.1 tls
221 1.16 mrg if ((i = findvar(bozoprefs, name)) < 0) {
222 1.16 mrg /* add the element to the array */
223 1.73 mrg if (!size_arrays(bozoprefs, bozoprefs->size + 15))
224 1.73 mrg return 0;
225 1.73 mrg i = bozoprefs->count++;
226 1.73 mrg bozoprefs->name[i] = bozostrdup(httpd, NULL, name);
227 1.16 mrg } else {
228 1.16 mrg /* replace the element in the array */
229 1.16 mrg if (bozoprefs->value[i]) {
230 1.16 mrg free(bozoprefs->value[i]);
231 1.16 mrg bozoprefs->value[i] = NULL;
232 1.1 tls }
233 1.1 tls }
234 1.73 mrg bozoprefs->value[i] = bozostrdup(httpd, NULL, value);
235 1.16 mrg return 1;
236 1.16 mrg }
237 1.1 tls
238 1.16 mrg /*
239 1.16 mrg * get a variable's value, or NULL
240 1.16 mrg */
241 1.16 mrg char *
242 1.16 mrg bozo_get_pref(bozoprefs_t *bozoprefs, const char *name)
243 1.16 mrg {
244 1.73 mrg ssize_t i;
245 1.1 tls
246 1.73 mrg i = findvar(bozoprefs, name);
247 1.73 mrg return i < 0 ? NULL : bozoprefs->value[i];
248 1.1 tls }
249 1.1 tls
/*
 * format the current time as an HTTP date ("Sun, 06 Nov 1994 08:49:37
 * GMT") into 'date', which has room for 'datelen' bytes.
 *
 * returns 'date'.  if the time cannot be converted or the buffer is
 * too small for the whole string, 'date' is set to the empty string
 * (when datelen is non-zero) instead of being left indeterminate.
 */
char *
bozo_http_date(char *date, size_t datelen)
{
	struct	tm *tm;
	time_t	now;

	/* Sun, 06 Nov 1994 08:49:37 GMT */
	now = time(NULL);
	tm = gmtime(&now);	/* HTTP/1.1 spec rev 06 sez GMT only */
	if (tm == NULL ||
	    strftime(date, datelen, "%a, %d %b %Y %H:%M:%S GMT", tm) == 0) {
		/* strftime() leaves the buffer unspecified on failure */
		if (datelen > 0)
			date[0] = '\0';
	}
	return date;
}
262 1.1 tls
263 1.1 tls /*
264 1.12 mrg * convert "in" into the three parts of a request (first line).
265 1.12 mrg * we allocate into file and query, but return pointers into
266 1.12 mrg * "in" for proto and method.
267 1.1 tls */
268 1.1 tls static void
269 1.16 mrg parse_request(bozohttpd_t *httpd, char *in, char **method, char **file,
270 1.16 mrg char **query, char **proto)
271 1.1 tls {
272 1.1 tls ssize_t len;
273 1.1 tls char *val;
274 1.16 mrg
275 1.16 mrg USE_ARG(httpd);
276 1.16 mrg debug((httpd, DEBUG_EXPLODING, "parse in: %s", in));
277 1.12 mrg *method = *file = *query = *proto = NULL;
278 1.1 tls
279 1.1 tls len = (ssize_t)strlen(in);
280 1.6 mrg val = bozostrnsep(&in, " \t\n\r", &len);
281 1.1 tls if (len < 1 || val == NULL)
282 1.1 tls return;
283 1.1 tls *method = val;
284 1.12 mrg
285 1.1 tls while (*in == ' ' || *in == '\t')
286 1.1 tls in++;
287 1.6 mrg val = bozostrnsep(&in, " \t\n\r", &len);
288 1.1 tls if (len < 1) {
289 1.1 tls if (len == 0)
290 1.9 tls *file = val;
291 1.1 tls else
292 1.9 tls *file = in;
293 1.16 mrg } else {
294 1.16 mrg *file = val;
295 1.9 tls
296 1.16 mrg *query = strchr(*file, '?');
297 1.16 mrg if (*query)
298 1.16 mrg *(*query)++ = '\0';
299 1.16 mrg
300 1.16 mrg if (in) {
301 1.16 mrg while (*in && (*in == ' ' || *in == '\t'))
302 1.16 mrg in++;
303 1.16 mrg if (*in)
304 1.16 mrg *proto = in;
305 1.16 mrg }
306 1.12 mrg }
307 1.12 mrg
308 1.12 mrg /* allocate private copies */
309 1.73 mrg *file = bozostrdup(httpd, NULL, *file);
310 1.12 mrg if (*query)
311 1.73 mrg *query = bozostrdup(httpd, NULL, *query);
312 1.12 mrg
313 1.16 mrg debug((httpd, DEBUG_FAT,
314 1.16 mrg "url: method: \"%s\" file: \"%s\" query: \"%s\" proto: \"%s\"",
315 1.16 mrg *method, *file, *query, *proto));
316 1.1 tls }
317 1.1 tls
318 1.1 tls /*
319 1.16 mrg * cleanup a bozo_httpreq_t after use
320 1.1 tls */
321 1.16 mrg void
322 1.16 mrg bozo_clean_request(bozo_httpreq_t *request)
323 1.1 tls {
324 1.16 mrg struct bozoheaders *hdr, *ohdr = NULL;
325 1.12 mrg
326 1.12 mrg if (request == NULL)
327 1.12 mrg return;
328 1.12 mrg
329 1.21 mrg /* If SSL enabled cleanup SSL structure. */
330 1.22 mrg bozo_ssl_destroy(request->hr_httpd);
331 1.21 mrg
332 1.12 mrg /* clean up request */
333 1.51 shm free(request->hr_remotehost);
334 1.51 shm free(request->hr_remoteaddr);
335 1.51 shm free(request->hr_serverport);
336 1.51 shm free(request->hr_virthostname);
337 1.51 shm free(request->hr_file);
338 1.51 shm free(request->hr_oldfile);
339 1.51 shm free(request->hr_query);
340 1.51 shm free(request->hr_host);
341 1.67 shm bozo_user_free(request->hr_user);
342 1.16 mrg bozo_auth_cleanup(request);
343 1.12 mrg for (hdr = SIMPLEQ_FIRST(&request->hr_headers); hdr;
344 1.12 mrg hdr = SIMPLEQ_NEXT(hdr, h_next)) {
345 1.12 mrg free(hdr->h_value);
346 1.12 mrg free(hdr->h_header);
347 1.44 mbalmer free(ohdr);
348 1.12 mrg ohdr = hdr;
349 1.12 mrg }
350 1.79 elric free(ohdr);
351 1.79 elric ohdr = NULL;
352 1.78 elric for (hdr = SIMPLEQ_FIRST(&request->hr_replheaders); hdr;
353 1.78 elric hdr = SIMPLEQ_NEXT(hdr, h_next)) {
354 1.78 elric free(hdr->h_value);
355 1.78 elric free(hdr->h_header);
356 1.78 elric free(ohdr);
357 1.78 elric ohdr = hdr;
358 1.78 elric }
359 1.44 mbalmer free(ohdr);
360 1.12 mrg
361 1.12 mrg free(request);
362 1.12 mrg }
363 1.12 mrg
364 1.12 mrg /*
365 1.16 mrg * send a HTTP/1.1 408 response if we timeout.
366 1.16 mrg */
367 1.16 mrg /* ARGSUSED */
368 1.16 mrg static void
369 1.16 mrg alarmer(int sig)
370 1.16 mrg {
371 1.16 mrg alarmhit = 1;
372 1.16 mrg }
373 1.16 mrg
/*
 * header quirks: names of headers that must never be folded into a
 * single line, so each occurrence is kept as its own entry.  the list
 * is terminated by a NULL pointer.
 */
const char *header_quirks[] = {
	"WWW-Authenticate",
	NULL
};
379 1.78 elric
380 1.78 elric /*
381 1.16 mrg * add or merge this header (val: str) into the requests list
382 1.16 mrg */
383 1.16 mrg static bozoheaders_t *
384 1.78 elric addmerge_header(bozo_httpreq_t *request, struct qheaders *headers,
385 1.78 elric const char *val, const char *str, ssize_t len)
386 1.16 mrg {
387 1.73 mrg struct bozohttpd_t *httpd = request->hr_httpd;
388 1.78 elric struct bozoheaders *hdr = NULL;
389 1.78 elric const char **quirk;
390 1.16 mrg
391 1.16 mrg USE_ARG(len);
392 1.78 elric for (quirk = header_quirks; *quirk; quirk++)
393 1.78 elric if (strcasecmp(*quirk, val) == 0)
394 1.16 mrg break;
395 1.78 elric
396 1.78 elric if (*quirk == NULL) {
397 1.78 elric /* do we exist already? */
398 1.78 elric SIMPLEQ_FOREACH(hdr, headers, h_next) {
399 1.78 elric if (strcasecmp(val, hdr->h_header) == 0)
400 1.78 elric break;
401 1.78 elric }
402 1.16 mrg }
403 1.16 mrg
404 1.16 mrg if (hdr) {
405 1.16 mrg /* yup, merge it in */
406 1.16 mrg char *nval;
407 1.16 mrg
408 1.75 mrg bozoasprintf(httpd, &nval, "%s, %s", hdr->h_value, str);
409 1.16 mrg free(hdr->h_value);
410 1.16 mrg hdr->h_value = nval;
411 1.16 mrg } else {
412 1.16 mrg /* nope, create a new one */
413 1.16 mrg
414 1.73 mrg hdr = bozomalloc(httpd, sizeof *hdr);
415 1.73 mrg hdr->h_header = bozostrdup(httpd, request, val);
416 1.16 mrg if (str && *str)
417 1.73 mrg hdr->h_value = bozostrdup(httpd, request, str);
418 1.16 mrg else
419 1.73 mrg hdr->h_value = bozostrdup(httpd, request, " ");
420 1.16 mrg
421 1.78 elric SIMPLEQ_INSERT_TAIL(headers, hdr, h_next);
422 1.16 mrg request->hr_nheaders++;
423 1.16 mrg }
424 1.16 mrg
425 1.16 mrg return hdr;
426 1.16 mrg }
427 1.16 mrg
428 1.78 elric bozoheaders_t *
429 1.78 elric addmerge_reqheader(bozo_httpreq_t *request, const char *val, const char *str,
430 1.78 elric ssize_t len)
431 1.78 elric {
432 1.78 elric
433 1.78 elric return addmerge_header(request, &request->hr_headers, val, str, len);
434 1.78 elric }
435 1.78 elric
436 1.78 elric bozoheaders_t *
437 1.78 elric addmerge_replheader(bozo_httpreq_t *request, const char *val, const char *str,
438 1.78 elric ssize_t len)
439 1.78 elric {
440 1.78 elric
441 1.78 elric return addmerge_header(request, &request->hr_replheaders,
442 1.78 elric val, str, len);
443 1.78 elric }
444 1.78 elric
445 1.16 mrg /*
446 1.16 mrg * as the prototype string is not constant (eg, "HTTP/1.1" is equivalent
447 1.16 mrg * to "HTTP/001.01"), we MUST parse this.
448 1.16 mrg */
449 1.16 mrg static int
450 1.16 mrg process_proto(bozo_httpreq_t *request, const char *proto)
451 1.16 mrg {
452 1.73 mrg struct bozohttpd_t *httpd = request->hr_httpd;
453 1.16 mrg char majorstr[16], *minorstr;
454 1.16 mrg int majorint, minorint;
455 1.16 mrg
456 1.16 mrg if (proto == NULL) {
457 1.16 mrg got_proto_09:
458 1.73 mrg request->hr_proto = httpd->consts.http_09;
459 1.73 mrg debug((httpd, DEBUG_FAT, "request %s is http/0.9",
460 1.16 mrg request->hr_file));
461 1.16 mrg return 0;
462 1.16 mrg }
463 1.16 mrg
464 1.16 mrg if (strncasecmp(proto, "HTTP/", 5) != 0)
465 1.16 mrg goto bad;
466 1.16 mrg strncpy(majorstr, proto + 5, sizeof majorstr);
467 1.16 mrg majorstr[sizeof(majorstr)-1] = 0;
468 1.16 mrg minorstr = strchr(majorstr, '.');
469 1.16 mrg if (minorstr == NULL)
470 1.16 mrg goto bad;
471 1.16 mrg *minorstr++ = 0;
472 1.16 mrg
473 1.16 mrg majorint = atoi(majorstr);
474 1.16 mrg minorint = atoi(minorstr);
475 1.16 mrg
476 1.16 mrg switch (majorint) {
477 1.16 mrg case 0:
478 1.16 mrg if (minorint != 9)
479 1.16 mrg break;
480 1.16 mrg goto got_proto_09;
481 1.16 mrg case 1:
482 1.16 mrg if (minorint == 0)
483 1.73 mrg request->hr_proto = httpd->consts.http_10;
484 1.16 mrg else if (minorint == 1)
485 1.73 mrg request->hr_proto = httpd->consts.http_11;
486 1.16 mrg else
487 1.16 mrg break;
488 1.16 mrg
489 1.73 mrg debug((httpd, DEBUG_FAT, "request %s is %s",
490 1.16 mrg request->hr_file, request->hr_proto));
491 1.16 mrg SIMPLEQ_INIT(&request->hr_headers);
492 1.16 mrg request->hr_nheaders = 0;
493 1.16 mrg return 0;
494 1.16 mrg }
495 1.16 mrg bad:
496 1.73 mrg return bozo_http_error(httpd, 404, NULL, "unknown prototype");
497 1.16 mrg }
498 1.16 mrg
499 1.16 mrg /*
500 1.16 mrg * process each type of HTTP method, setting this HTTP requests
501 1.73 mrg * method type.
502 1.16 mrg */
503 1.16 mrg static struct method_map {
504 1.16 mrg const char *name;
505 1.16 mrg int type;
506 1.16 mrg } method_map[] = {
507 1.16 mrg { "GET", HTTP_GET, },
508 1.16 mrg { "POST", HTTP_POST, },
509 1.16 mrg { "HEAD", HTTP_HEAD, },
510 1.16 mrg #if 0 /* other non-required http/1.1 methods */
511 1.16 mrg { "OPTIONS", HTTP_OPTIONS, },
512 1.16 mrg { "PUT", HTTP_PUT, },
513 1.16 mrg { "DELETE", HTTP_DELETE, },
514 1.16 mrg { "TRACE", HTTP_TRACE, },
515 1.16 mrg { "CONNECT", HTTP_CONNECT, },
516 1.16 mrg #endif
517 1.16 mrg { NULL, 0, },
518 1.16 mrg };
519 1.16 mrg
520 1.16 mrg static int
521 1.16 mrg process_method(bozo_httpreq_t *request, const char *method)
522 1.16 mrg {
523 1.73 mrg struct bozohttpd_t *httpd = request->hr_httpd;
524 1.16 mrg struct method_map *mmp;
525 1.16 mrg
526 1.73 mrg if (request->hr_proto == httpd->consts.http_11)
527 1.16 mrg request->hr_allow = "GET, HEAD, POST";
528 1.16 mrg
529 1.16 mrg for (mmp = method_map; mmp->name; mmp++)
530 1.16 mrg if (strcasecmp(method, mmp->name) == 0) {
531 1.16 mrg request->hr_method = mmp->type;
532 1.16 mrg request->hr_methodstr = mmp->name;
533 1.16 mrg return 0;
534 1.16 mrg }
535 1.16 mrg
536 1.73 mrg return bozo_http_error(httpd, 404, request, "unknown method");
537 1.16 mrg }
538 1.16 mrg
539 1.16 mrg /*
540 1.1 tls * This function reads a http request from stdin, returning a pointer to a
541 1.16 mrg * bozo_httpreq_t structure, describing the request.
542 1.1 tls */
543 1.16 mrg bozo_httpreq_t *
544 1.16 mrg bozo_read_request(bozohttpd_t *httpd)
545 1.1 tls {
546 1.1 tls struct sigaction sa;
547 1.9 tls char *str, *val, *method, *file, *proto, *query;
548 1.1 tls char *host, *addr, *port;
549 1.1 tls char bufport[10];
550 1.1 tls char hbuf[NI_MAXHOST], abuf[NI_MAXHOST];
551 1.1 tls struct sockaddr_storage ss;
552 1.1 tls ssize_t len;
553 1.1 tls int line = 0;
554 1.1 tls socklen_t slen;
555 1.16 mrg bozo_httpreq_t *request;
556 1.1 tls
557 1.1 tls /*
558 1.20 mrg * if we're in daemon mode, bozo_daemon_fork() will return here twice
559 1.20 mrg * for each call. once in the child, returning 0, and once in the
560 1.20 mrg * parent, returning 1. for each child, then we can setup SSL, and
561 1.20 mrg * the parent can signal the caller there was no request to process
562 1.20 mrg * and it will wait for another.
563 1.1 tls */
564 1.20 mrg if (bozo_daemon_fork(httpd))
565 1.20 mrg return NULL;
566 1.55 mrg if (bozo_ssl_accept(httpd))
567 1.55 mrg return NULL;
568 1.1 tls
569 1.16 mrg request = bozomalloc(httpd, sizeof(*request));
570 1.16 mrg memset(request, 0, sizeof(*request));
571 1.16 mrg request->hr_httpd = httpd;
572 1.1 tls request->hr_allow = request->hr_host = NULL;
573 1.1 tls request->hr_content_type = request->hr_content_length = NULL;
574 1.6 mrg request->hr_range = NULL;
575 1.12 mrg request->hr_last_byte_pos = -1;
576 1.10 joerg request->hr_if_modified_since = NULL;
577 1.35 martin request->hr_virthostname = NULL;
578 1.12 mrg request->hr_file = NULL;
579 1.20 mrg request->hr_oldfile = NULL;
580 1.78 elric SIMPLEQ_INIT(&request->hr_replheaders);
581 1.59 shm bozo_auth_init(request);
582 1.1 tls
583 1.1 tls slen = sizeof(ss);
584 1.16 mrg if (getpeername(0, (struct sockaddr *)(void *)&ss, &slen) < 0)
585 1.1 tls host = addr = NULL;
586 1.1 tls else {
587 1.16 mrg if (getnameinfo((struct sockaddr *)(void *)&ss, slen,
588 1.1 tls abuf, sizeof abuf, NULL, 0, NI_NUMERICHOST) == 0)
589 1.1 tls addr = abuf;
590 1.1 tls else
591 1.1 tls addr = NULL;
592 1.16 mrg if (httpd->numeric == 0 &&
593 1.16 mrg getnameinfo((struct sockaddr *)(void *)&ss, slen,
594 1.16 mrg hbuf, sizeof hbuf, NULL, 0, 0) == 0)
595 1.1 tls host = hbuf;
596 1.1 tls else
597 1.1 tls host = NULL;
598 1.1 tls }
599 1.1 tls if (host != NULL)
600 1.73 mrg request->hr_remotehost = bozostrdup(httpd, request, host);
601 1.1 tls if (addr != NULL)
602 1.73 mrg request->hr_remoteaddr = bozostrdup(httpd, request, addr);
603 1.1 tls slen = sizeof(ss);
604 1.29 mrg
605 1.29 mrg /*
606 1.29 mrg * Override the bound port from the request value, so it works even
607 1.29 mrg * if passed through a proxy that doesn't rewrite the port.
608 1.29 mrg */
609 1.29 mrg if (httpd->bindport) {
610 1.29 mrg if (strcmp(httpd->bindport, "80") != 0)
611 1.29 mrg port = httpd->bindport;
612 1.1 tls else
613 1.1 tls port = NULL;
614 1.29 mrg } else {
615 1.29 mrg if (getsockname(0, (struct sockaddr *)(void *)&ss, &slen) < 0)
616 1.29 mrg port = NULL;
617 1.29 mrg else {
618 1.73 mrg if (getnameinfo((struct sockaddr *)(void *)&ss, slen,
619 1.73 mrg NULL, 0, bufport, sizeof bufport,
620 1.73 mrg NI_NUMERICSERV) == 0)
621 1.29 mrg port = bufport;
622 1.29 mrg else
623 1.29 mrg port = NULL;
624 1.29 mrg }
625 1.1 tls }
626 1.1 tls if (port != NULL)
627 1.73 mrg request->hr_serverport = bozostrdup(httpd, request, port);
628 1.1 tls
629 1.1 tls /*
630 1.1 tls * setup a timer to make sure the request is not hung
631 1.1 tls */
632 1.1 tls sa.sa_handler = alarmer;
633 1.1 tls sigemptyset(&sa.sa_mask);
634 1.1 tls sigaddset(&sa.sa_mask, SIGALRM);
635 1.1 tls sa.sa_flags = 0;
636 1.74 mrg sigaction(SIGALRM, &sa, NULL);
637 1.1 tls
638 1.1 tls alarm(MAX_WAIT_TIME);
639 1.16 mrg while ((str = bozodgetln(httpd, STDIN_FILENO, &len, bozo_read)) != NULL) {
640 1.1 tls alarm(0);
641 1.12 mrg if (alarmhit) {
642 1.16 mrg (void)bozo_http_error(httpd, 408, NULL,
643 1.16 mrg "request timed out");
644 1.12 mrg goto cleanup;
645 1.12 mrg }
646 1.1 tls line++;
647 1.1 tls
648 1.1 tls if (line == 1) {
649 1.1 tls
650 1.12 mrg if (len < 1) {
651 1.16 mrg (void)bozo_http_error(httpd, 404, NULL,
652 1.16 mrg "null method");
653 1.12 mrg goto cleanup;
654 1.12 mrg }
655 1.74 mrg bozowarn(httpd,
656 1.73 mrg "got request ``%s'' from host %s to port %s",
657 1.73 mrg str,
658 1.73 mrg host ? host : addr ? addr : "<local>",
659 1.73 mrg port ? port : "<stdin>");
660 1.1 tls
661 1.12 mrg /* we allocate return space in file and query only */
662 1.16 mrg parse_request(httpd, str, &method, &file, &query, &proto);
663 1.12 mrg request->hr_file = file;
664 1.12 mrg request->hr_query = query;
665 1.12 mrg if (method == NULL) {
666 1.16 mrg (void)bozo_http_error(httpd, 404, NULL,
667 1.16 mrg "null method");
668 1.12 mrg goto cleanup;
669 1.12 mrg }
670 1.12 mrg if (file == NULL) {
671 1.16 mrg (void)bozo_http_error(httpd, 404, NULL,
672 1.16 mrg "null file");
673 1.12 mrg goto cleanup;
674 1.12 mrg }
675 1.1 tls
676 1.1 tls /*
677 1.1 tls * note that we parse the proto first, so that we
678 1.1 tls * can more properly parse the method and the url.
679 1.1 tls */
680 1.9 tls
681 1.12 mrg if (process_proto(request, proto) ||
682 1.12 mrg process_method(request, method)) {
683 1.12 mrg goto cleanup;
684 1.12 mrg }
685 1.12 mrg
686 1.16 mrg debug((httpd, DEBUG_FAT, "got file \"%s\" query \"%s\"",
687 1.12 mrg request->hr_file,
688 1.12 mrg request->hr_query ? request->hr_query : "<none>"));
689 1.1 tls
690 1.1 tls /* http/0.9 has no header processing */
691 1.16 mrg if (request->hr_proto == httpd->consts.http_09)
692 1.1 tls break;
693 1.1 tls } else { /* incoming headers */
694 1.16 mrg bozoheaders_t *hdr;
695 1.1 tls
696 1.1 tls if (*str == '\0')
697 1.1 tls break;
698 1.1 tls
699 1.6 mrg val = bozostrnsep(&str, ":", &len);
700 1.16 mrg debug((httpd, DEBUG_EXPLODING,
701 1.6 mrg "read_req2: after bozostrnsep: str ``%s'' val ``%s''",
702 1.1 tls str, val));
703 1.12 mrg if (val == NULL || len == -1) {
704 1.16 mrg (void)bozo_http_error(httpd, 404, request,
705 1.16 mrg "no header");
706 1.12 mrg goto cleanup;
707 1.12 mrg }
708 1.1 tls while (*str == ' ' || *str == '\t')
709 1.1 tls len--, str++;
710 1.6 mrg while (*val == ' ' || *val == '\t')
711 1.6 mrg val++;
712 1.1 tls
713 1.17 mrg if (bozo_auth_check_headers(request, val, str, len))
714 1.1 tls goto next_header;
715 1.1 tls
716 1.78 elric hdr = addmerge_reqheader(request, val, str, len);
717 1.1 tls
718 1.1 tls if (strcasecmp(hdr->h_header, "content-type") == 0)
719 1.1 tls request->hr_content_type = hdr->h_value;
720 1.1 tls else if (strcasecmp(hdr->h_header, "content-length") == 0)
721 1.1 tls request->hr_content_length = hdr->h_value;
722 1.1 tls else if (strcasecmp(hdr->h_header, "host") == 0)
723 1.73 mrg request->hr_host = bozostrdup(httpd, request,
724 1.73 mrg hdr->h_value);
725 1.48 mrg /* RFC 2616 (HTTP/1.1): 14.20 */
726 1.12 mrg else if (strcasecmp(hdr->h_header, "expect") == 0) {
727 1.16 mrg (void)bozo_http_error(httpd, 417, request,
728 1.16 mrg "we don't support Expect:");
729 1.12 mrg goto cleanup;
730 1.12 mrg }
731 1.1 tls else if (strcasecmp(hdr->h_header, "referrer") == 0 ||
732 1.1 tls strcasecmp(hdr->h_header, "referer") == 0)
733 1.1 tls request->hr_referrer = hdr->h_value;
734 1.6 mrg else if (strcasecmp(hdr->h_header, "range") == 0)
735 1.6 mrg request->hr_range = hdr->h_value;
736 1.16 mrg else if (strcasecmp(hdr->h_header,
737 1.16 mrg "if-modified-since") == 0)
738 1.10 joerg request->hr_if_modified_since = hdr->h_value;
739 1.31 elric else if (strcasecmp(hdr->h_header,
740 1.31 elric "accept-encoding") == 0)
741 1.31 elric request->hr_accept_encoding = hdr->h_value;
742 1.1 tls
743 1.16 mrg debug((httpd, DEBUG_FAT, "adding header %s: %s",
744 1.1 tls hdr->h_header, hdr->h_value));
745 1.1 tls }
746 1.1 tls next_header:
747 1.1 tls alarm(MAX_WAIT_TIME);
748 1.1 tls }
749 1.1 tls
750 1.1 tls /* now, clear it all out */
751 1.1 tls alarm(0);
752 1.1 tls signal(SIGALRM, SIG_DFL);
753 1.1 tls
754 1.1 tls /* RFC1945, 8.3 */
755 1.16 mrg if (request->hr_method == HTTP_POST &&
756 1.16 mrg request->hr_content_length == NULL) {
757 1.16 mrg (void)bozo_http_error(httpd, 400, request,
758 1.16 mrg "missing content length");
759 1.12 mrg goto cleanup;
760 1.12 mrg }
761 1.1 tls
762 1.48 mrg /* RFC 2616 (HTTP/1.1), 14.23 & 19.6.1.1 */
763 1.16 mrg if (request->hr_proto == httpd->consts.http_11 &&
764 1.48 mrg /*(strncasecmp(request->hr_file, "http://", 7) != 0) &&*/
765 1.16 mrg request->hr_host == NULL) {
766 1.16 mrg (void)bozo_http_error(httpd, 400, request,
767 1.16 mrg "missing Host header");
768 1.12 mrg goto cleanup;
769 1.12 mrg }
770 1.12 mrg
771 1.12 mrg if (request->hr_range != NULL) {
772 1.16 mrg debug((httpd, DEBUG_FAT, "hr_range: %s", request->hr_range));
773 1.12 mrg /* support only simple ranges %d- and %d-%d */
774 1.12 mrg if (strchr(request->hr_range, ',') == NULL) {
775 1.12 mrg const char *rstart, *dash;
776 1.12 mrg
777 1.12 mrg rstart = strchr(request->hr_range, '=');
778 1.12 mrg if (rstart != NULL) {
779 1.12 mrg rstart++;
780 1.12 mrg dash = strchr(rstart, '-');
781 1.12 mrg if (dash != NULL && dash != rstart) {
782 1.12 mrg dash++;
783 1.12 mrg request->hr_have_range = 1;
784 1.12 mrg request->hr_first_byte_pos =
785 1.12 mrg strtoll(rstart, NULL, 10);
786 1.12 mrg if (request->hr_first_byte_pos < 0)
787 1.12 mrg request->hr_first_byte_pos = 0;
788 1.12 mrg if (*dash != '\0') {
789 1.12 mrg request->hr_last_byte_pos =
790 1.12 mrg strtoll(dash, NULL, 10);
791 1.12 mrg if (request->hr_last_byte_pos < 0)
792 1.12 mrg request->hr_last_byte_pos = -1;
793 1.12 mrg }
794 1.12 mrg }
795 1.12 mrg }
796 1.12 mrg }
797 1.12 mrg }
798 1.1 tls
799 1.16 mrg debug((httpd, DEBUG_FAT, "bozo_read_request returns url %s in request",
800 1.16 mrg request->hr_file));
801 1.16 mrg return request;
802 1.1 tls
803 1.16 mrg cleanup:
804 1.16 mrg bozo_clean_request(request);
805 1.1 tls
806 1.16 mrg return NULL;
807 1.1 tls }
808 1.1 tls
809 1.10 joerg static int
810 1.16 mrg mmap_and_write_part(bozohttpd_t *httpd, int fd, off_t first_byte_pos, size_t sz)
811 1.12 mrg {
812 1.14 mrg size_t mappedsz, wroffset;
813 1.14 mrg off_t mappedoffset;
814 1.12 mrg char *addr;
815 1.14 mrg void *mappedaddr;
816 1.14 mrg
817 1.14 mrg /*
818 1.14 mrg * we need to ensure that both the size *and* offset arguments to
819 1.14 mrg * mmap() are page-aligned. our formala for this is:
820 1.14 mrg *
821 1.14 mrg * input offset: first_byte_pos
822 1.14 mrg * input size: sz
823 1.14 mrg *
824 1.14 mrg * mapped offset = page align truncate (input offset)
825 1.14 mrg * mapped size =
826 1.14 mrg * page align extend (input offset - mapped offset + input size)
827 1.14 mrg * write offset = input offset - mapped offset
828 1.14 mrg *
829 1.14 mrg * we use the write offset in all writes
830 1.14 mrg */
831 1.16 mrg mappedoffset = first_byte_pos & ~(httpd->page_size - 1);
832 1.16 mrg mappedsz = (size_t)
833 1.16 mrg (first_byte_pos - mappedoffset + sz + httpd->page_size - 1) &
834 1.16 mrg ~(httpd->page_size - 1);
835 1.16 mrg wroffset = (size_t)(first_byte_pos - mappedoffset);
836 1.12 mrg
837 1.14 mrg addr = mmap(0, mappedsz, PROT_READ, MAP_SHARED, fd, mappedoffset);
838 1.12 mrg if (addr == (char *)-1) {
839 1.74 mrg bozowarn(httpd, "mmap failed: %s", strerror(errno));
840 1.12 mrg return -1;
841 1.12 mrg }
842 1.14 mrg mappedaddr = addr;
843 1.12 mrg
844 1.12 mrg #ifdef MADV_SEQUENTIAL
845 1.12 mrg (void)madvise(addr, sz, MADV_SEQUENTIAL);
846 1.12 mrg #endif
847 1.16 mrg while (sz > BOZO_WRSZ) {
848 1.16 mrg if (bozo_write(httpd, STDOUT_FILENO, addr + wroffset,
849 1.16 mrg BOZO_WRSZ) != BOZO_WRSZ) {
850 1.74 mrg bozowarn(httpd, "write failed: %s", strerror(errno));
851 1.12 mrg goto out;
852 1.12 mrg }
853 1.16 mrg debug((httpd, DEBUG_OBESE, "wrote %d bytes", BOZO_WRSZ));
854 1.16 mrg sz -= BOZO_WRSZ;
855 1.16 mrg addr += BOZO_WRSZ;
856 1.16 mrg }
857 1.16 mrg if (sz && (size_t)bozo_write(httpd, STDOUT_FILENO, addr + wroffset,
858 1.16 mrg sz) != sz) {
859 1.74 mrg bozowarn(httpd, "final write failed: %s", strerror(errno));
860 1.12 mrg goto out;
861 1.12 mrg }
862 1.16 mrg debug((httpd, DEBUG_OBESE, "wrote %d bytes", (int)sz));
863 1.12 mrg out:
864 1.14 mrg if (munmap(mappedaddr, mappedsz) < 0) {
865 1.74 mrg bozowarn(httpd, "munmap failed");
866 1.12 mrg return -1;
867 1.12 mrg }
868 1.12 mrg
869 1.12 mrg return 0;
870 1.12 mrg }
871 1.12 mrg
/*
 * parse an HTTP date string into a time_t.
 *
 * the three formats tried, in order, are the RFC 1123 form, the RFC 850
 * form and the asctime(3) form.  the first format that strptime(3)
 * accepts decides the result: if anything is left over after it the
 * date is rejected.
 *
 * returns 1 and stores the (UTC) time in *timestamp on success, returns
 * 0 and leaves *timestamp alone otherwise.
 */
static int
parse_http_date(const char *val, time_t *timestamp)
{
	static const char *const formats[] = {
		"%a, %d %b %Y %T GMT",
		"%a, %d-%b-%y %T GMT",
		"%a %b %d %T %Y",
	};
	size_t i;

	for (i = 0; i < sizeof(formats) / sizeof(formats[0]); i++) {
		struct tm tm;
		char *remainder;

		/*
		 * strptime() only stores the fields named in the format,
		 * and a failed attempt may leave partial results behind;
		 * start every attempt from a clean slate so timegm()
		 * never sees indeterminate fields.
		 */
		memset(&tm, 0, sizeof(tm));

		remainder = strptime(val, formats[i], &tm);
		if (remainder == NULL)
			continue;	/* try the next format */

		if (*remainder)
			return 0;	/* No trailing garbage */

		*timestamp = timegm(&tm);
		return 1;
	}

	return 0;	/* Invalid HTTP date format */
}
889 1.10 joerg
890 1.1 tls /*
891 1.32 mrg * given an url, encode it ala rfc 3986. ie, escape ? and friends.
892 1.32 mrg * note that this function returns a static buffer, and thus needs
893 1.67 shm * to be updated for any sort of parallel processing. escape only
894 1.67 shm * chosen characters for absolute redirects
895 1.32 mrg */
896 1.32 mrg char *
897 1.67 shm bozo_escape_rfc3986(bozohttpd_t *httpd, const char *url, int absolute)
898 1.32 mrg {
899 1.32 mrg static char *buf;
900 1.32 mrg static size_t buflen = 0;
901 1.32 mrg size_t len;
902 1.32 mrg const char *s;
903 1.32 mrg char *d;
904 1.32 mrg
905 1.32 mrg len = strlen(url);
906 1.32 mrg if (buflen < len * 3 + 1) {
907 1.32 mrg buflen = len * 3 + 1;
908 1.32 mrg buf = bozorealloc(httpd, buf, buflen);
909 1.32 mrg }
910 1.42 mbalmer
911 1.33 mrg for (len = 0, s = url, d = buf; *s;) {
912 1.32 mrg if (*s & 0x80)
913 1.32 mrg goto encode_it;
914 1.32 mrg switch (*s) {
915 1.32 mrg case ':':
916 1.32 mrg case '?':
917 1.32 mrg case '#':
918 1.32 mrg case '[':
919 1.32 mrg case ']':
920 1.32 mrg case '@':
921 1.32 mrg case '!':
922 1.32 mrg case '$':
923 1.32 mrg case '&':
924 1.32 mrg case '\'':
925 1.32 mrg case '(':
926 1.32 mrg case ')':
927 1.32 mrg case '*':
928 1.32 mrg case '+':
929 1.32 mrg case ',':
930 1.32 mrg case ';':
931 1.32 mrg case '=':
932 1.33 mrg case '%':
933 1.67 shm case '"':
934 1.67 shm if (absolute)
935 1.67 shm goto leave_it;
936 1.66 shm case '\n':
937 1.66 shm case '\r':
938 1.66 shm case ' ':
939 1.32 mrg encode_it:
940 1.66 shm snprintf(d, 4, "%%%02X", *s++);
941 1.32 mrg d += 3;
942 1.32 mrg len += 3;
943 1.33 mrg break;
944 1.67 shm leave_it:
945 1.32 mrg default:
946 1.32 mrg *d++ = *s++;
947 1.32 mrg len++;
948 1.33 mrg break;
949 1.32 mrg }
950 1.32 mrg }
951 1.32 mrg buf[len] = 0;
952 1.32 mrg
953 1.32 mrg return buf;
954 1.32 mrg }
955 1.32 mrg
956 1.32 mrg /*
957 1.67 shm * do automatic redirection -- if there are query parameters or userdir for
958 1.67 shm * the URL we will tack these on to the new (redirected) URL.
959 1.16 mrg */
960 1.16 mrg static void
961 1.74 mrg handle_redirect(bozo_httpreq_t *request, const char *url, int absolute)
962 1.16 mrg {
963 1.16 mrg bozohttpd_t *httpd = request->hr_httpd;
964 1.67 shm char *finalurl, *urlbuf;
965 1.67 shm #ifndef NO_USER_SUPPORT
966 1.67 shm char *userbuf;
967 1.67 shm #endif /* !NO_USER_SUPPORT */
968 1.16 mrg char portbuf[20];
969 1.76 mrg const char *scheme, *query, *quest;
970 1.35 martin const char *hostname = BOZOHOST(httpd, request);
971 1.76 mrg int absproto = 0; /* absolute redirect provides own schema */
972 1.42 mbalmer
973 1.16 mrg if (url == NULL) {
974 1.74 mrg bozoasprintf(httpd, &urlbuf, "/%s/", request->hr_file);
975 1.16 mrg url = urlbuf;
976 1.16 mrg } else
977 1.16 mrg urlbuf = NULL;
978 1.67 shm
979 1.67 shm #ifndef NO_USER_SUPPORT
980 1.67 shm if (request->hr_user && !absolute) {
981 1.74 mrg bozoasprintf(httpd, &userbuf, "/~%s%s", request->hr_user, url);
982 1.67 shm url = userbuf;
983 1.67 shm } else
984 1.67 shm userbuf = NULL;
985 1.67 shm #endif /* !NO_USER_SUPPORT */
986 1.67 shm
987 1.67 shm if (absolute) {
988 1.67 shm char *sep = NULL;
989 1.67 shm const char *s;
990 1.67 shm
991 1.67 shm /*
992 1.75 mrg * absolute redirect may specify own protocol i.e. to redirect
993 1.75 mrg * to another schema like https:// or ftp://.
994 1.75 mrg * Details: RFC 3986, section 3.
995 1.67 shm */
996 1.67 shm
997 1.67 shm /* 1. check if url contains :// */
998 1.67 shm sep = strstr(url, "://");
999 1.67 shm
1000 1.67 shm /*
1001 1.67 shm * RFC 3986, section 3.1:
1002 1.67 shm * scheme = ALPHA *( ALPHA / DIGIT / "+" / "-" / "." )
1003 1.67 shm */
1004 1.73 mrg if (sep) {
1005 1.67 shm for (s = url; s != sep;) {
1006 1.75 mrg if (!isalnum((int)*s) &&
1007 1.75 mrg *s != '+' && *s != '-' && *s != '.')
1008 1.67 shm break;
1009 1.67 shm if (++s == sep) {
1010 1.67 shm absproto = 1;
1011 1.67 shm }
1012 1.67 shm }
1013 1.67 shm }
1014 1.67 shm }
1015 1.67 shm
1016 1.76 mrg /* construct final redirection url */
1017 1.1 tls
1018 1.76 mrg scheme = absproto ? "" : httpd->sslinfo ? "https://" : "http://";
1019 1.1 tls
1020 1.76 mrg if (absolute) {
1021 1.76 mrg hostname = "";
1022 1.16 mrg portbuf[0] = '\0';
1023 1.76 mrg } else {
1024 1.76 mrg const char *defport = httpd->sslinfo ? "443" : "80";
1025 1.67 shm
1026 1.76 mrg if (request->hr_serverport &&
1027 1.76 mrg strcmp(request->hr_serverport, defport) != 0)
1028 1.76 mrg snprintf(portbuf, sizeof(portbuf), ":%s",
1029 1.76 mrg request->hr_serverport);
1030 1.67 shm else
1031 1.76 mrg portbuf[0] = '\0';
1032 1.67 shm }
1033 1.76 mrg
1034 1.76 mrg url = bozo_escape_rfc3986(httpd, url, absolute);
1035 1.76 mrg
1036 1.76 mrg if (request->hr_query && strlen(request->hr_query)) {
1037 1.76 mrg query = request->hr_query;
1038 1.76 mrg quest = "?";
1039 1.76 mrg } else {
1040 1.76 mrg query = quest = "";
1041 1.67 shm }
1042 1.76 mrg
1043 1.76 mrg bozoasprintf(httpd, &finalurl, "%s%s%s%s%s%s",
1044 1.76 mrg scheme, hostname, portbuf, url, quest, query);
1045 1.67 shm
1046 1.74 mrg bozowarn(httpd, "redirecting %s", finalurl);
1047 1.67 shm debug((httpd, DEBUG_FAT, "redirecting %s", finalurl));
1048 1.67 shm
1049 1.16 mrg bozo_printf(httpd, "%s 301 Document Moved\r\n", request->hr_proto);
1050 1.42 mbalmer if (request->hr_proto != httpd->consts.http_09)
1051 1.16 mrg bozo_print_header(request, NULL, "text/html", NULL);
1052 1.67 shm if (request->hr_proto != httpd->consts.http_09)
1053 1.67 shm bozo_printf(httpd, "Location: %s\r\n", finalurl);
1054 1.16 mrg bozo_printf(httpd, "\r\n");
1055 1.16 mrg if (request->hr_method == HTTP_HEAD)
1056 1.16 mrg goto head;
1057 1.16 mrg bozo_printf(httpd, "<html><head><title>Document Moved</title></head>\n");
1058 1.16 mrg bozo_printf(httpd, "<body><h1>Document Moved</h1>\n");
1059 1.67 shm bozo_printf(httpd, "This document had moved <a href=\"%s\">here</a>\n",
1060 1.67 shm finalurl);
1061 1.16 mrg bozo_printf(httpd, "</body></html>\n");
1062 1.16 mrg head:
1063 1.16 mrg bozo_flush(httpd, stdout);
1064 1.44 mbalmer free(urlbuf);
1065 1.67 shm free(finalurl);
1066 1.67 shm #ifndef NO_USER_SUPPORT
1067 1.67 shm free(userbuf);
1068 1.67 shm #endif /* !NO_USER_SUPPORT */
1069 1.1 tls }
1070 1.1 tls
1071 1.1 tls /*
1072 1.1 tls * deal with virtual host names; we do this:
1073 1.16 mrg * if we have a virtual path root (httpd->virtbase), and we are given a
1074 1.1 tls * virtual host spec (Host: ho.st or http://ho.st/), see if this
1075 1.16 mrg * directory exists under httpd->virtbase. if it does, use this as the
1076 1.1 tls # new slashdir.
1077 1.1 tls */
1078 1.12 mrg static int
1079 1.16 mrg check_virtual(bozo_httpreq_t *request)
1080 1.1 tls {
1081 1.16 mrg bozohttpd_t *httpd = request->hr_httpd;
1082 1.9 tls char *file = request->hr_file, *s;
1083 1.1 tls size_t len;
1084 1.1 tls
1085 1.1 tls /*
1086 1.1 tls * convert http://virtual.host/ to request->hr_host
1087 1.1 tls */
1088 1.16 mrg debug((httpd, DEBUG_OBESE, "checking for http:// virtual host in ``%s''",
1089 1.16 mrg file));
1090 1.9 tls if (strncasecmp(file, "http://", 7) == 0) {
1091 1.1 tls /* we would do virtual hosting here? */
1092 1.9 tls file += 7;
1093 1.48 mrg /* RFC 2616 (HTTP/1.1), 5.2: URI takes precedence over Host: */
1094 1.48 mrg free(request->hr_host);
1095 1.73 mrg request->hr_host = bozostrdup(httpd, request, file);
1096 1.48 mrg if ((s = strchr(request->hr_host, '/')) != NULL)
1097 1.48 mrg *s = '\0';
1098 1.9 tls s = strchr(file, '/');
1099 1.48 mrg free(request->hr_file);
1100 1.73 mrg request->hr_file = bozostrdup(httpd, request, s ? s : "/");
1101 1.16 mrg debug((httpd, DEBUG_OBESE, "got host ``%s'' file is now ``%s''",
1102 1.9 tls request->hr_host, request->hr_file));
1103 1.1 tls } else if (!request->hr_host)
1104 1.1 tls goto use_slashdir;
1105 1.1 tls
1106 1.1 tls /*
1107 1.49 mrg * canonicalise hr_host - that is, remove any :80.
1108 1.49 mrg */
1109 1.49 mrg len = strlen(request->hr_host);
1110 1.49 mrg if (len > 3 && strcmp(request->hr_host + len - 3, ":80") == 0) {
1111 1.49 mrg request->hr_host[len - 3] = '\0';
1112 1.49 mrg len = strlen(request->hr_host);
1113 1.49 mrg }
1114 1.67 shm
1115 1.67 shm if (!httpd->virtbase) {
1116 1.67 shm
1117 1.67 shm /*
1118 1.67 shm * if we don't use vhost support, then set virthostname if
1119 1.67 shm * user supplied Host header. It will be used for possible
1120 1.67 shm * redirections
1121 1.67 shm */
1122 1.67 shm
1123 1.67 shm if (request->hr_host) {
1124 1.67 shm s = strrchr(request->hr_host, ':');
1125 1.67 shm if (s != NULL)
1126 1.67 shm /* truncate Host: as we want to copy it without port part */
1127 1.67 shm *s = '\0';
1128 1.73 mrg request->hr_virthostname = bozostrdup(httpd, request,
1129 1.67 shm request->hr_host);
1130 1.67 shm if (s != NULL)
1131 1.67 shm /* fix Host: again, if we truncated it */
1132 1.67 shm *s = ':';
1133 1.67 shm }
1134 1.67 shm
1135 1.67 shm goto use_slashdir;
1136 1.67 shm }
1137 1.49 mrg
1138 1.49 mrg /*
1139 1.49 mrg * ok, we have a virtual host, use opendir(3) to find a case
1140 1.1 tls * insensitive match for the virtual host we are asked for.
1141 1.1 tls * note that if the virtual host is the same as the master,
1142 1.1 tls * we don't need to do anything special.
1143 1.1 tls */
1144 1.16 mrg debug((httpd, DEBUG_OBESE,
1145 1.16 mrg "check_virtual: checking host `%s' under httpd->virtbase `%s' "
1146 1.16 mrg "for file `%s'",
1147 1.16 mrg request->hr_host, httpd->virtbase, request->hr_file));
1148 1.16 mrg if (strncasecmp(httpd->virthostname, request->hr_host, len) != 0) {
1149 1.1 tls s = 0;
1150 1.24 mrg DIR *dirp;
1151 1.24 mrg struct dirent *d;
1152 1.24 mrg
1153 1.23 mrg if ((dirp = opendir(httpd->virtbase)) != NULL) {
1154 1.23 mrg while ((d = readdir(dirp)) != NULL) {
1155 1.23 mrg if (strcmp(d->d_name, ".") == 0 ||
1156 1.23 mrg strcmp(d->d_name, "..") == 0) {
1157 1.23 mrg continue;
1158 1.23 mrg }
1159 1.23 mrg debug((httpd, DEBUG_OBESE, "looking at dir``%s''",
1160 1.23 mrg d->d_name));
1161 1.65 shm if (strcmp(d->d_name, request->hr_host) == 0) {
1162 1.23 mrg /* found it, punch it */
1163 1.23 mrg debug((httpd, DEBUG_OBESE, "found it punch it"));
1164 1.35 martin request->hr_virthostname =
1165 1.73 mrg bozostrdup(httpd, request, d->d_name);
1166 1.74 mrg bozoasprintf(httpd, &s, "%s/%s",
1167 1.72 christos httpd->virtbase,
1168 1.72 christos request->hr_virthostname);
1169 1.23 mrg break;
1170 1.23 mrg }
1171 1.1 tls }
1172 1.23 mrg closedir(dirp);
1173 1.23 mrg }
1174 1.23 mrg else {
1175 1.23 mrg debug((httpd, DEBUG_FAT, "opendir %s failed: %s",
1176 1.23 mrg httpd->virtbase, strerror(errno)));
1177 1.1 tls }
1178 1.1 tls if (s == 0) {
1179 1.16 mrg if (httpd->unknown_slash)
1180 1.1 tls goto use_slashdir;
1181 1.16 mrg return bozo_http_error(httpd, 404, request,
1182 1.16 mrg "unknown URL");
1183 1.1 tls }
1184 1.1 tls } else
1185 1.1 tls use_slashdir:
1186 1.16 mrg s = httpd->slashdir;
1187 1.1 tls
1188 1.1 tls /*
1189 1.1 tls * ok, nailed the correct slashdir, chdir to it
1190 1.1 tls */
1191 1.1 tls if (chdir(s) < 0)
1192 1.16 mrg return bozo_http_error(httpd, 404, request,
1193 1.16 mrg "can't chdir to slashdir");
1194 1.12 mrg return 0;
1195 1.1 tls }
1196 1.1 tls
1197 1.1 tls /*
1198 1.1 tls * checks to see if this request has a valid .bzredirect file. returns
1199 1.36 martin * 0 when no redirection happend, or 1 when handle_redirect() has been
1200 1.53 mrg * called, -1 on error.
1201 1.1 tls */
1202 1.36 martin static int
1203 1.16 mrg check_bzredirect(bozo_httpreq_t *request)
1204 1.1 tls {
1205 1.73 mrg bozohttpd_t *httpd = request->hr_httpd;
1206 1.1 tls struct stat sb;
1207 1.39 martin char dir[MAXPATHLEN], redir[MAXPATHLEN], redirpath[MAXPATHLEN + 1],
1208 1.39 martin path[MAXPATHLEN];
1209 1.1 tls char *basename, *finalredir;
1210 1.1 tls int rv, absolute;
1211 1.1 tls
1212 1.1 tls /*
1213 1.1 tls * if this pathname is really a directory, but doesn't end in /,
1214 1.1 tls * use it as the directory to look for the redir file.
1215 1.1 tls */
1216 1.53 mrg if((size_t)snprintf(dir, sizeof(dir), "%s", request->hr_file + 1) >=
1217 1.53 mrg sizeof(dir)) {
1218 1.73 mrg bozo_http_error(httpd, 404, request,
1219 1.53 mrg "file path too long");
1220 1.53 mrg return -1;
1221 1.53 mrg }
1222 1.73 mrg debug((httpd, DEBUG_FAT, "check_bzredirect: dir %s", dir));
1223 1.1 tls basename = strrchr(dir, '/');
1224 1.1 tls
1225 1.1 tls if ((!basename || basename[1] != '\0') &&
1226 1.67 shm lstat(dir, &sb) == 0 && S_ISDIR(sb.st_mode)) {
1227 1.67 shm strcpy(path, dir);
1228 1.67 shm } else if (basename == NULL) {
1229 1.67 shm strcpy(path, ".");
1230 1.67 shm strcpy(dir, "");
1231 1.67 shm } else {
1232 1.1 tls *basename++ = '\0';
1233 1.16 mrg bozo_check_special_files(request, basename);
1234 1.67 shm strcpy(path, dir);
1235 1.1 tls }
1236 1.1 tls
1237 1.73 mrg debug((httpd, DEBUG_FAT, "check_bzredirect: path %s", path));
1238 1.67 shm
1239 1.67 shm if ((size_t)snprintf(redir, sizeof(redir), "%s/%s", path,
1240 1.53 mrg REDIRECT_FILE) >= sizeof(redir)) {
1241 1.73 mrg bozo_http_error(httpd, 404, request,
1242 1.73 mrg "redirectfile path too long");
1243 1.53 mrg return -1;
1244 1.53 mrg }
1245 1.1 tls if (lstat(redir, &sb) == 0) {
1246 1.16 mrg if (!S_ISLNK(sb.st_mode))
1247 1.36 martin return 0;
1248 1.1 tls absolute = 0;
1249 1.1 tls } else {
1250 1.67 shm if((size_t)snprintf(redir, sizeof(redir), "%s/%s", path,
1251 1.53 mrg ABSREDIRECT_FILE) >= sizeof(redir)) {
1252 1.73 mrg bozo_http_error(httpd, 404, request,
1253 1.53 mrg "redirectfile path too long");
1254 1.53 mrg return -1;
1255 1.53 mrg }
1256 1.16 mrg if (lstat(redir, &sb) < 0 || !S_ISLNK(sb.st_mode))
1257 1.36 martin return 0;
1258 1.1 tls absolute = 1;
1259 1.1 tls }
1260 1.73 mrg debug((httpd, DEBUG_FAT, "check_bzredirect: calling readlink"));
1261 1.1 tls rv = readlink(redir, redirpath, sizeof redirpath - 1);
1262 1.1 tls if (rv == -1 || rv == 0) {
1263 1.73 mrg debug((httpd, DEBUG_FAT, "readlink failed"));
1264 1.36 martin return 0;
1265 1.1 tls }
1266 1.1 tls redirpath[rv] = '\0';
1267 1.73 mrg debug((httpd, DEBUG_FAT, "readlink returned \"%s\"", redirpath));
1268 1.39 martin
1269 1.39 martin /* check if we need authentication */
1270 1.39 martin snprintf(path, sizeof(path), "%s/", dir);
1271 1.39 martin if (bozo_auth_check(request, path))
1272 1.39 martin return 1;
1273 1.39 martin
1274 1.1 tls /* now we have the link pointer, redirect to the real place */
1275 1.67 shm if (!absolute && redirpath[0] != '/') {
1276 1.67 shm if ((size_t)snprintf(finalredir = redir, sizeof(redir), "%s%s/%s",
1277 1.67 shm (strlen(dir) > 0 ? "/" : ""), dir, redirpath) >= sizeof(redir)) {
1278 1.73 mrg bozo_http_error(httpd, 404, request,
1279 1.53 mrg "redirect path too long");
1280 1.53 mrg return -1;
1281 1.53 mrg }
1282 1.67 shm } else
1283 1.67 shm finalredir = redirpath;
1284 1.1 tls
1285 1.73 mrg debug((httpd, DEBUG_FAT, "check_bzredirect: new redir %s", finalredir));
1286 1.1 tls handle_redirect(request, finalredir, absolute);
1287 1.36 martin return 1;
1288 1.1 tls }
1289 1.1 tls
1290 1.16 mrg /* this fixes the %HH hack that RFC2396 requires. */
1291 1.80 mrg int
1292 1.80 mrg bozo_decode_url_percent(bozo_httpreq_t *request, char *str)
1293 1.1 tls {
1294 1.16 mrg bozohttpd_t *httpd = request->hr_httpd;
1295 1.80 mrg char *s, *t, buf[3];
1296 1.16 mrg char *end; /* if end is not-zero, we don't translate beyond that */
1297 1.16 mrg
1298 1.80 mrg end = str + strlen(str);
1299 1.16 mrg
1300 1.16 mrg /* fast forward to the first % */
1301 1.80 mrg if ((s = strchr(str, '%')) == NULL)
1302 1.51 shm return 0;
1303 1.1 tls
1304 1.16 mrg t = s;
1305 1.16 mrg do {
1306 1.16 mrg if (end && s >= end) {
1307 1.16 mrg debug((httpd, DEBUG_EXPLODING,
1308 1.16 mrg "fu_%%: past end, filling out.."));
1309 1.16 mrg while (*s)
1310 1.16 mrg *t++ = *s++;
1311 1.16 mrg break;
1312 1.16 mrg }
1313 1.16 mrg debug((httpd, DEBUG_EXPLODING,
1314 1.16 mrg "fu_%%: got s == %%, s[1]s[2] == %c%c",
1315 1.16 mrg s[1], s[2]));
1316 1.16 mrg if (s[1] == '\0' || s[2] == '\0') {
1317 1.16 mrg (void)bozo_http_error(httpd, 400, request,
1318 1.16 mrg "percent hack missing two chars afterwards");
1319 1.51 shm return 1;
1320 1.16 mrg }
1321 1.16 mrg if (s[1] == '0' && s[2] == '0') {
1322 1.16 mrg (void)bozo_http_error(httpd, 404, request,
1323 1.16 mrg "percent hack was %00");
1324 1.51 shm return 1;
1325 1.16 mrg }
1326 1.16 mrg if (s[1] == '2' && s[2] == 'f') {
1327 1.16 mrg (void)bozo_http_error(httpd, 404, request,
1328 1.16 mrg "percent hack was %2f (/)");
1329 1.51 shm return 1;
1330 1.16 mrg }
1331 1.42 mbalmer
1332 1.16 mrg buf[0] = *++s;
1333 1.16 mrg buf[1] = *++s;
1334 1.16 mrg buf[2] = '\0';
1335 1.16 mrg s++;
1336 1.16 mrg *t = (char)strtol(buf, NULL, 16);
1337 1.16 mrg debug((httpd, DEBUG_EXPLODING,
1338 1.16 mrg "fu_%%: strtol put '%02x' into *t", *t));
1339 1.16 mrg if (*t++ == '\0') {
1340 1.16 mrg (void)bozo_http_error(httpd, 400, request,
1341 1.16 mrg "percent hack got a 0 back");
1342 1.51 shm return 1;
1343 1.16 mrg }
1344 1.1 tls
1345 1.16 mrg while (*s && *s != '%') {
1346 1.16 mrg if (end && s >= end)
1347 1.16 mrg break;
1348 1.16 mrg *t++ = *s++;
1349 1.16 mrg }
1350 1.16 mrg } while (*s);
1351 1.16 mrg *t = '\0';
1352 1.51 shm
1353 1.80 mrg debug((httpd, DEBUG_FAT, "bozo_decode_url_percent returns `%s'",
1354 1.16 mrg request->hr_file));
1355 1.51 shm
1356 1.51 shm return 0;
1357 1.1 tls }
1358 1.1 tls
1359 1.1 tls /*
1360 1.1 tls * transform_request does this:
1361 1.1 tls * - ``expand'' %20 crapola
1362 1.1 tls * - punt if it doesn't start with /
1363 1.1 tls * - look for "http://myname/" and deal with it.
1364 1.42 mbalmer * - maybe call bozo_process_cgi()
1365 1.16 mrg * - check for ~user and call bozo_user_transform() if so
1366 1.1 tls * - if the length > 1, check for trailing slash. if so,
1367 1.1 tls * add the index.html file
1368 1.1 tls * - if the length is 1, return the index.html file
1369 1.1 tls * - disallow anything ending up with a file starting
1370 1.1 tls * at "/" or having ".." in it.
1371 1.1 tls * - anything else is a really weird internal error
1372 1.12 mrg * - returns malloced file to serve, if unhandled
1373 1.1 tls */
1374 1.16 mrg static int
1375 1.16 mrg transform_request(bozo_httpreq_t *request, int *isindex)
1376 1.1 tls {
1377 1.16 mrg bozohttpd_t *httpd = request->hr_httpd;
1378 1.12 mrg char *file, *newfile = NULL;
1379 1.1 tls size_t len;
1380 1.1 tls
1381 1.12 mrg file = NULL;
1382 1.1 tls *isindex = 0;
1383 1.16 mrg debug((httpd, DEBUG_FAT, "tf_req: file %s", request->hr_file));
1384 1.80 mrg if (bozo_decode_url_percent(request, request->hr_file)) {
1385 1.51 shm goto bad_done;
1386 1.51 shm }
1387 1.12 mrg if (check_virtual(request)) {
1388 1.12 mrg goto bad_done;
1389 1.12 mrg }
1390 1.12 mrg file = request->hr_file;
1391 1.1 tls
1392 1.12 mrg if (file[0] != '/') {
1393 1.16 mrg (void)bozo_http_error(httpd, 404, request, "unknown URL");
1394 1.12 mrg goto bad_done;
1395 1.12 mrg }
1396 1.1 tls
1397 1.66 shm /* omit additional slashes at the beginning */
1398 1.66 shm while (file[1] == '/')
1399 1.66 shm file++;
1400 1.66 shm
1401 1.67 shm /* fix file provided by user as it's used in other handlers */
1402 1.67 shm request->hr_file = file;
1403 1.1 tls
1404 1.67 shm len = strlen(file);
1405 1.1 tls
1406 1.1 tls #ifndef NO_USER_SUPPORT
1407 1.67 shm /* first of all expand user path */
1408 1.67 shm if (len > 1 && httpd->enable_users && file[1] == '~') {
1409 1.12 mrg if (file[2] == '\0') {
1410 1.16 mrg (void)bozo_http_error(httpd, 404, request,
1411 1.16 mrg "missing username");
1412 1.12 mrg goto bad_done;
1413 1.12 mrg }
1414 1.12 mrg if (strchr(file + 2, '/') == NULL) {
1415 1.67 shm char *userredirecturl;
1416 1.74 mrg bozoasprintf(httpd, &userredirecturl, "%s/", file);
1417 1.67 shm handle_redirect(request, userredirecturl, 0);
1418 1.67 shm free(userredirecturl);
1419 1.12 mrg return 0;
1420 1.12 mrg }
1421 1.16 mrg debug((httpd, DEBUG_FAT, "calling bozo_user_transform"));
1422 1.12 mrg
1423 1.67 shm if (!bozo_user_transform(request))
1424 1.67 shm return 0;
1425 1.67 shm
1426 1.67 shm file = request->hr_file;
1427 1.67 shm len = strlen(file);
1428 1.67 shm }
1429 1.1 tls #endif /* NO_USER_SUPPORT */
1430 1.67 shm
1431 1.67 shm
1432 1.67 shm switch (check_bzredirect(request)) {
1433 1.67 shm case -1:
1434 1.67 shm goto bad_done;
1435 1.67 shm case 1:
1436 1.67 shm return 0;
1437 1.67 shm }
1438 1.67 shm
1439 1.67 shm if (len > 1) {
1440 1.16 mrg debug((httpd, DEBUG_FAT, "file[len-1] == %c", file[len-1]));
1441 1.12 mrg if (file[len-1] == '/') { /* append index.html */
1442 1.1 tls *isindex = 1;
1443 1.16 mrg debug((httpd, DEBUG_FAT, "appending index.html"));
1444 1.16 mrg newfile = bozomalloc(httpd,
1445 1.16 mrg len + strlen(httpd->index_html) + 1);
1446 1.12 mrg strcpy(newfile, file + 1);
1447 1.16 mrg strcat(newfile, httpd->index_html);
1448 1.1 tls } else
1449 1.73 mrg newfile = bozostrdup(httpd, request, file + 1);
1450 1.1 tls } else if (len == 1) {
1451 1.16 mrg debug((httpd, DEBUG_EXPLODING, "tf_req: len == 1"));
1452 1.73 mrg newfile = bozostrdup(httpd, request, httpd->index_html);
1453 1.1 tls *isindex = 1;
1454 1.12 mrg } else { /* len == 0 ? */
1455 1.16 mrg (void)bozo_http_error(httpd, 500, request,
1456 1.16 mrg "request->hr_file is nul?");
1457 1.12 mrg goto bad_done;
1458 1.12 mrg }
1459 1.1 tls
1460 1.12 mrg if (newfile == NULL) {
1461 1.16 mrg (void)bozo_http_error(httpd, 500, request, "internal failure");
1462 1.12 mrg goto bad_done;
1463 1.12 mrg }
1464 1.1 tls
1465 1.1 tls /*
1466 1.42 mbalmer * stop traversing outside our domain
1467 1.1 tls *
1468 1.1 tls * XXX true security only comes from our parent using chroot(2)
1469 1.1 tls * before execve(2)'ing us. or our own built in chroot(2) support.
1470 1.1 tls */
1471 1.67 shm
1472 1.67 shm debug((httpd, DEBUG_FAT, "newfile: %s", newfile));
1473 1.67 shm
1474 1.12 mrg if (*newfile == '/' || strcmp(newfile, "..") == 0 ||
1475 1.12 mrg strstr(newfile, "/..") || strstr(newfile, "../")) {
1476 1.16 mrg (void)bozo_http_error(httpd, 403, request, "illegal request");
1477 1.12 mrg goto bad_done;
1478 1.12 mrg }
1479 1.12 mrg
1480 1.17 mrg if (bozo_auth_check(request, newfile))
1481 1.12 mrg goto bad_done;
1482 1.1 tls
1483 1.13 mrg if (strlen(newfile)) {
1484 1.20 mrg request->hr_oldfile = request->hr_file;
1485 1.12 mrg request->hr_file = newfile;
1486 1.13 mrg }
1487 1.9 tls
1488 1.16 mrg if (bozo_process_cgi(request))
1489 1.12 mrg return 0;
1490 1.1 tls
1491 1.43 mbalmer if (bozo_process_lua(request))
1492 1.43 mbalmer return 0;
1493 1.43 mbalmer
1494 1.16 mrg debug((httpd, DEBUG_FAT, "transform_request set: %s", newfile));
1495 1.12 mrg return 1;
1496 1.12 mrg bad_done:
1497 1.16 mrg debug((httpd, DEBUG_FAT, "transform_request returning: 0"));
1498 1.44 mbalmer free(newfile);
1499 1.12 mrg return 0;
1500 1.1 tls }
1501 1.1 tls
1502 1.1 tls /*
1503 1.31 elric * can_gzip checks if the request supports and prefers gzip encoding.
1504 1.31 elric *
1505 1.31 elric * XXX: we do not consider the associated q with gzip in making our
1506 1.31 elric * decision which is broken.
1507 1.31 elric */
1508 1.31 elric
1509 1.31 elric static int
1510 1.31 elric can_gzip(bozo_httpreq_t *request)
1511 1.31 elric {
1512 1.31 elric const char *pos;
1513 1.31 elric const char *tmp;
1514 1.31 elric size_t len;
1515 1.31 elric
1516 1.31 elric /* First we decide if the request can be gzipped at all. */
1517 1.31 elric
1518 1.31 elric /* not if we already are encoded... */
1519 1.31 elric tmp = bozo_content_encoding(request, request->hr_file);
1520 1.31 elric if (tmp && *tmp)
1521 1.31 elric return 0;
1522 1.31 elric
1523 1.31 elric /* not if we are not asking for the whole file... */
1524 1.31 elric if (request->hr_last_byte_pos != -1 || request->hr_have_range)
1525 1.31 elric return 0;
1526 1.31 elric
1527 1.31 elric /* Then we determine if gzip is on the cards. */
1528 1.31 elric
1529 1.31 elric for (pos = request->hr_accept_encoding; pos && *pos; pos += len) {
1530 1.31 elric while (*pos == ' ')
1531 1.31 elric pos++;
1532 1.31 elric
1533 1.31 elric len = strcspn(pos, ";,");
1534 1.31 elric
1535 1.31 elric if ((len == 4 && strncasecmp("gzip", pos, 4) == 0) ||
1536 1.31 elric (len == 6 && strncasecmp("x-gzip", pos, 6) == 0))
1537 1.31 elric return 1;
1538 1.31 elric
1539 1.31 elric if (pos[len] == ';')
1540 1.31 elric len += strcspn(&pos[len], ",");
1541 1.31 elric
1542 1.31 elric if (pos[len])
1543 1.31 elric len++;
1544 1.31 elric }
1545 1.31 elric
1546 1.31 elric return 0;
1547 1.31 elric }
1548 1.31 elric
1549 1.31 elric /*
1550 1.16 mrg * bozo_process_request does the following:
1551 1.16 mrg * - check the request is valid
1552 1.16 mrg * - process cgi-bin if necessary
1553 1.16 mrg * - transform a filename if necesarry
1554 1.16 mrg * - return the HTTP request
1555 1.1 tls */
1556 1.16 mrg void
1557 1.16 mrg bozo_process_request(bozo_httpreq_t *request)
1558 1.1 tls {
1559 1.16 mrg bozohttpd_t *httpd = request->hr_httpd;
1560 1.16 mrg struct stat sb;
1561 1.16 mrg time_t timestamp;
1562 1.16 mrg char *file;
1563 1.16 mrg const char *type, *encoding;
1564 1.16 mrg int fd, isindex;
1565 1.16 mrg
1566 1.16 mrg /*
1567 1.16 mrg * note that transform_request chdir()'s if required. also note
1568 1.16 mrg * that cgi is handed here. if transform_request() returns 0
1569 1.16 mrg * then the request has been handled already.
1570 1.16 mrg */
1571 1.16 mrg if (transform_request(request, &isindex) == 0)
1572 1.16 mrg return;
1573 1.12 mrg
1574 1.31 elric fd = -1;
1575 1.31 elric encoding = NULL;
1576 1.31 elric if (can_gzip(request)) {
1577 1.74 mrg bozoasprintf(httpd, &file, "%s.gz", request->hr_file);
1578 1.31 elric fd = open(file, O_RDONLY);
1579 1.31 elric if (fd >= 0)
1580 1.31 elric encoding = "gzip";
1581 1.31 elric free(file);
1582 1.31 elric }
1583 1.31 elric
1584 1.16 mrg file = request->hr_file;
1585 1.9 tls
1586 1.31 elric if (fd < 0)
1587 1.31 elric fd = open(file, O_RDONLY);
1588 1.31 elric
1589 1.16 mrg if (fd < 0) {
1590 1.16 mrg debug((httpd, DEBUG_FAT, "open failed: %s", strerror(errno)));
1591 1.67 shm switch (errno) {
1592 1.52 shm case EPERM:
1593 1.61 snj case EACCES:
1594 1.16 mrg (void)bozo_http_error(httpd, 403, request,
1595 1.16 mrg "no permission to open file");
1596 1.52 shm break;
1597 1.52 shm case ENAMETOOLONG:
1598 1.52 shm /*FALLTHROUGH*/
1599 1.52 shm case ENOENT:
1600 1.42 mbalmer if (!bozo_dir_index(request, file, isindex))
1601 1.16 mrg (void)bozo_http_error(httpd, 404, request,
1602 1.16 mrg "no file");
1603 1.52 shm break;
1604 1.52 shm default:
1605 1.16 mrg (void)bozo_http_error(httpd, 500, request, "open file");
1606 1.52 shm }
1607 1.16 mrg goto cleanup_nofd;
1608 1.1 tls }
1609 1.16 mrg if (fstat(fd, &sb) < 0) {
1610 1.16 mrg (void)bozo_http_error(httpd, 500, request, "can't fstat");
1611 1.16 mrg goto cleanup;
1612 1.9 tls }
1613 1.16 mrg if (S_ISDIR(sb.st_mode)) {
1614 1.16 mrg handle_redirect(request, NULL, 0);
1615 1.16 mrg goto cleanup;
1616 1.6 mrg }
1617 1.1 tls
1618 1.16 mrg if (request->hr_if_modified_since &&
1619 1.16 mrg parse_http_date(request->hr_if_modified_since, ×tamp) &&
1620 1.16 mrg timestamp >= sb.st_mtime) {
1621 1.16 mrg /* XXX ignore subsecond of timestamp */
1622 1.16 mrg bozo_printf(httpd, "%s 304 Not Modified\r\n",
1623 1.16 mrg request->hr_proto);
1624 1.16 mrg bozo_printf(httpd, "\r\n");
1625 1.16 mrg bozo_flush(httpd, stdout);
1626 1.16 mrg goto cleanup;
1627 1.1 tls }
1628 1.1 tls
1629 1.16 mrg /* validate requested range */
1630 1.16 mrg if (request->hr_last_byte_pos == -1 ||
1631 1.16 mrg request->hr_last_byte_pos >= sb.st_size)
1632 1.16 mrg request->hr_last_byte_pos = sb.st_size - 1;
1633 1.16 mrg if (request->hr_have_range &&
1634 1.16 mrg request->hr_first_byte_pos > request->hr_last_byte_pos) {
1635 1.16 mrg request->hr_have_range = 0; /* punt */
1636 1.16 mrg request->hr_first_byte_pos = 0;
1637 1.16 mrg request->hr_last_byte_pos = sb.st_size - 1;
1638 1.1 tls }
1639 1.28 joerg debug((httpd, DEBUG_FAT, "have_range %d first_pos %lld last_pos %lld",
1640 1.16 mrg request->hr_have_range,
1641 1.28 joerg (long long)request->hr_first_byte_pos,
1642 1.28 joerg (long long)request->hr_last_byte_pos));
1643 1.16 mrg if (request->hr_have_range)
1644 1.16 mrg bozo_printf(httpd, "%s 206 Partial Content\r\n",
1645 1.16 mrg request->hr_proto);
1646 1.16 mrg else
1647 1.16 mrg bozo_printf(httpd, "%s 200 OK\r\n", request->hr_proto);
1648 1.1 tls
1649 1.16 mrg if (request->hr_proto != httpd->consts.http_09) {
1650 1.16 mrg type = bozo_content_type(request, file);
1651 1.31 elric if (!encoding)
1652 1.31 elric encoding = bozo_content_encoding(request, file);
1653 1.1 tls
1654 1.16 mrg bozo_print_header(request, &sb, type, encoding);
1655 1.16 mrg bozo_printf(httpd, "\r\n");
1656 1.12 mrg }
1657 1.16 mrg bozo_flush(httpd, stdout);
1658 1.1 tls
1659 1.16 mrg if (request->hr_method != HTTP_HEAD) {
1660 1.16 mrg off_t szleft, cur_byte_pos;
1661 1.1 tls
1662 1.16 mrg szleft =
1663 1.16 mrg request->hr_last_byte_pos - request->hr_first_byte_pos + 1;
1664 1.16 mrg cur_byte_pos = request->hr_first_byte_pos;
1665 1.1 tls
1666 1.16 mrg retry:
1667 1.16 mrg while (szleft) {
1668 1.16 mrg size_t sz;
1669 1.12 mrg
1670 1.16 mrg if ((off_t)httpd->mmapsz < szleft)
1671 1.16 mrg sz = httpd->mmapsz;
1672 1.16 mrg else
1673 1.16 mrg sz = (size_t)szleft;
1674 1.16 mrg if (mmap_and_write_part(httpd, fd, cur_byte_pos, sz)) {
1675 1.16 mrg if (errno == ENOMEM) {
1676 1.16 mrg httpd->mmapsz /= 2;
1677 1.16 mrg if (httpd->mmapsz >= httpd->page_size)
1678 1.16 mrg goto retry;
1679 1.16 mrg }
1680 1.16 mrg goto cleanup;
1681 1.16 mrg }
1682 1.16 mrg cur_byte_pos += sz;
1683 1.16 mrg szleft -= sz;
1684 1.1 tls }
1685 1.16 mrg }
1686 1.16 mrg cleanup:
1687 1.16 mrg close(fd);
1688 1.16 mrg cleanup_nofd:
1689 1.16 mrg close(STDIN_FILENO);
1690 1.16 mrg close(STDOUT_FILENO);
1691 1.16 mrg /*close(STDERR_FILENO);*/
1692 1.1 tls }
1693 1.1 tls
1694 1.16 mrg /* make sure we're not trying to access special files */
1695 1.16 mrg int
1696 1.16 mrg bozo_check_special_files(bozo_httpreq_t *request, const char *name)
1697 1.1 tls {
1698 1.16 mrg bozohttpd_t *httpd = request->hr_httpd;
1699 1.1 tls
1700 1.16 mrg /* ensure basename(name) != special files */
1701 1.16 mrg if (strcmp(name, DIRECT_ACCESS_FILE) == 0)
1702 1.16 mrg return bozo_http_error(httpd, 403, request,
1703 1.16 mrg "no permission to open direct access file");
1704 1.16 mrg if (strcmp(name, REDIRECT_FILE) == 0)
1705 1.16 mrg return bozo_http_error(httpd, 403, request,
1706 1.16 mrg "no permission to open redirect file");
1707 1.16 mrg if (strcmp(name, ABSREDIRECT_FILE) == 0)
1708 1.16 mrg return bozo_http_error(httpd, 403, request,
1709 1.16 mrg "no permission to open redirect file");
1710 1.17 mrg return bozo_auth_check_special_files(request, name);
1711 1.16 mrg }
1712 1.1 tls
1713 1.16 mrg /* generic header printing routine */
1714 1.16 mrg void
1715 1.16 mrg bozo_print_header(bozo_httpreq_t *request,
1716 1.16 mrg struct stat *sbp, const char *type, const char *encoding)
1717 1.16 mrg {
1718 1.16 mrg bozohttpd_t *httpd = request->hr_httpd;
1719 1.16 mrg off_t len;
1720 1.16 mrg char date[40];
1721 1.78 elric bozoheaders_t *hdr;
1722 1.78 elric
1723 1.78 elric SIMPLEQ_FOREACH(hdr, &request->hr_replheaders, h_next) {
1724 1.78 elric bozo_printf(httpd, "%s: %s\r\n", hdr->h_header,
1725 1.78 elric hdr->h_value);
1726 1.78 elric }
1727 1.1 tls
1728 1.16 mrg bozo_printf(httpd, "Date: %s\r\n", bozo_http_date(date, sizeof(date)));
1729 1.16 mrg bozo_printf(httpd, "Server: %s\r\n", httpd->server_software);
1730 1.16 mrg bozo_printf(httpd, "Accept-Ranges: bytes\r\n");
1731 1.16 mrg if (sbp) {
1732 1.16 mrg char filedate[40];
1733 1.16 mrg struct tm *tm;
1734 1.1 tls
1735 1.16 mrg tm = gmtime(&sbp->st_mtime);
1736 1.16 mrg strftime(filedate, sizeof filedate,
1737 1.16 mrg "%a, %d %b %Y %H:%M:%S GMT", tm);
1738 1.16 mrg bozo_printf(httpd, "Last-Modified: %s\r\n", filedate);
1739 1.16 mrg }
1740 1.16 mrg if (type && *type)
1741 1.16 mrg bozo_printf(httpd, "Content-Type: %s\r\n", type);
1742 1.16 mrg if (encoding && *encoding)
1743 1.16 mrg bozo_printf(httpd, "Content-Encoding: %s\r\n", encoding);
1744 1.16 mrg if (sbp) {
1745 1.16 mrg if (request->hr_have_range) {
1746 1.16 mrg len = request->hr_last_byte_pos -
1747 1.16 mrg request->hr_first_byte_pos +1;
1748 1.16 mrg bozo_printf(httpd,
1749 1.16 mrg "Content-Range: bytes %qd-%qd/%qd\r\n",
1750 1.16 mrg (long long) request->hr_first_byte_pos,
1751 1.16 mrg (long long) request->hr_last_byte_pos,
1752 1.16 mrg (long long) sbp->st_size);
1753 1.16 mrg } else
1754 1.16 mrg len = sbp->st_size;
1755 1.16 mrg bozo_printf(httpd, "Content-Length: %qd\r\n", (long long)len);
1756 1.1 tls }
1757 1.67 shm if (request->hr_proto == httpd->consts.http_11)
1758 1.16 mrg bozo_printf(httpd, "Connection: close\r\n");
1759 1.16 mrg bozo_flush(httpd, stdout);
1760 1.1 tls }
1761 1.1 tls
1762 1.25 mrg #ifndef NO_DEBUG
1763 1.1 tls void
1764 1.16 mrg debug__(bozohttpd_t *httpd, int level, const char *fmt, ...)
1765 1.1 tls {
1766 1.1 tls va_list ap;
1767 1.1 tls int savederrno;
1768 1.42 mbalmer
1769 1.1 tls /* only log if the level is low enough */
1770 1.16 mrg if (httpd->debug < level)
1771 1.1 tls return;
1772 1.1 tls
1773 1.1 tls savederrno = errno;
1774 1.1 tls va_start(ap, fmt);
1775 1.16 mrg if (httpd->logstderr) {
1776 1.1 tls vfprintf(stderr, fmt, ap);
1777 1.1 tls fputs("\n", stderr);
1778 1.1 tls } else
1779 1.1 tls vsyslog(LOG_DEBUG, fmt, ap);
1780 1.1 tls va_end(ap);
1781 1.1 tls errno = savederrno;
1782 1.1 tls }
1783 1.25 mrg #endif /* NO_DEBUG */
1784 1.1 tls
1785 1.1 tls /* these are like warn() and err(), except for syslog not stderr */
1786 1.1 tls void
1787 1.74 mrg bozowarn(bozohttpd_t *httpd, const char *fmt, ...)
1788 1.1 tls {
1789 1.1 tls va_list ap;
1790 1.1 tls
1791 1.1 tls va_start(ap, fmt);
1792 1.16 mrg if (httpd->logstderr || isatty(STDERR_FILENO)) {
1793 1.14 mrg //fputs("warning: ", stderr);
1794 1.1 tls vfprintf(stderr, fmt, ap);
1795 1.1 tls fputs("\n", stderr);
1796 1.1 tls } else
1797 1.1 tls vsyslog(LOG_INFO, fmt, ap);
1798 1.1 tls va_end(ap);
1799 1.1 tls }
1800 1.1 tls
1801 1.1 tls void
1802 1.74 mrg bozoerr(bozohttpd_t *httpd, int code, const char *fmt, ...)
1803 1.1 tls {
1804 1.1 tls va_list ap;
1805 1.1 tls
1806 1.1 tls va_start(ap, fmt);
1807 1.16 mrg if (httpd->logstderr || isatty(STDERR_FILENO)) {
1808 1.14 mrg //fputs("error: ", stderr);
1809 1.1 tls vfprintf(stderr, fmt, ap);
1810 1.1 tls fputs("\n", stderr);
1811 1.1 tls } else
1812 1.1 tls vsyslog(LOG_ERR, fmt, ap);
1813 1.1 tls va_end(ap);
1814 1.1 tls exit(code);
1815 1.1 tls }
1816 1.1 tls
1817 1.72 christos void
1818 1.74 mrg bozoasprintf(bozohttpd_t *httpd, char **str, const char *fmt, ...)
1819 1.72 christos {
1820 1.72 christos va_list ap;
1821 1.72 christos int e;
1822 1.72 christos
1823 1.72 christos va_start(ap, fmt);
1824 1.72 christos e = vasprintf(str, fmt, ap);
1825 1.72 christos va_end(ap);
1826 1.72 christos
1827 1.72 christos if (e < 0)
1828 1.74 mrg bozoerr(httpd, EXIT_FAILURE, "asprintf");
1829 1.72 christos }
1830 1.72 christos
1831 1.40 mrg /*
1832 1.40 mrg * this escapes HTML tags. returns allocated escaped
1833 1.40 mrg * string if needed, or NULL on allocation failure or
1834 1.40 mrg * lack of escape need.
1835 1.40 mrg * call with NULL httpd in error paths, to avoid recursive
1836 1.40 mrg * malloc failure. call with valid httpd in normal paths
1837 1.40 mrg * to get automatic allocation failure handling.
1838 1.40 mrg */
1839 1.40 mrg char *
1840 1.40 mrg bozo_escape_html(bozohttpd_t *httpd, const char *url)
1841 1.1 tls {
1842 1.16 mrg int i, j;
1843 1.40 mrg char *tmp;
1844 1.40 mrg size_t len;
1845 1.1 tls
1846 1.16 mrg for (i = 0, j = 0; url[i]; i++) {
1847 1.16 mrg switch (url[i]) {
1848 1.16 mrg case '<':
1849 1.16 mrg case '>':
1850 1.16 mrg j += 4;
1851 1.16 mrg break;
1852 1.16 mrg case '&':
1853 1.16 mrg j += 5;
1854 1.16 mrg break;
1855 1.16 mrg }
1856 1.12 mrg }
1857 1.1 tls
1858 1.16 mrg if (j == 0)
1859 1.40 mrg return NULL;
1860 1.16 mrg
1861 1.40 mrg /*
1862 1.40 mrg * we need to handle being called from different
1863 1.40 mrg * pathnames.
1864 1.40 mrg */
1865 1.40 mrg len = strlen(url) + j;
1866 1.40 mrg if (httpd)
1867 1.40 mrg tmp = bozomalloc(httpd, len);
1868 1.40 mrg else if ((tmp = malloc(len)) == 0)
1869 1.40 mrg return NULL;
1870 1.1 tls
1871 1.16 mrg for (i = 0, j = 0; url[i]; i++) {
1872 1.16 mrg switch (url[i]) {
1873 1.16 mrg case '<':
1874 1.16 mrg memcpy(tmp + j, "<", 4);
1875 1.16 mrg j += 4;
1876 1.16 mrg break;
1877 1.16 mrg case '>':
1878 1.16 mrg memcpy(tmp + j, ">", 4);
1879 1.16 mrg j += 4;
1880 1.16 mrg break;
1881 1.16 mrg case '&':
1882 1.16 mrg memcpy(tmp + j, "&", 5);
1883 1.16 mrg j += 5;
1884 1.16 mrg break;
1885 1.16 mrg default:
1886 1.16 mrg tmp[j++] = url[i];
1887 1.12 mrg }
1888 1.16 mrg }
1889 1.16 mrg tmp[j] = 0;
1890 1.1 tls
1891 1.40 mrg return tmp;
1892 1.1 tls }
1893 1.1 tls
/* short map between error code, and short/long messages */
static struct errors_map {
	int	code;			/* HTTP return code */
	const char *shortmsg;		/* short version of message */
	const char *longmsg;		/* long version of message */
} errors_map[] = {
	{ 400,	"400 Bad Request",	"The request was not valid", },
	{ 401,	"401 Unauthorized",	"No authorization", },
	{ 403,	"403 Forbidden",	"Access to this item has been denied",},
	{ 404,	"404 Not Found",	"This item has not been found", },
	{ 408,	"408 Request Timeout",	"This request took too long", },
	{ 417,	"417 Expectation Failed","Expectations not available", },
	{ 420,	"420 Enhance Your Calm","Chill, Winston", },
	{ 500,	"500 Internal Error",	"An error occurred on the server", },
	{ 501,	"501 Not Implemented",	"This request is not available", },
	{ 0,	NULL,			NULL, },	/* end marker */
};

/* returned by both lookups for codes that are not in errors_map[] */
static const char *help = "DANGER! WILL ROBINSON! DANGER!";

/*
 * find the errors_map[] entry for `code'; returns NULL when the
 * table's end marker (code 0) is reached without a match.
 */
static const struct errors_map *
http_errors_find(int code)
{
	const struct errors_map *ep;

	for (ep = errors_map; ep->code; ep++)
		if (ep->code == code)
			return ep;
	return NULL;
}

/* status-line text ("404 Not Found") for `code', or `help' if unknown */
static const char *
http_errors_short(int code)
{
	const struct errors_map *ep = http_errors_find(code);

	return ep != NULL ? ep->shortmsg : help;
}

/* explanatory sentence for `code', or `help' if unknown */
static const char *
http_errors_long(int code)
{
	const struct errors_map *ep = http_errors_find(code);

	return ep != NULL ? ep->longmsg : help;
}
1935 1.1 tls
1936 1.16 mrg /* the follow functions and variables are used in handling HTTP errors */
1937 1.16 mrg /* ARGSUSED */
1938 1.16 mrg int
1939 1.16 mrg bozo_http_error(bozohttpd_t *httpd, int code, bozo_httpreq_t *request,
1940 1.16 mrg const char *msg)
1941 1.16 mrg {
1942 1.16 mrg char portbuf[20];
1943 1.16 mrg const char *header = http_errors_short(code);
1944 1.16 mrg const char *reason = http_errors_long(code);
1945 1.16 mrg const char *proto = (request && request->hr_proto) ?
1946 1.16 mrg request->hr_proto : httpd->consts.http_11;
1947 1.16 mrg int size;
1948 1.78 elric bozoheaders_t *hdr;
1949 1.16 mrg
1950 1.16 mrg debug((httpd, DEBUG_FAT, "bozo_http_error %d: %s", code, msg));
1951 1.16 mrg if (header == NULL || reason == NULL) {
1952 1.74 mrg bozoerr(httpd, 1,
1953 1.16 mrg "bozo_http_error() failed (short = %p, long = %p)",
1954 1.16 mrg header, reason);
1955 1.16 mrg return code;
1956 1.16 mrg }
1957 1.16 mrg
1958 1.16 mrg if (request && request->hr_serverport &&
1959 1.16 mrg strcmp(request->hr_serverport, "80") != 0)
1960 1.16 mrg snprintf(portbuf, sizeof(portbuf), ":%s",
1961 1.16 mrg request->hr_serverport);
1962 1.16 mrg else
1963 1.16 mrg portbuf[0] = '\0';
1964 1.16 mrg
1965 1.16 mrg if (request && request->hr_file) {
1966 1.67 shm char *file = NULL, *user = NULL, *user_escaped = NULL;
1967 1.69 christos int file_alloc = 0;
1968 1.46 mrg const char *hostname = BOZOHOST(httpd, request);
1969 1.40 mrg
1970 1.40 mrg /* bozo_escape_html() failure here is just too bad. */
1971 1.40 mrg file = bozo_escape_html(NULL, request->hr_file);
1972 1.67 shm if (file == NULL)
1973 1.40 mrg file = request->hr_file;
1974 1.67 shm else
1975 1.67 shm file_alloc = 1;
1976 1.67 shm
1977 1.67 shm #ifndef NO_USER_SUPPORT
1978 1.67 shm if (request->hr_user != NULL) {
1979 1.67 shm user_escaped = bozo_escape_html(NULL, request->hr_user);
1980 1.67 shm if (user_escaped == NULL)
1981 1.67 shm user_escaped = request->hr_user;
1982 1.67 shm /* expand username to ~user/ */
1983 1.74 mrg bozoasprintf(httpd, &user, "~%s/", user_escaped);
1984 1.69 christos if (user_escaped != request->hr_user)
1985 1.67 shm free(user_escaped);
1986 1.67 shm }
1987 1.67 shm #endif /* !NO_USER_SUPPORT */
1988 1.67 shm
1989 1.16 mrg size = snprintf(httpd->errorbuf, BUFSIZ,
1990 1.16 mrg "<html><head><title>%s</title></head>\n"
1991 1.16 mrg "<body><h1>%s</h1>\n"
1992 1.67 shm "%s%s: <pre>%s</pre>\n"
1993 1.16 mrg "<hr><address><a href=\"http://%s%s/\">%s%s</a></address>\n"
1994 1.16 mrg "</body></html>\n",
1995 1.67 shm header, header,
1996 1.67 shm user ? user : "", file,
1997 1.67 shm reason, hostname, portbuf, hostname, portbuf);
1998 1.69 christos free(user);
1999 1.16 mrg if (size >= (int)BUFSIZ) {
2000 1.74 mrg bozowarn(httpd,
2001 1.16 mrg "bozo_http_error buffer too small, truncated");
2002 1.16 mrg size = (int)BUFSIZ;
2003 1.16 mrg }
2004 1.67 shm
2005 1.67 shm if (file_alloc)
2006 1.67 shm free(file);
2007 1.16 mrg } else
2008 1.16 mrg size = 0;
2009 1.16 mrg
2010 1.16 mrg bozo_printf(httpd, "%s %s\r\n", proto, header);
2011 1.78 elric
2012 1.78 elric if (request) {
2013 1.26 pooka bozo_auth_check_401(request, code);
2014 1.78 elric SIMPLEQ_FOREACH(hdr, &request->hr_replheaders, h_next) {
2015 1.78 elric bozo_printf(httpd, "%s: %s\r\n", hdr->h_header,
2016 1.78 elric hdr->h_value);
2017 1.78 elric }
2018 1.78 elric }
2019 1.16 mrg
2020 1.16 mrg bozo_printf(httpd, "Content-Type: text/html\r\n");
2021 1.16 mrg bozo_printf(httpd, "Content-Length: %d\r\n", size);
2022 1.16 mrg bozo_printf(httpd, "Server: %s\r\n", httpd->server_software);
2023 1.16 mrg if (request && request->hr_allow)
2024 1.16 mrg bozo_printf(httpd, "Allow: %s\r\n", request->hr_allow);
2025 1.16 mrg bozo_printf(httpd, "\r\n");
2026 1.51 shm /* According to the RFC 2616 sec. 9.4 HEAD method MUST NOT return a
2027 1.51 shm * message-body in the response */
2028 1.51 shm if (size && request && request->hr_method != HTTP_HEAD)
2029 1.16 mrg bozo_printf(httpd, "%s", httpd->errorbuf);
2030 1.16 mrg bozo_flush(httpd, stdout);
2031 1.16 mrg
2032 1.16 mrg return code;
2033 1.16 mrg }
2034 1.16 mrg
2035 1.1 tls /* Below are various modified libc functions */
2036 1.1 tls
/*
 * strsep(3) with a length budget.  Each character examined first
 * decrements *lenp; when that makes *lenp reach -1 the string ran out
 * before a delimiter was found and NULL is returned (with *strp left
 * untouched).  Otherwise behaves like strsep: the token start is
 * returned, the delimiter is overwritten with NUL and *strp is moved
 * past it (or set to NULL when the terminating NUL was hit).
 * Note that the length must be correctly passed in; a NULL lenp
 * disables the length check.
 */
char *
bozostrnsep(char **strp, const char *delim, ssize_t *lenp)
{
	char *cursor = *strp;
	char *start = cursor;

	if (cursor == NULL)
		return NULL;

	for (;;) {
		const char *d;
		int ch;

		if (lenp != NULL) {
			*lenp -= 1;
			if (*lenp == -1)
				return NULL;
		}

		ch = *cursor++;

		/* delim's own terminating NUL takes part in the match */
		for (d = delim; ; d++) {
			int dc = *d;

			if (dc == ch) {
				if (ch == 0)
					cursor = NULL;
				else
					cursor[-1] = '\0';
				*strp = cursor;
				return start;
			}
			if (dc == 0)
				break;
		}
	}
	/* NOTREACHED */
}
2070 1.1 tls
2071 1.1 tls /*
2072 1.1 tls * inspired by fgetln(3), but works for fd's. should work identically
2073 1.1 tls * except it, however, does *not* return the newline, and it does nul
2074 1.1 tls * terminate the string.
2075 1.1 tls */
2076 1.1 tls char *
2077 1.16 mrg bozodgetln(bozohttpd_t *httpd, int fd, ssize_t *lenp,
2078 1.16 mrg ssize_t (*readfn)(bozohttpd_t *, int, void *, size_t))
2079 1.1 tls {
2080 1.1 tls ssize_t len;
2081 1.1 tls int got_cr = 0;
2082 1.1 tls char c, *nbuffer;
2083 1.1 tls
2084 1.1 tls /* initialise */
2085 1.16 mrg if (httpd->getln_buflen == 0) {
2086 1.16 mrg /* should be plenty for most requests */
2087 1.16 mrg httpd->getln_buflen = 128;
2088 1.16 mrg httpd->getln_buffer = malloc((size_t)httpd->getln_buflen);
2089 1.16 mrg if (httpd->getln_buffer == NULL) {
2090 1.16 mrg httpd->getln_buflen = 0;
2091 1.1 tls return NULL;
2092 1.1 tls }
2093 1.1 tls }
2094 1.1 tls len = 0;
2095 1.1 tls
2096 1.1 tls /*
2097 1.1 tls * we *have* to read one byte at a time, to not break cgi
2098 1.1 tls * programs (for we pass stdin off to them). could fix this
2099 1.1 tls * by becoming a fd-passing program instead of just exec'ing
2100 1.1 tls * the program
2101 1.17 mrg *
2102 1.17 mrg * the above is no longer true, we are the fd-passing
2103 1.17 mrg * program already.
2104 1.1 tls */
2105 1.16 mrg for (; readfn(httpd, fd, &c, 1) == 1; ) {
2106 1.16 mrg debug((httpd, DEBUG_EXPLODING, "bozodgetln read %c", c));
2107 1.1 tls
2108 1.16 mrg if (len >= httpd->getln_buflen - 1) {
2109 1.16 mrg httpd->getln_buflen *= 2;
2110 1.16 mrg debug((httpd, DEBUG_EXPLODING, "bozodgetln: "
2111 1.16 mrg "reallocating buffer to buflen %zu",
2112 1.16 mrg httpd->getln_buflen));
2113 1.16 mrg nbuffer = bozorealloc(httpd, httpd->getln_buffer,
2114 1.16 mrg (size_t)httpd->getln_buflen);
2115 1.16 mrg httpd->getln_buffer = nbuffer;
2116 1.1 tls }
2117 1.1 tls
2118 1.16 mrg httpd->getln_buffer[len++] = c;
2119 1.1 tls if (c == '\r') {
2120 1.1 tls got_cr = 1;
2121 1.1 tls continue;
2122 1.1 tls } else if (c == '\n') {
2123 1.1 tls /*
2124 1.1 tls * HTTP/1.1 spec says to ignore CR and treat
2125 1.1 tls * LF as the real line terminator. even though
2126 1.1 tls * the same spec defines CRLF as the line
2127 1.1 tls * terminator, it is recommended in section 19.3
2128 1.1 tls * to do the LF trick for tolerance.
2129 1.1 tls */
2130 1.1 tls if (got_cr)
2131 1.1 tls len -= 2;
2132 1.1 tls else
2133 1.1 tls len -= 1;
2134 1.1 tls break;
2135 1.1 tls }
2136 1.1 tls
2137 1.1 tls }
2138 1.16 mrg httpd->getln_buffer[len] = '\0';
2139 1.28 joerg debug((httpd, DEBUG_OBESE, "bozodgetln returns: ``%s'' with len %zd",
2140 1.16 mrg httpd->getln_buffer, len));
2141 1.1 tls *lenp = len;
2142 1.16 mrg return httpd->getln_buffer;
2143 1.1 tls }
2144 1.1 tls
2145 1.1 tls void *
2146 1.16 mrg bozorealloc(bozohttpd_t *httpd, void *ptr, size_t size)
2147 1.1 tls {
2148 1.1 tls void *p;
2149 1.1 tls
2150 1.1 tls p = realloc(ptr, size);
2151 1.73 mrg if (p)
2152 1.73 mrg return p;
2153 1.73 mrg
2154 1.73 mrg (void)bozo_http_error(httpd, 500, NULL, "memory allocation failure");
2155 1.73 mrg exit(EXIT_FAILURE);
2156 1.1 tls }
2157 1.1 tls
2158 1.1 tls void *
2159 1.16 mrg bozomalloc(bozohttpd_t *httpd, size_t size)
2160 1.1 tls {
2161 1.1 tls void *p;
2162 1.1 tls
2163 1.1 tls p = malloc(size);
2164 1.73 mrg if (p)
2165 1.73 mrg return p;
2166 1.73 mrg
2167 1.73 mrg (void)bozo_http_error(httpd, 500, NULL, "memory allocation failure");
2168 1.73 mrg exit(EXIT_FAILURE);
2169 1.1 tls }
2170 1.1 tls
2171 1.1 tls char *
2172 1.73 mrg bozostrdup(bozohttpd_t *httpd, bozo_httpreq_t *request, const char *str)
2173 1.1 tls {
2174 1.1 tls char *p;
2175 1.1 tls
2176 1.1 tls p = strdup(str);
2177 1.73 mrg if (p)
2178 1.73 mrg return p;
2179 1.73 mrg
2180 1.73 mrg if (!request)
2181 1.74 mrg bozoerr(httpd, EXIT_FAILURE, "strdup");
2182 1.73 mrg
2183 1.73 mrg (void)bozo_http_error(httpd, 500, request, "memory allocation failure");
2184 1.73 mrg exit(EXIT_FAILURE);
2185 1.1 tls }
2186 1.16 mrg
2187 1.16 mrg /* set default values in bozohttpd_t struct */
2188 1.16 mrg int
2189 1.16 mrg bozo_init_httpd(bozohttpd_t *httpd)
2190 1.16 mrg {
2191 1.16 mrg /* make sure everything is clean */
2192 1.16 mrg (void) memset(httpd, 0x0, sizeof(*httpd));
2193 1.16 mrg
2194 1.16 mrg /* constants */
2195 1.16 mrg httpd->consts.http_09 = "HTTP/0.9";
2196 1.16 mrg httpd->consts.http_10 = "HTTP/1.0";
2197 1.16 mrg httpd->consts.http_11 = "HTTP/1.1";
2198 1.16 mrg httpd->consts.text_plain = "text/plain";
2199 1.16 mrg
2200 1.16 mrg /* mmap region size */
2201 1.16 mrg httpd->mmapsz = BOZO_MMAPSZ;
2202 1.16 mrg
2203 1.16 mrg /* error buffer for bozo_http_error() */
2204 1.16 mrg if ((httpd->errorbuf = malloc(BUFSIZ)) == NULL) {
2205 1.16 mrg (void) fprintf(stderr,
2206 1.16 mrg "bozohttpd: memory_allocation failure\n");
2207 1.16 mrg return 0;
2208 1.16 mrg }
2209 1.43 mbalmer #ifndef NO_LUA_SUPPORT
2210 1.43 mbalmer SIMPLEQ_INIT(&httpd->lua_states);
2211 1.43 mbalmer #endif
2212 1.16 mrg return 1;
2213 1.16 mrg }
2214 1.16 mrg
2215 1.16 mrg /* set default values in bozoprefs_t struct */
2216 1.16 mrg int
2217 1.73 mrg bozo_init_prefs(bozohttpd_t *httpd, bozoprefs_t *prefs)
2218 1.16 mrg {
2219 1.16 mrg /* make sure everything is clean */
2220 1.16 mrg (void) memset(prefs, 0x0, sizeof(*prefs));
2221 1.16 mrg
2222 1.16 mrg /* set up default values */
2223 1.73 mrg if (!bozo_set_pref(httpd, prefs, "server software", SERVER_SOFTWARE) ||
2224 1.73 mrg !bozo_set_pref(httpd, prefs, "index.html", INDEX_HTML) ||
2225 1.73 mrg !bozo_set_pref(httpd, prefs, "public_html", PUBLIC_HTML))
2226 1.73 mrg return 0;
2227 1.16 mrg
2228 1.16 mrg return 1;
2229 1.16 mrg }
2230 1.16 mrg
2231 1.16 mrg /* set default values */
2232 1.16 mrg int
2233 1.16 mrg bozo_set_defaults(bozohttpd_t *httpd, bozoprefs_t *prefs)
2234 1.16 mrg {
2235 1.73 mrg return bozo_init_httpd(httpd) && bozo_init_prefs(httpd, prefs);
2236 1.16 mrg }
2237 1.16 mrg
2238 1.16 mrg /* set the virtual host name, port and root */
2239 1.16 mrg int
2240 1.16 mrg bozo_setup(bozohttpd_t *httpd, bozoprefs_t *prefs, const char *vhost,
2241 1.16 mrg const char *root)
2242 1.16 mrg {
2243 1.16 mrg struct passwd *pw;
2244 1.16 mrg extern char **environ;
2245 1.21 mrg static char *cleanenv[1] = { NULL };
2246 1.16 mrg uid_t uid;
2247 1.16 mrg char *chrootdir;
2248 1.16 mrg char *username;
2249 1.16 mrg char *portnum;
2250 1.16 mrg char *cp;
2251 1.16 mrg int dirtyenv;
2252 1.16 mrg
2253 1.16 mrg dirtyenv = 0;
2254 1.16 mrg
2255 1.16 mrg if (vhost == NULL) {
2256 1.16 mrg httpd->virthostname = bozomalloc(httpd, MAXHOSTNAMELEN+1);
2257 1.16 mrg if (gethostname(httpd->virthostname, MAXHOSTNAMELEN+1) < 0)
2258 1.74 mrg bozoerr(httpd, 1, "gethostname");
2259 1.16 mrg httpd->virthostname[MAXHOSTNAMELEN] = '\0';
2260 1.16 mrg } else {
2261 1.73 mrg httpd->virthostname = bozostrdup(httpd, NULL, vhost);
2262 1.16 mrg }
2263 1.73 mrg httpd->slashdir = bozostrdup(httpd, NULL, root);
2264 1.16 mrg if ((portnum = bozo_get_pref(prefs, "port number")) != NULL) {
2265 1.73 mrg httpd->bindport = bozostrdup(httpd, NULL, portnum);
2266 1.16 mrg }
2267 1.16 mrg
2268 1.16 mrg /* go over preferences now */
2269 1.16 mrg if ((cp = bozo_get_pref(prefs, "numeric")) != NULL &&
2270 1.16 mrg strcmp(cp, "true") == 0) {
2271 1.16 mrg httpd->numeric = 1;
2272 1.16 mrg }
2273 1.16 mrg if ((cp = bozo_get_pref(prefs, "log to stderr")) != NULL &&
2274 1.16 mrg strcmp(cp, "true") == 0) {
2275 1.16 mrg httpd->logstderr = 1;
2276 1.16 mrg }
2277 1.16 mrg if ((cp = bozo_get_pref(prefs, "bind address")) != NULL) {
2278 1.73 mrg httpd->bindaddress = bozostrdup(httpd, NULL, cp);
2279 1.16 mrg }
2280 1.16 mrg if ((cp = bozo_get_pref(prefs, "background")) != NULL) {
2281 1.16 mrg httpd->background = atoi(cp);
2282 1.16 mrg }
2283 1.16 mrg if ((cp = bozo_get_pref(prefs, "foreground")) != NULL &&
2284 1.16 mrg strcmp(cp, "true") == 0) {
2285 1.16 mrg httpd->foreground = 1;
2286 1.16 mrg }
2287 1.27 jmmv if ((cp = bozo_get_pref(prefs, "pid file")) != NULL) {
2288 1.73 mrg httpd->pidfile = bozostrdup(httpd, NULL, cp);
2289 1.27 jmmv }
2290 1.16 mrg if ((cp = bozo_get_pref(prefs, "unknown slash")) != NULL &&
2291 1.16 mrg strcmp(cp, "true") == 0) {
2292 1.16 mrg httpd->unknown_slash = 1;
2293 1.16 mrg }
2294 1.16 mrg if ((cp = bozo_get_pref(prefs, "virtual base")) != NULL) {
2295 1.73 mrg httpd->virtbase = bozostrdup(httpd, NULL, cp);
2296 1.16 mrg }
2297 1.16 mrg if ((cp = bozo_get_pref(prefs, "enable users")) != NULL &&
2298 1.16 mrg strcmp(cp, "true") == 0) {
2299 1.16 mrg httpd->enable_users = 1;
2300 1.16 mrg }
2301 1.67 shm if ((cp = bozo_get_pref(prefs, "enable user cgibin")) != NULL &&
2302 1.67 shm strcmp(cp, "true") == 0) {
2303 1.67 shm httpd->enable_cgi_users = 1;
2304 1.67 shm }
2305 1.16 mrg if ((cp = bozo_get_pref(prefs, "dirty environment")) != NULL &&
2306 1.16 mrg strcmp(cp, "true") == 0) {
2307 1.16 mrg dirtyenv = 1;
2308 1.16 mrg }
2309 1.16 mrg if ((cp = bozo_get_pref(prefs, "hide dots")) != NULL &&
2310 1.16 mrg strcmp(cp, "true") == 0) {
2311 1.16 mrg httpd->hide_dots = 1;
2312 1.16 mrg }
2313 1.16 mrg if ((cp = bozo_get_pref(prefs, "directory indexing")) != NULL &&
2314 1.16 mrg strcmp(cp, "true") == 0) {
2315 1.16 mrg httpd->dir_indexing = 1;
2316 1.16 mrg }
2317 1.20 mrg if ((cp = bozo_get_pref(prefs, "public_html")) != NULL) {
2318 1.73 mrg httpd->public_html = bozostrdup(httpd, NULL, cp);
2319 1.20 mrg }
2320 1.16 mrg httpd->server_software =
2321 1.73 mrg bozostrdup(httpd, NULL, bozo_get_pref(prefs, "server software"));
2322 1.72 christos httpd->index_html =
2323 1.73 mrg bozostrdup(httpd, NULL, bozo_get_pref(prefs, "index.html"));
2324 1.16 mrg
2325 1.16 mrg /*
2326 1.16 mrg * initialise ssl and daemon mode if necessary.
2327 1.16 mrg */
2328 1.16 mrg bozo_ssl_init(httpd);
2329 1.16 mrg bozo_daemon_init(httpd);
2330 1.16 mrg
2331 1.75 mrg username = bozo_get_pref(prefs, "username");
2332 1.75 mrg if (username != NULL) {
2333 1.75 mrg if ((pw = getpwnam(username)) == NULL)
2334 1.75 mrg bozoerr(httpd, 1, "getpwnam(%s): %s", username,
2335 1.75 mrg strerror(errno));
2336 1.16 mrg if (initgroups(pw->pw_name, pw->pw_gid) == -1)
2337 1.74 mrg bozoerr(httpd, 1, "initgroups: %s", strerror(errno));
2338 1.16 mrg if (setgid(pw->pw_gid) == -1)
2339 1.74 mrg bozoerr(httpd, 1, "setgid(%u): %s", pw->pw_gid,
2340 1.75 mrg strerror(errno));
2341 1.16 mrg uid = pw->pw_uid;
2342 1.16 mrg }
2343 1.16 mrg /*
2344 1.16 mrg * handle chroot.
2345 1.16 mrg */
2346 1.16 mrg if ((chrootdir = bozo_get_pref(prefs, "chroot dir")) != NULL) {
2347 1.73 mrg httpd->rootdir = bozostrdup(httpd, NULL, chrootdir);
2348 1.16 mrg if (chdir(httpd->rootdir) == -1)
2349 1.74 mrg bozoerr(httpd, 1, "chdir(%s): %s", httpd->rootdir,
2350 1.16 mrg strerror(errno));
2351 1.16 mrg if (chroot(httpd->rootdir) == -1)
2352 1.74 mrg bozoerr(httpd, 1, "chroot(%s): %s", httpd->rootdir,
2353 1.16 mrg strerror(errno));
2354 1.16 mrg }
2355 1.16 mrg
2356 1.75 mrg if (username != NULL && setuid(uid) == -1)
2357 1.75 mrg bozoerr(httpd, 1, "setuid(%d): %s", uid, strerror(errno));
2358 1.16 mrg
2359 1.16 mrg /*
2360 1.16 mrg * prevent info leakage between different compartments.
2361 1.16 mrg * some PATH values in the environment would be invalided
2362 1.16 mrg * by chroot. cross-user settings might result in undesirable
2363 1.16 mrg * effects.
2364 1.16 mrg */
2365 1.21 mrg if ((chrootdir != NULL || username != NULL) && !dirtyenv)
2366 1.16 mrg environ = cleanenv;
2367 1.21 mrg
2368 1.16 mrg #ifdef _SC_PAGESIZE
2369 1.16 mrg httpd->page_size = (long)sysconf(_SC_PAGESIZE);
2370 1.16 mrg #else
2371 1.16 mrg httpd->page_size = 4096;
2372 1.16 mrg #endif
2373 1.16 mrg debug((httpd, DEBUG_OBESE, "myname is %s, slashdir is %s",
2374 1.16 mrg httpd->virthostname, httpd->slashdir));
2375 1.16 mrg
2376 1.16 mrg return 1;
2377 1.16 mrg }
2378