xref: /minix/libexec/httpd/bozohttpd.c (revision 340f5e56)
1 /*	$NetBSD: bozohttpd.c,v 1.66 2015/07/16 12:19:23 shm Exp $	*/
2 
3 /*	$eterna: bozohttpd.c,v 1.178 2011/11/18 09:21:15 mrg Exp $	*/
4 
5 /*
6  * Copyright (c) 1997-2015 Matthew R. Green
7  * All rights reserved.
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer and
16  *    dedication in the documentation and/or other materials provided
17  *    with the distribution.
18  *
19  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
20  * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
21  * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
22  * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
23  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
24  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
25  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
26  * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
27  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29  * SUCH DAMAGE.
30  *
31  */
32 
33 /* this program is dedicated to the Great God of Processed Cheese */
34 
35 /*
36  * bozohttpd.c:  minimal httpd; provides only these features:
37  *	- HTTP/0.9 (by virtue of ..)
38  *	- HTTP/1.0
39  *	- HTTP/1.1
40  *	- CGI/1.1 this will only be provided for "system" scripts
41  *	- automatic "missing trailing slash" redirections
42  *	- configurable translation of /~user/ to ~user/public_html,
43  *	  however, this does not include cgi-bin support
44  *	- access lists via libwrap via inetd/tcpd
45  *	- virtual hosting
46  *	- note that we do not even pretend to understand MIME, but
47  *	  rely only on the HTTP specification
48  *	- ipv6 support
49  *	- automatic `index.html' generation
50  *	- configurable server name
51  *	- directory index generation
52  *	- daemon mode (lacks libwrap support)
53  *	- .htpasswd support
54  */
55 
56 /*
57  * requirements for minimal http/1.1 (at least, as documented in
58  * RFC 2616 (HTTP/1.1)):
59  *
60  *	- 14.11: content-encoding handling. [1]
61  *
62  *	- 14.13: content-length handling.  this is only a SHOULD header
63  *	  thus we could just not send it ever.  [1]
64  *
65  *	- 14.17: content-type handling. [1]
66  *
67  *	- 14.28: if-unmodified-since handling.  if-modified-since is
68  *	  done since, shouldn't be too hard for this one.
69  *
70  * [1] need to revisit to ensure proper behaviour
71  *
72  * and the following is a list of features that we do not need
73  * to have due to other limits, or are too lazy.  there are more
74  * of these than are listed, but these are of particular note,
75  * and could perhaps be implemented.
76  *
77  *	- 3.5/3.6: content/transfer codings.  probably can ignore
78  *	  this?  we "SHOULD"n't.  but 4.4 says we should ignore a
79  *	  `content-length' header upon receipt of a `transfer-encoding'
80  *	  header.
81  *
82  *	- 5.1.1: request methods.  only MUST support GET and HEAD,
83  *	  but there are new ones besides POST that are currently
84  *	  supported: OPTIONS PUT DELETE TRACE and CONNECT, plus
85  *	  extensions not yet known?
86  *
87  * 	- 10.1: we can ignore informational status codes
88  *
89  *	- 10.3.3/10.3.4/10.3.8:  just use '302' codes always.
90  *
91  *	- 14.1/14.2/14.3/14.27: we do not support Accept: headers.
92  *	  just ignore them and send the request anyway.  they are
93  *	  only SHOULD.
94  *
95  *	- 14.5/14.16/14.35: only support simple ranges: %d- and %d-%d
96  *	  would be nice to support more.
97  *
98  *	- 14.9: we aren't a cache.
99  *
100  *	- 14.15: content-md5 would be nice.
101  *
102  *	- 14.24/14.26/14.27: if-match, if-none-match, if-range.  be
103  *	  nice to support this.
104  *
105  *	- 14.44: Vary: seems unneeded.  ignore it for now.
106  */
107 
/*
 * compile-time defaults.  every one of these is only defined when the
 * build has not already supplied its own value.
 */
#if !defined(INDEX_HTML)
#define INDEX_HTML		"index.html"
#endif

#if !defined(SERVER_SOFTWARE)
#define SERVER_SOFTWARE		"bozohttpd/20150501"
#endif

#if !defined(DIRECT_ACCESS_FILE)
#define DIRECT_ACCESS_FILE	".bzdirect"
#endif

#if !defined(REDIRECT_FILE)
#define REDIRECT_FILE		".bzredirect"
#endif

#if !defined(ABSREDIRECT_FILE)
#define ABSREDIRECT_FILE	".bzabsredirect"
#endif

#if !defined(PUBLIC_HTML)
#define PUBLIC_HTML		"public_html"
#endif

/*
 * reference an argument (by taking its address and discarding it) so
 * that it counts as used.
 */
#if !defined(USE_ARG)
#define USE_ARG(x)	/*LINTED*/(void)&(x)
#endif
130 
131 /*
132  * And so it begins ..
133  */
134 
135 #include <sys/param.h>
136 #include <sys/socket.h>
137 #include <sys/time.h>
138 #include <sys/mman.h>
139 
140 #include <arpa/inet.h>
141 
142 #include <ctype.h>
143 #include <dirent.h>
144 #include <errno.h>
145 #include <fcntl.h>
146 #include <netdb.h>
147 #include <pwd.h>
148 #include <grp.h>
149 #include <signal.h>
150 #include <stdarg.h>
151 #include <stdlib.h>
152 #include <string.h>
153 #include <syslog.h>
154 #include <time.h>
155 #include <unistd.h>
156 
157 #include "bozohttpd.h"
158 
/* seconds handed to alarm() while waiting for each line of a request */
#if !defined(MAX_WAIT_TIME)
#define	MAX_WAIT_TIME	60	/* hang around for 60 seconds max */
#endif

/* variables and functions */

/* use LOG_DAEMON when <syslog.h> does not provide LOG_FTP */
#if !defined(LOG_FTP)
#define LOG_FTP LOG_DAEMON
#endif

/* set to 1 by the SIGALRM handler, checked while reading a request */
volatile sig_atomic_t	alarmhit;
169 
170 /*
171  * check there's enough space in the prefs and names arrays.
172  */
173 static int
size_arrays(bozoprefs_t * bozoprefs,unsigned needed)174 size_arrays(bozoprefs_t *bozoprefs, unsigned needed)
175 {
176 	char	**temp;
177 
178 	if (bozoprefs->size == 0) {
179 		/* only get here first time around */
180 		bozoprefs->size = needed;
181 		if ((bozoprefs->name = calloc(sizeof(char *), needed)) == NULL) {
182 			(void) fprintf(stderr, "size_arrays: bad alloc\n");
183 			return 0;
184 		}
185 		if ((bozoprefs->value = calloc(sizeof(char *), needed)) == NULL) {
186 			free(bozoprefs->name);
187 			(void) fprintf(stderr, "size_arrays: bad alloc\n");
188 			return 0;
189 		}
190 	} else if (bozoprefs->c == bozoprefs->size) {
191 		/* only uses 'needed' when filled array */
192 		bozoprefs->size += needed;
193 		temp = realloc(bozoprefs->name, sizeof(char *) * needed);
194 		if (temp == NULL) {
195 			(void) fprintf(stderr, "size_arrays: bad alloc\n");
196 			return 0;
197 		}
198 		bozoprefs->name = temp;
199 		temp = realloc(bozoprefs->value, sizeof(char *) * needed);
200 		if (temp == NULL) {
201 			(void) fprintf(stderr, "size_arrays: bad alloc\n");
202 			return 0;
203 		}
204 		bozoprefs->value = temp;
205 	}
206 	return 1;
207 }
208 
209 static int
findvar(bozoprefs_t * bozoprefs,const char * name)210 findvar(bozoprefs_t *bozoprefs, const char *name)
211 {
212 	unsigned	i;
213 
214 	for (i = 0 ; i < bozoprefs->c && strcmp(bozoprefs->name[i], name) != 0; i++)
215 		;
216 	return (i == bozoprefs->c) ? -1 : (int)i;
217 }
218 
219 int
bozo_set_pref(bozoprefs_t * bozoprefs,const char * name,const char * value)220 bozo_set_pref(bozoprefs_t *bozoprefs, const char *name, const char *value)
221 {
222 	int	i;
223 
224 	if ((i = findvar(bozoprefs, name)) < 0) {
225 		/* add the element to the array */
226 		if (size_arrays(bozoprefs, bozoprefs->size + 15)) {
227 			bozoprefs->name[i = bozoprefs->c++] = strdup(name);
228 		}
229 	} else {
230 		/* replace the element in the array */
231 		if (bozoprefs->value[i]) {
232 			free(bozoprefs->value[i]);
233 			bozoprefs->value[i] = NULL;
234 		}
235 	}
236 	/* sanity checks for range of values go here */
237 	bozoprefs->value[i] = strdup(value);
238 	return 1;
239 }
240 
241 /*
242  * get a variable's value, or NULL
243  */
244 char *
bozo_get_pref(bozoprefs_t * bozoprefs,const char * name)245 bozo_get_pref(bozoprefs_t *bozoprefs, const char *name)
246 {
247 	int	i;
248 
249 	return ((i = findvar(bozoprefs, name)) < 0) ? NULL :
250 			bozoprefs->value[i];
251 }
252 
/*
 * format the current time as a HTTP date (always GMT) into the
 * caller's buffer `date' of `datelen' bytes, and return `date'.
 *
 * if the time cannot be converted, or the text does not fit, the
 * buffer is set to the empty string rather than being left with
 * indeterminate contents.
 */
char *
bozo_http_date(char *date, size_t datelen)
{
	struct	tm *tm;
	time_t	now;

	/* Sun, 06 Nov 1994 08:49:37 GMT */
	now = time(NULL);
	tm = gmtime(&now);	/* HTTP/1.1 spec rev 06 sez GMT only */
	if (tm == NULL ||
	    strftime(date, datelen, "%a, %d %b %Y %H:%M:%S GMT", tm) == 0) {
		/* strftime() returning 0 leaves the array unspecified */
		if (datelen > 0)
			date[0] = '\0';
	}
	return date;
}
265 
266 /*
267  * convert "in" into the three parts of a request (first line).
268  * we allocate into file and query, but return pointers into
269  * "in" for proto and method.
270  */
271 static void
parse_request(bozohttpd_t * httpd,char * in,char ** method,char ** file,char ** query,char ** proto)272 parse_request(bozohttpd_t *httpd, char *in, char **method, char **file,
273 		char **query, char **proto)
274 {
275 	ssize_t	len;
276 	char	*val;
277 
278 	USE_ARG(httpd);
279 	debug((httpd, DEBUG_EXPLODING, "parse in: %s", in));
280 	*method = *file = *query = *proto = NULL;
281 
282 	len = (ssize_t)strlen(in);
283 	val = bozostrnsep(&in, " \t\n\r", &len);
284 	if (len < 1 || val == NULL)
285 		return;
286 	*method = val;
287 
288 	while (*in == ' ' || *in == '\t')
289 		in++;
290 	val = bozostrnsep(&in, " \t\n\r", &len);
291 	if (len < 1) {
292 		if (len == 0)
293 			*file = val;
294 		else
295 			*file = in;
296 	} else {
297 		*file = val;
298 
299 		*query = strchr(*file, '?');
300 		if (*query)
301 			*(*query)++ = '\0';
302 
303 		if (in) {
304 			while (*in && (*in == ' ' || *in == '\t'))
305 				in++;
306 			if (*in)
307 				*proto = in;
308 		}
309 	}
310 
311 	/* allocate private copies */
312 	*file = bozostrdup(httpd, *file);
313 	if (*query)
314 		*query = bozostrdup(httpd, *query);
315 
316 	debug((httpd, DEBUG_FAT,
317 		"url: method: \"%s\" file: \"%s\" query: \"%s\" proto: \"%s\"",
318 		*method, *file, *query, *proto));
319 }
320 
321 /*
322  * cleanup a bozo_httpreq_t after use
323  */
324 void
bozo_clean_request(bozo_httpreq_t * request)325 bozo_clean_request(bozo_httpreq_t *request)
326 {
327 	struct bozoheaders *hdr, *ohdr = NULL;
328 
329 	if (request == NULL)
330 		return;
331 
332 	/* If SSL enabled cleanup SSL structure. */
333 	bozo_ssl_destroy(request->hr_httpd);
334 
335 	/* clean up request */
336 	free(request->hr_remotehost);
337 	free(request->hr_remoteaddr);
338 	free(request->hr_serverport);
339 	free(request->hr_virthostname);
340 	free(request->hr_file);
341 	free(request->hr_oldfile);
342 	free(request->hr_query);
343 	free(request->hr_host);
344 	bozo_auth_cleanup(request);
345 	for (hdr = SIMPLEQ_FIRST(&request->hr_headers); hdr;
346 	    hdr = SIMPLEQ_NEXT(hdr, h_next)) {
347 		free(hdr->h_value);
348 		free(hdr->h_header);
349 		free(ohdr);
350 		ohdr = hdr;
351 	}
352 	free(ohdr);
353 
354 	free(request);
355 }
356 
357 /*
358  * send a HTTP/1.1 408 response if we timeout.
359  */
360 /* ARGSUSED */
361 static void
alarmer(int sig)362 alarmer(int sig)
363 {
364 	alarmhit = 1;
365 }
366 
367 /*
368  * add or merge this header (val: str) into the requests list
369  */
370 static bozoheaders_t *
addmerge_header(bozo_httpreq_t * request,char * val,char * str,ssize_t len)371 addmerge_header(bozo_httpreq_t *request, char *val,
372 		char *str, ssize_t len)
373 {
374 	struct	bozoheaders *hdr;
375 
376 	USE_ARG(len);
377 	/* do we exist already? */
378 	SIMPLEQ_FOREACH(hdr, &request->hr_headers, h_next) {
379 		if (strcasecmp(val, hdr->h_header) == 0)
380 			break;
381 	}
382 
383 	if (hdr) {
384 		/* yup, merge it in */
385 		char *nval;
386 
387 		if (asprintf(&nval, "%s, %s", hdr->h_value, str) == -1) {
388 			(void)bozo_http_error(request->hr_httpd, 500, NULL,
389 			     "memory allocation failure");
390 			return NULL;
391 		}
392 		free(hdr->h_value);
393 		hdr->h_value = nval;
394 	} else {
395 		/* nope, create a new one */
396 
397 		hdr = bozomalloc(request->hr_httpd, sizeof *hdr);
398 		hdr->h_header = bozostrdup(request->hr_httpd, val);
399 		if (str && *str)
400 			hdr->h_value = bozostrdup(request->hr_httpd, str);
401 		else
402 			hdr->h_value = bozostrdup(request->hr_httpd, " ");
403 
404 		SIMPLEQ_INSERT_TAIL(&request->hr_headers, hdr, h_next);
405 		request->hr_nheaders++;
406 	}
407 
408 	return hdr;
409 }
410 
411 /*
412  * as the prototype string is not constant (eg, "HTTP/1.1" is equivalent
413  * to "HTTP/001.01"), we MUST parse this.
414  */
415 static int
process_proto(bozo_httpreq_t * request,const char * proto)416 process_proto(bozo_httpreq_t *request, const char *proto)
417 {
418 	char	majorstr[16], *minorstr;
419 	int	majorint, minorint;
420 
421 	if (proto == NULL) {
422 got_proto_09:
423 		request->hr_proto = request->hr_httpd->consts.http_09;
424 		debug((request->hr_httpd, DEBUG_FAT, "request %s is http/0.9",
425 			request->hr_file));
426 		return 0;
427 	}
428 
429 	if (strncasecmp(proto, "HTTP/", 5) != 0)
430 		goto bad;
431 	strncpy(majorstr, proto + 5, sizeof majorstr);
432 	majorstr[sizeof(majorstr)-1] = 0;
433 	minorstr = strchr(majorstr, '.');
434 	if (minorstr == NULL)
435 		goto bad;
436 	*minorstr++ = 0;
437 
438 	majorint = atoi(majorstr);
439 	minorint = atoi(minorstr);
440 
441 	switch (majorint) {
442 	case 0:
443 		if (minorint != 9)
444 			break;
445 		goto got_proto_09;
446 	case 1:
447 		if (minorint == 0)
448 			request->hr_proto = request->hr_httpd->consts.http_10;
449 		else if (minorint == 1)
450 			request->hr_proto = request->hr_httpd->consts.http_11;
451 		else
452 			break;
453 
454 		debug((request->hr_httpd, DEBUG_FAT, "request %s is %s",
455 		    request->hr_file, request->hr_proto));
456 		SIMPLEQ_INIT(&request->hr_headers);
457 		request->hr_nheaders = 0;
458 		return 0;
459 	}
460 bad:
461 	return bozo_http_error(request->hr_httpd, 404, NULL, "unknown prototype");
462 }
463 
464 /*
465  * process each type of HTTP method, setting this HTTP requests
466  # method type.
467  */
468 static struct method_map {
469 	const char *name;
470 	int	type;
471 } method_map[] = {
472 	{ "GET", 	HTTP_GET, },
473 	{ "POST",	HTTP_POST, },
474 	{ "HEAD",	HTTP_HEAD, },
475 #if 0	/* other non-required http/1.1 methods */
476 	{ "OPTIONS",	HTTP_OPTIONS, },
477 	{ "PUT",	HTTP_PUT, },
478 	{ "DELETE",	HTTP_DELETE, },
479 	{ "TRACE",	HTTP_TRACE, },
480 	{ "CONNECT",	HTTP_CONNECT, },
481 #endif
482 	{ NULL,		0, },
483 };
484 
485 static int
process_method(bozo_httpreq_t * request,const char * method)486 process_method(bozo_httpreq_t *request, const char *method)
487 {
488 	struct	method_map *mmp;
489 
490 	if (request->hr_proto == request->hr_httpd->consts.http_11)
491 		request->hr_allow = "GET, HEAD, POST";
492 
493 	for (mmp = method_map; mmp->name; mmp++)
494 		if (strcasecmp(method, mmp->name) == 0) {
495 			request->hr_method = mmp->type;
496 			request->hr_methodstr = mmp->name;
497 			return 0;
498 		}
499 
500 	return bozo_http_error(request->hr_httpd, 404, request, "unknown method");
501 }
502 
503 /*
504  * This function reads a http request from stdin, returning a pointer to a
505  * bozo_httpreq_t structure, describing the request.
506  */
507 bozo_httpreq_t *
bozo_read_request(bozohttpd_t * httpd)508 bozo_read_request(bozohttpd_t *httpd)
509 {
510 	struct	sigaction	sa;
511 	char	*str, *val, *method, *file, *proto, *query;
512 	char	*host, *addr, *port;
513 	char	bufport[10];
514 	char	hbuf[NI_MAXHOST], abuf[NI_MAXHOST];
515 	struct	sockaddr_storage ss;
516 	ssize_t	len;
517 	int	line = 0;
518 	socklen_t slen;
519 	bozo_httpreq_t *request;
520 
521 	/*
522 	 * if we're in daemon mode, bozo_daemon_fork() will return here twice
523 	 * for each call.  once in the child, returning 0, and once in the
524 	 * parent, returning 1.  for each child, then we can setup SSL, and
525 	 * the parent can signal the caller there was no request to process
526 	 * and it will wait for another.
527 	 */
528 	if (bozo_daemon_fork(httpd))
529 		return NULL;
530 	if (bozo_ssl_accept(httpd))
531 		return NULL;
532 
533 	request = bozomalloc(httpd, sizeof(*request));
534 	memset(request, 0, sizeof(*request));
535 	request->hr_httpd = httpd;
536 	request->hr_allow = request->hr_host = NULL;
537 	request->hr_content_type = request->hr_content_length = NULL;
538 	request->hr_range = NULL;
539 	request->hr_last_byte_pos = -1;
540 	request->hr_if_modified_since = NULL;
541 	request->hr_virthostname = NULL;
542 	request->hr_file = NULL;
543 	request->hr_oldfile = NULL;
544 	bozo_auth_init(request);
545 
546 	slen = sizeof(ss);
547 	if (getpeername(0, (struct sockaddr *)(void *)&ss, &slen) < 0)
548 		host = addr = NULL;
549 	else {
550 		if (getnameinfo((struct sockaddr *)(void *)&ss, slen,
551 		    abuf, sizeof abuf, NULL, 0, NI_NUMERICHOST) == 0)
552 			addr = abuf;
553 		else
554 			addr = NULL;
555 		if (httpd->numeric == 0 &&
556 		    getnameinfo((struct sockaddr *)(void *)&ss, slen,
557 				hbuf, sizeof hbuf, NULL, 0, 0) == 0)
558 			host = hbuf;
559 		else
560 			host = NULL;
561 	}
562 	if (host != NULL)
563 		request->hr_remotehost = bozostrdup(request->hr_httpd, host);
564 	if (addr != NULL)
565 		request->hr_remoteaddr = bozostrdup(request->hr_httpd, addr);
566 	slen = sizeof(ss);
567 
568 	/*
569 	 * Override the bound port from the request value, so it works even
570 	 * if passed through a proxy that doesn't rewrite the port.
571 	 */
572 	if (httpd->bindport) {
573 		if (strcmp(httpd->bindport, "80") != 0)
574 			port = httpd->bindport;
575 		else
576 			port = NULL;
577 	} else {
578 		if (getsockname(0, (struct sockaddr *)(void *)&ss, &slen) < 0)
579 			port = NULL;
580 		else {
581 			if (getnameinfo((struct sockaddr *)(void *)&ss, slen, NULL, 0,
582 					bufport, sizeof bufport, NI_NUMERICSERV) == 0)
583 				port = bufport;
584 			else
585 				port = NULL;
586 		}
587 	}
588 	if (port != NULL)
589 		request->hr_serverport = bozostrdup(request->hr_httpd, port);
590 
591 	/*
592 	 * setup a timer to make sure the request is not hung
593 	 */
594 	sa.sa_handler = alarmer;
595 	sigemptyset(&sa.sa_mask);
596 	sigaddset(&sa.sa_mask, SIGALRM);
597 	sa.sa_flags = 0;
598 	sigaction(SIGALRM, &sa, NULL);	/* XXX */
599 
600 	alarm(MAX_WAIT_TIME);
601 	while ((str = bozodgetln(httpd, STDIN_FILENO, &len, bozo_read)) != NULL) {
602 		alarm(0);
603 		if (alarmhit) {
604 			(void)bozo_http_error(httpd, 408, NULL,
605 					"request timed out");
606 			goto cleanup;
607 		}
608 		line++;
609 
610 		if (line == 1) {
611 
612 			if (len < 1) {
613 				(void)bozo_http_error(httpd, 404, NULL,
614 						"null method");
615 				goto cleanup;
616 			}
617 
618 			bozo_warn(httpd, "got request ``%s'' from host %s to port %s",
619 				str,
620 				host ? host : addr ? addr : "<local>",
621 				port ? port : "<stdin>");
622 
623 			/* we allocate return space in file and query only */
624 			parse_request(httpd, str, &method, &file, &query, &proto);
625 			request->hr_file = file;
626 			request->hr_query = query;
627 			if (method == NULL) {
628 				(void)bozo_http_error(httpd, 404, NULL,
629 						"null method");
630 				goto cleanup;
631 			}
632 			if (file == NULL) {
633 				(void)bozo_http_error(httpd, 404, NULL,
634 						"null file");
635 				goto cleanup;
636 			}
637 
638 			/*
639 			 * note that we parse the proto first, so that we
640 			 * can more properly parse the method and the url.
641 			 */
642 
643 			if (process_proto(request, proto) ||
644 			    process_method(request, method)) {
645 				goto cleanup;
646 			}
647 
648 			debug((httpd, DEBUG_FAT, "got file \"%s\" query \"%s\"",
649 			    request->hr_file,
650 			    request->hr_query ? request->hr_query : "<none>"));
651 
652 			/* http/0.9 has no header processing */
653 			if (request->hr_proto == httpd->consts.http_09)
654 				break;
655 		} else {		/* incoming headers */
656 			bozoheaders_t *hdr;
657 
658 			if (*str == '\0')
659 				break;
660 
661 			val = bozostrnsep(&str, ":", &len);
662 			debug((httpd, DEBUG_EXPLODING,
663 			    "read_req2: after bozostrnsep: str ``%s'' val ``%s''",
664 			    str, val));
665 			if (val == NULL || len == -1) {
666 				(void)bozo_http_error(httpd, 404, request,
667 						"no header");
668 				goto cleanup;
669 			}
670 			while (*str == ' ' || *str == '\t')
671 				len--, str++;
672 			while (*val == ' ' || *val == '\t')
673 				val++;
674 
675 			if (bozo_auth_check_headers(request, val, str, len))
676 				goto next_header;
677 
678 			hdr = addmerge_header(request, val, str, len);
679 
680 			if (strcasecmp(hdr->h_header, "content-type") == 0)
681 				request->hr_content_type = hdr->h_value;
682 			else if (strcasecmp(hdr->h_header, "content-length") == 0)
683 				request->hr_content_length = hdr->h_value;
684 			else if (strcasecmp(hdr->h_header, "host") == 0)
685 				request->hr_host = bozostrdup(httpd, hdr->h_value);
686 			/* RFC 2616 (HTTP/1.1): 14.20 */
687 			else if (strcasecmp(hdr->h_header, "expect") == 0) {
688 				(void)bozo_http_error(httpd, 417, request,
689 						"we don't support Expect:");
690 				goto cleanup;
691 			}
692 			else if (strcasecmp(hdr->h_header, "referrer") == 0 ||
693 			         strcasecmp(hdr->h_header, "referer") == 0)
694 				request->hr_referrer = hdr->h_value;
695 			else if (strcasecmp(hdr->h_header, "range") == 0)
696 				request->hr_range = hdr->h_value;
697 			else if (strcasecmp(hdr->h_header,
698 					"if-modified-since") == 0)
699 				request->hr_if_modified_since = hdr->h_value;
700 			else if (strcasecmp(hdr->h_header,
701 					"accept-encoding") == 0)
702 				request->hr_accept_encoding = hdr->h_value;
703 
704 			debug((httpd, DEBUG_FAT, "adding header %s: %s",
705 			    hdr->h_header, hdr->h_value));
706 		}
707 next_header:
708 		alarm(MAX_WAIT_TIME);
709 	}
710 
711 	/* now, clear it all out */
712 	alarm(0);
713 	signal(SIGALRM, SIG_DFL);
714 
715 	/* RFC1945, 8.3 */
716 	if (request->hr_method == HTTP_POST &&
717 	    request->hr_content_length == NULL) {
718 		(void)bozo_http_error(httpd, 400, request,
719 				"missing content length");
720 		goto cleanup;
721 	}
722 
723 	/* RFC 2616 (HTTP/1.1), 14.23 & 19.6.1.1 */
724 	if (request->hr_proto == httpd->consts.http_11 &&
725 	    /*(strncasecmp(request->hr_file, "http://", 7) != 0) &&*/
726 	    request->hr_host == NULL) {
727 		(void)bozo_http_error(httpd, 400, request,
728 				"missing Host header");
729 		goto cleanup;
730 	}
731 
732 	if (request->hr_range != NULL) {
733 		debug((httpd, DEBUG_FAT, "hr_range: %s", request->hr_range));
734 		/* support only simple ranges %d- and %d-%d */
735 		if (strchr(request->hr_range, ',') == NULL) {
736 			const char *rstart, *dash;
737 
738 			rstart = strchr(request->hr_range, '=');
739 			if (rstart != NULL) {
740 				rstart++;
741 				dash = strchr(rstart, '-');
742 				if (dash != NULL && dash != rstart) {
743 					dash++;
744 					request->hr_have_range = 1;
745 					request->hr_first_byte_pos =
746 					    strtoll(rstart, NULL, 10);
747 					if (request->hr_first_byte_pos < 0)
748 						request->hr_first_byte_pos = 0;
749 					if (*dash != '\0') {
750 						request->hr_last_byte_pos =
751 						    strtoll(dash, NULL, 10);
752 						if (request->hr_last_byte_pos < 0)
753 							request->hr_last_byte_pos = -1;
754 					}
755 				}
756 			}
757 		}
758 	}
759 
760 	debug((httpd, DEBUG_FAT, "bozo_read_request returns url %s in request",
761 	       request->hr_file));
762 	return request;
763 
764 cleanup:
765 	bozo_clean_request(request);
766 
767 	return NULL;
768 }
769 
770 static int
mmap_and_write_part(bozohttpd_t * httpd,int fd,off_t first_byte_pos,size_t sz)771 mmap_and_write_part(bozohttpd_t *httpd, int fd, off_t first_byte_pos, size_t sz)
772 {
773 	size_t mappedsz, wroffset;
774 	off_t mappedoffset;
775 	char *addr;
776 	void *mappedaddr;
777 
778 	/*
779 	 * we need to ensure that both the size *and* offset arguments to
780 	 * mmap() are page-aligned.  our formala for this is:
781 	 *
782 	 *    input offset: first_byte_pos
783 	 *    input size: sz
784 	 *
785 	 *    mapped offset = page align truncate (input offset)
786 	 *    mapped size   =
787 	 *        page align extend (input offset - mapped offset + input size)
788 	 *    write offset  = input offset - mapped offset
789 	 *
790 	 * we use the write offset in all writes
791 	 */
792 	mappedoffset = first_byte_pos & ~(httpd->page_size - 1);
793 	mappedsz = (size_t)
794 		(first_byte_pos - mappedoffset + sz + httpd->page_size - 1) &
795 		~(httpd->page_size - 1);
796 	wroffset = (size_t)(first_byte_pos - mappedoffset);
797 
798 	addr = mmap(0, mappedsz, PROT_READ, MAP_SHARED, fd, mappedoffset);
799 	if (addr == (char *)-1) {
800 		bozo_warn(httpd, "mmap failed: %s", strerror(errno));
801 		return -1;
802 	}
803 	mappedaddr = addr;
804 
805 #ifdef MADV_SEQUENTIAL
806 #ifndef __minix
807 	(void)madvise(addr, sz, MADV_SEQUENTIAL);
808 #endif /* !__minix */
809 #endif
810 	while (sz > BOZO_WRSZ) {
811 		if (bozo_write(httpd, STDOUT_FILENO, addr + wroffset,
812 				BOZO_WRSZ) != BOZO_WRSZ) {
813 			bozo_warn(httpd, "write failed: %s", strerror(errno));
814 			goto out;
815 		}
816 		debug((httpd, DEBUG_OBESE, "wrote %d bytes", BOZO_WRSZ));
817 		sz -= BOZO_WRSZ;
818 		addr += BOZO_WRSZ;
819 	}
820 	if (sz && (size_t)bozo_write(httpd, STDOUT_FILENO, addr + wroffset,
821 				sz) != sz) {
822 		bozo_warn(httpd, "final write failed: %s", strerror(errno));
823 		goto out;
824 	}
825 	debug((httpd, DEBUG_OBESE, "wrote %d bytes", (int)sz));
826  out:
827 	if (munmap(mappedaddr, mappedsz) < 0) {
828 		bozo_warn(httpd, "munmap failed");
829 		return -1;
830 	}
831 
832 	return 0;
833 }
834 
/*
 * convert the HTTP date in `val' to a time_t, stored in `*timestamp'.
 * the three layouts tried are, in order:
 *
 *	Sun, 06 Nov 1994 08:49:37 GMT
 *	Sun, 06-Nov-94 08:49:37 GMT
 *	Sun Nov  6 08:49:37 1994
 *
 * returns 1 on success, and 0 (leaving `*timestamp' alone) when no
 * layout matches or when text is left over after the first layout that
 * does.
 */
static int
parse_http_date(const char *val, time_t *timestamp)
{
	static const char *const formats[] = {
		"%a, %d %b %Y %T GMT",
		"%a, %d-%b-%y %T GMT",
		"%a %b %d %T %Y",
	};
	size_t	i;

	for (i = 0; i < sizeof(formats) / sizeof(formats[0]); i++) {
		const char *remainder;
		struct tm tm;

		/*
		 * strptime() only stores the fields it converts, so start
		 * every attempt from a clean struct: timegm() must not see
		 * uninitialised members or leftovers of a failed attempt.
		 */
		memset(&tm, 0, sizeof(tm));
		remainder = strptime(val, formats[i], &tm);
		if (remainder == NULL)
			continue;	/* Invalid for this format */

		if (*remainder)
			return 0; /* No trailing garbage */

		*timestamp = timegm(&tm);
		return 1;
	}

	return 0; /* Invalid HTTP date format */
}
852 
853 /*
854  * given an url, encode it ala rfc 3986.  ie, escape ? and friends.
855  * note that this function returns a static buffer, and thus needs
856  * to be updated for any sort of parallel processing.
857  */
858 char *
bozo_escape_rfc3986(bozohttpd_t * httpd,const char * url)859 bozo_escape_rfc3986(bozohttpd_t *httpd, const char *url)
860 {
861 	static char *buf;
862 	static size_t buflen = 0;
863 	size_t len;
864 	const char *s;
865 	char *d;
866 
867 	len = strlen(url);
868 	if (buflen < len * 3 + 1) {
869 		buflen = len * 3 + 1;
870 		buf = bozorealloc(httpd, buf, buflen);
871 	}
872 
873 	if (url == NULL) {
874 		buf[0] = 0;
875 		return buf;
876 	}
877 
878 	for (len = 0, s = url, d = buf; *s;) {
879 		if (*s & 0x80)
880 			goto encode_it;
881 		switch (*s) {
882 		case ':':
883 		case '?':
884 		case '#':
885 		case '[':
886 		case ']':
887 		case '@':
888 		case '!':
889 		case '$':
890 		case '&':
891 		case '\'':
892 		case '(':
893 		case ')':
894 		case '*':
895 		case '+':
896 		case ',':
897 		case ';':
898 		case '=':
899 		case '%':
900 		case '\n':
901 		case '\r':
902 		case ' ':
903 		case '"':
904 		encode_it:
905 			snprintf(d, 4, "%%%02X", *s++);
906 			d += 3;
907 			len += 3;
908 			break;
909 		default:
910 			*d++ = *s++;
911 			len++;
912 			break;
913 		}
914 	}
915 	buf[len] = 0;
916 
917 	return buf;
918 }
919 
920 /*
921  * checks to see if this request has a valid .bzdirect file.  returns
922  * 0 on failure and 1 on success.
923  */
924 static int
check_direct_access(bozo_httpreq_t * request)925 check_direct_access(bozo_httpreq_t *request)
926 {
927 	FILE *fp;
928 	struct stat sb;
929 	char dir[MAXPATHLEN], dirfile[MAXPATHLEN], *basename;
930 
931 	snprintf(dir, sizeof(dir), "%s", request->hr_file + 1);
932 	debug((request->hr_httpd, DEBUG_FAT, "check_direct_access: dir %s", dir));
933 	basename = strrchr(dir, '/');
934 
935 	if ((!basename || basename[1] != '\0') &&
936 	    lstat(dir, &sb) == 0 && S_ISDIR(sb.st_mode))
937 		/* nothing */;
938 	else if (basename == NULL)
939 		strcpy(dir, ".");
940 	else {
941 		*basename++ = '\0';
942 		bozo_check_special_files(request, basename);
943 	}
944 
945 	if ((size_t)snprintf(dirfile, sizeof(dirfile), "%s/%s", dir,
946 	  DIRECT_ACCESS_FILE) >= sizeof(dirfile)) {
947 		bozo_http_error(request->hr_httpd, 404, request,
948 		  "directfile path too long");
949 		return 0;
950 	}
951 	if (stat(dirfile, &sb) < 0 ||
952 	    (fp = fopen(dirfile, "r")) == NULL)
953 		return 0;
954 	fclose(fp);
955 	return 1;
956 }
957 
958 /*
959  * do automatic redirection -- if there are query parameters for the URL
960  * we will tack these on to the new (redirected) URL.
961  */
962 static void
handle_redirect(bozo_httpreq_t * request,const char * url,int absolute)963 handle_redirect(bozo_httpreq_t *request,
964 		const char *url, int absolute)
965 {
966 	bozohttpd_t *httpd = request->hr_httpd;
967 	char *urlbuf;
968 	char portbuf[20];
969 	const char *hostname = BOZOHOST(httpd, request);
970 	int query = 0;
971 
972 	if (url == NULL) {
973 		if (asprintf(&urlbuf, "/%s/", request->hr_file) < 0)
974 			bozo_err(httpd, 1, "asprintf");
975 		url = urlbuf;
976 	} else
977 		urlbuf = NULL;
978 	url = bozo_escape_rfc3986(request->hr_httpd, url);
979 
980 	if (request->hr_query && strlen(request->hr_query))
981 		query = 1;
982 
983 	if (request->hr_serverport && strcmp(request->hr_serverport, "80") != 0)
984 		snprintf(portbuf, sizeof(portbuf), ":%s",
985 		    request->hr_serverport);
986 	else
987 		portbuf[0] = '\0';
988 	if (absolute)
989 		bozo_warn(httpd, "redirecting %s", url);
990 	else
991 		bozo_warn(httpd, "redirecting %s%s%s", hostname, portbuf, url);
992 	debug((httpd, DEBUG_FAT, "redirecting %s", url));
993 	bozo_printf(httpd, "%s 301 Document Moved\r\n", request->hr_proto);
994 	if (request->hr_proto != httpd->consts.http_09)
995 		bozo_print_header(request, NULL, "text/html", NULL);
996 	if (request->hr_proto != httpd->consts.http_09) {
997 		bozo_printf(httpd, "Location: http://");
998 		if (absolute == 0)
999 			bozo_printf(httpd, "%s%s", hostname, portbuf);
1000 		if (query) {
1001 			bozo_printf(httpd, "%s?%s\r\n", url, request->hr_query);
1002 		} else {
1003 			bozo_printf(httpd, "%s\r\n", url);
1004 		}
1005 	}
1006 	bozo_printf(httpd, "\r\n");
1007 	if (request->hr_method == HTTP_HEAD)
1008 		goto head;
1009 	bozo_printf(httpd, "<html><head><title>Document Moved</title></head>\n");
1010 	bozo_printf(httpd, "<body><h1>Document Moved</h1>\n");
1011 	bozo_printf(httpd, "This document had moved <a href=\"http://");
1012 	if (query) {
1013 		if (absolute)
1014 			bozo_printf(httpd, "%s?%s", url, request->hr_query);
1015 		else
1016 			bozo_printf(httpd, "%s%s%s?%s", hostname,
1017 				    portbuf, url, request->hr_query);
1018 	} else {
1019 		if (absolute)
1020 			bozo_printf(httpd, "%s", url);
1021 		else
1022 			bozo_printf(httpd, "%s%s%s", hostname,
1023 				    portbuf, url);
1024 	}
1025 	bozo_printf(httpd, "\">here</a>\n");
1026 	bozo_printf(httpd, "</body></html>\n");
1027 head:
1028 	bozo_flush(httpd, stdout);
1029 	free(urlbuf);
1030 }
1031 
1032 /*
1033  * deal with virtual host names; we do this:
1034  *	if we have a virtual path root (httpd->virtbase), and we are given a
1035  *	virtual host spec (Host: ho.st or http://ho.st/), see if this
1036  *	directory exists under httpd->virtbase.  if it does, use this as the
1037  *	new slashdir.
1038  */
1039 static int
check_virtual(bozo_httpreq_t * request)1040 check_virtual(bozo_httpreq_t *request)
1041 {
1042 	bozohttpd_t *httpd = request->hr_httpd;
1043 	char *file = request->hr_file, *s;
1044 	size_t len;
1045 
1046 	if (!httpd->virtbase)
1047 		goto use_slashdir;
1048 
1049 	/*
1050 	 * convert http://virtual.host/ to request->hr_host
1051 	 */
1052 	debug((httpd, DEBUG_OBESE, "checking for http:// virtual host in ``%s''",
1053 			file));
1054 	if (strncasecmp(file, "http://", 7) == 0) {
1055 		/* we would do virtual hosting here? */
1056 		file += 7;
1057 		/* RFC 2616 (HTTP/1.1), 5.2: URI takes precedence over Host: */
1058 		free(request->hr_host);
1059 		request->hr_host = bozostrdup(request->hr_httpd, file);
1060 		if ((s = strchr(request->hr_host, '/')) != NULL)
1061 			*s = '\0';
1062 		s = strchr(file, '/');
1063 		free(request->hr_file);
1064 		request->hr_file = bozostrdup(request->hr_httpd, s ? s : "/");
1065 		debug((httpd, DEBUG_OBESE, "got host ``%s'' file is now ``%s''",
1066 		    request->hr_host, request->hr_file));
1067 	} else if (!request->hr_host)
1068 		goto use_slashdir;
1069 
1070 	/*
1071 	 * canonicalise hr_host - that is, remove any :80.
1072 	 */
1073 	len = strlen(request->hr_host);
1074 	if (len > 3 && strcmp(request->hr_host + len - 3, ":80") == 0) {
1075 		request->hr_host[len - 3] = '\0';
1076 		len = strlen(request->hr_host);
1077 	}
1078 
1079 	/*
1080 	 * ok, we have a virtual host, use opendir(3) to find a case
1081 	 * insensitive match for the virtual host we are asked for.
1082 	 * note that if the virtual host is the same as the master,
1083 	 * we don't need to do anything special.
1084 	 */
1085 	debug((httpd, DEBUG_OBESE,
1086 	    "check_virtual: checking host `%s' under httpd->virtbase `%s' "
1087 	    "for file `%s'",
1088 	    request->hr_host, httpd->virtbase, request->hr_file));
1089 	if (strncasecmp(httpd->virthostname, request->hr_host, len) != 0) {
1090 		s = 0;
1091 		DIR *dirp;
1092 		struct dirent *d;
1093 
1094 		if ((dirp = opendir(httpd->virtbase)) != NULL) {
1095 			while ((d = readdir(dirp)) != NULL) {
1096 				if (strcmp(d->d_name, ".") == 0 ||
1097 				    strcmp(d->d_name, "..") == 0) {
1098 					continue;
1099 				}
1100 				debug((httpd, DEBUG_OBESE, "looking at dir``%s''",
1101 			 	   d->d_name));
1102 				if (strcmp(d->d_name, request->hr_host) == 0) {
1103 					/* found it, punch it */
1104 					debug((httpd, DEBUG_OBESE, "found it punch it"));
1105 					request->hr_virthostname =
1106 					    bozostrdup(httpd, d->d_name);
1107 					if (asprintf(&s, "%s/%s", httpd->virtbase,
1108 					    request->hr_virthostname) < 0)
1109 						bozo_err(httpd, 1, "asprintf");
1110 					break;
1111 				}
1112 			}
1113 			closedir(dirp);
1114 		}
1115 		else {
1116 			debug((httpd, DEBUG_FAT, "opendir %s failed: %s",
1117 			    httpd->virtbase, strerror(errno)));
1118 		}
1119 		if (s == 0) {
1120 			if (httpd->unknown_slash)
1121 				goto use_slashdir;
1122 			return bozo_http_error(httpd, 404, request,
1123 						"unknown URL");
1124 		}
1125 	} else
1126 use_slashdir:
1127 		s = httpd->slashdir;
1128 
1129 	/*
1130 	 * ok, nailed the correct slashdir, chdir to it
1131 	 */
1132 	if (chdir(s) < 0)
1133 		return bozo_http_error(httpd, 404, request,
1134 					"can't chdir to slashdir");
1135 	return 0;
1136 }
1137 
1138 /*
1139  * checks to see if this request has a valid .bzredirect file.  returns
1140  * 0 when no redirection happend, or 1 when handle_redirect() has been
1141  * called, -1 on error.
1142  */
1143 static int
check_bzredirect(bozo_httpreq_t * request)1144 check_bzredirect(bozo_httpreq_t *request)
1145 {
1146 	struct stat sb;
1147 	char dir[MAXPATHLEN], redir[MAXPATHLEN], redirpath[MAXPATHLEN + 1],
1148 	    path[MAXPATHLEN];
1149 	char *basename, *finalredir;
1150 	int rv, absolute;
1151 
1152 	/*
1153 	 * if this pathname is really a directory, but doesn't end in /,
1154 	 * use it as the directory to look for the redir file.
1155 	 */
1156 	if((size_t)snprintf(dir, sizeof(dir), "%s", request->hr_file + 1) >=
1157 	  sizeof(dir)) {
1158 		bozo_http_error(request->hr_httpd, 404, request,
1159 		  "file path too long");
1160 		return -1;
1161 	}
1162 	debug((request->hr_httpd, DEBUG_FAT, "check_bzredirect: dir %s", dir));
1163 	basename = strrchr(dir, '/');
1164 
1165 	if ((!basename || basename[1] != '\0') &&
1166 	    lstat(dir, &sb) == 0 && S_ISDIR(sb.st_mode))
1167 		/* nothing */;
1168 	else if (basename == NULL)
1169 		strcpy(dir, ".");
1170 	else {
1171 		*basename++ = '\0';
1172 		bozo_check_special_files(request, basename);
1173 	}
1174 
1175 	if ((size_t)snprintf(redir, sizeof(redir), "%s/%s", dir,
1176 	  REDIRECT_FILE) >= sizeof(redir)) {
1177 		bozo_http_error(request->hr_httpd, 404, request,
1178 		  "redirectfile path too long");
1179 		return -1;
1180 	}
1181 	if (lstat(redir, &sb) == 0) {
1182 		if (!S_ISLNK(sb.st_mode))
1183 			return 0;
1184 		absolute = 0;
1185 	} else {
1186 		if((size_t)snprintf(redir, sizeof(redir), "%s/%s", dir,
1187 		  ABSREDIRECT_FILE) >= sizeof(redir)) {
1188 			bozo_http_error(request->hr_httpd, 404, request,
1189 			  "redirectfile path too long");
1190 			return -1;
1191 		}
1192 		if (lstat(redir, &sb) < 0 || !S_ISLNK(sb.st_mode))
1193 			return 0;
1194 		absolute = 1;
1195 	}
1196 	debug((request->hr_httpd, DEBUG_FAT,
1197 	       "check_bzredirect: calling readlink"));
1198 	rv = readlink(redir, redirpath, sizeof redirpath - 1);
1199 	if (rv == -1 || rv == 0) {
1200 		debug((request->hr_httpd, DEBUG_FAT, "readlink failed"));
1201 		return 0;
1202 	}
1203 	redirpath[rv] = '\0';
1204 	debug((request->hr_httpd, DEBUG_FAT,
1205 	       "readlink returned \"%s\"", redirpath));
1206 
1207 	/* check if we need authentication */
1208 	snprintf(path, sizeof(path), "%s/", dir);
1209 	if (bozo_auth_check(request, path))
1210 		return 1;
1211 
1212 	/* now we have the link pointer, redirect to the real place */
1213 	if (absolute)
1214 		finalredir = redirpath;
1215 	else {
1216 		if ((size_t)snprintf(finalredir = redir, sizeof(redir), "/%s/%s",
1217 		  dir, redirpath) >= sizeof(redir)) {
1218 			bozo_http_error(request->hr_httpd, 404, request,
1219 			  "redirect path too long");
1220 			return -1;
1221 		}
1222 	}
1223 
1224 	debug((request->hr_httpd, DEBUG_FAT,
1225 	       "check_bzredirect: new redir %s", finalredir));
1226 	handle_redirect(request, finalredir, absolute);
1227 	return 1;
1228 }
1229 
1230 /* this fixes the %HH hack that RFC2396 requires.  */
1231 static int
fix_url_percent(bozo_httpreq_t * request)1232 fix_url_percent(bozo_httpreq_t *request)
1233 {
1234 	bozohttpd_t *httpd = request->hr_httpd;
1235 	char	*s, *t, buf[3], *url;
1236 	char	*end;	/* if end is not-zero, we don't translate beyond that */
1237 
1238 	url = request->hr_file;
1239 
1240 	end = url + strlen(url);
1241 
1242 	/* fast forward to the first % */
1243 	if ((s = strchr(url, '%')) == NULL)
1244 		return 0;
1245 
1246 	t = s;
1247 	do {
1248 		if (end && s >= end) {
1249 			debug((httpd, DEBUG_EXPLODING,
1250 				"fu_%%: past end, filling out.."));
1251 			while (*s)
1252 				*t++ = *s++;
1253 			break;
1254 		}
1255 		debug((httpd, DEBUG_EXPLODING,
1256 			"fu_%%: got s == %%, s[1]s[2] == %c%c",
1257 			s[1], s[2]));
1258 		if (s[1] == '\0' || s[2] == '\0') {
1259 			(void)bozo_http_error(httpd, 400, request,
1260 			    "percent hack missing two chars afterwards");
1261 			return 1;
1262 		}
1263 		if (s[1] == '0' && s[2] == '0') {
1264 			(void)bozo_http_error(httpd, 404, request,
1265 					"percent hack was %00");
1266 			return 1;
1267 		}
1268 		if (s[1] == '2' && s[2] == 'f') {
1269 			(void)bozo_http_error(httpd, 404, request,
1270 					"percent hack was %2f (/)");
1271 			return 1;
1272 		}
1273 
1274 		buf[0] = *++s;
1275 		buf[1] = *++s;
1276 		buf[2] = '\0';
1277 		s++;
1278 		*t = (char)strtol(buf, NULL, 16);
1279 		debug((httpd, DEBUG_EXPLODING,
1280 				"fu_%%: strtol put '%02x' into *t", *t));
1281 		if (*t++ == '\0') {
1282 			(void)bozo_http_error(httpd, 400, request,
1283 					"percent hack got a 0 back");
1284 			return 1;
1285 		}
1286 
1287 		while (*s && *s != '%') {
1288 			if (end && s >= end)
1289 				break;
1290 			*t++ = *s++;
1291 		}
1292 	} while (*s);
1293 	*t = '\0';
1294 
1295 	debug((httpd, DEBUG_FAT, "fix_url_percent returns %s in url",
1296 			request->hr_file));
1297 
1298 	return 0;
1299 }
1300 
/*
 * transform_request does this:
 *	- ``expand'' %20 crapola
 *	- look for "http://myname/" and deal with it (check_virtual()).
 *	- punt if it doesn't start with /
 *	- handle .bzredirect style redirections (check_bzredirect())
 *	- check httpd->untrustedref / referrer
 *	- check for ~user and call bozo_user_transform() if so
 *	- if the length > 1, check for trailing slash.  if so,
 *	  add the index.html file
 *	- if the length is 1, return the index.html file
 *	- disallow anything ending up with a file starting
 *	  at "/" or having ".." in it.
 *	- anything else is a really weird internal error
 *	- maybe call bozo_process_cgi() / bozo_process_lua()
 *
 * returns 1 when the caller still has to serve a file; in that case
 * request->hr_file has been replaced by the malloced name to serve and
 * the previous value is kept in request->hr_oldfile.  returns 0 when
 * the request has been dealt with already (error reply, redirect, cgi
 * or lua).  for ~user requests the value of bozo_user_transform() is
 * returned as is.  *isindex is set to 1 when the index file name was
 * substituted for a directory.
 */
static int
transform_request(bozo_httpreq_t *request, int *isindex)
{
	bozohttpd_t *httpd = request->hr_httpd;
	char	*file, *newfile = NULL;
	size_t	len;
	const char *hostname = BOZOHOST(httpd, request);

	file = NULL;
	*isindex = 0;
	debug((httpd, DEBUG_FAT, "tf_req: file %s", request->hr_file));
	/* both helpers send their own error reply when they return non-zero */
	if (fix_url_percent(request)) {
		goto bad_done;
	}
	if (check_virtual(request)) {
		goto bad_done;
	}
	/* check_virtual() may have replaced hr_file, so only read it now */
	file = request->hr_file;

	if (file[0] != '/') {
		(void)bozo_http_error(httpd, 404, request, "unknown URL");
		goto bad_done;
	}

	/* omit additional slashes at the beginning */
	while (file[1] == '/')
		file++;

	/* -1: error already reported, 1: redirect sent, 0: carry on */
	switch(check_bzredirect(request)) {
	case -1:
		goto bad_done;
	case 1:
		return 0;
	}

	if (httpd->untrustedref) {
		int to_indexhtml = 0;

/* true for "/", "/<index_html>" and "/favicon.ico" */
#define TOP_PAGE(x)	(strcmp((x), "/") == 0 || \
			 strcmp((x) + 1, httpd->index_html) == 0 || \
			 strcmp((x) + 1, "favicon.ico") == 0)

		debug((httpd, DEBUG_EXPLODING, "checking httpd->untrustedref"));
		/*
		 * first check that this path isn't allowed via .bzdirect file,
		 * and then check referrer; make sure that people come via the
		 * real name... otherwise if we aren't looking at / or
		 * /index.html, redirect...  we also special case favicon.ico.
		 */
		if (check_direct_access(request))
			/* nothing */;
		else if (request->hr_referrer) {
			const char *r = request->hr_referrer;

			debug((httpd, DEBUG_FAT,
				"checking referrer \"%s\" vs virthostname %s",
				r, hostname));
			if (strncmp(r, "http://", 7) != 0 ||
			    (strncasecmp(r + 7, hostname,
			    		 strlen(hostname)) != 0 &&
			     !TOP_PAGE(file)))
				to_indexhtml = 1;
		} else {
			const char *h = request->hr_host;

			debug((httpd, DEBUG_FAT, "url has no referrer at all"));
			/* if there's no referrer, let / or /index.html past */
			if (!TOP_PAGE(file) ||
			    (h && strncasecmp(h, hostname,
			    		strlen(hostname)) != 0))
				to_indexhtml = 1;
		}

		if (to_indexhtml) {
			char *slashindexhtml;

			if (asprintf(&slashindexhtml, "/%s",
					httpd->index_html) < 0)
				bozo_err(httpd, 1, "asprintf");
			debug((httpd, DEBUG_FAT,
				"httpd->untrustedref: redirecting %s to %s",
				file, slashindexhtml));
			handle_redirect(request, slashindexhtml, 0);
			free(slashindexhtml);
			return 0;
		}
	}

	len = strlen(file);
	/*
	 * the constant-false first branch lets the ~user branch below be
	 * compiled out without breaking the else-if chain.
	 */
	if (/*CONSTCOND*/0) {
#ifndef NO_USER_SUPPORT
	} else if (len > 1 && httpd->enable_users && file[1] == '~') {
		if (file[2] == '\0') {
			(void)bozo_http_error(httpd, 404, request,
						"missing username");
			goto bad_done;
		}
		/* "/~user" without a slash after the name: redirect */
		if (strchr(file + 2, '/') == NULL) {
			handle_redirect(request, NULL, 0);
			return 0;
		}
		debug((httpd, DEBUG_FAT, "calling bozo_user_transform"));

		return bozo_user_transform(request, isindex);
#endif /* NO_USER_SUPPORT */
	} else if (len > 1) {
		debug((httpd, DEBUG_FAT, "file[len-1] == %c", file[len-1]));
		if (file[len-1] == '/') {	/* append index.html */
			*isindex = 1;
			debug((httpd, DEBUG_FAT, "appending index.html"));
			/* len counts the leading '/', which pays for the NUL */
			newfile = bozomalloc(httpd,
					len + strlen(httpd->index_html) + 1);
			strcpy(newfile, file + 1);
			strcat(newfile, httpd->index_html);
		} else
			newfile = bozostrdup(request->hr_httpd, file + 1);
	} else if (len == 1) {
		debug((httpd, DEBUG_EXPLODING, "tf_req: len == 1"));
		newfile = bozostrdup(request->hr_httpd, httpd->index_html);
		*isindex = 1;
	} else {	/* len == 0 ? */
		(void)bozo_http_error(httpd, 500, request,
					"request->hr_file is nul?");
		goto bad_done;
	}

	if (newfile == NULL) {
		(void)bozo_http_error(httpd, 500, request, "internal failure");
		goto bad_done;
	}

	/*
	 * look for "http://myname/" and deal with it as necessary.
	 */

	/*
	 * stop traversing outside our domain
	 *
	 * XXX true security only comes from our parent using chroot(2)
	 * before execve(2)'ing us.  or our own built in chroot(2) support.
	 */
	if (*newfile == '/' || strcmp(newfile, "..") == 0 ||
	    strstr(newfile, "/..") || strstr(newfile, "../")) {
		(void)bozo_http_error(httpd, 403, request, "illegal request");
		goto bad_done;
	}

	if (bozo_auth_check(request, newfile))
		goto bad_done;

	/* an empty newfile leaves hr_file untouched */
	if (strlen(newfile)) {
		request->hr_oldfile = request->hr_file;
		request->hr_file = newfile;
	}

	if (bozo_process_cgi(request))
		return 0;

	if (bozo_process_lua(request))
		return 0;

	debug((httpd, DEBUG_FAT, "transform_request set: %s", newfile));
	return 1;
bad_done:
	debug((httpd, DEBUG_FAT, "transform_request returning: 0"));
	/* newfile is still NULL on the early error paths */
	free(newfile);
	return 0;
}
1485 
1486 /*
1487  * can_gzip checks if the request supports and prefers gzip encoding.
1488  *
1489  * XXX: we do not consider the associated q with gzip in making our
1490  *      decision which is broken.
1491  */
1492 
1493 static int
can_gzip(bozo_httpreq_t * request)1494 can_gzip(bozo_httpreq_t *request)
1495 {
1496 	const char	*pos;
1497 	const char	*tmp;
1498 	size_t		 len;
1499 
1500 	/* First we decide if the request can be gzipped at all. */
1501 
1502 	/* not if we already are encoded... */
1503 	tmp = bozo_content_encoding(request, request->hr_file);
1504 	if (tmp && *tmp)
1505 		return 0;
1506 
1507 	/* not if we are not asking for the whole file... */
1508 	if (request->hr_last_byte_pos != -1 || request->hr_have_range)
1509 		return 0;
1510 
1511 	/* Then we determine if gzip is on the cards. */
1512 
1513 	for (pos = request->hr_accept_encoding; pos && *pos; pos += len) {
1514 		while (*pos == ' ')
1515 			pos++;
1516 
1517 		len = strcspn(pos, ";,");
1518 
1519 		if ((len == 4 && strncasecmp("gzip", pos, 4) == 0) ||
1520 		    (len == 6 && strncasecmp("x-gzip", pos, 6) == 0))
1521 			return 1;
1522 
1523 		if (pos[len] == ';')
1524 			len += strcspn(&pos[len], ",");
1525 
1526 		if (pos[len])
1527 			len++;
1528 	}
1529 
1530 	return 0;
1531 }
1532 
1533 /*
1534  * bozo_process_request does the following:
1535  *	- check the request is valid
1536  *	- process cgi-bin if necessary
1537  *	- transform a filename if necesarry
1538  *	- return the HTTP request
1539  */
1540 void
bozo_process_request(bozo_httpreq_t * request)1541 bozo_process_request(bozo_httpreq_t *request)
1542 {
1543 	bozohttpd_t *httpd = request->hr_httpd;
1544 	struct	stat sb;
1545 	time_t timestamp;
1546 	char	*file;
1547 	const char *type, *encoding;
1548 	int	fd, isindex;
1549 
1550 	/*
1551 	 * note that transform_request chdir()'s if required.  also note
1552 	 * that cgi is handed here.  if transform_request() returns 0
1553 	 * then the request has been handled already.
1554 	 */
1555 	if (transform_request(request, &isindex) == 0)
1556 		return;
1557 
1558 	fd = -1;
1559 	encoding = NULL;
1560 	if (can_gzip(request)) {
1561 		asprintf(&file, "%s.gz", request->hr_file);
1562 		fd = open(file, O_RDONLY);
1563 		if (fd >= 0)
1564 			encoding = "gzip";
1565 		free(file);
1566 	}
1567 
1568 	file = request->hr_file;
1569 
1570 	if (fd < 0)
1571 		fd = open(file, O_RDONLY);
1572 
1573 	if (fd < 0) {
1574 		debug((httpd, DEBUG_FAT, "open failed: %s", strerror(errno)));
1575 		switch(errno) {
1576 		case EPERM:
1577 		case EACCES:
1578 			(void)bozo_http_error(httpd, 403, request,
1579 						"no permission to open file");
1580 			break;
1581 		case ENAMETOOLONG:
1582 			/*FALLTHROUGH*/
1583 		case ENOENT:
1584 			if (!bozo_dir_index(request, file, isindex))
1585 				(void)bozo_http_error(httpd, 404, request,
1586 							"no file");
1587 			break;
1588 		default:
1589 			(void)bozo_http_error(httpd, 500, request, "open file");
1590 		}
1591 		goto cleanup_nofd;
1592 	}
1593 	if (fstat(fd, &sb) < 0) {
1594 		(void)bozo_http_error(httpd, 500, request, "can't fstat");
1595 		goto cleanup;
1596 	}
1597 	if (S_ISDIR(sb.st_mode)) {
1598 		handle_redirect(request, NULL, 0);
1599 		goto cleanup;
1600 	}
1601 
1602 	if (request->hr_if_modified_since &&
1603 	    parse_http_date(request->hr_if_modified_since, &timestamp) &&
1604 	    timestamp >= sb.st_mtime) {
1605 		/* XXX ignore subsecond of timestamp */
1606 		bozo_printf(httpd, "%s 304 Not Modified\r\n",
1607 				request->hr_proto);
1608 		bozo_printf(httpd, "\r\n");
1609 		bozo_flush(httpd, stdout);
1610 		goto cleanup;
1611 	}
1612 
1613 	/* validate requested range */
1614 	if (request->hr_last_byte_pos == -1 ||
1615 	    request->hr_last_byte_pos >= sb.st_size)
1616 		request->hr_last_byte_pos = sb.st_size - 1;
1617 	if (request->hr_have_range &&
1618 	    request->hr_first_byte_pos > request->hr_last_byte_pos) {
1619 		request->hr_have_range = 0;	/* punt */
1620 		request->hr_first_byte_pos = 0;
1621 		request->hr_last_byte_pos = sb.st_size - 1;
1622 	}
1623 	debug((httpd, DEBUG_FAT, "have_range %d first_pos %lld last_pos %lld",
1624 	    request->hr_have_range,
1625 	    (long long)request->hr_first_byte_pos,
1626 	    (long long)request->hr_last_byte_pos));
1627 	if (request->hr_have_range)
1628 		bozo_printf(httpd, "%s 206 Partial Content\r\n",
1629 				request->hr_proto);
1630 	else
1631 		bozo_printf(httpd, "%s 200 OK\r\n", request->hr_proto);
1632 
1633 	if (request->hr_proto != httpd->consts.http_09) {
1634 		type = bozo_content_type(request, file);
1635 		if (!encoding)
1636 			encoding = bozo_content_encoding(request, file);
1637 
1638 		bozo_print_header(request, &sb, type, encoding);
1639 		bozo_printf(httpd, "\r\n");
1640 	}
1641 	bozo_flush(httpd, stdout);
1642 
1643 	if (request->hr_method != HTTP_HEAD) {
1644 		off_t szleft, cur_byte_pos;
1645 
1646 		szleft =
1647 		     request->hr_last_byte_pos - request->hr_first_byte_pos + 1;
1648 		cur_byte_pos = request->hr_first_byte_pos;
1649 
1650  retry:
1651 		while (szleft) {
1652 			size_t sz;
1653 
1654 			/* This should take care of the first unaligned chunk */
1655 			if ((cur_byte_pos & (httpd->page_size - 1)) != 0)
1656 				sz = (size_t)(cur_byte_pos & ~httpd->page_size);
1657 			if ((off_t)httpd->mmapsz < szleft)
1658 				sz = httpd->mmapsz;
1659 			else
1660 				sz = (size_t)szleft;
1661 			if (mmap_and_write_part(httpd, fd, cur_byte_pos, sz)) {
1662 				if (errno == ENOMEM) {
1663 					httpd->mmapsz /= 2;
1664 					if (httpd->mmapsz >= httpd->page_size)
1665 						goto retry;
1666 				}
1667 				goto cleanup;
1668 			}
1669 			cur_byte_pos += sz;
1670 			szleft -= sz;
1671 		}
1672 	}
1673  cleanup:
1674 	close(fd);
1675  cleanup_nofd:
1676 	close(STDIN_FILENO);
1677 	close(STDOUT_FILENO);
1678 	/*close(STDERR_FILENO);*/
1679 }
1680 
1681 /* make sure we're not trying to access special files */
1682 int
bozo_check_special_files(bozo_httpreq_t * request,const char * name)1683 bozo_check_special_files(bozo_httpreq_t *request, const char *name)
1684 {
1685 	bozohttpd_t *httpd = request->hr_httpd;
1686 
1687 	/* ensure basename(name) != special files */
1688 	if (strcmp(name, DIRECT_ACCESS_FILE) == 0)
1689 		return bozo_http_error(httpd, 403, request,
1690 		    "no permission to open direct access file");
1691 	if (strcmp(name, REDIRECT_FILE) == 0)
1692 		return bozo_http_error(httpd, 403, request,
1693 		    "no permission to open redirect file");
1694 	if (strcmp(name, ABSREDIRECT_FILE) == 0)
1695 		return bozo_http_error(httpd, 403, request,
1696 		    "no permission to open redirect file");
1697 	return bozo_auth_check_special_files(request, name);
1698 }
1699 
1700 /* generic header printing routine */
1701 void
bozo_print_header(bozo_httpreq_t * request,struct stat * sbp,const char * type,const char * encoding)1702 bozo_print_header(bozo_httpreq_t *request,
1703 		struct stat *sbp, const char *type, const char *encoding)
1704 {
1705 	bozohttpd_t *httpd = request->hr_httpd;
1706 	off_t len;
1707 	char	date[40];
1708 
1709 	bozo_printf(httpd, "Date: %s\r\n", bozo_http_date(date, sizeof(date)));
1710 	bozo_printf(httpd, "Server: %s\r\n", httpd->server_software);
1711 	bozo_printf(httpd, "Accept-Ranges: bytes\r\n");
1712 	if (sbp) {
1713 		char filedate[40];
1714 		struct	tm *tm;
1715 
1716 		tm = gmtime(&sbp->st_mtime);
1717 		strftime(filedate, sizeof filedate,
1718 		    "%a, %d %b %Y %H:%M:%S GMT", tm);
1719 		bozo_printf(httpd, "Last-Modified: %s\r\n", filedate);
1720 	}
1721 	if (type && *type)
1722 		bozo_printf(httpd, "Content-Type: %s\r\n", type);
1723 	if (encoding && *encoding)
1724 		bozo_printf(httpd, "Content-Encoding: %s\r\n", encoding);
1725 	if (sbp) {
1726 		if (request->hr_have_range) {
1727 			len = request->hr_last_byte_pos -
1728 					request->hr_first_byte_pos +1;
1729 			bozo_printf(httpd,
1730 				"Content-Range: bytes %qd-%qd/%qd\r\n",
1731 				(long long) request->hr_first_byte_pos,
1732 				(long long) request->hr_last_byte_pos,
1733 				(long long) sbp->st_size);
1734 		} else
1735 			len = sbp->st_size;
1736 		bozo_printf(httpd, "Content-Length: %qd\r\n", (long long)len);
1737 	}
1738 	if (request && request->hr_proto == httpd->consts.http_11)
1739 		bozo_printf(httpd, "Connection: close\r\n");
1740 	bozo_flush(httpd, stdout);
1741 }
1742 
1743 #ifndef NO_DEBUG
1744 void
debug__(bozohttpd_t * httpd,int level,const char * fmt,...)1745 debug__(bozohttpd_t *httpd, int level, const char *fmt, ...)
1746 {
1747 	va_list	ap;
1748 	int savederrno;
1749 
1750 	/* only log if the level is low enough */
1751 	if (httpd->debug < level)
1752 		return;
1753 
1754 	savederrno = errno;
1755 	va_start(ap, fmt);
1756 	if (httpd->logstderr) {
1757 		vfprintf(stderr, fmt, ap);
1758 		fputs("\n", stderr);
1759 	} else
1760 		vsyslog(LOG_DEBUG, fmt, ap);
1761 	va_end(ap);
1762 	errno = savederrno;
1763 }
1764 #endif /* NO_DEBUG */
1765 
1766 /* these are like warn() and err(), except for syslog not stderr */
1767 void
bozo_warn(bozohttpd_t * httpd,const char * fmt,...)1768 bozo_warn(bozohttpd_t *httpd, const char *fmt, ...)
1769 {
1770 	va_list ap;
1771 
1772 	va_start(ap, fmt);
1773 	if (httpd->logstderr || isatty(STDERR_FILENO)) {
1774 		//fputs("warning: ", stderr);
1775 		vfprintf(stderr, fmt, ap);
1776 		fputs("\n", stderr);
1777 	} else
1778 		vsyslog(LOG_INFO, fmt, ap);
1779 	va_end(ap);
1780 }
1781 
1782 void
bozo_err(bozohttpd_t * httpd,int code,const char * fmt,...)1783 bozo_err(bozohttpd_t *httpd, int code, const char *fmt, ...)
1784 {
1785 	va_list ap;
1786 
1787 	va_start(ap, fmt);
1788 	if (httpd->logstderr || isatty(STDERR_FILENO)) {
1789 		//fputs("error: ", stderr);
1790 		vfprintf(stderr, fmt, ap);
1791 		fputs("\n", stderr);
1792 	} else
1793 		vsyslog(LOG_ERR, fmt, ap);
1794 	va_end(ap);
1795 	exit(code);
1796 }
1797 
1798 /*
1799  * this escapes HTML tags.  returns allocated escaped
1800  * string if needed, or NULL on allocation failure or
1801  * lack of escape need.
1802  * call with NULL httpd in error paths, to avoid recursive
1803  * malloc failure.  call with valid httpd in normal paths
1804  * to get automatic allocation failure handling.
1805  */
1806 char *
bozo_escape_html(bozohttpd_t * httpd,const char * url)1807 bozo_escape_html(bozohttpd_t *httpd, const char *url)
1808 {
1809 	int	i, j;
1810 	char	*tmp;
1811 	size_t	len;
1812 
1813 	for (i = 0, j = 0; url[i]; i++) {
1814 		switch (url[i]) {
1815 		case '<':
1816 		case '>':
1817 			j += 4;
1818 			break;
1819 		case '&':
1820 			j += 5;
1821 			break;
1822 		}
1823 	}
1824 
1825 	if (j == 0)
1826 		return NULL;
1827 
1828 	/*
1829 	 * we need to handle being called from different
1830 	 * pathnames.
1831 	 */
1832 	len = strlen(url) + j;
1833 	if (httpd)
1834 		tmp = bozomalloc(httpd, len);
1835 	else if ((tmp = malloc(len)) == 0)
1836 			return NULL;
1837 
1838 	for (i = 0, j = 0; url[i]; i++) {
1839 		switch (url[i]) {
1840 		case '<':
1841 			memcpy(tmp + j, "&lt;", 4);
1842 			j += 4;
1843 			break;
1844 		case '>':
1845 			memcpy(tmp + j, "&gt;", 4);
1846 			j += 4;
1847 			break;
1848 		case '&':
1849 			memcpy(tmp + j, "&amp;", 5);
1850 			j += 5;
1851 			break;
1852 		default:
1853 			tmp[j++] = url[i];
1854 		}
1855 	}
1856 	tmp[j] = 0;
1857 
1858 	return tmp;
1859 }
1860 
/*
 * table of the HTTP error codes we send, each with the text for the
 * status line / page heading and a one-sentence explanation.  the
 * entry with code 0 ends the table.
 */
static struct errors_map {
	int	code;			/* HTTP return code */
	const char *shortmsg;		/* short version of message */
	const char *longmsg;		/* long version of message */
} errors_map[] = {
	{ .code = 400, .shortmsg = "400 Bad Request",
	  .longmsg = "The request was not valid" },
	{ .code = 401, .shortmsg = "401 Unauthorized",
	  .longmsg = "No authorization" },
	{ .code = 403, .shortmsg = "403 Forbidden",
	  .longmsg = "Access to this item has been denied" },
	{ .code = 404, .shortmsg = "404 Not Found",
	  .longmsg = "This item has not been found" },
	{ .code = 408, .shortmsg = "408 Request Timeout",
	  .longmsg = "This request took too long" },
	{ .code = 417, .shortmsg = "417 Expectation Failed",
	  .longmsg = "Expectations not available" },
	{ .code = 420, .shortmsg = "420 Enhance Your Calm",
	  .longmsg = "Chill, Winston" },
	{ .code = 500, .shortmsg = "500 Internal Error",
	  .longmsg = "An error occured on the server" },
	{ .code = 501, .shortmsg = "501 Not Implemented",
	  .longmsg = "This request is not available" },
	{ .code = 0, .shortmsg = NULL, .longmsg = NULL },
};

/* what the lookup functions hand out for a code missing from the table */
static const char *help = "DANGER! WILL ROBINSON! DANGER!";
1880 
1881 static const char *
http_errors_short(int code)1882 http_errors_short(int code)
1883 {
1884 	struct errors_map *ep;
1885 
1886 	for (ep = errors_map; ep->code; ep++)
1887 		if (ep->code == code)
1888 			return (ep->shortmsg);
1889 	return (help);
1890 }
1891 
1892 static const char *
http_errors_long(int code)1893 http_errors_long(int code)
1894 {
1895 	struct errors_map *ep;
1896 
1897 	for (ep = errors_map; ep->code; ep++)
1898 		if (ep->code == code)
1899 			return (ep->longmsg);
1900 	return (help);
1901 }
1902 
1903 /* the follow functions and variables are used in handling HTTP errors */
1904 /* ARGSUSED */
1905 int
bozo_http_error(bozohttpd_t * httpd,int code,bozo_httpreq_t * request,const char * msg)1906 bozo_http_error(bozohttpd_t *httpd, int code, bozo_httpreq_t *request,
1907 		const char *msg)
1908 {
1909 	char portbuf[20];
1910 	const char *header = http_errors_short(code);
1911 	const char *reason = http_errors_long(code);
1912 	const char *proto = (request && request->hr_proto) ?
1913 				request->hr_proto : httpd->consts.http_11;
1914 	int	size;
1915 
1916 	debug((httpd, DEBUG_FAT, "bozo_http_error %d: %s", code, msg));
1917 	if (header == NULL || reason == NULL) {
1918 		bozo_err(httpd, 1,
1919 			"bozo_http_error() failed (short = %p, long = %p)",
1920 			header, reason);
1921 		return code;
1922 	}
1923 
1924 	if (request && request->hr_serverport &&
1925 	    strcmp(request->hr_serverport, "80") != 0)
1926 		snprintf(portbuf, sizeof(portbuf), ":%s",
1927 				request->hr_serverport);
1928 	else
1929 		portbuf[0] = '\0';
1930 
1931 	if (request && request->hr_file) {
1932 		char *file = NULL;
1933 		const char *hostname = BOZOHOST(httpd, request);
1934 
1935 		/* bozo_escape_html() failure here is just too bad. */
1936 		file = bozo_escape_html(NULL, request->hr_file);
1937 		if (file == NULL)
1938 			file = request->hr_file;
1939 		size = snprintf(httpd->errorbuf, BUFSIZ,
1940 		    "<html><head><title>%s</title></head>\n"
1941 		    "<body><h1>%s</h1>\n"
1942 		    "%s: <pre>%s</pre>\n"
1943  		    "<hr><address><a href=\"http://%s%s/\">%s%s</a></address>\n"
1944 		    "</body></html>\n",
1945 		    header, header, file, reason,
1946 		    hostname, portbuf, hostname, portbuf);
1947 		if (size >= (int)BUFSIZ) {
1948 			bozo_warn(httpd,
1949 				"bozo_http_error buffer too small, truncated");
1950 			size = (int)BUFSIZ;
1951 		}
1952 	} else
1953 		size = 0;
1954 
1955 	bozo_printf(httpd, "%s %s\r\n", proto, header);
1956 	if (request)
1957 		bozo_auth_check_401(request, code);
1958 
1959 	bozo_printf(httpd, "Content-Type: text/html\r\n");
1960 	bozo_printf(httpd, "Content-Length: %d\r\n", size);
1961 	bozo_printf(httpd, "Server: %s\r\n", httpd->server_software);
1962 	if (request && request->hr_allow)
1963 		bozo_printf(httpd, "Allow: %s\r\n", request->hr_allow);
1964 	bozo_printf(httpd, "\r\n");
1965 	/* According to the RFC 2616 sec. 9.4 HEAD method MUST NOT return a
1966 	 * message-body in the response */
1967 	if (size && request && request->hr_method != HTTP_HEAD)
1968 		bozo_printf(httpd, "%s", httpd->errorbuf);
1969 	bozo_flush(httpd, stdout);
1970 
1971 	return code;
1972 }
1973 
1974 /* Below are various modified libc functions */
1975 
/*
 * strsep(3) with a length limit.  *lenp is the number of characters
 * that may be looked at; it is decremented for each one consumed.  if
 * it runs out before a delimiter is found, NULL is returned with *lenp
 * left at -1 and *strp untouched.  otherwise this acts like strsep:
 * the token is NUL terminated in place, *strp is moved past the
 * delimiter (or set to NULL if the token ended at the end of the
 * string) and the token is returned.  a NULL lenp means "no limit".
 * Note that the length must be correctly passed in.
 */
char *
bozostrnsep(char **strp, const char *delim, ssize_t *lenp)
{
	char	*start, *cur;
	const	char *d;
	int	ch, dch;

	start = *strp;
	if (start == NULL)
		return NULL;

	cur = start;
	for (;;) {
		if (lenp != NULL) {
			*lenp -= 1;
			if (*lenp == -1)
				return NULL;
		}

		ch = *cur++;

		/*
		 * compare against every delimiter, the terminating NUL
		 * of `delim' included, so that the end of the string
		 * ends the token as well.
		 */
		d = delim;
		for (;;) {
			dch = *d++;
			if (dch == ch) {
				if (ch == 0)
					cur = NULL;
				else
					cur[-1] = '\0';
				*strp = cur;
				return start;
			}
			if (dch == 0)
				break;
		}
	}
	/* NOTREACHED */
}
2009 
2010 /*
2011  * inspired by fgetln(3), but works for fd's.  should work identically
2012  * except it, however, does *not* return the newline, and it does nul
2013  * terminate the string.
2014  */
2015 char *
bozodgetln(bozohttpd_t * httpd,int fd,ssize_t * lenp,ssize_t (* readfn)(bozohttpd_t *,int,void *,size_t))2016 bozodgetln(bozohttpd_t *httpd, int fd, ssize_t *lenp,
2017 	ssize_t (*readfn)(bozohttpd_t *, int, void *, size_t))
2018 {
2019 	ssize_t	len;
2020 	int	got_cr = 0;
2021 	char	c, *nbuffer;
2022 
2023 	/* initialise */
2024 	if (httpd->getln_buflen == 0) {
2025 		/* should be plenty for most requests */
2026 		httpd->getln_buflen = 128;
2027 		httpd->getln_buffer = malloc((size_t)httpd->getln_buflen);
2028 		if (httpd->getln_buffer == NULL) {
2029 			httpd->getln_buflen = 0;
2030 			return NULL;
2031 		}
2032 	}
2033 	len = 0;
2034 
2035 	/*
2036 	 * we *have* to read one byte at a time, to not break cgi
2037 	 * programs (for we pass stdin off to them).  could fix this
2038 	 * by becoming a fd-passing program instead of just exec'ing
2039 	 * the program
2040 	 *
2041 	 * the above is no longer true, we are the fd-passing
2042 	 * program already.
2043 	 */
2044 	for (; readfn(httpd, fd, &c, 1) == 1; ) {
2045 		debug((httpd, DEBUG_EXPLODING, "bozodgetln read %c", c));
2046 
2047 		if (len >= httpd->getln_buflen - 1) {
2048 			httpd->getln_buflen *= 2;
2049 			debug((httpd, DEBUG_EXPLODING, "bozodgetln: "
2050 				"reallocating buffer to buflen %zu",
2051 				httpd->getln_buflen));
2052 			nbuffer = bozorealloc(httpd, httpd->getln_buffer,
2053 				(size_t)httpd->getln_buflen);
2054 			httpd->getln_buffer = nbuffer;
2055 		}
2056 
2057 		httpd->getln_buffer[len++] = c;
2058 		if (c == '\r') {
2059 			got_cr = 1;
2060 			continue;
2061 		} else if (c == '\n') {
2062 			/*
2063 			 * HTTP/1.1 spec says to ignore CR and treat
2064 			 * LF as the real line terminator.  even though
2065 			 * the same spec defines CRLF as the line
2066 			 * terminator, it is recommended in section 19.3
2067 			 * to do the LF trick for tolerance.
2068 			 */
2069 			if (got_cr)
2070 				len -= 2;
2071 			else
2072 				len -= 1;
2073 			break;
2074 		}
2075 
2076 	}
2077 	httpd->getln_buffer[len] = '\0';
2078 	debug((httpd, DEBUG_OBESE, "bozodgetln returns: ``%s'' with len %zd",
2079 	       httpd->getln_buffer, len));
2080 	*lenp = len;
2081 	return httpd->getln_buffer;
2082 }
2083 
2084 void *
bozorealloc(bozohttpd_t * httpd,void * ptr,size_t size)2085 bozorealloc(bozohttpd_t *httpd, void *ptr, size_t size)
2086 {
2087 	void	*p;
2088 
2089 	p = realloc(ptr, size);
2090 	if (p == NULL) {
2091 		(void)bozo_http_error(httpd, 500, NULL,
2092 				"memory allocation failure");
2093 		exit(1);
2094 	}
2095 	return (p);
2096 }
2097 
2098 void *
bozomalloc(bozohttpd_t * httpd,size_t size)2099 bozomalloc(bozohttpd_t *httpd, size_t size)
2100 {
2101 	void	*p;
2102 
2103 	p = malloc(size);
2104 	if (p == NULL) {
2105 		(void)bozo_http_error(httpd, 500, NULL,
2106 				"memory allocation failure");
2107 		exit(1);
2108 	}
2109 	return (p);
2110 }
2111 
2112 char *
bozostrdup(bozohttpd_t * httpd,const char * str)2113 bozostrdup(bozohttpd_t *httpd, const char *str)
2114 {
2115 	char	*p;
2116 
2117 	p = strdup(str);
2118 	if (p == NULL) {
2119 		(void)bozo_http_error(httpd, 500, NULL,
2120 					"memory allocation failure");
2121 		exit(1);
2122 	}
2123 	return (p);
2124 }
2125 
2126 /* set default values in bozohttpd_t struct */
2127 int
bozo_init_httpd(bozohttpd_t * httpd)2128 bozo_init_httpd(bozohttpd_t *httpd)
2129 {
2130 	/* make sure everything is clean */
2131 	(void) memset(httpd, 0x0, sizeof(*httpd));
2132 
2133 	/* constants */
2134 	httpd->consts.http_09 = "HTTP/0.9";
2135 	httpd->consts.http_10 = "HTTP/1.0";
2136 	httpd->consts.http_11 = "HTTP/1.1";
2137 	httpd->consts.text_plain = "text/plain";
2138 
2139 	/* mmap region size */
2140 	httpd->mmapsz = BOZO_MMAPSZ;
2141 
2142 	/* error buffer for bozo_http_error() */
2143 	if ((httpd->errorbuf = malloc(BUFSIZ)) == NULL) {
2144 		(void) fprintf(stderr,
2145 			"bozohttpd: memory_allocation failure\n");
2146 		return 0;
2147 	}
2148 #ifndef NO_LUA_SUPPORT
2149 	SIMPLEQ_INIT(&httpd->lua_states);
2150 #endif
2151 	return 1;
2152 }
2153 
2154 /* set default values in bozoprefs_t struct */
2155 int
bozo_init_prefs(bozoprefs_t * prefs)2156 bozo_init_prefs(bozoprefs_t *prefs)
2157 {
2158 	/* make sure everything is clean */
2159 	(void) memset(prefs, 0x0, sizeof(*prefs));
2160 
2161 	/* set up default values */
2162 	bozo_set_pref(prefs, "server software", SERVER_SOFTWARE);
2163 	bozo_set_pref(prefs, "index.html", INDEX_HTML);
2164 	bozo_set_pref(prefs, "public_html", PUBLIC_HTML);
2165 
2166 	return 1;
2167 }
2168 
2169 /* set default values */
2170 int
bozo_set_defaults(bozohttpd_t * httpd,bozoprefs_t * prefs)2171 bozo_set_defaults(bozohttpd_t *httpd, bozoprefs_t *prefs)
2172 {
2173 	return bozo_init_httpd(httpd) && bozo_init_prefs(prefs);
2174 }
2175 
2176 /* set the virtual host name, port and root */
2177 int
bozo_setup(bozohttpd_t * httpd,bozoprefs_t * prefs,const char * vhost,const char * root)2178 bozo_setup(bozohttpd_t *httpd, bozoprefs_t *prefs, const char *vhost,
2179 		const char *root)
2180 {
2181 	struct passwd	 *pw;
2182 	extern char	**environ;
2183 	static char	 *cleanenv[1] = { NULL };
2184 	uid_t		  uid;
2185 	char		 *chrootdir;
2186 	char		 *username;
2187 	char		 *portnum;
2188 	char		 *cp;
2189 	int		  dirtyenv;
2190 
2191 	dirtyenv = 0;
2192 
2193 	if (vhost == NULL) {
2194 		httpd->virthostname = bozomalloc(httpd, MAXHOSTNAMELEN+1);
2195 		/* XXX we do not check for FQDN here */
2196 		if (gethostname(httpd->virthostname, MAXHOSTNAMELEN+1) < 0)
2197 			bozo_err(httpd, 1, "gethostname");
2198 		httpd->virthostname[MAXHOSTNAMELEN] = '\0';
2199 	} else {
2200 		httpd->virthostname = strdup(vhost);
2201 	}
2202 	httpd->slashdir = strdup(root);
2203 	if ((portnum = bozo_get_pref(prefs, "port number")) != NULL) {
2204 		httpd->bindport = strdup(portnum);
2205 	}
2206 
2207 	/* go over preferences now */
2208 	if ((cp = bozo_get_pref(prefs, "numeric")) != NULL &&
2209 	    strcmp(cp, "true") == 0) {
2210 		httpd->numeric = 1;
2211 	}
2212 	if ((cp = bozo_get_pref(prefs, "trusted referal")) != NULL &&
2213 	    strcmp(cp, "true") == 0) {
2214 		httpd->untrustedref = 1;
2215 	}
2216 	if ((cp = bozo_get_pref(prefs, "log to stderr")) != NULL &&
2217 	    strcmp(cp, "true") == 0) {
2218 		httpd->logstderr = 1;
2219 	}
2220 	if ((cp = bozo_get_pref(prefs, "bind address")) != NULL) {
2221 		httpd->bindaddress = strdup(cp);
2222 	}
2223 	if ((cp = bozo_get_pref(prefs, "background")) != NULL) {
2224 		httpd->background = atoi(cp);
2225 	}
2226 	if ((cp = bozo_get_pref(prefs, "foreground")) != NULL &&
2227 	    strcmp(cp, "true") == 0) {
2228 		httpd->foreground = 1;
2229 	}
2230 	if ((cp = bozo_get_pref(prefs, "pid file")) != NULL) {
2231 		httpd->pidfile = strdup(cp);
2232 	}
2233 	if ((cp = bozo_get_pref(prefs, "unknown slash")) != NULL &&
2234 	    strcmp(cp, "true") == 0) {
2235 		httpd->unknown_slash = 1;
2236 	}
2237 	if ((cp = bozo_get_pref(prefs, "virtual base")) != NULL) {
2238 		httpd->virtbase = strdup(cp);
2239 	}
2240 	if ((cp = bozo_get_pref(prefs, "enable users")) != NULL &&
2241 	    strcmp(cp, "true") == 0) {
2242 		httpd->enable_users = 1;
2243 	}
2244 	if ((cp = bozo_get_pref(prefs, "dirty environment")) != NULL &&
2245 	    strcmp(cp, "true") == 0) {
2246 		dirtyenv = 1;
2247 	}
2248 	if ((cp = bozo_get_pref(prefs, "hide dots")) != NULL &&
2249 	    strcmp(cp, "true") == 0) {
2250 		httpd->hide_dots = 1;
2251 	}
2252 	if ((cp = bozo_get_pref(prefs, "directory indexing")) != NULL &&
2253 	    strcmp(cp, "true") == 0) {
2254 		httpd->dir_indexing = 1;
2255 	}
2256 	if ((cp = bozo_get_pref(prefs, "public_html")) != NULL) {
2257 		httpd->public_html = strdup(cp);
2258 	}
2259 	httpd->server_software =
2260 			strdup(bozo_get_pref(prefs, "server software"));
2261 	httpd->index_html = strdup(bozo_get_pref(prefs, "index.html"));
2262 
2263 	/*
2264 	 * initialise ssl and daemon mode if necessary.
2265 	 */
2266 	bozo_ssl_init(httpd);
2267 	bozo_daemon_init(httpd);
2268 
2269 	if ((username = bozo_get_pref(prefs, "username")) == NULL) {
2270 		if ((pw = getpwuid(uid = 0)) == NULL)
2271 			bozo_err(httpd, 1, "getpwuid(0): %s", strerror(errno));
2272 		httpd->username = strdup(pw->pw_name);
2273 	} else {
2274 		httpd->username = strdup(username);
2275 		if ((pw = getpwnam(httpd->username)) == NULL)
2276 			bozo_err(httpd, 1, "getpwnam(%s): %s", httpd->username,
2277 					strerror(errno));
2278 		if (initgroups(pw->pw_name, pw->pw_gid) == -1)
2279 			bozo_err(httpd, 1, "initgroups: %s", strerror(errno));
2280 		if (setgid(pw->pw_gid) == -1)
2281 			bozo_err(httpd, 1, "setgid(%u): %s", pw->pw_gid,
2282 					strerror(errno));
2283 		uid = pw->pw_uid;
2284 	}
2285 	/*
2286 	 * handle chroot.
2287 	 */
2288 	if ((chrootdir = bozo_get_pref(prefs, "chroot dir")) != NULL) {
2289 		httpd->rootdir = strdup(chrootdir);
2290 		if (chdir(httpd->rootdir) == -1)
2291 			bozo_err(httpd, 1, "chdir(%s): %s", httpd->rootdir,
2292 				strerror(errno));
2293 		if (chroot(httpd->rootdir) == -1)
2294 			bozo_err(httpd, 1, "chroot(%s): %s", httpd->rootdir,
2295 				strerror(errno));
2296 	}
2297 
2298 	if (username != NULL)
2299 		if (setuid(uid) == -1)
2300 			bozo_err(httpd, 1, "setuid(%d): %s", uid,
2301 					strerror(errno));
2302 
2303 	/*
2304 	 * prevent info leakage between different compartments.
2305 	 * some PATH values in the environment would be invalided
2306 	 * by chroot. cross-user settings might result in undesirable
2307 	 * effects.
2308 	 */
2309 	if ((chrootdir != NULL || username != NULL) && !dirtyenv)
2310 		environ = cleanenv;
2311 
2312 #ifdef _SC_PAGESIZE
2313 	httpd->page_size = (long)sysconf(_SC_PAGESIZE);
2314 #else
2315 	httpd->page_size = 4096;
2316 #endif
2317 	debug((httpd, DEBUG_OBESE, "myname is %s, slashdir is %s",
2318 			httpd->virthostname, httpd->slashdir));
2319 
2320 	return 1;
2321 }
2322