htparser: Fixed pidfile initialization bug.
[ashd.git] / src / htparser.c
... / ...
CommitLineData
1/*
2 ashd - A Sane HTTP Daemon
3 Copyright (C) 2008 Fredrik Tolf <fredrik@dolda2000.com>
4
5 This program is free software: you can redistribute it and/or modify
6 it under the terms of the GNU General Public License as published by
7 the Free Software Foundation, either version 3 of the License, or
8 (at your option) any later version.
9
10 This program is distributed in the hope that it will be useful,
11 but WITHOUT ANY WARRANTY; without even the implied warranty of
12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 GNU General Public License for more details.
14
15 You should have received a copy of the GNU General Public License
16 along with this program. If not, see <http://www.gnu.org/licenses/>.
17*/
18
19#include <stdlib.h>
20#include <unistd.h>
21#include <stdio.h>
22#include <fcntl.h>
23#include <string.h>
24#include <sys/socket.h>
25#include <pwd.h>
26#include <sys/signal.h>
27#include <errno.h>
28
29#ifdef HAVE_CONFIG_H
30#include <config.h>
31#endif
32#include <utils.h>
33#include <mt.h>
34#include <mtio.h>
35#include <log.h>
36#include <req.h>
37#include <proc.h>
38#include <bufio.h>
39
40#include "htparser.h"
41
42static int plex;
43static int daemonize, usesyslog;
44struct mtbuf listeners;
45
46static void trimx(struct hthead *req)
47{
48 int i;
49
50 i = 0;
51 while(i < req->noheaders) {
52 if(!strncasecmp(req->headers[i][0], "x-ash-", 6)) {
53 free(req->headers[i][0]);
54 free(req->headers[i][1]);
55 free(req->headers[i]);
56 memmove(req->headers + i, req->headers + i + 1, sizeof(*req->headers) * (--req->noheaders - i));
57 } else {
58 i++;
59 }
60 }
61}
62
63static struct hthead *parsereq(struct bufio *in)
64{
65 struct hthead *req;
66 struct charbuf method, url, ver;
67 int c;
68
69 req = NULL;
70 bufinit(method);
71 bufinit(url);
72 bufinit(ver);
73 while(1) {
74 c = biogetc(in);
75 if(c == ' ') {
76 break;
77 } else if((c == EOF) || (c < 32) || (c >= 128)) {
78 goto fail;
79 } else {
80 bufadd(method, c);
81 if(method.d >= 128)
82 goto fail;
83 }
84 }
85 while(1) {
86 c = biogetc(in);
87 if(c == ' ') {
88 break;
89 } else if((c == EOF) || (c < 32)) {
90 goto fail;
91 } else {
92 bufadd(url, c);
93 if(url.d >= 65536)
94 goto fail;
95 }
96 }
97 while(1) {
98 c = biogetc(in);
99 if(c == 10) {
100 break;
101 } else if(c == 13) {
102 } else if((c == EOF) || (c < 32) || (c >= 128)) {
103 goto fail;
104 } else {
105 bufadd(ver, c);
106 if(ver.d >= 128)
107 goto fail;
108 }
109 }
110 bufadd(method, 0);
111 bufadd(url, 0);
112 bufadd(ver, 0);
113 req = mkreq(method.b, url.b, ver.b);
114 if(parseheadersb(req, in))
115 goto fail;
116 trimx(req);
117 goto out;
118
119fail:
120 if(req != NULL) {
121 freehthead(req);
122 req = NULL;
123 }
124out:
125 buffree(method);
126 buffree(url);
127 buffree(ver);
128 return(req);
129}
130
131static off_t passdata(struct bufio *in, struct bufio *out, off_t max)
132{
133 ssize_t read;
134 off_t total;
135
136 total = 0;
137 while(!bioeof(in) && ((max < 0) || (total < max))) {
138 if((read = biordata(in)) > 0) {
139 if(max >= 0)
140 read = min(max - total, read);
141 if((read = biowritesome(out, in->rbuf.b + in->rh, read)) < 0)
142 return(-1);
143 in->rh += read;
144 total += read;
145 }
146 if(biorspace(in) && ((max < 0) || (biordata(in) < max - total)) && (biofillsome(in) < 0))
147 return(-1);
148 }
149 return(total);
150}
151
152static int recvchunks(struct bufio *in, struct bufio *out)
153{
154 ssize_t read, chlen;
155 int c, r;
156
157 while(1) {
158 chlen = 0;
159 r = 0;
160 while(1) {
161 c = biogetc(in);
162 if(c == 10) {
163 if(!r)
164 return(-1);
165 break;
166 } else if(c == 13) {
167 } else if((c >= '0') && (c <= '9')) {
168 chlen = (chlen << 4) + (c - '0');
169 r = 1;
170 } else if((c >= 'A') && (c <= 'F')) {
171 chlen = (chlen << 4) + (c + 10 - 'A');
172 r = 1;
173 } else if((c >= 'a') && (c <= 'f')) {
174 chlen = (chlen << 4) + (c + 10 - 'a');
175 r = 1;
176 } else {
177 /* XXX: Technically, there may be chunk extensions to
178 * be read, but since that will likely never actually
179 * happen in practice, I can just as well add support
180 * for that if it actually does become relevant. */
181 return(-1);
182 }
183 }
184 if(chlen == 0)
185 break;
186 while(chlen > 0) {
187 if((read = biordata(in)) > 0) {
188 if((read = biowritesome(out, in->rbuf.b + in->rh, min(read, chlen))) < 0)
189 return(-1);
190 in->rh += read;
191 chlen -= read;
192 }
193 if(biorspace(in) && (biordata(in) < chlen) && (biofillsome(in) <= 0))
194 return(-1);
195 }
196 if((biogetc(in) != 13) || (biogetc(in) != 10))
197 return(-1);
198 }
199 /* XXX: Technically, there may be trailers to be read, but that's
200 * just about as likely as chunk extensions. */
201 if((biogetc(in) != 13) || (biogetc(in) != 10))
202 return(-1);
203 return(0);
204}
205
206static int passchunks(struct bufio *in, struct bufio *out)
207{
208 size_t read;
209
210 while(!bioeof(in)) {
211 if((read = biordata(in)) > 0) {
212 bioprintf(out, "%zx\r\n", read);
213 if(biowrite(out, in->rbuf.b + in->rh, read) != read)
214 return(-1);
215 in->rh += read;
216 bioprintf(out, "\r\n");
217 if(bioflush(out) < 0)
218 return(-1);
219 }
220 if(biorspace(in) && (biofillsome(in) < 0))
221 return(-1);
222 }
223 bioprintf(out, "0\r\n\r\n");
224 return(0);
225}
226
/*
 * Return 1 if head has a header called name whose value equals val,
 * ignoring case, and 0 if the header is missing or has another value.
 */
static int hasheader(struct hthead *head, char *name, char *val)
{
    char *cur = getheader(head, name);

    if(cur == NULL)
        return(0);
    return(strcasecmp(cur, val) == 0);
}
235
236static int canonreq(struct hthead *req)
237{
238 char *p, *p2, *r;
239 int n;
240
241 if(req->url[0] == '/') {
242 replrest(req, req->url + 1);
243 if((p = strchr(req->rest, '?')) != NULL)
244 *p = 0;
245 return(1);
246 }
247 if((p = strstr(req->url, "://")) != NULL) {
248 n = p - req->url;
249 if(((n == 4) && !strncasecmp(req->url, "http", 4)) ||
250 ((n == 5) && !strncasecmp(req->url, "https", 5))) {
251 if(getheader(req, "host"))
252 return(0);
253 p += 3;
254 if((p2 = strchr(p, '/')) == NULL) {
255 headappheader(req, "Host", p);
256 free(req->url);
257 req->url = sstrdup("/");
258 } else {
259 r = sstrdup(p2);
260 *(p2++) = 0;
261 headappheader(req, "Host", p);
262 free(req->url);
263 req->url = r;
264 }
265 replrest(req, req->url + 1);
266 if((p = strchr(req->rest, '?')) != NULL)
267 *p = 0;
268 return(1);
269 }
270 }
271 return(0);
272}
273
/*
 * Decide whether the connection is kept open after an HTTP/1.0
 * exchange.  Any Connection header is removed from resp; if the
 * response did not say "close" and the request asked for
 * "keep-alive", a "Connection: Keep-Alive" header is added to resp
 * instead.
 *
 * Returns 1 if the connection is to be kept open and 0 otherwise.
 */
static int http10keep(struct hthead *req, struct hthead *resp)
{
    int wantclose = hasheader(resp, "connection", "close");

    headrmheader(resp, "connection");
    if(wantclose || !hasheader(req, "connection", "keep-alive"))
        return(0);
    headappheader(resp, "Connection", "Keep-Alive");
    return(1);
}
287
288static char *connid(void)
289{
290 static struct charbuf cur;
291 int i;
292 char *ret;
293
294 for(i = 0; i < cur.d; i++) {
295 if((++cur.b[i]) > 'Z')
296 cur.b[i] = 'A';
297 else
298 goto done;
299 }
300 bufadd(cur, 'A');
301done:
302 ret = memcpy(smalloc(cur.d + 1), cur.b, cur.d);
303 ret[cur.d] = 0;
304 return(ret);
305}
306
307static void passduplex(struct bufio *a, int afd, struct bufio *b, int bfd)
308{
309 struct selected pfd[4], sel;
310 struct bufio *sio;
311 int n, ev;
312
313 while(!bioeof(a) && !bioeof(b)) {
314 biocopybuf(b, a);
315 biocopybuf(a, b);
316 n = 0;
317 if(!a->eof) {
318 ev = 0;
319 if(biorspace(a))
320 ev |= EV_READ;
321 if(biowdata(a))
322 ev |= EV_WRITE;
323 if(ev)
324 pfd[n++] = (struct selected){.fd = afd, .ev = ev};
325 }
326 if(!b->eof) {
327 ev = 0;
328 if(!b->eof && biorspace(b))
329 ev |= EV_READ;
330 if(biowdata(b))
331 ev |= EV_WRITE;
332 if(ev)
333 pfd[n++] = (struct selected){.fd = bfd, .ev = ev};
334 }
335 if((sel = mblock(600, n, pfd)).ev == 0)
336 break;
337 if(sel.fd == afd)
338 sio = a;
339 else if(sel.fd == bfd)
340 sio = b;
341 else
342 break;
343 if((sel.ev & EV_READ) && (biofillsome(sio) < 0))
344 break;
345 if((sel.ev & EV_WRITE) && (bioflushsome(sio) < 0))
346 break;
347 }
348}
349
350void serve(struct bufio *in, int infd, struct conn *conn)
351{
352 int pfds[2];
353 struct bufio *out, *dout;
354 struct stdiofd *outi;
355 struct hthead *req, *resp;
356 char *hd, *id;
357 off_t dlen;
358 int keep, duplex;
359
360 id = connid();
361 out = NULL;
362 req = resp = NULL;
363 while(plex >= 0) {
364 bioflush(in);
365 if((req = parsereq(in)) == NULL)
366 break;
367 if(!canonreq(req))
368 break;
369
370 headappheader(req, "X-Ash-Connection-ID", id);
371 if((conn->initreq != NULL) && conn->initreq(conn, req))
372 break;
373
374 if((plex < 0) || block(plex, EV_WRITE, 60) <= 0)
375 break;
376 if(socketpair(PF_UNIX, SOCK_STREAM, 0, pfds))
377 break;
378 if(sendreq(plex, req, pfds[0]))
379 break;
380 close(pfds[0]);
381 out = mtbioopen(pfds[1], 1, 600, "r+", &outi);
382
383 if(getheader(req, "content-type") != NULL) {
384 if((hd = getheader(req, "content-length")) != NULL) {
385 dlen = atoo(hd);
386 if(dlen > 0) {
387 if(passdata(in, out, dlen) != dlen)
388 break;
389 }
390 } else if(((hd = getheader(req, "transfer-encoding")) != NULL) && !strcasecmp(hd, "chunked")) {
391 if(recvchunks(in, out))
392 break;
393 } else {
394 /* Ignore rather than abort, to be kinder to broken clients. */
395 headrmheader(req, "content-type");
396 }
397 }
398 if(bioflush(out))
399 break;
400 /* Make sure to send EOF */
401 shutdown(pfds[1], SHUT_WR);
402
403 if((resp = parseresponseb(out)) == NULL)
404 break;
405 replstr(&resp->ver, req->ver);
406
407 if(!getheader(resp, "server"))
408 headappheader(resp, "Server", sprintf3("ashd/%s", VERSION));
409 duplex = hasheader(resp, "x-ash-switch", "duplex");
410 trimx(resp);
411
412 if(duplex) {
413 if(outi->rights < 0)
414 break;
415 writerespb(in, resp);
416 bioprintf(in, "\r\n");
417 dout = mtbioopen(outi->rights, 1, 600, "r+", NULL);
418 passduplex(in, infd, dout, outi->rights);
419 outi->rights = -1;
420 bioclose(dout);
421 break;
422 } else if(!strcasecmp(req->ver, "HTTP/1.0")) {
423 if(!strcasecmp(req->method, "head")) {
424 keep = http10keep(req, resp);
425 writerespb(in, resp);
426 bioprintf(in, "\r\n");
427 } else if((hd = getheader(resp, "content-length")) != NULL) {
428 keep = http10keep(req, resp);
429 dlen = atoo(hd);
430 writerespb(in, resp);
431 bioprintf(in, "\r\n");
432 if(passdata(out, in, dlen) != dlen)
433 break;
434 } else {
435 headrmheader(resp, "connection");
436 writerespb(in, resp);
437 bioprintf(in, "\r\n");
438 passdata(out, in, -1);
439 break;
440 }
441 if(!keep)
442 break;
443 } else if(!strcasecmp(req->ver, "HTTP/1.1")) {
444 if(!strcasecmp(req->method, "head")) {
445 writerespb(in, resp);
446 bioprintf(in, "\r\n");
447 } else if((hd = getheader(resp, "content-length")) != NULL) {
448 writerespb(in, resp);
449 bioprintf(in, "\r\n");
450 dlen = atoo(hd);
451 if(passdata(out, in, dlen) != dlen)
452 break;
453 } else if(!getheader(resp, "transfer-encoding")) {
454 headappheader(resp, "Transfer-Encoding", "chunked");
455 writerespb(in, resp);
456 bioprintf(in, "\r\n");
457 if(passchunks(out, in))
458 break;
459 } else {
460 writerespb(in, resp);
461 bioprintf(in, "\r\n");
462 passdata(out, in, -1);
463 break;
464 }
465 if(hasheader(req, "connection", "close") || hasheader(resp, "connection", "close"))
466 break;
467 } else {
468 break;
469 }
470
471 bioclose(out);
472 out = NULL;
473 freehthead(req);
474 freehthead(resp);
475 req = resp = NULL;
476 }
477
478 if(out != NULL)
479 bioclose(out);
480 if(req != NULL)
481 freehthead(req);
482 if(resp != NULL)
483 freehthead(resp);
484 bioclose(in);
485 free(id);
486}
487
488static void plexwatch(struct muth *muth, va_list args)
489{
490 vavar(int, fd);
491 char *buf;
492 int i, s, ret;
493
494 s = 0;
495 while(1) {
496 if(block(fd, EV_READ, 0) == 0)
497 break;
498 buf = smalloc(65536);
499 ret = recv(fd, buf, 65536, 0);
500 if(ret < 0) {
501 flog(LOG_WARNING, "received error on rootplex read channel: %s", strerror(errno));
502 exit(1);
503 } else if(ret == 0) {
504 s = 1;
505 free(buf);
506 break;
507 }
508 /* Maybe I'd like to implement some protocol in this direction
509 * some day... */
510 free(buf);
511 }
512 shutdown(plex, SHUT_RDWR);
513 for(i = 0; i < listeners.d; i++) {
514 if(listeners.b[i] == muth)
515 bufdel(listeners, i);
516 }
517 if(s) {
518 flog(LOG_INFO, "root handler exited, so shutting down listening...");
519 while(listeners.d > 0)
520 resume(listeners.b[0], 0);
521 }
522}
523
524static void initroot(void *uu)
525{
526 int fd;
527
528 setsid();
529 if(daemonize) {
530 chdir("/");
531 if((fd = open("/dev/null", O_RDWR)) >= 0) {
532 dup2(fd, 0);
533 dup2(fd, 1);
534 dup2(fd, 2);
535 close(fd);
536 }
537 }
538 if(usesyslog)
539 putenv("ASHD_USESYSLOG=1");
540 else
541 unsetenv("ASHD_USESYSLOG");
542}
543
/*
 * Write the command-line synopsis to out.
 */
static void usage(FILE *out)
{
    fputs("usage: htparser [-hSf] [-u USER] [-r ROOT] [-p PIDFILE] PORTSPEC... -- ROOT [ARGS...]\n"
          "\twhere PORTSPEC is HANDLER[:PAR[=VAL][(,PAR[=VAL])...]] (try HANDLER:help)\n"
          "\tavailable handlers are `plain' and `ssl'.\n",
          out);
}
550
551static void addport(char *spec)
552{
553 char *nm, *p, *p2, *n;
554 struct charvbuf pars, vals;
555
556 bufinit(pars);
557 bufinit(vals);
558 if((p = strchr(spec, ':')) == NULL) {
559 nm = spec;
560 } else {
561 nm = spec;
562 *(p++) = 0;
563 do {
564 if((n = strchr(p, ',')) != NULL)
565 *(n++) = 0;
566 if((p2 = strchr(p, '=')) != NULL)
567 *(p2++) = 0;
568 if(!*p) {
569 usage(stderr);
570 exit(1);
571 }
572 bufadd(pars, p);
573 if(p2)
574 bufadd(vals, p2);
575 else
576 bufadd(vals, "");
577 } while((p = n) != NULL);
578 }
579
580 /* XXX: It would be nice to decentralize this, but, meh... */
581 if(!strcmp(nm, "plain")) {
582 handleplain(pars.d, pars.b, vals.b);
583#ifdef HAVE_GNUTLS
584 } else if(!strcmp(nm, "ssl")) {
585 handlegnussl(pars.d, pars.b, vals.b);
586#endif
587 } else {
588 flog(LOG_ERR, "htparser: unknown port handler `%s'", nm);
589 exit(1);
590 }
591
592 buffree(pars);
593 buffree(vals);
594}
595
/*
 * Handler installed for SIGINT and SIGTERM by main(): asks the I/O
 * loop to exit with code 1, which main() takes as a request to stop
 * listening or, if that has already happened, to quit.  The signal
 * number is not used.
 */
static void sighandler(int sig)
{
    (void)sig;
    exitioloop(1);
}
600
601int main(int argc, char **argv)
602{
603 int c, d;
604 int i, s1;
605 char *root, *pidfile, *pidtmp;
606 FILE *pidout;
607 struct passwd *pwent;
608
609 daemonize = usesyslog = 0;
610 root = pidfile = NULL;
611 pwent = NULL;
612 while((c = getopt(argc, argv, "+hSfu:r:p:")) >= 0) {
613 switch(c) {
614 case 'h':
615 usage(stdout);
616 exit(0);
617 case 'f':
618 daemonize = 1;
619 break;
620 case 'S':
621 usesyslog = 1;
622 break;
623 case 'u':
624 if(optarg[0] && ((pwent = getpwnam(optarg)) == NULL)) {
625 flog(LOG_ERR, "could not find user %s", optarg);
626 exit(1);
627 }
628 break;
629 case 'r':
630 root = optarg[0] ? optarg : NULL;
631 break;
632 case 'p':
633 pidfile = optarg[0] ? optarg : NULL;
634 break;
635 default:
636 usage(stderr);
637 exit(1);
638 }
639 }
640 s1 = 0;
641 for(i = optind; i < argc; i++) {
642 if(!strcmp(argv[i], "--"))
643 break;
644 s1 = 1;
645 addport(argv[i]);
646 }
647 if(!s1 || (i == argc)) {
648 usage(stderr);
649 exit(1);
650 }
651 if((plex = stdmkchild(argv + ++i, initroot, NULL)) < 0) {
652 flog(LOG_ERR, "could not spawn root multiplexer: %s", strerror(errno));
653 return(1);
654 }
655 bufadd(listeners, mustart(plexwatch, plex));
656 pidout = NULL;
657 if(pidfile != NULL) {
658 pidtmp = sprintf3("%s.new", pidfile);
659 if((pidout = fopen(pidtmp, "w")) == NULL) {
660 flog(LOG_ERR, "could not open %s for writing: %s", pidtmp, strerror(errno));
661 return(1);
662 }
663 if(rename(pidtmp, pidfile)) {
664 flog(LOG_ERR, "could not overwrite %s: %s", pidfile, strerror(errno));
665 unlink(pidtmp);
666 return(1);
667 }
668 }
669 if(usesyslog)
670 opensyslog();
671 if(root) {
672 if(chdir(root) || chroot(root)) {
673 flog(LOG_ERR, "could not chroot to %s: %s", root, strerror(errno));
674 exit(1);
675 }
676 }
677 if(pwent) {
678 if(setgid(pwent->pw_gid)) {
679 flog(LOG_ERR, "could not switch group to %i: %s", (int)pwent->pw_gid, strerror(errno));
680 exit(1);
681 }
682 if(setuid(pwent->pw_uid)) {
683 flog(LOG_ERR, "could not switch user to %i: %s", (int)pwent->pw_uid, strerror(errno));
684 exit(1);
685 }
686 }
687 signal(SIGPIPE, SIG_IGN);
688 signal(SIGCHLD, SIG_IGN);
689 signal(SIGINT, sighandler);
690 signal(SIGTERM, sighandler);
691 if(daemonize) {
692 daemon(0, 0);
693 }
694 if(pidout != NULL) {
695 fprintf(pidout, "%i\n", getpid());
696 fflush(pidout);
697 }
698 d = 0;
699 while(!d) {
700 switch(ioloop()) {
701 case 0:
702 d = 1;
703 break;
704 case 1:
705 if(listeners.d > 0) {
706 while(listeners.d > 0)
707 resume(listeners.b[0], 0);
708 flog(LOG_INFO, "no longer listening");
709 if(pidout != NULL) {
710 putc('\n', pidout);
711 fflush(pidout);
712 }
713 } else {
714 d = 1;
715 }
716 break;
717 }
718 }
719 if(pidout != NULL)
720 ftruncate(fileno(pidout), 0);
721 return(0);
722}