2 * Copyright (c) 2022 Omar Polo <op@omarpolo.com>
3 * Copyright (c) 2006 - 2015 Reyk Floeter <reyk@openbsd.org>
5 * Permission to use, copy, modify, and distribute this software for any
6 * purpose with or without fee is hereby granted, provided that the above
7 * copyright notice and this permission notice appear in all copies.
9 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15 * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
18 #include <sys/types.h>
19 #include <sys/queue.h>
21 #include <sys/socket.h>
24 #include <netinet/in.h>
25 #include <arpa/inet.h>
/*
 * MINIMUM() yields the smaller of its two arguments.  The selected
 * argument is evaluated twice, so do not pass expressions with side
 * effects.
 */
49 #define MINIMUM(a, b) ((a) < (b) ? (a) : (b))
/*
 * G_TOUT() adapts a bufferevent timeout field to the integer taken by
 * proxy_bufferevent_add(): one definition reads the tv_sec member, the
 * other passes the value through unchanged.
 * NOTE(review): presumably selected by a preprocessor conditional on the
 * libevent flavour in use -- confirm.
 */
52 # define G_TOUT(t) ((t).tv_sec)
54 # define G_TOUT(t) (t)
57 /* provided by OpenBSD's base libevent but not in any header? */
58 extern void bufferevent_read_pressure_cb(struct evbuffer *, size_t,
/* Forward declarations of functions defined later in this file. */
61 void proxy_init(struct privsep *, struct privsep_proc *, void *);
62 int proxy_launch(struct galileo *);
63 void proxy_inflight_dec(const char *);
64 int proxy_dispatch_parent(int, struct privsep_proc *, struct imsg *);
65 void proxy_translate_gemtext(struct client *);
66 void proxy_resolved(struct asr_result *, void *);
67 void proxy_connect(int, short, void *);
68 int proxy_start_reply(struct client *, int, const char *);
69 void proxy_read(struct bufferevent *, void *);
70 void proxy_write(struct bufferevent *, void *);
71 void proxy_error(struct bufferevent *, short, void *);
72 int proxy_bufferevent_add(struct event *, int);
/* TLS-aware replacements for the bufferevent read/write event handlers. */
73 void proxy_tls_writecb(int, short, void *);
74 void proxy_tls_readcb(int, short, void *);
/*
 * Peer table handed to proc_run() by proxy(): messages from the parent
 * process are handled by proxy_dispatch_parent().
 */
76 static struct privsep_proc procs[] = {
77 { "parent", PROC_PARENT, proxy_dispatch_parent },
/*
 * Process-wide state.  proxy_inflight is the value reported by
 * proxy_inflight_dec().
 */
80 volatile int proxy_clients;
81 volatile int proxy_inflight;
82 uint32_t proxy_fcg_id;
/*
 * Runs the proxy process through proc_run(), passing the `procs' peer
 * table and proxy_init(); the trailing argument is NULL.
 * NOTE(review): presumably proxy_init is the init callback and NULL is
 * its `arg' parameter -- confirm against proc_run()'s prototype.
 */
85 proxy(struct privsep *ps, struct privsep_proc *p)
87 proc_run(ps, p, procs, nitems(procs), proxy_init, NULL);
/*
 * Initialization hook passed to proc_run(): initializes the configuration
 * held in ps->ps_env (fatal on failure) and then calls pledge(2) with the
 * "stdio recvfd unix inet dns" promises.
 */
91 proxy_init(struct privsep *ps, struct privsep_proc *p, void *arg)
93 if (config_init(ps->ps_env) == -1)
94 fatal("failed to initialize configuration");
96 /* We use a custom shutdown callback */
97 /* p->p_shutdown = proxy_shutdown */
99 if (pledge("stdio recvfd unix inet dns", NULL) == -1)
/*
 * Arms env->sc_evsock (set up in proxy_dispatch_parent() to call
 * fcgi_accept) without a timeout.
 */
104 proxy_launch(struct galileo *env)
106 event_add(&env->sc_evsock, NULL);
111 proxy_purge(struct proxy *pr)
/*
 * Debug-logs the current value of proxy_inflight.
 *
 * why: short human-readable reason, included in the log message.
 */
117 proxy_inflight_dec(const char *why)
120 log_debug("%s: inflight decremented, now %d, %s",
121 __func__, proxy_inflight, why);
/*
 * Handles an imsg received from the parent process, dispatching on
 * imsg->hdr.type.  The visible handlers load a proxy definition
 * (config_getproxy), receive the socket descriptor (config_getsock) and
 * bind it to fcgi_accept, load the configuration (config_getcfg) and
 * process a reset (config_getreset).  Failing to obtain a proxy or the
 * socket is fatal.
 */
125 proxy_dispatch_parent(int fd, struct privsep_proc *p, struct imsg *imsg)
127 struct privsep *ps = p->p_ps;
128 struct galileo *env = ps->ps_env;
130 switch (imsg->hdr.type) {
132 if (config_getproxy(env, imsg) == -1)
133 fatal("config_getproxy");
138 env->sc_sock_fd = config_getsock(env, imsg);
139 if (env->sc_sock_fd == -1)
140 fatal("config_getsock");
/*
 * fcgi_accept runs every time the socket becomes readable (EV_PERSIST
 * keeps the event armed); sc_evpause is a timer that calls the same
 * handler.
 */
142 event_set(&env->sc_evsock, env->sc_sock_fd,
143 EV_READ | EV_PERSIST, fcgi_accept, env);
144 evtimer_set(&env->sc_evpause, fcgi_accept, env);
147 config_getcfg(env, imsg);
153 config_getreset(env, imsg);
/*
 * Translates a single gemtext line into HTML written to the client.
 *
 * Open containers are tracked with flags in clt->clt_translate:
 *   TR_PRE  - inside a preformatted block (between ``` lines)
 *   TR_LIST - inside a <ul> opened for "* " items
 *   TR_NAV  - inside a <nav><ul> opened for "=>" link lines
 * A container is closed as soon as a line of a different kind shows up.
 *
 * Line kinds are tested in this order: preformatted content, list item,
 * link, preformatted toggle, blockquote, headings (### before ## before
 * #) and finally a plain paragraph.  All text is emitted through
 * tp_htmlescape()/tp_urlescape(); write failures are detected by
 * comparing against -1.
 *
 * clt:  client whose output and translation state are updated
 * line: the line to translate; the pointer is advanced locally while
 *       parsing links and the ``` opener
 */
163 gemtext_translate_line(struct client *clt, char *line)
165 /* preformatted line / closing */
166 if (clt->clt_translate & TR_PRE) {
167 if (!strncmp(line, "```", 3)) {
168 clt->clt_translate &= ~TR_PRE;
169 return (tp_pre_close(clt->clt_tp));
172 if (tp_htmlescape(clt->clt_tp, line) == -1)
174 return (clt_putc(clt, '\n'));
/* list item: leave any link list first, then open <ul> on demand */
178 if (!strncmp(line, "* ", 2)) {
179 if (clt->clt_translate & TR_NAV) {
180 if (clt_puts(clt, "</ul></nav>") == -1)
182 clt->clt_translate &= ~TR_NAV;
185 if (!(clt->clt_translate & TR_LIST)) {
186 if (clt_puts(clt, "<ul>") == -1)
188 clt->clt_translate |= TR_LIST;
191 if (clt_puts(clt, "<li>") == -1 ||
192 tp_htmlescape(clt->clt_tp, line + 2) == -1 ||
193 clt_puts(clt, "</li>") == -1)
/* anything that is not a list item terminates an open list */
198 if (clt->clt_translate & TR_LIST) {
199 if (clt_puts(clt, "</ul>") == -1)
201 clt->clt_translate &= ~TR_LIST;
204 /* link -- TODO: relativify from SCRIPT_NAME */
205 if (!strncmp(line, "=>", 2)) {
209 line += strspn(line, " \t");
211 label = line + strcspn(line, " \t");
/*
 * Targets that look like images (matched by file extension) are
 * rendered with tp_figure() outside of the link list.
 */
217 if (fnmatch("*.jpg", line, 0) == 0 ||
218 fnmatch("*.jpeg", line, 0) == 0 ||
219 fnmatch("*.gif", line, 0) == 0 ||
220 fnmatch("*.png", line, 0) == 0 ||
221 fnmatch("*.svg", line, 0) == 0 ||
222 fnmatch("*.webp", line, 0) == 0) {
223 if (clt->clt_translate & TR_NAV) {
224 if (clt_puts(clt, "</ul></nav>") == -1)
226 clt->clt_translate &= ~TR_NAV;
229 if (tp_figure(clt->clt_tp, line, label) == -1)
/* regular link: open the <nav><ul> wrapper on the first one */
235 if (!(clt->clt_translate & TR_NAV)) {
236 if (clt_puts(clt, "<nav><ul>") == -1)
238 clt->clt_translate |= TR_NAV;
241 if (clt_puts(clt, "<li><a href='") == -1)
244 /* XXX: do proper parsing */
/*
 * A target that starts with '/' or contains no "//" is treated as local
 * to the proxied capsule and gets the script name prepended.
 */
245 if (*line == '/' || strstr(line, "//") == NULL) {
246 if (tp_urlescape(clt->clt_tp,
247 clt->clt_script_name) == -1)
250 /* skip the first / */
254 if (tp_urlescape(clt->clt_tp, line) == -1 ||
255 clt_puts(clt, "'>") == -1 ||
256 tp_htmlescape(clt->clt_tp, label) == -1 ||
257 clt_puts(clt, "</a></li>") == -1)
/* anything that is not a link terminates an open link list */
263 if (clt->clt_translate & TR_NAV) {
264 if (clt_puts(clt, "</ul></nav>") == -1)
266 clt->clt_translate &= ~TR_NAV;
/* ``` opens a preformatted block; the rest of the line goes to tp_pre_open() */
270 if (!strncmp(line, "```", 3)) {
272 line += strspn(line, " \t");
274 clt->clt_translate |= TR_PRE;
275 return (tp_pre_open(clt->clt_tp, line));
280 if (clt_puts(clt, "<blockquote>") == -1 ||
281 tp_htmlescape(clt->clt_tp, line + 1) == -1 ||
282 clt_puts(clt, "</blockquote>") == -1)
/* headings: the longest prefix must be tested first */
288 if (!strncmp(line, "###", 3)) {
289 if (clt_puts(clt, "<h3>") == -1 ||
290 tp_htmlescape(clt->clt_tp, line + 3) == -1 ||
291 clt_puts(clt, "</h3>") == -1)
295 if (!strncmp(line, "##", 2)) {
296 if (clt_puts(clt, "<h2>") == -1 ||
297 tp_htmlescape(clt->clt_tp, line + 2) == -1 ||
298 clt_puts(clt, "</h2>") == -1)
302 if (!strncmp(line, "#", 1)) {
303 if (clt_puts(clt, "<h1>") == -1 ||
304 tp_htmlescape(clt->clt_tp, line + 1) == -1 ||
305 clt_puts(clt, "</h1>") == -1)
310 /* Not following strictly the gemini specification... */
315 if (clt_puts(clt, "<p>") == -1 ||
316 tp_htmlescape(clt->clt_tp, line) == -1 ||
317 clt_puts(clt, "</p>") == -1)
/*
 * Pulls a line out of the bufferevent's input buffer with
 * evbuffer_readln() (EVBUFFER_EOL_CRLF) and passes it to
 * gemtext_translate_line().
 */
324 proxy_translate_gemtext(struct client *clt)
326 struct bufferevent *bev = clt->clt_bev;
327 struct evbuffer *src = EVBUFFER_INPUT(bev);
333 line = evbuffer_readln(src, &len, EVBUFFER_EOL_CRLF);
337 r = gemtext_translate_line(clt, line);
/*
 * Searches env->sc_proxies for the proxy whose configured host is exactly
 * `name' (strcmp) and returns a pointer to its configuration.
 * proxy_start_request() treats a NULL result as "unknown server".
 */
344 struct proxy_config *
345 proxy_match(struct galileo *env, const char *name)
352 TAILQ_FOREACH(pr, &env->sc_proxies, pr_entry) {
353 if (!strcmp(name, pr->pr_conf.host))
354 return (&pr->pr_conf);
/*
 * Validates a FastCGI request and starts resolving the upstream Gemini
 * server.
 *
 * Requests are rejected with an HTML error page when PATH_INFO is
 * missing (501), when no proxy matches the server name (501) or when a
 * body length was announced without a body (400).  A redirect URL of the
 * form "<script name><path info>?<body>" may be built and answered with
 * a 302.  Otherwise an asynchronous getaddrinfo lookup for
 * proxy_addr:proxy_port is started, with proxy_resolved() as its
 * callback.
 *
 * Returns the result of fcgi_end_request()/fcgi_abort_request() on the
 * paths that terminate the request.
 */
361 proxy_start_request(struct galileo *env, struct client *clt)
363 struct addrinfo hints;
364 struct asr_query *query;
368 if (clt->clt_path_info == NULL) {
369 log_warnx("PATH_INFO not defined!");
370 if (proxy_start_reply(clt, 501, "text/html") == -1)
372 if (tp_error(clt->clt_tp, -1, "internal server error") == -1)
374 return (fcgi_end_request(clt, 1));
/* remember the matching proxy configuration for the later stages */
377 if ((clt->clt_pc = proxy_match(env, clt->clt_server_name)) == NULL) {
378 if (proxy_start_reply(clt, 501, "text/html") == -1)
380 if (tp_error(clt->clt_tp, -1, "unknown server") == -1)
382 return (fcgi_end_request(clt, 1));
385 if (clt->clt_bodylen != 0 && clt->clt_body == NULL) {
386 if (proxy_start_reply(clt, 400, "text/html") == -1)
388 if (tp_error(clt->clt_tp, -1, "bad request") == -1)
390 return (fcgi_end_request(clt, 1));
/* the request body becomes the query string of the redirect target */
394 r = asprintf(&url, "%s%s?%s", clt->clt_script_name,
395 clt->clt_path_info + 1, clt->clt_body);
397 return (fcgi_end_request(clt, 1));
399 if (proxy_start_reply(clt, 302, url) == -1 ||
400 fcgi_end_request(clt, 1) == -1) {
/* resolve the upstream host; any address family, stream sockets only */
408 memset(&hints, 0, sizeof(hints));
409 hints.ai_family = AF_UNSPEC;
410 hints.ai_socktype = SOCK_STREAM;
412 query = getaddrinfo_async(clt->clt_pc->proxy_addr,
413 clt->clt_pc->proxy_port, &hints, NULL);
415 log_warn("getaddrinfo_async");
416 return (fcgi_abort_request(clt));
419 clt->clt_evasr = event_asr_run(query, proxy_resolved, clt);
420 if (clt->clt_evasr == NULL) {
421 log_warn("event_asr_run");
423 return (fcgi_abort_request(clt));
/*
 * Completion callback for the lookup started in proxy_start_request().
 *
 * On a resolver error the failure is logged and a 501 "Can't resolve
 * host" page is sent.  On success the address list is stored in the
 * client, clt_p is pointed at its first entry and proxy_connect() is
 * called directly to begin connecting.
 *
 * res: resolver result (ar_gai_errno, ar_addrinfo)
 * d:   the struct client registered with event_asr_run()
 */
430 proxy_resolved(struct asr_result *res, void *d)
432 struct client *clt = d;
433 struct proxy_config *pc = clt->clt_pc;
/* the query has completed; clear the stored handle */
435 clt->clt_evasr = NULL;
437 if (res->ar_gai_errno != 0) {
438 log_warnx("failed to resolve %s:%s: %s",
439 pc->proxy_addr, pc->proxy_port,
440 gai_strerror(res->ar_gai_errno));
441 if (proxy_start_reply(clt, 501, "text/html") == -1)
443 if (tp_error(clt->clt_tp, -1, "Can't resolve host") == -1)
445 fcgi_end_request(clt, 1);
449 clt->clt_addrinfo = res->ar_addrinfo;
450 clt->clt_p = clt->clt_addrinfo;
451 proxy_connect(-1, 0, clt);
/*
 * Connects to the upstream server, trying the resolved addresses.
 *
 * The function is called directly by proxy_resolved() and is also
 * registered as the EV_WRITE handler on the connecting socket, so it is
 * re-entered when a pending non-blocking connect finishes or its 5
 * second timer fires.  Once connected it frees the address list, creates
 * the bufferevent, sets up TLS unless the proxy is configured with
 * no_tls, and queues the Gemini request line
 * ("gemini://<name>/<path>[?<query>]\r\n").  On failure a 501
 * "Can't connect" page is sent to the client.
 *
 * fd, ev: libevent callback arguments
 * d:      the struct client being served
 */
455 proxy_connect(int fd, short ev, void *d)
457 struct client *clt = d;
458 struct evbuffer *out;
460 struct tls_config *conf;
461 struct timeval conntv = {5, 0};
463 socklen_t len = sizeof(err);
466 if (clt->clt_p == NULL)
/* a socket already exists: fetch the outcome of its connect via SO_ERROR */
469 if (clt->clt_fd != -1) {
470 if (getsockopt(clt->clt_fd, SOL_SOCKET, SO_ERROR, &err, &len)
481 clt->clt_fd = socket(p->ai_family, p->ai_socktype | SOCK_NONBLOCK,
483 if (clt->clt_fd == -1) {
484 clt->clt_p = clt->clt_p->ai_next;
488 if (connect(clt->clt_fd, p->ai_addr, p->ai_addrlen) == 0)
/* wait for the socket to become writable, then re-enter this function */
491 clt->clt_evconn_live = 1;
492 event_set(&clt->clt_evconn, clt->clt_fd, EV_WRITE, proxy_connect, clt);
493 event_add(&clt->clt_evconn, &conntv);
/* the address list is no longer needed from here on */
497 clt->clt_evconn_live = 0;
498 freeaddrinfo(clt->clt_addrinfo);
499 clt->clt_addrinfo = clt->clt_p = NULL;
501 clt->clt_bev = bufferevent_new(clt->clt_fd, proxy_read, proxy_write,
503 if (clt->clt_bev == NULL) {
504 log_warn("bufferevent_new");
508 if (!clt->clt_pc->no_tls) {
509 /* initialize TLS for Gemini */
510 if ((conf = tls_config_new()) == NULL) {
511 log_warn("tls_config_new failed");
/* NOTE: verification of the server certificate is switched off */
515 tls_config_insecure_noverifycert(conf);
517 if ((clt->clt_ctx = tls_client()) == NULL) {
518 log_warnx("tls_client failed");
519 tls_config_free(conf);
523 if (tls_configure(clt->clt_ctx, conf) == -1) {
524 log_warnx("tls_configure failed");
525 tls_config_free(conf);
529 tls_config_free(conf);
531 if (tls_connect_socket(clt->clt_ctx, clt->clt_fd,
532 clt->clt_pc->proxy_name) == -1) {
533 log_warnx("tls_connect_socket failed");
/* route the bufferevent's socket events through the TLS-aware handlers */
537 event_set(&clt->clt_bev->ev_read, clt->clt_fd, EV_READ,
538 proxy_tls_readcb, clt->clt_bev);
539 event_set(&clt->clt_bev->ev_write, clt->clt_fd, EV_WRITE,
540 proxy_tls_writecb, clt->clt_bev);
543 evbuffer_unfreeze(clt->clt_bev->input, 0);
544 evbuffer_unfreeze(clt->clt_bev->output, 1);
548 /* bufferevent_settimeout(); */
549 bufferevent_enable(clt->clt_bev, EV_READ|EV_WRITE);
551 /* TODO: compute the URL */
/*
 * NOTE(review): proxy_start_request() skips the first byte of
 * clt_path_info when building URLs; if the path begins with '/', the
 * format below yields "//" after the host name -- confirm.
 */
552 out = EVBUFFER_OUTPUT(clt->clt_bev);
553 if (evbuffer_add_printf(out, "gemini://%s/%s",
554 clt->clt_pc->proxy_name, clt->clt_path_info) == -1) {
555 log_warn("bufferevent_printf failed");
559 if (clt->clt_query &&
560 evbuffer_add_printf(out, "?%s", clt->clt_query) == -1) {
561 log_warn("bufferevent_printf failed");
565 if (evbuffer_add(out, "\r\n", 2) == -1) {
566 log_warn("bufferevent_add failed");
/* failure path: log and report the error to the FastCGI client */
573 log_warn("failed to connect to %s:%s",
574 clt->clt_pc->proxy_addr, clt->clt_pc->proxy_port);
575 if (proxy_start_reply(clt, 501, "text/html") == -1)
577 if (tp_error(clt->clt_tp, -1, "Can't connect") == -1)
579 fcgi_end_request(clt, 1);
/*
 * Inspects the MIME type announced by the Gemini server.
 *
 * Only types starting with "text/gemini" are processed further: for them
 * translation is enabled (clt_translate = TR_ENABLED) and the
 * ';'-separated parameters are scanned.  "charset=" values are compared
 * against utf8, utf-8 and ascii; the "lang=" value is copied into `lang'.
 *
 * clt:  client whose translation state is updated
 * mime: MIME string; modified in place by strsep()
 * lang: output buffer for the language parameter
 * len:  size of `lang'; a longer value is logged as "lang too long"
 *
 * proxy_read() treats a return value of -1 as a bad response.
 */
583 parse_mime(struct client *clt, char *mime, char *lang, size_t len)
587 if (strncmp(mime, "text/gemini", 11) != 0)
590 clt->clt_translate = TR_ENABLED;
592 if ((mime = strchr(mime, ';')) == NULL)
596 while ((t = strsep(&mime, ";")) != NULL) {
597 if (!strncmp(t, "charset=", 8)) {
/*
 * NOTE(review): this condition is true when the charset IS one of
 * utf8/utf-8/ascii, yet the branch logs "unknown charset" -- the test
 * looks inverted; confirm.
 */
599 if (!strncasecmp(t, "utf8", 4) ||
600 !strncasecmp(t, "utf-8", 5) ||
601 !strncasecmp(t, "ascii", 5)) {
602 log_debug("unknown charset %s", t);
608 if (!strncmp(t, "lang=", 5)) {
610 if ((semi = strchr(t, ';')) != NULL)
/* strlcpy() returns the source length, so >= len means truncation */
613 if (strlcpy(lang, t, len) >= len) {
614 log_debug("lang too long: %s", t);
/*
 * Writes the response header block to the FastCGI client: a "Status"
 * line, a Content-Security-Policy header and then either a "Location"
 * header or a "Content-Type" header, followed by the empty line that
 * ends the headers.
 *
 * clt:    client to write to
 * status: numeric status for the "Status" header
 * ctype:  content type of the reply; a plain "text/html" is expanded to
 *         "text/html;charset=utf-8".  For redirects the same argument
 *         carries the redirect target instead.
 *
 * Callers treat a return value of -1 as failure.
 */
628 proxy_start_reply(struct client *clt, int status, const char *ctype)
632 csp = "Content-Security-Policy: default-src 'self'; "
633 "script-src 'none'; object-src 'none';\r\n";
636 clt_printf(clt, "Status: %d\r\n", status) == -1)
639 if (clt_puts(clt, csp) == -1)
643 /* use "ctype" as redirect target */
644 if (clt_printf(clt, "Location: %s\r\n", ctype) == -1)
646 if (clt_puts(clt, "\r\n") == -1)
652 if (!strcmp(ctype, "text/html"))
653 ctype = "text/html;charset=utf-8";
654 if (clt_printf(clt, "Content-Type: %s\r\n", ctype)
659 if (clt_puts(clt, "\r\n") == -1)
/*
 * Bufferevent read callback for data coming from the Gemini server.
 *
 * Once the response header has been handled (clt_headersdone), incoming
 * data is either translated from gemtext or forwarded with
 * clt_write_bufferevent().  Before that, the header line is read
 * (strict CRLF), its first two characters are validated as digits and
 * turned into the numeric status `code', and the reply is chosen from
 * it: an input page (tp_inputpage), a 302 redirect, an error page
 * (tp_error) or the start of a successful reply whose MIME type is
 * examined by parse_mime().
 *
 * bev: the upstream bufferevent
 * d:   the struct client being served
 */
666 proxy_read(struct bufferevent *bev, void *d)
668 struct client *clt = d;
669 struct evbuffer *src = EVBUFFER_INPUT(bev);
676 if (clt->clt_headersdone) {
677 if (clt->clt_translate)
678 proxy_translate_gemtext(clt);
680 clt_write_bufferevent(clt, bev);
684 hdr = evbuffer_readln(src, &len, EVBUFFER_EOL_CRLF_STRICT);
/*
 * NOTE(review): 1026 presumably stands for a 1024 byte header limit plus
 * the CRLF terminator -- confirm.
 */
686 if (EVBUFFER_LENGTH(src) >= 1026)
687 proxy_error(bev, EV_READ, clt);
692 !isdigit((unsigned char)hdr[0]) ||
693 !isdigit((unsigned char)hdr[1]) ||
/* NOTE(review): the log message below looks truncated -- confirm. */
695 log_warnx("invalid ");
696 proxy_error(bev, EV_READ, clt);
/* two-digit status code */
700 code = (hdr[0] - '0') * 10 + (hdr[1] - '0');
704 if (proxy_start_reply(clt, 200, "text/html") == -1)
706 if (tp_inputpage(clt->clt_tp, &hdr[3]) == -1)
708 fcgi_end_request(clt, 0);
714 /* XXX: do proper parsing */
/* same "local target" heuristic as the link handling in gemtext_translate_line() */
715 if (hdr[3] == '/' || strstr(&hdr[3], "//") == NULL) {
718 if (asprintf(&url, "%s%s", clt->clt_script_name,
722 if (proxy_start_reply(clt, 302, url)) {
727 fcgi_end_request(clt, 0);
732 if (proxy_start_reply(clt, 501, "text/html") == -1)
734 if (tp_error(clt->clt_tp, code, &hdr[3]) == -1)
736 fcgi_end_request(clt, 1);
/* the meta field starts after the status code and any blanks */
740 mime = hdr + 2 + strspn(hdr + 2, " \t");
741 if (parse_mime(clt, mime, lang, sizeof(lang)) == -1) {
742 if (proxy_start_reply(clt, 501, "text/html") == -1)
744 if (tp_error(clt->clt_tp, -1, "Bad response") == -1)
746 fcgi_end_request(clt, 1);
/* translated gemtext is always served as UTF-8 HTML */
750 if (clt->clt_translate)
751 ctype = "text/html;charset=utf-8";
755 if (clt_printf(clt, "Content-Type: %s\r\n\r\n", ctype) == -1)
758 clt->clt_headersdone = 1;
760 if (clt->clt_translate &&
761 tp_head(clt->clt_tp, lang, NULL) == -1)
765 * Trigger the read again so we proceed with the response
777 proxy_write(struct bufferevent *bev, void *d)
/*
 * Bufferevent error callback; also called directly by proxy_read() on
 * malformed responses.  Finishes the FastCGI request.
 *
 * `status' is 0 when the EVBUFFER_EOF bit is set in `err' and 1
 * otherwise.  If no response header was processed yet, a 501
 * "Proxy error" page is produced.  Otherwise, when status is 0, any HTML
 * container still open from the gemtext translation (preformatted block,
 * list, link list) is closed and the page footer is written.  The
 * request is then ended with fcgi_end_request(clt, status).
 *
 * bev: the upstream bufferevent
 * err: event flags describing the condition
 * d:   the struct client being served
 */
783 proxy_error(struct bufferevent *bev, short err, void *d)
785 struct client *clt = d;
786 int status = !(err & EVBUFFER_EOF);
788 log_debug("proxy error, shutting down the connection (err: %x)",
791 if (!clt->clt_headersdone) {
792 if (proxy_start_reply(clt, 501, "text/html") == -1)
794 if (tp_error(clt->clt_tp, -1, "Proxy error") == -1)
796 } else if (status == 0) {
797 if (clt->clt_translate & TR_PRE) {
798 if (tp_pre_close(clt->clt_tp))
800 clt->clt_translate &= ~TR_PRE;
803 if (clt->clt_translate & TR_LIST) {
804 if (clt_puts(clt, "</ul>") == -1)
806 clt->clt_translate &= ~TR_LIST;
809 if (clt->clt_translate & TR_NAV) {
810 if (clt_puts(clt, "</ul></nav>") == -1)
812 clt->clt_translate &= ~TR_NAV;
815 if (clt->clt_translate &&
816 tp_foot(clt->clt_tp) == -1)
820 fcgi_end_request(clt, status);
/*
 * Read event handler installed by proxy_connect() on the bufferevent
 * when TLS is in use.
 *
 * Reads through tls_read() into a stack buffer of IBUF_READ_SIZE bytes
 * (less if the read high watermark is smaller), appends the data to
 * bufev->input, re-arms the read event and, subject to the watermarks,
 * invokes the bufferevent's read callback.  Timeouts, TLS errors, EOF
 * and buffer failures are accumulated as EVBUFFER_* bits in `what' and
 * reported through the bufferevent's error callback.
 *
 * fd:    socket descriptor
 * event: libevent event flags; EV_TIMEOUT is handled as a timeout
 * arg:   the struct bufferevent (its cbarg is the struct client)
 */
824 proxy_tls_readcb(int fd, short event, void *arg)
826 struct bufferevent *bufev = arg;
827 struct client *clt = bufev->cbarg;
828 char rbuf[IBUF_READ_SIZE];
829 int what = EVBUFFER_READ;
830 int howmuch = IBUF_READ_SIZE;
834 if (event == EV_TIMEOUT) {
835 what |= EVBUFFER_TIMEOUT;
/* never read more than the high watermark allows */
839 if (bufev->wm_read.high != 0)
840 howmuch = MINIMUM(sizeof(rbuf), bufev->wm_read.high);
842 ret = tls_read(clt->clt_ctx, rbuf, howmuch);
843 if (ret == TLS_WANT_POLLIN || ret == TLS_WANT_POLLOUT) {
845 } else if (ret == -1) {
846 what |= EVBUFFER_ERROR;
852 what |= EVBUFFER_EOF;
856 if (evbuffer_add(bufev->input, rbuf, len) == -1) {
857 what |= EVBUFFER_ERROR;
861 proxy_bufferevent_add(&bufev->ev_read, G_TOUT(bufev->timeout_read));
863 len = EVBUFFER_LENGTH(bufev->input);
864 if (bufev->wm_read.low != 0 && len < bufev->wm_read.low)
/*
 * Above the high watermark: stop reading and install
 * bufferevent_read_pressure_cb as the input buffer's callback.
 */
866 if (bufev->wm_read.high != 0 && len > bufev->wm_read.high) {
867 struct evbuffer *buf = bufev->input;
868 event_del(&bufev->ev_read);
869 evbuffer_setcb(buf, bufferevent_read_pressure_cb, bufev);
873 if (bufev->readcb != NULL)
874 (*bufev->readcb)(bufev, bufev->cbarg);
878 proxy_bufferevent_add(&bufev->ev_read, G_TOUT(bufev->timeout_read));
882 (*bufev->errorcb)(bufev, what, bufev->cbarg);
/*
 * Arms `ev' with event_add() and returns its result.  `ptv' starts out
 * as NULL, which means no timeout.
 *
 * ev:      event to add
 * timeout: timeout value, as produced by G_TOUT()
 */
886 proxy_bufferevent_add(struct event *ev, int timeout)
888 struct timeval tv, *ptv = NULL;
896 return (event_add(ev, ptv));
/*
 * Write event handler installed by proxy_connect() on the bufferevent
 * when TLS is in use.
 *
 * Writes the pending contents of bufev->output through tls_write(),
 * drains what was written, re-arms the write event while data remains
 * and invokes the bufferevent's write callback once the output buffer is
 * at or below the low write watermark.  Timeouts and TLS errors are
 * accumulated as EVBUFFER_* bits in `what' and reported through the
 * bufferevent's error callback.
 *
 * fd:    socket descriptor
 * event: libevent event flags; EV_TIMEOUT is handled as a timeout
 * arg:   the struct bufferevent (its cbarg is the struct client)
 */
900 proxy_tls_writecb(int fd, short event, void *arg)
902 struct bufferevent *bufev = arg;
903 struct client *clt = bufev->cbarg;
905 short what = EVBUFFER_WRITE;
908 if (event == EV_TIMEOUT) {
909 what |= EVBUFFER_TIMEOUT;
913 if (EVBUFFER_LENGTH(bufev->output)) {
914 ret = tls_write(clt->clt_ctx,
915 EVBUFFER_DATA(bufev->output),
916 EVBUFFER_LENGTH(bufev->output));
917 if (ret == TLS_WANT_POLLIN || ret == TLS_WANT_POLLOUT) {
919 } else if (ret == -1) {
920 what |= EVBUFFER_ERROR;
924 evbuffer_drain(bufev->output, len);
/* keep the write event armed while output is still pending */
927 if (EVBUFFER_LENGTH(bufev->output) != 0)
928 proxy_bufferevent_add(&bufev->ev_write,
929 G_TOUT(bufev->timeout_write));
931 if (bufev->writecb != NULL &&
932 EVBUFFER_LENGTH(bufev->output) <= bufev->wm_write.low)
933 (*bufev->writecb)(bufev, bufev->cbarg);
937 proxy_bufferevent_add(&bufev->ev_write, G_TOUT(bufev->timeout_write));
941 (*bufev->errorcb)(bufev, what, bufev->cbarg);
945 proxy_client_free(struct client *clt)
948 event_asr_abort(clt->clt_evasr);
950 if (clt->clt_addrinfo)
951 freeaddrinfo(clt->clt_addrinfo);
953 if (clt->clt_evconn_live)
954 event_del(&clt->clt_evconn);
956 if (clt->clt_fd != -1)
960 tls_free(clt->clt_ctx);
963 bufferevent_free(clt->clt_bev);
965 template_free(clt->clt_tp);
968 free(clt->clt_server_name);
969 free(clt->clt_script_name);
970 free(clt->clt_path_info);
971 free(clt->clt_query);