gmid/gmid.c

735 lines
13 KiB
C
Raw Normal View History

2020-10-02 19:39:00 +02:00
/*
* Copyright (c) 2020 Omar Polo <op@omarpolo.com>
*
* Permission to use, copy, modify, and distribute this software for any
* purpose with or without fee is hereby granted, provided that the above
* copyright notice and this permission notice appear in all copies.
*
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
*/
#include <sys/mman.h>
2020-10-02 19:39:00 +02:00
#include <sys/socket.h>
#include <sys/stat.h>
#include <netinet/in.h>
#include <assert.h>
#include <err.h>
#include <errno.h>
2020-10-02 19:39:00 +02:00
#include <fcntl.h>
#include <poll.h>
#include <signal.h>
2020-10-02 19:39:00 +02:00
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <tls.h>
#include <unistd.h>
#ifndef __OpenBSD__
# define pledge(a, b) 0
# define unveil(a, b) 0
#endif /* __OpenBSD__ */
#ifndef INFTIM
# define INFTIM -1
#endif /* INFTIM */
2020-10-02 19:39:00 +02:00
#define GEMINI_URL_LEN (1024+3) /* URL max len + \r\n + \0 */
2020-10-03 18:25:31 +02:00
/* large enough to hold a copy of a gemini URL and still have extra room */
2020-10-07 13:56:24 +02:00
#define PATHBUF 2048
2020-10-02 19:39:00 +02:00
#define SUCCESS 20
#define NOT_FOUND 51
#define BAD_REQUEST 59
#ifndef MAX_USERS
#define MAX_USERS 64
#endif
enum {
S_OPEN,
S_INITIALIZING,
S_SENDING,
S_CLOSING,
};
struct client {
struct tls *ctx;
int state;
int code;
const char *meta;
int fd;
void *buf, *i;
ssize_t len, off;
};
struct etm { /* file extension to mime */
const char *mime;
const char *ext;
} filetypes[] = {
{"application/pdf", "pdf"},
{"image/gif", "gif"},
{"image/jpeg", "jpg"},
{"image/jpeg", "jpeg"},
{"image/png", "png"},
{"image/svg+xml", "svg"},
{"text/gemini", "gemini"},
{"text/gemini", "gmi"},
{"text/markdown", "markdown"},
{"text/markdown", "md"},
{"text/plain", "txt"},
2020-11-06 10:45:06 +01:00
{"text/xml", "xml"},
{NULL, NULL}
};
2020-10-02 19:39:00 +02:00
int dirfd;
char *url_after_proto(char*);
char *url_start_of_request(char*);
int url_trim(char*);
void adjust_path(char*);
int path_isdir(char*);
ssize_t filesize(int);
int start_reply(struct pollfd*, struct client*, int, const char*);
int isdir(int);
const char *path_ext(const char*);
const char *mime(const char*);
int open_file(char*, struct pollfd*, struct client*);
void send_file(char*, struct pollfd*, struct client*);
void send_dir(char*, struct pollfd*, struct client*);
void handle(struct pollfd*, struct client*);
void mark_nonblock(int);
int make_soket(int);
void do_accept(int, struct tls*, struct pollfd*, struct client*);
void goodbye(struct pollfd*, struct client*);
void loop(struct tls*, int);
void usage(const char*);
2020-10-02 19:39:00 +02:00
char *
url_after_proto(char *url)
{
char *s;
const char *proto = "gemini";
const char *marker = "://";
if ((s = strstr(url, marker)) == NULL)
return url;
/* not a gemini:// URL */
if (s - strlen(proto) < url)
return NULL;
/* TODO: */
/* if (strcmp(s - strlen(proto), proto)) */
/* return NULL; */
/* a valid gemini:// URL */
return s + strlen(marker);
}
char *
url_start_of_request(char *url)
{
char *s, *t;
if ((s = url_after_proto(url)) == NULL)
return NULL;
if ((t = strstr(s, "/")) == NULL)
return s + strlen(s);
return t;
}
int
url_trim(char *url)
{
const char *e = "\r\n";
char *s;
if ((s = strstr(url, e)) == NULL)
return 0;
s[0] = '\0';
s[1] = '\0';
if (s[2] != '\0') {
2020-10-03 18:25:31 +02:00
fprintf(stderr, "the request was longer than 1024 bytes\n");
2020-10-02 19:39:00 +02:00
return 0;
}
return 1;
}
void
adjust_path(char *path)
{
char *s;
size_t len;
/* /.. -> / */
2020-10-02 19:39:00 +02:00
len = strlen(path);
if (len >= 3) {
if (!strcmp(&path[len-3], "/..")) {
path[len-2] = '\0';
}
}
/* if the path is only `..` trim out and exit */
if (!strcmp(path, "..")) {
path[0] = '\0';
return;
}
/* remove every ../ in the path */
while (1) {
if ((s = strstr(path, "../")) == NULL)
return;
memmove(s, s+3, strlen(s)+1); /* copy also the \0 */
2020-10-02 19:39:00 +02:00
}
}
int
path_isdir(char *path)
{
if (*path == '\0')
return 1;
2020-10-03 18:25:31 +02:00
return path[strlen(path)-1] == '/';
2020-10-02 19:39:00 +02:00
}
int
start_reply(struct pollfd *pfd, struct client *client, int code, const char *reason)
2020-10-02 19:39:00 +02:00
{
char buf[1030] = {0}; /* status + ' ' + max reply len + \r\n\0 */
int len;
int ret;
client->code = code;
client->meta = reason;
client->state = S_INITIALIZING;
2020-10-02 19:39:00 +02:00
len = snprintf(buf, sizeof(buf), "%d %s\r\n", code, reason);
assert(len < (int)sizeof(buf));
ret = tls_write(client->ctx, buf, len);
if (ret == TLS_WANT_POLLIN) {
pfd->events = POLLIN;
return 0;
}
if (ret == TLS_WANT_POLLOUT) {
pfd->events = POLLOUT;
return 0;
}
return 1;
2020-10-02 19:39:00 +02:00
}
int
isdir(int fd)
{
struct stat sb;
if (fstat(fd, &sb) == -1) {
warn("fstat");
2020-10-03 18:25:31 +02:00
return 1; /* we'll probably fail later on anyway */
2020-10-02 19:39:00 +02:00
}
return S_ISDIR(sb.st_mode);
}
ssize_t
filesize(int fd)
{
ssize_t len;
if ((len = lseek(fd, 0, SEEK_END)) == -1)
return -1;
if (lseek(fd, 0, SEEK_SET) == -1)
return -1;
return len;
}
const char *
path_ext(const char *path)
{
const char *end;
end = path + strlen(path)-1; /* the last byte before the NUL */
for (; end != path; --end) {
if (*end == '.')
return end+1;
if (*end == '/')
break;
}
return NULL;
}
const char *
mime(const char *path)
{
const char *ext, *def = "application/octet-stream";
struct etm *t;
if ((ext = path_ext(path)) == NULL)
return def;
for (t = filetypes; t->mime != NULL; ++t)
if (!strcmp(ext, t->ext))
return t->mime;
return def;
}
int
open_file(char *path, struct pollfd *fds, struct client *c)
2020-10-02 19:39:00 +02:00
{
char fpath[PATHBUF];
assert(path != NULL);
2020-10-02 19:39:00 +02:00
bzero(fpath, sizeof(fpath));
2020-10-02 19:39:00 +02:00
if (*path != '.')
fpath[0] = '.';
strlcat(fpath, path, PATHBUF);
2020-10-02 19:39:00 +02:00
if ((c->fd = openat(dirfd, fpath, O_RDONLY | O_NOFOLLOW)) == -1) {
warn("open: %s", fpath);
if (!start_reply(fds, c, NOT_FOUND, "not found"))
return 0;
goodbye(fds, c);
return 0;
}
2020-10-02 19:39:00 +02:00
if (isdir(c->fd)) {
warnx("%s is a directory, trying %s/index.gmi", fpath, fpath);
close(c->fd);
c->fd = -1;
send_dir(fpath, fds, c);
return 0;
}
if ((c->len = filesize(c->fd)) == -1) {
warn("filesize: %s", fpath);
goodbye(fds, c);
return 0;
}
if ((c->buf = mmap(NULL, c->len, PROT_READ, MAP_PRIVATE,
c->fd, 0)) == MAP_FAILED) {
warn("mmap: %s", fpath);
goodbye(fds, c);
return 0;
}
c->i = c->buf;
return start_reply(fds, c, SUCCESS, mime(fpath));
}
2020-10-02 19:39:00 +02:00
void
send_file(char *path, struct pollfd *fds, struct client *c)
{
ssize_t ret, len;
if (c->fd == -1) {
if (!open_file(path, fds, c))
return;
c->state = S_SENDING;
}
len = (c->buf + c->len) - c->i;
while (len > 0) {
switch (ret = tls_write(c->ctx, c->i, len)) {
case -1:
warnx("tls_write: %s", tls_error(c->ctx));
goodbye(fds, c);
return;
2020-10-02 19:39:00 +02:00
case TLS_WANT_POLLIN:
fds->events = POLLIN;
return;
case TLS_WANT_POLLOUT:
fds->events = POLLOUT;
return;
default:
c->i += ret;
len -= ret;
break;
2020-10-02 19:39:00 +02:00
}
}
goodbye(fds, c);
2020-10-02 19:39:00 +02:00
}
void
send_dir(char *path, struct pollfd *fds, struct client *client)
2020-10-02 19:39:00 +02:00
{
char fpath[PATHBUF];
size_t len;
bzero(fpath, PATHBUF);
2020-10-14 09:21:59 +02:00
if (path[0] != '.')
2020-10-02 19:39:00 +02:00
fpath[0] = '.';
/* this cannot fail since sizeof(fpath) > maxlen of path */
strlcat(fpath, path, PATHBUF);
len = strlen(fpath);
/* add a trailing / in case. */
if (fpath[len-1] != '/') {
fpath[len] = '/';
}
strlcat(fpath, "index.gmi", sizeof(fpath));
send_file(fpath, fds, client);
2020-10-02 19:39:00 +02:00
}
void
handle(struct pollfd *fds, struct client *client)
2020-10-02 19:39:00 +02:00
{
char buf[GEMINI_URL_LEN];
2020-10-02 19:39:00 +02:00
char *path;
switch (client->state) {
case S_OPEN:
bzero(buf, GEMINI_URL_LEN);
switch (tls_read(client->ctx, buf, sizeof(buf)-1)) {
case -1:
warnx("tls_read: %s", tls_error(client->ctx));
goodbye(fds, client);
return;
2020-10-02 19:39:00 +02:00
case TLS_WANT_POLLIN:
fds->events = POLLIN;
return;
2020-10-02 19:39:00 +02:00
case TLS_WANT_POLLOUT:
fds->events = POLLOUT;
return;
}
if (!url_trim(buf)) {
if (!start_reply(fds, client, BAD_REQUEST, "bad request"))
return;
goodbye(fds, client);
return;
}
if ((path = url_start_of_request(buf)) == NULL) {
if (!start_reply(fds, client, BAD_REQUEST, "bad request"))
return;
goodbye(fds, client);
return;
}
adjust_path(path);
fprintf(stderr, "requested path: %s\n", path);
2020-10-02 19:39:00 +02:00
if (path_isdir(path))
send_dir(path, fds, client);
else
send_file(path, fds, client);
break;
case S_INITIALIZING:
if (!start_reply(fds, client, client->code, client->meta))
return;
if (client->code != SUCCESS) {
/* we don't need a body */
goodbye(fds, client);
return;
}
2020-10-02 19:39:00 +02:00
client->state = S_SENDING;
/* fallthrough */
case S_SENDING:
send_file(NULL, fds, client);
break;
case S_CLOSING:
goodbye(fds, client);
break;
default:
/* unreachable */
abort();
}
}
void
mark_nonblock(int fd)
{
int flags;
if ((flags = fcntl(fd, F_GETFL)) == -1)
err(1, "fcntl(F_GETFL)");
if (fcntl(fd, F_SETFL, flags | O_NONBLOCK) == -1)
err(1, "fcntl(F_SETFL)");
2020-10-02 19:39:00 +02:00
}
int
make_socket(int port, int family)
2020-10-02 19:39:00 +02:00
{
int sock, v;
struct sockaddr_in addr4;
struct sockaddr_in6 addr6;
struct sockaddr *addr;
socklen_t len;
switch (family) {
case AF_INET:
bzero(&addr4, sizeof(addr4));
addr4.sin_family = family;
addr4.sin_port = htons(port);
addr4.sin_addr.s_addr = INADDR_ANY;
addr = (struct sockaddr*)&addr4;
len = sizeof(addr4);
break;
case AF_INET6:
bzero(&addr6, sizeof(addr6));
addr6.sin6_family = AF_INET6;
addr6.sin6_port = htons(port);
addr6.sin6_addr = in6addr_any;
addr = (struct sockaddr*)&addr6;
len = sizeof(addr6);
break;
2020-10-02 19:39:00 +02:00
default:
/* unreachable */
abort();
}
if ((sock = socket(family, SOCK_STREAM, 0)) == -1)
err(1, "socket");
2020-10-02 19:39:00 +02:00
v = 1;
if (setsockopt(sock, SOL_SOCKET, SO_REUSEADDR, &v, sizeof(v)) == -1)
err(1, "setsockopt(SO_REUSEADDR)");
v = 1;
if (setsockopt(sock, SOL_SOCKET, SO_REUSEPORT, &v, sizeof(v)) == -1)
err(1, "setsockopt(SO_REUSEPORT)");
mark_nonblock(sock);
if (bind(sock, addr, len) == -1)
err(1, "bind");
2020-10-02 19:39:00 +02:00
if (listen(sock, 16) == -1)
err(1, "listen");
2020-10-02 19:39:00 +02:00
return sock;
}
void
do_accept(int sock, struct tls *ctx, struct pollfd *fds, struct client *clients)
2020-10-02 19:39:00 +02:00
{
int i, fd;
struct sockaddr_in addr;
2020-10-02 19:39:00 +02:00
socklen_t len;
len = sizeof(addr);
if ((fd = accept(sock, (struct sockaddr*)&addr, &len)) == -1) {
if (errno == EWOULDBLOCK)
return;
err(1, "accept");
}
2020-10-02 19:39:00 +02:00
mark_nonblock(fd);
2020-10-02 19:39:00 +02:00
for (i = 0; i < MAX_USERS; ++i) {
if (fds[i].fd == -1) {
bzero(&clients[i], sizeof(struct client));
if (tls_accept_socket(ctx, &clients[i].ctx, fd) == -1)
break; /* goodbye fd! */
fds[i].fd = fd;
fds[i].events = POLLIN;
clients[i].state = S_OPEN;
clients[i].fd = -1;
clients[i].buf = MAP_FAILED;
return;
2020-10-02 19:39:00 +02:00
}
}
2020-10-02 19:39:00 +02:00
close(fd);
}
void
goodbye(struct pollfd *pfd, struct client *c)
{
ssize_t ret;
2020-10-02 19:39:00 +02:00
c->state = S_CLOSING;
ret = tls_close(c->ctx);
if (ret == TLS_WANT_POLLIN) {
pfd->events = POLLIN;
return;
}
if (ret == TLS_WANT_POLLOUT) {
pfd->events = POLLOUT;
return;
}
tls_free(c->ctx);
c->ctx = NULL;
if (c->buf != MAP_FAILED)
munmap(c->buf, c->len);
if (c->fd != -1)
close(c->fd);
close(pfd->fd);
pfd->fd = -1;
}
void
loop(struct tls *ctx, int sock)
{
int i, todo;
struct client clients[MAX_USERS];
struct pollfd fds[MAX_USERS];
for (i = 0; i < MAX_USERS; ++i) {
fds[i].fd = -1;
fds[i].events = POLLIN;
bzero(&clients[i], sizeof(struct client));
}
fds[0].fd = sock;
for (;;) {
if ((todo = poll(fds, MAX_USERS, INFTIM)) == -1)
err(1, "poll");
for (i = 0; i < MAX_USERS; i++) {
assert(i < MAX_USERS);
if (fds[i].revents == 0)
continue;
if (fds[i].revents & (POLLERR|POLLNVAL))
err(1, "bad fd %d", fds[i].fd);
if (fds[i].revents & POLLHUP) {
goodbye(&fds[i], &clients[i]);
continue;
}
todo--;
if (i == 0) { /* new client */
do_accept(sock, ctx, fds, clients);
continue;
}
handle(&fds[i], &clients[i]);
}
2020-10-02 19:39:00 +02:00
}
}
void
usage(const char *me)
{
fprintf(stderr,
"USAGE: %s [-h] [-c cert.pem] [-d docs] [-k key.pem]\n",
me);
}
int
main(int argc, char **argv)
{
const char *cert = "cert.pem", *key = "key.pem", *dir = "docs";
struct tls *ctx = NULL;
struct tls_config *conf;
int sock, ch;
signal(SIGPIPE, SIG_IGN);
2020-10-02 19:39:00 +02:00
while ((ch = getopt(argc, argv, "c:d:hk:")) != -1) {
switch (ch) {
case 'c':
cert = optarg;
break;
case 'd':
dir = optarg;
break;
case 'h':
usage(*argv);
return 0;
case 'k':
key = optarg;
break;
default:
usage(*argv);
return 1;
}
}
if ((conf = tls_config_new()) == NULL)
err(1, "tls_config_new");
if (tls_config_set_protocols(conf,
TLS_PROTOCOL_TLSv1_2 | TLS_PROTOCOL_TLSv1_3) == -1)
err(1, "tls_config_set_protocols");
2020-10-03 18:25:31 +02:00
if (tls_config_set_cert_file(conf, cert) == -1)
err(1, "tls_config_set_cert_file: %s", cert);
2020-10-02 19:39:00 +02:00
2020-10-03 18:25:31 +02:00
if (tls_config_set_key_file(conf, key) == -1)
err(1, "tls_config_set_key_file: %s", key);
2020-10-02 19:39:00 +02:00
if ((ctx = tls_server()) == NULL)
err(1, "tls_server");
if (tls_configure(ctx, conf) == -1)
errx(1, "tls_configure: %s", tls_error(ctx));
sock = make_socket(1965, AF_INET);
2020-10-02 19:39:00 +02:00
if ((dirfd = open(dir, O_RDONLY | O_DIRECTORY)) == -1)
err(1, "open: %s", dir);
if (unveil(dir, "r") == -1)
err(1, "unveil");
if (pledge("stdio rpath inet", "") == -1)
err(1, "pledge");
loop(ctx, sock);
close(sock);
tls_free(ctx);
tls_config_free(conf);
}