vger/main.c

527 lines
13 KiB
C
Raw Normal View History

#include <sys/types.h>
#include <sys/stat.h>
#include <sys/wait.h>
2020-12-05 05:31:13 +11:00
2021-03-02 20:06:09 +11:00
#include <ctype.h>
#include <dirent.h>
2020-12-04 08:59:39 +11:00
#include <err.h>
#include <errno.h>
#include <fcntl.h>
#include <limits.h>
2020-12-04 08:59:39 +11:00
#include <pwd.h>
2020-12-05 04:55:31 +11:00
#include <stdarg.h>
2020-12-02 09:39:05 +11:00
#include <stdio.h>
2020-12-04 08:59:39 +11:00
#include <stdlib.h>
2020-12-02 09:39:05 +11:00
#include <string.h>
2020-12-05 04:55:31 +11:00
#include <syslog.h>
2020-12-02 09:39:05 +11:00
#include <unistd.h>
2020-12-05 05:29:44 +11:00
#include "mimes.h"
#include "opts.h"
#include "utils.h"
2020-12-02 09:39:05 +11:00
/* length of "gemini://" */
2020-12-02 09:39:05 +11:00
#define GEMINI_PART 9
2021-10-21 20:41:22 +11:00
/*
* number of bytes to read with fgets() : 1024 + 1.
* fgets() reads at most size-1 (1024 here).
* See https://gemini.circumlunar.space/docs/specification.html.
*/
#define GEMINI_REQUEST_MAX 1025
2020-12-02 09:39:05 +11:00
2021-10-21 20:41:22 +11:00
/* Forward declarations for the functions defined further down in this file. */
void	 autoindex(const char *path);
void	 cgi(const char *cgicmd);
void	 display_file(const char *fname);
void	 drop_privileges(const char *user, const char *path);
void	 echdir(const char *path);
void	 status(const int code, const char *file_mime);
void	 status_redirect(const int code, const char *url);
void	 status_error(const int code, const char *reason);
int	 uridecode(char *uri);
2021-03-02 20:06:09 +11:00
/*
 * chdir() into path. On failure, send a Gemini error status chosen from
 * errno (51 for a missing path, 50 otherwise) and then report through
 * errlog().
 */
void
echdir(const char *path)
{
	int		 code = 50;
	const char	*reason = "Internal server error";

	/* nothing more to do when the directory change succeeded */
	if (chdir(path) != -1)
		return;

	if (errno == ENOTDIR || errno == ENOENT) {
		code = 51;
		reason = "file not found";
	} else if (errno == EACCES) {
		reason = "Forbidden path";
	}

	status_error(code, reason);
	errlog("failed to chdir(%s)", path);
}
2021-03-02 20:06:09 +11:00
/*
 * Percent-decode uri in place.
 *
 * Every "%XY" sequence where X and Y are hexadecimal digits is replaced by
 * the byte it encodes and the rest of the string is shifted left by two.
 * A '%' that is not followed by two hexadecimal digits is left untouched
 * (it used to be turned into a NUL byte, silently truncating the string).
 * Decoding stops at the first '%' that has fewer than two characters after
 * it.
 *
 * Returns the number of sequences that were decoded.
 */
int
uridecode(char *uri)
{
	int	 n = 0;
	char	*pos = uri;

	while ((pos = strchr(pos, '%')) != NULL) {
		/* not enough room left for two hex digits */
		if (pos[1] == '\0' || pos[2] == '\0')
			return n;

		/*
		 * <ctype.h> functions need a value representable as
		 * unsigned char, hence the casts.
		 */
		if (!isxdigit((unsigned char)pos[1]) ||
		    !isxdigit((unsigned char)pos[2])) {
			pos++;	/* skip this '%', keep it literally */
			continue;
		}

		char hex[3] = {pos[1], pos[2], '\0'};

		/* both digits were validated, so strtol() cannot fail */
		pos[0] = (char)strtol(hex, NULL, 16);

		/* drop the two hex digits; +1 copies the trailing \0 */
		memmove(pos + 1, pos + 3, strlen(pos + 3) + 1);
		n++;
		pos++;		/* resume after the decoded byte */
	}

	return n;
}
2020-12-10 07:12:25 +11:00
2020-12-02 09:39:05 +11:00
void
drop_privileges(const char *user, const char *path)
2020-12-02 09:39:05 +11:00
{
struct passwd *pw;
2020-12-06 00:44:59 +11:00
/*
* use chroot() if an user is specified requires root user to be
* running the program to run chroot() and then drop privileges
*/
if (strlen(user) > 0) {
2020-12-06 00:44:59 +11:00
/* is root? */
2021-10-21 20:41:22 +11:00
if (getuid() != 0)
errlog("chroot requires program to be run as root");
/* search user uid from name */
2021-10-21 20:41:22 +11:00
if ((pw = getpwnam(user)) == NULL)
errlog("the user %s can't be found on the system", user);
/* chroot worked? */
2021-10-21 20:41:22 +11:00
if (chroot(path) != 0)
errlog("the chroot_dir %s can't be used for chroot", path);
chrooted = 1;
echdir("/");
/* drop privileges */
#if defined (__OpenBSD__) || defined(__FreeBSD__)
2020-12-05 05:39:16 +11:00
if (setgroups(1, &pw->pw_gid) ||
setresgid(pw->pw_gid, pw->pw_gid, pw->pw_gid) ||
setresuid(pw->pw_uid, pw->pw_uid, pw->pw_uid)) {
errlog("dropping privileges to user %s (uid=%i) failed",
user, pw->pw_uid);
}
#else
if (setgroups(1, &pw->pw_gid) ||
setgid(pw->pw_gid) ||
setuid(pw->pw_uid)) {
errlog("dropping privileges to user %s (uid=%i) failed",
user, pw->pw_uid);
}
#endif
}
#ifdef __OpenBSD__
/*
* prevent access to files other than the one in path
*/
2021-10-21 20:41:22 +11:00
if (chrooted)
eunveil("/", "r");
else
eunveil(path, "r");
/* permission to execute what's inside cgidir */
2021-10-21 20:41:22 +11:00
if (strlen(cgidir) > 0)
eunveil(cgidir, "rx");
eunveil(NULL, NULL); /* no more call to unveil() */
/* promise permissions */
2021-10-21 20:41:22 +11:00
if (strlen(cgidir) > 0)
epledge("stdio rpath exec", NULL);
else
epledge("stdio rpath", NULL);
#endif
2021-10-21 20:41:22 +11:00
if (!chrooted)
echdir(path); /* move to the gemini data directory */
2020-12-02 09:39:05 +11:00
}
2020-12-03 05:59:52 +11:00
void
status(const int code, const char *file_mime)
2020-12-03 05:59:52 +11:00
{
2021-10-21 20:41:22 +11:00
if (strcmp(file_mime, "text/gemini") == 0)
printf("%i %s; %s\r\n", code, file_mime, lang);
else
printf("%i %s\r\n", code, file_mime);
2020-12-03 05:59:52 +11:00
}
2020-12-02 09:39:05 +11:00
2021-01-02 07:00:40 +11:00
/*
 * Print a Gemini redirect header "<code> <url>\r\n" on stdout.
 */
void
status_redirect(const int code, const char *url)
{
	fprintf(stdout, "%i %s\r\n", code, url);
}
/*
 * Print a Gemini error header "<code> <reason>\r\n" on stdout.
 */
void
status_error(const int code, const char *reason)
{
	fprintf(stdout, "%i %s\r\n", code, reason);
}
2020-12-02 09:39:05 +11:00
void
display_file(const char *fname)
2020-12-02 09:39:05 +11:00
{
2021-10-21 20:41:22 +11:00
FILE *fd = NULL;
struct stat sb = {0};
ssize_t nread = 0;
const char *file_mime;
char *buffer[BUFSIZ];
char target[FILENAME_MAX] = {'\0'};
char tmp[PATH_MAX] = {'\0'}; /* used to build
* temporary path */
/*
* special case : fname empty. The user requested just the directory
* name
*/
if (strlen(fname) == 0) {
if (stat("index.gmi", &sb) == 0) {
/* there is index.gmi in the current directory */
display_file("index.gmi");
return;
} else if (doautoidx) {
/* no index.gmi, so display autoindex if enabled */
autoindex(".");
return;
} else {
goto err;
}
}
2021-01-02 07:00:40 +11:00
/* this is to check if path exists and obtain metadata later */
if (stat(fname, &sb) == -1) {
2021-10-21 20:41:22 +11:00
/*
* check if fname is a symbolic link if so, redirect using
* its target
*/
if (lstat(fname, &sb) != -1 && S_ISLNK(sb.st_mode) == 1)
2021-10-21 20:41:22 +11:00
goto redirect;
else
2021-10-21 20:41:22 +11:00
goto err;
2021-01-02 07:00:40 +11:00
}
/* check if directory */
if (S_ISDIR(sb.st_mode) != 0) {
/* no ending "/", redirect to "fname/" */
estrlcpy(tmp, fname, sizeof(tmp));
estrlcat(tmp, "/", sizeof(tmp));
status_redirect(31, tmp);
return;
}
2021-01-02 07:00:40 +11:00
/* open the file requested */
2021-10-21 20:41:22 +11:00
if ((fd = fopen(fname, "r")) == NULL)
goto err;
2021-01-02 07:00:40 +11:00
file_mime = get_file_mime(fname, default_mime);
2020-12-03 05:59:52 +11:00
status(20, file_mime);
2020-12-02 09:39:05 +11:00
/* read the file byte after byte in buffer and write it to stdout */
while ((nread = fread(buffer, 1, sizeof(buffer), fd)) != 0)
fwrite(buffer, 1, nread, stdout);
2021-10-21 20:41:22 +11:00
goto closefd; /* close file descriptor */
syslog(LOG_INFO, "path served %s", fname);
2020-12-02 09:39:05 +11:00
return;
2020-12-06 00:44:59 +11:00
err:
/* return an error code and no content */
status_error(51, "file not found");
syslog(LOG_INFO, "path invalid %s", fname);
goto closefd;
2021-01-02 07:00:40 +11:00
redirect:
/* read symbolic link target to redirect */
2021-10-21 20:41:22 +11:00
if (readlink(fname, target, FILENAME_MAX) == -1)
goto err;
2021-01-02 07:00:40 +11:00
status_redirect(30, target);
syslog(LOG_INFO, "redirection from %s to %s", fname, target);
2021-01-02 07:00:40 +11:00
closefd:
2021-10-21 20:41:22 +11:00
if (S_ISREG(sb.st_mode) != 0)
fclose(fd);
}
void
autoindex(const char *path)
{
/* display liks to files in path + a link to parent (..) */
2021-10-21 20:41:22 +11:00
int n = 0;
struct dirent **namelist; /* this must be freed at last */
syslog(LOG_INFO, "autoindex: %s", path);
/* use alphasort to always have the same order on every system */
if ((n = scandir(path, &namelist, NULL, alphasort)) < 0) {
status_error(50, "Internal server error");
errlog("Can't scan %s", path);
} else {
status(20, "text/gemini");
2021-10-21 20:41:22 +11:00
printf("=> .. ../\n"); /* display link to parent */
for (int j = 0; j < n; j++) {
/* skip self and parent */
if ((strcmp(namelist[j]->d_name, ".") == 0) ||
(strcmp(namelist[j]->d_name, "..") == 0)) {
continue;
}
/* add "/" at the end of a directory path */
2021-10-21 20:41:22 +11:00
if (namelist[j]->d_type == DT_DIR)
printf("=> ./%s/ %s/\n", namelist[j]->d_name, namelist[j]->d_name);
else
printf("=> ./%s %s\n", namelist[j]->d_name, namelist[j]->d_name);
free(namelist[j]);
}
free(namelist);
}
2020-12-02 09:39:05 +11:00
}
/*
 * Replace the current process with the CGI script cgicmd.
 * Only returns from execl() on failure, in which case status 42 is sent,
 * the error is reported and the process exits with code 1.
 */
void
cgi(const char *cgicmd)
{
	/*
	 * run cgicmd replacing current process. The argument list of a
	 * variadic exec must end with a null *pointer*: a bare NULL may be
	 * an int, hence the cast.
	 */
	execl(cgicmd, cgicmd, (char *)NULL);

	/* if execl is ok, this will never be reached */
	status_error(42, "Couldn't execute CGI script");
	errlog("error when trying to execl %s", cgicmd);
	exit(1);
}
2020-12-02 09:39:05 +11:00
int
main(int argc, char **argv)
{
2021-10-21 20:41:22 +11:00
char request [GEMINI_REQUEST_MAX] = {'\0'};
char user [_SC_LOGIN_NAME_MAX] = "";
char hostname [GEMINI_REQUEST_MAX] = {'\0'};
char query [PATH_MAX] = {'\0'};
char chroot_dir[PATH_MAX] = DEFAULT_CHROOT;
char file [FILENAME_MAX] = DEFAULT_INDEX;
char dir [PATH_MAX] = {'\0'};
char *pos = NULL;
int option = 0;
int virtualhost = 0;
int docgi = 0;
/*
2021-10-21 20:41:22 +11:00
* request : contain the whole request from client : gemini://...\r\n
* user : username, used in drop_privileges()
* hostname : extracted from hostname. used with virtualhosts and cgi SERVER_NAME
* query : file requested in cgi : gemini://...?query
* file : file basename to display. Emtpy is a directory has been requested
* dir : directory requested. vger will chdir() in to find file
* pos : used to parse request and split into interesting parts
*/
while ((option = getopt(argc, argv, ":d:l:m:u:c:vi")) != -1) {
switch (option) {
case 'd':
estrlcpy(chroot_dir, optarg, sizeof(chroot_dir));
break;
case 'l':
estrlcpy(lang, "lang=", sizeof(lang));
estrlcat(lang, optarg, sizeof(lang));
break;
case 'm':
estrlcpy(default_mime, optarg, sizeof(default_mime));
break;
2020-12-04 08:59:39 +11:00
case 'u':
estrlcpy(user, optarg, sizeof(user));
break;
case 'c':
estrlcpy(cgidir, optarg, sizeof(cgidir));
docgi = 1;
break;
case 'v':
virtualhost = 1;
break;
case 'i':
doautoidx = 1;
2020-12-04 08:59:39 +11:00
break;
}
2020-12-02 09:39:05 +11:00
}
/*
* set logging options and defaults
*/
openlog("vger", LOG_PID, LOG_DAEMON);
2020-12-03 05:59:52 +11:00
2020-12-04 08:59:39 +11:00
/*
* do chroot if an user is supplied
2020-12-04 08:59:39 +11:00
*/
drop_privileges(user, chroot_dir);
2020-12-06 00:44:59 +11:00
2020-12-02 09:39:05 +11:00
/*
* read 1024 chars from stdin
* to get the request
* (actually 1024 + \0)
2020-12-02 09:39:05 +11:00
*/
if (fgets(request, GEMINI_REQUEST_MAX, stdin) == NULL) {
/* EOF reached before reading anything */
if (feof(stdin)) {
status(59, "request is too short and probably empty");
errlog("request is too short and probably empty");
2021-10-21 20:41:22 +11:00
/* error before reading anything */
} else if (ferror(stdin)) {
status(59, "Error while reading request");
errlog("Error while reading request: %s", request);
}
}
/* check if string ends with '\n', or to long */
if (request[strnlen(request, GEMINI_REQUEST_MAX) - 1] != '\n') {
status(59, "request is too long (1024 max)");
errlog("request is too long (1024 max): %s", request);
}
2020-12-02 09:39:05 +11:00
/* remove \r\n at the end of string */
pos = strchr(request, '\r');
if (pos != NULL)
2020-12-05 04:55:31 +11:00
*pos = '\0';
2020-12-02 09:39:05 +11:00
/*
* check if the beginning of the request starts with
* gemini://
*/
if (strncmp(request, "gemini://", GEMINI_PART) != 0) {
2020-12-02 09:39:05 +11:00
/* error code url malformed */
errlog("request «%s» doesn't match gemini://",
request);
2020-12-02 09:39:05 +11:00
}
syslog(LOG_INFO, "request %s", request);
2020-12-05 04:55:31 +11:00
2020-12-02 09:39:05 +11:00
/* remove the gemini:// part */
2021-10-21 20:41:22 +11:00
memmove(request, request + GEMINI_PART, strlen(request) + 1 - GEMINI_PART);
/* remove all "/.." for safety reasons */
2021-10-21 20:41:22 +11:00
while ((pos = strstr(request, "/..")) != NULL)
memmove(request, pos + 3, strlen(pos) + 1 - 3); /* "/.." = 3 */
2020-12-02 09:39:05 +11:00
/* look for hostname in request : first thing before first / if any */
pos = strchr(request, '/');
2020-12-02 09:39:05 +11:00
if (pos != NULL) {
/* copy what's after hostname in dir */
2021-10-21 20:41:22 +11:00
estrlcpy(dir, pos, strlen(pos) + 1);
/* just keep hostname in request : stop the string with \0 */
pos[0] = '\0';
2020-12-02 09:39:05 +11:00
}
/* check if client added :port at end of hostname and remove it */
pos = strchr(request, ':');
if (pos != NULL) {
2021-10-21 20:41:22 +11:00
/* end string at : */
pos[0] = '\0';
}
/* copy hostname from request */
estrlcpy(hostname, request, sizeof(hostname));
2020-12-02 09:39:05 +11:00
/* remove leading '/' in dir */
2021-10-21 20:41:22 +11:00
while (dir[0] == '/')
memmove(dir, dir + 1, strlen(dir + 1) + 1);
if (virtualhost) {
/* add hostname at the beginning of the dir path */
2021-10-21 20:41:22 +11:00
char tmp [PATH_MAX] = {'\0'};
estrlcpy(tmp, hostname, sizeof(tmp));
estrlcat(tmp, "/", sizeof(tmp));
estrlcat(tmp, dir, sizeof(tmp));
estrlcpy(dir, tmp, sizeof(dir));
}
/* percent decode */
uridecode(dir);
2021-10-21 20:41:22 +11:00
/*
* split dir and filename. file is last part after last '/'. if none
* found, then requested file is actually a directory
*/
if (strlen(dir) > 0) {
pos = strrchr(dir, '/');
if (pos != NULL) {
2021-10-21 20:41:22 +11:00
estrlcpy(file, pos + 1, sizeof(file)); /* +1 : no leading '/' */
pos[0] = '\0';
2021-10-21 20:41:22 +11:00
/* change directory to requested directory */
if (strlen(dir) > 0)
echdir(dir);
} else {
estrlcpy(file, dir, sizeof(file));
}
}
if (docgi) {
/* check if directory is cgidir */
2021-10-21 20:41:22 +11:00
char cgifp [PATH_MAX] = {'\0'};
estrlcpy(cgifp, chroot_dir, sizeof(cgifp));
2021-10-21 20:41:22 +11:00
if (cgifp[strlen(cgifp) - 1] != '/')
estrlcat(cgifp, "/", sizeof(cgifp));
estrlcat(cgifp, dir, sizeof(cgifp));
2021-10-21 20:41:22 +11:00
/* not cgipath, display file content */
if (strcmp(cgifp, cgidir) != 0)
goto file_to_stdout;
2021-10-21 20:41:22 +11:00
/* set env variables for CGI */
2021-10-21 20:41:22 +11:00
/*
* see
* https://lists.orbitalfox.eu/archives/gemini/2020/000315.htm
* l
*/
esetenv("GATEWAY_INTERFACE", "CGI/1.1", 1);
esetenv("SERVER_PROTOCOL", "GEMINI", 1);
esetenv("SERVER_SOFTWARE", "vger/1", 1);
2021-10-21 20:41:22 +11:00
/* look for "?" if any to set query for cgi, remove it */
pos = strchr(file, '?');
if (pos != NULL) {
2021-10-21 20:41:22 +11:00
estrlcpy(query, pos + 1, sizeof(query));
esetenv("QUERY_STRING", query, 1);
pos[0] = '\0';
}
/* look for an extension to find PATH_INFO */
pos = strrchr(file, '.');
if (pos != NULL) {
/* found a dot */
pos = strchr(pos, '/');
if (pos != NULL) {
setenv("PATH_INFO", pos, 1);
2021-10-21 20:41:22 +11:00
pos[0] = '\0'; /* keep only script name */
}
}
esetenv("SCRIPT_NAME", file, 1);
esetenv("SERVER_NAME", hostname, 1);
cgi(file);
return 0;
}
file_to_stdout:
/* regular file to stdout */
display_file(file);
/* end logging */
closelog();
return (0);
2020-12-02 09:39:05 +11:00
}