c_simple_http/src/http.c
Stephen Seo 700adf2f7b Impl. cache file lifetime checking
By default cache files are invalidated when the are aged for longer than
1 week. This "timeout-time" can be modified with a paramter/argument.
2024-09-26 12:37:45 +09:00

411 lines
12 KiB
C

// ISC License
//
// Copyright (c) 2024 Stephen Seo
//
// Permission to use, copy, modify, and/or distribute this software for any
// purpose with or without fee is hereby granted, provided that the above
// copyright notice and this permission notice appear in all copies.
//
// THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH
// REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY
// AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY SPECIAL, DIRECT,
// INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM
// LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR
// OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
// PERFORMANCE OF THIS SOFTWARE.
#include "http.h"
// Standard library includes.
#include <stdlib.h>
#include <string.h>
#include <stdio.h>
// Third party includes.
#include <SimpleArchiver/src/helpers.h>
#include <SimpleArchiver/src/data_structures/linked_list.h>
// Local includes
#include "http_template.h"
#include "helpers.h"
#include "html_cache.h"
#define REQUEST_TYPE_BUFFER_SIZE 16
#define REQUEST_PATH_BUFFER_SIZE 256
#define REQUEST_PROTO_BUFFER_SIZE 16
const char *c_simple_http_response_code_error_to_response(
enum C_SIMPLE_HTTP_ResponseCode response_code) {
switch (response_code) {
case C_SIMPLE_HTTP_Response_400_Bad_Request:
return "HTTP/1.1 400 Bad Request\nAllow: GET\n"
"Connection: close\n"
"Content-Type: text/html\n"
"Content-Length: 25\n\n"
"<h1>400 Bad Request</h1>\n";
case C_SIMPLE_HTTP_Response_404_Not_Found:
return "HTTP/1.1 404 Not Found\nAllow: GET\n"
"Connection: close\n"
"Content-Type: text/html\n"
"Content-Length: 23\n\n"
"<h1>404 Not Found</h1>\n";
case C_SIMPLE_HTTP_Response_500_Internal_Server_Error:
default:
return "HTTP/1.1 500 Internal Server Error\nAllow: GET\n"
"Connection: close\n"
"Content-Type: text/html\n"
"Content-Length: 35\n\n"
"<h1>500 Internal Server Error</h1>\n";
}
}
char *c_simple_http_request_response(
const char *request,
uint32_t size,
C_SIMPLE_HTTP_HTTPTemplates *templates,
size_t *out_size,
enum C_SIMPLE_HTTP_ResponseCode *out_response_code,
const Args *args) {
if (out_size) {
*out_size = 0;
}
// parse first line.
uint32_t idx = 0;
char request_type[REQUEST_TYPE_BUFFER_SIZE] = {0};
uint32_t request_type_idx = 0;
for (; idx < size
&& request[idx] != ' '
&& request[idx] != '\n'
&& request[idx] != '\r'
&& request[idx] != '\t'
&& request_type_idx < REQUEST_TYPE_BUFFER_SIZE - 1;
++idx) {
request_type[request_type_idx++] = request[idx];
}
if (request_type_idx == 0) {
if (out_response_code) {
*out_response_code = C_SIMPLE_HTTP_Response_400_Bad_Request;
}
return NULL;
}
#ifndef NDEBUG
fprintf(stderr, "Parsing request: got type \"%s\"\n", request_type);
#endif
// skip whitespace until next part.
for (; idx < size
&& (request[idx] == ' ' ||
request[idx] == '\n' ||
request[idx] == '\r' ||
request[idx] == '\t');
++idx) {}
// parse request path.
char request_path[REQUEST_PATH_BUFFER_SIZE] = {0};
uint32_t request_path_idx = 0;
for (; idx < size
&& request[idx] != ' '
&& request[idx] != '\n'
&& request[idx] != '\r'
&& request[idx] != '\t'
&& request_path_idx < REQUEST_PATH_BUFFER_SIZE - 1;
++idx) {
request_path[request_path_idx++] = request[idx];
}
if (request_path_idx == 0) {
if (out_response_code) {
*out_response_code = C_SIMPLE_HTTP_Response_400_Bad_Request;
}
return NULL;
}
#ifndef NDEBUG
fprintf(stderr, "Parsing request: got path \"%s\"\n", request_path);
#endif
__attribute__((cleanup(simple_archiver_helper_cleanup_c_string)))
char *request_path_unescaped =
c_simple_http_helper_unescape_uri(request_path);
#ifndef NDEBUG
fprintf(
stderr, "Parsing request: unescaped path \"%s\"\n", request_path_unescaped);
#endif
// skip whitespace until next part.
for (; idx < size
&& (request[idx] == ' ' ||
request[idx] == '\n' ||
request[idx] == '\r' ||
request[idx] == '\t');
++idx) {}
// parse request http protocol.
char request_proto[REQUEST_PROTO_BUFFER_SIZE] = {0};
uint32_t request_proto_idx = 0;
for (; idx < size
&& request[idx] != ' '
&& request[idx] != '\n'
&& request[idx] != '\r'
&& request[idx] != '\t'
&& request_proto_idx < REQUEST_PROTO_BUFFER_SIZE - 1;
++idx) {
request_proto[request_proto_idx++] = request[idx];
}
if (request_proto_idx == 0) {
if (out_response_code) {
*out_response_code = C_SIMPLE_HTTP_Response_400_Bad_Request;
}
return NULL;
}
#ifndef NDEBUG
fprintf(stderr, "Parsing request: got http protocol \"%s\"\n", request_proto);
#endif
if (strcmp(request_type, "GET") != 0) {
fprintf(stderr, "ERROR Only GET requests are allowed!\n");
if (out_response_code) {
*out_response_code = C_SIMPLE_HTTP_Response_400_Bad_Request;
}
return NULL;
} else if (strcmp(request_proto, "HTTP/1.1") != 0) {
fprintf(stderr, "ERROR Only HTTP/1.1 protocol requests are allowed!\n");
if (out_response_code) {
*out_response_code = C_SIMPLE_HTTP_Response_400_Bad_Request;
}
return NULL;
}
size_t generated_size = 0;
__attribute__((cleanup(simple_archiver_helper_cleanup_c_string)))
char *stripped_path = c_simple_http_strip_path(
request_path_unescaped, strlen(request_path_unescaped));
char *generated_buf = NULL;
if (args->cache_dir) {
int ret = c_simple_http_cache_path(
stripped_path ? stripped_path : request_path_unescaped,
args->config_file,
args->cache_dir,
templates,
args->cache_lifespan_seconds,
&generated_buf);
if (ret < 0) {
fprintf(stderr, "ERROR Failed to generate template with cache!\n");
if (out_response_code) {
if (
simple_archiver_hash_map_get(
templates->hash_map,
stripped_path ? stripped_path : request_path_unescaped,
stripped_path
? strlen(stripped_path) + 1
: strlen(request_path_unescaped) + 1)
== NULL) {
*out_response_code = C_SIMPLE_HTTP_Response_404_Not_Found;
} else {
*out_response_code = C_SIMPLE_HTTP_Response_500_Internal_Server_Error;
}
}
return NULL;
}
generated_size = strlen(generated_buf);
} else {
generated_buf = c_simple_http_path_to_generated(
stripped_path ? stripped_path : request_path_unescaped,
templates,
&generated_size,
NULL);
}
if (!generated_buf || generated_size == 0) {
fprintf(stderr, "ERROR Unable to generate response html for path \"%s\"!\n",
request_path);
if (out_response_code) {
if (
simple_archiver_hash_map_get(
templates->hash_map,
stripped_path ? stripped_path : request_path_unescaped,
stripped_path
? strlen(stripped_path) + 1
: strlen(request_path_unescaped) + 1)
== NULL) {
*out_response_code = C_SIMPLE_HTTP_Response_404_Not_Found;
} else {
*out_response_code = C_SIMPLE_HTTP_Response_500_Internal_Server_Error;
}
}
return NULL;
}
if (out_size) {
*out_size = generated_size;
}
if (out_response_code) {
*out_response_code = C_SIMPLE_HTTP_Response_200_OK;
}
return generated_buf;
}
char *c_simple_http_strip_path(const char *path, size_t path_size) {
if (path_size == 1 && path[0] == '/') {
// Edge case: root path.
char *buf = malloc(2);
buf[0] = '/';
buf[1] = 0;
return buf;
}
size_t idx = 0;
for (; idx < path_size && path[idx] != 0; ++idx) {
if (path[idx] == '?' || path[idx] == '#') {
break;
}
}
char *stripped_path = malloc(idx + 1);
memcpy(stripped_path, path, idx);
stripped_path[idx] = 0;
// Strip multiple '/' into one.
__attribute((cleanup(simple_archiver_list_free)))
SDArchiverLinkedList *parts = simple_archiver_list_init();
idx = 0;
size_t prev_idx = 0;
size_t size;
char *buf;
uint_fast8_t slash_visited = 0;
for (; stripped_path[idx] != 0; ++idx) {
if (stripped_path[idx] == '/') {
if (slash_visited) {
// Intentionally left blank.
} else {
slash_visited = 1;
if (idx > prev_idx) {
size = idx - prev_idx + 1;
buf = malloc(size);
memcpy(buf, stripped_path + prev_idx, size - 1);
buf[size - 1] = 0;
c_simple_http_add_string_part(parts, buf, 0);
free(buf);
}
}
} else {
if (slash_visited) {
buf = malloc(2);
buf[0] = '/';
buf[1] = 0;
c_simple_http_add_string_part(parts, buf, 0);
free(buf);
prev_idx = idx;
}
slash_visited = 0;
}
}
if (!slash_visited && idx > prev_idx) {
size = idx - prev_idx + 1;
buf = malloc(size);
memcpy(buf, stripped_path + prev_idx, size - 1);
buf[size - 1] = 0;
c_simple_http_add_string_part(parts, buf, 0);
free(buf);
} else if (slash_visited && prev_idx == 0) {
buf = malloc(2);
buf[0] = '/';
buf[1] = 0;
c_simple_http_add_string_part(parts, buf, 0);
free(buf);
}
free(stripped_path);
stripped_path = c_simple_http_combine_string_parts(parts);
// Strip trailing '/'.
idx = strlen(stripped_path);
while (idx-- > 1) {
if (stripped_path[idx] == '/' || stripped_path[idx] == 0) {
stripped_path[idx] = 0;
} else {
break;
}
}
return stripped_path;
}
SDArchiverHashMap *c_simple_http_request_to_headers_map(
const char *request, size_t request_size) {
SDArchiverHashMap *hash_map = simple_archiver_hash_map_init();
// xxxx xx00 - Beginning of line.
// xxxx xx01 - Reached end of header key.
// xxxx xx10 - Non-header line.
uint32_t state = 0;
size_t idx = 0;
size_t header_key_idx = 0;
__attribute__((cleanup(simple_archiver_helper_cleanup_c_string)))
char *key_buf = NULL;
size_t key_buf_size = 0;
__attribute__((cleanup(simple_archiver_helper_cleanup_c_string)))
char *value_buf = NULL;
for (; idx < request_size; ++idx) {
if ((state & 3) == 0) {
if ((request[idx] >= 'a' && request[idx] <= 'z')
|| (request[idx] >= 'A' && request[idx] <= 'Z')
|| request[idx] == '-') {
continue;
} else if (request[idx] == ':') {
key_buf_size = idx - header_key_idx + 1;
key_buf = malloc(key_buf_size);
memcpy(key_buf, request + header_key_idx, key_buf_size - 1);
key_buf[key_buf_size - 1] = 0;
c_simple_http_helper_to_lowercase_in_place(key_buf, key_buf_size);
state &= 0xFFFFFFFC;
state |= 1;
} else {
state &= 0xFFFFFFFC;
state |= 2;
}
} else if ((state & 3) == 1) {
if (request[idx] == '\n') {
size_t value_buf_size = idx - header_key_idx + 1;
value_buf = malloc(value_buf_size);
memcpy(value_buf, request + header_key_idx, value_buf_size - 1);
value_buf[value_buf_size - 1] = 0;
simple_archiver_hash_map_insert(
hash_map, value_buf, key_buf, key_buf_size, NULL, NULL);
key_buf = NULL;
value_buf = NULL;
key_buf_size = 0;
header_key_idx = idx + 1;
state &= 0xFFFFFFFC;
}
} else if ((state & 3) == 2) {
// Do nothing, just wait until '\n' is parsed.
}
if (request[idx] == '\n') {
header_key_idx = idx + 1;
state &= 0xFFFFFFFC;
}
}
if (key_buf && key_buf_size != 0 && !value_buf && idx > header_key_idx) {
size_t value_buf_size = idx - header_key_idx + 1;
value_buf = malloc(value_buf_size);
memcpy(value_buf, request + header_key_idx, value_buf_size - 1);
value_buf[value_buf_size - 1] = 0;
simple_archiver_hash_map_insert(
hash_map, value_buf, key_buf, key_buf_size, NULL, NULL);
key_buf = NULL;
value_buf = NULL;
}
return hash_map;
}
// vim: et ts=2 sts=2 sw=2