Files
wget2/libwget/hsts.c
2022-02-25 17:46:43 +01:00

587 lines
15 KiB
C

/*
* Copyright (c) 2014 Tim Ruehsen
* Copyright (c) 2015-2022 Free Software Foundation, Inc.
*
* This file is part of libwget.
*
* Libwget is free software: you can redistribute it and/or modify
* it under the terms of the GNU Lesser General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Libwget is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public License
* along with libwget. If not, see <https://www.gnu.org/licenses/>.
*
*
* HSTS routines
*
* Changelog
* 28.01.2014 Tim Ruehsen created
*
*/
#include <config.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <ctype.h>
#include <time.h>
#include <errno.h>
#include <sys/stat.h>
#include <sys/file.h>
#include <wget.h>
#include "private.h"
/**
* \file
* \brief HTTP Strict Transport Security (RFC 6797) routines
* \defgroup libwget-hsts HTTP Strict Transport Security (RFC 6797) routines
* @{
*
* This is an implementation of RFC 6797.
*/
struct wget_hsts_db_st {
const char *
fname;
wget_hashmap *
entries;
wget_thread_mutex
mutex;
int64_t
load_time;
};
typedef struct {
const char *
host;
int64_t
expires; // expiry time
int64_t
created; // creation time
int64_t
maxage; // max-age in seconds
uint16_t
port;
bool
include_subdomains : 1; // whether or not subdomains are included
} hsts_entry;
/// Pointer to the function table
static const wget_hsts_db_vtable
*plugin_vtable;
void wget_hsts_set_plugin(const wget_hsts_db_vtable *vtable)
{
plugin_vtable = vtable;
}
#ifdef __clang__
__attribute__((no_sanitize("integer")))
#endif
WGET_GCC_PURE
static unsigned int hash_hsts(const hsts_entry *hsts)
{
unsigned int hash = hsts->port;
const unsigned char *p;
for (p = (unsigned char *)hsts->host; *p; p++)
hash = hash * 101 + *p;
return hash;
}
WGET_GCC_NONNULL_ALL WGET_GCC_PURE
static int compare_hsts(const hsts_entry *h1, const hsts_entry *h2)
{
int n;
if ((n = strcmp(h1->host, h2->host)))
return n;
return h1->port < h2->port ? -1 : (h1->port > h2->port ? 1 : 0);
}
static hsts_entry *init_hsts(hsts_entry *hsts)
{
if (!hsts) {
if (!(hsts = wget_calloc(1, sizeof(hsts_entry))))
return NULL;
} else
memset(hsts, 0, sizeof(*hsts));
hsts->created = time(NULL);
return hsts;
}
static void deinit_hsts(hsts_entry *hsts)
{
if (hsts) {
xfree(hsts->host);
}
}
static void free_hsts(hsts_entry *hsts)
{
if (hsts) {
deinit_hsts(hsts);
xfree(hsts);
}
}
static hsts_entry *new_hsts(const char *host, uint16_t port, int64_t maxage, bool include_subdomains)
{
hsts_entry *hsts = init_hsts(NULL);
if (!hsts)
return NULL;
hsts->host = wget_strdup(host);
hsts->port = port ? port : 443;
hsts->include_subdomains = include_subdomains;
if (maxage <= 0 || maxage >= INT64_MAX / 2 || hsts->created < 0 || hsts->created >= INT64_MAX / 2) {
hsts->maxage = 0;
hsts->expires = 0;
} else {
hsts->maxage = maxage;
hsts->expires = hsts->created + maxage;
}
return hsts;
}
/**
* \param[in] hsts_db An HSTS database
* \param[in] host Hostname to search for
* \param[in] port Port number in the original URI/IRI.
* Port number 80 is treated similar to 443, as 80 is default port for HTTP.
* \return 1 if the host must be accessed only through TLS, 0 if there is no such condition.
*
* Searches for a given host in the database for any previously added entry.
*
* HSTS entries older than amount of time specified by `maxage` are considered `expired` and are ignored.
*
* This function is thread-safe and can be called from multiple threads concurrently.
* Any implementation for this function must be thread-safe as well.
*/
int wget_hsts_host_match(const wget_hsts_db *hsts_db, const char *host, uint16_t port)
{
if (plugin_vtable)
return plugin_vtable->host_match(hsts_db, host, port);
if (!hsts_db)
return 0;
hsts_entry hsts, *hstsp;
const char *p;
int64_t now = time(NULL);
// first look for an exact match
// if it's the default port, "normalize" it
// we assume the scheme is HTTP
hsts.port = (port == 80 ? 443 : port);
hsts.host = host;
if (wget_hashmap_get(hsts_db->entries, &hsts, &hstsp) && hstsp->expires >= now)
return 1;
// now look for a valid subdomain match
for (p = host; (p = strchr(p, '.')); ) {
hsts.host = ++p;
if (wget_hashmap_get(hsts_db->entries, &hsts, &hstsp)
&& hstsp->include_subdomains && hstsp->expires >= now)
return 1;
}
return 0;
}
/**
* \param[in] hsts_db HSTS database created by wget_hsts_db_init()
*
* Frees all resources allocated for HSTS database, except for the structure itself. The `hsts_db` pointer can then
* be passed to wget_hsts_db_init() for reinitialization.
*
* If `hsts_db` is NULL this function does nothing.
*
* This function only works with databases created by wget_hsts_db_init().
*/
void wget_hsts_db_deinit(wget_hsts_db *hsts_db)
{
if (plugin_vtable) {
plugin_vtable->deinit(hsts_db);
return;
}
if (hsts_db) {
xfree(hsts_db->fname);
wget_thread_mutex_lock(hsts_db->mutex);
wget_hashmap_free(&hsts_db->entries);
wget_thread_mutex_unlock(hsts_db->mutex);
wget_thread_mutex_destroy(&hsts_db->mutex);
}
}
/**
* \param[in] hsts_db Pointer to the HSTS database handle (will be set to NULL)
*
* Frees all resources allocated for the HSTS database.
*
* A double pointer is required because this function will set the handle (pointer) to the HPKP database to NULL
* to prevent potential use-after-free conditions.
*
* If `hsts_db` or pointer it points to is NULL, then the function does nothing.
*
* Newly added entries will be lost unless committed to persistent storage using wget_hsts_db_save().
*/
void wget_hsts_db_free(wget_hsts_db **hsts_db)
{
if (plugin_vtable) {
plugin_vtable->free(hsts_db);
return;
}
if (hsts_db && *hsts_db) {
wget_hsts_db_deinit(*hsts_db);
xfree(*hsts_db);
}
}
static void hsts_db_add_entry(wget_hsts_db *hsts_db, hsts_entry *hsts)
{
if (!hsts)
return;
wget_thread_mutex_lock(hsts_db->mutex);
if (hsts->maxage == 0) {
if (wget_hashmap_remove(hsts_db->entries, hsts))
debug_printf("removed HSTS %s:%hu\n", hsts->host, hsts->port);
free_hsts(hsts);
hsts = NULL;
} else {
hsts_entry *old;
if (wget_hashmap_get(hsts_db->entries, hsts, &old)) {
if (old->created < hsts->created || old->maxage != hsts->maxage || old->include_subdomains != hsts->include_subdomains) {
old->created = hsts->created;
old->expires = hsts->expires;
old->maxage = hsts->maxage;
old->include_subdomains = hsts->include_subdomains;
debug_printf("update HSTS %s:%hu (maxage=%lld, includeSubDomains=%d)\n", old->host, old->port, (long long)old->maxage, old->include_subdomains);
}
free_hsts(hsts);
hsts = NULL;
} else {
// key and value are the same to make wget_hashmap_get() return old 'hsts'
// debug_printf("add HSTS %s:%hu (maxage=%lld, includeSubDomains=%d)\n", hsts->host, hsts->port, (long long)hsts->maxage, hsts->include_subdomains);
wget_hashmap_put(hsts_db->entries, hsts, hsts);
// no need to free anything here
}
}
wget_thread_mutex_unlock(hsts_db->mutex);
}
/**
* \param[in] hsts_db An HSTS database
* \param[in] host Hostname from where `Strict-Transport-Security` header was received
* \param[in] port Port number used for connecting to the host
* \param[in] maxage The time from now till the entry is valid, in seconds, or 0 to remove existing entry.
* Corresponds to the `max-age` directive in `Strict-Transport-Security` header.
* \param[in] include_subdomains Nonzero if `includeSubDomains` directive was present in the header, zero otherwise
*
* Add an entry to the HSTS database. An entry corresponds to the `Strict-Transport-Security` HTTP response header.
* Any existing entry with same `host` and `port` is replaced. If `maxage` is zero, any existing entry with
* matching `host` and `port` is removed.
*
* This function is thread-safe and can be called from multiple threads concurrently.
* Any implementation for this function must be thread-safe as well.
*/
void wget_hsts_db_add(wget_hsts_db *hsts_db, const char *host, uint16_t port, int64_t maxage, bool include_subdomains)
{
if (plugin_vtable) {
plugin_vtable->add(hsts_db, host, port, maxage, include_subdomains);
return;
}
if (hsts_db) {
hsts_entry *hsts = new_hsts(host, port, maxage, include_subdomains);
hsts_db_add_entry(hsts_db, hsts);
}
}
static int hsts_db_load(wget_hsts_db *hsts_db, FILE *fp)
{
hsts_entry hsts;
struct stat st;
char *buf = NULL, *linep, *p;
size_t bufsize = 0;
ssize_t buflen;
int64_t now = time(NULL);
int ok;
// if the database file hasn't changed since the last read
// there's no need to reload
if (fstat(fileno(fp), &st) == 0) {
if (st.st_mtime != hsts_db->load_time)
hsts_db->load_time = st.st_mtime;
else
return 0;
}
while ((buflen = wget_getline(&buf, &bufsize, fp)) >= 0) {
linep = buf;
while (isspace(*linep)) linep++; // ignore leading whitespace
if (!*linep) continue; // skip empty lines
if (*linep == '#')
continue; // skip comments
// strip off \r\n
while (buflen > 0 && (buf[buflen] == '\n' || buf[buflen] == '\r'))
buf[--buflen] = 0;
init_hsts(&hsts);
ok = 0;
// parse host
if (*linep) {
for (p = linep; *linep && !isspace(*linep); )
linep++;
hsts.host = wget_strmemdup(p, linep - p);
}
// parse port
if (*linep) {
for (p = ++linep; *linep && !isspace(*linep); )
linep++;
hsts.port = (uint16_t) atoi(p);
if (hsts.port == 0)
hsts.port = 443;
}
// parse includeSubDomains
if (*linep) {
for (p = ++linep; *linep && !isspace(*linep); )
linep++;
hsts.include_subdomains = atoi(p) ? 1 : 0;
}
// parse creation time
if (*linep) {
for (p = ++linep; *linep && !isspace(*linep); )
linep++;
hsts.created = atoll(p);
if (hsts.created < 0 || hsts.created >= INT64_MAX / 2)
hsts.created = 0;
}
// parse max age
if (*linep) {
for (p = ++linep; *linep && !isspace(*linep); )
linep++;
hsts.maxage = atoll(p);
if (hsts.maxage < 0 || hsts.maxage >= INT64_MAX / 2)
hsts.maxage = 0; // avoid integer overflow here
hsts.expires = hsts.maxage ? hsts.created + hsts.maxage : 0;
if (hsts.expires < now) {
// drop expired entry
deinit_hsts(&hsts);
continue;
}
ok = 1;
}
if (ok) {
hsts_db_add_entry(hsts_db, wget_memdup(&hsts, sizeof(hsts)));
} else {
deinit_hsts(&hsts);
error_printf(_("Failed to parse HSTS line: '%s'\n"), buf);
}
}
xfree(buf);
if (ferror(fp)) {
hsts_db->load_time = 0; // reload on next call to this function
return -1;
}
return 0;
}
/**
* \param[in] hsts_db An HSTS database
* \return 0 if the operation succeeded, -1 in case of error
*
* Performs all operations necessary to access the HSTS database entries from persistent storage
* using wget_hsts_host_match() for example.
*
* For database created by wget_hsts_db_init() this function will load all the entries from the file specified
* in `fname` parameter of wget_hsts_db_init().
*
* If `hsts_db` is NULL this function does nothing and returns 0.
*/
int wget_hsts_db_load(wget_hsts_db *hsts_db)
{
if (plugin_vtable)
return plugin_vtable->load(hsts_db);
if (!hsts_db)
return -1;
if (!hsts_db->fname || !*hsts_db->fname)
return 0;
// Load the HSTS cache from a flat file
// Protected by flock()
if (wget_update_file(hsts_db->fname, (wget_update_load_fn *) hsts_db_load, NULL, hsts_db)) {
error_printf(_("Failed to read HSTS data\n"));
return -1;
} else {
debug_printf("Fetched HSTS data from '%s'\n", hsts_db->fname);
return 0;
}
}
WGET_GCC_NONNULL_ALL
static int hsts_save(void *_fp, const void *_hsts, WGET_GCC_UNUSED void *v)
{
FILE *fp = _fp;
const hsts_entry *hsts = _hsts;
wget_fprintf(fp, "%s %hu %d %lld %lld\n", hsts->host, hsts->port, hsts->include_subdomains, (long long)hsts->created, (long long)hsts->maxage);
return 0;
}
static int hsts_db_save(void *hsts_db, FILE *fp)
{
wget_hashmap *entries = ((wget_hsts_db *) hsts_db)->entries;
if (wget_hashmap_size(entries) > 0) {
fputs("#HSTS 1.0 file\n", fp);
fputs("#Generated by libwget " PACKAGE_VERSION ". Edit at your own risk.\n", fp);
fputs("# <hostname> <port> <incl. subdomains> <created> <max-age>\n", fp);
wget_hashmap_browse(entries, hsts_save, fp);
if (ferror(fp))
return -1;
}
return 0;
}
/**
* \param[in] hsts_db HSTS database
* \return 0 if the operation succeeded, -1 otherwise
*
* Saves all changes to the HSTS database (via wget_hsts_db_add() for example) to persistent storage.
*
* For databases created by wget_hsts_db_init(), the data is stored into file specified by `fname` parameter
* of wget_hsts_db_init().
*
* If `hsts_db` is NULL this function does nothing.
*/
int wget_hsts_db_save(wget_hsts_db *hsts_db)
{
int size;
if (plugin_vtable)
return plugin_vtable->save(hsts_db);
if (!hsts_db)
return -1;
if (!hsts_db->fname || !*hsts_db->fname)
return -1;
// Save the HSTS cache to a flat file
// Protected by flock()
if (wget_update_file(hsts_db->fname, (wget_update_load_fn *) hsts_db_load, hsts_db_save, hsts_db)) {
error_printf(_("Failed to write HSTS file '%s'\n"), hsts_db->fname);
return -1;
}
if ((size = wget_hashmap_size(hsts_db->entries)))
debug_printf("Saved %d HSTS entr%s into '%s'\n", size, size != 1 ? "ies" : "y", hsts_db->fname);
else
debug_printf("No HSTS entries to save. Table is empty.\n");
return 0;
}
/**
* \param[in] hsts_db Previously created HSTS database on which wget_hsts_db_deinit() has been called, or NULL
* \param[in] fname The file where the data is stored, or NULL.
* \return A new wget_hsts_db
*
* Constructor for the default implementation of HSTS database.
*
* This function does no file IO, data is read only when \ref wget_hsts_db_load "wget_hsts_db_load()" is called.
*/
wget_hsts_db *wget_hsts_db_init(wget_hsts_db *hsts_db, const char *fname)
{
if (plugin_vtable)
return plugin_vtable->init(hsts_db, fname);
if (fname) {
if (!(fname = wget_strdup(fname)))
return NULL;
}
wget_hashmap *entries = wget_hashmap_create(16, (wget_hashmap_hash_fn *) hash_hsts, (wget_hashmap_compare_fn *) compare_hsts);
if (!entries) {
xfree(fname);
return NULL;
}
if (!hsts_db) {
if (!(hsts_db = wget_calloc(1, sizeof(struct wget_hsts_db_st)))) {
wget_hashmap_free(&entries);
xfree(fname);
return NULL;
}
} else
memset(hsts_db, 0, sizeof(*hsts_db));
hsts_db->fname = fname;
hsts_db->entries = entries;
wget_hashmap_set_key_destructor(hsts_db->entries, (wget_hashmap_key_destructor *) free_hsts);
wget_hashmap_set_value_destructor(hsts_db->entries, (wget_hashmap_value_destructor *) free_hsts);
wget_thread_mutex_init(&hsts_db->mutex);
return hsts_db;
}
/**
* \param[in] hsts_db HSTS database created by wget_hsts_db_init().
* \param[in] fname Filename where database should be stored, or NULL
*
* Changes the file where HSTS database entries are stored.
*
* Works only for the HSTS databases created by wget_hsts_db_init().
* This function does no file IO, data is read or written only when wget_hsts_db_load() or wget_hsts_db_save()
* is called.
*/
void wget_hsts_db_set_fname(wget_hsts_db *hsts_db, const char *fname)
{
xfree(hsts_db->fname);
hsts_db->fname = wget_strdup(fname);
}
/**@}*/