Initial commit
This commit is contained in:
commit
b2df740514
19 changed files with 1640 additions and 0 deletions
319
dlhist.c
Normal file
319
dlhist.c
Normal file
|
|
@ -0,0 +1,319 @@
|
|||
|
||||
#include <stdio.h>
|
||||
#include <string.h>
|
||||
#include <stdlib.h>
|
||||
#include <unistd.h>
|
||||
#include <arpa/inet.h>
|
||||
#include <sys/types.h>
|
||||
#include <sys/stat.h>
|
||||
#include <fcntl.h>
|
||||
#include <time.h>
|
||||
#include "env.h"
|
||||
#include "dlhist.h"
|
||||
|
||||
/*
|
||||
* TODO: maybe better to store hashes instead of strings in the file
|
||||
* to 1, make records fixed size. 2, faster memory copy.
|
||||
*/
|
||||
|
||||
/* \195 D L H */
|
||||
#define SIGNATURE 0xC3444C48
|
||||
#define STORAGE_FILE "dlhist"
|
||||
|
||||
#define TABLE_MIN_SIZE 128
|
||||
|
||||
#define HASH_TABLE_LOAD(c, s) ((double) (c) / ((s) ? (s) : 1))
|
||||
|
||||
struct header {
|
||||
unsigned int signature;
|
||||
unsigned int version;
|
||||
unsigned int size;
|
||||
};
|
||||
|
||||
struct hash_entry {
|
||||
unsigned int time;
|
||||
char *key;
|
||||
};
|
||||
|
||||
#define he_empty(x) (!(x) || (x)->key == NULL)
|
||||
|
||||
static int fd = -1;
|
||||
|
||||
static struct hash_entry *table;
|
||||
static unsigned int table_size;
|
||||
static unsigned int table_count;
|
||||
|
||||
static unsigned hash(const char *s) {
|
||||
|
||||
unsigned h;
|
||||
|
||||
for(h=0; *s; s++) {
|
||||
if (!strncmp(s, "://", 3)) {
|
||||
h = 0;
|
||||
s += 2;
|
||||
} else if (!strncmp(s, "/", 2)) {
|
||||
break;
|
||||
}
|
||||
h = ((unsigned)*s) + (h << 6) + (h << 16) - h;
|
||||
}
|
||||
return h;
|
||||
}
|
||||
|
||||
static struct hash_entry* lookup(const char *key) {
|
||||
|
||||
unsigned index = hash(key) % table_size;
|
||||
|
||||
/* linear probing */
|
||||
while(table[index].key) {
|
||||
if (!strcmp(table[index].key, key))
|
||||
break;
|
||||
index = (index + 1) % table_size;
|
||||
}
|
||||
return table + index;
|
||||
}
|
||||
|
||||
static inline void he_set(struct hash_entry *he, const char *key) {
|
||||
|
||||
if (!he_empty(he))
|
||||
return;
|
||||
he->key = strdup(key);
|
||||
table_count++;
|
||||
}
|
||||
|
||||
static int he_insert(struct hash_entry *he) {
|
||||
|
||||
struct hash_entry *dest = lookup(he->key);
|
||||
|
||||
if (he_empty(dest)) {
|
||||
memcpy(dest, he, sizeof(*he));
|
||||
table_count++;
|
||||
return 1;
|
||||
}
|
||||
return 0;
|
||||
}
|
||||
|
||||
static void he_remove(struct hash_entry *he) {
|
||||
|
||||
free(he->key);
|
||||
memset(he, 0, sizeof(*he));
|
||||
table_count--;
|
||||
}
|
||||
|
||||
static void resize_table() {
|
||||
|
||||
unsigned int load, i, old_size = table_size;
|
||||
struct hash_entry *old = table;
|
||||
|
||||
load = HASH_TABLE_LOAD(table_count, table_size);
|
||||
|
||||
/* check if resize should be done */
|
||||
if ((load < 0.5 && table_size <= TABLE_MIN_SIZE) ||
|
||||
(load >= 0.5 && load <= 0.75))
|
||||
return;
|
||||
|
||||
/*
|
||||
* set size to a load factor that is in the
|
||||
* middle in the valid range.
|
||||
*/
|
||||
table_size = table_count / 0.625;
|
||||
if (table_size < TABLE_MIN_SIZE)
|
||||
table_size = TABLE_MIN_SIZE;
|
||||
|
||||
table_count = 0;
|
||||
table = calloc(sizeof(*table), table_size);
|
||||
|
||||
for(i=0; i < old_size; i++) {
|
||||
struct hash_entry *he = old + i;
|
||||
if (!he_empty(he))
|
||||
he_insert(he);
|
||||
}
|
||||
free(old);
|
||||
}
|
||||
|
||||
static void build_table(const char *buf, size_t len) {
|
||||
|
||||
size_t offset = 0;
|
||||
|
||||
table = calloc(sizeof(*table), table_size);
|
||||
|
||||
while(offset < len) {
|
||||
unsigned int keylen;
|
||||
struct hash_entry entry;
|
||||
|
||||
memcpy(&entry.time, buf + offset, sizeof(entry.time));
|
||||
offset += sizeof(entry.time);
|
||||
|
||||
memcpy(&keylen, buf + offset, sizeof(keylen));
|
||||
offset += sizeof(keylen);
|
||||
|
||||
entry.time = ntohl(entry.time);
|
||||
keylen = ntohl(keylen);
|
||||
|
||||
entry.key = malloc(keylen);
|
||||
memcpy(entry.key, buf + offset, keylen);
|
||||
offset += keylen;
|
||||
|
||||
if (he_insert(&entry) < 0)
|
||||
free(entry.key);
|
||||
}
|
||||
}
|
||||
|
||||
int dlhist_open() {
|
||||
|
||||
char filename[4096], *buf = NULL;
|
||||
unsigned offset = 0;
|
||||
struct stat st;
|
||||
struct header *hdr;
|
||||
|
||||
/* Open file */
|
||||
snprintf(filename, sizeof(filename),
|
||||
"%s/%s", env_get_dir(), STORAGE_FILE);
|
||||
|
||||
fd = open(filename, O_CREAT | O_RDWR, 0600);
|
||||
if (fd < 0 || fstat(fd, &st) < 0) {
|
||||
perror("dlhist_open");
|
||||
goto error;
|
||||
}
|
||||
|
||||
if (st.st_size >= sizeof(*hdr)) {
|
||||
|
||||
buf = malloc(st.st_size);
|
||||
if (!buf)
|
||||
goto error;
|
||||
|
||||
read(fd, buf, st.st_size);
|
||||
|
||||
/* Validate header */
|
||||
hdr = (struct header *) buf;
|
||||
if (hdr->signature != htonl(SIGNATURE) ||
|
||||
hdr->version != htonl(1)) {
|
||||
fprintf(stderr, "dlhist_open: Invalid header\n");
|
||||
goto error;
|
||||
}
|
||||
|
||||
/* Get current table size */
|
||||
table_size = htonl(hdr->size);
|
||||
|
||||
offset = sizeof(*hdr);
|
||||
}
|
||||
|
||||
if (table_size < 1)
|
||||
table_size = TABLE_MIN_SIZE;
|
||||
|
||||
build_table(buf + offset, st.st_size - offset);
|
||||
|
||||
if (buf)
|
||||
free(buf);
|
||||
return 0;
|
||||
error:
|
||||
if (buf)
|
||||
free(buf);
|
||||
if (fd >= 0)
|
||||
close(fd);
|
||||
fd = -1;
|
||||
return -1;
|
||||
}
|
||||
|
||||
int dlhist_lookup(const char *url) {
|
||||
|
||||
if (table_size < 1)
|
||||
return 0;
|
||||
return !he_empty(lookup(url));
|
||||
}
|
||||
|
||||
void dlhist_update(const char *url) {
|
||||
|
||||
struct hash_entry *he;
|
||||
|
||||
if (table_size < 1)
|
||||
return;
|
||||
|
||||
/*
|
||||
* set time and key before resize,
|
||||
* hash_entry pointer is invalid after that operation.
|
||||
*/
|
||||
he = lookup(url);
|
||||
he->time = time(NULL);
|
||||
if (he_empty(he)) {
|
||||
he_set(he, url);
|
||||
resize_table();
|
||||
}
|
||||
}
|
||||
|
||||
void dlhist_purge(unsigned int timestamp) {
|
||||
|
||||
unsigned int i, t = 0, now = time(NULL);
|
||||
|
||||
if (now < timestamp)
|
||||
return;
|
||||
|
||||
t = now - timestamp;
|
||||
for(i=0; i < table_size; i++) {
|
||||
struct hash_entry *entry = table + i;
|
||||
|
||||
if (entry->key && entry->time <= t)
|
||||
he_remove(entry);
|
||||
}
|
||||
|
||||
resize_table();
|
||||
}
|
||||
|
||||
void dlhist_flush() {
|
||||
|
||||
int i;
|
||||
struct header hdr;
|
||||
|
||||
if (fd < 0)
|
||||
return;
|
||||
|
||||
ftruncate(fd, 0);
|
||||
lseek(fd, 0, SEEK_SET);
|
||||
|
||||
/* Write header */
|
||||
hdr.signature = htonl(SIGNATURE);
|
||||
hdr.version = htonl(1);
|
||||
hdr.size = htonl(table_size);
|
||||
|
||||
write(fd, &hdr, sizeof(hdr));
|
||||
|
||||
/* Write hash entries */
|
||||
for(i=0; i < table_size; i++) {
|
||||
unsigned int keylen;
|
||||
struct hash_entry ondisk, *entry = table + i;
|
||||
|
||||
if (he_empty(entry))
|
||||
continue;
|
||||
|
||||
ondisk.time = htonl(entry->time);
|
||||
keylen = htonl(strlen(entry->key) + 1);
|
||||
|
||||
write(fd, &ondisk.time, sizeof(ondisk.time));
|
||||
write(fd, &keylen, sizeof(keylen));
|
||||
write(fd, entry->key, strlen(entry->key) + 1);
|
||||
}
|
||||
|
||||
/* Make sure we flush to disk */
|
||||
fsync(fd);
|
||||
}
|
||||
|
||||
void dlhist_close() {
|
||||
|
||||
int i;
|
||||
|
||||
dlhist_flush();
|
||||
|
||||
if (fd >= 0)
|
||||
close(fd);
|
||||
fd = -1;
|
||||
|
||||
if (table) {
|
||||
for(i=0; i < table_size; i++) {
|
||||
struct hash_entry *he = table + i;
|
||||
if (!he_empty(he))
|
||||
free(he->key);
|
||||
}
|
||||
free(table);
|
||||
}
|
||||
table = NULL;
|
||||
table_count = table_size = 0;
|
||||
}
|
||||
Reference in a new issue