2013-08-10 12:06:09 +02:00
|
|
|
/**
|
|
|
|
* Bloom filter implementation
|
2013-08-04 22:01:11 +02:00
|
|
|
*
|
2013-08-10 12:06:09 +02:00
|
|
|
* Copyright (C) 2013 Freie Universität Berlin
|
2013-08-04 22:01:11 +02:00
|
|
|
*
|
2014-07-31 19:45:27 +02:00
|
|
|
* This file is subject to the terms and conditions of the GNU Lesser
|
|
|
|
* General Public License v2.1. See the file LICENSE in the top level
|
|
|
|
* directory for more details.
|
2013-08-04 22:01:11 +02:00
|
|
|
*
|
2013-08-10 12:06:09 +02:00
|
|
|
* @file
|
2014-01-24 19:04:28 +01:00
|
|
|
* @author Jason Linehan <patientulysses@gmail.com>
|
|
|
|
* @author Christian Mehlis <mehlis@inf.fu-berlin.de>
|
2013-08-04 22:01:11 +02:00
|
|
|
*
|
2013-08-10 12:06:09 +02:00
|
|
|
*/
|
2013-08-04 22:01:11 +02:00
|
|
|
|
|
|
|
#include <limits.h>
|
|
|
|
#include <stdarg.h>
|
|
|
|
#include <stdbool.h>
|
|
|
|
|
|
|
|
#include "bloom.h"
|
|
|
|
|
|
|
|
/*
 * Bit-array helpers. Bit n lives in byte n / CHAR_BIT, at position
 * n % CHAR_BIT counted from the least significant bit.
 *
 * Every argument is parenthesised so that expressions such as `i + 1` or
 * `x << 2` expand with the intended precedence. Note that `n` is still
 * evaluated twice, so it must not have side effects.
 */

/* Set bit n in the byte array a */
#define SETBIT(a,n) ((a)[(n) / CHAR_BIT] |= (1u << ((n) % CHAR_BIT)))

/* Evaluate to a non-zero value if bit n in the byte array a is set, else 0 */
#define GETBIT(a,n) ((a)[(n) / CHAR_BIT] & (1u << ((n) % CHAR_BIT)))

/* Number of bytes needed to store `size` bits (rounded up) */
#define ROUND(size) (((size) + CHAR_BIT - 1) / CHAR_BIT)
|
|
|
|
|
2013-08-20 09:05:07 +02:00
|
|
|
struct bloom_t *bloom_new(size_t size, size_t num_hashes, ...)
|
|
|
|
{
|
2013-08-04 22:01:11 +02:00
|
|
|
struct bloom_t *bloom;
|
|
|
|
va_list hashes;
|
2013-08-20 09:05:07 +02:00
|
|
|
size_t n;
|
2013-08-04 22:01:11 +02:00
|
|
|
|
|
|
|
/* Allocate Bloom filter container */
|
|
|
|
if (!(bloom = malloc(sizeof(struct bloom_t)))) {
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Allocate Bloom array */
|
|
|
|
if (!(bloom->a = calloc(ROUND(size), sizeof(char)))) {
|
|
|
|
free(bloom);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Allocate Bloom filter hash function pointers */
|
2013-08-20 09:05:07 +02:00
|
|
|
if (!(bloom->hash = (hashfp_t *)malloc(num_hashes * sizeof(hashfp_t)))) {
|
2013-08-04 22:01:11 +02:00
|
|
|
free(bloom->a);
|
|
|
|
free(bloom);
|
|
|
|
return NULL;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Assign hash functions to pointers in the Bloom filter */
|
|
|
|
va_start(hashes, num_hashes);
|
|
|
|
|
|
|
|
for (n = 0; n < num_hashes; n++) {
|
|
|
|
bloom->hash[n] = va_arg(hashes, hashfp_t);
|
|
|
|
}
|
|
|
|
|
|
|
|
va_end(hashes);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Record the number of hash functions (k) and the number of bytes
|
|
|
|
* in the Bloom array (m).
|
|
|
|
*/
|
|
|
|
bloom->k = num_hashes;
|
|
|
|
bloom->m = size;
|
|
|
|
|
|
|
|
return bloom;
|
|
|
|
}
|
|
|
|
|
|
|
|
void bloom_del(struct bloom_t *bloom)
|
|
|
|
{
|
|
|
|
free(bloom->a);
|
|
|
|
free(bloom->hash);
|
|
|
|
free(bloom);
|
|
|
|
}
|
|
|
|
|
2013-08-20 09:05:07 +02:00
|
|
|
void bloom_add(struct bloom_t *bloom, const uint8_t *buf, size_t len)
|
2013-08-04 22:01:11 +02:00
|
|
|
{
|
2013-08-20 09:05:07 +02:00
|
|
|
uint32_t hash;
|
|
|
|
size_t n;
|
2013-08-04 22:01:11 +02:00
|
|
|
|
|
|
|
for (n = 0; n < bloom->k; n++) {
|
2013-08-20 09:05:07 +02:00
|
|
|
hash = bloom->hash[n](buf, len);
|
2013-08-04 22:01:11 +02:00
|
|
|
SETBIT(bloom->a, (hash % bloom->m));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-08-20 09:05:07 +02:00
|
|
|
bool bloom_check(struct bloom_t *bloom, const uint8_t *buf, size_t len)
|
2013-08-04 22:01:11 +02:00
|
|
|
{
|
2013-08-20 09:05:07 +02:00
|
|
|
uint32_t hash;
|
|
|
|
size_t n;
|
2013-08-04 22:01:11 +02:00
|
|
|
|
|
|
|
for (n = 0; n < bloom->k; n++) {
|
2013-08-20 09:05:07 +02:00
|
|
|
hash = bloom->hash[n](buf, len);
|
2013-08-04 22:01:11 +02:00
|
|
|
|
|
|
|
if (!(GETBIT(bloom->a, (hash % bloom->m)))) {
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return true; /* ? */
|
|
|
|
}
|