mirror of
https://github.com/albertobsd/keyhunt.git
synced 2025-04-07 11:28:23 +02:00
issue 26
This commit is contained in:
parent
6a92828f7f
commit
36fa623451
@ -1,275 +0,0 @@
|
||||
/*
|
||||
* Copyright (c) 2012-2019, Jyri J. Virkki
|
||||
* All rights reserved.
|
||||
*
|
||||
* This file is under BSD license. See LICENSE file.
|
||||
*/
|
||||
|
||||
/*
|
||||
* Refer to custombloom.h for documentation on the public interfaces.
|
||||
*/
|
||||
|
||||
#include <assert.h>
|
||||
#include <fcntl.h>
|
||||
#include <math.h>
|
||||
#include <stdint.h>
|
||||
#include <stdio.h>
|
||||
#include <stdlib.h>
|
||||
#include <string.h>
|
||||
#include <sys/stat.h>
|
||||
#include <inttypes.h>
|
||||
#include <sys/types.h>
|
||||
#include <unistd.h>
|
||||
|
||||
#include "bloom.h"
|
||||
#include "../xxhash/xxhash.h"
|
||||
|
||||
#define MAKESTRING(n) STRING(n)
|
||||
#define STRING(n) #n
|
||||
#define BLOOM_MAGIC "libbloom2"
|
||||
#define BLOOM_VERSION_MAJOR 2
|
||||
#define BLOOM_VERSION_MINOR 1
|
||||
|
||||
inline static int custombloom_test_bit_set_bit(unsigned char * buf, uint64_t bit, int set_bit)
|
||||
{
|
||||
uint64_t byte = bit >> 3;
|
||||
uint8_t c = buf[byte]; // expensive memory access
|
||||
uint8_t mask = 1 << (bit % 8);
|
||||
if (c & mask) {
|
||||
return 1;
|
||||
} else {
|
||||
if (set_bit) {
|
||||
buf[byte] = c | mask;
|
||||
}
|
||||
return 0;
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
static int custombloom_check_add(struct custombloom * bloom, const void * buffer, int len, int add)
|
||||
{
|
||||
if (bloom->ready == 0) {
|
||||
printf("bloom at %p not initialized!\n", (void *)bloom);
|
||||
return -1;
|
||||
}
|
||||
uint8_t hits = 0;
|
||||
//uint64_t *data = (uint64_t *)buffer;
|
||||
uint64_t a = XXH64(buffer, len, 0x59f2815b16f81798);
|
||||
uint64_t b = XXH64(buffer, len, a);
|
||||
uint64_t x;
|
||||
uint8_t i;
|
||||
for (i = 0; i < bloom->hashes; i++) {
|
||||
x = (a + b *i) % bloom->bits;
|
||||
if (custombloom_test_bit_set_bit(bloom->bf, x, add)) {
|
||||
hits++;
|
||||
} else if (!add) {
|
||||
// Don't care about the presence of all the bits. Just our own.
|
||||
return 0;
|
||||
}
|
||||
}
|
||||
if (hits == bloom->hashes) {
|
||||
return 1; // 1 == element already in (or collision)
|
||||
}
|
||||
return 0;
|
||||
}
|
||||
|
||||
|
||||
// DEPRECATED - Please migrate to bloom_init2.
|
||||
int custombloom_init(struct custombloom * bloom, uint64_t entries, long double error)
|
||||
{
|
||||
return custombloom_init2(bloom, entries, error);
|
||||
}
|
||||
|
||||
|
||||
int custombloom_init2(struct custombloom * bloom, uint64_t entries, long double error)
|
||||
{
|
||||
memset(bloom, 0, sizeof(struct custombloom));
|
||||
if (entries < 1000 || error <= 0 || error >= 1) {
|
||||
return 1;
|
||||
}
|
||||
|
||||
bloom->entries = entries;
|
||||
bloom->error = error;
|
||||
|
||||
long double num = -log(bloom->error);
|
||||
long double denom = 0.480453013918201; // ln(2)^2
|
||||
bloom->bpe = (num / denom);
|
||||
|
||||
long double dentries = (long double)entries;
|
||||
long double allbits = dentries * bloom->bpe;
|
||||
bloom->bits = (uint64_t)allbits;
|
||||
|
||||
bloom->bytes = (uint64_t) bloom->bits / 8;
|
||||
if (bloom->bits % 8) {
|
||||
bloom->bytes +=1;
|
||||
}
|
||||
|
||||
bloom->hashes = (uint8_t)ceil(0.693147180559945 * bloom->bpe); // ln(2)
|
||||
|
||||
bloom->bf = (uint8_t *)calloc(bloom->bytes, sizeof(uint8_t));
|
||||
if (bloom->bf == NULL) { // LCOV_EXCL_START
|
||||
return 1;
|
||||
} // LCOV_EXCL_STOP
|
||||
|
||||
bloom->ready = 1;
|
||||
bloom->major = BLOOM_VERSION_MAJOR;
|
||||
bloom->minor = BLOOM_VERSION_MINOR;
|
||||
return 0;
|
||||
}
|
||||
|
||||
|
||||
int custombloom_check(struct custombloom * bloom, const void * buffer, int len)
|
||||
{
|
||||
return custombloom_check_add(bloom, buffer, len, 0);
|
||||
}
|
||||
|
||||
|
||||
int custombloom_add(struct custombloom * bloom, const void * buffer, int len)
|
||||
{
|
||||
return custombloom_check_add(bloom, buffer, len, 1);
|
||||
}
|
||||
|
||||
|
||||
void custombloom_print(struct custombloom * bloom)
|
||||
{
|
||||
printf("bloom at %p\n", (void *)bloom);
|
||||
if (!bloom->ready) { printf(" *** NOT READY ***\n"); }
|
||||
printf(" ->version = %d.%d\n", bloom->major, bloom->minor);
|
||||
printf(" ->entries = %"PRIu64"\n", bloom->entries);
|
||||
printf(" ->error = %Lf\n", bloom->error);
|
||||
printf(" ->bits = %"PRIu64"\n", bloom->bits);
|
||||
printf(" ->bits per elem = %f\n", bloom->bpe);
|
||||
printf(" ->bytes = %"PRIu64"\n", bloom->bytes);
|
||||
unsigned int KB = bloom->bytes / 1024;
|
||||
unsigned int MB = KB / 1024;
|
||||
printf(" (%u KB, %u MB)\n", KB, MB);
|
||||
printf(" ->hash functions = %d\n", bloom->hashes);
|
||||
}
|
||||
|
||||
|
||||
void custombloom_free(struct custombloom * bloom)
|
||||
{
|
||||
if (bloom->ready) {
|
||||
free(bloom->bf);
|
||||
}
|
||||
bloom->ready = 0;
|
||||
}
|
||||
|
||||
|
||||
int custombloom_reset(struct custombloom * bloom)
|
||||
{
|
||||
if (!bloom->ready) return 1;
|
||||
memset(bloom->bf, 0, bloom->bytes);
|
||||
return 0;
|
||||
}
|
||||
|
||||
|
||||
int custombloom_save(struct custombloom * bloom, char * filename)
|
||||
{
|
||||
if (filename == NULL || filename[0] == 0) {
|
||||
return 1;
|
||||
}
|
||||
|
||||
int fd = open(filename, O_WRONLY | O_CREAT, 0644);
|
||||
if (fd < 0) {
|
||||
return 1;
|
||||
}
|
||||
|
||||
ssize_t out = write(fd, BLOOM_MAGIC, strlen(BLOOM_MAGIC));
|
||||
if (out != strlen(BLOOM_MAGIC)) { goto save_error; } // LCOV_EXCL_LINE
|
||||
|
||||
uint16_t size = sizeof(struct custombloom);
|
||||
out = write(fd, &size, sizeof(uint16_t));
|
||||
if (out != sizeof(uint16_t)) { goto save_error; } // LCOV_EXCL_LINE
|
||||
|
||||
out = write(fd, bloom, sizeof(struct custombloom));
|
||||
if (out != sizeof(struct custombloom)) { goto save_error; } // LCOV_EXCL_LINE
|
||||
|
||||
out = write(fd, bloom->bf, bloom->bytes);
|
||||
if (out != bloom->bytes) { goto save_error; } // LCOV_EXCL_LINE
|
||||
|
||||
close(fd);
|
||||
return 0;
|
||||
// LCOV_EXCL_START
|
||||
save_error:
|
||||
close(fd);
|
||||
return 1;
|
||||
// LCOV_EXCL_STOP
|
||||
}
|
||||
|
||||
|
||||
int custombloom_load(struct custombloom * bloom, char * filename)
|
||||
{
|
||||
int rv = 0;
|
||||
|
||||
if (filename == NULL || filename[0] == 0) { return 1; }
|
||||
if (bloom == NULL) { return 2; }
|
||||
|
||||
memset(bloom, 0, sizeof(struct custombloom));
|
||||
|
||||
int fd = open(filename, O_RDONLY);
|
||||
if (fd < 0) { return 3; }
|
||||
|
||||
char line[30];
|
||||
memset(line, 0, 30);
|
||||
ssize_t in = read(fd, line, strlen(BLOOM_MAGIC));
|
||||
|
||||
if (in != strlen(BLOOM_MAGIC)) {
|
||||
rv = 4;
|
||||
goto load_error;
|
||||
}
|
||||
|
||||
if (strncmp(line, BLOOM_MAGIC, strlen(BLOOM_MAGIC))) {
|
||||
rv = 5;
|
||||
goto load_error;
|
||||
}
|
||||
|
||||
uint16_t size;
|
||||
in = read(fd, &size, sizeof(uint16_t));
|
||||
if (in != sizeof(uint16_t)) {
|
||||
rv = 6;
|
||||
goto load_error;
|
||||
}
|
||||
|
||||
if (size != sizeof(struct custombloom)) {
|
||||
rv = 7;
|
||||
goto load_error;
|
||||
}
|
||||
|
||||
in = read(fd, bloom, sizeof(struct custombloom));
|
||||
if (in != sizeof(struct custombloom)) {
|
||||
rv = 8;
|
||||
goto load_error;
|
||||
}
|
||||
|
||||
bloom->bf = NULL;
|
||||
if (bloom->major != BLOOM_VERSION_MAJOR) {
|
||||
rv = 9;
|
||||
goto load_error;
|
||||
}
|
||||
|
||||
bloom->bf = (unsigned char *)malloc(bloom->bytes);
|
||||
if (bloom->bf == NULL) { rv = 10; goto load_error; } // LCOV_EXCL_LINE
|
||||
|
||||
in = read(fd, bloom->bf, bloom->bytes);
|
||||
if (in != bloom->bytes) {
|
||||
rv = 11;
|
||||
free(bloom->bf);
|
||||
bloom->bf = NULL;
|
||||
goto load_error;
|
||||
}
|
||||
|
||||
close(fd);
|
||||
return rv;
|
||||
|
||||
load_error:
|
||||
close(fd);
|
||||
bloom->ready = 0;
|
||||
return rv;
|
||||
}
|
||||
|
||||
|
||||
const char * custombloom_version()
|
||||
{
|
||||
return MAKESTRING(BLOOM_VERSION);
|
||||
}
|
@ -1,210 +0,0 @@
|
||||
/*
|
||||
* Copyright (c) 2012-2019, Jyri J. Virkki
|
||||
* All rights reserved.
|
||||
*
|
||||
* This file is under BSD license. See LICENSE file.
|
||||
*/
|
||||
|
||||
#ifndef _CUSTOMBLOOM_H
|
||||
#define _CUSTOMBLOOM_H
|
||||
|
||||
#ifdef __cplusplus
|
||||
extern "C" {
|
||||
#endif
|
||||
|
||||
|
||||
/** ***************************************************************************
|
||||
* Structure to keep track of one bloom filter. Caller needs to
|
||||
* allocate this and pass it to the functions below. First call for
|
||||
* every struct must be to bloom_init().
|
||||
*
|
||||
*/
|
||||
struct custombloom
|
||||
{
|
||||
// These fields are part of the public interface of this structure.
|
||||
// Client code may read these values if desired. Client code MUST NOT
|
||||
// modify any of these.
|
||||
uint64_t entries;
|
||||
uint64_t bits;
|
||||
uint64_t bytes;
|
||||
uint8_t hashes;
|
||||
long double error;
|
||||
|
||||
// Fields below are private to the implementation. These may go away or
|
||||
// change incompatibly at any moment. Client code MUST NOT access or rely
|
||||
// on these.
|
||||
uint8_t ready;
|
||||
uint8_t major;
|
||||
uint8_t minor;
|
||||
double bpe;
|
||||
uint8_t *bf;
|
||||
};
|
||||
|
||||
|
||||
/** ***************************************************************************
|
||||
* Initialize the bloom filter for use.
|
||||
*
|
||||
* The filter is initialized with a bit field and number of hash functions
|
||||
* according to the computations from the wikipedia entry:
|
||||
* http://en.wikipedia.org/wiki/Bloom_filter
|
||||
*
|
||||
* Optimal number of bits is:
|
||||
* bits = (entries * ln(error)) / ln(2)^2
|
||||
*
|
||||
* Optimal number of hash functions is:
|
||||
* hashes = bpe * ln(2)
|
||||
*
|
||||
* Parameters:
|
||||
* -----------
|
||||
* bloom - Pointer to an allocated struct custombloom (see above).
|
||||
* entries - The expected number of entries which will be inserted.
|
||||
* Must be at least 1000 (in practice, likely much larger).
|
||||
* error - Probability of collision (as long as entries are not
|
||||
* exceeded).
|
||||
*
|
||||
* Return:
|
||||
* -------
|
||||
* 0 - on success
|
||||
* 1 - on failure
|
||||
*
|
||||
*/
|
||||
int custombloom_init2(struct custombloom * bloom, uint64_t entries, long double error);
|
||||
|
||||
|
||||
/**
|
||||
* DEPRECATED.
|
||||
* Kept for compatibility with libbloom v.1. To be removed in v3.0.
|
||||
*
|
||||
*/
|
||||
int bcustombloom_init(struct custombloom * bloom, uint64_t entries, long double error);
|
||||
|
||||
|
||||
/** ***************************************************************************
|
||||
* Check if the given element is in the bloom filter. Remember this may
|
||||
* return false positive if a collision occurred.
|
||||
*
|
||||
* Parameters:
|
||||
* -----------
|
||||
* bloom - Pointer to an allocated struct custombloom (see above).
|
||||
* buffer - Pointer to buffer containing element to check.
|
||||
* len - Size of 'buffer'.
|
||||
*
|
||||
* Return:
|
||||
* -------
|
||||
* 0 - element is not present
|
||||
* 1 - element is present (or false positive due to collision)
|
||||
* -1 - bloom not initialized
|
||||
*
|
||||
*/
|
||||
int custombloom_check(struct custombloom * bloom, const void * buffer, int len);
|
||||
|
||||
|
||||
/** ***************************************************************************
|
||||
* Add the given element to the bloom filter.
|
||||
* The return code indicates if the element (or a collision) was already in,
|
||||
* so for the common check+add use case, no need to call check separately.
|
||||
*
|
||||
* Parameters:
|
||||
* -----------
|
||||
* bloom - Pointer to an allocated struct custombloom (see above).
|
||||
* buffer - Pointer to buffer containing element to add.
|
||||
* len - Size of 'buffer'.
|
||||
*
|
||||
* Return:
|
||||
* -------
|
||||
* 0 - element was not present and was added
|
||||
* 1 - element (or a collision) had already been added previously
|
||||
* -1 - bloom not initialized
|
||||
*
|
||||
*/
|
||||
int custombloom_add(struct custombloom * bloom, const void * buffer, int len);
|
||||
|
||||
|
||||
/** ***************************************************************************
|
||||
* Print (to stdout) info about this bloom filter. Debugging aid.
|
||||
*
|
||||
*/
|
||||
void custombloom_print(struct custombloom * bloom);
|
||||
|
||||
|
||||
/** ***************************************************************************
|
||||
* Deallocate internal storage.
|
||||
*
|
||||
* Upon return, the bloom struct is no longer usable. You may call bloom_init
|
||||
* again on the same struct to reinitialize it again.
|
||||
*
|
||||
* Parameters:
|
||||
* -----------
|
||||
* bloom - Pointer to an allocated struct custombloom (see above).
|
||||
*
|
||||
* Return: none
|
||||
*
|
||||
*/
|
||||
void custombloom_free(struct custombloom * bloom);
|
||||
|
||||
|
||||
/** ***************************************************************************
|
||||
* Erase internal storage.
|
||||
*
|
||||
* Erases all elements. Upon return, the bloom struct returns to its initial
|
||||
* (initialized) state.
|
||||
*
|
||||
* Parameters:
|
||||
* -----------
|
||||
* bloom - Pointer to an allocated struct custombloom (see above).
|
||||
*
|
||||
* Return:
|
||||
* 0 - on success
|
||||
* 1 - on failure
|
||||
*
|
||||
*/
|
||||
int custombloom_reset(struct custombloom * bloom);
|
||||
|
||||
|
||||
/** ***************************************************************************
|
||||
* Save a bloom filter to a file.
|
||||
*
|
||||
* Parameters:
|
||||
* -----------
|
||||
* bloom - Pointer to an allocated struct custombloom (see above).
|
||||
* filename - Create (or overwrite) bloom data to this file.
|
||||
*
|
||||
* Return:
|
||||
* 0 - on success
|
||||
* 1 - on failure
|
||||
*
|
||||
*/
|
||||
int custombloom_save(struct custombloom * bloom, char * filename);
|
||||
|
||||
|
||||
/** ***************************************************************************
|
||||
* Load a bloom filter from a file.
|
||||
*
|
||||
* This functions loads a file previously saved with bloom_save().
|
||||
*
|
||||
* Parameters:
|
||||
* -----------
|
||||
* bloom - Pointer to an allocated struct custombloom (see above).
|
||||
* filename - Load bloom filter data from this file.
|
||||
*
|
||||
* Return:
|
||||
* 0 - on success
|
||||
* > 0 - on failure
|
||||
*
|
||||
*/
|
||||
int custombloom_load(struct custombloom * bloom, char * filename);
|
||||
|
||||
|
||||
/** ***************************************************************************
|
||||
* Returns version string compiled into library.
|
||||
*
|
||||
* Return: version string
|
||||
*
|
||||
*/
|
||||
const char * custombloom_version();
|
||||
|
||||
#ifdef __cplusplus
|
||||
}
|
||||
#endif
|
||||
|
||||
#endif
|
Loading…
x
Reference in New Issue
Block a user