/* * Copyright (c) 2012-2019, Jyri J. Virkki * All rights reserved. * * This file is under BSD license. See LICENSE file. */ #ifndef _BLOOM_H #define _BLOOM_H #ifdef __cplusplus extern "C" { #endif /** *************************************************************************** * Structure to keep track of one bloom filter. Caller needs to * allocate this and pass it to the functions below. First call for * every struct must be to bloom_init(). * */ struct bloom { // These fields are part of the public interface of this structure. // Client code may read these values if desired. Client code MUST NOT // modify any of these. uint64_t entries; uint64_t bits; uint64_t bytes; uint8_t hashes; long double error; // Fields below are private to the implementation. These may go away or // change incompatibly at any moment. Client code MUST NOT access or rely // on these. uint8_t ready; uint8_t major; uint8_t minor; double bpe; uint8_t *bf; }; /* Customs */ int bloom_dummy(struct bloom * bloom, uint64_t entries, long double error); int bloom_loadcustom(struct bloom * bloom, char * filename); int bloom_savecustom(struct bloom * bloom, char * filename); /** *************************************************************************** * Initialize the bloom filter for use. * * The filter is initialized with a bit field and number of hash functions * according to the computations from the wikipedia entry: * http://en.wikipedia.org/wiki/Bloom_filter * * Optimal number of bits is: * bits = (entries * ln(error)) / ln(2)^2 * * Optimal number of hash functions is: * hashes = bpe * ln(2) * * Parameters: * ----------- * bloom - Pointer to an allocated struct bloom (see above). * entries - The expected number of entries which will be inserted. * Must be at least 1000 (in practice, likely much larger). * error - Probability of collision (as long as entries are not * exceeded). * * Return: * ------- * 0 - on success * 1 - on failure * */ int bloom_init2(struct bloom * bloom, uint64_t entries, long double error); /** * DEPRECATED. * Kept for compatibility with libbloom v.1. To be removed in v3.0. * */ int bloom_init(struct bloom * bloom, uint64_t entries, long double error); /** *************************************************************************** * Check if the given element is in the bloom filter. Remember this may * return false positive if a collision occurred. * * Parameters: * ----------- * bloom - Pointer to an allocated struct bloom (see above). * buffer - Pointer to buffer containing element to check. * len - Size of 'buffer'. * * Return: * ------- * 0 - element is not present * 1 - element is present (or false positive due to collision) * -1 - bloom not initialized * */ int bloom_check(struct bloom * bloom, const void * buffer, int len); /** *************************************************************************** * Add the given element to the bloom filter. * The return code indicates if the element (or a collision) was already in, * so for the common check+add use case, no need to call check separately. * * Parameters: * ----------- * bloom - Pointer to an allocated struct bloom (see above). * buffer - Pointer to buffer containing element to add. * len - Size of 'buffer'. * * Return: * ------- * 0 - element was not present and was added * 1 - element (or a collision) had already been added previously * -1 - bloom not initialized * */ int bloom_add(struct bloom * bloom, const void * buffer, int len); /** *************************************************************************** * Print (to stdout) info about this bloom filter. Debugging aid. * */ void bloom_print(struct bloom * bloom); /** *************************************************************************** * Deallocate internal storage. * * Upon return, the bloom struct is no longer usable. You may call bloom_init * again on the same struct to reinitialize it again. * * Parameters: * ----------- * bloom - Pointer to an allocated struct bloom (see above). * * Return: none * */ void bloom_free(struct bloom * bloom); /** *************************************************************************** * Erase internal storage. * * Erases all elements. Upon return, the bloom struct returns to its initial * (initialized) state. * * Parameters: * ----------- * bloom - Pointer to an allocated struct bloom (see above). * * Return: * 0 - on success * 1 - on failure * */ int bloom_reset(struct bloom * bloom); /** *************************************************************************** * Save a bloom filter to a file. * * Parameters: * ----------- * bloom - Pointer to an allocated struct bloom (see above). * filename - Create (or overwrite) bloom data to this file. * * Return: * 0 - on success * 1 - on failure * */ int bloom_save(struct bloom * bloom, char * filename); /** *************************************************************************** * Load a bloom filter from a file. * * This functions loads a file previously saved with bloom_save(). * * Parameters: * ----------- * bloom - Pointer to an allocated struct bloom (see above). * filename - Load bloom filter data from this file. * * Return: * 0 - on success * > 0 - on failure * */ int bloom_load(struct bloom * bloom, char * filename); /** *************************************************************************** * Returns version string compiled into library. * * Return: version string * */ const char * bloom_version(); #ifdef __cplusplus } #endif #endif