2013-08-10 12:06:09 +02:00
|
|
|
/**
|
|
|
|
* This file contains some simple hash function
|
|
|
|
*
|
|
|
|
* Copyright (C) 2013 Freie Universität Berlin
|
|
|
|
*
|
2013-11-22 20:47:05 +01:00
|
|
|
* This file is subject to the terms and conditions of the GNU Lesser General
|
2013-08-10 12:06:09 +02:00
|
|
|
* Public License. See the file LICENSE in the top level directory for more
|
|
|
|
* details.
|
|
|
|
*/
|
|
|
|
|
|
|
|
/**
|
|
|
|
* @file
|
|
|
|
* @autor Jason Linehan <patientulysses@gmail.com>
|
|
|
|
* @author Freie Universität Berlin, Computer Systems & Telematics
|
|
|
|
* @author Christian Mehlis <mehlis@inf.fu-berlin.de>
|
|
|
|
*/
|
|
|
|
|
2013-08-20 09:05:07 +02:00
|
|
|
#include <stddef.h>
|
|
|
|
#include <inttypes.h>
|
|
|
|
|
2013-08-10 12:06:09 +02:00
|
|
|
/**
|
2013-08-20 09:05:07 +02:00
|
|
|
* @brief djb2_hash
|
2013-08-10 12:06:09 +02:00
|
|
|
*
|
2013-08-04 22:01:11 +02:00
|
|
|
* HISTORY
|
|
|
|
* This algorithm (k=33) was first reported by Dan Bernstein many years
|
|
|
|
* ago in comp.lang.c. Another version of this algorithm (now favored by
|
|
|
|
* bernstein) uses XOR:
|
|
|
|
*
|
|
|
|
* hash(i) = hash(i - 1) * 33 ^ str[i];
|
|
|
|
*
|
|
|
|
* The magic of number 33 (why it works better than many other constants,
|
|
|
|
* prime or not) has never been adequately explained.
|
2013-08-20 09:05:07 +02:00
|
|
|
*
|
|
|
|
* @param buf input buffer to hash
|
|
|
|
* @param len length of buffer
|
|
|
|
* @return 32 bit sized hash
|
2013-08-10 12:06:09 +02:00
|
|
|
*/
|
2013-08-20 09:05:07 +02:00
|
|
|
uint32_t djb2_hash(const uint8_t *buf, size_t len);
|
2013-08-04 22:01:11 +02:00
|
|
|
|
2013-08-10 12:06:09 +02:00
|
|
|
/**
|
2013-08-20 09:05:07 +02:00
|
|
|
* @brief sdbm_hash
|
2013-08-10 12:06:09 +02:00
|
|
|
*
|
2013-08-04 22:01:11 +02:00
|
|
|
* HISTORY
|
|
|
|
* This algorithm was created for sdbm (a public-domain reimplementation
|
|
|
|
* of ndbm) database library. It was found to do well in scrambling bits,
|
|
|
|
* causing better distribution of the keys and fewer splits. it also
|
|
|
|
* happens to be a good general hashing function with good distribution.
|
|
|
|
*
|
|
|
|
* The actual function is
|
|
|
|
*
|
|
|
|
* hash(i) = hash(i - 1) * 65599 + str[i];
|
|
|
|
*
|
|
|
|
* What is included below is the faster version used in gawk. [there is
|
|
|
|
* even a faster, duff-device version] the magic constant 65599 was picked
|
|
|
|
* out of thin air while experimenting with different constants, and turns
|
|
|
|
* out to be a prime. this is one of the algorithms used in berkeley db
|
|
|
|
* (see sleepycat) and elsewhere.
|
|
|
|
*
|
2013-08-20 09:05:07 +02:00
|
|
|
* @param buf input buffer to hash
|
|
|
|
* @param len length of buffer
|
|
|
|
* @return 32 bit sized hash
|
2013-08-10 12:06:09 +02:00
|
|
|
*/
|
2013-08-20 09:05:07 +02:00
|
|
|
uint32_t sdbm_hash(const uint8_t *buf, size_t len);
|
2013-08-04 22:01:11 +02:00
|
|
|
|
2013-08-10 12:06:09 +02:00
|
|
|
/**
|
2013-08-20 09:05:07 +02:00
|
|
|
* @brief lose lose
|
2013-08-10 12:06:09 +02:00
|
|
|
*
|
2013-08-04 22:01:11 +02:00
|
|
|
* HISTORY
|
|
|
|
* This hash function appeared in K&R (1st ed) but at least the reader
|
|
|
|
* was warned:
|
|
|
|
*
|
|
|
|
* "This is not the best possible algorithm, but it has the merit
|
|
|
|
* of extreme simplicity."
|
|
|
|
*
|
|
|
|
* This is an understatement. It is a terrible hashing algorithm, and it
|
|
|
|
* could have been much better without sacrificing its "extreme simplicity."
|
|
|
|
* [see the second edition!]
|
|
|
|
*
|
|
|
|
* Many C programmers use this function without actually testing it, or
|
|
|
|
* checking something like Knuth's Sorting and Searching, so it stuck.
|
|
|
|
* It is now found mixed with otherwise respectable code, eg. cnews. sigh.
|
|
|
|
* [see also: tpop]
|
2013-08-20 09:05:07 +02:00
|
|
|
*
|
|
|
|
* @param buf input buffer to hash
|
|
|
|
* @param len length of buffer
|
|
|
|
* @return 32 bit sized hash
|
2013-08-10 12:06:09 +02:00
|
|
|
*/
|
2013-08-20 09:05:07 +02:00
|
|
|
uint32_t kr_hash(const uint8_t *buf, size_t len);
|
2013-08-04 22:01:11 +02:00
|
|
|
|
2013-08-10 12:06:09 +02:00
|
|
|
/**
|
2013-08-20 09:05:07 +02:00
|
|
|
* @bief sax_hash
|
2013-08-04 22:01:11 +02:00
|
|
|
*
|
2013-08-10 12:06:09 +02:00
|
|
|
* Shift, Add, XOR
|
2013-08-20 09:05:07 +02:00
|
|
|
*
|
|
|
|
* @param buf input buffer to hash
|
|
|
|
* @param len length of buffer
|
|
|
|
* @return 32 bit sized hash
|
2013-08-10 12:06:09 +02:00
|
|
|
*/
|
2013-08-20 09:05:07 +02:00
|
|
|
uint32_t sax_hash(const uint8_t *buf, size_t len);
|
2013-08-04 22:01:11 +02:00
|
|
|
|
2013-08-10 12:06:09 +02:00
|
|
|
/**
|
2013-08-20 09:05:07 +02:00
|
|
|
* @brief dek_hash
|
2013-08-10 12:06:09 +02:00
|
|
|
*
|
2013-08-04 22:01:11 +02:00
|
|
|
* HISTORY
|
|
|
|
* Proposed by Donald E. Knuth in The Art Of Computer Programming Vol. 3,
|
|
|
|
* under the topic of "Sorting and Search", Chapter 6.4.
|
2013-08-20 09:05:07 +02:00
|
|
|
*
|
|
|
|
* @param buf input buffer to hash
|
|
|
|
* @param len length of buffer
|
|
|
|
* @return 32 bit sized hash
|
2013-08-10 12:06:09 +02:00
|
|
|
*/
|
2013-08-20 09:05:07 +02:00
|
|
|
uint32_t dek_hash(const uint8_t *buf, size_t len);
|
2013-08-04 22:01:11 +02:00
|
|
|
|
2013-08-10 12:06:09 +02:00
|
|
|
/**
|
2013-08-20 09:05:07 +02:00
|
|
|
* @brief fnv_hash
|
2013-08-10 12:06:09 +02:00
|
|
|
*
|
2013-08-04 22:01:11 +02:00
|
|
|
* NOTE
|
|
|
|
* For a more fully featured and modern version of this hash, see fnv32.c
|
2013-08-20 09:05:07 +02:00
|
|
|
*
|
|
|
|
* @param buf input buffer to hash
|
|
|
|
* @param len length of buffer
|
|
|
|
* @return 32 bit sized hash
|
2013-08-10 12:06:09 +02:00
|
|
|
*/
|
2013-08-20 09:05:07 +02:00
|
|
|
uint32_t fnv_hash(const uint8_t *buf, size_t len);
|
2013-08-04 22:01:11 +02:00
|
|
|
|
|
|
|
|
2013-08-20 09:05:07 +02:00
|
|
|
/**
|
|
|
|
* @brief rotating_hash
|
|
|
|
*
|
|
|
|
* found on
|
|
|
|
* http://burtleburtle.net/bob/hash/doobs.html
|
|
|
|
*
|
|
|
|
* @param buf input buffer to hash
|
|
|
|
* @param len length of buffer
|
|
|
|
* @return 32 bit sized hash
|
|
|
|
*/
|
|
|
|
uint32_t rotating_hash(const uint8_t *buf, size_t len);
|
2013-08-04 22:01:11 +02:00
|
|
|
|
2013-08-20 09:05:07 +02:00
|
|
|
/**
|
|
|
|
* @brief one_at_a_time_hash
|
|
|
|
*
|
|
|
|
* found on
|
|
|
|
* http://burtleburtle.net/bob/hash/doobs.html
|
|
|
|
*
|
|
|
|
* @param buf input buffer to hash
|
|
|
|
* @param len length of buffer
|
|
|
|
* @return 32 bit sized hash
|
|
|
|
*/
|
|
|
|
uint32_t one_at_a_time_hash(const uint8_t *buf, size_t len);
|