hash.pyx 1.5 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849
  1. from libc.stdint cimport uint64_t
  2. from libc.string cimport memcpy
  3. from lakesuperior.store.ldp_rs.term cimport Buffer
  4. memcpy(&term_hash_seed1, TERM_HASH_SEED, SEED_LEN)
  5. memcpy(&term_hash_seed2, TERM_HASH_SEED + SEED_LEN, SEED_LEN)
  6. # We only need a couple of functions from spookyhash. No need for a pxd file.
  7. cdef extern from 'spookyhash_api.h':
  8. void spookyhash_128(
  9. const void *input, size_t input_size, uint64_t *hash_1,
  10. uint64_t *hash_2)
  11. uint64_t spookyhash_64(const void *input, size_t input_size, uint64_t seed)
  12. cdef inline int hash128(const Buffer *message, Hash128 *hash) except -1:
  13. """
  14. Get the hash value of a byte string with a defined size.
  15. The hashing algorithm is `SpookyHash
  16. <http://burtleburtle.net/bob/hash/spooky.html>`_ which produces 128-bit
  17. (16-byte) digests.
  18. The initial seeds are determined in the application configuration.
  19. :rtype: Hash128
  20. """
  21. cdef:
  22. DoubleHash64 seed = [term_hash_seed1, term_hash_seed2]
  23. Hash128 digest
  24. spookyhash_128(message[0].addr, message[0].sz, seed, seed + 1)
  25. # This casts the 2 contiguous uint64_t's into a char[16] pointer.
  26. hash[0] = <Hash128>seed
  27. cdef inline int hash64(const Buffer *message, Hash64 *hash) except -1:
  28. """
  29. Get a 64-bit (unsigned long) hash value of a byte string.
  30. This function also uses SpookyHash. Note that this returns a UInt64 while
  31. the 128-bit function returns a char array.
  32. """
  33. cdef uint64_t seed = term_hash_seed1
  34. hash[0] = spookyhash_64(message[0].addr, message[0].sz, seed)