From 2dec07424eaeade587740f1d2751986a36ea70f1 Mon Sep 17 00:00:00 2001 From: mame Date: Sat, 14 Feb 2009 19:55:34 +0000 Subject: * string.c (rb_hash_uint32, rb_hash_uint, rb_hash_start, rb_hash_end), include/ruby/intern.h: add Murmurhash API. [ruby-dev:37784] * complex.c (nucomp_hash), array.c (rb_ary_hash), time.c (time_hash), string.c (rb_str_hsah), object.c (rb_obj_hash), range.c (range_hash), struct.c (rb_struct_hash), hash.c (rb_any_hash), rational.c (nurat_hash): use Murmurhash. [ruby-dev:37784] git-svn-id: http://svn.ruby-lang.org/repos/ruby/trunk@22317 b2dd03c8-39d4-4d8f-98ff-823fe69b080e --- string.c | 58 +++++++++++++++++++++++++++++++++++++++++++++++++++++++--- 1 file changed, 55 insertions(+), 3 deletions(-) (limited to 'string.c') diff --git a/string.c b/string.c index 28410a448..4f30aea59 100644 --- a/string.c +++ b/string.c @@ -1912,6 +1912,7 @@ murmur(unsigned int h, unsigned int k, int r) #endif return h; } +#define murmur16(h) murmur_step(h, 16) static inline unsigned int murmur_finish(unsigned int h) @@ -2053,8 +2054,53 @@ hash(const unsigned char * data, int len, unsigned int h) return murmur_finish(h); } -int -rb_memhash(const void *ptr, long len) +unsigned int +rb_hash_uint32(unsigned int h, unsigned int i) +{ + return murmur_step(h + i, 16); +} + +unsigned int +rb_hash_uint(unsigned int h, unsigned int i) +{ + unsigned int v = 0; + h += i; +#ifdef WORDS_BIGENDIAN +#if SIZEOF_INT*CHAR_BIT > 12*8 + v = murmur16(v + (h >> 12*8)); +#endif +#if SIZEOF_INT*CHAR_BIT > 8*8 + v = murmur16(v + (h >> 8*8)); +#endif +#if SIZEOF_INT*CHAR_BIT > 4*8 + v = murmur16(v + (h >> 4*8)); +#endif +#endif + v = murmur16(v + h); +#ifndef WORDS_BIGENDIAN +#if SIZEOF_INT*CHAR_BIT > 4*8 + v = murmur16(v + (h >> 4*8)); +#endif +#if SIZEOF_INT*CHAR_BIT > 8*8 + v = murmur16(v + (h >> 8*8)); +#endif +#if SIZEOF_INT*CHAR_BIT > 12*8 + v = murmur16(v + (h >> 12*8)); +#endif +#endif + return v; +} + +unsigned int +rb_hash_end(unsigned int h) +{ + h = murmur_step(h, 10); + h = murmur_step(h, 17); + return h; +} + +unsigned int +rb_hash_start(unsigned int h) { static int hashseed_init = 0; static unsigned int hashseed; @@ -2064,7 +2110,13 @@ rb_memhash(const void *ptr, long len) hashseed_init = 1; } - return hash(ptr, len, hashseed); + return hashseed + h; +} + +int +rb_memhash(const void *ptr, long len) +{ + return hash(ptr, len, rb_hash_start(0)); } int -- cgit