murmur.cc 3.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123
  1. /* vim:expandtab:shiftwidth=2:tabstop=2:smarttab:
  2. *
  3. * HashKit library
  4. *
  5. * Copyright (C) 2011-2012 Data Differential, http://datadifferential.com/
  6. * Copyright (C) 2006-2009 Brian Aker All rights reserved.
  7. *
  8. * Redistribution and use in source and binary forms, with or without
  9. * modification, are permitted provided that the following conditions are
  10. * met:
  11. *
  12. * * Redistributions of source code must retain the above copyright
  13. * notice, this list of conditions and the following disclaimer.
  14. *
  15. * * Redistributions in binary form must reproduce the above
  16. * copyright notice, this list of conditions and the following disclaimer
  17. * in the documentation and/or other materials provided with the
  18. * distribution.
  19. *
  20. * * The names of its contributors may not be used to endorse or
  21. * promote products derived from this software without specific prior
  22. * written permission.
  23. *
  24. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  25. * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  26. * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  27. * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  28. * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  29. * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  30. * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  31. * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  32. * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  33. * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  34. * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  35. *
  36. */
  37. /*
  38. "Murmur" hash provided by Austin, tanjent@gmail.com
  39. http://murmurhash.googlepages.com/
  40. Note - This code makes a few assumptions about how your machine behaves -
  41. 1. We can read a 4-byte value from any address without crashing
  42. 2. sizeof(int) == 4
  43. And it has a few limitations -
  44. 1. It will not work incrementally.
  45. 2. It will not produce the same results on little-endian and big-endian
  46. machines.
  47. Updated to murmur2 hash - BP
  48. */
  49. #include <libhashkit/common.h>
  50. #ifdef HAVE_MURMUR_HASH
  51. uint32_t hashkit_murmur(const char *key, size_t length, void *context)
  52. {
  53. /*
  54. 'm' and 'r' are mixing constants generated offline. They're not
  55. really 'magic', they just happen to work well.
  56. */
  57. const unsigned int m= 0x5bd1e995;
  58. const uint32_t seed= (0xdeadbeef * (uint32_t)length);
  59. const int r= 24;
  60. // Initialize the hash to a 'random' value
  61. uint32_t h= seed ^ (uint32_t)length;
  62. // Mix 4 bytes at a time into the hash
  63. const unsigned char * data= (const unsigned char *)key;
  64. (void)context;
  65. while(length >= 4)
  66. {
  67. unsigned int k = *(unsigned int *)data;
  68. k *= m;
  69. k ^= k >> r;
  70. k *= m;
  71. h *= m;
  72. h ^= k;
  73. data += 4;
  74. length -= 4;
  75. }
  76. // Handle the last few bytes of the input array
  77. switch(length)
  78. {
  79. case 3: h ^= ((uint32_t)data[2]) << 16;
  80. case 2: h ^= ((uint32_t)data[1]) << 8;
  81. case 1: h ^= data[0];
  82. h *= m;
  83. default: break;
  84. };
  85. /*
  86. Do a few final mixes of the hash to ensure the last few bytes are
  87. well-incorporated.
  88. */
  89. h ^= h >> 13;
  90. h *= m;
  91. h ^= h >> 15;
  92. return h;
  93. }
  94. #else
  95. uint32_t hashkit_murmur(const char *, size_t , void *)
  96. {
  97. return 0;
  98. }
  99. #endif