murmur3_32.c 3.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132
  1. /*-
  2. * Copyright (c) 2014 Dag-Erling Smørgrav
  3. * All rights reserved.
  4. *
  5. * Redistribution and use in source and binary forms, with or without
  6. * modification, are permitted provided that the following conditions
  7. * are met:
  8. * 1. Redistributions of source code must retain the above copyright
  9. * notice, this list of conditions and the following disclaimer.
  10. * 2. Redistributions in binary form must reproduce the above copyright
  11. * notice, this list of conditions and the following disclaimer in the
  12. * documentation and/or other materials provided with the distribution.
  13. *
  14. * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
  15. * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  16. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  17. * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
  18. * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  19. * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  20. * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  21. * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  22. * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  23. * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  24. * SUCH DAMAGE.
  25. *
  26. * $FreeBSD$
  27. */
  28. #include <sys/hash.h>
  29. #include <sys/endian.h>
  30. #include <sys/stdint.h>
  31. #include <sys/types.h>
  32. #define rol32(i32, n) ((i32) << (n) | (i32) >> (32 - (n)))
  33. /*
  34. * Simple implementation of the Murmur3-32 hash function.
  35. *
  36. * This implementation is slow but safe. It can be made significantly
  37. * faster if the caller guarantees that the input is correctly aligned for
  38. * 32-bit reads, and slightly faster yet if the caller guarantees that the
  39. * length of the input is always a multiple of 4 bytes.
  40. */
  41. uint32_t
  42. murmur3_32_hash(const void *data, size_t len, uint32_t seed)
  43. {
  44. const uint8_t *bytes;
  45. uint32_t hash, k;
  46. size_t res;
  47. /* initialization */
  48. bytes = data;
  49. res = len;
  50. hash = seed;
  51. /* main loop */
  52. while (res >= 4) {
  53. /* replace with le32toh() if input is aligned */
  54. k = le32dec(bytes);
  55. bytes += 4;
  56. res -= 4;
  57. k *= 0xcc9e2d51;
  58. k = rol32(k, 15);
  59. k *= 0x1b873593;
  60. hash ^= k;
  61. hash = rol32(hash, 13);
  62. hash *= 5;
  63. hash += 0xe6546b64;
  64. }
  65. /* remainder */
  66. /* remove if input length is a multiple of 4 */
  67. if (res > 0) {
  68. k = 0;
  69. switch (res) {
  70. case 3:
  71. k |= bytes[2] << 16;
  72. case 2:
  73. k |= bytes[1] << 8;
  74. case 1:
  75. k |= bytes[0];
  76. k *= 0xcc9e2d51;
  77. k = rol32(k, 15);
  78. k *= 0x1b873593;
  79. hash ^= k;
  80. break;
  81. }
  82. }
  83. /* finalize */
  84. hash ^= (uint32_t)len;
  85. hash ^= hash >> 16;
  86. hash *= 0x85ebca6b;
  87. hash ^= hash >> 13;
  88. hash *= 0xc2b2ae35;
  89. hash ^= hash >> 16;
  90. return (hash);
  91. }
  92. /*
  93. * Simplified version of the above optimized for aligned sequences of
  94. * 32-bit words. The count argument is the number of words, not the
  95. * length in bytes.
  96. */
  97. uint32_t
  98. murmur3_32_hash32(const uint32_t *data, size_t count, uint32_t seed)
  99. {
  100. uint32_t hash, k;
  101. size_t res;
  102. /* iterate */
  103. for (res = count, hash = seed; res > 0; res--, data++) {
  104. k = le32toh(*data);
  105. k *= 0xcc9e2d51;
  106. k = rol32(k, 15);
  107. k *= 0x1b873593;
  108. hash ^= k;
  109. hash = rol32(hash, 13);
  110. hash *= 5;
  111. hash += 0xe6546b64;
  112. }
  113. /* finalize */
  114. hash ^= (uint32_t)count;
  115. hash ^= hash >> 16;
  116. hash *= 0x85ebca6b;
  117. hash ^= hash >> 13;
  118. hash *= 0xc2b2ae35;
  119. hash ^= hash >> 16;
  120. return (hash);
  121. }