You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

mishmash.cpp 3.1KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374
// mishmash.cpp
//
// Copyright (C) 2019-2020 MicroNeil Research Corporation.
//
// This software is released under the MIT license. See LICENSE.TXT.
//
// Mishmash is a non-cryptographic hash optimized for short strings.
  8. #include "mishmash.hpp"
  9. namespace codedweller {
  // Table of 256 ascending prime values, 1019 through 2957, laid out as
  // 32 rows of 8. The object is a plain (non-const) namespace-scope array,
  // exactly as originally declared.
  //
  // NOTE(review): nothing in the visible part of this file reads the table
  // directly; presumably selectedPrime(), which mishmash() calls, indexes it.
  // Confirm against mishmash.hpp.
  uint32_t primes[256] {
    1019, 1021, 1031, 1033, 1039, 1049, 1051, 1061,
    1063, 1069, 1087, 1091, 1093, 1097, 1103, 1109,
    1117, 1123, 1129, 1151, 1153, 1163, 1171, 1181,
    1187, 1193, 1201, 1213, 1217, 1223, 1229, 1231,
    1237, 1249, 1259, 1277, 1279, 1283, 1289, 1291,
    1297, 1301, 1303, 1307, 1319, 1321, 1327, 1361,
    1367, 1373, 1381, 1399, 1409, 1423, 1427, 1429,
    1433, 1439, 1447, 1451, 1453, 1459, 1471, 1481,
    1483, 1487, 1489, 1493, 1499, 1511, 1523, 1531,
    1543, 1549, 1553, 1559, 1567, 1571, 1579, 1583,
    1597, 1601, 1607, 1609, 1613, 1619, 1621, 1627,
    1637, 1657, 1663, 1667, 1669, 1693, 1697, 1699,
    1709, 1721, 1723, 1733, 1741, 1747, 1753, 1759,
    1777, 1783, 1787, 1789, 1801, 1811, 1823, 1831,
    1847, 1861, 1867, 1871, 1873, 1877, 1879, 1889,
    1901, 1907, 1913, 1931, 1933, 1949, 1951, 1973,
    1979, 1987, 1993, 1997, 1999, 2003, 2011, 2017,
    2027, 2029, 2039, 2053, 2063, 2069, 2081, 2083,
    2087, 2089, 2099, 2111, 2113, 2129, 2131, 2137,
    2141, 2143, 2153, 2161, 2179, 2203, 2207, 2213,
    2221, 2237, 2239, 2243, 2251, 2267, 2269, 2273,
    2281, 2287, 2293, 2297, 2309, 2311, 2333, 2339,
    2341, 2347, 2351, 2357, 2371, 2377, 2381, 2383,
    2389, 2393, 2399, 2411, 2417, 2423, 2437, 2441,
    2447, 2459, 2467, 2473, 2477, 2503, 2521, 2531,
    2539, 2543, 2549, 2551, 2557, 2579, 2591, 2593,
    2609, 2617, 2621, 2633, 2647, 2657, 2659, 2663,
    2671, 2677, 2683, 2687, 2689, 2693, 2699, 2707,
    2711, 2713, 2719, 2729, 2731, 2741, 2749, 2753,
    2767, 2777, 2789, 2791, 2797, 2801, 2803, 2819,
    2833, 2837, 2843, 2851, 2857, 2861, 2879, 2887,
    2897, 2903, 2909, 2917, 2927, 2939, 2953, 2957
  };
  // Returns n reduced modulo 256, i.e. only the low eight bits of n.
  // The result is therefore always in the range 0..255.
  //
  // NOTE(review): not called anywhere in the visible part of this file;
  // presumably used by selectedPrime() to index the primes table -- confirm.
  inline size_t mod256(size_t n) noexcept {
    return n & 0xff;
  }
  45. uint32_t mishmash(const unsigned char* buffer, size_t length) noexcept {
  46. uint64_t accumulator = selectedPrime(length);
  47. for(size_t index = 0; index < length; index++) {
  48. unsigned char byte = buffer[index];
  49. accumulator += selectedPrime(index + accumulator);
  50. accumulator *= selectedPrime(byte + accumulator);
  51. accumulator += accumulator >> 32;
  52. accumulator &= 0x00000fffffffffff;
  53. }
  54. return static_cast<uint32_t>(accumulator);
  55. }
  56. uint32_t mishmash(const std::string& s) noexcept {
  57. return mishmash((const unsigned char*) s.c_str(), s.length());
  58. }
  59. uint32_t mishmash(const std::vector<unsigned char>& v) noexcept {
  60. return mishmash(v.data(), v.size());
  61. }
  62. }