Line | Count | Source (jump to first uncovered line) |
1 | | // Copyright (c) 2011-present, Facebook, Inc. All rights reserved. |
2 | | // This source code is licensed under both the GPLv2 (found in the |
3 | | // COPYING file in the root directory) and Apache 2.0 License |
4 | | // (found in the LICENSE.Apache file in the root directory). |
5 | | // |
6 | | // Copyright (c) 2011 The LevelDB Authors. All rights reserved. |
7 | | // Use of this source code is governed by a BSD-style license that can be |
8 | | // found in the LICENSE file. See the AUTHORS file for names of contributors. |
9 | | // |
10 | | // Common hash functions with convenient interfaces. If hashing a |
11 | | // statically-sized input in a performance-critical context, consider |
12 | | // calling a specific hash implementation directly, such as |
13 | | // XXH3_64bits from xxhash.h. |
14 | | // |
15 | | // Since this is a very common header, implementation details are kept |
16 | | // out-of-line. Out-of-lining also aids in tracking the time spent in |
17 | | // hashing functions. Inlining is of limited benefit for runtime-sized |
18 | | // hash inputs. |
19 | | |
20 | | #pragma once |
21 | | |
22 | | #include <cstddef> |
23 | | #include <cstdint> |
24 | | |
25 | | #include "rocksdb/slice.h" |
26 | | #include "util/fastrange.h" |
27 | | |
28 | | namespace ROCKSDB_NAMESPACE { |
29 | | |
30 | | // Stable/persistent 64-bit hash. Higher quality and generally faster than |
31 | | // Hash(), especially for inputs > 24 bytes. |
32 | | // KNOWN FLAW: incrementing seed by 1 might not give sufficiently independent |
33 | | // results from previous seed. Recommend incrementing by a large odd number. |
34 | | uint64_t Hash64(const char* data, size_t n, uint64_t seed); |
35 | | |
36 | | // Specific optimization without seed (same as seed = 0) |
37 | | uint64_t Hash64(const char* data, size_t n); |
38 | | |
39 | | // Non-persistent hash. Must only used for in-memory data structures. |
40 | | // The hash results are thus subject to change between releases, |
41 | | // architectures, build configuration, etc. (Thus, it rarely makes sense |
42 | | // to specify a seed for this function, except for a "rolling" hash.) |
43 | | // KNOWN FLAW: incrementing seed by 1 might not give sufficiently independent |
44 | | // results from previous seed. Recommend incrementing by a large odd number. |
45 | 13.4M | inline uint64_t NPHash64(const char* data, size_t n, uint64_t seed) { |
46 | | #ifdef ROCKSDB_MODIFY_NPHASH |
47 | | // For testing "subject to change" |
48 | | return Hash64(data, n, seed + 123456789); |
49 | | #else |
50 | | // Currently same as Hash64 |
51 | 13.4M | return Hash64(data, n, seed); |
52 | 13.4M | #endif |
53 | 13.4M | } |
54 | | |
55 | | // Specific optimization without seed (same as seed = 0) |
56 | 0 | inline uint64_t NPHash64(const char* data, size_t n) { |
57 | | #ifdef ROCKSDB_MODIFY_NPHASH |
58 | | // For testing "subject to change" |
59 | | return Hash64(data, n, 123456789); |
60 | | #else |
61 | | // Currently same as Hash64 |
62 | 0 | return Hash64(data, n); |
63 | 0 | #endif |
64 | 0 | } |
65 | | |
66 | | // Convenient and equivalent version of Hash128 without depending on 128-bit |
67 | | // scalars |
68 | | void Hash2x64(const char* data, size_t n, uint64_t* high64, uint64_t* low64); |
69 | | void Hash2x64(const char* data, size_t n, uint64_t seed, uint64_t* high64, |
70 | | uint64_t* low64); |
71 | | |
72 | | // Hash 128 bits to 128 bits, guaranteed not to lose data (equivalent to |
73 | | // Hash2x64 on 16 bytes little endian) |
74 | | void BijectiveHash2x64(uint64_t in_high64, uint64_t in_low64, |
75 | | uint64_t* out_high64, uint64_t* out_low64); |
76 | | void BijectiveHash2x64(uint64_t in_high64, uint64_t in_low64, uint64_t seed, |
77 | | uint64_t* out_high64, uint64_t* out_low64); |
78 | | |
79 | | // Inverse of above (mostly for testing) |
80 | | void BijectiveUnhash2x64(uint64_t in_high64, uint64_t in_low64, |
81 | | uint64_t* out_high64, uint64_t* out_low64); |
82 | | void BijectiveUnhash2x64(uint64_t in_high64, uint64_t in_low64, uint64_t seed, |
83 | | uint64_t* out_high64, uint64_t* out_low64); |
84 | | |
85 | | // Stable/persistent 32-bit hash. Moderate quality and high speed on |
86 | | // small inputs. |
87 | | // TODO: consider rename to Hash32 |
88 | | // KNOWN FLAW: incrementing seed by 1 might not give sufficiently independent |
89 | | // results from previous seed. Recommend pseudorandom or hashed seeds. |
90 | | uint32_t Hash(const char* data, size_t n, uint32_t seed); |
91 | | |
92 | | // TODO: consider rename to LegacyBloomHash32 |
93 | 0 | inline uint32_t BloomHash(const Slice& key) { |
94 | 0 | return Hash(key.data(), key.size(), 0xbc9f1d34); |
95 | 0 | } |
96 | | |
97 | 0 | inline uint64_t GetSliceHash64(const Slice& key) { |
98 | 0 | return Hash64(key.data(), key.size()); |
99 | 0 | } |
100 | | // Provided for convenience for use with template argument deduction, where a |
101 | | // specific overload needs to be used. |
102 | | extern uint64_t (*kGetSliceNPHash64UnseededFnPtr)(const Slice&); |
103 | | |
104 | 0 | inline uint64_t GetSliceNPHash64(const Slice& s) { |
105 | 0 | return NPHash64(s.data(), s.size()); |
106 | 0 | } |
107 | | |
108 | 5.32M | inline uint64_t GetSliceNPHash64(const Slice& s, uint64_t seed) { |
109 | 5.32M | return NPHash64(s.data(), s.size(), seed); |
110 | 5.32M | } |
111 | | |
112 | | // Similar to `GetSliceNPHash64()` with `seed`, but input comes from |
113 | | // concatenation of `Slice`s in `data`. |
114 | | uint64_t GetSlicePartsNPHash64(const SliceParts& data, uint64_t seed); |
115 | | |
116 | 0 | inline size_t GetSliceRangedNPHash(const Slice& s, size_t range) { |
117 | 0 | return FastRange64(NPHash64(s.data(), s.size()), range); |
118 | 0 | } |
119 | | |
120 | | // TODO: consider rename to GetSliceHash32 |
121 | 94.7k | inline uint32_t GetSliceHash(const Slice& s) { |
122 | 94.7k | return Hash(s.data(), s.size(), 397); |
123 | 94.7k | } |
124 | | |
125 | | // Useful for splitting up a 64-bit hash |
126 | 63.8k | inline uint32_t Upper32of64(uint64_t v) { |
127 | 63.8k | return static_cast<uint32_t>(v >> 32); |
128 | 63.8k | } |
129 | 272k | inline uint32_t Lower32of64(uint64_t v) { return static_cast<uint32_t>(v); } |
130 | | |
131 | | // std::hash-like interface. |
132 | | struct SliceHasher32 { |
133 | 0 | uint32_t operator()(const Slice& s) const { return GetSliceHash(s); } |
134 | | }; |
135 | | struct SliceNPHasher64 { |
136 | 4.48k | uint64_t operator()(const Slice& s, uint64_t seed = 0) const { |
137 | 4.48k | return GetSliceNPHash64(s, seed); |
138 | 4.48k | } |
139 | | }; |
140 | | |
141 | | } // namespace ROCKSDB_NAMESPACE |