1 | /** |
2 | * MIT License |
3 | * |
4 | * Copyright (c) 2017 Tessil |
5 | * |
6 | * Permission is hereby granted, free of charge, to any person obtaining a copy |
7 | * of this software and associated documentation files (the "Software"), to deal |
8 | * in the Software without restriction, including without limitation the rights |
9 | * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell |
10 | * copies of the Software, and to permit persons to whom the Software is |
11 | * furnished to do so, subject to the following conditions: |
12 | * |
13 | * The above copyright notice and this permission notice shall be included in all |
14 | * copies or substantial portions of the Software. |
15 | * |
16 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
17 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
18 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE |
19 | * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER |
20 | * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, |
21 | * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE |
22 | * SOFTWARE. |
23 | */ |
24 | #ifndef TSL_HOPSCOTCH_HASH_H |
25 | #define TSL_HOPSCOTCH_HASH_H |
26 | |
27 | |
28 | #include <algorithm> |
29 | #include <array> |
30 | #include <cassert> |
31 | #include <cmath> |
32 | #include <climits> |
33 | #include <cstddef> |
34 | #include <cstdint> |
35 | #include <exception> |
36 | #include <functional> |
37 | #include <initializer_list> |
38 | #include <iterator> |
39 | #include <limits> |
40 | #include <memory> |
41 | #include <ratio> |
42 | #include <stdexcept> |
43 | #include <tuple> |
44 | #include <type_traits> |
45 | #include <utility> |
46 | #include <vector> |
47 | |
48 | #if (defined(__GNUC__) && (__GNUC__ == 4) && (__GNUC_MINOR__ < 9)) |
49 | #define TSL_NO_RANGE_ERASE_WITH_CONST_ITERATOR |
50 | #endif |
51 | |
52 | |
53 | |
54 | /* |
55 | * Only activate tsl_assert if TSL_DEBUG is defined. |
56 | * This way we avoid the performance hit when NDEBUG is not defined with assert as tsl_assert is used a lot |
57 | * (people usually compile with "-O3" and not "-O3 -DNDEBUG"). |
58 | */ |
59 | #ifndef tsl_assert |
60 | #ifdef TSL_DEBUG |
61 | #define tsl_assert(expr) assert(expr) |
62 | #else |
63 | #define tsl_assert(expr) (static_cast<void>(0)) |
64 | #endif |
65 | #endif |
66 | |
67 | namespace tsl { |
68 | |
69 | /** |
70 | * Grow the map by a factor of two keeping bucket_count to a power of two. It allows |
71 | * the map to use a mask operation instead of a modulo operation to map a hash to a bucket. |
72 | */ |
73 | class power_of_two_growth_policy { |
74 | public: |
75 | /** |
76 | * Called on map creation and rehash. The number of buckets requested is passed by parameter. |
77 | * This number is a minimum, the policy may update this value with a higher value if needed. |
78 | */ |
79 | power_of_two_growth_policy(std::size_t& min_bucket_count_in_out) { |
80 | if(min_bucket_count_in_out > max_bucket_count()) { |
81 | throw std::length_error("The map exceeds its maxmimum size." ); |
82 | } |
83 | |
84 | static_assert(MIN_BUCKETS_SIZE > 0, "" ); |
85 | const std::size_t min_bucket_count = MIN_BUCKETS_SIZE; |
86 | |
87 | min_bucket_count_in_out = std::max(min_bucket_count, min_bucket_count_in_out); |
88 | min_bucket_count_in_out = round_up_to_power_of_two(min_bucket_count_in_out); |
89 | m_mask = min_bucket_count_in_out - 1; |
90 | } |
91 | |
92 | /** |
93 | * Return the bucket [0, bucket_count()) to which the hash belongs. |
94 | */ |
95 | std::size_t bucket_for_hash(std::size_t hash) const { |
96 | return hash & m_mask; |
97 | } |
98 | |
99 | /** |
100 | * Return the bucket count to uses when the bucket array grows on rehash. |
101 | */ |
102 | std::size_t next_bucket_count() const { |
103 | if((m_mask + 1) > max_bucket_count()/2) { |
104 | throw std::length_error("The map exceeds its maxmimum size." ); |
105 | } |
106 | |
107 | return (m_mask + 1) * 2; |
108 | } |
109 | |
110 | /** |
111 | * Return the maximum number of buckets supported by the policy. |
112 | */ |
113 | std::size_t max_bucket_count() const { |
114 | return std::numeric_limits<std::size_t>::max()/2 + 1; |
115 | } |
116 | |
117 | private: |
118 | static std::size_t round_up_to_power_of_two(std::size_t value) { |
119 | if(value == 0) { |
120 | return 1; |
121 | } |
122 | |
123 | if(is_power_of_two(value)) { |
124 | return value; |
125 | } |
126 | |
127 | --value; |
128 | for(std::size_t i = 1; i < sizeof(std::size_t) * CHAR_BIT; i *= 2) { |
129 | value |= value >> i; |
130 | } |
131 | |
132 | return value + 1; |
133 | } |
134 | |
135 | static constexpr bool is_power_of_two(std::size_t value) { |
136 | return value != 0 && (value & (value - 1)) == 0; |
137 | } |
138 | |
139 | private: |
140 | static const std::size_t MIN_BUCKETS_SIZE = 2; |
141 | |
142 | std::size_t m_mask; |
143 | }; |
144 | |
145 | /** |
146 | * Grow the map by GrowthFactor::num/GrowthFactor::den and use a modulo to map a hash |
147 | * to a bucket. Slower but it can be usefull if you want a slower growth. |
148 | */ |
149 | template<class GrowthFactor = std::ratio<3, 2>> |
150 | class mod_growth_policy { |
151 | public: |
152 | mod_growth_policy(std::size_t& min_bucket_count_in_out) { |
153 | if(min_bucket_count_in_out > max_bucket_count()) { |
154 | throw std::length_error("The map exceeds its maxmimum size." ); |
155 | } |
156 | |
157 | static_assert(MIN_BUCKETS_SIZE > 0, "" ); |
158 | const std::size_t min_bucket_count = MIN_BUCKETS_SIZE; |
159 | |
160 | min_bucket_count_in_out = std::max(min_bucket_count, min_bucket_count_in_out); |
161 | m_bucket_count = min_bucket_count_in_out; |
162 | } |
163 | |
164 | std::size_t bucket_for_hash(std::size_t hash) const { |
165 | tsl_assert(m_bucket_count != 0); |
166 | return hash % m_bucket_count; |
167 | } |
168 | |
169 | std::size_t next_bucket_count() const { |
170 | if(m_bucket_count == max_bucket_count()) { |
171 | throw std::length_error("The map exceeds its maxmimum size." ); |
172 | } |
173 | |
174 | const double next_bucket_count = std::ceil(double(m_bucket_count) * REHASH_SIZE_MULTIPLICATION_FACTOR); |
175 | if(!std::isnormal(next_bucket_count)) { |
176 | throw std::length_error("The map exceeds its maxmimum size." ); |
177 | } |
178 | |
179 | if(next_bucket_count > double(max_bucket_count())) { |
180 | return max_bucket_count(); |
181 | } |
182 | else { |
183 | return std::size_t(next_bucket_count); |
184 | } |
185 | } |
186 | |
187 | std::size_t max_bucket_count() const { |
188 | return MAX_BUCKET_COUNT; |
189 | } |
190 | |
191 | private: |
192 | static const std::size_t MIN_BUCKETS_SIZE = 2; |
193 | static constexpr double REHASH_SIZE_MULTIPLICATION_FACTOR = 1.0*GrowthFactor::num/GrowthFactor::den; |
194 | static const std::size_t MAX_BUCKET_COUNT = |
195 | std::size_t(double( |
196 | std::numeric_limits<std::size_t>::max()/REHASH_SIZE_MULTIPLICATION_FACTOR |
197 | )); |
198 | |
199 | static_assert(REHASH_SIZE_MULTIPLICATION_FACTOR >= 1.1, "Grow factor should be >= 1.1." ); |
200 | |
201 | std::size_t m_bucket_count; |
202 | }; |
203 | |
204 | |
205 | |
206 | namespace detail_hopscotch_hash { |
207 | |
208 | static constexpr const std::array<std::size_t, 39> PRIMES = {{ |
209 | 5ul, 17ul, 29ul, 37ul, 53ul, 67ul, 79ul, 97ul, 131ul, 193ul, 257ul, 389ul, 521ul, 769ul, 1031ul, 1543ul, 2053ul, |
210 | 3079ul, 6151ul, 12289ul, 24593ul, 49157ul, 98317ul, 196613ul, 393241ul, 786433ul, 1572869ul, 3145739ul, |
211 | 6291469ul, 12582917ul, 25165843ul, 50331653ul, 100663319ul, 201326611ul, 402653189ul, 805306457ul, |
212 | 1610612741ul, 3221225473ul, 4294967291ul |
213 | }}; |
214 | |
215 | template<unsigned int IPrime> |
216 | static std::size_t mod(std::size_t hash) { return hash % PRIMES[IPrime]; } |
217 | |
218 | // MOD_PRIME[iprime](hash) returns hash % PRIMES[iprime]. This table allows for faster modulo as the |
219 | // compiler can optimize the modulo code better with a constant known at the compilation. |
220 | static constexpr const std::array<std::size_t(*)(std::size_t), 39> MOD_PRIME = {{ |
221 | &mod<0>, &mod<1>, &mod<2>, &mod<3>, &mod<4>, &mod<5>, &mod<6>, &mod<7>, &mod<8>, &mod<9>, &mod<10>, |
222 | &mod<11>, &mod<12>, &mod<13>, &mod<14>, &mod<15>, &mod<16>, &mod<17>, &mod<18>, &mod<19>, &mod<20>, |
223 | &mod<21>, &mod<22>, &mod<23>, &mod<24>, &mod<25>, &mod<26>, &mod<27>, &mod<28>, &mod<29>, &mod<30>, |
224 | &mod<31>, &mod<32>, &mod<33>, &mod<34>, &mod<35>, &mod<36>, &mod<37> , &mod<38> |
225 | }}; |
226 | |
227 | } |
228 | |
229 | /** |
230 | * Grow the map by using prime numbers as size. Slower than tsl::power_of_two_growth_policy in general |
231 | * but will probably distribute the values around better in the buckets with a poor hash function. |
232 | */ |
233 | class prime_growth_policy { |
234 | public: |
235 | prime_growth_policy(std::size_t& min_bucket_count_in_out) { |
236 | auto it_prime = std::lower_bound(tsl::detail_hopscotch_hash::PRIMES.begin(), |
237 | tsl::detail_hopscotch_hash::PRIMES.end(), min_bucket_count_in_out); |
238 | if(it_prime == tsl::detail_hopscotch_hash::PRIMES.end()) { |
239 | throw std::length_error("The map exceeds its maxmimum size." ); |
240 | } |
241 | |
242 | m_iprime = static_cast<unsigned int>(std::distance(tsl::detail_hopscotch_hash::PRIMES.begin(), it_prime)); |
243 | min_bucket_count_in_out = *it_prime; |
244 | } |
245 | |
246 | std::size_t bucket_for_hash(std::size_t hash) const { |
247 | return bucket_for_hash_iprime(hash, m_iprime); |
248 | } |
249 | |
250 | std::size_t next_bucket_count() const { |
251 | if(m_iprime + 1 >= tsl::detail_hopscotch_hash::PRIMES.size()) { |
252 | throw std::length_error("The map exceeds its maxmimum size." ); |
253 | } |
254 | |
255 | return tsl::detail_hopscotch_hash::PRIMES[m_iprime + 1]; |
256 | } |
257 | |
258 | std::size_t max_bucket_count() const { |
259 | return tsl::detail_hopscotch_hash::PRIMES.back(); |
260 | } |
261 | |
262 | private: |
263 | std::size_t bucket_for_hash_iprime(std::size_t hash, unsigned int iprime) const { |
264 | tsl_assert(iprime < tsl::detail_hopscotch_hash::MOD_PRIME.size()); |
265 | return tsl::detail_hopscotch_hash::MOD_PRIME[iprime](hash); |
266 | } |
267 | |
268 | private: |
269 | unsigned int m_iprime; |
270 | }; |
271 | |
272 | |
273 | namespace detail_hopscotch_hash { |
274 | |
275 | |
276 | |
277 | template<typename T> |
278 | struct make_void { |
279 | using type = void; |
280 | }; |
281 | |
282 | |
283 | template<typename T, typename = void> |
284 | struct has_is_transparent : std::false_type { |
285 | }; |
286 | |
287 | template<typename T> |
288 | struct has_is_transparent<T, typename make_void<typename T::is_transparent>::type> : std::true_type { |
289 | }; |
290 | |
291 | |
292 | template<typename T, typename = void> |
293 | struct has_key_compare : std::false_type { |
294 | }; |
295 | |
296 | template<typename T> |
297 | struct has_key_compare<T, typename make_void<typename T::key_compare>::type> : std::true_type { |
298 | }; |
299 | |
300 | |
301 | |
302 | |
303 | |
304 | /* |
305 | * smallest_type_for_min_bits::type returns the smallest type that can fit MinBits. |
306 | */ |
307 | static const size_t SMALLEST_TYPE_MAX_BITS_SUPPORTED = 64; |
308 | template<unsigned int MinBits, typename Enable = void> |
309 | class smallest_type_for_min_bits { |
310 | }; |
311 | |
312 | template<unsigned int MinBits> |
313 | class smallest_type_for_min_bits<MinBits, typename std::enable_if<(MinBits > 0) && (MinBits <= 8)>::type> { |
314 | public: |
315 | using type = std::uint_least8_t; |
316 | }; |
317 | |
318 | template<unsigned int MinBits> |
319 | class smallest_type_for_min_bits<MinBits, typename std::enable_if<(MinBits > 8) && (MinBits <= 16)>::type> { |
320 | public: |
321 | using type = std::uint_least16_t; |
322 | }; |
323 | |
324 | template<unsigned int MinBits> |
325 | class smallest_type_for_min_bits<MinBits, typename std::enable_if<(MinBits > 16) && (MinBits <= 32)>::type> { |
326 | public: |
327 | using type = std::uint_least32_t; |
328 | }; |
329 | |
330 | template<unsigned int MinBits> |
331 | class smallest_type_for_min_bits<MinBits, typename std::enable_if<(MinBits > 32) && (MinBits <= 64)>::type> { |
332 | public: |
333 | using type = std::uint_least64_t; |
334 | }; |
335 | |
336 | |
337 | |
338 | /* |
339 | * Each bucket may store up to three elements: |
340 | * - An aligned storage to store a value_type object with placement-new. |
341 | * - An (optional) hash of the value in the bucket. |
342 | * - An unsigned integer of type neighborhood_bitmap used to tell us which buckets in the neighborhood of the |
343 | * current bucket contain a value with a hash belonging to the current bucket. |
344 | * |
345 | * For a bucket 'b' a bit 'i' (counting from 0 and from the least significant bit to the most significant) |
346 | * set to 1 means that the bucket 'b+i' contains a value with a hash belonging to bucket 'b'. |
347 | * The bits used for that, start from the third least significant bit. |
348 | * |
349 | * The least significant bit is set to 1 if there is a value in the bucket storage. |
350 | * The second least significant bit is set to 1 if there is an overflow. More than NeighborhoodSize values |
351 | * give the same hash, all overflow values are stored in the m_overflow_elements list of the map. |
352 | */ |
353 | static const std::size_t NB_RESERVED_BITS_IN_NEIGHBORHOOD = 2; |
354 | |
355 | |
356 | template<bool StoreHash> |
357 | class hopscotch_bucket_hash { |
358 | public: |
359 | using hash_type = std::false_type; |
360 | |
361 | bool bucket_hash_equal(std::size_t /*hash*/) const noexcept { |
362 | return true; |
363 | } |
364 | |
365 | std::size_t truncated_bucket_hash() const noexcept { |
366 | assert(false); |
367 | return 0; |
368 | } |
369 | |
370 | protected: |
371 | void copy_hash(const hopscotch_bucket_hash& ) noexcept { |
372 | } |
373 | |
374 | void set_hash(std::size_t /*hash*/) noexcept { |
375 | } |
376 | }; |
377 | |
378 | template<> |
379 | class hopscotch_bucket_hash<true> { |
380 | public: |
381 | using hash_type = std::uint_least32_t; |
382 | static_assert(sizeof(hash_type) <= sizeof(std::size_t), "" ); |
383 | |
384 | bool bucket_hash_equal(std::size_t hash) const noexcept { |
385 | return m_hash == hash_type(hash); |
386 | } |
387 | |
388 | std::size_t truncated_bucket_hash() const noexcept { |
389 | return m_hash; |
390 | } |
391 | |
392 | protected: |
393 | void copy_hash(const hopscotch_bucket_hash& bucket) noexcept { |
394 | m_hash = bucket.m_hash; |
395 | } |
396 | |
397 | void set_hash(std::size_t hash) noexcept { |
398 | m_hash = hash_type(hash); |
399 | } |
400 | |
401 | private: |
402 | hash_type m_hash; |
403 | }; |
404 | |
405 | template<typename ValueType, unsigned int NeighborhoodSize, bool StoreHash> |
406 | class hopscotch_bucket: public hopscotch_bucket_hash<StoreHash> { |
407 | private: |
408 | static const size_t MIN_NEIGHBORHOOD_SIZE = 4; |
409 | static const size_t MAX_NEIGHBORHOOD_SIZE = SMALLEST_TYPE_MAX_BITS_SUPPORTED - NB_RESERVED_BITS_IN_NEIGHBORHOOD; |
410 | |
411 | |
412 | static_assert(NeighborhoodSize >= 4, "NeighborhoodSize should be >= 4." ); |
413 | // We can't put a variable in the message, ensure coherence |
414 | static_assert(MIN_NEIGHBORHOOD_SIZE == 4, "" ); |
415 | |
416 | static_assert(NeighborhoodSize <= 62, "NeighborhoodSize should be <= 62." ); |
417 | // We can't put a variable in the message, ensure coherence |
418 | static_assert(MAX_NEIGHBORHOOD_SIZE == 62, "" ); |
419 | |
420 | |
421 | static_assert(!StoreHash || NeighborhoodSize <= 30, |
422 | "NeighborhoodSize should be <= 30 if StoreHash is true." ); |
423 | // We can't put a variable in the message, ensure coherence |
424 | static_assert(MAX_NEIGHBORHOOD_SIZE - 32 == 30, "" ); |
425 | |
426 | using bucket_hash = hopscotch_bucket_hash<StoreHash>; |
427 | |
428 | public: |
429 | using value_type = ValueType; |
430 | using neighborhood_bitmap = |
431 | typename smallest_type_for_min_bits<NeighborhoodSize + NB_RESERVED_BITS_IN_NEIGHBORHOOD>::type; |
432 | |
433 | |
434 | hopscotch_bucket() noexcept: bucket_hash(), m_neighborhood_infos(0) { |
435 | tsl_assert(empty()); |
436 | } |
437 | |
438 | |
439 | hopscotch_bucket(const hopscotch_bucket& bucket) |
440 | noexcept(std::is_nothrow_copy_constructible<value_type>::value): bucket_hash(bucket), |
441 | m_neighborhood_infos(0) |
442 | { |
443 | if(!bucket.empty()) { |
444 | ::new (static_cast<void*>(std::addressof(m_value))) value_type(bucket.value()); |
445 | } |
446 | |
447 | m_neighborhood_infos = bucket.m_neighborhood_infos; |
448 | } |
449 | |
450 | hopscotch_bucket(hopscotch_bucket&& bucket) |
451 | noexcept(std::is_nothrow_move_constructible<value_type>::value) : bucket_hash(std::move(bucket)), |
452 | m_neighborhood_infos(0) |
453 | { |
454 | if(!bucket.empty()) { |
455 | ::new (static_cast<void*>(std::addressof(m_value))) value_type(std::move(bucket.value())); |
456 | } |
457 | |
458 | m_neighborhood_infos = bucket.m_neighborhood_infos; |
459 | } |
460 | |
461 | hopscotch_bucket& operator=(const hopscotch_bucket& bucket) |
462 | noexcept(std::is_nothrow_copy_constructible<value_type>::value) |
463 | { |
464 | if(this != &bucket) { |
465 | bucket_hash::operator=(bucket); |
466 | |
467 | if(!empty()) { |
468 | destroy_value(); |
469 | set_empty(true); |
470 | } |
471 | |
472 | if(!bucket.empty()) { |
473 | ::new (static_cast<void*>(std::addressof(m_value))) value_type(bucket.value()); |
474 | } |
475 | |
476 | m_neighborhood_infos = bucket.m_neighborhood_infos; |
477 | } |
478 | |
479 | return *this; |
480 | } |
481 | |
482 | hopscotch_bucket& operator=(hopscotch_bucket&& ) = delete; |
483 | |
484 | ~hopscotch_bucket() noexcept { |
485 | if(!empty()) { |
486 | destroy_value(); |
487 | } |
488 | } |
489 | |
490 | neighborhood_bitmap neighborhood_infos() const noexcept { |
491 | return neighborhood_bitmap(m_neighborhood_infos >> NB_RESERVED_BITS_IN_NEIGHBORHOOD); |
492 | } |
493 | |
494 | void set_overflow(bool has_overflow) noexcept { |
495 | if(has_overflow) { |
496 | m_neighborhood_infos = neighborhood_bitmap(m_neighborhood_infos | 2); |
497 | } |
498 | else { |
499 | m_neighborhood_infos = neighborhood_bitmap(m_neighborhood_infos & ~2); |
500 | } |
501 | } |
502 | |
503 | bool has_overflow() const noexcept { |
504 | return (m_neighborhood_infos & 2) != 0; |
505 | } |
506 | |
507 | bool empty() const noexcept { |
508 | return (m_neighborhood_infos & 1) == 0; |
509 | } |
510 | |
511 | void toggle_neighbor_presence(std::size_t ineighbor) noexcept { |
512 | tsl_assert(ineighbor <= NeighborhoodSize); |
513 | m_neighborhood_infos = neighborhood_bitmap( |
514 | m_neighborhood_infos ^ (1ull << (ineighbor + NB_RESERVED_BITS_IN_NEIGHBORHOOD))); |
515 | } |
516 | |
517 | bool check_neighbor_presence(std::size_t ineighbor) const noexcept { |
518 | tsl_assert(ineighbor <= NeighborhoodSize); |
519 | if(((m_neighborhood_infos >> (ineighbor + NB_RESERVED_BITS_IN_NEIGHBORHOOD)) & 1) == 1) { |
520 | return true; |
521 | } |
522 | |
523 | return false; |
524 | } |
525 | |
526 | value_type& value() noexcept { |
527 | tsl_assert(!empty()); |
528 | return *reinterpret_cast<value_type*>(std::addressof(m_value)); |
529 | } |
530 | |
531 | const value_type& value() const noexcept { |
532 | tsl_assert(!empty()); |
533 | return *reinterpret_cast<const value_type*>(std::addressof(m_value)); |
534 | } |
535 | |
536 | template<typename P> |
537 | void set_value_of_empty_bucket(P&& value, std::size_t hash) { |
538 | tsl_assert(empty()); |
539 | |
540 | ::new (static_cast<void*>(std::addressof(m_value))) value_type(std::forward<P>(value)); |
541 | set_empty(false); |
542 | this->set_hash(hash); |
543 | } |
544 | |
545 | void swap_value_into_empty_bucket(hopscotch_bucket& empty_bucket) { |
546 | tsl_assert(empty_bucket.empty()); |
547 | if(!empty()) { |
548 | ::new (static_cast<void*>(std::addressof(empty_bucket.m_value))) value_type(std::move(value())); |
549 | empty_bucket.copy_hash(*this); |
550 | empty_bucket.set_empty(false); |
551 | |
552 | destroy_value(); |
553 | set_empty(true); |
554 | } |
555 | } |
556 | |
557 | void remove_value() noexcept { |
558 | if(!empty()) { |
559 | destroy_value(); |
560 | set_empty(true); |
561 | } |
562 | } |
563 | |
564 | void clear() noexcept { |
565 | if(!empty()) { |
566 | destroy_value(); |
567 | } |
568 | |
569 | m_neighborhood_infos = 0; |
570 | tsl_assert(empty()); |
571 | } |
572 | |
573 | static std::size_t max_size() noexcept { |
574 | if(StoreHash) { |
575 | return std::numeric_limits<typename bucket_hash::hash_type>::max(); |
576 | } |
577 | else { |
578 | return std::numeric_limits<std::size_t>::max(); |
579 | } |
580 | } |
581 | |
582 | private: |
583 | void set_empty(bool is_empty) noexcept { |
584 | if(is_empty) { |
585 | m_neighborhood_infos = neighborhood_bitmap(m_neighborhood_infos & ~1); |
586 | } |
587 | else { |
588 | m_neighborhood_infos = neighborhood_bitmap(m_neighborhood_infos | 1); |
589 | } |
590 | } |
591 | |
592 | void destroy_value() noexcept { |
593 | try { |
594 | tsl_assert(!empty()); |
595 | |
596 | value().~value_type(); |
597 | } |
598 | catch(...) { |
599 | std::terminate(); |
600 | } |
601 | } |
602 | |
603 | private: |
604 | using storage = typename std::aligned_storage<sizeof(value_type), alignof(value_type)>::type; |
605 | |
606 | neighborhood_bitmap m_neighborhood_infos; |
607 | storage m_value; |
608 | }; |
609 | |
610 | |
611 | /** |
612 | * Internal common class used by hopscotch_(sc)_map and hopscotch_(sc)_set. |
613 | * |
614 | * ValueType is what will be stored by hopscotch_hash (usually std::pair<Key, T> for map and Key for set). |
615 | * |
616 | * KeySelect should be a FunctionObject which takes a ValueType in parameter and returns a reference to the key. |
617 | * |
618 | * ValueSelect should be a FunctionObject which takes a ValueType in parameter and returns a reference to the value. |
619 | * ValueSelect should be void if there is no value (in set for example). |
620 | * |
621 | * OverflowContainer will be used as containers for overflown elements. Usually it should be a list<ValueType> |
622 | * or a set<Key>/map<Key, T>. |
623 | */ |
624 | template<class ValueType, |
625 | class KeySelect, |
626 | class ValueSelect, |
627 | class Hash, |
628 | class KeyEqual, |
629 | class Allocator, |
630 | unsigned int NeighborhoodSize, |
631 | bool StoreHash, |
632 | class GrowthPolicy, |
633 | class OverflowContainer> |
634 | class hopscotch_hash: private Hash, private KeyEqual, private GrowthPolicy { |
635 | private: |
636 | template<typename U> |
637 | using has_mapped_type = typename std::integral_constant<bool, !std::is_same<U, void>::value>; |
638 | |
639 | public: |
640 | template<bool is_const> |
641 | class hopscotch_iterator; |
642 | |
643 | using key_type = typename KeySelect::key_type; |
644 | using value_type = ValueType; |
645 | using size_type = std::size_t; |
646 | using difference_type = std::ptrdiff_t; |
647 | using hasher = Hash; |
648 | using key_equal = KeyEqual; |
649 | using allocator_type = Allocator; |
650 | using reference = value_type&; |
651 | using const_reference = const value_type&; |
652 | using pointer = value_type*; |
653 | using const_pointer = const value_type*; |
654 | using iterator = hopscotch_iterator<false>; |
655 | using const_iterator = hopscotch_iterator<true>; |
656 | |
657 | private: |
658 | using hopscotch_bucket = tsl::detail_hopscotch_hash::hopscotch_bucket<ValueType, NeighborhoodSize, StoreHash>; |
659 | using neighborhood_bitmap = typename hopscotch_bucket::neighborhood_bitmap; |
660 | |
661 | using buckets_allocator = typename std::allocator_traits<allocator_type>::template rebind_alloc<hopscotch_bucket>; |
662 | using buckets_container_type = std::vector<hopscotch_bucket, buckets_allocator>; |
663 | |
664 | using overflow_container_type = OverflowContainer; |
665 | |
666 | static_assert(std::is_same<typename overflow_container_type::value_type, ValueType>::value, |
667 | "OverflowContainer should have ValueType as type." ); |
668 | |
669 | static_assert(std::is_same<typename overflow_container_type::allocator_type, Allocator>::value, |
670 | "Invalid allocator, not the same type as the value_type." ); |
671 | |
672 | |
673 | using iterator_buckets = typename buckets_container_type::iterator; |
674 | using const_iterator_buckets = typename buckets_container_type::const_iterator; |
675 | |
676 | using iterator_overflow = typename overflow_container_type::iterator; |
677 | using const_iterator_overflow = typename overflow_container_type::const_iterator; |
678 | |
679 | public: |
680 | /** |
681 | * The 'operator*()' and 'operator->()' methods return a const reference and const pointer respectively to the |
682 | * stored value type. |
683 | * |
684 | * In case of a map, to get a modifiable reference to the value associated to a key (the '.second' in the |
685 | * stored pair), you have to call 'value()'. |
686 | */ |
687 | template<bool is_const> |
688 | class hopscotch_iterator { |
689 | friend class hopscotch_hash; |
690 | private: |
691 | using iterator_bucket = typename std::conditional<is_const, |
692 | typename hopscotch_hash::const_iterator_buckets, |
693 | typename hopscotch_hash::iterator_buckets>::type; |
694 | using iterator_overflow = typename std::conditional<is_const, |
695 | typename hopscotch_hash::const_iterator_overflow, |
696 | typename hopscotch_hash::iterator_overflow>::type; |
697 | |
698 | |
699 | hopscotch_iterator(iterator_bucket buckets_iterator, iterator_bucket buckets_end_iterator, |
700 | iterator_overflow overflow_iterator) noexcept : |
701 | m_buckets_iterator(buckets_iterator), m_buckets_end_iterator(buckets_end_iterator), |
702 | m_overflow_iterator(overflow_iterator) |
703 | { |
704 | } |
705 | |
706 | public: |
707 | using iterator_category = std::forward_iterator_tag; |
708 | using value_type = const typename hopscotch_hash::value_type; |
709 | using difference_type = std::ptrdiff_t; |
710 | using reference = value_type&; |
711 | using pointer = value_type*; |
712 | |
713 | |
714 | hopscotch_iterator() noexcept { |
715 | } |
716 | |
717 | hopscotch_iterator(const hopscotch_iterator<false>& other) noexcept : |
718 | m_buckets_iterator(other.m_buckets_iterator), m_buckets_end_iterator(other.m_buckets_end_iterator), |
719 | m_overflow_iterator(other.m_overflow_iterator) |
720 | { |
721 | } |
722 | |
723 | const typename hopscotch_hash::key_type& key() const { |
724 | if(m_buckets_iterator != m_buckets_end_iterator) { |
725 | return KeySelect()(m_buckets_iterator->value()); |
726 | } |
727 | |
728 | return KeySelect()(*m_overflow_iterator); |
729 | } |
730 | |
731 | template<class U = ValueSelect, typename std::enable_if<has_mapped_type<U>::value>::type* = nullptr> |
732 | typename std::conditional< |
733 | is_const, |
734 | const typename U::value_type&, |
735 | typename U::value_type&>::type value() const |
736 | { |
737 | if(m_buckets_iterator != m_buckets_end_iterator) { |
738 | return U()(m_buckets_iterator->value()); |
739 | } |
740 | |
741 | return U()(*m_overflow_iterator); |
742 | } |
743 | |
744 | reference operator*() const { |
745 | if(m_buckets_iterator != m_buckets_end_iterator) { |
746 | return m_buckets_iterator->value(); |
747 | } |
748 | |
749 | return *m_overflow_iterator; |
750 | } |
751 | |
752 | pointer operator->() const { |
753 | if(m_buckets_iterator != m_buckets_end_iterator) { |
754 | return std::addressof(m_buckets_iterator->value()); |
755 | } |
756 | |
757 | return std::addressof(*m_overflow_iterator); |
758 | } |
759 | |
760 | hopscotch_iterator& operator++() { |
761 | if(m_buckets_iterator == m_buckets_end_iterator) { |
762 | ++m_overflow_iterator; |
763 | return *this; |
764 | } |
765 | |
766 | do { |
767 | ++m_buckets_iterator; |
768 | } while(m_buckets_iterator != m_buckets_end_iterator && m_buckets_iterator->empty()); |
769 | |
770 | return *this; |
771 | } |
772 | |
773 | hopscotch_iterator operator++(int) { |
774 | hopscotch_iterator tmp(*this); |
775 | ++*this; |
776 | |
777 | return tmp; |
778 | } |
779 | |
780 | friend bool operator==(const hopscotch_iterator& lhs, const hopscotch_iterator& rhs) { |
781 | return lhs.m_buckets_iterator == rhs.m_buckets_iterator && |
782 | lhs.m_overflow_iterator == rhs.m_overflow_iterator; |
783 | } |
784 | |
785 | friend bool operator!=(const hopscotch_iterator& lhs, const hopscotch_iterator& rhs) { |
786 | return !(lhs == rhs); |
787 | } |
788 | |
789 | private: |
790 | iterator_bucket m_buckets_iterator; |
791 | iterator_bucket m_buckets_end_iterator; |
792 | iterator_overflow m_overflow_iterator; |
793 | }; |
794 | |
795 | |
796 | |
797 | public: |
798 | template<class OC = OverflowContainer, typename std::enable_if<!has_key_compare<OC>::value>::type* = nullptr> |
799 | hopscotch_hash(size_type bucket_count, |
800 | const Hash& hash, |
801 | const KeyEqual& equal, |
802 | const Allocator& alloc, |
803 | float max_load_factor) : Hash(hash), |
804 | KeyEqual(equal), |
805 | GrowthPolicy(bucket_count), |
806 | m_buckets(alloc), |
807 | m_overflow_elements(alloc), |
808 | m_nb_elements(0) |
809 | { |
810 | if(bucket_count > max_bucket_count()) { |
811 | throw std::length_error("The map exceeds its maxmimum size." ); |
812 | } |
813 | |
814 | static_assert(NeighborhoodSize - 1 > 0, "" ); |
815 | m_buckets.resize(bucket_count + NeighborhoodSize - 1); |
816 | |
817 | |
818 | this->max_load_factor(max_load_factor); |
819 | } |
820 | |
821 | template<class OC = OverflowContainer, typename std::enable_if<has_key_compare<OC>::value>::type* = nullptr> |
822 | hopscotch_hash(size_type bucket_count, |
823 | const Hash& hash, |
824 | const KeyEqual& equal, |
825 | const Allocator& alloc, |
826 | float max_load_factor, |
827 | const typename OC::key_compare& comp) : Hash(hash), |
828 | KeyEqual(equal), |
829 | GrowthPolicy(bucket_count), |
830 | m_buckets(alloc), |
831 | m_overflow_elements(comp, alloc), |
832 | m_nb_elements(0) |
833 | { |
834 | |
835 | if(bucket_count > max_bucket_count()) { |
836 | throw std::length_error("The map exceeds its maxmimum size." ); |
837 | } |
838 | |
839 | static_assert(NeighborhoodSize - 1 > 0, "" ); |
840 | m_buckets.resize(bucket_count + NeighborhoodSize - 1); |
841 | |
842 | |
843 | this->max_load_factor(max_load_factor); |
844 | } |
845 | |
846 | hopscotch_hash(const hopscotch_hash& other) = default; |
847 | |
848 | hopscotch_hash(hopscotch_hash&& other) |
849 | noexcept( |
850 | std::is_nothrow_move_constructible<Hash>::value && |
851 | std::is_nothrow_move_constructible<KeyEqual>::value && |
852 | std::is_nothrow_move_constructible<GrowthPolicy>::value && |
853 | std::is_nothrow_move_constructible<buckets_container_type>::value && |
854 | std::is_nothrow_move_constructible<overflow_container_type>::value |
855 | ) |
856 | : Hash(std::move(static_cast<Hash&>(other))), |
857 | KeyEqual(std::move(static_cast<KeyEqual&>(other))), |
858 | GrowthPolicy(std::move(static_cast<GrowthPolicy&>(other))), |
859 | m_buckets(std::move(other.m_buckets)), |
860 | m_overflow_elements(std::move(other.m_overflow_elements)), |
861 | m_nb_elements(other.m_nb_elements), |
862 | m_max_load_factor(other.m_max_load_factor), |
863 | m_load_threshold(other.m_load_threshold), |
864 | m_min_load_factor_rehash_threshold(other.m_min_load_factor_rehash_threshold) |
865 | { |
866 | other.clear(); |
867 | } |
868 | |
869 | hopscotch_hash& operator=(const hopscotch_hash& other) = default; |
870 | |
871 | hopscotch_hash& operator=(hopscotch_hash&& other) { |
872 | other.swap(*this); |
873 | other.clear(); |
874 | |
875 | return *this; |
876 | } |
877 | |
878 | allocator_type get_allocator() const { |
879 | return m_buckets.get_allocator(); |
880 | } |
881 | |
882 | |
883 | /* |
884 | * Iterators |
885 | */ |
886 | iterator begin() noexcept { |
887 | auto begin = m_buckets.begin(); |
888 | while(begin != m_buckets.end() && begin->empty()) { |
889 | ++begin; |
890 | } |
891 | |
892 | return iterator(begin, m_buckets.end(), m_overflow_elements.begin()); |
893 | } |
894 | |
895 | const_iterator begin() const noexcept { |
896 | return cbegin(); |
897 | } |
898 | |
899 | const_iterator cbegin() const noexcept { |
900 | auto begin = m_buckets.cbegin(); |
901 | while(begin != m_buckets.cend() && begin->empty()) { |
902 | ++begin; |
903 | } |
904 | |
905 | return const_iterator(begin, m_buckets.cend(), m_overflow_elements.cbegin()); |
906 | } |
907 | |
908 | iterator end() noexcept { |
909 | return iterator(m_buckets.end(), m_buckets.end(), m_overflow_elements.end()); |
910 | } |
911 | |
912 | const_iterator end() const noexcept { |
913 | return cend(); |
914 | } |
915 | |
916 | const_iterator cend() const noexcept { |
917 | return const_iterator(m_buckets.cend(), m_buckets.cend(), m_overflow_elements.cend()); |
918 | } |
919 | |
920 | |
921 | /* |
922 | * Capacity |
923 | */ |
924 | bool empty() const noexcept { |
925 | return m_nb_elements == 0; |
926 | } |
927 | |
928 | size_type size() const noexcept { |
929 | return m_nb_elements; |
930 | } |
931 | |
932 | size_type max_size() const noexcept { |
933 | return hopscotch_bucket::max_size(); |
934 | } |
935 | |
936 | /* |
937 | * Modifiers |
938 | */ |
939 | void clear() noexcept { |
940 | for(auto& bucket : m_buckets) { |
941 | bucket.clear(); |
942 | } |
943 | |
944 | m_overflow_elements.clear(); |
945 | m_nb_elements = 0; |
946 | } |
947 | |
948 | |
949 | std::pair<iterator, bool> insert(const value_type& value) { |
950 | return insert_impl(value); |
951 | } |
952 | |
953 | template<class P, typename std::enable_if<std::is_constructible<value_type, P&&>::value>::type* = nullptr> |
954 | std::pair<iterator, bool> insert(P&& value) { |
955 | return emplace(std::forward<P>(value)); |
956 | } |
957 | |
958 | std::pair<iterator, bool> insert(value_type&& value) { |
959 | return insert_impl(std::move(value)); |
960 | } |
961 | |
962 | |
963 | iterator insert(const_iterator hint, const value_type& value) { |
964 | if(hint != cend() && compare_keys(KeySelect()(*hint), KeySelect()(value))) { |
965 | return mutable_iterator(hint); |
966 | } |
967 | |
968 | return insert(value).first; |
969 | } |
970 | |
971 | template<class P, typename std::enable_if<std::is_constructible<value_type, P&&>::value>::type* = nullptr> |
972 | iterator insert(const_iterator hint, P&& value) { |
973 | return emplace_hint(hint, std::forward<P>(value)); |
974 | } |
975 | |
976 | iterator insert(const_iterator hint, value_type&& value) { |
977 | if(hint != cend() && compare_keys(KeySelect()(*hint), KeySelect()(value))) { |
978 | return mutable_iterator(hint); |
979 | } |
980 | |
981 | return insert(std::move(value)).first; |
982 | } |
983 | |
984 | |
985 | template<class InputIt> |
986 | void insert(InputIt first, InputIt last) { |
987 | if(std::is_base_of<std::forward_iterator_tag, |
988 | typename std::iterator_traits<InputIt>::iterator_category>::value) |
989 | { |
990 | const auto nb_elements_insert = std::distance(first, last); |
991 | const std::size_t nb_elements_in_buckets = m_nb_elements - m_overflow_elements.size(); |
992 | const std::size_t nb_free_buckets = m_load_threshold - nb_elements_in_buckets; |
993 | tsl_assert(m_nb_elements >= m_overflow_elements.size()); |
994 | tsl_assert(m_load_threshold >= nb_elements_in_buckets); |
995 | |
996 | if(nb_elements_insert > 0 && nb_free_buckets < std::size_t(nb_elements_insert)) { |
997 | reserve(nb_elements_in_buckets + std::size_t(nb_elements_insert)); |
998 | } |
999 | } |
1000 | |
1001 | for(; first != last; ++first) { |
1002 | insert(*first); |
1003 | } |
1004 | } |
1005 | |
1006 | |
1007 | template<class M> |
1008 | std::pair<iterator, bool> insert_or_assign(const key_type& k, M&& obj) { |
1009 | return insert_or_assign_impl(k, std::forward<M>(obj)); |
1010 | } |
1011 | |
1012 | template<class M> |
1013 | std::pair<iterator, bool> insert_or_assign(key_type&& k, M&& obj) { |
1014 | return insert_or_assign_impl(std::move(k), std::forward<M>(obj)); |
1015 | } |
1016 | |
1017 | |
1018 | template<class M> |
1019 | iterator insert_or_assign(const_iterator hint, const key_type& k, M&& obj) { |
1020 | if(hint != cend() && compare_keys(KeySelect()(*hint), k)) { |
1021 | auto it = mutable_iterator(hint); |
1022 | it.value() = std::forward<M>(obj); |
1023 | |
1024 | return it; |
1025 | } |
1026 | |
1027 | return insert_or_assign(k, std::forward<M>(obj)).first; |
1028 | } |
1029 | |
1030 | template<class M> |
1031 | iterator insert_or_assign(const_iterator hint, key_type&& k, M&& obj) { |
1032 | if(hint != cend() && compare_keys(KeySelect()(*hint), k)) { |
1033 | auto it = mutable_iterator(hint); |
1034 | it.value() = std::forward<M>(obj); |
1035 | |
1036 | return it; |
1037 | } |
1038 | |
1039 | return insert_or_assign(std::move(k), std::forward<M>(obj)).first; |
1040 | } |
1041 | |
1042 | |
1043 | template<class... Args> |
1044 | std::pair<iterator, bool> emplace(Args&&... args) { |
1045 | return insert(value_type(std::forward<Args>(args)...)); |
1046 | } |
1047 | |
1048 | template<class... Args> |
1049 | iterator emplace_hint(const_iterator hint, Args&&... args) { |
1050 | return insert(hint, value_type(std::forward<Args>(args)...)); |
1051 | } |
1052 | |
1053 | template<class... Args> |
1054 | std::pair<iterator, bool> try_emplace(const key_type& k, Args&&... args) { |
1055 | return try_emplace_impl(k, std::forward<Args>(args)...); |
1056 | } |
1057 | |
1058 | template<class... Args> |
1059 | std::pair<iterator, bool> try_emplace(key_type&& k, Args&&... args) { |
1060 | return try_emplace_impl(std::move(k), std::forward<Args>(args)...); |
1061 | } |
1062 | |
1063 | template<class... Args> |
1064 | iterator try_emplace(const_iterator hint, const key_type& k, Args&&... args) { |
1065 | if(hint != cend() && compare_keys(KeySelect()(*hint), k)) { |
1066 | return mutable_iterator(hint); |
1067 | } |
1068 | |
1069 | return try_emplace(k, std::forward<Args>(args)...).first; |
1070 | } |
1071 | |
1072 | template<class... Args> |
1073 | iterator try_emplace(const_iterator hint, key_type&& k, Args&&... args) { |
1074 | if(hint != cend() && compare_keys(KeySelect()(*hint), k)) { |
1075 | return mutable_iterator(hint); |
1076 | } |
1077 | |
1078 | return try_emplace(std::move(k), std::forward<Args>(args)...).first; |
1079 | } |
1080 | |
1081 | |
1082 | |
1083 | iterator erase(iterator pos) { |
1084 | return erase(const_iterator(pos)); |
1085 | } |
1086 | |
1087 | iterator erase(const_iterator pos) { |
1088 | const std::size_t ibucket_for_hash = bucket_for_hash(hash_key(pos.key())); |
1089 | |
1090 | if(pos.m_buckets_iterator != pos.m_buckets_end_iterator) { |
1091 | auto it_bucket = m_buckets.begin() + std::distance(m_buckets.cbegin(), pos.m_buckets_iterator); |
1092 | erase_from_bucket(it_bucket, ibucket_for_hash); |
1093 | |
1094 | return ++iterator(it_bucket, m_buckets.end(), m_overflow_elements.begin()); |
1095 | } |
1096 | else { |
1097 | auto it_next_overflow = erase_from_overflow(pos.m_overflow_iterator, ibucket_for_hash); |
1098 | return iterator(m_buckets.end(), m_buckets.end(), it_next_overflow); |
1099 | } |
1100 | } |
1101 | |
1102 | iterator erase(const_iterator first, const_iterator last) { |
1103 | if(first == last) { |
1104 | return mutable_iterator(first); |
1105 | } |
1106 | |
1107 | auto to_delete = erase(first); |
1108 | while(to_delete != last) { |
1109 | to_delete = erase(to_delete); |
1110 | } |
1111 | |
1112 | return to_delete; |
1113 | } |
1114 | |
1115 | template<class K> |
1116 | size_type erase(const K& key) { |
1117 | return erase(key, hash_key(key)); |
1118 | } |
1119 | |
1120 | template<class K> |
1121 | size_type erase(const K& key, std::size_t hash) { |
1122 | const std::size_t ibucket_for_hash = bucket_for_hash(hash); |
1123 | |
1124 | auto it_find = find_in_buckets(key, hash, m_buckets.begin() + ibucket_for_hash); |
1125 | if(it_find != m_buckets.end()) { |
1126 | erase_from_bucket(it_find, ibucket_for_hash); |
1127 | |
1128 | return 1; |
1129 | } |
1130 | |
1131 | if(m_buckets[ibucket_for_hash].has_overflow()) { |
1132 | auto it_overflow = find_in_overflow(key); |
1133 | if(it_overflow != m_overflow_elements.end()) { |
1134 | erase_from_overflow(it_overflow, ibucket_for_hash); |
1135 | |
1136 | return 1; |
1137 | } |
1138 | } |
1139 | |
1140 | return 0; |
1141 | } |
1142 | |
1143 | void swap(hopscotch_hash& other) { |
1144 | using std::swap; |
1145 | |
1146 | swap(static_cast<Hash&>(*this), static_cast<Hash&>(other)); |
1147 | swap(static_cast<KeyEqual&>(*this), static_cast<KeyEqual&>(other)); |
1148 | swap(static_cast<GrowthPolicy&>(*this), static_cast<GrowthPolicy&>(other)); |
1149 | swap(m_buckets, other.m_buckets); |
1150 | swap(m_overflow_elements, other.m_overflow_elements); |
1151 | swap(m_nb_elements, other.m_nb_elements); |
1152 | swap(m_max_load_factor, other.m_max_load_factor); |
1153 | swap(m_load_threshold, other.m_load_threshold); |
1154 | swap(m_min_load_factor_rehash_threshold, other.m_min_load_factor_rehash_threshold); |
1155 | } |
1156 | |
1157 | |
1158 | /* |
1159 | * Lookup |
1160 | */ |
1161 | template<class K, class U = ValueSelect, typename std::enable_if<has_mapped_type<U>::value>::type* = nullptr> |
1162 | typename U::value_type& at(const K& key) { |
1163 | return at(key, hash_key(key)); |
1164 | } |
1165 | |
1166 | template<class K, class U = ValueSelect, typename std::enable_if<has_mapped_type<U>::value>::type* = nullptr> |
1167 | typename U::value_type& at(const K& key, std::size_t hash) { |
1168 | return const_cast<typename U::value_type&>(static_cast<const hopscotch_hash*>(this)->at(key, hash)); |
1169 | } |
1170 | |
1171 | |
1172 | template<class K, class U = ValueSelect, typename std::enable_if<has_mapped_type<U>::value>::type* = nullptr> |
1173 | const typename U::value_type& at(const K& key) const { |
1174 | return at(key, hash_key(key)); |
1175 | } |
1176 | |
1177 | template<class K, class U = ValueSelect, typename std::enable_if<has_mapped_type<U>::value>::type* = nullptr> |
1178 | const typename U::value_type& at(const K& key, std::size_t hash) const { |
1179 | using T = typename U::value_type; |
1180 | |
1181 | const T* value = find_value_impl(key, hash, m_buckets.begin() + bucket_for_hash(hash)); |
1182 | if(value == nullptr) { |
1183 | throw std::out_of_range("Couldn't find key." ); |
1184 | } |
1185 | else { |
1186 | return *value; |
1187 | } |
1188 | } |
1189 | |
1190 | |
1191 | template<class K, class U = ValueSelect, typename std::enable_if<has_mapped_type<U>::value>::type* = nullptr> |
1192 | typename U::value_type& operator[](K&& key) { |
1193 | using T = typename U::value_type; |
1194 | |
1195 | const std::size_t hash = hash_key(key); |
1196 | const std::size_t ibucket_for_hash = bucket_for_hash(hash); |
1197 | |
1198 | T* value = find_value_impl(key, hash, m_buckets.begin() + ibucket_for_hash); |
1199 | if(value != nullptr) { |
1200 | return *value; |
1201 | } |
1202 | else { |
1203 | return insert_impl(std::make_pair(std::forward<K>(key), T()), hash, ibucket_for_hash).first.value(); |
1204 | } |
1205 | } |
1206 | |
1207 | |
1208 | template<class K> |
1209 | size_type count(const K& key) const { |
1210 | return count(key, hash_key(key)); |
1211 | } |
1212 | |
1213 | template<class K> |
1214 | size_type count(const K& key, std::size_t hash) const { |
1215 | return count_impl(key, hash, m_buckets.cbegin() + bucket_for_hash(hash)); |
1216 | } |
1217 | |
1218 | |
1219 | template<class K> |
1220 | iterator find(const K& key) { |
1221 | return find(key, hash_key(key)); |
1222 | } |
1223 | |
1224 | template<class K> |
1225 | iterator find(const K& key, std::size_t hash) { |
1226 | return find_impl(key, hash, m_buckets.begin() + bucket_for_hash(hash)); |
1227 | } |
1228 | |
1229 | |
1230 | template<class K> |
1231 | const_iterator find(const K& key) const { |
1232 | return find(key, hash_key(key)); |
1233 | } |
1234 | |
1235 | template<class K> |
1236 | const_iterator find(const K& key, std::size_t hash) const { |
1237 | return find_impl(key, hash, m_buckets.begin() + bucket_for_hash(hash)); |
1238 | } |
1239 | |
1240 | |
1241 | template<class K> |
1242 | std::pair<iterator, iterator> equal_range(const K& key) { |
1243 | return equal_range(key, hash_key(key)); |
1244 | } |
1245 | |
1246 | template<class K> |
1247 | std::pair<iterator, iterator> equal_range(const K& key, std::size_t hash) { |
1248 | iterator it = find(key, hash); |
1249 | return std::make_pair(it, (it == end())?it:std::next(it)); |
1250 | } |
1251 | |
1252 | |
1253 | template<class K> |
1254 | std::pair<const_iterator, const_iterator> equal_range(const K& key) const { |
1255 | return equal_range(key, hash_key(key)); |
1256 | } |
1257 | |
1258 | template<class K> |
1259 | std::pair<const_iterator, const_iterator> equal_range(const K& key, std::size_t hash) const { |
1260 | const_iterator it = find(key, hash); |
1261 | return std::make_pair(it, (it == cend())?it:std::next(it)); |
1262 | } |
1263 | |
1264 | /* |
1265 | * Bucket interface |
1266 | */ |
1267 | size_type bucket_count() const { |
1268 | /* |
1269 | * So that the last bucket can have NeighborhoodSize neighbors, the size of the bucket array is a little |
1270 | * bigger than the real number of buckets. We could use some of the buckets at the beginning, but |
1271 | * it is easier this way and we avoid weird behaviour with iterators. |
1272 | */ |
1273 | return m_buckets.size() - NeighborhoodSize + 1; |
1274 | } |
1275 | |
1276 | size_type max_bucket_count() const { |
1277 | const std::size_t max_bucket_count = std::min(GrowthPolicy::max_bucket_count(), m_buckets.max_size()); |
1278 | return max_bucket_count - NeighborhoodSize + 1; |
1279 | } |
1280 | |
1281 | |
1282 | /* |
1283 | * Hash policy |
1284 | */ |
1285 | float load_factor() const { |
1286 | return float(m_nb_elements)/float(bucket_count()); |
1287 | } |
1288 | |
1289 | float max_load_factor() const { |
1290 | return m_max_load_factor; |
1291 | } |
1292 | |
1293 | void max_load_factor(float ml) { |
1294 | m_max_load_factor = ml; |
1295 | m_load_threshold = size_type(float(bucket_count())*m_max_load_factor); |
1296 | m_min_load_factor_rehash_threshold = size_type(bucket_count()*MIN_LOAD_FACTOR_FOR_REHASH); |
1297 | } |
1298 | |
1299 | void rehash(size_type count) { |
1300 | count = std::max(count, size_type(std::ceil(float(size())/max_load_factor()))); |
1301 | rehash_impl(count); |
1302 | } |
1303 | |
1304 | void reserve(size_type count) { |
1305 | rehash(size_type(std::ceil(float(count)/max_load_factor()))); |
1306 | } |
1307 | |
1308 | |
1309 | /* |
1310 | * Observers |
1311 | */ |
1312 | hasher hash_function() const { |
1313 | return static_cast<Hash>(*this); |
1314 | } |
1315 | |
1316 | key_equal key_eq() const { |
1317 | return static_cast<KeyEqual>(*this); |
1318 | } |
1319 | |
1320 | /* |
1321 | * Other |
1322 | */ |
1323 | size_type overflow_size() const noexcept { |
1324 | return m_overflow_elements.size(); |
1325 | } |
1326 | |
1327 | template<class U = OverflowContainer, typename std::enable_if<has_key_compare<U>::value>::type* = nullptr> |
1328 | typename U::key_compare key_comp() const { |
1329 | return m_overflow_elements.key_comp(); |
1330 | } |
1331 | |
1332 | private: |
1333 | template<class K> |
1334 | std::size_t hash_key(const K& key) const { |
1335 | return Hash::operator()(key); |
1336 | } |
1337 | |
1338 | template<class K1, class K2> |
1339 | bool compare_keys(const K1& key1, const K2& key2) const { |
1340 | return KeyEqual::operator()(key1, key2); |
1341 | } |
1342 | |
1343 | std::size_t bucket_for_hash(std::size_t hash) const { |
1344 | return GrowthPolicy::bucket_for_hash(hash); |
1345 | } |
1346 | |
1347 | iterator mutable_iterator(const_iterator pos) { |
1348 | if(pos.m_buckets_iterator != pos.m_buckets_end_iterator) { |
1349 | // Get a non-const iterator |
1350 | auto it = m_buckets.begin() + std::distance(m_buckets.cbegin(), pos.m_buckets_iterator); |
1351 | return iterator(it, m_buckets.end(), m_overflow_elements.begin()); |
1352 | } |
1353 | else { |
1354 | // Get a non-const iterator |
1355 | auto it = mutable_overflow_iterator(pos.m_overflow_iterator); |
1356 | |
1357 | return iterator(m_buckets.end(), m_buckets.end(), it); |
1358 | } |
1359 | } |
1360 | |
1361 | |
1362 | static_assert(std::is_nothrow_move_constructible<value_type>::value || |
1363 | std::is_copy_constructible<value_type>::value, |
1364 | "value_type must be either copy constructible or nothrow move constructible." ); |
1365 | |
1366 | template<typename U = value_type, |
1367 | typename std::enable_if<std::is_nothrow_move_constructible<U>::value>::type* = nullptr> |
1368 | void rehash_impl(size_type count) { |
1369 | hopscotch_hash new_map = new_hopscotch_hash(count); |
1370 | |
1371 | if(!m_overflow_elements.empty()) { |
1372 | new_map.m_overflow_elements.swap(m_overflow_elements); |
1373 | new_map.m_nb_elements += new_map.m_overflow_elements.size(); |
1374 | |
1375 | for(const value_type& value : new_map.m_overflow_elements) { |
1376 | const std::size_t ibucket_for_hash = new_map.bucket_for_hash(new_map.hash_key(KeySelect()(value))); |
1377 | new_map.m_buckets[ibucket_for_hash].set_overflow(true); |
1378 | } |
1379 | } |
1380 | |
1381 | try { |
1382 | for(auto it_bucket = m_buckets.begin(); it_bucket != m_buckets.end(); ++it_bucket) { |
1383 | if(it_bucket->empty()) { |
1384 | continue; |
1385 | } |
1386 | |
1387 | const std::size_t hash = USE_STORED_HASH_ON_REHASH? |
1388 | it_bucket->truncated_bucket_hash(): |
1389 | new_map.hash_key(KeySelect()(it_bucket->value())); |
1390 | const std::size_t ibucket_for_hash = new_map.bucket_for_hash(hash); |
1391 | |
1392 | new_map.insert_impl(std::move(it_bucket->value()), hash, ibucket_for_hash); |
1393 | |
1394 | |
1395 | erase_from_bucket(it_bucket, bucket_for_hash(hash)); |
1396 | } |
1397 | } |
1398 | /* |
1399 | * The call to insert_impl may throw an exception if an element is added to the overflow |
1400 | * list. Rollback the elements in this case. |
1401 | */ |
1402 | catch(...) { |
1403 | m_overflow_elements.swap(new_map.m_overflow_elements); |
1404 | |
1405 | for(auto it_bucket = new_map.m_buckets.begin(); it_bucket != new_map.m_buckets.end(); ++it_bucket) { |
1406 | if(it_bucket->empty()) { |
1407 | continue; |
1408 | } |
1409 | |
1410 | const std::size_t hash = USE_STORED_HASH_ON_REHASH? |
1411 | it_bucket->truncated_bucket_hash(): |
1412 | hash_key(KeySelect()(it_bucket->value())); |
1413 | const std::size_t ibucket_for_hash = bucket_for_hash(hash); |
1414 | |
1415 | // The elements we insert were not in the overflow list before the switch. |
1416 | // They will not be go in the overflow list if we rollback the switch. |
1417 | insert_impl(std::move(it_bucket->value()), hash, ibucket_for_hash); |
1418 | } |
1419 | |
1420 | throw; |
1421 | } |
1422 | |
1423 | new_map.swap(*this); |
1424 | } |
1425 | |
1426 | template<typename U = value_type, |
1427 | typename std::enable_if<std::is_copy_constructible<U>::value && |
1428 | !std::is_nothrow_move_constructible<U>::value>::type* = nullptr> |
1429 | void rehash_impl(size_type count) { |
1430 | hopscotch_hash new_map = new_hopscotch_hash(count); |
1431 | |
1432 | for(const hopscotch_bucket& bucket: m_buckets) { |
1433 | if(bucket.empty()) { |
1434 | continue; |
1435 | } |
1436 | |
1437 | const std::size_t hash = USE_STORED_HASH_ON_REHASH? |
1438 | bucket.truncated_bucket_hash(): |
1439 | new_map.hash_key(KeySelect()(bucket.value())); |
1440 | const std::size_t ibucket_for_hash = new_map.bucket_for_hash(hash); |
1441 | |
1442 | new_map.insert_impl(bucket.value(), hash, ibucket_for_hash); |
1443 | } |
1444 | |
1445 | for(const value_type& value: m_overflow_elements) { |
1446 | const std::size_t hash = new_map.hash_key(KeySelect()(value)); |
1447 | const std::size_t ibucket_for_hash = new_map.bucket_for_hash(hash); |
1448 | |
1449 | new_map.insert_impl(value, hash, ibucket_for_hash); |
1450 | } |
1451 | |
1452 | new_map.swap(*this); |
1453 | } |
1454 | |
1455 | #ifdef TSL_NO_RANGE_ERASE_WITH_CONST_ITERATOR |
1456 | iterator_overflow mutable_overflow_iterator(const_iterator_overflow it) { |
1457 | return std::next(m_overflow_elements.begin(), std::distance(m_overflow_elements.cbegin(), it)); |
1458 | } |
1459 | #else |
1460 | iterator_overflow mutable_overflow_iterator(const_iterator_overflow it) { |
1461 | return m_overflow_elements.erase(it, it); |
1462 | } |
1463 | #endif |
1464 | |
1465 | // iterator is in overflow list |
1466 | iterator_overflow erase_from_overflow(const_iterator_overflow pos, std::size_t ibucket_for_hash) { |
1467 | #ifdef TSL_NO_RANGE_ERASE_WITH_CONST_ITERATOR |
1468 | auto it_next = m_overflow_elements.erase(mutable_overflow_iterator(pos)); |
1469 | #else |
1470 | auto it_next = m_overflow_elements.erase(pos); |
1471 | #endif |
1472 | m_nb_elements--; |
1473 | |
1474 | |
1475 | // Check if we can remove the overflow flag |
1476 | tsl_assert(m_buckets[ibucket_for_hash].has_overflow()); |
1477 | for(const value_type& value: m_overflow_elements) { |
1478 | const std::size_t bucket_for_value = bucket_for_hash(hash_key(KeySelect()(value))); |
1479 | if(bucket_for_value == ibucket_for_hash) { |
1480 | return it_next; |
1481 | } |
1482 | } |
1483 | |
1484 | m_buckets[ibucket_for_hash].set_overflow(false); |
1485 | return it_next; |
1486 | } |
1487 | |
1488 | // iterator is in bucket |
1489 | void erase_from_bucket(iterator_buckets pos, std::size_t ibucket_for_hash) noexcept { |
1490 | const std::size_t ibucket_for_pos = std::distance(m_buckets.begin(), pos); |
1491 | tsl_assert(ibucket_for_pos >= ibucket_for_hash); |
1492 | |
1493 | m_buckets[ibucket_for_pos].remove_value(); |
1494 | m_buckets[ibucket_for_hash].toggle_neighbor_presence(ibucket_for_pos - ibucket_for_hash); |
1495 | m_nb_elements--; |
1496 | } |
1497 | |
1498 | |
1499 | |
1500 | template<class K, class M> |
1501 | std::pair<iterator, bool> insert_or_assign_impl(K&& key, M&& obj) { |
1502 | const std::size_t hash = hash_key(key); |
1503 | const std::size_t ibucket_for_hash = bucket_for_hash(hash); |
1504 | |
1505 | // Check if already presents |
1506 | auto it_find = find_impl(key, hash, m_buckets.begin() + ibucket_for_hash); |
1507 | if(it_find != end()) { |
1508 | it_find.value() = std::forward<M>(obj); |
1509 | return std::make_pair(it_find, false); |
1510 | } |
1511 | |
1512 | |
1513 | return insert_impl(value_type(std::forward<K>(key), std::forward<M>(obj)), hash, ibucket_for_hash); |
1514 | } |
1515 | |
1516 | template<typename P, class... Args> |
1517 | std::pair<iterator, bool> try_emplace_impl(P&& key, Args&&... args_value) { |
1518 | const std::size_t hash = hash_key(key); |
1519 | const std::size_t ibucket_for_hash = bucket_for_hash(hash); |
1520 | |
1521 | // Check if already presents |
1522 | auto it_find = find_impl(key, hash, m_buckets.begin() + ibucket_for_hash); |
1523 | if(it_find != end()) { |
1524 | return std::make_pair(it_find, false); |
1525 | } |
1526 | |
1527 | |
1528 | return insert_impl(value_type(std::piecewise_construct, |
1529 | std::forward_as_tuple(std::forward<P>(key)), |
1530 | std::forward_as_tuple(std::forward<Args>(args_value)...)), |
1531 | hash, ibucket_for_hash); |
1532 | } |
1533 | |
1534 | template<typename P> |
1535 | std::pair<iterator, bool> insert_impl(P&& value) { |
1536 | const std::size_t hash = hash_key(KeySelect()(value)); |
1537 | const std::size_t ibucket_for_hash = bucket_for_hash(hash); |
1538 | |
1539 | // Check if already presents |
1540 | auto it_find = find_impl(KeySelect()(value), hash, m_buckets.begin() + ibucket_for_hash); |
1541 | if(it_find != end()) { |
1542 | return std::make_pair(it_find, false); |
1543 | } |
1544 | |
1545 | |
1546 | return insert_impl(std::forward<P>(value), hash, ibucket_for_hash); |
1547 | } |
1548 | |
1549 | template<typename P> |
1550 | std::pair<iterator, bool> insert_impl(P&& value, std::size_t hash, std::size_t ibucket_for_hash) { |
1551 | if((m_nb_elements - m_overflow_elements.size()) >= m_load_threshold) { |
1552 | rehash(GrowthPolicy::next_bucket_count()); |
1553 | ibucket_for_hash = bucket_for_hash(hash); |
1554 | } |
1555 | |
1556 | std::size_t ibucket_empty = find_empty_bucket(ibucket_for_hash); |
1557 | if(ibucket_empty < m_buckets.size()) { |
1558 | do { |
1559 | tsl_assert(ibucket_empty >= ibucket_for_hash); |
1560 | |
1561 | // Empty bucket is in range of NeighborhoodSize, use it |
1562 | if(ibucket_empty - ibucket_for_hash < NeighborhoodSize) { |
1563 | auto it = insert_in_bucket(std::forward<P>(value), hash, ibucket_empty, ibucket_for_hash); |
1564 | return std::make_pair(iterator(it, m_buckets.end(), m_overflow_elements.begin()), true); |
1565 | } |
1566 | } |
1567 | // else, try to swap values to get a closer empty bucket |
1568 | while(swap_empty_bucket_closer(ibucket_empty)); |
1569 | } |
1570 | |
1571 | // Load factor is too low or a rehash will not change the neighborhood, put the value in overflow list |
1572 | if(size() < m_min_load_factor_rehash_threshold || !will_neighborhood_change_on_rehash(ibucket_for_hash)) { |
1573 | auto it_insert = m_overflow_elements.insert(m_overflow_elements.end(), std::forward<P>(value)); |
1574 | m_buckets[ibucket_for_hash].set_overflow(true); |
1575 | m_nb_elements++; |
1576 | |
1577 | return std::make_pair(iterator(m_buckets.end(), m_buckets.end(), it_insert), true); |
1578 | } |
1579 | |
1580 | rehash(GrowthPolicy::next_bucket_count()); |
1581 | |
1582 | ibucket_for_hash = bucket_for_hash(hash); |
1583 | return insert_impl(std::forward<P>(value), hash, ibucket_for_hash); |
1584 | } |
1585 | |
1586 | /* |
1587 | * Return true if a rehash will change the position of a key-value in the neighborhood of |
1588 | * ibucket_neighborhood_check. In this case a rehash is needed instead of puting the value in overflow list. |
1589 | */ |
1590 | bool will_neighborhood_change_on_rehash(size_t ibucket_neighborhood_check) const { |
1591 | std::size_t expand_bucket_count = GrowthPolicy::next_bucket_count(); |
1592 | GrowthPolicy expand_growth_policy(expand_bucket_count); |
1593 | |
1594 | for(size_t ibucket = ibucket_neighborhood_check; |
1595 | ibucket < m_buckets.size() && (ibucket - ibucket_neighborhood_check) < NeighborhoodSize; |
1596 | ++ibucket) |
1597 | { |
1598 | tsl_assert(!m_buckets[ibucket].empty()); |
1599 | |
1600 | const size_t hash = USE_STORED_HASH_ON_REHASH? |
1601 | m_buckets[ibucket].truncated_bucket_hash(): |
1602 | hash_key(KeySelect()(m_buckets[ibucket].value())); |
1603 | if(bucket_for_hash(hash) != expand_growth_policy.bucket_for_hash(hash)) { |
1604 | return true; |
1605 | } |
1606 | } |
1607 | |
1608 | return false; |
1609 | } |
1610 | |
1611 | /* |
1612 | * Return the index of an empty bucket in m_buckets. |
1613 | * If none, the returned index equals m_buckets.size() |
1614 | */ |
1615 | std::size_t find_empty_bucket(std::size_t ibucket_start) const { |
1616 | const std::size_t limit = std::min(ibucket_start + MAX_PROBES_FOR_EMPTY_BUCKET, m_buckets.size()); |
1617 | for(; ibucket_start < limit; ibucket_start++) { |
1618 | if(m_buckets[ibucket_start].empty()) { |
1619 | return ibucket_start; |
1620 | } |
1621 | } |
1622 | |
1623 | return m_buckets.size(); |
1624 | } |
1625 | |
1626 | /* |
1627 | * Insert value in ibucket_empty where value originally belongs to ibucket_for_hash |
1628 | * |
1629 | * Return bucket iterator to ibucket_empty |
1630 | */ |
1631 | template<typename P> |
1632 | iterator_buckets insert_in_bucket(P&& value, std::size_t hash, |
1633 | std::size_t ibucket_empty, std::size_t ibucket_for_hash) |
1634 | { |
1635 | tsl_assert(ibucket_empty >= ibucket_for_hash ); |
1636 | tsl_assert(m_buckets[ibucket_empty].empty()); |
1637 | m_buckets[ibucket_empty].set_value_of_empty_bucket(std::forward<P>(value), hash); |
1638 | |
1639 | tsl_assert(!m_buckets[ibucket_for_hash].empty()); |
1640 | m_buckets[ibucket_for_hash].toggle_neighbor_presence(ibucket_empty - ibucket_for_hash); |
1641 | m_nb_elements++; |
1642 | |
1643 | return m_buckets.begin() + ibucket_empty; |
1644 | } |
1645 | |
1646 | /* |
1647 | * Try to swap the bucket ibucket_empty_in_out with a bucket preceding it while keeping the neighborhood |
1648 | * conditions correct. |
1649 | * |
1650 | * If a swap was possible, the position of ibucket_empty_in_out will be closer to 0 and true will re returned. |
1651 | */ |
1652 | bool swap_empty_bucket_closer(std::size_t& ibucket_empty_in_out) { |
1653 | tsl_assert(ibucket_empty_in_out >= NeighborhoodSize); |
1654 | const std::size_t neighborhood_start = ibucket_empty_in_out - NeighborhoodSize + 1; |
1655 | |
1656 | for(std::size_t to_check = neighborhood_start; to_check < ibucket_empty_in_out; to_check++) { |
1657 | neighborhood_bitmap neighborhood_infos = m_buckets[to_check].neighborhood_infos(); |
1658 | std::size_t to_swap = to_check; |
1659 | |
1660 | while(neighborhood_infos != 0 && to_swap < ibucket_empty_in_out) { |
1661 | if((neighborhood_infos & 1) == 1) { |
1662 | tsl_assert(m_buckets[ibucket_empty_in_out].empty()); |
1663 | tsl_assert(!m_buckets[to_swap].empty()); |
1664 | |
1665 | m_buckets[to_swap].swap_value_into_empty_bucket(m_buckets[ibucket_empty_in_out]); |
1666 | |
1667 | tsl_assert(!m_buckets[to_check].check_neighbor_presence(ibucket_empty_in_out - to_check)); |
1668 | tsl_assert(m_buckets[to_check].check_neighbor_presence(to_swap - to_check)); |
1669 | |
1670 | m_buckets[to_check].toggle_neighbor_presence(ibucket_empty_in_out - to_check); |
1671 | m_buckets[to_check].toggle_neighbor_presence(to_swap - to_check); |
1672 | |
1673 | |
1674 | ibucket_empty_in_out = to_swap; |
1675 | |
1676 | return true; |
1677 | } |
1678 | |
1679 | to_swap++; |
1680 | neighborhood_infos = neighborhood_bitmap(neighborhood_infos >> 1); |
1681 | } |
1682 | } |
1683 | |
1684 | return false; |
1685 | } |
1686 | |
1687 | |
1688 | |
1689 | template<class K, class U = ValueSelect, typename std::enable_if<has_mapped_type<U>::value>::type* = nullptr> |
1690 | typename U::value_type* find_value_impl(const K& key, std::size_t hash, iterator_buckets it_bucket) { |
1691 | return const_cast<typename U::value_type*>( |
1692 | static_cast<const hopscotch_hash*>(this)->find_value_impl(key, hash, it_bucket)); |
1693 | } |
1694 | |
1695 | /* |
1696 | * Avoid the creation of an iterator to just get the value for operator[] and at() in maps. Faster this way. |
1697 | * |
1698 | * Return null if no value for key (TODO use std::optional when available). |
1699 | */ |
1700 | template<class K, class U = ValueSelect, typename std::enable_if<has_mapped_type<U>::value>::type* = nullptr> |
1701 | const typename U::value_type* find_value_impl(const K& key, std::size_t hash, |
1702 | const_iterator_buckets it_bucket) const |
1703 | { |
1704 | auto it_find = find_in_buckets(key, hash, it_bucket); |
1705 | if(it_find != m_buckets.cend()) { |
1706 | return std::addressof(ValueSelect()(it_find->value())); |
1707 | } |
1708 | |
1709 | if(it_bucket->has_overflow()) { |
1710 | auto it_overflow = find_in_overflow(key); |
1711 | if(it_overflow != m_overflow_elements.end()) { |
1712 | return std::addressof(ValueSelect()(*it_overflow)); |
1713 | } |
1714 | } |
1715 | |
1716 | return nullptr; |
1717 | } |
1718 | |
1719 | template<class K> |
1720 | size_type count_impl(const K& key, std::size_t hash, const_iterator_buckets it_bucket) const { |
1721 | if(find_in_buckets(key, hash, it_bucket) != m_buckets.cend()) { |
1722 | return 1; |
1723 | } |
1724 | else if(it_bucket->has_overflow() && find_in_overflow(key) != m_overflow_elements.cend()) { |
1725 | return 1; |
1726 | } |
1727 | else { |
1728 | return 0; |
1729 | } |
1730 | } |
1731 | |
1732 | template<class K> |
1733 | iterator find_impl(const K& key, std::size_t hash, iterator_buckets it_bucket) { |
1734 | auto it = find_in_buckets(key, hash, it_bucket); |
1735 | if(it != m_buckets.end()) { |
1736 | return iterator(it, m_buckets.end(), m_overflow_elements.begin()); |
1737 | } |
1738 | |
1739 | if(!it_bucket->has_overflow()) { |
1740 | return end(); |
1741 | } |
1742 | |
1743 | return iterator(m_buckets.end(), m_buckets.end(), find_in_overflow(key)); |
1744 | } |
1745 | |
1746 | template<class K> |
1747 | const_iterator find_impl(const K& key, std::size_t hash, const_iterator_buckets it_bucket) const { |
1748 | auto it = find_in_buckets(key, hash, it_bucket); |
1749 | if(it != m_buckets.cend()) { |
1750 | return const_iterator(it, m_buckets.cend(), m_overflow_elements.cbegin()); |
1751 | } |
1752 | |
1753 | if(!it_bucket->has_overflow()) { |
1754 | return cend(); |
1755 | } |
1756 | |
1757 | |
1758 | return const_iterator(m_buckets.cend(), m_buckets.cend(), find_in_overflow(key)); |
1759 | } |
1760 | |
1761 | template<class K> |
1762 | iterator_buckets find_in_buckets(const K& key, std::size_t hash, iterator_buckets it_bucket) { |
1763 | auto it_find = static_cast<const hopscotch_hash*>(this)->find_in_buckets(key, hash, it_bucket); |
1764 | return m_buckets.begin() + std::distance(m_buckets.cbegin(), it_find); |
1765 | } |
1766 | |
1767 | |
1768 | template<class K> |
1769 | const_iterator_buckets find_in_buckets(const K& key, std::size_t hash, const_iterator_buckets it_bucket) const { |
1770 | (void) hash; // Avoid warning of unused variable when StoreHash is false; |
1771 | |
1772 | // TODO Try to optimize the function. |
1773 | // I tried to use ffs and __builtin_ffs functions but I could not reduce the time the function |
1774 | // takes with -march=native |
1775 | |
1776 | neighborhood_bitmap neighborhood_infos = it_bucket->neighborhood_infos(); |
1777 | while(neighborhood_infos != 0) { |
1778 | if((neighborhood_infos & 1) == 1) { |
1779 | // Check StoreHash before calling bucket_hash_equal. Functionally it doesn't change anythin. |
1780 | // If StoreHash is false, bucket_hash_equal is a no-op. Avoiding the call is there to help |
1781 | // GCC optimizes `hash` parameter away, it seems to not be able to do without this hint. |
1782 | if((!StoreHash || it_bucket->bucket_hash_equal(hash)) && |
1783 | compare_keys(KeySelect()(it_bucket->value()), key)) |
1784 | { |
1785 | return it_bucket; |
1786 | } |
1787 | } |
1788 | |
1789 | ++it_bucket; |
1790 | neighborhood_infos = neighborhood_bitmap(neighborhood_infos >> 1); |
1791 | } |
1792 | |
1793 | return m_buckets.end(); |
1794 | } |
1795 | |
1796 | |
1797 | // TODO Use a better way to check if we should use |
1798 | // std::find_if(m_overflow_elements.begin(), m_overflow_elements.end(), ...) or |
1799 | // m_overflow_elements.find(...) |
1800 | template<class K, class U = OverflowContainer, typename std::enable_if<!has_key_compare<U>::value>::type* = nullptr> |
1801 | iterator_overflow find_in_overflow(const K& key) { |
1802 | return std::find_if(m_overflow_elements.begin(), m_overflow_elements.end(), |
1803 | [&](const value_type& value) { |
1804 | return compare_keys(key, KeySelect()(value)); |
1805 | }); |
1806 | } |
1807 | |
1808 | template<class K, class U = OverflowContainer, typename std::enable_if<!has_key_compare<U>::value>::type* = nullptr> |
1809 | const_iterator_overflow find_in_overflow(const K& key) const { |
1810 | return std::find_if(m_overflow_elements.cbegin(), m_overflow_elements.cend(), |
1811 | [&](const value_type& value) { |
1812 | return compare_keys(key, KeySelect()(value)); |
1813 | }); |
1814 | } |
1815 | |
1816 | template<class K, class U = OverflowContainer, typename std::enable_if<has_key_compare<U>::value>::type* = nullptr> |
1817 | iterator_overflow find_in_overflow(const K& key) { |
1818 | return m_overflow_elements.find(key); |
1819 | } |
1820 | |
1821 | template<class K, class U = OverflowContainer, typename std::enable_if<has_key_compare<U>::value>::type* = nullptr> |
1822 | const_iterator_overflow find_in_overflow(const K& key) const { |
1823 | return m_overflow_elements.find(key); |
1824 | } |
1825 | |
1826 | template<class U = OverflowContainer, typename std::enable_if<!has_key_compare<U>::value>::type* = nullptr> |
1827 | hopscotch_hash new_hopscotch_hash(size_type bucket_count) { |
1828 | return hopscotch_hash(bucket_count, static_cast<Hash&>(*this), static_cast<KeyEqual&>(*this), |
1829 | get_allocator(), m_max_load_factor); |
1830 | } |
1831 | |
1832 | template<class U = OverflowContainer, typename std::enable_if<has_key_compare<U>::value>::type* = nullptr> |
1833 | hopscotch_hash new_hopscotch_hash(size_type bucket_count) { |
1834 | return hopscotch_hash(bucket_count, static_cast<Hash&>(*this), static_cast<KeyEqual&>(*this), |
1835 | get_allocator(), m_max_load_factor, m_overflow_elements.key_comp()); |
1836 | } |
1837 | |
1838 | public: |
1839 | static const size_type DEFAULT_INIT_BUCKETS_SIZE = 16; |
1840 | static constexpr float DEFAULT_MAX_LOAD_FACTOR = 0.9f; |
1841 | |
1842 | private: |
1843 | static const std::size_t MAX_PROBES_FOR_EMPTY_BUCKET = 12*NeighborhoodSize; |
1844 | static constexpr float MIN_LOAD_FACTOR_FOR_REHASH = 0.1f; |
1845 | |
1846 | static const bool USE_STORED_HASH_ON_REHASH = |
1847 | StoreHash && std::is_same<GrowthPolicy, tsl::power_of_two_growth_policy>::value; |
1848 | |
1849 | private: |
1850 | buckets_container_type m_buckets; |
1851 | overflow_container_type m_overflow_elements; |
1852 | |
1853 | size_type m_nb_elements; |
1854 | |
1855 | float m_max_load_factor; |
1856 | size_type m_load_threshold; |
1857 | size_type m_min_load_factor_rehash_threshold; |
1858 | }; |
1859 | |
1860 | } // end namespace detail_hopscotch_hash |
1861 | |
1862 | |
1863 | } // end namespace tsl |
1864 | |
1865 | #endif |
1866 | |