2 * Copyright (C) 2002-2025 CERN for the benefit of the ATLAS collaboration.
5 * @file CxxUtils/ConcurrentHashmapImpl.h
6 * @author scott snyder <snyder@bnl.gov>
8 * @brief Hash table allowing concurrent, lockless reads.
22 * @param hash The hash of the entry we're looking for.
23 * @param mask Table mask; i.e., the table capacity - 1.
24 * @param maskBits Number of 1 bits in mask.
25 * @param probeLimit Maximum number of probes to try before failing.
27 template <unsigned ENTRIES_PER_CACHELINE>
29 CHMTableIterator<ENTRIES_PER_CACHELINE>::CHMTableIterator
30 (size_t hash, size_t mask, size_t maskBits, size_t probeLimit)
31 // Mask limited to the table. Also mask off the part within a cache line.
32 : m_mask ((mask & ~ENTRIES_PER_CACHELINE_MASK)),
33 // Offset of hash within a cache line.
34 m_boffs (hash & ENTRIES_PER_CACHELINE_MASK),
35 // Starting increment between hash probes.
36 // Must be large enough to go to a new cache line, which is why
37 // we or in ENTRIES_PER_CACHELINE.
38 m_stride (((hash >> maskBits) | hash | ENTRIES_PER_CACHELINE) & ENTRIES_PER_CACHELINE_MASK),
39 m_probeLimit (probeLimit),
40 // Index at the start of the cache line containing hash.
41 m_bucket (hash & m_mask),
48 * @brief Offset of the element currently being probed.
50 template <unsigned ENTRIES_PER_CACHELINE>
52 size_t CHMTableIterator<ENTRIES_PER_CACHELINE>::offset() const
54 // m_bucket the starting index of the current cache line.
55 // Count within the cache line in a circular manner starting
57 return m_bucket + ((m_nprobes + m_boffs)&ENTRIES_PER_CACHELINE_MASK);
62 * @brief Return the number of probes performed so far.
64 template <unsigned ENTRIES_PER_CACHELINE>
66 size_t CHMTableIterator<ENTRIES_PER_CACHELINE>::nprobes() const
73 * @brief Move to the next probe.
74 * Returns true if we should continue, or false if we've hit the maximum
77 template <unsigned ENTRIES_PER_CACHELINE>
79 bool CHMTableIterator<ENTRIES_PER_CACHELINE>::next()
81 // Increment number of probes and stop if we've hit the maximum.
82 if (++m_nprobes >= m_probeLimit) {
85 // We've finished a cache line if the low bits are back to 0.
86 if ((m_nprobes & ENTRIES_PER_CACHELINE_MASK) == 0) {
87 // Move to a different cacheline.
88 // cf. knuth AOCP exercise 6.4.20.
89 // By construction, the low bits (within the cacheline) of
90 // m_bucket, m_nprobes, and m_stride should all be 0.
91 m_bucket = (m_bucket + m_nprobes + m_stride) & m_mask;
97 //*****************************************************************************
101 template <template <class> class UPDATER_, \
104 uintptr_t NULLVAL_, \
105 uintptr_t TOMBSTONE_>
107 #define CHMIMPL ConcurrentHashmapImpl<UPDATER_, HASHER_, MATCHER_, NULLVAL_, TOMBSTONE_>
111 * @brief Constructor.
112 * @param capacity Number of entries in the table. Must be a power of 2.
113 * @param hasher Hash object to use.
114 * @param matcher Key match object to use.
117 CHMIMPL::Table::Table (size_t capacity,
118 const Hasher_t& hasher /*= Hasher_t()*/,
119 const Matcher_t& matcher /*= Matcher_t()*/)
120 : m_capacity (capacity),
121 m_maxProbe (capacity / 4),
123 m_maskBits (std::countr_zero (capacity)),
128 // Clear all the keys.
129 for (size_t i = 0; i < capacity; i++) {
130 m_entries[i].m_key = nullval;
136 * @brief Allocator for table objects.
137 * @param capacity Size of the table (must be a power of 2).
139 * Allocate with enough space for the table of entries.
140 * Also align on a cache line.
143 void* CHMIMPL::Table::operator new (size_t, size_t capacity)
145 void* memptr = nullptr;
146 // Allocate aligned memory block.
147 // The Table structure includes one entry at the end,
148 // so subtract 1 from capacity.
149 posix_memalign (&memptr, CACHELINE, sizeof(Table) + (capacity-1)*sizeof(entry_t));
150 if (!memptr) std::abort();
156 * @brief Deallocator for table objects.
159 void CHMIMPL::Table::operator delete (void* p)
166 * @brief Find a table entry for reading.
167 * @param key The key for which to search.
168 * @param hash The hash of the key.
170 * Returns the matching entry, or nullptr.
173 size_t CHMIMPL::Table::probeRead (val_t key, size_t hash) const
175 // Iterate over table probes.
176 // We don't need to check more than the longest probe sequence
178 TableIterator it (hash, m_mask, m_maskBits, m_longestProbe);
180 size_t offset = it.offset();
181 const entry_t* ent = m_entries + offset;
182 if (ent->m_key == nullval) {
183 // If we hit an empty key, report failure.
186 if (m_matcher (ent->m_key, key)) {
187 // Found a matching key.
191 // Too many probes --- return failure.
197 * @brief Find a table entry for writing.
198 * @param key The key for which to search.
199 * @param hash The hash of the key.
200 * @param entry[out] The entry found.
202 * If we find the entry, return true with @c entry pointing at it.
203 * If we don't find it, and there's still room in the table, return false
204 * with @c entry pointing at the next empty entry.
205 * Otherwise, return false with @c entry set to nullptr.
208 size_t CHMIMPL::Table::probeWrite (val_t key, size_t hash, bool& insert)
210 // Iterate over table probes.
211 TableIterator it (hash, m_mask, m_maskBits, m_maxProbe);
213 size_t offset = it.offset();
214 entry_t* ent = m_entries + offset;
215 if (ent->m_key == nullval) {
216 // We hit an empty key; a new entry could be added here.
217 // Update the longest probe count.
218 CxxUtils::atomic_fetch_max (&m_longestProbe, it.nprobes()+1);
222 if (m_matcher (ent->m_key, key)) {
223 // Found a matching key.
228 // Too many probes --- return failure.
234 * @brief The number of entries in the table.
238 size_t CHMIMPL::Table::capacity() const
245 * @brief Return the entry for an offset.
246 * @param offset The index of the desired entry.
250 const typename CHMIMPL::entry_t& CHMIMPL::Table::entry (size_t offset) const
252 return m_entries[offset];
257 * @brief Return the entry for an offset (non-const).
258 * @param offset The index of the desired entry.
262 typename CHMIMPL::entry_t& CHMIMPL::Table::entry (size_t offset)
264 return m_entries[offset];
268 //*****************************************************************************
272 * @brief Constructor.
273 * @param updater Object used to manage memory
274 * (see comments at the start of the class).
275 * @param capacity Minimum initial table size.
276 * @param hasher Hash object to use.
277 * @param matcher Key match object to use.
278 * @param ctx Execution context.
281 CHMIMPL::ConcurrentHashmapImpl (Updater_t&& updater,
283 const Hasher_t& hasher,
284 const Matcher_t& matcher,
285 const typename Updater_t::Context_t& ctx)
286 : m_updater (std::move (updater)),
292 // Round up capacity to a power of 2.
293 size_t capacity = round_up (capacity_in);
295 m_table = new (capacity) Table (capacity, hasher, matcher);
296 m_updater.update (std::unique_ptr<Table> (m_table), ctx);
301 * @brief Take a lock on the container.
303 * Take a lock on the container.
304 * The lock can then be passed to put(), allowing to factor out the locking
305 * when put() gets used in a loop. The lock will be released when the
306 * lock object is destroyed.
310 typename CHMIMPL::Lock_t CHMIMPL::lock()
312 return Lock_t (m_mutex);
317 * @brief Add an entry to the table, with external locking.
318 * @param lock The lock object returned from lock().
319 * @param key The key to insert.
320 * @param hash The hash of the key.
321 * @param val The value to insert.
322 * @param overwrite If true, then overwrite an existing entry.
323 * If false, an existing entry will not be changed.
324 * @param ctx Execution context.
326 * If the key already exists, then its value will be updated.
327 * Returns an iterator pointing at the entry and a flag which is
328 * true if a new element was added.
331 std::pair<typename CHMIMPL::const_iterator, bool>
332 CHMIMPL::put (const Lock_t& lock,
333 val_t key, size_t hash, val_t val, bool overwrite,
334 const typename Updater_t::Context_t& ctx)
336 assert (key != nullval && key != tombstone);
340 size_t offset = m_table->probeWrite (key, hash, insert);
341 if (offset != INVALID) {
342 entry_t& ent = m_table->entry (offset);
344 // Found a place to put it.
345 // Be sure not to set the key until the value is in place.
351 // Found --- update the entry if wanted.
353 if (val != ent.m_val) {
358 return std::make_pair (const_iterator (*m_table, offset), insert);
361 // Need to grow the table.
362 } while (grow (lock, ctx));
365 return std::make_pair (end(), false);
370 * @brief Add an entry to the table.
371 * @param key The key to insert.
372 * @param hash The hash of the key.
373 * @param val The value to insert.
374 * @param overwrite If true, then overwrite an existing entry.
375 * If false, an existing entry will not be changed.
376 * @param ctx Execution context.
378 * If the key already exists, then its value will be updated.
379 * Returns an iterator pointing at the entry and a flag which is
380 * true if a new element was added.
384 std::pair<typename CHMIMPL::const_iterator, bool>
385 CHMIMPL::put (val_t key, size_t hash, val_t val, bool overwrite,
386 const typename Updater_t::Context_t& ctx)
388 return put (lock(), key, hash, val, overwrite, ctx);
393 * @brief Look up an entry in the table.
394 * @param key The key to find.
395 * @param hash The hash of the key.
397 * Returns an iterator pointing at the found entry, or end().
400 typename CHMIMPL::const_iterator CHMIMPL::get (val_t key, size_t hash) const
402 const Table& table = m_updater.get();
403 size_t offset = table.probeRead (key, hash);
404 // Offset will be -1 if not found --- invalid iterator.
405 return const_iterator (table, offset);
410 * @brief Erase an entry from the table, with external locking.
411 * @param lock The lock object returned from lock().
412 * @param key The key to find.
413 * @param hash The hash of the key.
415 * Mark the corresponding entry as deleted.
416 * Return true on success, false on failure (key not found).
418 * The tombstone value must be different from the null value.
420 * Take care if the key or value types require memory allocation.
422 * This may cause the key type returned by an iterator to change
423 * asynchronously to the tombstone value.
427 CHMIMPL::erase (const Lock_t& /*lock*/, val_t key, size_t hash)
429 static_assert (nullval != tombstone);
430 const Table& table = m_updater.get();
431 size_t offset = table.probeRead (key, hash);
432 if (offset != INVALID) {
433 entry_t& ent = m_table->entry (offset);
436 ent.m_key = tombstone;
444 * @brief Erase an entry from the table.
445 * @param key The key to find.
446 * @param hash The hash of the key.
448 * Mark the corresponding entry as deleted.
449 * Return true on success, false on failure (key not found).
451 * The tombstone value must be different from the null value.
453 * Take care if the key or value types require memory allocation.
455 * This may cause the key type returned by an iterator to change
456 * asynchronously to the tombstone value.
461 CHMIMPL::erase (val_t key, size_t hash)
463 return erase (lock(), key, hash);
468 * @brief Return the number of items currently stored.
471 size_t CHMIMPL::size() const
478 * @brief Return the current table size.
481 size_t CHMIMPL::capacity() const
483 const Table& table = m_updater.get();
484 return table.capacity();
489 * @brief The number of erased elements in the current table.
492 size_t CHMIMPL::erased() const
499 * @brief Return the hasher object.
503 const typename CHMIMPL::Hasher_t& CHMIMPL::hasher() const
510 * @brief Return the matcher object.
514 const typename CHMIMPL::Matcher_t& CHMIMPL::matcher() const
521 * @brief Constructor.
522 * @param table The table instance we're referencing.
523 * @param end If true, initialize this to an end iterator.
524 * Otherwise, initialize it to a a begin iterator.
528 CHMIMPL::const_iterator::const_iterator (const Table& table, bool end)
532 // For an end iterator, we want offset to be -1.
533 // For a begin iterator, we need to advance to the first non-null entry.
541 * @brief Constructor.
542 * @param table The table instance we're referencing.
543 * @param offset Offset of the iterator within the table.
544 * (Must point at an occupied entry.)
547 CHMIMPL::const_iterator::const_iterator (const Table& table, size_t offset)
551 assert (offset == INVALID || m_table.entry (offset).m_key != nullval);
556 * @brief Advance the iterator to the next occupied entry.
560 void CHMIMPL::const_iterator::next()
565 if (m_offset >= m_table.capacity()) {
569 key = m_table.entry (m_offset).m_key;
570 } while (key == nullval || key == tombstone);
575 * @brief Move the iterator back to the previous occupied entry.
579 void CHMIMPL::const_iterator::prev()
581 if (m_offset == INVALID) {
582 m_offset = m_table.capacity();
587 if (m_offset >= m_table.capacity()) {
591 key = m_table.entry (m_offset).m_key;
592 } while (key == nullval || key == tombstone);
597 * @brief Return the key for this iterator.
598 * If deletions are allowed, then the key may change asynchronously
599 * to the tombstone value.
603 typename CHMIMPL::val_t CHMIMPL::const_iterator::key() const
605 return m_table.entry (m_offset).m_key;
610 * @brief Return the value for this iterator.
614 typename CHMIMPL::val_t CHMIMPL::const_iterator::value() const
616 return m_table.entry (m_offset).m_val;
621 * @brief Compare two iterators.
625 bool CHMIMPL::const_iterator::operator!= (const const_iterator& other) const
627 if (m_offset != other.m_offset) return true;
628 if (m_offset == INVALID) return false;
629 return &m_table != &other.m_table;
634 * @brief Check that the iterator is valid (not pointing at the end).
638 bool CHMIMPL::const_iterator::valid() const
640 return m_offset != INVALID;
645 * @brief Return a range that can be used to iterate over the container.
649 typename CHMIMPL::const_iterator_range CHMIMPL::range() const
651 const Table& table = m_updater.get();
652 return const_iterator_range (const_iterator (table, false),
653 const_iterator (table, true));
658 * @brief A begin iterator for the container.
662 typename CHMIMPL::const_iterator CHMIMPL::begin() const
664 const Table& table = m_updater.get();
665 return const_iterator (table, false);
670 * @brief An end iterator for the container.
674 typename CHMIMPL::const_iterator CHMIMPL::end() const
676 const Table& table = m_updater.get();
677 return const_iterator (table, true);
682 * @brief Erase the table and change the capacity.
683 * @param capacity The new table capacity.
684 * @param ctx Execution context.
686 * Returns an iterator pointing at the start of the old table.
689 typename CHMIMPL::const_iterator
690 CHMIMPL::clear (size_t capacity,
691 const typename Updater_t::Context_t& ctx)
693 capacity = round_up (capacity);
694 Lock_t lock (m_mutex);
695 std::unique_ptr<Table> new_table (new (capacity) Table (capacity,
699 // Save an iterator to the old table.
700 const_iterator it = begin();
702 // Publish the new table.
705 m_table = new_table.get();
706 m_updater.update (std::move (new_table), ctx);
712 * @brief Erase the table (don't change the capacity).
713 * @param ctx Execution context.
715 * Returns an iterator pointing at the start of the old table.
718 typename CHMIMPL::const_iterator
719 CHMIMPL::clear (const typename Updater_t::Context_t& ctx)
721 const Table& table = m_updater.get();
722 // Possible race here in that the container capacity could increase
723 // before we take out the lock in clear(). In practice, this should
724 // not actually be a problem.
725 return clear (table.capacity(), ctx);
730 * @brief Erase the table by filling it with nulls.
732 * This method is not safe to use concurrently --- no other threads
733 * may be accessing the container at the same time, either for read
737 void CHMIMPL::forceClear()
739 Lock_t lock (m_mutex);
740 size_t cap = m_table->capacity();
741 for (size_t i = 0; i < cap; i++) {
742 m_table->entry(i).m_key.store (nullval, std::memory_order_relaxed);
746 std::atomic_thread_fence (std::memory_order_seq_cst);
751 * @brief Increase the table capacity.
752 * @param capacity The new table capacity.
753 * @param ctx Execution context.
755 * No action will be taken if @c capacity is smaller
756 * than the current capacity.
759 void CHMIMPL::reserve (size_t capacity,
760 const typename Updater_t::Context_t& ctx)
762 Lock_t lock (m_mutex);
763 if (capacity < m_table->capacity()) return;
764 grow (lock, round_up (capacity), ctx);
769 * @brief Called when this thread is no longer referencing anything
770 * from this container.
771 * @param ctx Execution context.
774 void CHMIMPL::quiescent (const typename Updater_t::Context_t& ctx)
776 m_updater.quiescent (ctx);
781 * @brief Swap this container with another.
782 * @param other The container with which to swap.
784 * This will also call swap on the Updater object; hence, the Updater
785 * object must also support swap. The Hasher and Matcher instances
788 * This operation is NOT thread-safe. No other threads may be accessing
789 * either container during this operation.
792 void CHMIMPL::swap (ConcurrentHashmapImpl& other)
794 // Shouldn't be needed since we specified that no other threads can be
796 Lock_t lock (m_mutex);
797 Lock_t lock_other (other.m_mutex);
799 m_updater.swap (other.m_updater);
800 std::swap (m_table, other.m_table);
802 auto swap_atomic = [] (std::atomic<size_t>& a, std::atomic<size_t>& b)
804 size_t tmp = a.load (std::memory_order_relaxed);
805 a.store (b.load (std::memory_order_relaxed),
806 std::memory_order_relaxed);
807 b.store (tmp, std::memory_order_relaxed);
810 swap_atomic (m_size, other.m_size);
811 swap_atomic (m_erased, other.m_erased);
816 * @brief Access the Updater instance.
820 typename CHMIMPL::Updater_t& CHMIMPL::updater()
827 * @brief Make the table larger.
828 * @param ctx Execution context.
830 * Must be holding a lock on the mutex to call this.
833 bool CHMIMPL::grow (const Lock_t& lock, const typename Updater_t::Context_t& ctx)
835 // Allocate a new table with twice the capacity, unless there
836 // have been many erasures.
837 size_t new_capacity = m_erased >= m_table->capacity()/2 ?
838 m_table->capacity() : 2*m_table->capacity();
839 return grow (lock, new_capacity, ctx);
844 * @brief Make the table larger.
845 * @param new_capacity The new table capacity (must be a power of 2).
846 * @param ctx Execution context.
848 * Must be holding a lock on the mutex to call this.
851 bool CHMIMPL::grow (const Lock_t& /*lock*/,
853 const typename Updater_t::Context_t& ctx)
855 // The current table.
856 const Table& table = *m_table;
858 std::unique_ptr<Table> new_table (new (new_capacity) Table (new_capacity,
862 // Copy data from the existing table to the new one.
863 size_t capacity = table.capacity();
864 for (size_t i = 0; i < capacity; i++) {
865 const entry_t& ent = table.entry(i);
866 if (ent.m_key != nullval) {
867 size_t hash = m_hasher (ent.m_key);
869 size_t offset = new_table->probeWrite (ent.m_key, hash, insert);
870 if (offset == INVALID) {
873 entry_t& new_entry = new_table->entry (offset);
874 new_entry.m_key = static_cast<val_t> (ent.m_key);
875 new_entry.m_val = static_cast<val_t> (ent.m_val);
881 // Publish the new table.
882 m_table = new_table.get();
883 m_updater.update (std::move (new_table), ctx);
890 * @brief Round up to a power of 2.
893 uint64_t CHMIMPL::round_up (uint64_t x)
895 if (x <= 64) return 64;
896 return std::bit_ceil (x);
905 } // namespace detail
906 } // namespace CxxUtils