//===- llvm/ADT/SparseMultiSet.h - Sparse multiset --------------*- C++ -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// /// /// \file /// This file defines the SparseMultiSet class, which adds multiset behavior to /// the SparseSet. /// /// A sparse multiset holds a small number of objects identified by integer keys /// from a moderately sized universe. The sparse multiset uses more memory than /// other containers in order to provide faster operations. Any key can map to /// multiple values. A SparseMultiSetNode class is provided, which serves as a /// convenient base class for the contents of a SparseMultiSet. /// //===----------------------------------------------------------------------===// #ifndef LLVM_ADT_SPARSEMULTISET_H #define LLVM_ADT_SPARSEMULTISET_H #include "llvm/ADT/identity.h" #include "llvm/ADT/SmallVector.h" #include "llvm/ADT/SparseSet.h" #include <cassert> #include <cstdint> #include <cstdlib> #include <iterator> #include <limits> #include <utility> namespace llvm { /// Fast multiset implementation for objects that can be identified by small /// unsigned keys. /// /// SparseMultiSet allocates memory proportional to the size of the key /// universe, so it is not recommended for building composite data structures. /// It is useful for algorithms that require a single set with fast operations. /// /// Compared to DenseSet and DenseMap, SparseMultiSet provides constant-time /// fast clear() as fast as a vector. The find(), insert(), and erase() /// operations are all constant time, and typically faster than a hash table. /// The iteration order doesn't depend on numerical key values, it only depends /// on the order of insert() and erase() operations. Iteration order is the /// insertion order. Iteration is only provided over elements of equivalent /// keys, but iterators are bidirectional. /// /// Compared to BitVector, SparseMultiSet<unsigned> uses 8x-40x more memory, but /// offers constant-time clear() and size() operations as well as fast iteration /// independent on the size of the universe. /// /// SparseMultiSet contains a dense vector holding all the objects and a sparse /// array holding indexes into the dense vector. Most of the memory is used by /// the sparse array which is the size of the key universe. The SparseT template /// parameter provides a space/speed tradeoff for sets holding many elements. /// /// When SparseT is uint32_t, find() only touches up to 3 cache lines, but the /// sparse array uses 4 x Universe bytes. /// /// When SparseT is uint8_t (the default), find() touches up to 3+[N/256] cache /// lines, but the sparse array is 4x smaller. N is the number of elements in /// the set. /// /// For sets that may grow to thousands of elements, SparseT should be set to /// uint16_t or uint32_t. /// /// Multiset behavior is provided by providing doubly linked lists for values /// that are inlined in the dense vector. SparseMultiSet is a good choice when /// one desires a growable number of entries per key, as it will retain the /// SparseSet algorithmic properties despite being growable. Thus, it is often a /// better choice than a SparseSet of growable containers or a vector of /// vectors. SparseMultiSet also keeps iterators valid after erasure (provided /// the iterators don't point to the element erased), allowing for more /// intuitive and fast removal. /// /// @tparam ValueT The type of objects in the set. /// @tparam KeyFunctorT A functor that computes an unsigned index from KeyT. /// @tparam SparseT An unsigned integer type. See above. /// template<typename ValueT, typename KeyFunctorT = identity<unsigned>, typename SparseT = uint8_t> class SparseMultiSet { … }; } // end namespace llvm #endif // LLVM_ADT_SPARSEMULTISET_H