Andrew Scull | 5e1ddfa | 2018-08-14 10:06:54 +0100 | [diff] [blame] | 1 | //===- llvm/ADT/SmallSet.h - 'Normally small' sets --------------*- C++ -*-===// |
| 2 | // |
Andrew Walbran | 16937d0 | 2019-10-22 13:54:20 +0100 | [diff] [blame] | 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
Andrew Scull | 5e1ddfa | 2018-08-14 10:06:54 +0100 | [diff] [blame] | 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // This file defines the SmallSet class. |
| 10 | // |
| 11 | //===----------------------------------------------------------------------===// |
| 12 | |
| 13 | #ifndef LLVM_ADT_SMALLSET_H |
| 14 | #define LLVM_ADT_SMALLSET_H |
| 15 | |
| 16 | #include "llvm/ADT/None.h" |
| 17 | #include "llvm/ADT/SmallPtrSet.h" |
| 18 | #include "llvm/ADT/SmallVector.h" |
Andrew Scull | cdfcccc | 2018-10-05 20:58:37 +0100 | [diff] [blame] | 19 | #include "llvm/ADT/iterator.h" |
Andrew Scull | 5e1ddfa | 2018-08-14 10:06:54 +0100 | [diff] [blame] | 20 | #include "llvm/Support/Compiler.h" |
Andrew Scull | cdfcccc | 2018-10-05 20:58:37 +0100 | [diff] [blame] | 21 | #include "llvm/Support/type_traits.h" |
Andrew Scull | 5e1ddfa | 2018-08-14 10:06:54 +0100 | [diff] [blame] | 22 | #include <cstddef> |
| 23 | #include <functional> |
| 24 | #include <set> |
Andrew Scull | cdfcccc | 2018-10-05 20:58:37 +0100 | [diff] [blame] | 25 | #include <type_traits> |
Andrew Scull | 5e1ddfa | 2018-08-14 10:06:54 +0100 | [diff] [blame] | 26 | #include <utility> |
| 27 | |
| 28 | namespace llvm { |
| 29 | |
Andrew Scull | cdfcccc | 2018-10-05 20:58:37 +0100 | [diff] [blame] | 30 | /// SmallSetIterator - This class implements a const_iterator for SmallSet by |
| 31 | /// delegating to the underlying SmallVector or Set iterators. |
| 32 | template <typename T, unsigned N, typename C> |
| 33 | class SmallSetIterator |
| 34 | : public iterator_facade_base<SmallSetIterator<T, N, C>, |
| 35 | std::forward_iterator_tag, T> { |
| 36 | private: |
| 37 | using SetIterTy = typename std::set<T, C>::const_iterator; |
| 38 | using VecIterTy = typename SmallVector<T, N>::const_iterator; |
| 39 | using SelfTy = SmallSetIterator<T, N, C>; |
| 40 | |
| 41 | /// Iterators to the parts of the SmallSet containing the data. They are set |
| 42 | /// depending on isSmall. |
| 43 | union { |
| 44 | SetIterTy SetIter; |
| 45 | VecIterTy VecIter; |
| 46 | }; |
| 47 | |
| 48 | bool isSmall; |
| 49 | |
| 50 | public: |
| 51 | SmallSetIterator(SetIterTy SetIter) : SetIter(SetIter), isSmall(false) {} |
| 52 | |
| 53 | SmallSetIterator(VecIterTy VecIter) : VecIter(VecIter), isSmall(true) {} |
| 54 | |
| 55 | // Spell out destructor, copy/move constructor and assignment operators for |
| 56 | // MSVC STL, where set<T>::const_iterator is not trivially copy constructible. |
| 57 | ~SmallSetIterator() { |
| 58 | if (isSmall) |
| 59 | VecIter.~VecIterTy(); |
| 60 | else |
| 61 | SetIter.~SetIterTy(); |
| 62 | } |
| 63 | |
| 64 | SmallSetIterator(const SmallSetIterator &Other) : isSmall(Other.isSmall) { |
| 65 | if (isSmall) |
| 66 | VecIter = Other.VecIter; |
| 67 | else |
| 68 | // Use placement new, to make sure SetIter is properly constructed, even |
| 69 | // if it is not trivially copy-able (e.g. in MSVC). |
| 70 | new (&SetIter) SetIterTy(Other.SetIter); |
| 71 | } |
| 72 | |
| 73 | SmallSetIterator(SmallSetIterator &&Other) : isSmall(Other.isSmall) { |
| 74 | if (isSmall) |
| 75 | VecIter = std::move(Other.VecIter); |
| 76 | else |
| 77 | // Use placement new, to make sure SetIter is properly constructed, even |
| 78 | // if it is not trivially copy-able (e.g. in MSVC). |
| 79 | new (&SetIter) SetIterTy(std::move(Other.SetIter)); |
| 80 | } |
| 81 | |
| 82 | SmallSetIterator& operator=(const SmallSetIterator& Other) { |
| 83 | // Call destructor for SetIter, so it gets properly destroyed if it is |
| 84 | // not trivially destructible in case we are setting VecIter. |
| 85 | if (!isSmall) |
| 86 | SetIter.~SetIterTy(); |
| 87 | |
| 88 | isSmall = Other.isSmall; |
| 89 | if (isSmall) |
| 90 | VecIter = Other.VecIter; |
| 91 | else |
| 92 | new (&SetIter) SetIterTy(Other.SetIter); |
| 93 | return *this; |
| 94 | } |
| 95 | |
| 96 | SmallSetIterator& operator=(SmallSetIterator&& Other) { |
| 97 | // Call destructor for SetIter, so it gets properly destroyed if it is |
| 98 | // not trivially destructible in case we are setting VecIter. |
| 99 | if (!isSmall) |
| 100 | SetIter.~SetIterTy(); |
| 101 | |
| 102 | isSmall = Other.isSmall; |
| 103 | if (isSmall) |
| 104 | VecIter = std::move(Other.VecIter); |
| 105 | else |
| 106 | new (&SetIter) SetIterTy(std::move(Other.SetIter)); |
| 107 | return *this; |
| 108 | } |
| 109 | |
| 110 | bool operator==(const SmallSetIterator &RHS) const { |
| 111 | if (isSmall != RHS.isSmall) |
| 112 | return false; |
| 113 | if (isSmall) |
| 114 | return VecIter == RHS.VecIter; |
| 115 | return SetIter == RHS.SetIter; |
| 116 | } |
| 117 | |
| 118 | SmallSetIterator &operator++() { // Preincrement |
| 119 | if (isSmall) |
| 120 | VecIter++; |
| 121 | else |
| 122 | SetIter++; |
| 123 | return *this; |
| 124 | } |
| 125 | |
| 126 | const T &operator*() const { return isSmall ? *VecIter : *SetIter; } |
| 127 | }; |
| 128 | |
Andrew Scull | 5e1ddfa | 2018-08-14 10:06:54 +0100 | [diff] [blame] | 129 | /// SmallSet - This maintains a set of unique values, optimizing for the case |
| 130 | /// when the set is small (less than N). In this case, the set can be |
| 131 | /// maintained with no mallocs. If the set gets large, we expand to using an |
| 132 | /// std::set to maintain reasonable lookup times. |
Andrew Scull | 5e1ddfa | 2018-08-14 10:06:54 +0100 | [diff] [blame] | 133 | template <typename T, unsigned N, typename C = std::less<T>> |
| 134 | class SmallSet { |
| 135 | /// Use a SmallVector to hold the elements here (even though it will never |
| 136 | /// reach its 'large' stage) to avoid calling the default ctors of elements |
| 137 | /// we will never use. |
| 138 | SmallVector<T, N> Vector; |
| 139 | std::set<T, C> Set; |
| 140 | |
| 141 | using VIterator = typename SmallVector<T, N>::const_iterator; |
| 142 | using mutable_iterator = typename SmallVector<T, N>::iterator; |
| 143 | |
| 144 | // In small mode SmallPtrSet uses linear search for the elements, so it is |
| 145 | // not a good idea to choose this value too high. You may consider using a |
| 146 | // DenseSet<> instead if you expect many elements in the set. |
| 147 | static_assert(N <= 32, "N should be small"); |
| 148 | |
| 149 | public: |
| 150 | using size_type = size_t; |
Andrew Scull | cdfcccc | 2018-10-05 20:58:37 +0100 | [diff] [blame] | 151 | using const_iterator = SmallSetIterator<T, N, C>; |
Andrew Scull | 5e1ddfa | 2018-08-14 10:06:54 +0100 | [diff] [blame] | 152 | |
| 153 | SmallSet() = default; |
| 154 | |
| 155 | LLVM_NODISCARD bool empty() const { |
| 156 | return Vector.empty() && Set.empty(); |
| 157 | } |
| 158 | |
| 159 | size_type size() const { |
| 160 | return isSmall() ? Vector.size() : Set.size(); |
| 161 | } |
| 162 | |
| 163 | /// count - Return 1 if the element is in the set, 0 otherwise. |
| 164 | size_type count(const T &V) const { |
| 165 | if (isSmall()) { |
| 166 | // Since the collection is small, just do a linear search. |
| 167 | return vfind(V) == Vector.end() ? 0 : 1; |
| 168 | } else { |
| 169 | return Set.count(V); |
| 170 | } |
| 171 | } |
| 172 | |
| 173 | /// insert - Insert an element into the set if it isn't already there. |
| 174 | /// Returns true if the element is inserted (it was not in the set before). |
| 175 | /// The first value of the returned pair is unused and provided for |
| 176 | /// partial compatibility with the standard library self-associative container |
| 177 | /// concept. |
| 178 | // FIXME: Add iterators that abstract over the small and large form, and then |
| 179 | // return those here. |
| 180 | std::pair<NoneType, bool> insert(const T &V) { |
| 181 | if (!isSmall()) |
| 182 | return std::make_pair(None, Set.insert(V).second); |
| 183 | |
| 184 | VIterator I = vfind(V); |
| 185 | if (I != Vector.end()) // Don't reinsert if it already exists. |
| 186 | return std::make_pair(None, false); |
| 187 | if (Vector.size() < N) { |
| 188 | Vector.push_back(V); |
| 189 | return std::make_pair(None, true); |
| 190 | } |
| 191 | |
| 192 | // Otherwise, grow from vector to set. |
| 193 | while (!Vector.empty()) { |
| 194 | Set.insert(Vector.back()); |
| 195 | Vector.pop_back(); |
| 196 | } |
| 197 | Set.insert(V); |
| 198 | return std::make_pair(None, true); |
| 199 | } |
| 200 | |
| 201 | template <typename IterT> |
| 202 | void insert(IterT I, IterT E) { |
| 203 | for (; I != E; ++I) |
| 204 | insert(*I); |
| 205 | } |
| 206 | |
| 207 | bool erase(const T &V) { |
| 208 | if (!isSmall()) |
| 209 | return Set.erase(V); |
| 210 | for (mutable_iterator I = Vector.begin(), E = Vector.end(); I != E; ++I) |
| 211 | if (*I == V) { |
| 212 | Vector.erase(I); |
| 213 | return true; |
| 214 | } |
| 215 | return false; |
| 216 | } |
| 217 | |
| 218 | void clear() { |
| 219 | Vector.clear(); |
| 220 | Set.clear(); |
| 221 | } |
| 222 | |
Andrew Scull | cdfcccc | 2018-10-05 20:58:37 +0100 | [diff] [blame] | 223 | const_iterator begin() const { |
| 224 | if (isSmall()) |
| 225 | return {Vector.begin()}; |
| 226 | return {Set.begin()}; |
| 227 | } |
| 228 | |
| 229 | const_iterator end() const { |
| 230 | if (isSmall()) |
| 231 | return {Vector.end()}; |
| 232 | return {Set.end()}; |
| 233 | } |
| 234 | |
Olivier Deprez | f4ef2d0 | 2021-04-20 13:36:24 +0200 | [diff] [blame] | 235 | /// Check if the SmallSet contains the given element. |
| 236 | bool contains(const T &V) const { |
| 237 | if (isSmall()) |
| 238 | return vfind(V) != Vector.end(); |
| 239 | return Set.find(V) != Set.end(); |
| 240 | } |
| 241 | |
Andrew Scull | 5e1ddfa | 2018-08-14 10:06:54 +0100 | [diff] [blame] | 242 | private: |
| 243 | bool isSmall() const { return Set.empty(); } |
| 244 | |
| 245 | VIterator vfind(const T &V) const { |
| 246 | for (VIterator I = Vector.begin(), E = Vector.end(); I != E; ++I) |
| 247 | if (*I == V) |
| 248 | return I; |
| 249 | return Vector.end(); |
| 250 | } |
| 251 | }; |
| 252 | |
| 253 | /// If this set is of pointer values, transparently switch over to using |
| 254 | /// SmallPtrSet for performance. |
| 255 | template <typename PointeeType, unsigned N> |
| 256 | class SmallSet<PointeeType*, N> : public SmallPtrSet<PointeeType*, N> {}; |
| 257 | |
Olivier Deprez | f4ef2d0 | 2021-04-20 13:36:24 +0200 | [diff] [blame] | 258 | /// Equality comparison for SmallSet. |
| 259 | /// |
| 260 | /// Iterates over elements of LHS confirming that each element is also a member |
| 261 | /// of RHS, and that RHS contains no additional values. |
| 262 | /// Equivalent to N calls to RHS.count. |
| 263 | /// For small-set mode amortized complexity is O(N^2) |
| 264 | /// For large-set mode amortized complexity is linear, worst case is O(N^2) (if |
| 265 | /// every hash collides). |
| 266 | template <typename T, unsigned LN, unsigned RN, typename C> |
| 267 | bool operator==(const SmallSet<T, LN, C> &LHS, const SmallSet<T, RN, C> &RHS) { |
| 268 | if (LHS.size() != RHS.size()) |
| 269 | return false; |
| 270 | |
| 271 | // All elements in LHS must also be in RHS |
| 272 | return all_of(LHS, [&RHS](const T &E) { return RHS.count(E); }); |
| 273 | } |
| 274 | |
| 275 | /// Inequality comparison for SmallSet. |
| 276 | /// |
| 277 | /// Equivalent to !(LHS == RHS). See operator== for performance notes. |
| 278 | template <typename T, unsigned LN, unsigned RN, typename C> |
| 279 | bool operator!=(const SmallSet<T, LN, C> &LHS, const SmallSet<T, RN, C> &RHS) { |
| 280 | return !(LHS == RHS); |
| 281 | } |
| 282 | |
Andrew Scull | 5e1ddfa | 2018-08-14 10:06:54 +0100 | [diff] [blame] | 283 | } // end namespace llvm |
| 284 | |
| 285 | #endif // LLVM_ADT_SMALLSET_H |