// Part of the Carbon Language project, under the Apache License v2.0 with LLVM // Exceptions. See /LICENSE for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception #ifndef CARBON_COMMON_MAP_H_ #define CARBON_COMMON_MAP_H_ #include #include #include #include "common/check.h" #include "common/hashtable_key_context.h" #include "common/raw_hashtable.h" #include "llvm/Support/Compiler.h" namespace Carbon { // Forward declarations to resolve cyclic references. template class MapView; template class MapBase; template class Map; // A read-only view type for a map from key to value. // // This view is a cheap-to-copy type that should be passed by value, but // provides view or read-only reference semantics to the underlying map data // structure. // // This should always be preferred to a `const`-ref parameter for the `MapBase` // or `Map` type as it provides more flexibility and a cleaner API. // // Note that while this type is a read-only view, that applies to the underlying // *map* data structure, not the individual entries stored within it. Those can // be mutated freely as long as both the hashes and equality of the keys are // preserved. If we applied a deep-`const` design here, it would prevent using // this type in many useful situations where the elements are mutated but the // associative container is not. A view of immutable data can always be obtained // by using `MapView`, and we enable conversions to more-const // views. This mirrors the semantics of views like `std::span`. // // A specific `KeyContextT` type can optionally be provided to configure how // keys will be hashed and compared. The default is `DefaultKeyContext` which is // stateless and will hash using `Carbon::HashValue` and compare using // `operator==`. Every method accepting a lookup key or operating on the keys in // the table will also accept an instance of this type. For stateless context // types, including the default, an instance will be default constructed if not // provided to these methods. However, stateful contexts should be constructed // and passed in explicitly. The context type should be small and reasonable to // pass by value, often a wrapper or pointer to the relevant context needed for // hashing and comparing keys. For more details about the key context, see // `hashtable_key_context.h`. template class MapView : RawHashtable::ViewImpl { using ImplT = RawHashtable::ViewImpl; using EntryT = typename ImplT::EntryT; public: using KeyT = typename ImplT::KeyT; using ValueT = typename ImplT::ValueT; using KeyContextT = typename ImplT::KeyContextT; // This type represents the result of lookup operations. It encodes whether // the lookup was a success as well as accessors for the key and value. class LookupKVResult { public: LookupKVResult() = default; explicit LookupKVResult(EntryT* entry) : entry_(entry) {} explicit operator bool() const { return entry_ != nullptr; } auto key() const -> KeyT& { return entry_->key(); } auto value() const -> ValueT& { return entry_->value(); } private: EntryT* entry_ = nullptr; }; // Enable implicit conversions that add `const`-ness to either key or value // type. This is always safe to do with a view. We use a template to avoid // needing all 3 versions. template // NOLINTNEXTLINE(google-explicit-constructor) MapView(MapView other_view) requires(std::same_as || std::same_as) && (std::same_as || std::same_as) : ImplT(other_view) {} // Tests whether a key is present in the map. template auto Contains(LookupKeyT lookup_key, KeyContextT key_context = KeyContextT()) const -> bool; // Lookup a key in the map. template auto Lookup(LookupKeyT lookup_key, KeyContextT key_context = KeyContextT()) const -> LookupKVResult; // Lookup a key in the map and try to return a pointer to its value. Returns // null on a missing key. template auto operator[](LookupKeyT lookup_key) const -> ValueT* requires(std::default_initializable); // Run the provided callback for every key and value in the map. template void ForEach(CallbackT callback) requires(std::invocable); // This routine is relatively inefficient and only intended for use in // benchmarking or logging of performance anomalies. The specific count // returned has no specific guarantees beyond being informative in benchmarks. // It counts how many of the keys in the hashtable have required probing // beyond their initial group of slots. // // TODO: Replace with a more general metrics routine that covers other // important aspects such as load factor, and average probe *distance*. auto CountProbedKeys(KeyContextT key_context = KeyContextT()) -> ssize_t { return ImplT::CountProbedKeys(key_context); } private: template friend class Map; friend class MapBase; friend class MapView; friend class MapView; friend class MapView; MapView() = default; // NOLINTNEXTLINE(google-explicit-constructor): Implicit by design. MapView(ImplT base) : ImplT(base) {} MapView(ssize_t size, RawHashtable::Storage* storage) : ImplT(size, storage) {} }; // A base class for a `Map` type that remains mutable while type-erasing the // `SmallSize` (SSO) template parameter. // // A pointer or reference to this type is the preferred way to pass a mutable // handle to a `Map` type across API boundaries as it avoids encoding specific // SSO sizing information while providing a near-complete mutable API. template class MapBase : protected RawHashtable::BaseImpl { protected: using ImplT = RawHashtable::BaseImpl; using EntryT = typename ImplT::EntryT; public: using KeyT = typename ImplT::KeyT; using ValueT = typename ImplT::ValueT; using KeyContextT = typename ImplT::KeyContextT; using ViewT = MapView; using LookupKVResult = typename ViewT::LookupKVResult; // The result type for insertion operations both indicates whether an insert // was needed (as opposed to finding an existing element), and provides access // to the element's key and value. class InsertKVResult { public: InsertKVResult() = default; explicit InsertKVResult(bool inserted, EntryT& entry) : entry_(&entry), inserted_(inserted) {} auto is_inserted() const -> bool { return inserted_; } auto key() const -> KeyT& { return entry_->key(); } auto value() const -> ValueT& { return entry_->value(); } private: EntryT* entry_; bool inserted_; }; // Implicitly convertible to the relevant view type. // // NOLINTNEXTLINE(google-explicit-constructor): Designed to implicitly decay. operator ViewT() const { return this->view_impl(); } // We can't chain the above conversion with the conversions on `ViewT` to add // const, so explicitly support adding const to produce a view here. template // NOLINTNEXTLINE(google-explicit-constructor) operator MapView() const requires(std::same_as || std::same_as) && (std::same_as || std::same_as) { return ViewT(*this); } // Convenience forwarder to the view type. template auto Contains(LookupKeyT lookup_key, KeyContextT key_context = KeyContextT()) const -> bool { return ViewT(*this).Contains(lookup_key, key_context); } // Convenience forwarder to the view type. template auto Lookup(LookupKeyT lookup_key, KeyContextT key_context = KeyContextT()) const -> LookupKVResult { return ViewT(*this).Lookup(lookup_key, key_context); } // Convenience forwarder to the view type. template auto operator[](LookupKeyT lookup_key) const -> ValueT* requires(std::default_initializable) { return ViewT(*this)[lookup_key]; } // Convenience forwarder to the view type. template void ForEach(CallbackT callback) requires(std::invocable) { return ViewT(*this).ForEach(callback); } // Convenience forwarder to the view type. auto CountProbedKeys(KeyContextT key_context = KeyContextT()) const -> ssize_t { return ViewT(*this).CountProbedKeys(key_context); } // Insert a key and value into the map. If the key is already present, the new // value is discarded and the existing value preserved. template auto Insert(LookupKeyT lookup_key, ValueT new_v, KeyContextT key_context = KeyContextT()) -> InsertKVResult; // Insert a key into the map and call the provided callback if necessary to // produce a new value when no existing value is found. // // Example: `m.Insert(key, [] { return default_value; });` // // TODO: The `;` formatting below appears to be bugs in clang-format with // concepts that should be filed upstream. template auto Insert(LookupKeyT lookup_key, ValueCallbackT value_cb, KeyContextT key_context = KeyContextT()) -> InsertKVResult requires( !std::same_as && std::convertible_to()()), ValueT>) ; // Lookup a key in the map and if missing insert it and call the provided // callback to in-place construct both the key and value. The lookup key is // passed through to the callback so it needn't be captured and can be kept in // a register argument throughout. // // Example: // ```cpp // m.Insert("widget", [](MyStringViewType lookup_key, void* key_storage, // void* value_storage) { // new (key_storage) MyStringType(lookup_key); // new (value_storage) MyValueType(....); // }); // ``` template auto Insert(LookupKeyT lookup_key, InsertCallbackT insert_cb, KeyContextT key_context = KeyContextT()) -> InsertKVResult requires(!std::same_as && std::invocable); // Replace a key's value in a map if already present or insert it if not // already present. The new value is always used. template auto Update(LookupKeyT lookup_key, ValueT new_v, KeyContextT key_context = KeyContextT()) -> InsertKVResult; // Lookup or insert a key into the map, and set it's value to the result of // the `value_cb` callback. The callback is always run and its result is // always used, whether the key was already in the map or not. Any existing // value is replaced with the result. // // Example: `m.Update(key, [] { return new_value; });` template auto Update(LookupKeyT lookup_key, ValueCallbackT value_cb, KeyContextT key_context = KeyContextT()) -> InsertKVResult requires( !std::same_as && std::convertible_to()()), ValueT>) ; // Lookup or insert a key into the map. If not already present and the key is // inserted, the `insert_cb` is used to construct the new key and value in // place. When inserting, the lookup key is passed through to the callback so // it needn't be captured and can be kept in a register argument throughout. // If the key was already present, the `update_cb` is called to update the // existing key and value as desired. // // Example of counting occurrences: // ```cpp // m.Update(item, /*insert_cb=*/[](MyStringViewType lookup_key, // void* key_storage, void* value_storage) { // new (key_storage) MyItem(lookup_key); // new (value_storage) Count(1); // }, // /*update_cb=*/[](MyItem& /*key*/, Count& count) { // ++count; // }); // ``` template auto Update(LookupKeyT lookup_key, InsertCallbackT insert_cb, UpdateCallbackT update_cb, KeyContextT key_context = KeyContextT()) -> InsertKVResult requires(!std::same_as && std::invocable && std::invocable); // Erase a key from the map. template auto Erase(LookupKeyT lookup_key, KeyContextT key_context = KeyContextT()) -> bool; // Clear all key/value pairs from the map but leave the underlying hashtable // allocated and in place. void Clear(); protected: using ImplT::ImplT; }; // A data structure mapping from key to value. // // This map also supports small size optimization (or "SSO"). The provided // `SmallSize` type parameter indicates the size of an embedded buffer for // storing maps small enough to fit. The default is zero, which always allocates // a heap buffer on construction. When non-zero, must be a multiple of the // `MaxGroupSize` which is currently 16. The library will check that the size is // valid and provide an error at compile time if not. We don't automatically // select the next multiple or otherwise fit the size to the constraints to make // it clear in the code how much memory is used by the SSO buffer. // // This data structure optimizes heavily for small key types that are cheap to // move and even copy. Using types with large keys or expensive to copy keys may // create surprising performance bottlenecks. A `std::string` key should be fine // with generally small strings, but if some or many strings are large heap // allocations the performance of hashtable routines may be unacceptably bad and // another data structure or key design is likely preferable. // // Note that this type should typically not appear on API boundaries; either // `MapBase` or `MapView` should be used instead. template class Map : public RawHashtable::TableImpl< MapBase, SmallSize> { using BaseT = MapBase; using ImplT = RawHashtable::TableImpl; public: using KeyT = typename BaseT::KeyT; using ValueT = typename BaseT::ValueT; Map() = default; Map(const Map& arg) = default; Map(Map&& arg) noexcept = default; // Reset the entire state of the hashtable to as it was when constructed, // throwing away any intervening allocations. void Reset(); }; template template auto MapView::Contains( LookupKeyT lookup_key, KeyContextT key_context) const -> bool { return this->LookupEntry(lookup_key, key_context) != nullptr; } template template auto MapView::Lookup( LookupKeyT lookup_key, KeyContextT key_context) const -> LookupKVResult { return LookupKVResult(this->LookupEntry(lookup_key, key_context)); } template template auto MapView::operator[]( LookupKeyT lookup_key) const -> ValueT* requires(std::default_initializable) { auto result = Lookup(lookup_key, KeyContextT()); return result ? &result.value() : nullptr; } template template void MapView::ForEach( CallbackT callback) requires(std::invocable) { this->ForEachEntry( [callback](EntryT& entry) { callback(entry.key(), entry.value()); }, [](auto...) {}); } template template [[clang::always_inline]] auto MapBase::Insert( LookupKeyT lookup_key, ValueT new_v, KeyContextT key_context) -> InsertKVResult { return Insert( lookup_key, [&new_v](LookupKeyT lookup_key, void* key_storage, void* value_storage) { new (key_storage) KeyT(lookup_key); new (value_storage) ValueT(std::move(new_v)); }, key_context); } template template [[clang::always_inline]] auto MapBase::Insert( LookupKeyT lookup_key, ValueCallbackT value_cb, KeyContextT key_context) -> InsertKVResult requires( !std::same_as && std::convertible_to()()), ValueT>) { return Insert( lookup_key, [&value_cb](LookupKeyT lookup_key, void* key_storage, void* value_storage) { new (key_storage) KeyT(lookup_key); new (value_storage) ValueT(value_cb()); }, key_context); } template template [[clang::always_inline]] auto MapBase::Insert( LookupKeyT lookup_key, InsertCallbackT insert_cb, KeyContextT key_context) -> InsertKVResult requires(!std::same_as && std::invocable) { auto [entry, inserted] = this->InsertImpl(lookup_key, key_context); CARBON_DCHECK(entry) << "Should always result in a valid index."; if (LLVM_LIKELY(!inserted)) { return InsertKVResult(false, *entry); } insert_cb(lookup_key, static_cast(&entry->key_storage), static_cast(&entry->value_storage)); return InsertKVResult(true, *entry); } template template [[clang::always_inline]] auto MapBase::Update( LookupKeyT lookup_key, ValueT new_v, KeyContextT key_context) -> InsertKVResult { return Update( lookup_key, [&new_v](LookupKeyT lookup_key, void* key_storage, void* value_storage) { new (key_storage) KeyT(lookup_key); new (value_storage) ValueT(std::move(new_v)); }, [&new_v](KeyT& /*key*/, ValueT& value) { value.~ValueT(); new (&value) ValueT(std::move(new_v)); }, key_context); } template template [[clang::always_inline]] auto MapBase::Update( LookupKeyT lookup_key, ValueCallbackT value_cb, KeyContextT key_context) -> InsertKVResult requires( !std::same_as && std::convertible_to()()), ValueT>) { return Update( lookup_key, [&value_cb](LookupKeyT lookup_key, void* key_storage, void* value_storage) { new (key_storage) KeyT(lookup_key); new (value_storage) ValueT(value_cb()); }, [&value_cb](KeyT& /*key*/, ValueT& value) { value.~ValueT(); new (&value) ValueT(value_cb()); }, key_context); } template template [[clang::always_inline]] auto MapBase::Update( LookupKeyT lookup_key, InsertCallbackT insert_cb, UpdateCallbackT update_cb, KeyContextT key_context) -> InsertKVResult requires(!std::same_as && std::invocable && std::invocable) { auto [entry, inserted] = this->InsertImpl(lookup_key, key_context); CARBON_DCHECK(entry) << "Should always result in a valid index."; if (LLVM_LIKELY(!inserted)) { update_cb(entry->key(), entry->value()); return InsertKVResult(false, *entry); } insert_cb(lookup_key, static_cast(&entry->key_storage), static_cast(&entry->value_storage)); return InsertKVResult(true, *entry); } template template auto MapBase::Erase( LookupKeyT lookup_key, KeyContextT key_context) -> bool { return this->EraseImpl(lookup_key, key_context); } template void MapBase::Clear() { this->ClearImpl(); } template void Map::Reset() { this->ResetImpl(); } } // namespace Carbon #endif // CARBON_COMMON_MAP_H_