123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449 |
- #pragma once
- #ifdef __GNUC__
- #pragma GCC diagnostic push
- #pragma GCC diagnostic ignored "-Wunused-parameter"
- #endif
- //===- llvm/Support/HashBuilder.h - Convenient hashing interface-*- C++ -*-===//
- //
- // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
- // See https://llvm.org/LICENSE.txt for license information.
- // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
- //
- //===----------------------------------------------------------------------===//
- //
- // This file implements an interface allowing to conveniently build hashes of
- // various data types, without relying on the underlying hasher type to know
- // about hashed data types.
- //
- //===----------------------------------------------------------------------===//
- #ifndef LLVM_SUPPORT_HASHBUILDER_H
- #define LLVM_SUPPORT_HASHBUILDER_H
- #include "llvm/ADT/ArrayRef.h"
- #include "llvm/ADT/Hashing.h"
- #include "llvm/ADT/STLExtras.h"
- #include "llvm/ADT/StringRef.h"
- #include "llvm/Support/Endian.h"
- #include "llvm/Support/type_traits.h"
- #include <iterator>
- #include <utility>
- namespace llvm {
- namespace hashbuilder_detail {
- /// Trait to indicate whether a type's bits can be hashed directly (after
- /// endianness correction).
- template <typename U>
- struct IsHashableData
- : std::integral_constant<bool, is_integral_or_enum<U>::value> {};
- } // namespace hashbuilder_detail
- /// Declares the hasher member, and functions forwarding directly to the hasher.
- template <typename HasherT> class HashBuilderBase {
- public:
- HasherT &getHasher() { return Hasher; }
- /// Forward to `HasherT::update(ArrayRef<uint8_t>)`.
- ///
- /// This may not take the size of `Data` into account.
- /// Users of this function should pay attention to respect endianness
- /// contraints.
- void update(ArrayRef<uint8_t> Data) { this->getHasher().update(Data); }
- /// Forward to `HasherT::update(ArrayRef<uint8_t>)`.
- ///
- /// This may not take the size of `Data` into account.
- /// Users of this function should pay attention to respect endianness
- /// contraints.
- void update(StringRef Data) {
- update(makeArrayRef(reinterpret_cast<const uint8_t *>(Data.data()),
- Data.size()));
- }
- /// Forward to `HasherT::final()` if available.
- template <typename HasherT_ = HasherT> StringRef final() {
- return this->getHasher().final();
- }
- /// Forward to `HasherT::result()` if available.
- template <typename HasherT_ = HasherT> StringRef result() {
- return this->getHasher().result();
- }
- protected:
- explicit HashBuilderBase(HasherT &Hasher) : Hasher(Hasher) {}
- template <typename... ArgTypes>
- explicit HashBuilderBase(ArgTypes &&...Args)
- : OptionalHasher(in_place, std::forward<ArgTypes>(Args)...),
- Hasher(*OptionalHasher) {}
- private:
- Optional<HasherT> OptionalHasher;
- HasherT &Hasher;
- };
- /// Implementation of the `HashBuilder` interface.
- ///
- /// `support::endianness::native` is not supported. `HashBuilder` is
- /// expected to canonicalize `support::endianness::native` to one of
- /// `support::endianness::big` or `support::endianness::little`.
- template <typename HasherT, support::endianness Endianness>
- class HashBuilderImpl : public HashBuilderBase<HasherT> {
- static_assert(Endianness != support::endianness::native,
- "HashBuilder should canonicalize endianness");
- public:
- explicit HashBuilderImpl(HasherT &Hasher)
- : HashBuilderBase<HasherT>(Hasher) {}
- template <typename... ArgTypes>
- explicit HashBuilderImpl(ArgTypes &&...Args)
- : HashBuilderBase<HasherT>(Args...) {}
- /// Implement hashing for hashable data types, e.g. integral or enum values.
- template <typename T>
- std::enable_if_t<hashbuilder_detail::IsHashableData<T>::value,
- HashBuilderImpl &>
- add(T Value) {
- return adjustForEndiannessAndAdd(Value);
- }
- /// Support hashing `ArrayRef`.
- ///
- /// `Value.size()` is taken into account to ensure cases like
- /// ```
- /// builder.add({1});
- /// builder.add({2, 3});
- /// ```
- /// and
- /// ```
- /// builder.add({1, 2});
- /// builder.add({3});
- /// ```
- /// do not collide.
- template <typename T> HashBuilderImpl &add(ArrayRef<T> Value) {
- // As of implementation time, simply calling `addRange(Value)` would also go
- // through the `update` fast path. But that would rely on the implementation
- // details of `ArrayRef::begin()` and `ArrayRef::end()`. Explicitly call
- // `update` to guarantee the fast path.
- add(Value.size());
- if (hashbuilder_detail::IsHashableData<T>::value &&
- Endianness == support::endian::system_endianness()) {
- this->update(
- makeArrayRef(reinterpret_cast<const uint8_t *>(Value.begin()),
- Value.size() * sizeof(T)));
- } else {
- for (auto &V : Value)
- add(V);
- }
- return *this;
- }
- /// Support hashing `StringRef`.
- ///
- /// `Value.size()` is taken into account to ensure cases like
- /// ```
- /// builder.add("a");
- /// builder.add("bc");
- /// ```
- /// and
- /// ```
- /// builder.add("ab");
- /// builder.add("c");
- /// ```
- /// do not collide.
- HashBuilderImpl &add(StringRef Value) {
- // As of implementation time, simply calling `addRange(Value)` would also go
- // through `update`. But that would rely on the implementation of
- // `StringRef::begin()` and `StringRef::end()`. Explicitly call `update` to
- // guarantee the fast path.
- add(Value.size());
- this->update(makeArrayRef(reinterpret_cast<const uint8_t *>(Value.begin()),
- Value.size()));
- return *this;
- }
- template <typename T>
- using HasAddHashT =
- decltype(addHash(std::declval<HashBuilderImpl &>(), std::declval<T &>()));
- /// Implement hashing for user-defined `struct`s.
- ///
- /// Any user-define `struct` can participate in hashing via `HashBuilder` by
- /// providing a `addHash` templated function.
- ///
- /// ```
- /// template <typename HasherT, support::endianness Endianness>
- /// void addHash(HashBuilder<HasherT, Endianness> &HBuilder,
- /// const UserDefinedStruct &Value);
- /// ```
- ///
- /// For example:
- /// ```
- /// struct SimpleStruct {
- /// char c;
- /// int i;
- /// };
- ///
- /// template <typename HasherT, support::endianness Endianness>
- /// void addHash(HashBuilderImpl<HasherT, Endianness> &HBuilder,
- /// const SimpleStruct &Value) {
- /// HBuilder.add(Value.c);
- /// HBuilder.add(Value.i);
- /// }
- /// ```
- ///
- /// To avoid endianness issues, specializations of `addHash` should
- /// generally rely on exising `add`, `addRange`, and `addRangeElements`
- /// functions. If directly using `update`, an implementation must correctly
- /// handle endianness.
- ///
- /// ```
- /// struct __attribute__ ((packed)) StructWithFastHash {
- /// int I;
- /// char C;
- ///
- /// // If possible, we want to hash both `I` and `C` in a single
- /// // `update` call for performance concerns.
- /// template <typename HasherT, support::endianness Endianness>
- /// friend void addHash(HashBuilderImpl<HasherT, Endianness> &HBuilder,
- /// const StructWithFastHash &Value) {
- /// if (Endianness == support::endian::system_endianness()) {
- /// HBuilder.update(makeArrayRef(
- /// reinterpret_cast<const uint8_t *>(&Value), sizeof(Value)));
- /// } else {
- /// // Rely on existing `add` methods to handle endianness.
- /// HBuilder.add(Value.I);
- /// HBuilder.add(Value.C);
- /// }
- /// }
- /// };
- /// ```
- ///
- /// To avoid collisions, specialization of `addHash` for variable-size
- /// types must take the size into account.
- ///
- /// For example:
- /// ```
- /// struct CustomContainer {
- /// private:
- /// size_t Size;
- /// int Elements[100];
- ///
- /// public:
- /// CustomContainer(size_t Size) : Size(Size) {
- /// for (size_t I = 0; I != Size; ++I)
- /// Elements[I] = I;
- /// }
- /// template <typename HasherT, support::endianness Endianness>
- /// friend void addHash(HashBuilderImpl<HasherT, Endianness> &HBuilder,
- /// const CustomContainer &Value) {
- /// if (Endianness == support::endian::system_endianness()) {
- /// HBuilder.update(makeArrayRef(
- /// reinterpret_cast<const uint8_t *>(&Value.Size),
- /// sizeof(Value.Size) + Value.Size * sizeof(Value.Elements[0])));
- /// } else {
- /// // `addRange` will take care of encoding the size.
- /// HBuilder.addRange(&Value.Elements[0], &Value.Elements[0] +
- /// Value.Size);
- /// }
- /// }
- /// };
- /// ```
- template <typename T>
- std::enable_if_t<is_detected<HasAddHashT, T>::value &&
- !hashbuilder_detail::IsHashableData<T>::value,
- HashBuilderImpl &>
- add(const T &Value) {
- addHash(*this, Value);
- return *this;
- }
- template <typename T1, typename T2>
- HashBuilderImpl &add(const std::pair<T1, T2> &Value) {
- add(Value.first);
- add(Value.second);
- return *this;
- }
- template <typename... Ts> HashBuilderImpl &add(const std::tuple<Ts...> &Arg) {
- return addTupleHelper(Arg, typename std::index_sequence_for<Ts...>());
- }
- /// A convenenience variadic helper.
- /// It simply iterates over its arguments, in order.
- /// ```
- /// add(Arg1, Arg2);
- /// ```
- /// is equivalent to
- /// ```
- /// add(Arg1)
- /// add(Arg2)
- /// ```
- template <typename T, typename... Ts>
- typename std::enable_if<(sizeof...(Ts) >= 1), HashBuilderImpl &>::type
- add(const T &FirstArg, const Ts &...Args) {
- add(FirstArg);
- add(Args...);
- return *this;
- }
- template <typename ForwardIteratorT>
- HashBuilderImpl &addRange(ForwardIteratorT First, ForwardIteratorT Last) {
- add(std::distance(First, Last));
- return addRangeElements(First, Last);
- }
- template <typename RangeT> HashBuilderImpl &addRange(const RangeT &Range) {
- return addRange(adl_begin(Range), adl_end(Range));
- }
- template <typename ForwardIteratorT>
- HashBuilderImpl &addRangeElements(ForwardIteratorT First,
- ForwardIteratorT Last) {
- return addRangeElementsImpl(
- First, Last,
- typename std::iterator_traits<ForwardIteratorT>::iterator_category());
- }
- template <typename RangeT>
- HashBuilderImpl &addRangeElements(const RangeT &Range) {
- return addRangeElements(adl_begin(Range), adl_end(Range));
- }
- template <typename T>
- using HasByteSwapT = decltype(support::endian::byte_swap(
- std::declval<T &>(), support::endianness::little));
- /// Adjust `Value` for the target endianness and add it to the hash.
- template <typename T>
- std::enable_if_t<is_detected<HasByteSwapT, T>::value, HashBuilderImpl &>
- adjustForEndiannessAndAdd(const T &Value) {
- T SwappedValue = support::endian::byte_swap(Value, Endianness);
- this->update(makeArrayRef(reinterpret_cast<const uint8_t *>(&SwappedValue),
- sizeof(SwappedValue)));
- return *this;
- }
- private:
- template <typename... Ts, std::size_t... Indices>
- HashBuilderImpl &addTupleHelper(const std::tuple<Ts...> &Arg,
- std::index_sequence<Indices...>) {
- add(std::get<Indices>(Arg)...);
- return *this;
- }
- // FIXME: Once available, specialize this function for `contiguous_iterator`s,
- // and use it for `ArrayRef` and `StringRef`.
- template <typename ForwardIteratorT>
- HashBuilderImpl &addRangeElementsImpl(ForwardIteratorT First,
- ForwardIteratorT Last,
- std::forward_iterator_tag) {
- for (auto It = First; It != Last; ++It)
- add(*It);
- return *this;
- }
- template <typename T>
- std::enable_if_t<hashbuilder_detail::IsHashableData<T>::value &&
- Endianness == support::endian::system_endianness(),
- HashBuilderImpl &>
- addRangeElementsImpl(T *First, T *Last, std::forward_iterator_tag) {
- this->update(makeArrayRef(reinterpret_cast<const uint8_t *>(First),
- (Last - First) * sizeof(T)));
- return *this;
- }
- };
- /// Interface to help hash various types through a hasher type.
- ///
- /// Via provided specializations of `add`, `addRange`, and `addRangeElements`
- /// functions, various types (e.g. `ArrayRef`, `StringRef`, etc.) can be hashed
- /// without requiring any knowledge of hashed types from the hasher type.
- ///
- /// The only method expected from the templated hasher type `HasherT` is:
- /// * void update(ArrayRef<uint8_t> Data)
- ///
- /// Additionally, the following methods will be forwarded to the hasher type:
- /// * decltype(std::declval<HasherT &>().final()) final()
- /// * decltype(std::declval<HasherT &>().result()) result()
- ///
- /// From a user point of view, the interface provides the following:
- /// * `template<typename T> add(const T &Value)`
- /// The `add` function implements hashing of various types.
- /// * `template <typename ItT> void addRange(ItT First, ItT Last)`
- /// The `addRange` function is designed to aid hashing a range of values.
- /// It explicitly adds the size of the range in the hash.
- /// * `template <typename ItT> void addRangeElements(ItT First, ItT Last)`
- /// The `addRangeElements` function is also designed to aid hashing a range of
- /// values. In contrast to `addRange`, it **ignores** the size of the range,
- /// behaving as if elements were added one at a time with `add`.
- ///
- /// User-defined `struct` types can participate in this interface by providing
- /// an `addHash` templated function. See the associated template specialization
- /// for details.
- ///
- /// This interface does not impose requirements on the hasher
- /// `update(ArrayRef<uint8_t> Data)` method. We want to avoid collisions for
- /// variable-size types; for example for
- /// ```
- /// builder.add({1});
- /// builder.add({2, 3});
- /// ```
- /// and
- /// ```
- /// builder.add({1, 2});
- /// builder.add({3});
- /// ```
- /// . Thus, specializations of `add` and `addHash` for variable-size types must
- /// not assume that the hasher type considers the size as part of the hash; they
- /// must explicitly add the size to the hash. See for example specializations
- /// for `ArrayRef` and `StringRef`.
- ///
- /// Additionally, since types are eventually forwarded to the hasher's
- /// `void update(ArrayRef<uint8_t>)` method, endianness plays a role in the hash
- /// computation (for example when computing `add((int)123)`).
- /// Specifiying a non-`native` `Endianness` template parameter allows to compute
- /// stable hash across platforms with different endianness.
- template <class HasherT, support::endianness Endianness>
- using HashBuilder =
- HashBuilderImpl<HasherT, (Endianness == support::endianness::native
- ? support::endian::system_endianness()
- : Endianness)>;
- namespace hashbuilder_detail {
- class HashCodeHasher {
- public:
- HashCodeHasher() : Code(0) {}
- void update(ArrayRef<uint8_t> Data) {
- hash_code DataCode = hash_value(Data);
- Code = hash_combine(Code, DataCode);
- }
- hash_code Code;
- };
- using HashCodeHashBuilder = HashBuilder<hashbuilder_detail::HashCodeHasher,
- support::endianness::native>;
- } // namespace hashbuilder_detail
- /// Provide a default implementation of `hash_value` when `addHash(const T &)`
- /// is supported.
- template <typename T>
- std::enable_if_t<
- is_detected<hashbuilder_detail::HashCodeHashBuilder::HasAddHashT, T>::value,
- hash_code>
- hash_value(const T &Value) {
- hashbuilder_detail::HashCodeHashBuilder HBuilder;
- HBuilder.add(Value);
- return HBuilder.getHasher().Code;
- }
- } // end namespace llvm
- #endif // LLVM_SUPPORT_HASHBUILDER_H
- #ifdef __GNUC__
- #pragma GCC diagnostic pop
- #endif
|