| 1 | //===--- SymbolID.h ----------------------------------------------*- C++-*-===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | |
| 9 | #ifndef LLVM_CLANG_TOOLS_EXTRA_CLANGD_INDEX_SYMBOLID_H |
| 10 | #define |
| 11 | |
| 12 | #include "llvm/ADT/Hashing.h" |
| 13 | #include "llvm/ADT/StringRef.h" |
| 14 | #include "llvm/Support/Error.h" |
| 15 | #include "llvm/Support/raw_ostream.h" |
| 16 | #include <array> |
| 17 | #include <cstddef> |
| 18 | #include <cstdint> |
| 19 | #include <string> |
| 20 | |
| 21 | namespace clang { |
| 22 | namespace clangd { |
| 23 | |
| 24 | // The class identifies a particular C++ symbol (class, function, method, etc). |
| 25 | // |
| 26 | // As USRs (Unified Symbol Resolution) could be large, especially for functions |
| 27 | // with long type arguments, SymbolID is using truncated SHA1(USR) values to |
| 28 | // guarantee the uniqueness of symbols while using a relatively small amount of |
| 29 | // memory (vs storing USRs directly). |
| 30 | // |
| 31 | // SymbolID can be used as key in the symbol indexes to lookup the symbol. |
| 32 | class SymbolID { |
| 33 | public: |
| 34 | SymbolID() = default; |
| 35 | explicit SymbolID(llvm::StringRef USR); |
| 36 | |
| 37 | bool operator==(const SymbolID &Sym) const { |
| 38 | return HashValue == Sym.HashValue; |
| 39 | } |
| 40 | bool operator!=(const SymbolID &Sym) const { return !(*this == Sym); } |
| 41 | bool operator<(const SymbolID &Sym) const { |
| 42 | // Avoid lexicographic compare which requires swapping bytes or even memcmp! |
| 43 | return llvm::bit_cast<IntTy>(from: HashValue) < |
| 44 | llvm::bit_cast<IntTy>(from: Sym.HashValue); |
| 45 | } |
| 46 | |
| 47 | // The stored hash is truncated to RawSize bytes. |
| 48 | // This trades off memory against the number of symbols we can handle. |
| 49 | constexpr static size_t RawSize = 8; |
| 50 | llvm::StringRef raw() const; |
| 51 | static SymbolID fromRaw(llvm::StringRef); |
| 52 | |
| 53 | // Returns a hex encoded string. |
| 54 | std::string str() const; |
| 55 | static llvm::Expected<SymbolID> fromStr(llvm::StringRef); |
| 56 | |
| 57 | bool isNull() const { return *this == SymbolID(); } |
| 58 | explicit operator bool() const { return !isNull(); } |
| 59 | |
| 60 | private: |
| 61 | using IntTy = uint64_t; |
| 62 | static_assert(sizeof(IntTy) == RawSize); |
| 63 | std::array<uint8_t, RawSize> HashValue{}; |
| 64 | }; |
| 65 | |
| 66 | inline llvm::hash_code hash_value(const SymbolID &ID) { |
| 67 | // We already have a good hash, just return the first bytes. |
| 68 | static_assert(sizeof(size_t) <= SymbolID::RawSize, |
| 69 | "size_t longer than SHA1!" ); |
| 70 | size_t Result; |
| 71 | memcpy(dest: &Result, src: ID.raw().data(), n: sizeof(size_t)); |
| 72 | return llvm::hash_code(Result); |
| 73 | } |
| 74 | |
| 75 | // Write SymbolID into the given stream. SymbolID is encoded as ID.str(). |
| 76 | llvm::raw_ostream &operator<<(llvm::raw_ostream &OS, const SymbolID &ID); |
| 77 | |
| 78 | } // namespace clangd |
| 79 | } // namespace clang |
| 80 | |
| 81 | namespace llvm { |
| 82 | // Support SymbolIDs as DenseMap keys. |
| 83 | template <> struct DenseMapInfo<clang::clangd::SymbolID> { |
| 84 | static inline clang::clangd::SymbolID getEmptyKey() { |
| 85 | static clang::clangd::SymbolID EmptyKey("EMPTYKEY" ); |
| 86 | return EmptyKey; |
| 87 | } |
| 88 | static inline clang::clangd::SymbolID getTombstoneKey() { |
| 89 | static clang::clangd::SymbolID TombstoneKey("TOMBSTONEKEY" ); |
| 90 | return TombstoneKey; |
| 91 | } |
| 92 | static unsigned getHashValue(const clang::clangd::SymbolID &Sym) { |
| 93 | return hash_value(ID: Sym); |
| 94 | } |
| 95 | static bool isEqual(const clang::clangd::SymbolID &LHS, |
| 96 | const clang::clangd::SymbolID &RHS) { |
| 97 | return LHS == RHS; |
| 98 | } |
| 99 | }; |
| 100 | } // namespace llvm |
| 101 | |
| 102 | #endif // LLVM_CLANG_TOOLS_EXTRA_CLANGD_INDEX_SYMBOLID_H |
| 103 | |