| 1 | //===--- Ref.h ---------------------------------------------------*- C++-*-===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | |
| 9 | #ifndef LLVM_CLANG_TOOLS_EXTRA_CLANGD_INDEX_REF_H |
| 10 | #define |
| 11 | |
| 12 | #include "index/SymbolID.h" |
| 13 | #include "index/SymbolLocation.h" |
| 14 | #include "llvm/ADT/Hashing.h" |
| 15 | #include "llvm/Support/Allocator.h" |
| 16 | #include "llvm/Support/StringSaver.h" |
| 17 | #include "llvm/Support/raw_ostream.h" |
| 18 | #include <cstdint> |
| 19 | #include <set> |
| 20 | #include <utility> |
| 21 | |
| 22 | namespace clang { |
| 23 | namespace clangd { |
| 24 | |
| 25 | /// Describes the kind of a cross-reference. |
| 26 | /// |
| 27 | /// This is a bitfield which can be combined from different kinds. |
| 28 | enum class RefKind : uint8_t { |
| 29 | Unknown = 0, |
| 30 | // Points to symbol declaration. Example: |
| 31 | // |
| 32 | // class Foo; |
| 33 | // ^ Foo declaration |
| 34 | // Foo foo; |
| 35 | // ^ this does not reference Foo declaration |
| 36 | Declaration = 1 << 0, |
| 37 | // Points to symbol definition. Example: |
| 38 | // |
| 39 | // int foo(); |
| 40 | // ^ references foo declaration, but not foo definition |
| 41 | // int foo() { return 42; } |
| 42 | // ^ references foo definition, but not declaration |
| 43 | // bool bar() { return true; } |
| 44 | // ^ references both definition and declaration |
| 45 | Definition = 1 << 1, |
| 46 | // Points to symbol reference. Example: |
| 47 | // |
| 48 | // int Foo = 42; |
| 49 | // int Bar = Foo + 1; |
| 50 | // ^ this is a reference to Foo |
| 51 | Reference = 1 << 2, |
| 52 | // The reference explicitly spells out declaration's name. Such references can |
| 53 | // not come from macro expansions or implicit AST nodes. |
| 54 | // |
| 55 | // class Foo { public: Foo() {} }; |
| 56 | // ^ references declaration, definition and explicitly spells out name |
| 57 | // #define MACRO Foo |
| 58 | // v there is an implicit constructor call here which is not a spelled ref |
| 59 | // Foo foo; |
| 60 | // ^ this reference explicitly spells out Foo's name |
| 61 | // struct Bar { |
| 62 | // MACRO Internal; |
| 63 | // ^ this references Foo, but does not explicitly spell out its name |
| 64 | // }; |
| 65 | Spelled = 1 << 3, |
| 66 | // A reference which is a call. Used as a filter for which references |
| 67 | // to store in data structures used for computing outgoing calls. |
| 68 | Call = 1 << 4, |
| 69 | All = Declaration | Definition | Reference | Spelled, |
| 70 | }; |
| 71 | |
| 72 | inline RefKind operator|(RefKind L, RefKind R) { |
| 73 | return static_cast<RefKind>(static_cast<uint8_t>(L) | |
| 74 | static_cast<uint8_t>(R)); |
| 75 | } |
| 76 | inline RefKind &operator|=(RefKind &L, RefKind R) { return L = L | R; } |
| 77 | inline RefKind operator&(RefKind A, RefKind B) { |
| 78 | return static_cast<RefKind>(static_cast<uint8_t>(A) & |
| 79 | static_cast<uint8_t>(B)); |
| 80 | } |
| 81 | |
| 82 | llvm::raw_ostream &operator<<(llvm::raw_ostream &, RefKind); |
| 83 | |
| 84 | /// Represents a symbol occurrence in the source file. |
| 85 | /// Despite the name, it could be a declaration/definition/reference. |
| 86 | /// |
| 87 | /// WARNING: Location does not own the underlying data - Copies are shallow. |
| 88 | struct Ref { |
| 89 | /// The source location where the symbol is named. |
| 90 | SymbolLocation Location; |
| 91 | RefKind Kind = RefKind::Unknown; |
| 92 | /// The ID of the symbol whose definition contains this reference. |
| 93 | /// For example, for a reference inside a function body, this would |
| 94 | /// be that function. For top-level definitions this isNull(). |
| 95 | SymbolID Container; |
| 96 | }; |
| 97 | |
| 98 | inline bool operator<(const Ref &L, const Ref &R) { |
| 99 | return std::tie(args: L.Location, args: L.Kind, args: L.Container) < |
| 100 | std::tie(args: R.Location, args: R.Kind, args: R.Container); |
| 101 | } |
| 102 | inline bool operator==(const Ref &L, const Ref &R) { |
| 103 | return std::tie(args: L.Location, args: L.Kind, args: L.Container) == |
| 104 | std::tie(args: R.Location, args: R.Kind, args: R.Container); |
| 105 | } |
| 106 | |
| 107 | llvm::raw_ostream &operator<<(llvm::raw_ostream &, const Ref &); |
| 108 | |
| 109 | /// An efficient structure of storing large set of symbol references in memory. |
| 110 | /// Filenames are deduplicated. |
| 111 | class RefSlab { |
| 112 | public: |
| 113 | // Refs are stored in order. |
| 114 | using value_type = std::pair<SymbolID, llvm::ArrayRef<Ref>>; |
| 115 | using const_iterator = std::vector<value_type>::const_iterator; |
| 116 | using iterator = const_iterator; |
| 117 | |
| 118 | RefSlab() = default; |
| 119 | RefSlab(RefSlab &&Slab) = default; |
| 120 | RefSlab &operator=(RefSlab &&RHS) = default; |
| 121 | |
| 122 | const_iterator begin() const { return Refs.begin(); } |
| 123 | const_iterator end() const { return Refs.end(); } |
| 124 | /// Gets the number of symbols. |
| 125 | size_t size() const { return Refs.size(); } |
| 126 | size_t numRefs() const { return NumRefs; } |
| 127 | bool empty() const { return Refs.empty(); } |
| 128 | |
| 129 | size_t bytes() const { |
| 130 | return sizeof(*this) + Arena.getTotalMemory() + |
| 131 | sizeof(value_type) * Refs.capacity(); |
| 132 | } |
| 133 | |
| 134 | /// RefSlab::Builder is a mutable container that can 'freeze' to RefSlab. |
| 135 | class Builder { |
| 136 | public: |
| 137 | Builder() : UniqueStrings(Arena) {} |
| 138 | /// Adds a ref to the slab. Deep copy: Strings will be owned by the slab. |
| 139 | void insert(const SymbolID &ID, const Ref &S); |
| 140 | /// Consumes the builder to finalize the slab. |
| 141 | RefSlab build() &&; |
| 142 | |
| 143 | private: |
| 144 | // A ref we're storing with its symbol to consume with build(). |
| 145 | // All strings are interned, so DenseMapInfo can use pointer comparisons. |
| 146 | struct Entry { |
| 147 | SymbolID Symbol; |
| 148 | Ref Reference; |
| 149 | }; |
| 150 | friend struct llvm::DenseMapInfo<Entry>; |
| 151 | |
| 152 | llvm::BumpPtrAllocator Arena; |
| 153 | llvm::UniqueStringSaver UniqueStrings; // Contents on the arena. |
| 154 | llvm::DenseSet<Entry> Entries; |
| 155 | }; |
| 156 | |
| 157 | private: |
| 158 | RefSlab(std::vector<value_type> Refs, llvm::BumpPtrAllocator Arena, |
| 159 | size_t NumRefs) |
| 160 | : Arena(std::move(Arena)), Refs(std::move(Refs)), NumRefs(NumRefs) {} |
| 161 | |
| 162 | llvm::BumpPtrAllocator Arena; |
| 163 | std::vector<value_type> Refs; |
| 164 | /// Number of all references. |
| 165 | size_t NumRefs = 0; |
| 166 | }; |
| 167 | |
| 168 | } // namespace clangd |
| 169 | } // namespace clang |
| 170 | |
| 171 | namespace llvm { |
| 172 | template <> struct DenseMapInfo<clang::clangd::RefSlab::Builder::Entry> { |
| 173 | using Entry = clang::clangd::RefSlab::Builder::Entry; |
| 174 | static inline Entry getEmptyKey() { |
| 175 | static Entry E{.Symbol: clang::clangd::SymbolID("" ), .Reference: {}}; |
| 176 | return E; |
| 177 | } |
| 178 | static inline Entry getTombstoneKey() { |
| 179 | static Entry E{.Symbol: clang::clangd::SymbolID("TOMBSTONE" ), .Reference: {}}; |
| 180 | return E; |
| 181 | } |
| 182 | static unsigned getHashValue(const Entry &Val) { |
| 183 | return llvm::hash_combine( |
| 184 | args: Val.Symbol, args: reinterpret_cast<uintptr_t>(Val.Reference.Location.FileURI), |
| 185 | args: Val.Reference.Location.Start.rep(), args: Val.Reference.Location.End.rep()); |
| 186 | } |
| 187 | static bool isEqual(const Entry &LHS, const Entry &RHS) { |
| 188 | return std::tie(args: LHS.Symbol, args: LHS.Reference.Location.FileURI, |
| 189 | args: LHS.Reference.Kind) == |
| 190 | std::tie(args: RHS.Symbol, args: RHS.Reference.Location.FileURI, |
| 191 | args: RHS.Reference.Kind) && |
| 192 | LHS.Reference.Location.Start == RHS.Reference.Location.Start && |
| 193 | LHS.Reference.Location.End == RHS.Reference.Location.End; |
| 194 | } |
| 195 | }; |
| 196 | } // namespace llvm |
| 197 | |
| 198 | #endif // LLVM_CLANG_TOOLS_EXTRA_CLANGD_INDEX_REF_H |
| 199 | |