1 | //===--- CrossTranslationUnit.h - -------------------------------*- C++ -*-===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | // |
9 | // This file provides an interface to load binary AST dumps on demand. This |
10 | // feature can be utilized for tools that require cross translation unit |
11 | // support. |
12 | // |
13 | //===----------------------------------------------------------------------===// |
14 | #ifndef LLVM_CLANG_CROSSTU_CROSSTRANSLATIONUNIT_H |
15 | #define LLVM_CLANG_CROSSTU_CROSSTRANSLATIONUNIT_H |
16 | |
17 | #include "clang/AST/ASTImporterSharedState.h" |
18 | #include "clang/Analysis/MacroExpansionContext.h" |
19 | #include "clang/Basic/LLVM.h" |
20 | #include "llvm/ADT/DenseMap.h" |
21 | #include "llvm/ADT/SmallPtrSet.h" |
22 | #include "llvm/ADT/StringMap.h" |
23 | #include "llvm/Support/Error.h" |
24 | #include "llvm/Support/Path.h" |
25 | #include <optional> |
26 | |
27 | namespace clang { |
28 | class CompilerInstance; |
29 | class ASTContext; |
30 | class ASTImporter; |
31 | class ASTUnit; |
32 | class DeclContext; |
33 | class FunctionDecl; |
34 | class VarDecl; |
35 | class NamedDecl; |
36 | class TranslationUnitDecl; |
37 | |
38 | namespace cross_tu { |
39 | |
/// Error codes reported through IndexError by the cross translation unit
/// facilities.
///
/// The numeric values are spelled out explicitly; they are consecutive and
/// start with \c success at zero.
enum class index_error_code {
  success = 0,
  unspecified = 1,
  missing_index_file = 2,
  invalid_index_format = 3,
  multiple_definitions = 4,
  missing_definition = 5,
  failed_import = 6,
  failed_to_get_external_ast = 7,
  failed_to_generate_usr = 8,
  triple_mismatch = 9,
  lang_mismatch = 10,
  lang_dialect_mismatch = 11,
  load_threshold_reached = 12,
  invocation_list_ambiguous = 13,
  invocation_list_file_not_found = 14,
  invocation_list_empty = 15,
  invocation_list_wrong_format = 16,
  invocation_list_lookup_unsuccessful = 17
};
60 | |
61 | class IndexError : public llvm::ErrorInfo<IndexError> { |
62 | public: |
63 | static char ID; |
64 | IndexError(index_error_code C) : Code(C), LineNo(0) {} |
65 | IndexError(index_error_code C, std::string FileName, int LineNo = 0) |
66 | : Code(C), FileName(std::move(FileName)), LineNo(LineNo) {} |
67 | IndexError(index_error_code C, std::string FileName, std::string TripleToName, |
68 | std::string TripleFromName) |
69 | : Code(C), FileName(std::move(FileName)), |
70 | TripleToName(std::move(TripleToName)), |
71 | TripleFromName(std::move(TripleFromName)) {} |
72 | void log(raw_ostream &OS) const override; |
73 | std::error_code convertToErrorCode() const override; |
74 | index_error_code getCode() const { return Code; } |
75 | int getLineNum() const { return LineNo; } |
76 | std::string getFileName() const { return FileName; } |
77 | std::string getTripleToName() const { return TripleToName; } |
78 | std::string getTripleFromName() const { return TripleFromName; } |
79 | |
80 | private: |
81 | index_error_code Code; |
82 | std::string FileName; |
83 | int LineNo; |
84 | std::string TripleToName; |
85 | std::string TripleFromName; |
86 | }; |
87 | |
/// This function parses an index file that determines which
/// translation unit contains which definition. The \p IndexPath is not
/// prefixed with CTUDir, so an absolute path is expected for consistent
/// results.
///
/// The index file format is the following:
/// each line consists of a USR and a filepath separated by a space.
///
/// \param IndexPath Path of the index file to parse.
///
/// \return Returns a map where the USR is the key and the filepath is the
/// value, or an error.
llvm::Expected<llvm::StringMap<std::string>>
parseCrossTUIndex(StringRef IndexPath);
99 | |
/// Produces a string from the entries of \p Index.
/// NOTE(review): presumably this is the textual index form accepted by
/// parseCrossTUIndex (a USR and a filepath per line) -- confirm against the
/// definition, which is not part of this header.
std::string createCrossTUIndexString(const llvm::StringMap<std::string> &Index);
101 | |
/// Result type of parseInvocationList: a map from a string key to a list of
/// strings. As described for parseInvocationList, the key is a source file
/// path and the value holds the command-line parts of its invocation.
using InvocationListTy = llvm::StringMap<llvm::SmallVector<std::string, 32>>;
/// Parse the YAML formatted invocation list file content \p FileContent.
/// The format is expected to be a mapping from absolute source file
/// paths in the filesystem to a list of command-line parts, which
/// constitute the invocation needed to compile that file. That invocation
/// will be used to produce the AST of the TU.
///
/// \param FileContent The content of the invocation list file.
/// \param PathStyle The path style to use; defaults to posix.
/// NOTE(review): presumably applied to the source file paths used as keys --
/// confirm against the definition.
///
/// \return The parsed invocation list or an error.
llvm::Expected<InvocationListTy> parseInvocationList(
    StringRef FileContent,
    llvm::sys::path::Style PathStyle = llvm::sys::path::Style::posix);
111 | |
/// Returns true if it makes sense to import a foreign variable definition.
/// For instance, we don't want to import variables that have non-trivial types
/// because the constructor might have side-effects.
///
/// \param VD The variable declaration considered for import.
/// \param ACtx An AST context. NOTE(review): presumably the context used to
/// inspect the type of \p VD -- confirm against the definition.
bool shouldImport(const VarDecl *VD, const ASTContext &ACtx);
116 | |
117 | /// This class is used for tools that requires cross translation |
118 | /// unit capability. |
119 | /// |
120 | /// This class can load definitions from external AST sources. |
121 | /// The loaded definition will be merged back to the original AST using the |
122 | /// AST Importer. |
123 | /// In order to use this class, an index file is required that describes |
124 | /// the locations of the AST files for each definition. |
125 | /// |
126 | /// Note that this class also implements caching. |
127 | class CrossTranslationUnitContext { |
128 | public: |
129 | CrossTranslationUnitContext(CompilerInstance &CI); |
130 | ~CrossTranslationUnitContext(); |
131 | |
132 | /// This function loads a function or variable definition from an |
133 | /// external AST file and merges it into the original AST. |
134 | /// |
135 | /// This method should only be used on functions that have no definitions or |
136 | /// variables that have no initializer in |
137 | /// the current translation unit. A function definition with the same |
138 | /// declaration will be looked up in the index file which should be in the |
139 | /// \p CrossTUDir directory, called \p IndexName. In case the declaration is |
140 | /// found in the index the corresponding AST will be loaded and the |
141 | /// definition will be merged into the original AST using the AST Importer. |
142 | /// |
143 | /// \return The declaration with the definition will be returned. |
144 | /// If no suitable definition is found in the index file or multiple |
145 | /// definitions found error will be returned. |
146 | /// |
147 | /// Note that the AST files should also be in the \p CrossTUDir. |
148 | llvm::Expected<const FunctionDecl *> |
149 | getCrossTUDefinition(const FunctionDecl *FD, StringRef CrossTUDir, |
150 | StringRef IndexName, bool DisplayCTUProgress = false); |
151 | llvm::Expected<const VarDecl *> |
152 | getCrossTUDefinition(const VarDecl *VD, StringRef CrossTUDir, |
153 | StringRef IndexName, bool DisplayCTUProgress = false); |
154 | |
155 | /// This function loads a definition from an external AST file. |
156 | /// |
157 | /// A definition with the same declaration will be looked up in the |
158 | /// index file which should be in the \p CrossTUDir directory, called |
159 | /// \p IndexName. In case the declaration is found in the index the |
160 | /// corresponding AST will be loaded. If the number of TUs imported |
161 | /// reaches \p CTULoadTreshold, no loading is performed. |
162 | /// |
163 | /// \return Returns a pointer to the ASTUnit that contains the definition of |
164 | /// the looked up name or an Error. |
165 | /// The returned pointer is never a nullptr. |
166 | /// |
167 | /// Note that the AST files should also be in the \p CrossTUDir. |
168 | llvm::Expected<ASTUnit *> loadExternalAST(StringRef LookupName, |
169 | StringRef CrossTUDir, |
170 | StringRef IndexName, |
171 | bool DisplayCTUProgress = false); |
172 | |
173 | /// This function merges a definition from a separate AST Unit into |
174 | /// the current one which was created by the compiler instance that |
175 | /// was passed to the constructor. |
176 | /// |
177 | /// \return Returns the resulting definition or an error. |
178 | llvm::Expected<const FunctionDecl *> importDefinition(const FunctionDecl *FD, |
179 | ASTUnit *Unit); |
180 | llvm::Expected<const VarDecl *> importDefinition(const VarDecl *VD, |
181 | ASTUnit *Unit); |
182 | |
183 | /// Get a name to identify a named decl. |
184 | static std::optional<std::string> getLookupName(const NamedDecl *ND); |
185 | |
186 | /// Emit diagnostics for the user for potential configuration errors. |
187 | void emitCrossTUDiagnostics(const IndexError &IE); |
188 | |
189 | /// Returns the MacroExpansionContext for the imported TU to which the given |
190 | /// source-location corresponds. |
191 | /// \p ToLoc Source location in the imported-to AST. |
192 | /// \note If any error happens such as \p ToLoc is a non-imported |
193 | /// source-location, empty is returned. |
194 | /// \note Macro expansion tracking for imported TUs is not implemented yet. |
195 | /// It returns empty unconditionally. |
196 | std::optional<clang::MacroExpansionContext> |
197 | getMacroExpansionContextForSourceLocation( |
198 | const clang::SourceLocation &ToLoc) const; |
199 | |
200 | /// Returns true if the given Decl is newly created during the import. |
201 | bool isImportedAsNew(const Decl *ToDecl) const; |
202 | |
203 | /// Returns true if the given Decl is mapped (or created) during an import |
204 | /// but there was an unrecoverable error (the AST node cannot be erased, it |
205 | /// is marked with an Error object in this case). |
206 | bool hasError(const Decl *ToDecl) const; |
207 | |
208 | private: |
209 | void lazyInitImporterSharedSt(TranslationUnitDecl *ToTU); |
210 | ASTImporter &getOrCreateASTImporter(ASTUnit *Unit); |
211 | template <typename T> |
212 | llvm::Expected<const T *> getCrossTUDefinitionImpl(const T *D, |
213 | StringRef CrossTUDir, |
214 | StringRef IndexName, |
215 | bool DisplayCTUProgress); |
216 | template <typename T> |
217 | const T *findDefInDeclContext(const DeclContext *DC, |
218 | StringRef LookupName); |
219 | template <typename T> |
220 | llvm::Expected<const T *> importDefinitionImpl(const T *D, ASTUnit *Unit); |
221 | |
222 | using ImporterMapTy = |
223 | llvm::DenseMap<TranslationUnitDecl *, std::unique_ptr<ASTImporter>>; |
224 | |
225 | ImporterMapTy ASTUnitImporterMap; |
226 | |
227 | ASTContext &Context; |
228 | std::shared_ptr<ASTImporterSharedState> ImporterSharedSt; |
229 | |
230 | using LoadResultTy = llvm::Expected<std::unique_ptr<ASTUnit>>; |
231 | |
232 | /// Loads ASTUnits from AST-dumps or source-files. |
233 | class ASTLoader { |
234 | public: |
235 | ASTLoader(CompilerInstance &CI, StringRef CTUDir, |
236 | StringRef InvocationListFilePath); |
237 | |
238 | /// Load the ASTUnit by its identifier found in the index file. If the |
239 | /// identifier is suffixed with '.ast' it is considered a dump. Otherwise |
240 | /// it is treated as source-file, and on-demand parsed. Relative paths are |
241 | /// prefixed with CTUDir. |
242 | LoadResultTy load(StringRef Identifier); |
243 | |
244 | /// Lazily initialize the invocation list information, which is needed for |
245 | /// on-demand parsing. |
246 | llvm::Error lazyInitInvocationList(); |
247 | |
248 | private: |
249 | /// The style used for storage and lookup of filesystem paths. |
250 | /// Defaults to posix. |
251 | const llvm::sys::path::Style PathStyle = llvm::sys::path::Style::posix; |
252 | |
253 | /// Loads an AST from a pch-dump. |
254 | LoadResultTy loadFromDump(StringRef Identifier); |
255 | /// Loads an AST from a source-file. |
256 | LoadResultTy loadFromSource(StringRef Identifier); |
257 | |
258 | CompilerInstance &CI; |
259 | StringRef CTUDir; |
260 | /// The path to the file containing the invocation list, which is in YAML |
261 | /// format, and contains a mapping from source files to compiler invocations |
262 | /// that produce the AST used for analysis. |
263 | StringRef InvocationListFilePath; |
264 | /// In case of on-demand parsing, the invocations for parsing the source |
265 | /// files is stored. |
266 | std::optional<InvocationListTy> InvocationList; |
267 | index_error_code PreviousParsingResult = index_error_code::success; |
268 | }; |
269 | |
270 | /// Maintain number of AST loads and check for reaching the load limit. |
271 | class ASTLoadGuard { |
272 | public: |
273 | ASTLoadGuard(unsigned Limit) : Limit(Limit) {} |
274 | |
275 | /// Indicates, whether a new load operation is permitted, it is within the |
276 | /// threshold. |
277 | operator bool() const { return Count < Limit; } |
278 | |
279 | /// Tell that a new AST was loaded successfully. |
280 | void indicateLoadSuccess() { ++Count; } |
281 | |
282 | private: |
283 | /// The number of ASTs actually imported. |
284 | unsigned Count{0u}; |
285 | /// The limit (threshold) value for number of loaded ASTs. |
286 | const unsigned Limit; |
287 | }; |
288 | |
289 | /// Storage and load of ASTUnits, cached access, and providing searchability |
290 | /// are the concerns of ASTUnitStorage class. |
291 | class ASTUnitStorage { |
292 | public: |
293 | ASTUnitStorage(CompilerInstance &CI); |
294 | /// Loads an ASTUnit for a function. |
295 | /// |
296 | /// \param FunctionName USR name of the function. |
297 | /// \param CrossTUDir Path to the directory used to store CTU related files. |
298 | /// \param IndexName Name of the file inside \p CrossTUDir which maps |
299 | /// function USR names to file paths. These files contain the corresponding |
300 | /// AST-dumps. |
301 | /// \param DisplayCTUProgress Display a message about loading new ASTs. |
302 | /// |
303 | /// \return An Expected instance which contains the ASTUnit pointer or the |
304 | /// error occurred during the load. |
305 | llvm::Expected<ASTUnit *> getASTUnitForFunction(StringRef FunctionName, |
306 | StringRef CrossTUDir, |
307 | StringRef IndexName, |
308 | bool DisplayCTUProgress); |
309 | /// Identifies the path of the file which can be used to load the ASTUnit |
310 | /// for a given function. |
311 | /// |
312 | /// \param FunctionName USR name of the function. |
313 | /// \param CrossTUDir Path to the directory used to store CTU related files. |
314 | /// \param IndexName Name of the file inside \p CrossTUDir which maps |
315 | /// function USR names to file paths. These files contain the corresponding |
316 | /// AST-dumps. |
317 | /// |
318 | /// \return An Expected instance containing the filepath. |
319 | llvm::Expected<std::string> getFileForFunction(StringRef FunctionName, |
320 | StringRef CrossTUDir, |
321 | StringRef IndexName); |
322 | |
323 | private: |
324 | llvm::Error ensureCTUIndexLoaded(StringRef CrossTUDir, StringRef IndexName); |
325 | llvm::Expected<ASTUnit *> getASTUnitForFile(StringRef FileName, |
326 | bool DisplayCTUProgress); |
327 | |
328 | template <typename... T> using BaseMapTy = llvm::StringMap<T...>; |
329 | using OwningMapTy = BaseMapTy<std::unique_ptr<clang::ASTUnit>>; |
330 | using NonOwningMapTy = BaseMapTy<clang::ASTUnit *>; |
331 | |
332 | OwningMapTy FileASTUnitMap; |
333 | NonOwningMapTy NameASTUnitMap; |
334 | |
335 | using IndexMapTy = BaseMapTy<std::string>; |
336 | IndexMapTy NameFileMap; |
337 | |
338 | /// Loads the AST based on the identifier found in the index. |
339 | ASTLoader Loader; |
340 | |
341 | /// Limit the number of loaded ASTs. It is used to limit the memory usage |
342 | /// of the CrossTranslationUnitContext. The ASTUnitStorage has the |
343 | /// information whether the AST to load is actually loaded or returned from |
344 | /// cache. This information is needed to maintain the counter. |
345 | ASTLoadGuard LoadGuard; |
346 | }; |
347 | |
348 | ASTUnitStorage ASTStorage; |
349 | }; |
350 | |
351 | } // namespace cross_tu |
352 | } // namespace clang |
353 | |
354 | #endif // LLVM_CLANG_CROSSTU_CROSSTRANSLATIONUNIT_H |
355 | |