clang  19.0.0git
CrossTranslationUnit.h
Go to the documentation of this file.
1 //===--- CrossTranslationUnit.h - -------------------------------*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file provides an interface to load binary AST dumps on demand. This
10 // feature can be utilized for tools that require cross translation unit
11 // support.
12 //
13 //===----------------------------------------------------------------------===//
14 #ifndef LLVM_CLANG_CROSSTU_CROSSTRANSLATIONUNIT_H
15 #define LLVM_CLANG_CROSSTU_CROSSTRANSLATIONUNIT_H
16 
19 #include "clang/Basic/LLVM.h"
20 #include "llvm/ADT/DenseMap.h"
21 #include "llvm/ADT/SmallPtrSet.h"
22 #include "llvm/ADT/StringMap.h"
23 #include "llvm/Support/Error.h"
24 #include "llvm/Support/Path.h"
25 #include <optional>
26 
27 namespace clang {
28 class CompilerInstance;
29 class ASTContext;
30 class ASTImporter;
31 class ASTUnit;
32 class DeclContext;
33 class FunctionDecl;
34 class VarDecl;
35 class NamedDecl;
36 class TranslationUnitDecl;
37 
38 namespace cross_tu {
39 
40 enum class index_error_code {
   // Result codes stored in IndexError and returned by IndexError::getCode().
   // NOTE(review): the embedded listing numbers jump from 42 to 59, so further
   // enumerators are presumably elided from this view - confirm against the
   // full header before relying on this list.
41  success = 0,
42  unspecified = 1,
59 };
60 
61 class IndexError : public llvm::ErrorInfo<IndexError> {
   // Error payload for failures related to the cross-TU index. It bundles an
   // index_error_code with optional context: a file name, a line number and a
   // pair of triple names.
62 public:
    /// Class identifier expected by the llvm::ErrorInfo machinery.
63  static char ID;
    /// Creates an error that carries only a code; the line number is 0 and
    /// all strings are empty.
64  IndexError(index_error_code C) : Code(C), LineNo(0) {}
    /// Creates an error that refers to a file and, optionally, a line in it.
65  IndexError(index_error_code C, std::string FileName, int LineNo = 0)
66  : Code(C), FileName(std::move(FileName)), LineNo(LineNo) {}
    /// Creates an error that refers to a file and two triple names.
    /// This overload does not mention LineNo, so the member keeps the value
    /// of its default member initializer (0).
67  IndexError(index_error_code C, std::string FileName, std::string TripleToName,
68  std::string TripleFromName)
69  : Code(C), FileName(std::move(FileName)),
70  TripleToName(std::move(TripleToName)),
71  TripleFromName(std::move(TripleFromName)) {}
    /// llvm::ErrorInfo overrides; defined out of line.
72  void log(raw_ostream &OS) const override;
73  std::error_code convertToErrorCode() const override;
    /// Accessors for the stored fields. The string getters return copies.
74  index_error_code getCode() const { return Code; }
75  int getLineNum() const { return LineNo; }
76  std::string getFileName() const { return FileName; }
77  std::string getTripleToName() const { return TripleToName; }
78  std::string getTripleFromName() const { return TripleFromName; }
79 
80 private:
81  index_error_code Code;
82  std::string FileName;
    // Default-initialized so that a constructor which omits LineNo from its
    // initializer list never leaves getLineNum() reading an indeterminate
    // value.
83  int LineNo = 0;
    // NOTE(review): presumably the triples of the importing ("to") and the
    // imported ("from") translation unit - confirm against the users.
84  std::string TripleToName;
85  std::string TripleFromName;
86 };
87 
88 /// This function parses an index file that determines which
89 /// translation unit contains which definition. The IndexPath is not prefixed
90 /// with CTUDir, so an absolute path is expected for consistent results.
91 ///
92 /// The index file format is the following:
93 /// each line consists of a USR and a filepath separated by a space.
94 ///
95 /// \return Returns a map where the USR is the key and the filepath is the value
96 /// or an error.
98 parseCrossTUIndex(StringRef IndexPath);
99 
100 std::string createCrossTUIndexString(const llvm::StringMap<std::string> &Index);
101 
102 using InvocationListTy = llvm::StringMap<llvm::SmallVector<std::string, 32>>;
103 /// Parse the YAML formatted invocation list file content \p FileContent.
104 /// The format is expected to be a mapping from absolute source file
105 /// paths in the filesystem to a list of command-line parts, which
106 /// constitute the invocation needed to compile that file. That invocation
107 /// will be used to produce the AST of the TU.
109  StringRef FileContent,
110  llvm::sys::path::Style PathStyle = llvm::sys::path::Style::posix);
111 
112 /// Returns true if it makes sense to import a foreign variable definition.
113 /// For instance, we don't want to import variables that have non-trivial types
114 /// because the constructor might have side-effects.
115 bool shouldImport(const VarDecl *VD, const ASTContext &ACtx);
116 
117 /// This class is used for tools that require cross translation
118 /// unit capability.
119 ///
120 /// This class can load definitions from external AST sources.
121 /// The loaded definition will be merged back to the original AST using the
122 /// AST Importer.
123 /// In order to use this class, an index file is required that describes
124 /// the locations of the AST files for each definition.
125 ///
126 /// Note that this class also implements caching.
128 public:
131 
132  /// This function loads a function or variable definition from an
133  /// external AST file and merges it into the original AST.
134  ///
135  /// This method should only be used on functions that have no definitions or
136  /// variables that have no initializer in
137  /// the current translation unit. A function definition with the same
138  /// declaration will be looked up in the index file which should be in the
139  /// \p CrossTUDir directory, called \p IndexName. In case the declaration is
140  /// found in the index the corresponding AST will be loaded and the
141  /// definition will be merged into the original AST using the AST Importer.
142  ///
143  /// \return The declaration with the definition will be returned.
144  /// If no suitable definition is found in the index file or multiple
145  /// definitions are found, an error will be returned.
146  ///
147  /// Note that the AST files should also be in the \p CrossTUDir.
149  getCrossTUDefinition(const FunctionDecl *FD, StringRef CrossTUDir,
150  StringRef IndexName, bool DisplayCTUProgress = false);
152  getCrossTUDefinition(const VarDecl *VD, StringRef CrossTUDir,
153  StringRef IndexName, bool DisplayCTUProgress = false);
154 
155  /// This function loads a definition from an external AST file.
156  ///
157  /// A definition with the same declaration will be looked up in the
158  /// index file which should be in the \p CrossTUDir directory, called
159  /// \p IndexName. In case the declaration is found in the index the
160  /// corresponding AST will be loaded. If the number of TUs imported
161  /// reaches \p CTULoadThreshold, no loading is performed.
162  ///
163  /// \return Returns a pointer to the ASTUnit that contains the definition of
164  /// the looked up name or an Error.
165  /// The returned pointer is never a nullptr.
166  ///
167  /// Note that the AST files should also be in the \p CrossTUDir.
168  llvm::Expected<ASTUnit *> loadExternalAST(StringRef LookupName,
169  StringRef CrossTUDir,
170  StringRef IndexName,
171  bool DisplayCTUProgress = false);
172 
173  /// This function merges a definition from a separate AST Unit into
174  /// the current one which was created by the compiler instance that
175  /// was passed to the constructor.
176  ///
177  /// \return Returns the resulting definition or an error.
179  ASTUnit *Unit);
181  ASTUnit *Unit);
182 
183  /// Get a name to identify a named decl.
184  static std::optional<std::string> getLookupName(const NamedDecl *ND);
185 
186  /// Emit diagnostics for the user for potential configuration errors.
187  void emitCrossTUDiagnostics(const IndexError &IE);
188 
189  /// Returns the MacroExpansionContext for the imported TU to which the given
190  /// source-location corresponds.
191  /// \p ToLoc Source location in the imported-to AST.
192  /// \note If any error happens such as \p ToLoc is a non-imported
193  /// source-location, empty is returned.
194  /// \note Macro expansion tracking for imported TUs is not implemented yet.
195  /// It returns empty unconditionally.
196  std::optional<clang::MacroExpansionContext>
198  const clang::SourceLocation &ToLoc) const;
199 
200  /// Returns true if the given Decl is newly created during the import.
201  bool isImportedAsNew(const Decl *ToDecl) const;
202 
203  /// Returns true if the given Decl is mapped (or created) during an import
204  /// but there was an unrecoverable error (the AST node cannot be erased, it
205  /// is marked with an Error object in this case).
206  bool hasError(const Decl *ToDecl) const;
207 
208 private:
     // NOTE(review): the helpers below are only declared here; the summaries
     // are inferred from their signatures and should be confirmed against the
     // implementation file.

     // Takes the "to" translation unit declaration; presumably sets up
     // ImporterSharedSt on first use.
209  void lazyInitImporterSharedSt(TranslationUnitDecl *ToTU);
     // Returns a reference to the ASTImporter associated with \p Unit;
     // presumably creates and caches one in ASTUnitImporterMap when missing.
210  ASTImporter &getOrCreateASTImporter(ASTUnit *Unit);
     // Template taking the same parameter list as the public
     // getCrossTUDefinition overloads; presumably their shared implementation.
211  template <typename T>
212  llvm::Expected<const T *> getCrossTUDefinitionImpl(const T *D,
213  StringRef CrossTUDir,
214  StringRef IndexName,
215  bool DisplayCTUProgress);
     // Presumably searches \p DC for a definition of type T that matches
     // \p LookupName; the pointer return suggests nullptr when none is found -
     // TODO confirm.
216  template <typename T>
217  const T *findDefInDeclContext(const DeclContext *DC,
218  StringRef LookupName);
     // Template counterpart of the public definition-merging entry points that
     // take a declaration and an ASTUnit.
219  template <typename T>
220  llvm::Expected<const T *> importDefinitionImpl(const T *D, ASTUnit *Unit);
221 
     // Maps a TranslationUnitDecl to the ASTImporter owned (via
     // std::unique_ptr) for it.
222  using ImporterMapTy =
223  llvm::DenseMap<TranslationUnitDecl *, std::unique_ptr<ASTImporter>>;
224 
225  ImporterMapTy ASTUnitImporterMap;
226 
     // Held by reference, so the ASTContext is not owned by this class.
227  ASTContext &Context;
     // State object with shared ownership (std::shared_ptr).
228  std::shared_ptr<ASTImporterSharedState> ImporterSharedSt;
229 
231 
232  /// Loads ASTUnits from AST-dumps or source-files.
233  class ASTLoader {
234  public:
     /// \param CI Compiler instance, stored by reference.
     /// \param CTUDir Directory that relative identifiers are prefixed with
     /// (see load()).
     /// \param InvocationListFilePath Path to the YAML invocation list file.
     /// NOTE(review): both paths are kept as StringRef members, so the
     /// referenced strings presumably have to outlive the loader - confirm
     /// against the callers.
235  ASTLoader(CompilerInstance &CI, StringRef CTUDir,
236  StringRef InvocationListFilePath);
237 
238  /// Load the ASTUnit by its identifier found in the index file. If the
239  /// identifier is suffixed with '.ast' it is considered a dump. Otherwise
240  /// it is treated as a source-file, and parsed on demand. Relative paths are
241  /// prefixed with CTUDir.
242  LoadResultTy load(StringRef Identifier);
243 
244  /// Lazily initialize the invocation list information, which is needed for
245  /// on-demand parsing.
246  llvm::Error lazyInitInvocationList();
247 
248  private:
249  /// The style used for storage and lookup of filesystem paths.
250  /// Defaults to posix.
251  const llvm::sys::path::Style PathStyle = llvm::sys::path::Style::posix;
252 
253  /// Loads an AST from a pch-dump.
254  LoadResultTy loadFromDump(StringRef Identifier);
255  /// Loads an AST from a source-file.
256  LoadResultTy loadFromSource(StringRef Identifier);
257 
     /// The compiler instance passed to the constructor (not owned).
258  CompilerInstance &CI;
     /// The directory used as prefix for relative identifiers.
259  StringRef CTUDir;
260  /// The path to the file containing the invocation list, which is in YAML
261  /// format, and contains a mapping from source files to compiler invocations
262  /// that produce the AST used for analysis.
263  StringRef InvocationListFilePath;
264  /// In case of on-demand parsing, the invocations for parsing the source
265  /// files are stored here. Empty until the list has been initialized.
266  std::optional<InvocationListTy> InvocationList;
     /// Starts out as success. NOTE(review): presumably remembers the outcome
     /// of the last invocation list parse so that it can be reported again -
     /// confirm in the implementation.
267  index_error_code PreviousParsingResult = index_error_code::success;
268  };
269 
270  /// Maintains the number of AST loads and checks whether the load limit has
     /// been reached.
     ///
     /// NOTE(review): neither the constructor nor the conversion operator is
     /// marked explicit, so an unsigned converts implicitly to a guard and a
     /// guard converts implicitly to bool (and from there to integer types).
     /// Consider making both explicit once all users have been checked.
271  class ASTLoadGuard {
272  public:
     /// \param Limit Number of loads after which no further load is permitted.
273  ASTLoadGuard(unsigned Limit) : Limit(Limit) {}
274 
275  /// Indicates whether a new load operation is permitted, i.e. whether the
276  /// number of loads counted so far is still below the limit.
277  operator bool() const { return Count < Limit; }
278 
279  /// Tell that a new AST was loaded successfully (increments the counter).
280  void indicateLoadSuccess() { ++Count; }
281 
282  private:
283  /// The number of ASTs actually imported.
284  unsigned Count{0u};
285  /// The limit (threshold) value for number of loaded ASTs.
286  const unsigned Limit;
287  };
288 
289  /// Storage and load of ASTUnits, cached access, and providing searchability
290  /// are the concerns of ASTUnitStorage class.
291  class ASTUnitStorage {
292  public:
     /// Constructs the storage from the given compiler instance.
293  ASTUnitStorage(CompilerInstance &CI);
294  /// Loads an ASTUnit for a function.
295  ///
296  /// \param FunctionName USR name of the function.
297  /// \param CrossTUDir Path to the directory used to store CTU related files.
298  /// \param IndexName Name of the file inside \p CrossTUDir which maps
299  /// function USR names to file paths. These files contain the corresponding
300  /// AST-dumps.
301  /// \param DisplayCTUProgress Display a message about loading new ASTs.
302  ///
303  /// \return An Expected instance which contains the ASTUnit pointer or the
304  /// error that occurred during the load.
305  llvm::Expected<ASTUnit *> getASTUnitForFunction(StringRef FunctionName,
306  StringRef CrossTUDir,
307  StringRef IndexName,
308  bool DisplayCTUProgress);
309  /// Identifies the path of the file which can be used to load the ASTUnit
310  /// for a given function.
311  ///
312  /// \param FunctionName USR name of the function.
313  /// \param CrossTUDir Path to the directory used to store CTU related files.
314  /// \param IndexName Name of the file inside \p CrossTUDir which maps
315  /// function USR names to file paths. These files contain the corresponding
316  /// AST-dumps.
317  ///
318  /// \return An Expected instance containing the filepath.
319  llvm::Expected<std::string> getFileForFunction(StringRef FunctionName,
320  StringRef CrossTUDir,
321  StringRef IndexName);
322 
323  private:
     /// Takes the index location (\p CrossTUDir, \p IndexName) and reports
     /// failure through the returned llvm::Error. NOTE(review): presumably
     /// fills NameFileMap on first use - confirm in the implementation.
324  llvm::Error ensureCTUIndexLoaded(StringRef CrossTUDir, StringRef IndexName);
     /// File-based counterpart of getASTUnitForFunction: returns the ASTUnit
     /// pointer for \p FileName or an error.
325  llvm::Expected<ASTUnit *> getASTUnitForFile(StringRef FileName,
326  bool DisplayCTUProgress);
327 
     /// All maps below are string-keyed llvm::StringMap instances.
328  template <typename... T> using BaseMapTy = llvm::StringMap<T...>;
329  using OwningMapTy = BaseMapTy<std::unique_ptr<clang::ASTUnit>>;
330  using NonOwningMapTy = BaseMapTy<clang::ASTUnit *>;
331 
     /// Owns the ASTUnits (std::unique_ptr values). NOTE(review): presumably
     /// keyed by file name - confirm.
332  OwningMapTy FileASTUnitMap;
     /// Non-owning ASTUnit pointers. NOTE(review): presumably keyed by the
     /// looked up (USR) name and pointing into FileASTUnitMap - confirm.
333  NonOwningMapTy NameASTUnitMap;
334 
     /// String-to-string map. NOTE(review): presumably the parsed index, i.e.
     /// lookup name to file path - confirm.
335  using IndexMapTy = BaseMapTy<std::string>;
336  IndexMapTy NameFileMap;
337 
338  /// Loads the AST based on the identifier found in the index.
339  ASTLoader Loader;
340 
341  /// Limit the number of loaded ASTs. It is used to limit the memory usage
342  /// of the CrossTranslationUnitContext. The ASTUnitStorage has the
343  /// information whether the AST to load is actually loaded or returned from
344  /// cache. This information is needed to maintain the counter.
345  ASTLoadGuard LoadGuard;
346  };
347 
348  ASTUnitStorage ASTStorage;
349 };
350 
351 } // namespace cross_tu
352 } // namespace clang
353 
354 #endif // LLVM_CLANG_CROSSTU_CROSSTRANSLATIONUNIT_H
StringRef Identifier
Definition: Format.cpp:2984
Forward-declares and imports various common LLVM datatypes that clang wants to use unqualified.
Holds long-lived AST nodes (such as types and decls) that can be referred to throughout the semantic ...
Definition: ASTContext.h:185
Imports selected nodes from one AST context into another context, merging AST nodes where appropriate...
Definition: ASTImporter.h:62
Utility class for loading an ASTContext from an AST file.
Definition: ASTUnit.h:89
CompilerInstance - Helper class for managing a single instance of the Clang compiler.
DeclContext - This is used only as base class of specific decl types that can act as declaration cont...
Definition: DeclBase.h:1436
Decl - This represents one declaration (or definition), e.g.
Definition: DeclBase.h:86
Represents a function declaration or definition.
Definition: Decl.h:1972
This represents a decl that may have a name.
Definition: Decl.h:249
Encodes a location in the source.
The top declaration context.
Definition: Decl.h:84
Represents a variable declaration or definition.
Definition: Decl.h:919
This class is used for tools that requires cross translation unit capability.
void emitCrossTUDiagnostics(const IndexError &IE)
Emit diagnostics for the user for potential configuration errors.
llvm::Expected< const FunctionDecl * > getCrossTUDefinition(const FunctionDecl *FD, StringRef CrossTUDir, StringRef IndexName, bool DisplayCTUProgress=false)
This function loads a function or variable definition from an external AST file and merges it into th...
llvm::Expected< const FunctionDecl * > importDefinition(const FunctionDecl *FD, ASTUnit *Unit)
This function merges a definition from a separate AST Unit into the current one which was created by ...
std::optional< clang::MacroExpansionContext > getMacroExpansionContextForSourceLocation(const clang::SourceLocation &ToLoc) const
Returns the MacroExpansionContext for the imported TU to which the given source-location corresponds.
static std::optional< std::string > getLookupName(const NamedDecl *ND)
Get a name to identify a named decl.
bool hasError(const Decl *ToDecl) const
Returns true if the given Decl is mapped (or created) during an import but there was an unrecoverable...
bool isImportedAsNew(const Decl *ToDecl) const
Returns true if the given Decl is newly created during the import.
llvm::Expected< ASTUnit * > loadExternalAST(StringRef LookupName, StringRef CrossTUDir, StringRef IndexName, bool DisplayCTUProgress=false)
This function loads a definition from an external AST file.
IndexError(index_error_code C, std::string FileName, std::string TripleToName, std::string TripleFromName)
index_error_code getCode() const
std::string getTripleToName() const
IndexError(index_error_code C, std::string FileName, int LineNo=0)
std::error_code convertToErrorCode() const override
void log(raw_ostream &OS) const override
std::string getTripleFromName() const
bool shouldImport(const VarDecl *VD, const ASTContext &ACtx)
Returns true if it makes sense to import a foreign variable definition.
llvm::StringMap< llvm::SmallVector< std::string, 32 > > InvocationListTy
llvm::Expected< llvm::StringMap< std::string > > parseCrossTUIndex(StringRef IndexPath)
This function parses an index file that determines which translation unit contains which definition.
std::string createCrossTUIndexString(const llvm::StringMap< std::string > &Index)
llvm::Expected< InvocationListTy > parseInvocationList(StringRef FileContent, llvm::sys::path::Style PathStyle=llvm::sys::path::Style::posix)
Parse the YAML formatted invocation list file content FileContent.
The JSON file list parser is used to communicate input to InstallAPI.
const FunctionProtoType * T
Definition: Format.h:5433
#define bool
Definition: stdbool.h:24