1 | //===- CompilationDatabase.h ------------------------------------*- C++ -*-===// |
---|---|
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | // |
9 | // This file provides an interface and multiple implementations for |
10 | // CompilationDatabases. |
11 | // |
12 | // While C++ refactoring and analysis tools are not compilers, and thus |
13 | // don't run as part of the build system, they need the exact information |
14 | // of a build in order to be able to correctly understand the C++ code of |
15 | // the project. This information is provided via the CompilationDatabase |
16 | // interface. |
17 | // |
18 | // To create a CompilationDatabase from a build directory one can call |
19 | // CompilationDatabase::loadFromDirectory(), which deduces the correct |
20 | // compilation database from the root of the build tree. |
21 | // |
22 | // See the concrete subclasses of CompilationDatabase for currently supported |
23 | // formats. |
24 | // |
25 | //===----------------------------------------------------------------------===// |
26 | |
27 | #ifndef LLVM_CLANG_TOOLING_COMPILATIONDATABASE_H |
28 | #define LLVM_CLANG_TOOLING_COMPILATIONDATABASE_H |
29 | |
30 | #include "clang/Basic/LLVM.h" |
31 | #include "llvm/ADT/ArrayRef.h" |
32 | #include "llvm/ADT/StringRef.h" |
33 | #include "llvm/ADT/Twine.h" |
34 | #include <memory> |
35 | #include <string> |
36 | #include <utility> |
37 | #include <vector> |
38 | |
39 | namespace clang { |
40 | namespace tooling { |
41 | |
42 | /// Specifies the working directory and command of a compilation. |
43 | struct CompileCommand { |
44 | CompileCommand() = default; |
45 | CompileCommand(Twine Directory, Twine Filename, |
46 | std::vector<std::string> CommandLine, Twine Output) |
47 | : Directory(Directory.str()), Filename(Filename.str()), |
48 | CommandLine(std::move(CommandLine)), Output(Output.str()){} |
49 | |
50 | /// The working directory the command was executed from. |
51 | std::string Directory; |
52 | |
53 | /// The source file associated with the command. |
54 | std::string Filename; |
55 | |
56 | /// The command line that was executed. |
57 | std::vector<std::string> CommandLine; |
58 | |
59 | /// The output file associated with the command. |
60 | std::string Output; |
61 | |
62 | friend bool operator==(const CompileCommand &LHS, const CompileCommand &RHS) { |
63 | return LHS.Directory == RHS.Directory && LHS.Filename == RHS.Filename && |
64 | LHS.CommandLine == RHS.CommandLine && LHS.Output == RHS.Output; |
65 | } |
66 | |
67 | friend bool operator!=(const CompileCommand &LHS, const CompileCommand &RHS) { |
68 | return !(LHS == RHS); |
69 | } |
70 | }; |
71 | |
72 | /// Interface for compilation databases. |
73 | /// |
74 | /// A compilation database allows the user to retrieve compile command lines |
75 | /// for the files in a project. |
76 | /// |
77 | /// Many implementations are enumerable, allowing all command lines to be |
78 | /// retrieved. These can be used to run clang tools over a subset of the files |
79 | /// in a project. |
80 | class CompilationDatabase { |
81 | public: |
82 | virtual ~CompilationDatabase(); |
83 | |
84 | /// Loads a compilation database from a build directory. |
85 | /// |
86 | /// Looks at the specified 'BuildDirectory' and creates a compilation database |
87 | /// that allows to query compile commands for source files in the |
88 | /// corresponding source tree. |
89 | /// |
90 | /// Returns NULL and sets ErrorMessage if we were not able to build up a |
91 | /// compilation database for the build directory. |
92 | /// |
93 | /// FIXME: Currently only supports JSON compilation databases, which |
94 | /// are named 'compile_commands.json' in the given directory. Extend this |
95 | /// for other build types (like ninja build files). |
96 | static std::unique_ptr<CompilationDatabase> |
97 | loadFromDirectory(StringRef BuildDirectory, std::string &ErrorMessage); |
98 | |
99 | /// Tries to detect a compilation database location and load it. |
100 | /// |
101 | /// Looks for a compilation database in all parent paths of file 'SourceFile' |
102 | /// by calling loadFromDirectory. |
103 | static std::unique_ptr<CompilationDatabase> |
104 | autoDetectFromSource(StringRef SourceFile, std::string &ErrorMessage); |
105 | |
106 | /// Tries to detect a compilation database location and load it. |
107 | /// |
108 | /// Looks for a compilation database in directory 'SourceDir' and all |
109 | /// its parent paths by calling loadFromDirectory. |
110 | static std::unique_ptr<CompilationDatabase> |
111 | autoDetectFromDirectory(StringRef SourceDir, std::string &ErrorMessage); |
112 | |
113 | /// Returns all compile commands in which the specified file was |
114 | /// compiled. |
115 | /// |
116 | /// This includes compile commands that span multiple source files. |
117 | /// For example, consider a project with the following compilations: |
118 | /// $ clang++ -o test a.cc b.cc t.cc |
119 | /// $ clang++ -o production a.cc b.cc -DPRODUCTION |
120 | /// A compilation database representing the project would return both command |
121 | /// lines for a.cc and b.cc and only the first command line for t.cc. |
122 | virtual std::vector<CompileCommand> getCompileCommands( |
123 | StringRef FilePath) const = 0; |
124 | |
125 | /// Returns the list of all files available in the compilation database. |
126 | /// |
127 | /// By default, returns nothing. Implementations should override this if they |
128 | /// can enumerate their source files. |
129 | virtual std::vector<std::string> getAllFiles() const { return {}; } |
130 | |
131 | /// Returns all compile commands for all the files in the compilation |
132 | /// database. |
133 | /// |
134 | /// FIXME: Add a layer in Tooling that provides an interface to run a tool |
135 | /// over all files in a compilation database. Not all build systems have the |
136 | /// ability to provide a feasible implementation for \c getAllCompileCommands. |
137 | /// |
138 | /// By default, this is implemented in terms of getAllFiles() and |
139 | /// getCompileCommands(). Subclasses may override this for efficiency. |
140 | virtual std::vector<CompileCommand> getAllCompileCommands() const; |
141 | }; |
142 | |
143 | /// A compilation database that returns a single compile command line. |
144 | /// |
145 | /// Useful when we want a tool to behave more like a compiler invocation. |
146 | /// This compilation database is not enumerable: getAllFiles() returns {}. |
147 | class FixedCompilationDatabase : public CompilationDatabase { |
148 | public: |
149 | /// Creates a FixedCompilationDatabase from the arguments after "--". |
150 | /// |
151 | /// Parses the given command line for "--". If "--" is found, the rest of |
152 | /// the arguments will make up the command line in the returned |
153 | /// FixedCompilationDatabase. |
154 | /// The arguments after "--" must not include positional parameters or the |
155 | /// argv[0] of the tool. Those will be added by the FixedCompilationDatabase |
156 | /// when a CompileCommand is requested. The argv[0] of the returned command |
157 | /// line will be "clang-tool". |
158 | /// |
159 | /// Returns NULL in case "--" is not found. |
160 | /// |
161 | /// The argument list is meant to be compatible with normal llvm command line |
162 | /// parsing in main methods. |
163 | /// int main(int argc, char **argv) { |
164 | /// std::unique_ptr<FixedCompilationDatabase> Compilations( |
165 | /// FixedCompilationDatabase::loadFromCommandLine(argc, argv)); |
166 | /// cl::ParseCommandLineOptions(argc, argv); |
167 | /// ... |
168 | /// } |
169 | /// |
170 | /// \param Argc The number of command line arguments - will be changed to |
171 | /// the number of arguments before "--", if "--" was found in the argument |
172 | /// list. |
173 | /// \param Argv Points to the command line arguments. |
174 | /// \param ErrorMsg Contains error text if the function returns null pointer. |
175 | /// \param Directory The base directory used in the FixedCompilationDatabase. |
176 | static std::unique_ptr<FixedCompilationDatabase> loadFromCommandLine( |
177 | int &Argc, const char *const *Argv, std::string &ErrorMsg, |
178 | Twine Directory = "."); |
179 | |
180 | /// Reads flags from the given file, one-per line. |
181 | /// Returns nullptr and sets ErrorMessage if we can't read the file. |
182 | static std::unique_ptr<FixedCompilationDatabase> |
183 | loadFromFile(StringRef Path, std::string &ErrorMsg); |
184 | |
185 | /// Constructs a compilation data base from a specified directory |
186 | /// and command line. |
187 | FixedCompilationDatabase(Twine Directory, ArrayRef<std::string> CommandLine); |
188 | |
189 | /// Returns the given compile command. |
190 | /// |
191 | /// Will always return a vector with one entry that contains the directory |
192 | /// and command line specified at construction with "clang-tool" as argv[0] |
193 | /// and 'FilePath' as positional argument. |
194 | std::vector<CompileCommand> |
195 | getCompileCommands(StringRef FilePath) const override; |
196 | |
197 | private: |
198 | /// This is built up to contain a single entry vector to be returned from |
199 | /// getCompileCommands after adding the positional argument. |
200 | std::vector<CompileCommand> CompileCommands; |
201 | }; |
202 | |
203 | /// Returns a wrapped CompilationDatabase that defers to the provided one, |
204 | /// but getCompileCommands() will infer commands for unknown files. |
205 | /// The return value of getAllFiles() or getAllCompileCommands() is unchanged. |
206 | /// See InterpolatingCompilationDatabase.cpp for details on heuristics. |
207 | std::unique_ptr<CompilationDatabase> |
208 | inferMissingCompileCommands(std::unique_ptr<CompilationDatabase>); |
209 | |
210 | } // namespace tooling |
211 | } // namespace clang |
212 | |
213 | #endif // LLVM_CLANG_TOOLING_COMPILATIONDATABASE_H |
214 |