xref: /freebsd/contrib/llvm-project/llvm/include/llvm/LTO/LTO.h (revision 2f513db72b034fd5ef7f080b11be5c711c15186a)
1 //===-LTO.h - LLVM Link Time Optimizer ------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file declares functions and classes used to support LTO. It is intended
10 // to be used both by LTO classes as well as by clients (gold-plugin) that
11 // don't utilize the LTO code generator interfaces.
12 //
13 //===----------------------------------------------------------------------===//
14 
15 #ifndef LLVM_LTO_LTO_H
16 #define LLVM_LTO_LTO_H
17 
18 #include "llvm/ADT/MapVector.h"
19 #include "llvm/ADT/StringMap.h"
20 #include "llvm/ADT/StringSet.h"
21 #include "llvm/IR/DiagnosticInfo.h"
22 #include "llvm/IR/ModuleSummaryIndex.h"
23 #include "llvm/IR/RemarkStreamer.h"
24 #include "llvm/LTO/Config.h"
25 #include "llvm/Linker/IRMover.h"
26 #include "llvm/Object/IRSymtab.h"
27 #include "llvm/Support/Error.h"
28 #include "llvm/Support/ToolOutputFile.h"
29 #include "llvm/Support/thread.h"
30 #include "llvm/Target/TargetOptions.h"
31 #include "llvm/Transforms/IPO/FunctionImport.h"
32 
33 namespace llvm {
34 
35 class BitcodeModule;
36 class Error;
37 class LLVMContext;
38 class MemoryBufferRef;
39 class Module;
40 class Target;
41 class raw_pwrite_stream;
42 
43 /// Resolve linkage for prevailing symbols in the \p Index. Linkage changes
44 /// recorded in the index and the ThinLTO backends must apply the changes to
45 /// the module via thinLTOResolvePrevailingInModule.
46 ///
47 /// This is done for correctness (if value exported, ensure we always
48 /// emit a copy), and compile-time optimization (allow drop of duplicates).
49 void thinLTOResolvePrevailingInIndex(
50     ModuleSummaryIndex &Index,
51     function_ref<bool(GlobalValue::GUID, const GlobalValueSummary *)>
52         isPrevailing,
53     function_ref<void(StringRef, GlobalValue::GUID, GlobalValue::LinkageTypes)>
54         recordNewLinkage,
55     const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols);
56 
57 /// Update the linkages in the given \p Index to mark exported values
58 /// as external and non-exported values as internal. The ThinLTO backends
59 /// must apply the changes to the Module via thinLTOInternalizeModule.
60 void thinLTOInternalizeAndPromoteInIndex(
61     ModuleSummaryIndex &Index,
62     function_ref<bool(StringRef, GlobalValue::GUID)> isExported);
63 
64 /// Computes a unique hash for the Module considering the current list of
65 /// export/import and other global analysis results.
66 /// The hash is produced in \p Key.
67 void computeLTOCacheKey(
68     SmallString<40> &Key, const lto::Config &Conf,
69     const ModuleSummaryIndex &Index, StringRef ModuleID,
70     const FunctionImporter::ImportMapTy &ImportList,
71     const FunctionImporter::ExportSetTy &ExportList,
72     const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
73     const GVSummaryMapTy &DefinedGlobals,
74     const std::set<GlobalValue::GUID> &CfiFunctionDefs = {},
75     const std::set<GlobalValue::GUID> &CfiFunctionDecls = {});
76 
77 namespace lto {
78 
79 /// Given the original \p Path to an output file, replace any path
80 /// prefix matching \p OldPrefix with \p NewPrefix. Also, create the
81 /// resulting directory if it does not yet exist.
82 std::string getThinLTOOutputFile(const std::string &Path,
83                                  const std::string &OldPrefix,
84                                  const std::string &NewPrefix);
85 
86 /// Setup optimization remarks.
87 Expected<std::unique_ptr<ToolOutputFile>>
88 setupOptimizationRemarks(LLVMContext &Context, StringRef RemarksFilename,
89                          StringRef RemarksPasses, StringRef RemarksFormat,
90                          bool RemarksWithHotness, int Count = -1);
91 
92 /// Setups the output file for saving statistics.
93 Expected<std::unique_ptr<ToolOutputFile>>
94 setupStatsFile(StringRef StatsFilename);
95 
96 class LTO;
97 struct SymbolResolution;
98 class ThinBackendProc;
99 
100 /// An input file. This is a symbol table wrapper that only exposes the
101 /// information that an LTO client should need in order to do symbol resolution.
102 class InputFile {
103 public:
104   class Symbol;
105 
106 private:
107   // FIXME: Remove LTO class friendship once we have bitcode symbol tables.
108   friend LTO;
109   InputFile() = default;
110 
111   std::vector<BitcodeModule> Mods;
112   SmallVector<char, 0> Strtab;
113   std::vector<Symbol> Symbols;
114 
115   // [begin, end) for each module
116   std::vector<std::pair<size_t, size_t>> ModuleSymIndices;
117 
118   StringRef TargetTriple, SourceFileName, COFFLinkerOpts;
119   std::vector<StringRef> DependentLibraries;
120   std::vector<StringRef> ComdatTable;
121 
122 public:
123   ~InputFile();
124 
125   /// Create an InputFile.
126   static Expected<std::unique_ptr<InputFile>> create(MemoryBufferRef Object);
127 
128   /// The purpose of this class is to only expose the symbol information that an
129   /// LTO client should need in order to do symbol resolution.
130   class Symbol : irsymtab::Symbol {
131     friend LTO;
132 
133   public:
134     Symbol(const irsymtab::Symbol &S) : irsymtab::Symbol(S) {}
135 
136     using irsymtab::Symbol::isUndefined;
137     using irsymtab::Symbol::isCommon;
138     using irsymtab::Symbol::isWeak;
139     using irsymtab::Symbol::isIndirect;
140     using irsymtab::Symbol::getName;
141     using irsymtab::Symbol::getIRName;
142     using irsymtab::Symbol::getVisibility;
143     using irsymtab::Symbol::canBeOmittedFromSymbolTable;
144     using irsymtab::Symbol::isTLS;
145     using irsymtab::Symbol::getComdatIndex;
146     using irsymtab::Symbol::getCommonSize;
147     using irsymtab::Symbol::getCommonAlignment;
148     using irsymtab::Symbol::getCOFFWeakExternalFallback;
149     using irsymtab::Symbol::getSectionName;
150     using irsymtab::Symbol::isExecutable;
151     using irsymtab::Symbol::isUsed;
152   };
153 
154   /// A range over the symbols in this InputFile.
155   ArrayRef<Symbol> symbols() const { return Symbols; }
156 
157   /// Returns linker options specified in the input file.
158   StringRef getCOFFLinkerOpts() const { return COFFLinkerOpts; }
159 
160   /// Returns dependent library specifiers from the input file.
161   ArrayRef<StringRef> getDependentLibraries() const { return DependentLibraries; }
162 
163   /// Returns the path to the InputFile.
164   StringRef getName() const;
165 
166   /// Returns the input file's target triple.
167   StringRef getTargetTriple() const { return TargetTriple; }
168 
169   /// Returns the source file path specified at compile time.
170   StringRef getSourceFileName() const { return SourceFileName; }
171 
172   // Returns a table with all the comdats used by this file.
173   ArrayRef<StringRef> getComdatTable() const { return ComdatTable; }
174 
175   // Returns the only BitcodeModule from InputFile.
176   BitcodeModule &getSingleBitcodeModule();
177 
178 private:
179   ArrayRef<Symbol> module_symbols(unsigned I) const {
180     const auto &Indices = ModuleSymIndices[I];
181     return {Symbols.data() + Indices.first, Symbols.data() + Indices.second};
182   }
183 };
184 
185 /// This class wraps an output stream for a native object. Most clients should
186 /// just be able to return an instance of this base class from the stream
187 /// callback, but if a client needs to perform some action after the stream is
188 /// written to, that can be done by deriving from this class and overriding the
189 /// destructor.
190 class NativeObjectStream {
191 public:
192   NativeObjectStream(std::unique_ptr<raw_pwrite_stream> OS) : OS(std::move(OS)) {}
193   std::unique_ptr<raw_pwrite_stream> OS;
194   virtual ~NativeObjectStream() = default;
195 };
196 
197 /// This type defines the callback to add a native object that is generated on
198 /// the fly.
199 ///
200 /// Stream callbacks must be thread safe.
201 using AddStreamFn =
202     std::function<std::unique_ptr<NativeObjectStream>(unsigned Task)>;
203 
204 /// This is the type of a native object cache. To request an item from the
205 /// cache, pass a unique string as the Key. For hits, the cached file will be
206 /// added to the link and this function will return AddStreamFn(). For misses,
207 /// the cache will return a stream callback which must be called at most once to
208 /// produce content for the stream. The native object stream produced by the
209 /// stream callback will add the file to the link after the stream is written
210 /// to.
211 ///
212 /// Clients generally look like this:
213 ///
214 /// if (AddStreamFn AddStream = Cache(Task, Key))
215 ///   ProduceContent(AddStream);
216 using NativeObjectCache =
217     std::function<AddStreamFn(unsigned Task, StringRef Key)>;
218 
219 /// A ThinBackend defines what happens after the thin-link phase during ThinLTO.
220 /// The details of this type definition aren't important; clients can only
221 /// create a ThinBackend using one of the create*ThinBackend() functions below.
222 using ThinBackend = std::function<std::unique_ptr<ThinBackendProc>(
223     Config &C, ModuleSummaryIndex &CombinedIndex,
224     StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries,
225     AddStreamFn AddStream, NativeObjectCache Cache)>;
226 
227 /// This ThinBackend runs the individual backend jobs in-process.
228 ThinBackend createInProcessThinBackend(unsigned ParallelismLevel);
229 
230 /// This ThinBackend writes individual module indexes to files, instead of
231 /// running the individual backend jobs. This backend is for distributed builds
232 /// where separate processes will invoke the real backends.
233 ///
234 /// To find the path to write the index to, the backend checks if the path has a
235 /// prefix of OldPrefix; if so, it replaces that prefix with NewPrefix. It then
236 /// appends ".thinlto.bc" and writes the index to that path. If
237 /// ShouldEmitImportsFiles is true it also writes a list of imported files to a
238 /// similar path with ".imports" appended instead.
239 /// LinkedObjectsFile is an output stream to write the list of object files for
240 /// the final ThinLTO linking. Can be nullptr.
241 /// OnWrite is callback which receives module identifier and notifies LTO user
242 /// that index file for the module (and optionally imports file) was created.
243 using IndexWriteCallback = std::function<void(const std::string &)>;
244 ThinBackend createWriteIndexesThinBackend(std::string OldPrefix,
245                                           std::string NewPrefix,
246                                           bool ShouldEmitImportsFiles,
247                                           raw_fd_ostream *LinkedObjectsFile,
248                                           IndexWriteCallback OnWrite);
249 
250 /// This class implements a resolution-based interface to LLVM's LTO
251 /// functionality. It supports regular LTO, parallel LTO code generation and
252 /// ThinLTO. You can use it from a linker in the following way:
253 /// - Set hooks and code generation options (see lto::Config struct defined in
254 ///   Config.h), and use the lto::Config object to create an lto::LTO object.
255 /// - Create lto::InputFile objects using lto::InputFile::create(), then use
256 ///   the symbols() function to enumerate its symbols and compute a resolution
257 ///   for each symbol (see SymbolResolution below).
258 /// - After the linker has visited each input file (and each regular object
259 ///   file) and computed a resolution for each symbol, take each lto::InputFile
260 ///   and pass it and an array of symbol resolutions to the add() function.
261 /// - Call the getMaxTasks() function to get an upper bound on the number of
262 ///   native object files that LTO may add to the link.
263 /// - Call the run() function. This function will use the supplied AddStream
264 ///   and Cache functions to add up to getMaxTasks() native object files to
265 ///   the link.
266 class LTO {
267   friend InputFile;
268 
269 public:
270   /// Create an LTO object. A default constructed LTO object has a reasonable
271   /// production configuration, but you can customize it by passing arguments to
272   /// this constructor.
273   /// FIXME: We do currently require the DiagHandler field to be set in Conf.
274   /// Until that is fixed, a Config argument is required.
275   LTO(Config Conf, ThinBackend Backend = nullptr,
276       unsigned ParallelCodeGenParallelismLevel = 1);
277   ~LTO();
278 
279   /// Add an input file to the LTO link, using the provided symbol resolutions.
280   /// The symbol resolutions must appear in the enumeration order given by
281   /// InputFile::symbols().
282   Error add(std::unique_ptr<InputFile> Obj, ArrayRef<SymbolResolution> Res);
283 
284   /// Returns an upper bound on the number of tasks that the client may expect.
285   /// This may only be called after all IR object files have been added. For a
286   /// full description of tasks see LTOBackend.h.
287   unsigned getMaxTasks() const;
288 
289   /// Runs the LTO pipeline. This function calls the supplied AddStream
290   /// function to add native object files to the link.
291   ///
292   /// The Cache parameter is optional. If supplied, it will be used to cache
293   /// native object files and add them to the link.
294   ///
295   /// The client will receive at most one callback (via either AddStream or
296   /// Cache) for each task identifier.
297   Error run(AddStreamFn AddStream, NativeObjectCache Cache = nullptr);
298 
299 private:
300   Config Conf;
301 
302   struct RegularLTOState {
303     RegularLTOState(unsigned ParallelCodeGenParallelismLevel, Config &Conf);
304     struct CommonResolution {
305       uint64_t Size = 0;
306       unsigned Align = 0;
307       /// Record if at least one instance of the common was marked as prevailing
308       bool Prevailing = false;
309     };
310     std::map<std::string, CommonResolution> Commons;
311 
312     unsigned ParallelCodeGenParallelismLevel;
313     LTOLLVMContext Ctx;
314     std::unique_ptr<Module> CombinedModule;
315     std::unique_ptr<IRMover> Mover;
316 
317     // This stores the information about a regular LTO module that we have added
318     // to the link. It will either be linked immediately (for modules without
319     // summaries) or after summary-based dead stripping (for modules with
320     // summaries).
321     struct AddedModule {
322       std::unique_ptr<Module> M;
323       std::vector<GlobalValue *> Keep;
324     };
325     std::vector<AddedModule> ModsWithSummaries;
326   } RegularLTO;
327 
328   struct ThinLTOState {
329     ThinLTOState(ThinBackend Backend);
330 
331     ThinBackend Backend;
332     ModuleSummaryIndex CombinedIndex;
333     MapVector<StringRef, BitcodeModule> ModuleMap;
334     DenseMap<GlobalValue::GUID, StringRef> PrevailingModuleForGUID;
335   } ThinLTO;
336 
337   // The global resolution for a particular (mangled) symbol name. This is in
338   // particular necessary to track whether each symbol can be internalized.
339   // Because any input file may introduce a new cross-partition reference, we
340   // cannot make any final internalization decisions until all input files have
341   // been added and the client has called run(). During run() we apply
342   // internalization decisions either directly to the module (for regular LTO)
343   // or to the combined index (for ThinLTO).
344   struct GlobalResolution {
345     /// The unmangled name of the global.
346     std::string IRName;
347 
348     /// Keep track if the symbol is visible outside of a module with a summary
349     /// (i.e. in either a regular object or a regular LTO module without a
350     /// summary).
351     bool VisibleOutsideSummary = false;
352 
353     bool UnnamedAddr = true;
354 
355     /// True if module contains the prevailing definition.
356     bool Prevailing = false;
357 
358     /// Returns true if module contains the prevailing definition and symbol is
359     /// an IR symbol. For example when module-level inline asm block is used,
360     /// symbol can be prevailing in module but have no IR name.
361     bool isPrevailingIRSymbol() const { return Prevailing && !IRName.empty(); }
362 
363     /// This field keeps track of the partition number of this global. The
364     /// regular LTO object is partition 0, while each ThinLTO object has its own
365     /// partition number from 1 onwards.
366     ///
367     /// Any global that is defined or used by more than one partition, or that
368     /// is referenced externally, may not be internalized.
369     ///
370     /// Partitions generally have a one-to-one correspondence with tasks, except
371     /// that we use partition 0 for all parallel LTO code generation partitions.
372     /// Any partitioning of the combined LTO object is done internally by the
373     /// LTO backend.
374     unsigned Partition = Unknown;
375 
376     /// Special partition numbers.
377     enum : unsigned {
378       /// A partition number has not yet been assigned to this global.
379       Unknown = -1u,
380 
381       /// This global is either used by more than one partition or has an
382       /// external reference, and therefore cannot be internalized.
383       External = -2u,
384 
385       /// The RegularLTO partition
386       RegularLTO = 0,
387     };
388   };
389 
390   // Global mapping from mangled symbol names to resolutions.
391   StringMap<GlobalResolution> GlobalResolutions;
392 
393   void addModuleToGlobalRes(ArrayRef<InputFile::Symbol> Syms,
394                             ArrayRef<SymbolResolution> Res, unsigned Partition,
395                             bool InSummary);
396 
397   // These functions take a range of symbol resolutions [ResI, ResE) and consume
398   // the resolutions used by a single input module by incrementing ResI. After
399   // these functions return, [ResI, ResE) will refer to the resolution range for
400   // the remaining modules in the InputFile.
401   Error addModule(InputFile &Input, unsigned ModI,
402                   const SymbolResolution *&ResI, const SymbolResolution *ResE);
403 
404   Expected<RegularLTOState::AddedModule>
405   addRegularLTO(BitcodeModule BM, ArrayRef<InputFile::Symbol> Syms,
406                 const SymbolResolution *&ResI, const SymbolResolution *ResE);
407   Error linkRegularLTO(RegularLTOState::AddedModule Mod,
408                        bool LivenessFromIndex);
409 
410   Error addThinLTO(BitcodeModule BM, ArrayRef<InputFile::Symbol> Syms,
411                    const SymbolResolution *&ResI, const SymbolResolution *ResE);
412 
413   Error runRegularLTO(AddStreamFn AddStream);
414   Error runThinLTO(AddStreamFn AddStream, NativeObjectCache Cache,
415                    const DenseSet<GlobalValue::GUID> &GUIDPreservedSymbols);
416 
417   Error checkPartiallySplit();
418 
419   mutable bool CalledGetMaxTasks = false;
420 
421   // Use Optional to distinguish false from not yet initialized.
422   Optional<bool> EnableSplitLTOUnit;
423 };
424 
425 /// The resolution for a symbol. The linker must provide a SymbolResolution for
426 /// each global symbol based on its internal resolution of that symbol.
427 struct SymbolResolution {
428   SymbolResolution()
429       : Prevailing(0), FinalDefinitionInLinkageUnit(0), VisibleToRegularObj(0),
430         LinkerRedefined(0) {}
431 
432   /// The linker has chosen this definition of the symbol.
433   unsigned Prevailing : 1;
434 
435   /// The definition of this symbol is unpreemptable at runtime and is known to
436   /// be in this linkage unit.
437   unsigned FinalDefinitionInLinkageUnit : 1;
438 
439   /// The definition of this symbol is visible outside of the LTO unit.
440   unsigned VisibleToRegularObj : 1;
441 
442   /// Linker redefined version of the symbol which appeared in -wrap or -defsym
443   /// linker option.
444   unsigned LinkerRedefined : 1;
445 };
446 
447 } // namespace lto
448 } // namespace llvm
449 
450 #endif
451