xref: /freebsd/contrib/llvm-project/llvm/lib/ExecutionEngine/JITLink/JITLink.cpp (revision b64c5a0ace59af62eff52bfe110a521dc73c937b)
1 //===------------- JITLink.cpp - Core Run-time JIT linker APIs ------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #include "llvm/ExecutionEngine/JITLink/JITLink.h"
10 
11 #include "llvm/ADT/StringExtras.h"
12 #include "llvm/BinaryFormat/Magic.h"
13 #include "llvm/ExecutionEngine/JITLink/COFF.h"
14 #include "llvm/ExecutionEngine/JITLink/ELF.h"
15 #include "llvm/ExecutionEngine/JITLink/MachO.h"
16 #include "llvm/ExecutionEngine/JITLink/aarch64.h"
17 #include "llvm/ExecutionEngine/JITLink/i386.h"
18 #include "llvm/ExecutionEngine/JITLink/loongarch.h"
19 #include "llvm/ExecutionEngine/JITLink/x86_64.h"
20 #include "llvm/Support/Format.h"
21 #include "llvm/Support/MemoryBuffer.h"
22 #include "llvm/Support/raw_ostream.h"
23 
24 using namespace llvm;
25 using namespace llvm::object;
26 
27 #define DEBUG_TYPE "jitlink"
28 
29 namespace {
30 
31 enum JITLinkErrorCode { GenericJITLinkError = 1 };
32 
33 // FIXME: This class is only here to support the transition to llvm::Error. It
34 // will be removed once this transition is complete. Clients should prefer to
35 // deal with the Error value directly, rather than converting to error_code.
36 class JITLinkerErrorCategory : public std::error_category {
37 public:
38   const char *name() const noexcept override { return "runtimedyld"; }
39 
40   std::string message(int Condition) const override {
41     switch (static_cast<JITLinkErrorCode>(Condition)) {
42     case GenericJITLinkError:
43       return "Generic JITLink error";
44     }
45     llvm_unreachable("Unrecognized JITLinkErrorCode");
46   }
47 };
48 
49 } // namespace
50 
51 namespace llvm {
52 namespace jitlink {
53 
54 char JITLinkError::ID = 0;
55 
56 void JITLinkError::log(raw_ostream &OS) const { OS << ErrMsg; }
57 
58 std::error_code JITLinkError::convertToErrorCode() const {
59   static JITLinkerErrorCategory TheJITLinkerErrorCategory;
60   return std::error_code(GenericJITLinkError, TheJITLinkerErrorCategory);
61 }
62 
63 const char *getGenericEdgeKindName(Edge::Kind K) {
64   switch (K) {
65   case Edge::Invalid:
66     return "INVALID RELOCATION";
67   case Edge::KeepAlive:
68     return "Keep-Alive";
69   default:
70     return "<Unrecognized edge kind>";
71   }
72 }
73 
74 const char *getLinkageName(Linkage L) {
75   switch (L) {
76   case Linkage::Strong:
77     return "strong";
78   case Linkage::Weak:
79     return "weak";
80   }
81   llvm_unreachable("Unrecognized llvm.jitlink.Linkage enum");
82 }
83 
84 const char *getScopeName(Scope S) {
85   switch (S) {
86   case Scope::Default:
87     return "default";
88   case Scope::Hidden:
89     return "hidden";
90   case Scope::Local:
91     return "local";
92   }
93   llvm_unreachable("Unrecognized llvm.jitlink.Scope enum");
94 }
95 
96 bool isCStringBlock(Block &B) {
97   if (B.getSize() == 0) // Empty blocks are not valid C-strings.
98     return false;
99 
100   // Zero-fill blocks of size one are valid empty strings.
101   if (B.isZeroFill())
102     return B.getSize() == 1;
103 
104   for (size_t I = 0; I != B.getSize() - 1; ++I)
105     if (B.getContent()[I] == '\0')
106       return false;
107 
108   return B.getContent()[B.getSize() - 1] == '\0';
109 }
110 
111 raw_ostream &operator<<(raw_ostream &OS, const Block &B) {
112   return OS << B.getAddress() << " -- " << (B.getAddress() + B.getSize())
113             << ": "
114             << "size = " << formatv("{0:x8}", B.getSize()) << ", "
115             << (B.isZeroFill() ? "zero-fill" : "content")
116             << ", align = " << B.getAlignment()
117             << ", align-ofs = " << B.getAlignmentOffset()
118             << ", section = " << B.getSection().getName();
119 }
120 
121 raw_ostream &operator<<(raw_ostream &OS, const Symbol &Sym) {
122   OS << Sym.getAddress() << " (" << (Sym.isDefined() ? "block" : "addressable")
123      << " + " << formatv("{0:x8}", Sym.getOffset())
124      << "): size: " << formatv("{0:x8}", Sym.getSize())
125      << ", linkage: " << formatv("{0:6}", getLinkageName(Sym.getLinkage()))
126      << ", scope: " << formatv("{0:8}", getScopeName(Sym.getScope())) << ", "
127      << (Sym.isLive() ? "live" : "dead") << "  -   "
128      << (Sym.hasName() ? Sym.getName() : "<anonymous symbol>");
129   return OS;
130 }
131 
132 void printEdge(raw_ostream &OS, const Block &B, const Edge &E,
133                StringRef EdgeKindName) {
134   OS << "edge@" << B.getAddress() + E.getOffset() << ": " << B.getAddress()
135      << " + " << formatv("{0:x}", E.getOffset()) << " -- " << EdgeKindName
136      << " -> ";
137 
138   auto &TargetSym = E.getTarget();
139   if (TargetSym.hasName())
140     OS << TargetSym.getName();
141   else {
142     auto &TargetBlock = TargetSym.getBlock();
143     auto &TargetSec = TargetBlock.getSection();
144     orc::ExecutorAddr SecAddress(~uint64_t(0));
145     for (auto *B : TargetSec.blocks())
146       if (B->getAddress() < SecAddress)
147         SecAddress = B->getAddress();
148 
149     orc::ExecutorAddrDiff SecDelta = TargetSym.getAddress() - SecAddress;
150     OS << TargetSym.getAddress() << " (section " << TargetSec.getName();
151     if (SecDelta)
152       OS << " + " << formatv("{0:x}", SecDelta);
153     OS << " / block " << TargetBlock.getAddress();
154     if (TargetSym.getOffset())
155       OS << " + " << formatv("{0:x}", TargetSym.getOffset());
156     OS << ")";
157   }
158 
159   if (E.getAddend() != 0)
160     OS << " + " << E.getAddend();
161 }
162 
163 Section::~Section() {
164   for (auto *Sym : Symbols)
165     Sym->~Symbol();
166   for (auto *B : Blocks)
167     B->~Block();
168 }
169 
170 Block &LinkGraph::splitBlock(Block &B, size_t SplitIndex,
171                              SplitBlockCache *Cache) {
172 
173   assert(SplitIndex > 0 && "splitBlock can not be called with SplitIndex == 0");
174 
175   // If the split point covers all of B then just return B.
176   if (SplitIndex == B.getSize())
177     return B;
178 
179   assert(SplitIndex < B.getSize() && "SplitIndex out of range");
180 
181   // Create the new block covering [ 0, SplitIndex ).
182   auto &NewBlock =
183       B.isZeroFill()
184           ? createZeroFillBlock(B.getSection(), SplitIndex, B.getAddress(),
185                                 B.getAlignment(), B.getAlignmentOffset())
186           : createContentBlock(
187                 B.getSection(), B.getContent().slice(0, SplitIndex),
188                 B.getAddress(), B.getAlignment(), B.getAlignmentOffset());
189 
190   // Modify B to cover [ SplitIndex, B.size() ).
191   B.setAddress(B.getAddress() + SplitIndex);
192   B.setContent(B.getContent().slice(SplitIndex));
193   B.setAlignmentOffset((B.getAlignmentOffset() + SplitIndex) %
194                        B.getAlignment());
195 
196   // Handle edge transfer/update.
197   {
198     // Copy edges to NewBlock (recording their iterators so that we can remove
199     // them from B), and update of Edges remaining on B.
200     std::vector<Block::edge_iterator> EdgesToRemove;
201     for (auto I = B.edges().begin(); I != B.edges().end();) {
202       if (I->getOffset() < SplitIndex) {
203         NewBlock.addEdge(*I);
204         I = B.removeEdge(I);
205       } else {
206         I->setOffset(I->getOffset() - SplitIndex);
207         ++I;
208       }
209     }
210   }
211 
212   // Handle symbol transfer/update.
213   {
214     // Initialize the symbols cache if necessary.
215     SplitBlockCache LocalBlockSymbolsCache;
216     if (!Cache)
217       Cache = &LocalBlockSymbolsCache;
218     if (*Cache == std::nullopt) {
219       *Cache = SplitBlockCache::value_type();
220       for (auto *Sym : B.getSection().symbols())
221         if (&Sym->getBlock() == &B)
222           (*Cache)->push_back(Sym);
223 
224       llvm::sort(**Cache, [](const Symbol *LHS, const Symbol *RHS) {
225         return LHS->getOffset() > RHS->getOffset();
226       });
227     }
228     auto &BlockSymbols = **Cache;
229 
230     // Transfer all symbols with offset less than SplitIndex to NewBlock.
231     while (!BlockSymbols.empty() &&
232            BlockSymbols.back()->getOffset() < SplitIndex) {
233       auto *Sym = BlockSymbols.back();
234       // If the symbol extends beyond the split, update the size to be within
235       // the new block.
236       if (Sym->getOffset() + Sym->getSize() > SplitIndex)
237         Sym->setSize(SplitIndex - Sym->getOffset());
238       Sym->setBlock(NewBlock);
239       BlockSymbols.pop_back();
240     }
241 
242     // Update offsets for all remaining symbols in B.
243     for (auto *Sym : BlockSymbols)
244       Sym->setOffset(Sym->getOffset() - SplitIndex);
245   }
246 
247   return NewBlock;
248 }
249 
250 void LinkGraph::dump(raw_ostream &OS) {
251   DenseMap<Block *, std::vector<Symbol *>> BlockSymbols;
252 
253   // Map from blocks to the symbols pointing at them.
254   for (auto *Sym : defined_symbols())
255     BlockSymbols[&Sym->getBlock()].push_back(Sym);
256 
257   // For each block, sort its symbols by something approximating
258   // relevance.
259   for (auto &KV : BlockSymbols)
260     llvm::sort(KV.second, [](const Symbol *LHS, const Symbol *RHS) {
261       if (LHS->getOffset() != RHS->getOffset())
262         return LHS->getOffset() < RHS->getOffset();
263       if (LHS->getLinkage() != RHS->getLinkage())
264         return LHS->getLinkage() < RHS->getLinkage();
265       if (LHS->getScope() != RHS->getScope())
266         return LHS->getScope() < RHS->getScope();
267       if (LHS->hasName()) {
268         if (!RHS->hasName())
269           return true;
270         return LHS->getName() < RHS->getName();
271       }
272       return false;
273     });
274 
275   for (auto &Sec : sections()) {
276     OS << "section " << Sec.getName() << ":\n\n";
277 
278     std::vector<Block *> SortedBlocks;
279     llvm::copy(Sec.blocks(), std::back_inserter(SortedBlocks));
280     llvm::sort(SortedBlocks, [](const Block *LHS, const Block *RHS) {
281       return LHS->getAddress() < RHS->getAddress();
282     });
283 
284     for (auto *B : SortedBlocks) {
285       OS << "  block " << B->getAddress()
286          << " size = " << formatv("{0:x8}", B->getSize())
287          << ", align = " << B->getAlignment()
288          << ", alignment-offset = " << B->getAlignmentOffset();
289       if (B->isZeroFill())
290         OS << ", zero-fill";
291       OS << "\n";
292 
293       auto BlockSymsI = BlockSymbols.find(B);
294       if (BlockSymsI != BlockSymbols.end()) {
295         OS << "    symbols:\n";
296         auto &Syms = BlockSymsI->second;
297         for (auto *Sym : Syms)
298           OS << "      " << *Sym << "\n";
299       } else
300         OS << "    no symbols\n";
301 
302       if (!B->edges_empty()) {
303         OS << "    edges:\n";
304         std::vector<Edge> SortedEdges;
305         llvm::copy(B->edges(), std::back_inserter(SortedEdges));
306         llvm::sort(SortedEdges, [](const Edge &LHS, const Edge &RHS) {
307           return LHS.getOffset() < RHS.getOffset();
308         });
309         for (auto &E : SortedEdges) {
310           OS << "      " << B->getFixupAddress(E) << " (block + "
311              << formatv("{0:x8}", E.getOffset()) << "), addend = ";
312           if (E.getAddend() >= 0)
313             OS << formatv("+{0:x8}", E.getAddend());
314           else
315             OS << formatv("-{0:x8}", -E.getAddend());
316           OS << ", kind = " << getEdgeKindName(E.getKind()) << ", target = ";
317           if (E.getTarget().hasName())
318             OS << E.getTarget().getName();
319           else
320             OS << "addressable@"
321                << formatv("{0:x16}", E.getTarget().getAddress()) << "+"
322                << formatv("{0:x8}", E.getTarget().getOffset());
323           OS << "\n";
324         }
325       } else
326         OS << "    no edges\n";
327       OS << "\n";
328     }
329   }
330 
331   OS << "Absolute symbols:\n";
332   if (!absolute_symbols().empty()) {
333     for (auto *Sym : absolute_symbols())
334       OS << "  " << Sym->getAddress() << ": " << *Sym << "\n";
335   } else
336     OS << "  none\n";
337 
338   OS << "\nExternal symbols:\n";
339   if (!external_symbols().empty()) {
340     for (auto *Sym : external_symbols())
341       OS << "  " << Sym->getAddress() << ": " << *Sym
342          << (Sym->isWeaklyReferenced() ? " (weakly referenced)" : "") << "\n";
343   } else
344     OS << "  none\n";
345 }
346 
347 raw_ostream &operator<<(raw_ostream &OS, const SymbolLookupFlags &LF) {
348   switch (LF) {
349   case SymbolLookupFlags::RequiredSymbol:
350     return OS << "RequiredSymbol";
351   case SymbolLookupFlags::WeaklyReferencedSymbol:
352     return OS << "WeaklyReferencedSymbol";
353   }
354   llvm_unreachable("Unrecognized lookup flags");
355 }
356 
357 void JITLinkAsyncLookupContinuation::anchor() {}
358 
359 JITLinkContext::~JITLinkContext() = default;
360 
361 bool JITLinkContext::shouldAddDefaultTargetPasses(const Triple &TT) const {
362   return true;
363 }
364 
365 LinkGraphPassFunction JITLinkContext::getMarkLivePass(const Triple &TT) const {
366   return LinkGraphPassFunction();
367 }
368 
369 Error JITLinkContext::modifyPassConfig(LinkGraph &G,
370                                        PassConfiguration &Config) {
371   return Error::success();
372 }
373 
374 Error markAllSymbolsLive(LinkGraph &G) {
375   for (auto *Sym : G.defined_symbols())
376     Sym->setLive(true);
377   return Error::success();
378 }
379 
380 Error makeTargetOutOfRangeError(const LinkGraph &G, const Block &B,
381                                 const Edge &E) {
382   std::string ErrMsg;
383   {
384     raw_string_ostream ErrStream(ErrMsg);
385     Section &Sec = B.getSection();
386     ErrStream << "In graph " << G.getName() << ", section " << Sec.getName()
387               << ": relocation target ";
388     if (E.getTarget().hasName()) {
389       ErrStream << "\"" << E.getTarget().getName() << "\"";
390     } else
391       ErrStream << E.getTarget().getBlock().getSection().getName() << " + "
392                 << formatv("{0:x}", E.getOffset());
393     ErrStream << " at address " << formatv("{0:x}", E.getTarget().getAddress())
394               << " is out of range of " << G.getEdgeKindName(E.getKind())
395               << " fixup at " << formatv("{0:x}", B.getFixupAddress(E)) << " (";
396 
397     Symbol *BestSymbolForBlock = nullptr;
398     for (auto *Sym : Sec.symbols())
399       if (&Sym->getBlock() == &B && Sym->hasName() && Sym->getOffset() == 0 &&
400           (!BestSymbolForBlock ||
401            Sym->getScope() < BestSymbolForBlock->getScope() ||
402            Sym->getLinkage() < BestSymbolForBlock->getLinkage()))
403         BestSymbolForBlock = Sym;
404 
405     if (BestSymbolForBlock)
406       ErrStream << BestSymbolForBlock->getName() << ", ";
407     else
408       ErrStream << "<anonymous block> @ ";
409 
410     ErrStream << formatv("{0:x}", B.getAddress()) << " + "
411               << formatv("{0:x}", E.getOffset()) << ")";
412   }
413   return make_error<JITLinkError>(std::move(ErrMsg));
414 }
415 
416 Error makeAlignmentError(llvm::orc::ExecutorAddr Loc, uint64_t Value, int N,
417                          const Edge &E) {
418   return make_error<JITLinkError>("0x" + llvm::utohexstr(Loc.getValue()) +
419                                   " improper alignment for relocation " +
420                                   formatv("{0:d}", E.getKind()) + ": 0x" +
421                                   llvm::utohexstr(Value) +
422                                   " is not aligned to " + Twine(N) + " bytes");
423 }
424 
425 AnonymousPointerCreator getAnonymousPointerCreator(const Triple &TT) {
426   switch (TT.getArch()) {
427   case Triple::aarch64:
428     return aarch64::createAnonymousPointer;
429   case Triple::x86_64:
430     return x86_64::createAnonymousPointer;
431   case Triple::x86:
432     return i386::createAnonymousPointer;
433   case Triple::loongarch32:
434   case Triple::loongarch64:
435     return loongarch::createAnonymousPointer;
436   default:
437     return nullptr;
438   }
439 }
440 
441 PointerJumpStubCreator getPointerJumpStubCreator(const Triple &TT) {
442   switch (TT.getArch()) {
443   case Triple::aarch64:
444     return aarch64::createAnonymousPointerJumpStub;
445   case Triple::x86_64:
446     return x86_64::createAnonymousPointerJumpStub;
447   case Triple::x86:
448     return i386::createAnonymousPointerJumpStub;
449   case Triple::loongarch32:
450   case Triple::loongarch64:
451     return loongarch::createAnonymousPointerJumpStub;
452   default:
453     return nullptr;
454   }
455 }
456 
457 Expected<std::unique_ptr<LinkGraph>>
458 createLinkGraphFromObject(MemoryBufferRef ObjectBuffer) {
459   auto Magic = identify_magic(ObjectBuffer.getBuffer());
460   switch (Magic) {
461   case file_magic::macho_object:
462     return createLinkGraphFromMachOObject(ObjectBuffer);
463   case file_magic::elf_relocatable:
464     return createLinkGraphFromELFObject(ObjectBuffer);
465   case file_magic::coff_object:
466     return createLinkGraphFromCOFFObject(ObjectBuffer);
467   default:
468     return make_error<JITLinkError>("Unsupported file format");
469   };
470 }
471 
472 std::unique_ptr<LinkGraph> absoluteSymbolsLinkGraph(const Triple &TT,
473                                                     orc::SymbolMap Symbols) {
474   unsigned PointerSize;
475   endianness Endianness =
476       TT.isLittleEndian() ? endianness::little : endianness::big;
477   switch (TT.getArch()) {
478   case Triple::aarch64:
479   case llvm::Triple::riscv64:
480   case Triple::x86_64:
481     PointerSize = 8;
482     break;
483   case llvm::Triple::arm:
484   case llvm::Triple::riscv32:
485   case llvm::Triple::x86:
486     PointerSize = 4;
487     break;
488   default:
489     llvm::report_fatal_error("unhandled target architecture");
490   }
491 
492   static std::atomic<uint64_t> Counter = {0};
493   auto Index = Counter.fetch_add(1, std::memory_order_relaxed);
494   auto G = std::make_unique<LinkGraph>(
495       "<Absolute Symbols " + std::to_string(Index) + ">", TT, PointerSize,
496       Endianness, /*GetEdgeKindName=*/nullptr);
497   for (auto &[Name, Def] : Symbols) {
498     auto &Sym =
499         G->addAbsoluteSymbol(*Name, Def.getAddress(), /*Size=*/0,
500                              Linkage::Strong, Scope::Default, /*IsLive=*/true);
501     Sym.setCallable(Def.getFlags().isCallable());
502   }
503 
504   return G;
505 }
506 
507 void link(std::unique_ptr<LinkGraph> G, std::unique_ptr<JITLinkContext> Ctx) {
508   switch (G->getTargetTriple().getObjectFormat()) {
509   case Triple::MachO:
510     return link_MachO(std::move(G), std::move(Ctx));
511   case Triple::ELF:
512     return link_ELF(std::move(G), std::move(Ctx));
513   case Triple::COFF:
514     return link_COFF(std::move(G), std::move(Ctx));
515   default:
516     Ctx->notifyFailed(make_error<JITLinkError>("Unsupported object format"));
517   };
518 }
519 
520 } // end namespace jitlink
521 } // end namespace llvm
522