xref: /freebsd/contrib/llvm-project/lld/ELF/Thunks.cpp (revision 3a56015a2f5d630910177fa79a522bb95511ccf7)
1 //===- Thunks.cpp --------------------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===---------------------------------------------------------------------===//
8 //
9 // This file contains Thunk subclasses.
10 //
11 // A thunk is a small piece of code written after an input section
12 // which is used to jump between "incompatible" functions
13 // such as MIPS PIC and non-PIC or ARM non-Thumb and Thumb functions.
14 //
15 // If a jump target is too far and its address doesn't fit to a
16 // short jump instruction, we need to create a thunk too, but we
17 // haven't supported it yet.
18 //
19 // i386 and x86-64 don't need thunks.
20 //
21 //===---------------------------------------------------------------------===//
22 
23 #include "Thunks.h"
24 #include "Config.h"
25 #include "InputFiles.h"
26 #include "InputSection.h"
27 #include "OutputSections.h"
28 #include "Symbols.h"
29 #include "SyntheticSections.h"
30 #include "Target.h"
31 #include "lld/Common/CommonLinkerContext.h"
32 #include "llvm/BinaryFormat/ELF.h"
33 #include "llvm/Support/Casting.h"
34 #include "llvm/Support/ErrorHandling.h"
35 #include "llvm/Support/MathExtras.h"
36 #include <cstdint>
37 #include <cstring>
38 
39 using namespace llvm;
40 using namespace llvm::object;
41 using namespace llvm::ELF;
42 using namespace lld;
43 using namespace lld::elf;
44 
45 namespace {
46 
47 // Base class for AArch64 thunks.
48 //
49 // An AArch64 thunk may be either short or long. A short thunk is simply a
50 // branch (B) instruction, and it may be used to call AArch64 functions when the
51 // distance from the thunk to the target is less than 128MB. Long thunks can
52 // branch to any virtual address and they are implemented in the derived
53 // classes. This class tries to create a short thunk if the target is in range,
54 // otherwise it creates a long thunk.
55 class AArch64Thunk : public Thunk {
56 public:
57   AArch64Thunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {}
58   bool getMayUseShortThunk();
59   void writeTo(uint8_t *buf) override;
60 
61 private:
62   bool mayUseShortThunk = true;
63   virtual void writeLong(uint8_t *buf) = 0;
64 };
65 
66 // AArch64 long range Thunks.
67 class AArch64ABSLongThunk final : public AArch64Thunk {
68 public:
69   AArch64ABSLongThunk(Symbol &dest, int64_t addend)
70       : AArch64Thunk(dest, addend) {}
71   uint32_t size() override { return getMayUseShortThunk() ? 4 : 16; }
72   void addSymbols(ThunkSection &isec) override;
73 
74 private:
75   void writeLong(uint8_t *buf) override;
76 };
77 
78 class AArch64ADRPThunk final : public AArch64Thunk {
79 public:
80   AArch64ADRPThunk(Symbol &dest, int64_t addend) : AArch64Thunk(dest, addend) {}
81   uint32_t size() override { return getMayUseShortThunk() ? 4 : 12; }
82   void addSymbols(ThunkSection &isec) override;
83 
84 private:
85   void writeLong(uint8_t *buf) override;
86 };
87 
88 // Base class for ARM thunks.
89 //
90 // An ARM thunk may be either short or long. A short thunk is simply a branch
91 // (B) instruction, and it may be used to call ARM functions when the distance
92 // from the thunk to the target is less than 32MB. Long thunks can branch to any
93 // virtual address and can switch between ARM and Thumb, and they are
94 // implemented in the derived classes. This class tries to create a short thunk
95 // if the target is in range, otherwise it creates a long thunk.
96 class ARMThunk : public Thunk {
97 public:
98   ARMThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {}
99 
100   bool getMayUseShortThunk();
101   uint32_t size() override { return getMayUseShortThunk() ? 4 : sizeLong(); }
102   void writeTo(uint8_t *buf) override;
103   bool isCompatibleWith(const InputSection &isec,
104                         const Relocation &rel) const override;
105 
106   // Returns the size of a long thunk.
107   virtual uint32_t sizeLong() = 0;
108 
109   // Writes a long thunk to Buf.
110   virtual void writeLong(uint8_t *buf) = 0;
111 
112 private:
113   // This field tracks whether all previously considered layouts would allow
114   // this thunk to be short. If we have ever needed a long thunk, we always
115   // create a long thunk, even if the thunk may be short given the current
116   // distance to the target. We do this because transitioning from long to short
117   // can create layout oscillations in certain corner cases which would prevent
118   // the layout from converging.
119   bool mayUseShortThunk = true;
120 };
121 
122 // Base class for Thumb-2 thunks.
123 //
124 // This class is similar to ARMThunk, but it uses the Thumb-2 B.W instruction
125 // which has a range of 16MB.
126 class ThumbThunk : public Thunk {
127 public:
128   ThumbThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {
129     alignment = 2;
130   }
131 
132   bool getMayUseShortThunk();
133   uint32_t size() override { return getMayUseShortThunk() ? 4 : sizeLong(); }
134   void writeTo(uint8_t *buf) override;
135   bool isCompatibleWith(const InputSection &isec,
136                         const Relocation &rel) const override;
137 
138   // Returns the size of a long thunk.
139   virtual uint32_t sizeLong() = 0;
140 
141   // Writes a long thunk to Buf.
142   virtual void writeLong(uint8_t *buf) = 0;
143 
144 private:
145   // See comment in ARMThunk above.
146   bool mayUseShortThunk = true;
147 };
148 
149 // Specific ARM Thunk implementations. The naming convention is:
150 // Source State, TargetState, Target Requirement, ABS or PI, Range
151 class ARMV7ABSLongThunk final : public ARMThunk {
152 public:
153   ARMV7ABSLongThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
154 
155   uint32_t sizeLong() override { return 12; }
156   void writeLong(uint8_t *buf) override;
157   void addSymbols(ThunkSection &isec) override;
158 };
159 
160 class ARMV7PILongThunk final : public ARMThunk {
161 public:
162   ARMV7PILongThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
163 
164   uint32_t sizeLong() override { return 16; }
165   void writeLong(uint8_t *buf) override;
166   void addSymbols(ThunkSection &isec) override;
167 };
168 
169 class ThumbV7ABSLongThunk final : public ThumbThunk {
170 public:
171   ThumbV7ABSLongThunk(Symbol &dest, int64_t addend)
172       : ThumbThunk(dest, addend) {}
173 
174   uint32_t sizeLong() override { return 10; }
175   void writeLong(uint8_t *buf) override;
176   void addSymbols(ThunkSection &isec) override;
177 };
178 
179 class ThumbV7PILongThunk final : public ThumbThunk {
180 public:
181   ThumbV7PILongThunk(Symbol &dest, int64_t addend) : ThumbThunk(dest, addend) {}
182 
183   uint32_t sizeLong() override { return 12; }
184   void writeLong(uint8_t *buf) override;
185   void addSymbols(ThunkSection &isec) override;
186 };
187 
188 // Implementations of Thunks for Arm v6-M. Only Thumb instructions are permitted
189 class ThumbV6MABSLongThunk final : public ThumbThunk {
190 public:
191   ThumbV6MABSLongThunk(Symbol &dest, int64_t addend)
192       : ThumbThunk(dest, addend) {}
193 
194   uint32_t sizeLong() override { return 12; }
195   void writeLong(uint8_t *buf) override;
196   void addSymbols(ThunkSection &isec) override;
197 };
198 
199 class ThumbV6MABSXOLongThunk final : public ThumbThunk {
200 public:
201   ThumbV6MABSXOLongThunk(Symbol &dest, int64_t addend)
202       : ThumbThunk(dest, addend) {}
203 
204   uint32_t sizeLong() override { return 20; }
205   void writeLong(uint8_t *buf) override;
206   void addSymbols(ThunkSection &isec) override;
207 };
208 
209 class ThumbV6MPILongThunk final : public ThumbThunk {
210 public:
211   ThumbV6MPILongThunk(Symbol &dest, int64_t addend)
212       : ThumbThunk(dest, addend) {}
213 
214   uint32_t sizeLong() override { return 16; }
215   void writeLong(uint8_t *buf) override;
216   void addSymbols(ThunkSection &isec) override;
217 };
218 
219 // Architectures v4, v5 and v6 do not support the movt/movw instructions. v5 and
220 // v6 support BLX to which BL instructions can be rewritten inline. There are no
221 // Thumb entrypoints for v5 and v6 as there is no Thumb branch instruction on
222 // these architecture that can result in a thunk.
223 
224 // LDR on v5 and v6 can switch processor state, so for v5 and v6,
225 // ARMV5LongLdrPcThunk can be used for both Arm->Arm and Arm->Thumb calls. v4
226 // can also use this thunk, but only for Arm->Arm calls.
227 class ARMV5LongLdrPcThunk final : public ARMThunk {
228 public:
229   ARMV5LongLdrPcThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
230 
231   uint32_t sizeLong() override { return 8; }
232   void writeLong(uint8_t *buf) override;
233   void addSymbols(ThunkSection &isec) override;
234 };
235 
236 // Implementations of Thunks for v4. BLX is not supported, and loads
237 // will not invoke Arm/Thumb state changes.
238 class ARMV4PILongBXThunk final : public ARMThunk {
239 public:
240   ARMV4PILongBXThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
241 
242   uint32_t sizeLong() override { return 16; }
243   void writeLong(uint8_t *buf) override;
244   void addSymbols(ThunkSection &isec) override;
245 };
246 
247 class ARMV4PILongThunk final : public ARMThunk {
248 public:
249   ARMV4PILongThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
250 
251   uint32_t sizeLong() override { return 12; }
252   void writeLong(uint8_t *buf) override;
253   void addSymbols(ThunkSection &isec) override;
254 };
255 
256 class ThumbV4PILongBXThunk final : public ThumbThunk {
257 public:
258   ThumbV4PILongBXThunk(Symbol &dest, int64_t addend)
259       : ThumbThunk(dest, addend) {}
260 
261   uint32_t sizeLong() override { return 16; }
262   void writeLong(uint8_t *buf) override;
263   void addSymbols(ThunkSection &isec) override;
264 };
265 
266 class ThumbV4PILongThunk final : public ThumbThunk {
267 public:
268   ThumbV4PILongThunk(Symbol &dest, int64_t addend)
269       : ThumbThunk(dest, addend) {}
270 
271   uint32_t sizeLong() override { return 20; }
272   void writeLong(uint8_t *buf) override;
273   void addSymbols(ThunkSection &isec) override;
274 };
275 
276 class ARMV4ABSLongBXThunk final : public ARMThunk {
277 public:
278   ARMV4ABSLongBXThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {}
279 
280   uint32_t sizeLong() override { return 12; }
281   void writeLong(uint8_t *buf) override;
282   void addSymbols(ThunkSection &isec) override;
283 };
284 
285 class ThumbV4ABSLongBXThunk final : public ThumbThunk {
286 public:
287   ThumbV4ABSLongBXThunk(Symbol &dest, int64_t addend)
288       : ThumbThunk(dest, addend) {}
289 
290   uint32_t sizeLong() override { return 12; }
291   void writeLong(uint8_t *buf) override;
292   void addSymbols(ThunkSection &isec) override;
293 };
294 
295 class ThumbV4ABSLongThunk final : public ThumbThunk {
296 public:
297   ThumbV4ABSLongThunk(Symbol &dest, int64_t addend)
298       : ThumbThunk(dest, addend) {}
299 
300   uint32_t sizeLong() override { return 16; }
301   void writeLong(uint8_t *buf) override;
302   void addSymbols(ThunkSection &isec) override;
303 };
304 
305 // The AVR devices need thunks for R_AVR_LO8_LDI_GS/R_AVR_HI8_LDI_GS
306 // when their destination is out of range [0, 0x1ffff].
307 class AVRThunk : public Thunk {
308 public:
309   AVRThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {}
310   uint32_t size() override { return 4; }
311   void writeTo(uint8_t *buf) override;
312   void addSymbols(ThunkSection &isec) override;
313 };
314 
315 // MIPS LA25 thunk
316 class MipsThunk final : public Thunk {
317 public:
318   MipsThunk(Symbol &dest) : Thunk(dest, 0) {}
319 
320   uint32_t size() override { return 16; }
321   void writeTo(uint8_t *buf) override;
322   void addSymbols(ThunkSection &isec) override;
323   InputSection *getTargetInputSection() const override;
324 };
325 
326 // microMIPS R2-R5 LA25 thunk
327 class MicroMipsThunk final : public Thunk {
328 public:
329   MicroMipsThunk(Symbol &dest) : Thunk(dest, 0) {}
330 
331   uint32_t size() override { return 14; }
332   void writeTo(uint8_t *buf) override;
333   void addSymbols(ThunkSection &isec) override;
334   InputSection *getTargetInputSection() const override;
335 };
336 
337 // microMIPS R6 LA25 thunk
338 class MicroMipsR6Thunk final : public Thunk {
339 public:
340   MicroMipsR6Thunk(Symbol &dest) : Thunk(dest, 0) {}
341 
342   uint32_t size() override { return 12; }
343   void writeTo(uint8_t *buf) override;
344   void addSymbols(ThunkSection &isec) override;
345   InputSection *getTargetInputSection() const override;
346 };
347 
348 class PPC32PltCallStub final : public Thunk {
349 public:
350   // For R_PPC_PLTREL24, Thunk::addend records the addend which will be used to
351   // decide the offsets in the call stub.
352   PPC32PltCallStub(const InputSection &isec, const Relocation &rel,
353                    Symbol &dest)
354       : Thunk(dest, rel.addend), file(isec.file) {}
355   uint32_t size() override { return 16; }
356   void writeTo(uint8_t *buf) override;
357   void addSymbols(ThunkSection &isec) override;
358   bool isCompatibleWith(const InputSection &isec, const Relocation &rel) const override;
359 
360 private:
361   // Records the call site of the call stub.
362   const InputFile *file;
363 };
364 
365 class PPC32LongThunk final : public Thunk {
366 public:
367   PPC32LongThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {}
368   uint32_t size() override { return config->isPic ? 32 : 16; }
369   void writeTo(uint8_t *buf) override;
370   void addSymbols(ThunkSection &isec) override;
371 };
372 
373 // PPC64 Plt call stubs.
374 // Any call site that needs to call through a plt entry needs a call stub in
375 // the .text section. The call stub is responsible for:
376 // 1) Saving the toc-pointer to the stack.
377 // 2) Loading the target functions address from the procedure linkage table into
378 //    r12 for use by the target functions global entry point, and into the count
379 //    register.
380 // 3) Transferring control to the target function through an indirect branch.
381 class PPC64PltCallStub final : public Thunk {
382 public:
383   PPC64PltCallStub(Symbol &dest) : Thunk(dest, 0) {}
384   uint32_t size() override { return 20; }
385   void writeTo(uint8_t *buf) override;
386   void addSymbols(ThunkSection &isec) override;
387   bool isCompatibleWith(const InputSection &isec,
388                         const Relocation &rel) const override;
389 };
390 
391 // PPC64 R2 Save Stub
392 // When the caller requires a valid R2 TOC pointer but the callee does not
393 // require a TOC pointer and the callee cannot guarantee that it doesn't
394 // clobber R2 then we need to save R2. This stub:
395 // 1) Saves the TOC pointer to the stack.
396 // 2) Tail calls the callee.
397 class PPC64R2SaveStub final : public Thunk {
398 public:
399   PPC64R2SaveStub(Symbol &dest, int64_t addend) : Thunk(dest, addend) {
400     alignment = 16;
401   }
402 
403   // To prevent oscillations in layout when moving from short to long thunks
404   // we make sure that once a thunk has been set to long it cannot go back.
405   bool getMayUseShortThunk() {
406     if (!mayUseShortThunk)
407       return false;
408     if (!isInt<26>(computeOffset())) {
409       mayUseShortThunk = false;
410       return false;
411     }
412     return true;
413   }
414   uint32_t size() override { return getMayUseShortThunk() ? 8 : 32; }
415   void writeTo(uint8_t *buf) override;
416   void addSymbols(ThunkSection &isec) override;
417   bool isCompatibleWith(const InputSection &isec,
418                         const Relocation &rel) const override;
419 
420 private:
421   // Transitioning from long to short can create layout oscillations in
422   // certain corner cases which would prevent the layout from converging.
423   // This is similar to the handling for ARMThunk.
424   bool mayUseShortThunk = true;
425   int64_t computeOffset() const {
426     return destination.getVA() - (getThunkTargetSym()->getVA() + 4);
427   }
428 };
429 
430 // PPC64 R12 Setup Stub
431 // When a caller that does not maintain TOC calls a target which may possibly
432 // use TOC (either non-preemptible with localentry>1 or preemptible), we need to
433 // set r12 to satisfy the requirement of the global entry point.
434 class PPC64R12SetupStub final : public Thunk {
435 public:
436   PPC64R12SetupStub(Symbol &dest, bool gotPlt)
437       : Thunk(dest, 0), gotPlt(gotPlt) {
438     alignment = 16;
439   }
440   uint32_t size() override { return 32; }
441   void writeTo(uint8_t *buf) override;
442   void addSymbols(ThunkSection &isec) override;
443   bool isCompatibleWith(const InputSection &isec,
444                         const Relocation &rel) const override;
445 
446 private:
447   bool gotPlt;
448 };
449 
450 // A bl instruction uses a signed 24 bit offset, with an implicit 4 byte
451 // alignment. This gives a possible 26 bits of 'reach'. If the call offset is
452 // larger than that we need to emit a long-branch thunk. The target address
453 // of the callee is stored in a table to be accessed TOC-relative. Since the
454 // call must be local (a non-local call will have a PltCallStub instead) the
455 // table stores the address of the callee's local entry point. For
456 // position-independent code a corresponding relative dynamic relocation is
457 // used.
458 class PPC64LongBranchThunk : public Thunk {
459 public:
460   uint32_t size() override { return 32; }
461   void writeTo(uint8_t *buf) override;
462   void addSymbols(ThunkSection &isec) override;
463   bool isCompatibleWith(const InputSection &isec,
464                         const Relocation &rel) const override;
465 
466 protected:
467   PPC64LongBranchThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {}
468 };
469 
470 class PPC64PILongBranchThunk final : public PPC64LongBranchThunk {
471 public:
472   PPC64PILongBranchThunk(Symbol &dest, int64_t addend)
473       : PPC64LongBranchThunk(dest, addend) {
474     assert(!dest.isPreemptible);
475     if (std::optional<uint32_t> index =
476             in.ppc64LongBranchTarget->addEntry(&dest, addend)) {
477       mainPart->relaDyn->addRelativeReloc(
478           target->relativeRel, *in.ppc64LongBranchTarget, *index * UINT64_C(8),
479           dest, addend + getPPC64GlobalEntryToLocalEntryOffset(dest.stOther),
480           target->symbolicRel, R_ABS);
481     }
482   }
483 };
484 
485 class PPC64PDLongBranchThunk final : public PPC64LongBranchThunk {
486 public:
487   PPC64PDLongBranchThunk(Symbol &dest, int64_t addend)
488       : PPC64LongBranchThunk(dest, addend) {
489     in.ppc64LongBranchTarget->addEntry(&dest, addend);
490   }
491 };
492 
493 } // end anonymous namespace
494 
495 Defined *Thunk::addSymbol(StringRef name, uint8_t type, uint64_t value,
496                           InputSectionBase &section) {
497   Defined *d = addSyntheticLocal(name, type, value, /*size=*/0, section);
498   syms.push_back(d);
499   return d;
500 }
501 
502 void Thunk::setOffset(uint64_t newOffset) {
503   for (Defined *d : syms)
504     d->value = d->value - offset + newOffset;
505   offset = newOffset;
506 }
507 
508 // AArch64 Thunk base class.
509 static uint64_t getAArch64ThunkDestVA(const Symbol &s, int64_t a) {
510   uint64_t v = s.isInPlt() ? s.getPltVA() : s.getVA(a);
511   return v;
512 }
513 
514 bool AArch64Thunk::getMayUseShortThunk() {
515   if (!mayUseShortThunk)
516     return false;
517   uint64_t s = getAArch64ThunkDestVA(destination, addend);
518   uint64_t p = getThunkTargetSym()->getVA();
519   mayUseShortThunk = llvm::isInt<28>(s - p);
520   return mayUseShortThunk;
521 }
522 
523 void AArch64Thunk::writeTo(uint8_t *buf) {
524   if (!getMayUseShortThunk()) {
525     writeLong(buf);
526     return;
527   }
528   uint64_t s = getAArch64ThunkDestVA(destination, addend);
529   uint64_t p = getThunkTargetSym()->getVA();
530   write32(buf, 0x14000000); // b S
531   target->relocateNoSym(buf, R_AARCH64_CALL26, s - p);
532 }
533 
534 // AArch64 long range Thunks.
535 void AArch64ABSLongThunk::writeLong(uint8_t *buf) {
536   const uint8_t data[] = {
537     0x50, 0x00, 0x00, 0x58, //     ldr x16, L0
538     0x00, 0x02, 0x1f, 0xd6, //     br  x16
539     0x00, 0x00, 0x00, 0x00, // L0: .xword S
540     0x00, 0x00, 0x00, 0x00,
541   };
542   uint64_t s = getAArch64ThunkDestVA(destination, addend);
543   memcpy(buf, data, sizeof(data));
544   target->relocateNoSym(buf + 8, R_AARCH64_ABS64, s);
545 }
546 
547 void AArch64ABSLongThunk::addSymbols(ThunkSection &isec) {
548   addSymbol(saver().save("__AArch64AbsLongThunk_" + destination.getName()),
549             STT_FUNC, 0, isec);
550   addSymbol("$x", STT_NOTYPE, 0, isec);
551   if (!getMayUseShortThunk())
552     addSymbol("$d", STT_NOTYPE, 8, isec);
553 }
554 
555 // This Thunk has a maximum range of 4Gb, this is sufficient for all programs
556 // using the small code model, including pc-relative ones. At time of writing
557 // clang and gcc do not support the large code model for position independent
558 // code so it is safe to use this for position independent thunks without
559 // worrying about the destination being more than 4Gb away.
560 void AArch64ADRPThunk::writeLong(uint8_t *buf) {
561   const uint8_t data[] = {
562       0x10, 0x00, 0x00, 0x90, // adrp x16, Dest R_AARCH64_ADR_PREL_PG_HI21(Dest)
563       0x10, 0x02, 0x00, 0x91, // add  x16, x16, R_AARCH64_ADD_ABS_LO12_NC(Dest)
564       0x00, 0x02, 0x1f, 0xd6, // br   x16
565   };
566   uint64_t s = getAArch64ThunkDestVA(destination, addend);
567   uint64_t p = getThunkTargetSym()->getVA();
568   memcpy(buf, data, sizeof(data));
569   target->relocateNoSym(buf, R_AARCH64_ADR_PREL_PG_HI21,
570                         getAArch64Page(s) - getAArch64Page(p));
571   target->relocateNoSym(buf + 4, R_AARCH64_ADD_ABS_LO12_NC, s);
572 }
573 
574 void AArch64ADRPThunk::addSymbols(ThunkSection &isec) {
575   addSymbol(saver().save("__AArch64ADRPThunk_" + destination.getName()),
576             STT_FUNC, 0, isec);
577   addSymbol("$x", STT_NOTYPE, 0, isec);
578 }
579 
580 // ARM Target Thunks
581 static uint64_t getARMThunkDestVA(const Symbol &s) {
582   uint64_t v = s.isInPlt() ? s.getPltVA() : s.getVA();
583   return SignExtend64<32>(v);
584 }
585 
586 // This function returns true if the target is not Thumb and is within 2^26, and
587 // it has not previously returned false (see comment for mayUseShortThunk).
588 bool ARMThunk::getMayUseShortThunk() {
589   if (!mayUseShortThunk)
590     return false;
591   uint64_t s = getARMThunkDestVA(destination);
592   if (s & 1) {
593     mayUseShortThunk = false;
594     return false;
595   }
596   uint64_t p = getThunkTargetSym()->getVA();
597   int64_t offset = s - p - 8;
598   mayUseShortThunk = llvm::isInt<26>(offset);
599   return mayUseShortThunk;
600 }
601 
602 void ARMThunk::writeTo(uint8_t *buf) {
603   if (!getMayUseShortThunk()) {
604     writeLong(buf);
605     return;
606   }
607 
608   uint64_t s = getARMThunkDestVA(destination);
609   uint64_t p = getThunkTargetSym()->getVA();
610   int64_t offset = s - p - 8;
611   write32(buf, 0xea000000); // b S
612   target->relocateNoSym(buf, R_ARM_JUMP24, offset);
613 }
614 
615 bool ARMThunk::isCompatibleWith(const InputSection &isec,
616                                 const Relocation &rel) const {
617   // v4T does not have BLX, so also deny R_ARM_THM_CALL
618   if (!config->armHasBlx && rel.type == R_ARM_THM_CALL)
619     return false;
620 
621   // Thumb branch relocations can't use BLX
622   return rel.type != R_ARM_THM_JUMP19 && rel.type != R_ARM_THM_JUMP24;
623 }
624 
625 // This function returns true if:
626 // the target is Thumb
627 // && is within branch range
628 // && this function has not previously returned false
629 //    (see comment for mayUseShortThunk)
630 // && the arch supports Thumb branch range extension.
631 bool ThumbThunk::getMayUseShortThunk() {
632   if (!mayUseShortThunk || !config->armJ1J2BranchEncoding)
633     return false;
634   uint64_t s = getARMThunkDestVA(destination);
635   if ((s & 1) == 0) {
636     mayUseShortThunk = false;
637     return false;
638   }
639   uint64_t p = getThunkTargetSym()->getVA() & ~1;
640   int64_t offset = s - p - 4;
641   mayUseShortThunk = llvm::isInt<25>(offset);
642   return mayUseShortThunk;
643 }
644 
645 void ThumbThunk::writeTo(uint8_t *buf) {
646   if (!getMayUseShortThunk()) {
647     writeLong(buf);
648     return;
649   }
650 
651   uint64_t s = getARMThunkDestVA(destination);
652   uint64_t p = getThunkTargetSym()->getVA();
653   int64_t offset = s - p - 4;
654   write16(buf + 0, 0xf000); // b.w S
655   write16(buf + 2, 0xb000);
656   target->relocateNoSym(buf, R_ARM_THM_JUMP24, offset);
657 }
658 
659 bool ThumbThunk::isCompatibleWith(const InputSection &isec,
660                                   const Relocation &rel) const {
661   // v4T does not have BLX, so also deny R_ARM_CALL
662   if (!config->armHasBlx && rel.type == R_ARM_CALL)
663     return false;
664 
665   // ARM branch relocations can't use BLX
666   return rel.type != R_ARM_JUMP24 && rel.type != R_ARM_PC24 && rel.type != R_ARM_PLT32;
667 }
668 
669 void ARMV7ABSLongThunk::writeLong(uint8_t *buf) {
670   write32(buf + 0, 0xe300c000); // movw ip,:lower16:S
671   write32(buf + 4, 0xe340c000); // movt ip,:upper16:S
672   write32(buf + 8, 0xe12fff1c); // bx   ip
673   uint64_t s = getARMThunkDestVA(destination);
674   target->relocateNoSym(buf, R_ARM_MOVW_ABS_NC, s);
675   target->relocateNoSym(buf + 4, R_ARM_MOVT_ABS, s);
676 }
677 
678 void ARMV7ABSLongThunk::addSymbols(ThunkSection &isec) {
679   addSymbol(saver().save("__ARMv7ABSLongThunk_" + destination.getName()),
680             STT_FUNC, 0, isec);
681   addSymbol("$a", STT_NOTYPE, 0, isec);
682 }
683 
684 void ThumbV7ABSLongThunk::writeLong(uint8_t *buf) {
685   write16(buf + 0, 0xf240); // movw ip, :lower16:S
686   write16(buf + 2, 0x0c00);
687   write16(buf + 4, 0xf2c0); // movt ip, :upper16:S
688   write16(buf + 6, 0x0c00);
689   write16(buf + 8, 0x4760); // bx   ip
690   uint64_t s = getARMThunkDestVA(destination);
691   target->relocateNoSym(buf, R_ARM_THM_MOVW_ABS_NC, s);
692   target->relocateNoSym(buf + 4, R_ARM_THM_MOVT_ABS, s);
693 }
694 
695 void ThumbV7ABSLongThunk::addSymbols(ThunkSection &isec) {
696   addSymbol(saver().save("__Thumbv7ABSLongThunk_" + destination.getName()),
697             STT_FUNC, 1, isec);
698   addSymbol("$t", STT_NOTYPE, 0, isec);
699 }
700 
701 void ARMV7PILongThunk::writeLong(uint8_t *buf) {
702   write32(buf + 0, 0xe30fcff0);   // P:  movw ip,:lower16:S - (P + (L1-P) + 8)
703   write32(buf + 4, 0xe340c000);   //     movt ip,:upper16:S - (P + (L1-P) + 8)
704   write32(buf + 8, 0xe08cc00f);   // L1: add  ip, ip, pc
705   write32(buf + 12, 0xe12fff1c);  //     bx   ip
706   uint64_t s = getARMThunkDestVA(destination);
707   uint64_t p = getThunkTargetSym()->getVA();
708   int64_t offset = s - p - 16;
709   target->relocateNoSym(buf, R_ARM_MOVW_PREL_NC, offset);
710   target->relocateNoSym(buf + 4, R_ARM_MOVT_PREL, offset);
711 }
712 
713 void ARMV7PILongThunk::addSymbols(ThunkSection &isec) {
714   addSymbol(saver().save("__ARMV7PILongThunk_" + destination.getName()),
715             STT_FUNC, 0, isec);
716   addSymbol("$a", STT_NOTYPE, 0, isec);
717 }
718 
719 void ThumbV7PILongThunk::writeLong(uint8_t *buf) {
720   write16(buf + 0, 0xf64f);   // P:  movw ip,:lower16:S - (P + (L1-P) + 4)
721   write16(buf + 2, 0x7cf4);
722   write16(buf + 4, 0xf2c0);   //     movt ip,:upper16:S - (P + (L1-P) + 4)
723   write16(buf + 6, 0x0c00);
724   write16(buf + 8, 0x44fc);   // L1: add  ip, pc
725   write16(buf + 10, 0x4760);  //     bx   ip
726   uint64_t s = getARMThunkDestVA(destination);
727   uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
728   int64_t offset = s - p - 12;
729   target->relocateNoSym(buf, R_ARM_THM_MOVW_PREL_NC, offset);
730   target->relocateNoSym(buf + 4, R_ARM_THM_MOVT_PREL, offset);
731 }
732 
733 void ThumbV7PILongThunk::addSymbols(ThunkSection &isec) {
734   addSymbol(saver().save("__ThumbV7PILongThunk_" + destination.getName()),
735             STT_FUNC, 1, isec);
736   addSymbol("$t", STT_NOTYPE, 0, isec);
737 }
738 
739 void ThumbV6MABSLongThunk::writeLong(uint8_t *buf) {
740   // Most Thumb instructions cannot access the high registers r8 - r15. As the
741   // only register we can corrupt is r12 we must instead spill a low register
742   // to the stack to use as a scratch register. We push r1 even though we
743   // don't need to get some space to use for the return address.
744   write16(buf + 0, 0xb403);   // push {r0, r1} ; Obtain scratch registers
745   write16(buf + 2, 0x4801);   // ldr r0, [pc, #4] ; L1
746   write16(buf + 4, 0x9001);   // str r0, [sp, #4] ; SP + 4 = S
747   write16(buf + 6, 0xbd01);   // pop {r0, pc} ; restore r0 and branch to dest
748   write32(buf + 8, 0x00000000);   // L1: .word S
749   uint64_t s = getARMThunkDestVA(destination);
750   target->relocateNoSym(buf + 8, R_ARM_ABS32, s);
751 }
752 
753 void ThumbV6MABSLongThunk::addSymbols(ThunkSection &isec) {
754   addSymbol(saver().save("__Thumbv6MABSLongThunk_" + destination.getName()),
755             STT_FUNC, 1, isec);
756   addSymbol("$t", STT_NOTYPE, 0, isec);
757   if (!getMayUseShortThunk())
758     addSymbol("$d", STT_NOTYPE, 8, isec);
759 }
760 
761 void ThumbV6MABSXOLongThunk::writeLong(uint8_t *buf) {
762   // Most Thumb instructions cannot access the high registers r8 - r15. As the
763   // only register we can corrupt is r12 we must instead spill a low register
764   // to the stack to use as a scratch register. We push r1 even though we
765   // don't need to get some space to use for the return address.
766   write16(buf + 0, 0xb403);  // push {r0, r1} ; Obtain scratch registers
767   write16(buf + 2, 0x2000);  // movs r0, :upper8_15:S
768   write16(buf + 4, 0x0200);  // lsls r0, r0, #8
769   write16(buf + 6, 0x3000);  // adds r0, :upper0_7:S
770   write16(buf + 8, 0x0200);  // lsls r0, r0, #8
771   write16(buf + 10, 0x3000); // adds r0, :lower8_15:S
772   write16(buf + 12, 0x0200); // lsls r0, r0, #8
773   write16(buf + 14, 0x3000); // adds r0, :lower0_7:S
774   write16(buf + 16, 0x9001); // str r0, [sp, #4] ; SP + 4 = S
775   write16(buf + 18, 0xbd01); // pop {r0, pc} ; restore r0 and branch to dest
776   uint64_t s = getARMThunkDestVA(destination);
777   target->relocateNoSym(buf + 2, R_ARM_THM_ALU_ABS_G3, s);
778   target->relocateNoSym(buf + 6, R_ARM_THM_ALU_ABS_G2_NC, s);
779   target->relocateNoSym(buf + 10, R_ARM_THM_ALU_ABS_G1_NC, s);
780   target->relocateNoSym(buf + 14, R_ARM_THM_ALU_ABS_G0_NC, s);
781 }
782 
783 void ThumbV6MABSXOLongThunk::addSymbols(ThunkSection &isec) {
784   addSymbol(saver().save("__Thumbv6MABSXOLongThunk_" + destination.getName()),
785             STT_FUNC, 1, isec);
786   addSymbol("$t", STT_NOTYPE, 0, isec);
787 }
788 
789 void ThumbV6MPILongThunk::writeLong(uint8_t *buf) {
790   // Most Thumb instructions cannot access the high registers r8 - r15. As the
791   // only register we can corrupt is ip (r12) we must instead spill a low
792   // register to the stack to use as a scratch register.
793   write16(buf + 0, 0xb401);   // P:  push {r0}        ; Obtain scratch register
794   write16(buf + 2, 0x4802);   //     ldr r0, [pc, #8] ; L2
795   write16(buf + 4, 0x4684);   //     mov ip, r0       ; high to low register
796   write16(buf + 6, 0xbc01);   //     pop {r0}         ; restore scratch register
797   write16(buf + 8, 0x44e7);   // L1: add pc, ip       ; transfer control
798   write16(buf + 10, 0x46c0);  //     nop              ; pad to 4-byte boundary
799   write32(buf + 12, 0x00000000);  // L2: .word S - (P + (L1 - P) + 4)
800   uint64_t s = getARMThunkDestVA(destination);
801   uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
802   target->relocateNoSym(buf + 12, R_ARM_REL32, s - p - 12);
803 }
804 
805 void ThumbV6MPILongThunk::addSymbols(ThunkSection &isec) {
806   addSymbol(saver().save("__Thumbv6MPILongThunk_" + destination.getName()),
807             STT_FUNC, 1, isec);
808   addSymbol("$t", STT_NOTYPE, 0, isec);
809   if (!getMayUseShortThunk())
810     addSymbol("$d", STT_NOTYPE, 12, isec);
811 }
812 
813 void ARMV5LongLdrPcThunk::writeLong(uint8_t *buf) {
814   write32(buf + 0, 0xe51ff004); // ldr pc, [pc,#-4] ; L1
815   write32(buf + 4, 0x00000000); // L1: .word S
816   target->relocateNoSym(buf + 4, R_ARM_ABS32, getARMThunkDestVA(destination));
817 }
818 
819 void ARMV5LongLdrPcThunk::addSymbols(ThunkSection &isec) {
820   addSymbol(saver().save("__ARMv5LongLdrPcThunk_" + destination.getName()),
821             STT_FUNC, 0, isec);
822   addSymbol("$a", STT_NOTYPE, 0, isec);
823   if (!getMayUseShortThunk())
824     addSymbol("$d", STT_NOTYPE, 4, isec);
825 }
826 
827 void ARMV4ABSLongBXThunk::writeLong(uint8_t *buf) {
828   write32(buf + 0, 0xe59fc000); // ldr r12, [pc] ; L1
829   write32(buf + 4, 0xe12fff1c); // bx r12
830   write32(buf + 8, 0x00000000); // L1: .word S
831   target->relocateNoSym(buf + 8, R_ARM_ABS32, getARMThunkDestVA(destination));
832 }
833 
834 void ARMV4ABSLongBXThunk::addSymbols(ThunkSection &isec) {
835   addSymbol(saver().save("__ARMv4ABSLongBXThunk_" + destination.getName()),
836             STT_FUNC, 0, isec);
837   addSymbol("$a", STT_NOTYPE, 0, isec);
838   if (!getMayUseShortThunk())
839     addSymbol("$d", STT_NOTYPE, 8, isec);
840 }
841 
842 void ThumbV4ABSLongBXThunk::writeLong(uint8_t *buf) {
843   write16(buf + 0, 0x4778); // bx pc
844   write16(buf + 2, 0xe7fd); // b #-6 ; Arm recommended sequence to follow bx pc
845   write32(buf + 4, 0xe51ff004); // ldr pc, [pc, #-4] ; L1
846   write32(buf + 8, 0x00000000); // L1: .word S
847   target->relocateNoSym(buf + 8, R_ARM_ABS32, getARMThunkDestVA(destination));
848 }
849 
850 void ThumbV4ABSLongBXThunk::addSymbols(ThunkSection &isec) {
851   addSymbol(saver().save("__Thumbv4ABSLongBXThunk_" + destination.getName()),
852             STT_FUNC, 1, isec);
853   addSymbol("$t", STT_NOTYPE, 0, isec);
854   addSymbol("$a", STT_NOTYPE, 4, isec);
855   if (!getMayUseShortThunk())
856     addSymbol("$d", STT_NOTYPE, 8, isec);
857 }
858 
859 void ThumbV4ABSLongThunk::writeLong(uint8_t *buf) {
860   write16(buf + 0, 0x4778); // bx pc
861   write16(buf + 2, 0xe7fd); // b #-6 ; Arm recommended sequence to follow bx pc
862   write32(buf + 4, 0xe59fc000); // ldr r12, [pc] ; L1
863   write32(buf + 8, 0xe12fff1c); // bx r12
864   write32(buf + 12, 0x00000000); // L1: .word S
865   target->relocateNoSym(buf + 12, R_ARM_ABS32, getARMThunkDestVA(destination));
866 }
867 
868 void ThumbV4ABSLongThunk::addSymbols(ThunkSection &isec) {
869   addSymbol(saver().save("__Thumbv4ABSLongThunk_" + destination.getName()),
870             STT_FUNC, 1, isec);
871   addSymbol("$t", STT_NOTYPE, 0, isec);
872   addSymbol("$a", STT_NOTYPE, 4, isec);
873   if (!getMayUseShortThunk())
874     addSymbol("$d", STT_NOTYPE, 12, isec);
875 }
876 
877 void ARMV4PILongBXThunk::writeLong(uint8_t *buf) {
878   write32(buf + 0, 0xe59fc004); // P:  ldr ip, [pc,#4] ; L2
879   write32(buf + 4, 0xe08fc00c);	// L1: add ip, pc, ip
880   write32(buf + 8, 0xe12fff1c);	//     bx ip
881   write32(buf + 12, 0x00000000); // L2: .word S - (P + (L1 - P) + 8)
882   uint64_t s = getARMThunkDestVA(destination);
883   uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
884   target->relocateNoSym(buf + 12, R_ARM_REL32, s - p - 12);
885 }
886 
887 void ARMV4PILongBXThunk::addSymbols(ThunkSection &isec) {
888   addSymbol(saver().save("__ARMv4PILongBXThunk_" + destination.getName()),
889             STT_FUNC, 0, isec);
890   addSymbol("$a", STT_NOTYPE, 0, isec);
891   if (!getMayUseShortThunk())
892     addSymbol("$d", STT_NOTYPE, 12, isec);
893 }
894 
895 void ARMV4PILongThunk::writeLong(uint8_t *buf) {
896   write32(buf + 0, 0xe59fc000); // P:  ldr ip, [pc] ; L2
897   write32(buf + 4, 0xe08ff00c); // L1: add pc, pc, r12
898   write32(buf + 8, 0x00000000); // L2: .word S - (P + (L1 - P) + 8)
899   uint64_t s = getARMThunkDestVA(destination);
900   uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
901   target->relocateNoSym(buf + 8, R_ARM_REL32, s - p - 12);
902 }
903 
904 void ARMV4PILongThunk::addSymbols(ThunkSection &isec) {
905   addSymbol(saver().save("__ARMv4PILongThunk_" + destination.getName()),
906             STT_FUNC, 0, isec);
907   addSymbol("$a", STT_NOTYPE, 0, isec);
908   if (!getMayUseShortThunk())
909     addSymbol("$d", STT_NOTYPE, 8, isec);
910 }
911 
912 void ThumbV4PILongBXThunk::writeLong(uint8_t *buf) {
913   write16(buf + 0, 0x4778); // P:  bx pc
914   write16(buf + 2, 0xe7fd); //     b #-6 ; Arm recommended sequence to follow bx pc
915   write32(buf + 4, 0xe59fc000); //     ldr r12, [pc] ; L2
916   write32(buf + 8, 0xe08cf00f); // L1: add pc, r12, pc
917   write32(buf + 12, 0x00000000); // L2: .word S - (P + (L1 - P) + 8)
918   uint64_t s = getARMThunkDestVA(destination);
919   uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
920   target->relocateNoSym(buf + 12, R_ARM_REL32, s - p - 16);
921 }
922 
923 void ThumbV4PILongBXThunk::addSymbols(ThunkSection &isec) {
924   addSymbol(saver().save("__Thumbv4PILongBXThunk_" + destination.getName()),
925             STT_FUNC, 1, isec);
926   addSymbol("$t", STT_NOTYPE, 0, isec);
927   addSymbol("$a", STT_NOTYPE, 4, isec);
928   if (!getMayUseShortThunk())
929     addSymbol("$d", STT_NOTYPE, 12, isec);
930 }
931 
932 void ThumbV4PILongThunk::writeLong(uint8_t *buf) {
933   write16(buf + 0, 0x4778); // P:  bx pc
934   write16(buf + 2, 0xe7fd); //     b #-6 ; Arm recommended sequence to follow bx pc
935   write32(buf + 4, 0xe59fc004); //     ldr ip, [pc,#4] ; L2
936   write32(buf + 8, 0xe08fc00c); // L1: add ip, pc, ip
937   write32(buf + 12, 0xe12fff1c); //     bx ip
938   write32(buf + 16, 0x00000000); // L2: .word S - (P + (L1 - P) + 8)
939   uint64_t s = getARMThunkDestVA(destination);
940   uint64_t p = getThunkTargetSym()->getVA() & ~0x1;
941   target->relocateNoSym(buf + 16, R_ARM_REL32, s - p - 16);
942 }
943 
944 void ThumbV4PILongThunk::addSymbols(ThunkSection &isec) {
945   addSymbol(saver().save("__Thumbv4PILongThunk_" + destination.getName()),
946             STT_FUNC, 1, isec);
947   addSymbol("$t", STT_NOTYPE, 0, isec);
948   addSymbol("$a", STT_NOTYPE, 4, isec);
949   if (!getMayUseShortThunk())
950     addSymbol("$d", STT_NOTYPE, 16, isec);
951 }
952 
953 // Use the long jump which covers a range up to 8MiB.
954 void AVRThunk::writeTo(uint8_t *buf) {
955   write32(buf, 0x940c); // jmp func
956   target->relocateNoSym(buf, R_AVR_CALL, destination.getVA());
957 }
958 
959 void AVRThunk::addSymbols(ThunkSection &isec) {
960   addSymbol(saver().save("__AVRThunk_" + destination.getName()), STT_FUNC, 0,
961             isec);
962 }
963 
964 // Write MIPS LA25 thunk code to call PIC function from the non-PIC one.
965 void MipsThunk::writeTo(uint8_t *buf) {
966   uint64_t s = destination.getVA();
967   write32(buf, 0x3c190000); // lui   $25, %hi(func)
968   write32(buf + 4, 0x08000000 | (s >> 2)); // j     func
969   write32(buf + 8, 0x27390000); // addiu $25, $25, %lo(func)
970   write32(buf + 12, 0x00000000); // nop
971   target->relocateNoSym(buf, R_MIPS_HI16, s);
972   target->relocateNoSym(buf + 8, R_MIPS_LO16, s);
973 }
974 
975 void MipsThunk::addSymbols(ThunkSection &isec) {
976   addSymbol(saver().save("__LA25Thunk_" + destination.getName()), STT_FUNC, 0,
977             isec);
978 }
979 
980 InputSection *MipsThunk::getTargetInputSection() const {
981   auto &dr = cast<Defined>(destination);
982   return dyn_cast<InputSection>(dr.section);
983 }
984 
985 // Write microMIPS R2-R5 LA25 thunk code
986 // to call PIC function from the non-PIC one.
987 void MicroMipsThunk::writeTo(uint8_t *buf) {
988   uint64_t s = destination.getVA();
989   write16(buf, 0x41b9);       // lui   $25, %hi(func)
990   write16(buf + 4, 0xd400);   // j     func
991   write16(buf + 8, 0x3339);   // addiu $25, $25, %lo(func)
992   write16(buf + 12, 0x0c00);  // nop
993   target->relocateNoSym(buf, R_MICROMIPS_HI16, s);
994   target->relocateNoSym(buf + 4, R_MICROMIPS_26_S1, s);
995   target->relocateNoSym(buf + 8, R_MICROMIPS_LO16, s);
996 }
997 
998 void MicroMipsThunk::addSymbols(ThunkSection &isec) {
999   Defined *d =
1000       addSymbol(saver().save("__microLA25Thunk_" + destination.getName()),
1001                 STT_FUNC, 0, isec);
1002   d->stOther |= STO_MIPS_MICROMIPS;
1003 }
1004 
1005 InputSection *MicroMipsThunk::getTargetInputSection() const {
1006   auto &dr = cast<Defined>(destination);
1007   return dyn_cast<InputSection>(dr.section);
1008 }
1009 
1010 // Write microMIPS R6 LA25 thunk code
1011 // to call PIC function from the non-PIC one.
1012 void MicroMipsR6Thunk::writeTo(uint8_t *buf) {
1013   uint64_t s = destination.getVA();
1014   uint64_t p = getThunkTargetSym()->getVA();
1015   write16(buf, 0x1320);       // lui   $25, %hi(func)
1016   write16(buf + 4, 0x3339);   // addiu $25, $25, %lo(func)
1017   write16(buf + 8, 0x9400);   // bc    func
1018   target->relocateNoSym(buf, R_MICROMIPS_HI16, s);
1019   target->relocateNoSym(buf + 4, R_MICROMIPS_LO16, s);
1020   target->relocateNoSym(buf + 8, R_MICROMIPS_PC26_S1, s - p - 12);
1021 }
1022 
1023 void MicroMipsR6Thunk::addSymbols(ThunkSection &isec) {
1024   Defined *d =
1025       addSymbol(saver().save("__microLA25Thunk_" + destination.getName()),
1026                 STT_FUNC, 0, isec);
1027   d->stOther |= STO_MIPS_MICROMIPS;
1028 }
1029 
1030 InputSection *MicroMipsR6Thunk::getTargetInputSection() const {
1031   auto &dr = cast<Defined>(destination);
1032   return dyn_cast<InputSection>(dr.section);
1033 }
1034 
1035 void elf::writePPC32PltCallStub(uint8_t *buf, uint64_t gotPltVA,
1036                                 const InputFile *file, int64_t addend) {
1037   if (!config->isPic) {
1038     write32(buf + 0, 0x3d600000 | (gotPltVA + 0x8000) >> 16); // lis r11,ha
1039     write32(buf + 4, 0x816b0000 | (uint16_t)gotPltVA);        // lwz r11,l(r11)
1040     write32(buf + 8, 0x7d6903a6);                             // mtctr r11
1041     write32(buf + 12, 0x4e800420);                            // bctr
1042     return;
1043   }
1044   uint32_t offset;
1045   if (addend >= 0x8000) {
1046     // The stub loads an address relative to r30 (.got2+Addend). Addend is
1047     // almost always 0x8000. The address of .got2 is different in another object
1048     // file, so a stub cannot be shared.
1049     offset = gotPltVA -
1050              (in.ppc32Got2->getParent()->getVA() +
1051               (file->ppc32Got2 ? file->ppc32Got2->outSecOff : 0) + addend);
1052   } else {
1053     // The stub loads an address relative to _GLOBAL_OFFSET_TABLE_ (which is
1054     // currently the address of .got).
1055     offset = gotPltVA - in.got->getVA();
1056   }
1057   uint16_t ha = (offset + 0x8000) >> 16, l = (uint16_t)offset;
1058   if (ha == 0) {
1059     write32(buf + 0, 0x817e0000 | l); // lwz r11,l(r30)
1060     write32(buf + 4, 0x7d6903a6);     // mtctr r11
1061     write32(buf + 8, 0x4e800420);     // bctr
1062     write32(buf + 12, 0x60000000);    // nop
1063   } else {
1064     write32(buf + 0, 0x3d7e0000 | ha); // addis r11,r30,ha
1065     write32(buf + 4, 0x816b0000 | l);  // lwz r11,l(r11)
1066     write32(buf + 8, 0x7d6903a6);      // mtctr r11
1067     write32(buf + 12, 0x4e800420);     // bctr
1068   }
1069 }
1070 
1071 void PPC32PltCallStub::writeTo(uint8_t *buf) {
1072   writePPC32PltCallStub(buf, destination.getGotPltVA(), file, addend);
1073 }
1074 
1075 void PPC32PltCallStub::addSymbols(ThunkSection &isec) {
1076   std::string buf;
1077   raw_string_ostream os(buf);
1078   os << format_hex_no_prefix(addend, 8);
1079   if (!config->isPic)
1080     os << ".plt_call32.";
1081   else if (addend >= 0x8000)
1082     os << ".got2.plt_pic32.";
1083   else
1084     os << ".plt_pic32.";
1085   os << destination.getName();
1086   addSymbol(saver().save(os.str()), STT_FUNC, 0, isec);
1087 }
1088 
1089 bool PPC32PltCallStub::isCompatibleWith(const InputSection &isec,
1090                                         const Relocation &rel) const {
1091   return !config->isPic || (isec.file == file && rel.addend == addend);
1092 }
1093 
1094 void PPC32LongThunk::addSymbols(ThunkSection &isec) {
1095   addSymbol(saver().save("__LongThunk_" + destination.getName()), STT_FUNC, 0,
1096             isec);
1097 }
1098 
1099 void PPC32LongThunk::writeTo(uint8_t *buf) {
1100   auto ha = [](uint32_t v) -> uint16_t { return (v + 0x8000) >> 16; };
1101   auto lo = [](uint32_t v) -> uint16_t { return v; };
1102   uint32_t d = destination.getVA(addend);
1103   if (config->isPic) {
1104     uint32_t off = d - (getThunkTargetSym()->getVA() + 8);
1105     write32(buf + 0, 0x7c0802a6);            // mflr r12,0
1106     write32(buf + 4, 0x429f0005);            // bcl r20,r31,.+4
1107     write32(buf + 8, 0x7d8802a6);            // mtctr r12
1108     write32(buf + 12, 0x3d8c0000 | ha(off)); // addis r12,r12,off@ha
1109     write32(buf + 16, 0x398c0000 | lo(off)); // addi r12,r12,off@l
1110     write32(buf + 20, 0x7c0803a6);           // mtlr r0
1111     buf += 24;
1112   } else {
1113     write32(buf + 0, 0x3d800000 | ha(d));    // lis r12,d@ha
1114     write32(buf + 4, 0x398c0000 | lo(d));    // addi r12,r12,d@l
1115     buf += 8;
1116   }
1117   write32(buf + 0, 0x7d8903a6);              // mtctr r12
1118   write32(buf + 4, 0x4e800420);              // bctr
1119 }
1120 
1121 void elf::writePPC64LoadAndBranch(uint8_t *buf, int64_t offset) {
1122   uint16_t offHa = (offset + 0x8000) >> 16;
1123   uint16_t offLo = offset & 0xffff;
1124 
1125   write32(buf + 0, 0x3d820000 | offHa); // addis r12, r2, OffHa
1126   write32(buf + 4, 0xe98c0000 | offLo); // ld    r12, OffLo(r12)
1127   write32(buf + 8, 0x7d8903a6);         // mtctr r12
1128   write32(buf + 12, 0x4e800420);        // bctr
1129 }
1130 
1131 void PPC64PltCallStub::writeTo(uint8_t *buf) {
1132   int64_t offset = destination.getGotPltVA() - getPPC64TocBase();
1133   // Save the TOC pointer to the save-slot reserved in the call frame.
1134   write32(buf + 0, 0xf8410018); // std     r2,24(r1)
1135   writePPC64LoadAndBranch(buf + 4, offset);
1136 }
1137 
1138 void PPC64PltCallStub::addSymbols(ThunkSection &isec) {
1139   Defined *s = addSymbol(saver().save("__plt_" + destination.getName()),
1140                          STT_FUNC, 0, isec);
1141   s->setNeedsTocRestore(true);
1142   s->file = destination.file;
1143 }
1144 
1145 bool PPC64PltCallStub::isCompatibleWith(const InputSection &isec,
1146                                         const Relocation &rel) const {
1147   return rel.type == R_PPC64_REL24 || rel.type == R_PPC64_REL14;
1148 }
1149 
1150 void PPC64R2SaveStub::writeTo(uint8_t *buf) {
1151   const int64_t offset = computeOffset();
1152   write32(buf + 0, 0xf8410018); // std  r2,24(r1)
1153   // The branch offset needs to fit in 26 bits.
1154   if (getMayUseShortThunk()) {
1155     write32(buf + 4, 0x48000000 | (offset & 0x03fffffc)); // b    <offset>
1156   } else if (isInt<34>(offset)) {
1157     int nextInstOffset;
1158     uint64_t tocOffset = destination.getVA() - getPPC64TocBase();
1159     if (tocOffset >> 16 > 0) {
1160       const uint64_t addi = ADDI_R12_TO_R12_NO_DISP | (tocOffset & 0xffff);
1161       const uint64_t addis =
1162           ADDIS_R12_TO_R2_NO_DISP | ((tocOffset >> 16) & 0xffff);
1163       write32(buf + 4, addis); // addis r12, r2 , top of offset
1164       write32(buf + 8, addi);  // addi  r12, r12, bottom of offset
1165       nextInstOffset = 12;
1166     } else {
1167       const uint64_t addi = ADDI_R12_TO_R2_NO_DISP | (tocOffset & 0xffff);
1168       write32(buf + 4, addi); // addi r12, r2, offset
1169       nextInstOffset = 8;
1170     }
1171     write32(buf + nextInstOffset, MTCTR_R12); // mtctr r12
1172     write32(buf + nextInstOffset + 4, BCTR);  // bctr
1173   } else {
1174     in.ppc64LongBranchTarget->addEntry(&destination, addend);
1175     const int64_t offsetFromTOC =
1176         in.ppc64LongBranchTarget->getEntryVA(&destination, addend) -
1177         getPPC64TocBase();
1178     writePPC64LoadAndBranch(buf + 4, offsetFromTOC);
1179   }
1180 }
1181 
1182 void PPC64R2SaveStub::addSymbols(ThunkSection &isec) {
1183   Defined *s = addSymbol(saver().save("__toc_save_" + destination.getName()),
1184                          STT_FUNC, 0, isec);
1185   s->setNeedsTocRestore(true);
1186 }
1187 
1188 bool PPC64R2SaveStub::isCompatibleWith(const InputSection &isec,
1189                                        const Relocation &rel) const {
1190   return rel.type == R_PPC64_REL24 || rel.type == R_PPC64_REL14;
1191 }
1192 
1193 void PPC64R12SetupStub::writeTo(uint8_t *buf) {
1194   int64_t offset = (gotPlt ? destination.getGotPltVA() : destination.getVA()) -
1195                    getThunkTargetSym()->getVA();
1196   if (!isInt<34>(offset))
1197     reportRangeError(buf, offset, 34, destination, "R12 setup stub offset");
1198 
1199   int nextInstOffset;
1200   if (config->power10Stubs) {
1201     const uint64_t imm = (((offset >> 16) & 0x3ffff) << 32) | (offset & 0xffff);
1202     // pld 12, func@plt@pcrel or  paddi r12, 0, func@pcrel
1203     writePrefixedInstruction(
1204         buf, (gotPlt ? PLD_R12_NO_DISP : PADDI_R12_NO_DISP) | imm);
1205     nextInstOffset = 8;
1206   } else {
1207     uint32_t off = offset - 8;
1208     write32(buf + 0, 0x7d8802a6);                     // mflr 12
1209     write32(buf + 4, 0x429f0005);                     // bcl 20,31,.+4
1210     write32(buf + 8, 0x7d6802a6);                     // mflr 11
1211     write32(buf + 12, 0x7d8803a6);                    // mtlr 12
1212     write32(buf + 16,
1213             0x3d8b0000 | ((off + 0x8000) >> 16));     // addis 12,11,off@ha
1214     if (gotPlt)
1215       write32(buf + 20, 0xe98c0000 | (off & 0xffff)); // ld 12, off@l(12)
1216     else
1217       write32(buf + 20, 0x398c0000 | (off & 0xffff)); // addi 12,12,off@l
1218     nextInstOffset = 24;
1219   }
1220   write32(buf + nextInstOffset, MTCTR_R12); // mtctr r12
1221   write32(buf + nextInstOffset + 4, BCTR);  // bctr
1222 }
1223 
1224 void PPC64R12SetupStub::addSymbols(ThunkSection &isec) {
1225   addSymbol(saver().save((gotPlt ? "__plt_pcrel_" : "__gep_setup_") +
1226                          destination.getName()),
1227             STT_FUNC, 0, isec);
1228 }
1229 
1230 bool PPC64R12SetupStub::isCompatibleWith(const InputSection &isec,
1231                                          const Relocation &rel) const {
1232   return rel.type == R_PPC64_REL24_NOTOC;
1233 }
1234 
1235 void PPC64LongBranchThunk::writeTo(uint8_t *buf) {
1236   int64_t offset = in.ppc64LongBranchTarget->getEntryVA(&destination, addend) -
1237                    getPPC64TocBase();
1238   writePPC64LoadAndBranch(buf, offset);
1239 }
1240 
1241 void PPC64LongBranchThunk::addSymbols(ThunkSection &isec) {
1242   addSymbol(saver().save("__long_branch_" + destination.getName()), STT_FUNC, 0,
1243             isec);
1244 }
1245 
1246 bool PPC64LongBranchThunk::isCompatibleWith(const InputSection &isec,
1247                                             const Relocation &rel) const {
1248   return rel.type == R_PPC64_REL24 || rel.type == R_PPC64_REL14;
1249 }
1250 
1251 Thunk::Thunk(Symbol &d, int64_t a) : destination(d), addend(a), offset(0) {
1252   destination.thunkAccessed = true;
1253 }
1254 
1255 Thunk::~Thunk() = default;
1256 
1257 static Thunk *addThunkAArch64(RelType type, Symbol &s, int64_t a) {
1258   if (type != R_AARCH64_CALL26 && type != R_AARCH64_JUMP26 &&
1259       type != R_AARCH64_PLT32)
1260     fatal("unrecognized relocation type");
1261   if (config->picThunk)
1262     return make<AArch64ADRPThunk>(s, a);
1263   return make<AArch64ABSLongThunk>(s, a);
1264 }
1265 
1266 // Creates a thunk for long branches or Thumb-ARM interworking.
1267 // Arm Architectures v4t does not support Thumb2 technology, and does not
1268 // support BLX or LDR Arm/Thumb state switching. This means that
1269 // - MOVT and MOVW instructions cannot be used.
1270 // - We can't rewrite BL in place to BLX. We will need thunks.
1271 //
1272 // TODO: use B for short Thumb->Arm thunks instead of LDR (this doesn't work for
1273 //       Arm->Thumb, as in Arm state no BX PC trick; it doesn't switch state).
1274 static Thunk *addThunkArmv4(RelType reloc, Symbol &s, int64_t a) {
1275   bool thumb_target = s.getVA(a) & 1;
1276 
1277   switch (reloc) {
1278   case R_ARM_PC24:
1279   case R_ARM_PLT32:
1280   case R_ARM_JUMP24:
1281   case R_ARM_CALL:
1282     if (config->picThunk) {
1283       if (thumb_target)
1284         return make<ARMV4PILongBXThunk>(s, a);
1285       return make<ARMV4PILongThunk>(s, a);
1286     }
1287     if (thumb_target)
1288       return make<ARMV4ABSLongBXThunk>(s, a);
1289     return make<ARMV5LongLdrPcThunk>(s, a);
1290   case R_ARM_THM_CALL:
1291     if (config->picThunk) {
1292       if (thumb_target)
1293         return make<ThumbV4PILongThunk>(s, a);
1294       return make<ThumbV4PILongBXThunk>(s, a);
1295     }
1296     if (thumb_target)
1297       return make<ThumbV4ABSLongThunk>(s, a);
1298     return make<ThumbV4ABSLongBXThunk>(s, a);
1299   }
1300   fatal("relocation " + toString(reloc) + " to " + toString(s) +
1301         " not supported for Armv4 or Armv4T target");
1302 }
1303 
1304 // Creates a thunk for Thumb-ARM interworking compatible with Armv5 and Armv6.
1305 // Arm Architectures v5 and v6 do not support Thumb2 technology. This means that
1306 // - MOVT and MOVW instructions cannot be used
1307 // - Only Thumb relocation that can generate a Thunk is a BL, this can always
1308 //   be transformed into a BLX
1309 static Thunk *addThunkArmv5v6(RelType reloc, Symbol &s, int64_t a) {
1310   switch (reloc) {
1311   case R_ARM_PC24:
1312   case R_ARM_PLT32:
1313   case R_ARM_JUMP24:
1314   case R_ARM_CALL:
1315   case R_ARM_THM_CALL:
1316     if (config->picThunk)
1317       return make<ARMV4PILongBXThunk>(s, a);
1318     return make<ARMV5LongLdrPcThunk>(s, a);
1319   }
1320   fatal("relocation " + toString(reloc) + " to " + toString(s) +
1321         " not supported for Armv5 or Armv6 targets");
1322 }
1323 
1324 // Create a thunk for Thumb long branch on V6-M.
1325 // Arm Architecture v6-M only supports Thumb instructions. This means
1326 // - MOVT and MOVW instructions cannot be used.
1327 // - Only a limited number of instructions can access registers r8 and above
1328 // - No interworking support is needed (all Thumb).
1329 static Thunk *addThunkV6M(const InputSection &isec, RelType reloc, Symbol &s,
1330                           int64_t a) {
1331   const bool isPureCode = isec.getParent()->flags & SHF_ARM_PURECODE;
1332   switch (reloc) {
1333   case R_ARM_THM_JUMP19:
1334   case R_ARM_THM_JUMP24:
1335   case R_ARM_THM_CALL:
1336     if (config->isPic) {
1337       if (!isPureCode)
1338         return make<ThumbV6MPILongThunk>(s, a);
1339 
1340       fatal("relocation " + toString(reloc) + " to " + toString(s) +
1341             " not supported for Armv6-M targets for position independent"
1342             " and execute only code");
1343     }
1344     if (isPureCode)
1345       return make<ThumbV6MABSXOLongThunk>(s, a);
1346     return make<ThumbV6MABSLongThunk>(s, a);
1347   }
1348   fatal("relocation " + toString(reloc) + " to " + toString(s) +
1349         " not supported for Armv6-M targets");
1350 }
1351 
1352 // Creates a thunk for Thumb-ARM interworking or branch range extension.
1353 static Thunk *addThunkArm(const InputSection &isec, RelType reloc, Symbol &s,
1354                           int64_t a) {
1355   // Decide which Thunk is needed based on:
1356   // Available instruction set
1357   // - An Arm Thunk can only be used if Arm state is available.
1358   // - A Thumb Thunk can only be used if Thumb state is available.
1359   // - Can only use a Thunk if it uses instructions that the Target supports.
1360   // Relocation is branch or branch and link
1361   // - Branch instructions cannot change state, can only select Thunk that
1362   //   starts in the same state as the caller.
1363   // - Branch and link relocations can change state, can select Thunks from
1364   //   either Arm or Thumb.
1365   // Position independent Thunks if we require position independent code.
1366   // Execute Only Thunks if the output section is execute only code.
1367 
1368   // Handle architectures that have restrictions on the instructions that they
1369   // can use in Thunks. The flags below are set by reading the BuildAttributes
1370   // of the input objects. InputFiles.cpp contains the mapping from ARM
1371   // architecture to flag.
1372   if (!config->armHasMovtMovw) {
1373     if (config->armJ1J2BranchEncoding)
1374       return addThunkV6M(isec, reloc, s, a);
1375     if (config->armHasBlx)
1376       return addThunkArmv5v6(reloc, s, a);
1377     return addThunkArmv4(reloc, s, a);
1378   }
1379 
1380   switch (reloc) {
1381   case R_ARM_PC24:
1382   case R_ARM_PLT32:
1383   case R_ARM_JUMP24:
1384   case R_ARM_CALL:
1385     if (config->picThunk)
1386       return make<ARMV7PILongThunk>(s, a);
1387     return make<ARMV7ABSLongThunk>(s, a);
1388   case R_ARM_THM_JUMP19:
1389   case R_ARM_THM_JUMP24:
1390   case R_ARM_THM_CALL:
1391     if (config->picThunk)
1392       return make<ThumbV7PILongThunk>(s, a);
1393     return make<ThumbV7ABSLongThunk>(s, a);
1394   }
1395   fatal("unrecognized relocation type");
1396 }
1397 
1398 static Thunk *addThunkAVR(RelType type, Symbol &s, int64_t a) {
1399   switch (type) {
1400   case R_AVR_LO8_LDI_GS:
1401   case R_AVR_HI8_LDI_GS:
1402     return make<AVRThunk>(s, a);
1403   default:
1404     fatal("unrecognized relocation type " + toString(type));
1405   }
1406 }
1407 
1408 static Thunk *addThunkMips(RelType type, Symbol &s) {
1409   if ((s.stOther & STO_MIPS_MICROMIPS) && isMipsR6())
1410     return make<MicroMipsR6Thunk>(s);
1411   if (s.stOther & STO_MIPS_MICROMIPS)
1412     return make<MicroMipsThunk>(s);
1413   return make<MipsThunk>(s);
1414 }
1415 
1416 static Thunk *addThunkPPC32(const InputSection &isec, const Relocation &rel,
1417                             Symbol &s) {
1418   assert((rel.type == R_PPC_LOCAL24PC || rel.type == R_PPC_REL24 ||
1419           rel.type == R_PPC_PLTREL24) &&
1420          "unexpected relocation type for thunk");
1421   if (s.isInPlt())
1422     return make<PPC32PltCallStub>(isec, rel, s);
1423   return make<PPC32LongThunk>(s, rel.addend);
1424 }
1425 
1426 static Thunk *addThunkPPC64(RelType type, Symbol &s, int64_t a) {
1427   assert((type == R_PPC64_REL14 || type == R_PPC64_REL24 ||
1428           type == R_PPC64_REL24_NOTOC) &&
1429          "unexpected relocation type for thunk");
1430 
1431   // If we are emitting stubs for NOTOC relocations, we need to tell
1432   // the PLT resolver that there can be multiple TOCs.
1433   if (type == R_PPC64_REL24_NOTOC)
1434     getPPC64TargetInfo()->ppc64DynamicSectionOpt = 0x2;
1435 
1436   if (s.isInPlt())
1437     return type == R_PPC64_REL24_NOTOC
1438                ? (Thunk *)make<PPC64R12SetupStub>(s, /*gotPlt=*/true)
1439                : (Thunk *)make<PPC64PltCallStub>(s);
1440 
1441   // This check looks at the st_other bits of the callee. If the value is 1
1442   // then the callee clobbers the TOC and we need an R2 save stub when RelType
1443   // is R_PPC64_REL14 or R_PPC64_REL24.
1444   if ((type == R_PPC64_REL14 || type == R_PPC64_REL24) && (s.stOther >> 5) == 1)
1445     return make<PPC64R2SaveStub>(s, a);
1446 
1447   if (type == R_PPC64_REL24_NOTOC)
1448     return make<PPC64R12SetupStub>(s, /*gotPlt=*/false);
1449 
1450   if (config->picThunk)
1451     return make<PPC64PILongBranchThunk>(s, a);
1452 
1453   return make<PPC64PDLongBranchThunk>(s, a);
1454 }
1455 
1456 Thunk *elf::addThunk(const InputSection &isec, Relocation &rel) {
1457   Symbol &s = *rel.sym;
1458   int64_t a = rel.addend;
1459 
1460   switch (config->emachine) {
1461   case EM_AARCH64:
1462     return addThunkAArch64(rel.type, s, a);
1463   case EM_ARM:
1464     return addThunkArm(isec, rel.type, s, a);
1465   case EM_AVR:
1466     return addThunkAVR(rel.type, s, a);
1467   case EM_MIPS:
1468     return addThunkMips(rel.type, s);
1469   case EM_PPC:
1470     return addThunkPPC32(isec, rel, s);
1471   case EM_PPC64:
1472     return addThunkPPC64(rel.type, s, a);
1473   default:
1474     llvm_unreachable("add Thunk only supported for ARM, AVR, Mips and PowerPC");
1475   }
1476 }
1477