1 //===- Thunks.cpp --------------------------------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===---------------------------------------------------------------------===// 8 // 9 // This file contains Thunk subclasses. 10 // 11 // A thunk is a small piece of code written after an input section 12 // which is used to jump between "incompatible" functions 13 // such as MIPS PIC and non-PIC or ARM non-Thumb and Thumb functions. 14 // 15 // If a jump target is too far and its address doesn't fit to a 16 // short jump instruction, we need to create a thunk too, but we 17 // haven't supported it yet. 18 // 19 // i386 and x86-64 don't need thunks. 20 // 21 //===---------------------------------------------------------------------===// 22 23 #include "Thunks.h" 24 #include "Config.h" 25 #include "InputSection.h" 26 #include "OutputSections.h" 27 #include "Symbols.h" 28 #include "SyntheticSections.h" 29 #include "Target.h" 30 #include "lld/Common/ErrorHandler.h" 31 #include "lld/Common/Memory.h" 32 #include "llvm/BinaryFormat/ELF.h" 33 #include "llvm/Support/Casting.h" 34 #include "llvm/Support/Endian.h" 35 #include "llvm/Support/ErrorHandling.h" 36 #include "llvm/Support/MathExtras.h" 37 #include <cstdint> 38 #include <cstring> 39 40 using namespace llvm; 41 using namespace llvm::object; 42 using namespace llvm::ELF; 43 using namespace lld; 44 using namespace lld::elf; 45 46 namespace { 47 48 // AArch64 long range Thunks 49 class AArch64ABSLongThunk final : public Thunk { 50 public: 51 AArch64ABSLongThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {} 52 uint32_t size() override { return 16; } 53 void writeTo(uint8_t *buf) override; 54 void addSymbols(ThunkSection &isec) override; 55 }; 56 57 class AArch64ADRPThunk final : public Thunk { 58 public: 59 AArch64ADRPThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {} 60 uint32_t size() override { return 12; } 61 void writeTo(uint8_t *buf) override; 62 void addSymbols(ThunkSection &isec) override; 63 }; 64 65 // Base class for ARM thunks. 66 // 67 // An ARM thunk may be either short or long. A short thunk is simply a branch 68 // (B) instruction, and it may be used to call ARM functions when the distance 69 // from the thunk to the target is less than 32MB. Long thunks can branch to any 70 // virtual address and can switch between ARM and Thumb, and they are 71 // implemented in the derived classes. This class tries to create a short thunk 72 // if the target is in range, otherwise it creates a long thunk. 73 class ARMThunk : public Thunk { 74 public: 75 ARMThunk(Symbol &dest) : Thunk(dest, 0) {} 76 77 bool getMayUseShortThunk(); 78 uint32_t size() override { return getMayUseShortThunk() ? 4 : sizeLong(); } 79 void writeTo(uint8_t *buf) override; 80 bool isCompatibleWith(const InputSection &isec, 81 const Relocation &rel) const override; 82 83 // Returns the size of a long thunk. 84 virtual uint32_t sizeLong() = 0; 85 86 // Writes a long thunk to Buf. 87 virtual void writeLong(uint8_t *buf) = 0; 88 89 private: 90 // This field tracks whether all previously considered layouts would allow 91 // this thunk to be short. If we have ever needed a long thunk, we always 92 // create a long thunk, even if the thunk may be short given the current 93 // distance to the target. We do this because transitioning from long to short 94 // can create layout oscillations in certain corner cases which would prevent 95 // the layout from converging. 96 bool mayUseShortThunk = true; 97 }; 98 99 // Base class for Thumb-2 thunks. 100 // 101 // This class is similar to ARMThunk, but it uses the Thumb-2 B.W instruction 102 // which has a range of 16MB. 103 class ThumbThunk : public Thunk { 104 public: 105 ThumbThunk(Symbol &dest) : Thunk(dest, 0) { alignment = 2; } 106 107 bool getMayUseShortThunk(); 108 uint32_t size() override { return getMayUseShortThunk() ? 4 : sizeLong(); } 109 void writeTo(uint8_t *buf) override; 110 bool isCompatibleWith(const InputSection &isec, 111 const Relocation &rel) const override; 112 113 // Returns the size of a long thunk. 114 virtual uint32_t sizeLong() = 0; 115 116 // Writes a long thunk to Buf. 117 virtual void writeLong(uint8_t *buf) = 0; 118 119 private: 120 // See comment in ARMThunk above. 121 bool mayUseShortThunk = true; 122 }; 123 124 // Specific ARM Thunk implementations. The naming convention is: 125 // Source State, TargetState, Target Requirement, ABS or PI, Range 126 class ARMV7ABSLongThunk final : public ARMThunk { 127 public: 128 ARMV7ABSLongThunk(Symbol &dest) : ARMThunk(dest) {} 129 130 uint32_t sizeLong() override { return 12; } 131 void writeLong(uint8_t *buf) override; 132 void addSymbols(ThunkSection &isec) override; 133 }; 134 135 class ARMV7PILongThunk final : public ARMThunk { 136 public: 137 ARMV7PILongThunk(Symbol &dest) : ARMThunk(dest) {} 138 139 uint32_t sizeLong() override { return 16; } 140 void writeLong(uint8_t *buf) override; 141 void addSymbols(ThunkSection &isec) override; 142 }; 143 144 class ThumbV7ABSLongThunk final : public ThumbThunk { 145 public: 146 ThumbV7ABSLongThunk(Symbol &dest) : ThumbThunk(dest) {} 147 148 uint32_t sizeLong() override { return 10; } 149 void writeLong(uint8_t *buf) override; 150 void addSymbols(ThunkSection &isec) override; 151 }; 152 153 class ThumbV7PILongThunk final : public ThumbThunk { 154 public: 155 ThumbV7PILongThunk(Symbol &dest) : ThumbThunk(dest) {} 156 157 uint32_t sizeLong() override { return 12; } 158 void writeLong(uint8_t *buf) override; 159 void addSymbols(ThunkSection &isec) override; 160 }; 161 162 // Implementations of Thunks for older Arm architectures that do not support 163 // the movt/movw instructions. These thunks require at least Architecture v5 164 // as used on processors such as the Arm926ej-s. There are no Thumb entry 165 // points as there is no Thumb branch instruction on these architecture that 166 // can result in a thunk 167 class ARMV5ABSLongThunk final : public ARMThunk { 168 public: 169 ARMV5ABSLongThunk(Symbol &dest) : ARMThunk(dest) {} 170 171 uint32_t sizeLong() override { return 8; } 172 void writeLong(uint8_t *buf) override; 173 void addSymbols(ThunkSection &isec) override; 174 bool isCompatibleWith(const InputSection &isec, 175 const Relocation &rel) const override; 176 }; 177 178 class ARMV5PILongThunk final : public ARMThunk { 179 public: 180 ARMV5PILongThunk(Symbol &dest) : ARMThunk(dest) {} 181 182 uint32_t sizeLong() override { return 16; } 183 void writeLong(uint8_t *buf) override; 184 void addSymbols(ThunkSection &isec) override; 185 bool isCompatibleWith(const InputSection &isec, 186 const Relocation &rel) const override; 187 }; 188 189 // Implementations of Thunks for Arm v6-M. Only Thumb instructions are permitted 190 class ThumbV6MABSLongThunk final : public ThumbThunk { 191 public: 192 ThumbV6MABSLongThunk(Symbol &dest) : ThumbThunk(dest) {} 193 194 uint32_t sizeLong() override { return 12; } 195 void writeLong(uint8_t *buf) override; 196 void addSymbols(ThunkSection &isec) override; 197 }; 198 199 class ThumbV6MPILongThunk final : public ThumbThunk { 200 public: 201 ThumbV6MPILongThunk(Symbol &dest) : ThumbThunk(dest) {} 202 203 uint32_t sizeLong() override { return 16; } 204 void writeLong(uint8_t *buf) override; 205 void addSymbols(ThunkSection &isec) override; 206 }; 207 208 // MIPS LA25 thunk 209 class MipsThunk final : public Thunk { 210 public: 211 MipsThunk(Symbol &dest) : Thunk(dest, 0) {} 212 213 uint32_t size() override { return 16; } 214 void writeTo(uint8_t *buf) override; 215 void addSymbols(ThunkSection &isec) override; 216 InputSection *getTargetInputSection() const override; 217 }; 218 219 // microMIPS R2-R5 LA25 thunk 220 class MicroMipsThunk final : public Thunk { 221 public: 222 MicroMipsThunk(Symbol &dest) : Thunk(dest, 0) {} 223 224 uint32_t size() override { return 14; } 225 void writeTo(uint8_t *buf) override; 226 void addSymbols(ThunkSection &isec) override; 227 InputSection *getTargetInputSection() const override; 228 }; 229 230 // microMIPS R6 LA25 thunk 231 class MicroMipsR6Thunk final : public Thunk { 232 public: 233 MicroMipsR6Thunk(Symbol &dest) : Thunk(dest, 0) {} 234 235 uint32_t size() override { return 12; } 236 void writeTo(uint8_t *buf) override; 237 void addSymbols(ThunkSection &isec) override; 238 InputSection *getTargetInputSection() const override; 239 }; 240 241 class PPC32PltCallStub final : public Thunk { 242 public: 243 // For R_PPC_PLTREL24, Thunk::addend records the addend which will be used to 244 // decide the offsets in the call stub. 245 PPC32PltCallStub(const InputSection &isec, const Relocation &rel, 246 Symbol &dest) 247 : Thunk(dest, rel.addend), file(isec.file) {} 248 uint32_t size() override { return 16; } 249 void writeTo(uint8_t *buf) override; 250 void addSymbols(ThunkSection &isec) override; 251 bool isCompatibleWith(const InputSection &isec, const Relocation &rel) const override; 252 253 private: 254 // Records the call site of the call stub. 255 const InputFile *file; 256 }; 257 258 class PPC32LongThunk final : public Thunk { 259 public: 260 PPC32LongThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {} 261 uint32_t size() override { return config->isPic ? 32 : 16; } 262 void writeTo(uint8_t *buf) override; 263 void addSymbols(ThunkSection &isec) override; 264 }; 265 266 // PPC64 Plt call stubs. 267 // Any call site that needs to call through a plt entry needs a call stub in 268 // the .text section. The call stub is responsible for: 269 // 1) Saving the toc-pointer to the stack. 270 // 2) Loading the target functions address from the procedure linkage table into 271 // r12 for use by the target functions global entry point, and into the count 272 // register. 273 // 3) Transferring control to the target function through an indirect branch. 274 class PPC64PltCallStub final : public Thunk { 275 public: 276 PPC64PltCallStub(Symbol &dest) : Thunk(dest, 0) {} 277 uint32_t size() override { return 20; } 278 void writeTo(uint8_t *buf) override; 279 void addSymbols(ThunkSection &isec) override; 280 }; 281 282 // PPC64 R2 Save Stub 283 // When the caller requires a valid R2 TOC pointer but the callee does not 284 // require a TOC pointer and the callee cannot guarantee that it doesn't 285 // clobber R2 then we need to save R2. This stub: 286 // 1) Saves the TOC pointer to the stack. 287 // 2) Tail calls the callee. 288 class PPC64R2SaveStub final : public Thunk { 289 public: 290 PPC64R2SaveStub(Symbol &dest) : Thunk(dest, 0) {} 291 uint32_t size() override { return 8; } 292 void writeTo(uint8_t *buf) override; 293 void addSymbols(ThunkSection &isec) override; 294 }; 295 296 // A bl instruction uses a signed 24 bit offset, with an implicit 4 byte 297 // alignment. This gives a possible 26 bits of 'reach'. If the call offset is 298 // larger then that we need to emit a long-branch thunk. The target address 299 // of the callee is stored in a table to be accessed TOC-relative. Since the 300 // call must be local (a non-local call will have a PltCallStub instead) the 301 // table stores the address of the callee's local entry point. For 302 // position-independent code a corresponding relative dynamic relocation is 303 // used. 304 class PPC64LongBranchThunk : public Thunk { 305 public: 306 uint32_t size() override { return 16; } 307 void writeTo(uint8_t *buf) override; 308 void addSymbols(ThunkSection &isec) override; 309 310 protected: 311 PPC64LongBranchThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {} 312 }; 313 314 class PPC64PILongBranchThunk final : public PPC64LongBranchThunk { 315 public: 316 PPC64PILongBranchThunk(Symbol &dest, int64_t addend) 317 : PPC64LongBranchThunk(dest, addend) { 318 assert(!dest.isPreemptible); 319 if (Optional<uint32_t> index = 320 in.ppc64LongBranchTarget->addEntry(&dest, addend)) { 321 mainPart->relaDyn->addReloc( 322 {target->relativeRel, in.ppc64LongBranchTarget, *index * UINT64_C(8), 323 true, &dest, 324 addend + getPPC64GlobalEntryToLocalEntryOffset(dest.stOther)}); 325 } 326 } 327 }; 328 329 class PPC64PDLongBranchThunk final : public PPC64LongBranchThunk { 330 public: 331 PPC64PDLongBranchThunk(Symbol &dest, int64_t addend) 332 : PPC64LongBranchThunk(dest, addend) { 333 in.ppc64LongBranchTarget->addEntry(&dest, addend); 334 } 335 }; 336 337 } // end anonymous namespace 338 339 Defined *Thunk::addSymbol(StringRef name, uint8_t type, uint64_t value, 340 InputSectionBase §ion) { 341 Defined *d = addSyntheticLocal(name, type, value, /*size=*/0, section); 342 syms.push_back(d); 343 return d; 344 } 345 346 void Thunk::setOffset(uint64_t newOffset) { 347 for (Defined *d : syms) 348 d->value = d->value - offset + newOffset; 349 offset = newOffset; 350 } 351 352 // AArch64 long range Thunks 353 354 static uint64_t getAArch64ThunkDestVA(const Symbol &s, int64_t a) { 355 uint64_t v = s.isInPlt() ? s.getPltVA() : s.getVA(a); 356 return v; 357 } 358 359 void AArch64ABSLongThunk::writeTo(uint8_t *buf) { 360 const uint8_t data[] = { 361 0x50, 0x00, 0x00, 0x58, // ldr x16, L0 362 0x00, 0x02, 0x1f, 0xd6, // br x16 363 0x00, 0x00, 0x00, 0x00, // L0: .xword S 364 0x00, 0x00, 0x00, 0x00, 365 }; 366 uint64_t s = getAArch64ThunkDestVA(destination, addend); 367 memcpy(buf, data, sizeof(data)); 368 target->relocateNoSym(buf + 8, R_AARCH64_ABS64, s); 369 } 370 371 void AArch64ABSLongThunk::addSymbols(ThunkSection &isec) { 372 addSymbol(saver.save("__AArch64AbsLongThunk_" + destination.getName()), 373 STT_FUNC, 0, isec); 374 addSymbol("$x", STT_NOTYPE, 0, isec); 375 addSymbol("$d", STT_NOTYPE, 8, isec); 376 } 377 378 // This Thunk has a maximum range of 4Gb, this is sufficient for all programs 379 // using the small code model, including pc-relative ones. At time of writing 380 // clang and gcc do not support the large code model for position independent 381 // code so it is safe to use this for position independent thunks without 382 // worrying about the destination being more than 4Gb away. 383 void AArch64ADRPThunk::writeTo(uint8_t *buf) { 384 const uint8_t data[] = { 385 0x10, 0x00, 0x00, 0x90, // adrp x16, Dest R_AARCH64_ADR_PREL_PG_HI21(Dest) 386 0x10, 0x02, 0x00, 0x91, // add x16, x16, R_AARCH64_ADD_ABS_LO12_NC(Dest) 387 0x00, 0x02, 0x1f, 0xd6, // br x16 388 }; 389 uint64_t s = getAArch64ThunkDestVA(destination, addend); 390 uint64_t p = getThunkTargetSym()->getVA(); 391 memcpy(buf, data, sizeof(data)); 392 target->relocateNoSym(buf, R_AARCH64_ADR_PREL_PG_HI21, 393 getAArch64Page(s) - getAArch64Page(p)); 394 target->relocateNoSym(buf + 4, R_AARCH64_ADD_ABS_LO12_NC, s); 395 } 396 397 void AArch64ADRPThunk::addSymbols(ThunkSection &isec) { 398 addSymbol(saver.save("__AArch64ADRPThunk_" + destination.getName()), STT_FUNC, 399 0, isec); 400 addSymbol("$x", STT_NOTYPE, 0, isec); 401 } 402 403 // ARM Target Thunks 404 static uint64_t getARMThunkDestVA(const Symbol &s) { 405 uint64_t v = s.isInPlt() ? s.getPltVA() : s.getVA(); 406 return SignExtend64<32>(v); 407 } 408 409 // This function returns true if the target is not Thumb and is within 2^26, and 410 // it has not previously returned false (see comment for mayUseShortThunk). 411 bool ARMThunk::getMayUseShortThunk() { 412 if (!mayUseShortThunk) 413 return false; 414 uint64_t s = getARMThunkDestVA(destination); 415 if (s & 1) { 416 mayUseShortThunk = false; 417 return false; 418 } 419 uint64_t p = getThunkTargetSym()->getVA(); 420 int64_t offset = s - p - 8; 421 mayUseShortThunk = llvm::isInt<26>(offset); 422 return mayUseShortThunk; 423 } 424 425 void ARMThunk::writeTo(uint8_t *buf) { 426 if (!getMayUseShortThunk()) { 427 writeLong(buf); 428 return; 429 } 430 431 uint64_t s = getARMThunkDestVA(destination); 432 uint64_t p = getThunkTargetSym()->getVA(); 433 int64_t offset = s - p - 8; 434 const uint8_t data[] = { 435 0x00, 0x00, 0x00, 0xea, // b S 436 }; 437 memcpy(buf, data, sizeof(data)); 438 target->relocateNoSym(buf, R_ARM_JUMP24, offset); 439 } 440 441 bool ARMThunk::isCompatibleWith(const InputSection &isec, 442 const Relocation &rel) const { 443 // Thumb branch relocations can't use BLX 444 return rel.type != R_ARM_THM_JUMP19 && rel.type != R_ARM_THM_JUMP24; 445 } 446 447 // This function returns true if the target is Thumb and is within 2^25, and 448 // it has not previously returned false (see comment for mayUseShortThunk). 449 bool ThumbThunk::getMayUseShortThunk() { 450 if (!mayUseShortThunk) 451 return false; 452 uint64_t s = getARMThunkDestVA(destination); 453 if ((s & 1) == 0) { 454 mayUseShortThunk = false; 455 return false; 456 } 457 uint64_t p = getThunkTargetSym()->getVA() & ~1; 458 int64_t offset = s - p - 4; 459 mayUseShortThunk = llvm::isInt<25>(offset); 460 return mayUseShortThunk; 461 } 462 463 void ThumbThunk::writeTo(uint8_t *buf) { 464 if (!getMayUseShortThunk()) { 465 writeLong(buf); 466 return; 467 } 468 469 uint64_t s = getARMThunkDestVA(destination); 470 uint64_t p = getThunkTargetSym()->getVA(); 471 int64_t offset = s - p - 4; 472 const uint8_t data[] = { 473 0x00, 0xf0, 0x00, 0xb0, // b.w S 474 }; 475 memcpy(buf, data, sizeof(data)); 476 target->relocateNoSym(buf, R_ARM_THM_JUMP24, offset); 477 } 478 479 bool ThumbThunk::isCompatibleWith(const InputSection &isec, 480 const Relocation &rel) const { 481 // ARM branch relocations can't use BLX 482 return rel.type != R_ARM_JUMP24 && rel.type != R_ARM_PC24 && rel.type != R_ARM_PLT32; 483 } 484 485 void ARMV7ABSLongThunk::writeLong(uint8_t *buf) { 486 const uint8_t data[] = { 487 0x00, 0xc0, 0x00, 0xe3, // movw ip,:lower16:S 488 0x00, 0xc0, 0x40, 0xe3, // movt ip,:upper16:S 489 0x1c, 0xff, 0x2f, 0xe1, // bx ip 490 }; 491 uint64_t s = getARMThunkDestVA(destination); 492 memcpy(buf, data, sizeof(data)); 493 target->relocateNoSym(buf, R_ARM_MOVW_ABS_NC, s); 494 target->relocateNoSym(buf + 4, R_ARM_MOVT_ABS, s); 495 } 496 497 void ARMV7ABSLongThunk::addSymbols(ThunkSection &isec) { 498 addSymbol(saver.save("__ARMv7ABSLongThunk_" + destination.getName()), 499 STT_FUNC, 0, isec); 500 addSymbol("$a", STT_NOTYPE, 0, isec); 501 } 502 503 void ThumbV7ABSLongThunk::writeLong(uint8_t *buf) { 504 const uint8_t data[] = { 505 0x40, 0xf2, 0x00, 0x0c, // movw ip, :lower16:S 506 0xc0, 0xf2, 0x00, 0x0c, // movt ip, :upper16:S 507 0x60, 0x47, // bx ip 508 }; 509 uint64_t s = getARMThunkDestVA(destination); 510 memcpy(buf, data, sizeof(data)); 511 target->relocateNoSym(buf, R_ARM_THM_MOVW_ABS_NC, s); 512 target->relocateNoSym(buf + 4, R_ARM_THM_MOVT_ABS, s); 513 } 514 515 void ThumbV7ABSLongThunk::addSymbols(ThunkSection &isec) { 516 addSymbol(saver.save("__Thumbv7ABSLongThunk_" + destination.getName()), 517 STT_FUNC, 1, isec); 518 addSymbol("$t", STT_NOTYPE, 0, isec); 519 } 520 521 void ARMV7PILongThunk::writeLong(uint8_t *buf) { 522 const uint8_t data[] = { 523 0xf0, 0xcf, 0x0f, 0xe3, // P: movw ip,:lower16:S - (P + (L1-P) + 8) 524 0x00, 0xc0, 0x40, 0xe3, // movt ip,:upper16:S - (P + (L1-P) + 8) 525 0x0f, 0xc0, 0x8c, 0xe0, // L1: add ip, ip, pc 526 0x1c, 0xff, 0x2f, 0xe1, // bx ip 527 }; 528 uint64_t s = getARMThunkDestVA(destination); 529 uint64_t p = getThunkTargetSym()->getVA(); 530 int64_t offset = s - p - 16; 531 memcpy(buf, data, sizeof(data)); 532 target->relocateNoSym(buf, R_ARM_MOVW_PREL_NC, offset); 533 target->relocateNoSym(buf + 4, R_ARM_MOVT_PREL, offset); 534 } 535 536 void ARMV7PILongThunk::addSymbols(ThunkSection &isec) { 537 addSymbol(saver.save("__ARMV7PILongThunk_" + destination.getName()), STT_FUNC, 538 0, isec); 539 addSymbol("$a", STT_NOTYPE, 0, isec); 540 } 541 542 void ThumbV7PILongThunk::writeLong(uint8_t *buf) { 543 const uint8_t data[] = { 544 0x4f, 0xf6, 0xf4, 0x7c, // P: movw ip,:lower16:S - (P + (L1-P) + 4) 545 0xc0, 0xf2, 0x00, 0x0c, // movt ip,:upper16:S - (P + (L1-P) + 4) 546 0xfc, 0x44, // L1: add ip, pc 547 0x60, 0x47, // bx ip 548 }; 549 uint64_t s = getARMThunkDestVA(destination); 550 uint64_t p = getThunkTargetSym()->getVA() & ~0x1; 551 int64_t offset = s - p - 12; 552 memcpy(buf, data, sizeof(data)); 553 target->relocateNoSym(buf, R_ARM_THM_MOVW_PREL_NC, offset); 554 target->relocateNoSym(buf + 4, R_ARM_THM_MOVT_PREL, offset); 555 } 556 557 void ThumbV7PILongThunk::addSymbols(ThunkSection &isec) { 558 addSymbol(saver.save("__ThumbV7PILongThunk_" + destination.getName()), 559 STT_FUNC, 1, isec); 560 addSymbol("$t", STT_NOTYPE, 0, isec); 561 } 562 563 void ARMV5ABSLongThunk::writeLong(uint8_t *buf) { 564 const uint8_t data[] = { 565 0x04, 0xf0, 0x1f, 0xe5, // ldr pc, [pc,#-4] ; L1 566 0x00, 0x00, 0x00, 0x00, // L1: .word S 567 }; 568 memcpy(buf, data, sizeof(data)); 569 target->relocateNoSym(buf + 4, R_ARM_ABS32, getARMThunkDestVA(destination)); 570 } 571 572 void ARMV5ABSLongThunk::addSymbols(ThunkSection &isec) { 573 addSymbol(saver.save("__ARMv5ABSLongThunk_" + destination.getName()), 574 STT_FUNC, 0, isec); 575 addSymbol("$a", STT_NOTYPE, 0, isec); 576 addSymbol("$d", STT_NOTYPE, 4, isec); 577 } 578 579 bool ARMV5ABSLongThunk::isCompatibleWith(const InputSection &isec, 580 const Relocation &rel) const { 581 // Thumb branch relocations can't use BLX 582 return rel.type != R_ARM_THM_JUMP19 && rel.type != R_ARM_THM_JUMP24; 583 } 584 585 void ARMV5PILongThunk::writeLong(uint8_t *buf) { 586 const uint8_t data[] = { 587 0x04, 0xc0, 0x9f, 0xe5, // P: ldr ip, [pc,#4] ; L2 588 0x0c, 0xc0, 0x8f, 0xe0, // L1: add ip, pc, ip 589 0x1c, 0xff, 0x2f, 0xe1, // bx ip 590 0x00, 0x00, 0x00, 0x00, // L2: .word S - (P + (L1 - P) + 8) 591 }; 592 uint64_t s = getARMThunkDestVA(destination); 593 uint64_t p = getThunkTargetSym()->getVA() & ~0x1; 594 memcpy(buf, data, sizeof(data)); 595 target->relocateNoSym(buf + 12, R_ARM_REL32, s - p - 12); 596 } 597 598 void ARMV5PILongThunk::addSymbols(ThunkSection &isec) { 599 addSymbol(saver.save("__ARMV5PILongThunk_" + destination.getName()), STT_FUNC, 600 0, isec); 601 addSymbol("$a", STT_NOTYPE, 0, isec); 602 addSymbol("$d", STT_NOTYPE, 12, isec); 603 } 604 605 bool ARMV5PILongThunk::isCompatibleWith(const InputSection &isec, 606 const Relocation &rel) const { 607 // Thumb branch relocations can't use BLX 608 return rel.type != R_ARM_THM_JUMP19 && rel.type != R_ARM_THM_JUMP24; 609 } 610 611 void ThumbV6MABSLongThunk::writeLong(uint8_t *buf) { 612 // Most Thumb instructions cannot access the high registers r8 - r15. As the 613 // only register we can corrupt is r12 we must instead spill a low register 614 // to the stack to use as a scratch register. We push r1 even though we 615 // don't need to get some space to use for the return address. 616 const uint8_t data[] = { 617 0x03, 0xb4, // push {r0, r1} ; Obtain scratch registers 618 0x01, 0x48, // ldr r0, [pc, #4] ; L1 619 0x01, 0x90, // str r0, [sp, #4] ; SP + 4 = S 620 0x01, 0xbd, // pop {r0, pc} ; restore r0 and branch to dest 621 0x00, 0x00, 0x00, 0x00 // L1: .word S 622 }; 623 uint64_t s = getARMThunkDestVA(destination); 624 memcpy(buf, data, sizeof(data)); 625 target->relocateNoSym(buf + 8, R_ARM_ABS32, s); 626 } 627 628 void ThumbV6MABSLongThunk::addSymbols(ThunkSection &isec) { 629 addSymbol(saver.save("__Thumbv6MABSLongThunk_" + destination.getName()), 630 STT_FUNC, 1, isec); 631 addSymbol("$t", STT_NOTYPE, 0, isec); 632 addSymbol("$d", STT_NOTYPE, 8, isec); 633 } 634 635 void ThumbV6MPILongThunk::writeLong(uint8_t *buf) { 636 // Most Thumb instructions cannot access the high registers r8 - r15. As the 637 // only register we can corrupt is ip (r12) we must instead spill a low 638 // register to the stack to use as a scratch register. 639 const uint8_t data[] = { 640 0x01, 0xb4, // P: push {r0} ; Obtain scratch register 641 0x02, 0x48, // ldr r0, [pc, #8] ; L2 642 0x84, 0x46, // mov ip, r0 ; high to low register 643 0x01, 0xbc, // pop {r0} ; restore scratch register 644 0xe7, 0x44, // L1: add pc, ip ; transfer control 645 0xc0, 0x46, // nop ; pad to 4-byte boundary 646 0x00, 0x00, 0x00, 0x00, // L2: .word S - (P + (L1 - P) + 4) 647 }; 648 uint64_t s = getARMThunkDestVA(destination); 649 uint64_t p = getThunkTargetSym()->getVA() & ~0x1; 650 memcpy(buf, data, sizeof(data)); 651 target->relocateNoSym(buf + 12, R_ARM_REL32, s - p - 12); 652 } 653 654 void ThumbV6MPILongThunk::addSymbols(ThunkSection &isec) { 655 addSymbol(saver.save("__Thumbv6MPILongThunk_" + destination.getName()), 656 STT_FUNC, 1, isec); 657 addSymbol("$t", STT_NOTYPE, 0, isec); 658 addSymbol("$d", STT_NOTYPE, 12, isec); 659 } 660 661 // Write MIPS LA25 thunk code to call PIC function from the non-PIC one. 662 void MipsThunk::writeTo(uint8_t *buf) { 663 uint64_t s = destination.getVA(); 664 write32(buf, 0x3c190000); // lui $25, %hi(func) 665 write32(buf + 4, 0x08000000 | (s >> 2)); // j func 666 write32(buf + 8, 0x27390000); // addiu $25, $25, %lo(func) 667 write32(buf + 12, 0x00000000); // nop 668 target->relocateNoSym(buf, R_MIPS_HI16, s); 669 target->relocateNoSym(buf + 8, R_MIPS_LO16, s); 670 } 671 672 void MipsThunk::addSymbols(ThunkSection &isec) { 673 addSymbol(saver.save("__LA25Thunk_" + destination.getName()), STT_FUNC, 0, 674 isec); 675 } 676 677 InputSection *MipsThunk::getTargetInputSection() const { 678 auto &dr = cast<Defined>(destination); 679 return dyn_cast<InputSection>(dr.section); 680 } 681 682 // Write microMIPS R2-R5 LA25 thunk code 683 // to call PIC function from the non-PIC one. 684 void MicroMipsThunk::writeTo(uint8_t *buf) { 685 uint64_t s = destination.getVA(); 686 write16(buf, 0x41b9); // lui $25, %hi(func) 687 write16(buf + 4, 0xd400); // j func 688 write16(buf + 8, 0x3339); // addiu $25, $25, %lo(func) 689 write16(buf + 12, 0x0c00); // nop 690 target->relocateNoSym(buf, R_MICROMIPS_HI16, s); 691 target->relocateNoSym(buf + 4, R_MICROMIPS_26_S1, s); 692 target->relocateNoSym(buf + 8, R_MICROMIPS_LO16, s); 693 } 694 695 void MicroMipsThunk::addSymbols(ThunkSection &isec) { 696 Defined *d = addSymbol( 697 saver.save("__microLA25Thunk_" + destination.getName()), STT_FUNC, 0, isec); 698 d->stOther |= STO_MIPS_MICROMIPS; 699 } 700 701 InputSection *MicroMipsThunk::getTargetInputSection() const { 702 auto &dr = cast<Defined>(destination); 703 return dyn_cast<InputSection>(dr.section); 704 } 705 706 // Write microMIPS R6 LA25 thunk code 707 // to call PIC function from the non-PIC one. 708 void MicroMipsR6Thunk::writeTo(uint8_t *buf) { 709 uint64_t s = destination.getVA(); 710 uint64_t p = getThunkTargetSym()->getVA(); 711 write16(buf, 0x1320); // lui $25, %hi(func) 712 write16(buf + 4, 0x3339); // addiu $25, $25, %lo(func) 713 write16(buf + 8, 0x9400); // bc func 714 target->relocateNoSym(buf, R_MICROMIPS_HI16, s); 715 target->relocateNoSym(buf + 4, R_MICROMIPS_LO16, s); 716 target->relocateNoSym(buf + 8, R_MICROMIPS_PC26_S1, s - p - 12); 717 } 718 719 void MicroMipsR6Thunk::addSymbols(ThunkSection &isec) { 720 Defined *d = addSymbol( 721 saver.save("__microLA25Thunk_" + destination.getName()), STT_FUNC, 0, isec); 722 d->stOther |= STO_MIPS_MICROMIPS; 723 } 724 725 InputSection *MicroMipsR6Thunk::getTargetInputSection() const { 726 auto &dr = cast<Defined>(destination); 727 return dyn_cast<InputSection>(dr.section); 728 } 729 730 void elf::writePPC32PltCallStub(uint8_t *buf, uint64_t gotPltVA, 731 const InputFile *file, int64_t addend) { 732 if (!config->isPic) { 733 write32(buf + 0, 0x3d600000 | (gotPltVA + 0x8000) >> 16); // lis r11,ha 734 write32(buf + 4, 0x816b0000 | (uint16_t)gotPltVA); // lwz r11,l(r11) 735 write32(buf + 8, 0x7d6903a6); // mtctr r11 736 write32(buf + 12, 0x4e800420); // bctr 737 return; 738 } 739 uint32_t offset; 740 if (addend >= 0x8000) { 741 // The stub loads an address relative to r30 (.got2+Addend). Addend is 742 // almost always 0x8000. The address of .got2 is different in another object 743 // file, so a stub cannot be shared. 744 offset = gotPltVA - (in.ppc32Got2->getParent()->getVA() + 745 file->ppc32Got2OutSecOff + addend); 746 } else { 747 // The stub loads an address relative to _GLOBAL_OFFSET_TABLE_ (which is 748 // currently the address of .got). 749 offset = gotPltVA - in.got->getVA(); 750 } 751 uint16_t ha = (offset + 0x8000) >> 16, l = (uint16_t)offset; 752 if (ha == 0) { 753 write32(buf + 0, 0x817e0000 | l); // lwz r11,l(r30) 754 write32(buf + 4, 0x7d6903a6); // mtctr r11 755 write32(buf + 8, 0x4e800420); // bctr 756 write32(buf + 12, 0x60000000); // nop 757 } else { 758 write32(buf + 0, 0x3d7e0000 | ha); // addis r11,r30,ha 759 write32(buf + 4, 0x816b0000 | l); // lwz r11,l(r11) 760 write32(buf + 8, 0x7d6903a6); // mtctr r11 761 write32(buf + 12, 0x4e800420); // bctr 762 } 763 } 764 765 void PPC32PltCallStub::writeTo(uint8_t *buf) { 766 writePPC32PltCallStub(buf, destination.getGotPltVA(), file, addend); 767 } 768 769 void PPC32PltCallStub::addSymbols(ThunkSection &isec) { 770 std::string buf; 771 raw_string_ostream os(buf); 772 os << format_hex_no_prefix(addend, 8); 773 if (!config->isPic) 774 os << ".plt_call32."; 775 else if (addend >= 0x8000) 776 os << ".got2.plt_pic32."; 777 else 778 os << ".plt_pic32."; 779 os << destination.getName(); 780 addSymbol(saver.save(os.str()), STT_FUNC, 0, isec); 781 } 782 783 bool PPC32PltCallStub::isCompatibleWith(const InputSection &isec, 784 const Relocation &rel) const { 785 return !config->isPic || (isec.file == file && rel.addend == addend); 786 } 787 788 void PPC32LongThunk::addSymbols(ThunkSection &isec) { 789 addSymbol(saver.save("__LongThunk_" + destination.getName()), STT_FUNC, 0, 790 isec); 791 } 792 793 void PPC32LongThunk::writeTo(uint8_t *buf) { 794 auto ha = [](uint32_t v) -> uint16_t { return (v + 0x8000) >> 16; }; 795 auto lo = [](uint32_t v) -> uint16_t { return v; }; 796 uint32_t d = destination.getVA(addend); 797 if (config->isPic) { 798 uint32_t off = d - (getThunkTargetSym()->getVA() + 8); 799 write32(buf + 0, 0x7c0802a6); // mflr r12,0 800 write32(buf + 4, 0x429f0005); // bcl r20,r31,.+4 801 write32(buf + 8, 0x7d8802a6); // mtctr r12 802 write32(buf + 12, 0x3d8c0000 | ha(off)); // addis r12,r12,off@ha 803 write32(buf + 16, 0x398c0000 | lo(off)); // addi r12,r12,off@l 804 write32(buf + 20, 0x7c0803a6); // mtlr r0 805 buf += 24; 806 } else { 807 write32(buf + 0, 0x3d800000 | ha(d)); // lis r12,d@ha 808 write32(buf + 4, 0x398c0000 | lo(d)); // addi r12,r12,d@l 809 buf += 8; 810 } 811 write32(buf + 0, 0x7d8903a6); // mtctr r12 812 write32(buf + 4, 0x4e800420); // bctr 813 } 814 815 void elf::writePPC64LoadAndBranch(uint8_t *buf, int64_t offset) { 816 uint16_t offHa = (offset + 0x8000) >> 16; 817 uint16_t offLo = offset & 0xffff; 818 819 write32(buf + 0, 0x3d820000 | offHa); // addis r12, r2, OffHa 820 write32(buf + 4, 0xe98c0000 | offLo); // ld r12, OffLo(r12) 821 write32(buf + 8, 0x7d8903a6); // mtctr r12 822 write32(buf + 12, 0x4e800420); // bctr 823 } 824 825 void PPC64PltCallStub::writeTo(uint8_t *buf) { 826 int64_t offset = destination.getGotPltVA() - getPPC64TocBase(); 827 // Save the TOC pointer to the save-slot reserved in the call frame. 828 write32(buf + 0, 0xf8410018); // std r2,24(r1) 829 writePPC64LoadAndBranch(buf + 4, offset); 830 } 831 832 void PPC64PltCallStub::addSymbols(ThunkSection &isec) { 833 Defined *s = addSymbol(saver.save("__plt_" + destination.getName()), STT_FUNC, 834 0, isec); 835 s->needsTocRestore = true; 836 s->file = destination.file; 837 } 838 839 void PPC64R2SaveStub::writeTo(uint8_t *buf) { 840 int64_t offset = destination.getVA() - (getThunkTargetSym()->getVA() + 4); 841 // The branch offset needs to fit in 26 bits. 842 if (!isInt<26>(offset)) 843 fatal("R2 save stub branch offset is too large: " + Twine(offset)); 844 write32(buf + 0, 0xf8410018); // std r2,24(r1) 845 write32(buf + 4, 0x48000000 | (offset & 0x03fffffc)); // b <offset> 846 } 847 848 void PPC64R2SaveStub::addSymbols(ThunkSection &isec) { 849 Defined *s = addSymbol(saver.save("__toc_save_" + destination.getName()), 850 STT_FUNC, 0, isec); 851 s->needsTocRestore = true; 852 } 853 854 void PPC64LongBranchThunk::writeTo(uint8_t *buf) { 855 int64_t offset = in.ppc64LongBranchTarget->getEntryVA(&destination, addend) - 856 getPPC64TocBase(); 857 writePPC64LoadAndBranch(buf, offset); 858 } 859 860 void PPC64LongBranchThunk::addSymbols(ThunkSection &isec) { 861 addSymbol(saver.save("__long_branch_" + destination.getName()), STT_FUNC, 0, 862 isec); 863 } 864 865 Thunk::Thunk(Symbol &d, int64_t a) : destination(d), addend(a), offset(0) {} 866 867 Thunk::~Thunk() = default; 868 869 static Thunk *addThunkAArch64(RelType type, Symbol &s, int64_t a) { 870 if (type != R_AARCH64_CALL26 && type != R_AARCH64_JUMP26 && 871 type != R_AARCH64_PLT32) 872 fatal("unrecognized relocation type"); 873 if (config->picThunk) 874 return make<AArch64ADRPThunk>(s, a); 875 return make<AArch64ABSLongThunk>(s, a); 876 } 877 878 // Creates a thunk for Thumb-ARM interworking. 879 // Arm Architectures v5 and v6 do not support Thumb2 technology. This means 880 // - MOVT and MOVW instructions cannot be used 881 // - Only Thumb relocation that can generate a Thunk is a BL, this can always 882 // be transformed into a BLX 883 static Thunk *addThunkPreArmv7(RelType reloc, Symbol &s) { 884 switch (reloc) { 885 case R_ARM_PC24: 886 case R_ARM_PLT32: 887 case R_ARM_JUMP24: 888 case R_ARM_CALL: 889 case R_ARM_THM_CALL: 890 if (config->picThunk) 891 return make<ARMV5PILongThunk>(s); 892 return make<ARMV5ABSLongThunk>(s); 893 } 894 fatal("relocation " + toString(reloc) + " to " + toString(s) + 895 " not supported for Armv5 or Armv6 targets"); 896 } 897 898 // Create a thunk for Thumb long branch on V6-M. 899 // Arm Architecture v6-M only supports Thumb instructions. This means 900 // - MOVT and MOVW instructions cannot be used. 901 // - Only a limited number of instructions can access registers r8 and above 902 // - No interworking support is needed (all Thumb). 903 static Thunk *addThunkV6M(RelType reloc, Symbol &s) { 904 switch (reloc) { 905 case R_ARM_THM_JUMP19: 906 case R_ARM_THM_JUMP24: 907 case R_ARM_THM_CALL: 908 if (config->isPic) 909 return make<ThumbV6MPILongThunk>(s); 910 return make<ThumbV6MABSLongThunk>(s); 911 } 912 fatal("relocation " + toString(reloc) + " to " + toString(s) + 913 " not supported for Armv6-M targets"); 914 } 915 916 // Creates a thunk for Thumb-ARM interworking or branch range extension. 917 static Thunk *addThunkArm(RelType reloc, Symbol &s) { 918 // Decide which Thunk is needed based on: 919 // Available instruction set 920 // - An Arm Thunk can only be used if Arm state is available. 921 // - A Thumb Thunk can only be used if Thumb state is available. 922 // - Can only use a Thunk if it uses instructions that the Target supports. 923 // Relocation is branch or branch and link 924 // - Branch instructions cannot change state, can only select Thunk that 925 // starts in the same state as the caller. 926 // - Branch and link relocations can change state, can select Thunks from 927 // either Arm or Thumb. 928 // Position independent Thunks if we require position independent code. 929 930 // Handle architectures that have restrictions on the instructions that they 931 // can use in Thunks. The flags below are set by reading the BuildAttributes 932 // of the input objects. InputFiles.cpp contains the mapping from ARM 933 // architecture to flag. 934 if (!config->armHasMovtMovw) { 935 if (!config->armJ1J2BranchEncoding) 936 return addThunkPreArmv7(reloc, s); 937 return addThunkV6M(reloc, s); 938 } 939 940 switch (reloc) { 941 case R_ARM_PC24: 942 case R_ARM_PLT32: 943 case R_ARM_JUMP24: 944 case R_ARM_CALL: 945 if (config->picThunk) 946 return make<ARMV7PILongThunk>(s); 947 return make<ARMV7ABSLongThunk>(s); 948 case R_ARM_THM_JUMP19: 949 case R_ARM_THM_JUMP24: 950 case R_ARM_THM_CALL: 951 if (config->picThunk) 952 return make<ThumbV7PILongThunk>(s); 953 return make<ThumbV7ABSLongThunk>(s); 954 } 955 fatal("unrecognized relocation type"); 956 } 957 958 static Thunk *addThunkMips(RelType type, Symbol &s) { 959 if ((s.stOther & STO_MIPS_MICROMIPS) && isMipsR6()) 960 return make<MicroMipsR6Thunk>(s); 961 if (s.stOther & STO_MIPS_MICROMIPS) 962 return make<MicroMipsThunk>(s); 963 return make<MipsThunk>(s); 964 } 965 966 static Thunk *addThunkPPC32(const InputSection &isec, const Relocation &rel, 967 Symbol &s) { 968 assert((rel.type == R_PPC_LOCAL24PC || rel.type == R_PPC_REL24 || 969 rel.type == R_PPC_PLTREL24) && 970 "unexpected relocation type for thunk"); 971 if (s.isInPlt()) 972 return make<PPC32PltCallStub>(isec, rel, s); 973 return make<PPC32LongThunk>(s, rel.addend); 974 } 975 976 static Thunk *addThunkPPC64(RelType type, Symbol &s, int64_t a) { 977 assert((type == R_PPC64_REL14 || type == R_PPC64_REL24) && 978 "unexpected relocation type for thunk"); 979 if (s.isInPlt()) 980 return make<PPC64PltCallStub>(s); 981 982 // This check looks at the st_other bits of the callee. If the value is 1 983 // then the callee clobbers the TOC and we need an R2 save stub. 984 if ((s.stOther >> 5) == 1) 985 return make<PPC64R2SaveStub>(s); 986 987 if (config->picThunk) 988 return make<PPC64PILongBranchThunk>(s, a); 989 990 return make<PPC64PDLongBranchThunk>(s, a); 991 } 992 993 Thunk *elf::addThunk(const InputSection &isec, Relocation &rel) { 994 Symbol &s = *rel.sym; 995 int64_t a = rel.addend; 996 997 if (config->emachine == EM_AARCH64) 998 return addThunkAArch64(rel.type, s, a); 999 1000 if (config->emachine == EM_ARM) 1001 return addThunkArm(rel.type, s); 1002 1003 if (config->emachine == EM_MIPS) 1004 return addThunkMips(rel.type, s); 1005 1006 if (config->emachine == EM_PPC) 1007 return addThunkPPC32(isec, rel, s); 1008 1009 if (config->emachine == EM_PPC64) 1010 return addThunkPPC64(rel.type, s, a); 1011 1012 llvm_unreachable("add Thunk only supported for ARM, Mips and PowerPC"); 1013 } 1014