1 //===- Thunks.cpp --------------------------------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===---------------------------------------------------------------------===// 8 // 9 // This file contains Thunk subclasses. 10 // 11 // A thunk is a small piece of code written after an input section 12 // which is used to jump between "incompatible" functions 13 // such as MIPS PIC and non-PIC or ARM non-Thumb and Thumb functions. 14 // 15 // If a jump target is too far and its address doesn't fit to a 16 // short jump instruction, we need to create a thunk too, but we 17 // haven't supported it yet. 18 // 19 // i386 and x86-64 don't need thunks. 20 // 21 //===---------------------------------------------------------------------===// 22 23 #include "Thunks.h" 24 #include "Config.h" 25 #include "InputFiles.h" 26 #include "InputSection.h" 27 #include "OutputSections.h" 28 #include "Symbols.h" 29 #include "SyntheticSections.h" 30 #include "Target.h" 31 #include "lld/Common/CommonLinkerContext.h" 32 #include "llvm/BinaryFormat/ELF.h" 33 #include "llvm/Support/Casting.h" 34 #include "llvm/Support/ErrorHandling.h" 35 #include "llvm/Support/MathExtras.h" 36 #include <cstdint> 37 #include <cstring> 38 39 using namespace llvm; 40 using namespace llvm::object; 41 using namespace llvm::ELF; 42 using namespace lld; 43 using namespace lld::elf; 44 45 namespace { 46 47 // AArch64 long range Thunks 48 class AArch64ABSLongThunk final : public Thunk { 49 public: 50 AArch64ABSLongThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {} 51 uint32_t size() override { return 16; } 52 void writeTo(uint8_t *buf) override; 53 void addSymbols(ThunkSection &isec) override; 54 }; 55 56 class AArch64ADRPThunk final : public Thunk { 57 public: 58 AArch64ADRPThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {} 59 uint32_t size() override { return 12; } 60 void writeTo(uint8_t *buf) override; 61 void addSymbols(ThunkSection &isec) override; 62 }; 63 64 // Base class for ARM thunks. 65 // 66 // An ARM thunk may be either short or long. A short thunk is simply a branch 67 // (B) instruction, and it may be used to call ARM functions when the distance 68 // from the thunk to the target is less than 32MB. Long thunks can branch to any 69 // virtual address and can switch between ARM and Thumb, and they are 70 // implemented in the derived classes. This class tries to create a short thunk 71 // if the target is in range, otherwise it creates a long thunk. 72 class ARMThunk : public Thunk { 73 public: 74 ARMThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {} 75 76 bool getMayUseShortThunk(); 77 uint32_t size() override { return getMayUseShortThunk() ? 4 : sizeLong(); } 78 void writeTo(uint8_t *buf) override; 79 bool isCompatibleWith(const InputSection &isec, 80 const Relocation &rel) const override; 81 82 // Returns the size of a long thunk. 83 virtual uint32_t sizeLong() = 0; 84 85 // Writes a long thunk to Buf. 86 virtual void writeLong(uint8_t *buf) = 0; 87 88 private: 89 // This field tracks whether all previously considered layouts would allow 90 // this thunk to be short. If we have ever needed a long thunk, we always 91 // create a long thunk, even if the thunk may be short given the current 92 // distance to the target. We do this because transitioning from long to short 93 // can create layout oscillations in certain corner cases which would prevent 94 // the layout from converging. 95 bool mayUseShortThunk = true; 96 }; 97 98 // Base class for Thumb-2 thunks. 99 // 100 // This class is similar to ARMThunk, but it uses the Thumb-2 B.W instruction 101 // which has a range of 16MB. 102 class ThumbThunk : public Thunk { 103 public: 104 ThumbThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) { 105 alignment = 2; 106 } 107 108 bool getMayUseShortThunk(); 109 uint32_t size() override { return getMayUseShortThunk() ? 4 : sizeLong(); } 110 void writeTo(uint8_t *buf) override; 111 bool isCompatibleWith(const InputSection &isec, 112 const Relocation &rel) const override; 113 114 // Returns the size of a long thunk. 115 virtual uint32_t sizeLong() = 0; 116 117 // Writes a long thunk to Buf. 118 virtual void writeLong(uint8_t *buf) = 0; 119 120 private: 121 // See comment in ARMThunk above. 122 bool mayUseShortThunk = true; 123 }; 124 125 // Specific ARM Thunk implementations. The naming convention is: 126 // Source State, TargetState, Target Requirement, ABS or PI, Range 127 class ARMV7ABSLongThunk final : public ARMThunk { 128 public: 129 ARMV7ABSLongThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {} 130 131 uint32_t sizeLong() override { return 12; } 132 void writeLong(uint8_t *buf) override; 133 void addSymbols(ThunkSection &isec) override; 134 }; 135 136 class ARMV7PILongThunk final : public ARMThunk { 137 public: 138 ARMV7PILongThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {} 139 140 uint32_t sizeLong() override { return 16; } 141 void writeLong(uint8_t *buf) override; 142 void addSymbols(ThunkSection &isec) override; 143 }; 144 145 class ThumbV7ABSLongThunk final : public ThumbThunk { 146 public: 147 ThumbV7ABSLongThunk(Symbol &dest, int64_t addend) 148 : ThumbThunk(dest, addend) {} 149 150 uint32_t sizeLong() override { return 10; } 151 void writeLong(uint8_t *buf) override; 152 void addSymbols(ThunkSection &isec) override; 153 }; 154 155 class ThumbV7PILongThunk final : public ThumbThunk { 156 public: 157 ThumbV7PILongThunk(Symbol &dest, int64_t addend) : ThumbThunk(dest, addend) {} 158 159 uint32_t sizeLong() override { return 12; } 160 void writeLong(uint8_t *buf) override; 161 void addSymbols(ThunkSection &isec) override; 162 }; 163 164 // Implementations of Thunks for Arm v6-M. Only Thumb instructions are permitted 165 class ThumbV6MABSLongThunk final : public ThumbThunk { 166 public: 167 ThumbV6MABSLongThunk(Symbol &dest, int64_t addend) 168 : ThumbThunk(dest, addend) {} 169 170 uint32_t sizeLong() override { return 12; } 171 void writeLong(uint8_t *buf) override; 172 void addSymbols(ThunkSection &isec) override; 173 }; 174 175 class ThumbV6MPILongThunk final : public ThumbThunk { 176 public: 177 ThumbV6MPILongThunk(Symbol &dest, int64_t addend) 178 : ThumbThunk(dest, addend) {} 179 180 uint32_t sizeLong() override { return 16; } 181 void writeLong(uint8_t *buf) override; 182 void addSymbols(ThunkSection &isec) override; 183 }; 184 185 // Architectures v4, v5 and v6 do not support the movt/movw instructions. v5 and 186 // v6 support BLX to which BL instructions can be rewritten inline. There are no 187 // Thumb entrypoints for v5 and v6 as there is no Thumb branch instruction on 188 // these architecture that can result in a thunk. 189 190 // LDR on v5 and v6 can switch processor state, so for v5 and v6, 191 // ARMV5LongLdrPcThunk can be used for both Arm->Arm and Arm->Thumb calls. v4 192 // can also use this thunk, but only for Arm->Arm calls. 193 class ARMV5LongLdrPcThunk final : public ARMThunk { 194 public: 195 ARMV5LongLdrPcThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {} 196 197 uint32_t sizeLong() override { return 8; } 198 void writeLong(uint8_t *buf) override; 199 void addSymbols(ThunkSection &isec) override; 200 }; 201 202 // Implementations of Thunks for v4. BLX is not supported, and loads 203 // will not invoke Arm/Thumb state changes. 204 class ARMV4PILongBXThunk final : public ARMThunk { 205 public: 206 ARMV4PILongBXThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {} 207 208 uint32_t sizeLong() override { return 16; } 209 void writeLong(uint8_t *buf) override; 210 void addSymbols(ThunkSection &isec) override; 211 }; 212 213 class ARMV4PILongThunk final : public ARMThunk { 214 public: 215 ARMV4PILongThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {} 216 217 uint32_t sizeLong() override { return 12; } 218 void writeLong(uint8_t *buf) override; 219 void addSymbols(ThunkSection &isec) override; 220 }; 221 222 class ThumbV4PILongBXThunk final : public ThumbThunk { 223 public: 224 ThumbV4PILongBXThunk(Symbol &dest, int64_t addend) 225 : ThumbThunk(dest, addend) {} 226 227 uint32_t sizeLong() override { return 16; } 228 void writeLong(uint8_t *buf) override; 229 void addSymbols(ThunkSection &isec) override; 230 }; 231 232 class ThumbV4PILongThunk final : public ThumbThunk { 233 public: 234 ThumbV4PILongThunk(Symbol &dest, int64_t addend) 235 : ThumbThunk(dest, addend) {} 236 237 uint32_t sizeLong() override { return 20; } 238 void writeLong(uint8_t *buf) override; 239 void addSymbols(ThunkSection &isec) override; 240 }; 241 242 class ARMV4ABSLongBXThunk final : public ARMThunk { 243 public: 244 ARMV4ABSLongBXThunk(Symbol &dest, int64_t addend) : ARMThunk(dest, addend) {} 245 246 uint32_t sizeLong() override { return 12; } 247 void writeLong(uint8_t *buf) override; 248 void addSymbols(ThunkSection &isec) override; 249 }; 250 251 class ThumbV4ABSLongBXThunk final : public ThumbThunk { 252 public: 253 ThumbV4ABSLongBXThunk(Symbol &dest, int64_t addend) 254 : ThumbThunk(dest, addend) {} 255 256 uint32_t sizeLong() override { return 12; } 257 void writeLong(uint8_t *buf) override; 258 void addSymbols(ThunkSection &isec) override; 259 }; 260 261 class ThumbV4ABSLongThunk final : public ThumbThunk { 262 public: 263 ThumbV4ABSLongThunk(Symbol &dest, int64_t addend) 264 : ThumbThunk(dest, addend) {} 265 266 uint32_t sizeLong() override { return 16; } 267 void writeLong(uint8_t *buf) override; 268 void addSymbols(ThunkSection &isec) override; 269 }; 270 271 // MIPS LA25 thunk 272 class MipsThunk final : public Thunk { 273 public: 274 MipsThunk(Symbol &dest) : Thunk(dest, 0) {} 275 276 uint32_t size() override { return 16; } 277 void writeTo(uint8_t *buf) override; 278 void addSymbols(ThunkSection &isec) override; 279 InputSection *getTargetInputSection() const override; 280 }; 281 282 // microMIPS R2-R5 LA25 thunk 283 class MicroMipsThunk final : public Thunk { 284 public: 285 MicroMipsThunk(Symbol &dest) : Thunk(dest, 0) {} 286 287 uint32_t size() override { return 14; } 288 void writeTo(uint8_t *buf) override; 289 void addSymbols(ThunkSection &isec) override; 290 InputSection *getTargetInputSection() const override; 291 }; 292 293 // microMIPS R6 LA25 thunk 294 class MicroMipsR6Thunk final : public Thunk { 295 public: 296 MicroMipsR6Thunk(Symbol &dest) : Thunk(dest, 0) {} 297 298 uint32_t size() override { return 12; } 299 void writeTo(uint8_t *buf) override; 300 void addSymbols(ThunkSection &isec) override; 301 InputSection *getTargetInputSection() const override; 302 }; 303 304 class PPC32PltCallStub final : public Thunk { 305 public: 306 // For R_PPC_PLTREL24, Thunk::addend records the addend which will be used to 307 // decide the offsets in the call stub. 308 PPC32PltCallStub(const InputSection &isec, const Relocation &rel, 309 Symbol &dest) 310 : Thunk(dest, rel.addend), file(isec.file) {} 311 uint32_t size() override { return 16; } 312 void writeTo(uint8_t *buf) override; 313 void addSymbols(ThunkSection &isec) override; 314 bool isCompatibleWith(const InputSection &isec, const Relocation &rel) const override; 315 316 private: 317 // Records the call site of the call stub. 318 const InputFile *file; 319 }; 320 321 class PPC32LongThunk final : public Thunk { 322 public: 323 PPC32LongThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {} 324 uint32_t size() override { return config->isPic ? 32 : 16; } 325 void writeTo(uint8_t *buf) override; 326 void addSymbols(ThunkSection &isec) override; 327 }; 328 329 // PPC64 Plt call stubs. 330 // Any call site that needs to call through a plt entry needs a call stub in 331 // the .text section. The call stub is responsible for: 332 // 1) Saving the toc-pointer to the stack. 333 // 2) Loading the target functions address from the procedure linkage table into 334 // r12 for use by the target functions global entry point, and into the count 335 // register. 336 // 3) Transferring control to the target function through an indirect branch. 337 class PPC64PltCallStub final : public Thunk { 338 public: 339 PPC64PltCallStub(Symbol &dest) : Thunk(dest, 0) {} 340 uint32_t size() override { return 20; } 341 void writeTo(uint8_t *buf) override; 342 void addSymbols(ThunkSection &isec) override; 343 bool isCompatibleWith(const InputSection &isec, 344 const Relocation &rel) const override; 345 }; 346 347 // PPC64 R2 Save Stub 348 // When the caller requires a valid R2 TOC pointer but the callee does not 349 // require a TOC pointer and the callee cannot guarantee that it doesn't 350 // clobber R2 then we need to save R2. This stub: 351 // 1) Saves the TOC pointer to the stack. 352 // 2) Tail calls the callee. 353 class PPC64R2SaveStub final : public Thunk { 354 public: 355 PPC64R2SaveStub(Symbol &dest, int64_t addend) : Thunk(dest, addend) { 356 alignment = 16; 357 } 358 359 // To prevent oscillations in layout when moving from short to long thunks 360 // we make sure that once a thunk has been set to long it cannot go back. 361 bool getMayUseShortThunk() { 362 if (!mayUseShortThunk) 363 return false; 364 if (!isInt<26>(computeOffset())) { 365 mayUseShortThunk = false; 366 return false; 367 } 368 return true; 369 } 370 uint32_t size() override { return getMayUseShortThunk() ? 8 : 32; } 371 void writeTo(uint8_t *buf) override; 372 void addSymbols(ThunkSection &isec) override; 373 bool isCompatibleWith(const InputSection &isec, 374 const Relocation &rel) const override; 375 376 private: 377 // Transitioning from long to short can create layout oscillations in 378 // certain corner cases which would prevent the layout from converging. 379 // This is similar to the handling for ARMThunk. 380 bool mayUseShortThunk = true; 381 int64_t computeOffset() const { 382 return destination.getVA() - (getThunkTargetSym()->getVA() + 4); 383 } 384 }; 385 386 // PPC64 R12 Setup Stub 387 // When a caller that does not maintain a toc-pointer performs a local call to 388 // a callee which requires a toc-pointer then we need this stub to place the 389 // callee's global entry point into r12 without a save of R2. 390 class PPC64R12SetupStub final : public Thunk { 391 public: 392 PPC64R12SetupStub(Symbol &dest) : Thunk(dest, 0) { alignment = 16; } 393 uint32_t size() override { return 32; } 394 void writeTo(uint8_t *buf) override; 395 void addSymbols(ThunkSection &isec) override; 396 bool isCompatibleWith(const InputSection &isec, 397 const Relocation &rel) const override; 398 }; 399 400 // PPC64 PC-relative PLT Stub 401 // When a caller that does not maintain a toc-pointer performs an extern call 402 // then this stub is needed for: 403 // 1) Loading the target functions address from the procedure linkage table into 404 // r12 for use by the target functions global entry point, and into the count 405 // register with pc-relative instructions. 406 // 2) Transferring control to the target function through an indirect branch. 407 class PPC64PCRelPLTStub final : public Thunk { 408 public: 409 PPC64PCRelPLTStub(Symbol &dest) : Thunk(dest, 0) { alignment = 16; } 410 uint32_t size() override { return 32; } 411 void writeTo(uint8_t *buf) override; 412 void addSymbols(ThunkSection &isec) override; 413 bool isCompatibleWith(const InputSection &isec, 414 const Relocation &rel) const override; 415 }; 416 417 // A bl instruction uses a signed 24 bit offset, with an implicit 4 byte 418 // alignment. This gives a possible 26 bits of 'reach'. If the call offset is 419 // larger than that we need to emit a long-branch thunk. The target address 420 // of the callee is stored in a table to be accessed TOC-relative. Since the 421 // call must be local (a non-local call will have a PltCallStub instead) the 422 // table stores the address of the callee's local entry point. For 423 // position-independent code a corresponding relative dynamic relocation is 424 // used. 425 class PPC64LongBranchThunk : public Thunk { 426 public: 427 uint32_t size() override { return 32; } 428 void writeTo(uint8_t *buf) override; 429 void addSymbols(ThunkSection &isec) override; 430 bool isCompatibleWith(const InputSection &isec, 431 const Relocation &rel) const override; 432 433 protected: 434 PPC64LongBranchThunk(Symbol &dest, int64_t addend) : Thunk(dest, addend) {} 435 }; 436 437 class PPC64PILongBranchThunk final : public PPC64LongBranchThunk { 438 public: 439 PPC64PILongBranchThunk(Symbol &dest, int64_t addend) 440 : PPC64LongBranchThunk(dest, addend) { 441 assert(!dest.isPreemptible); 442 if (std::optional<uint32_t> index = 443 in.ppc64LongBranchTarget->addEntry(&dest, addend)) { 444 mainPart->relaDyn->addRelativeReloc( 445 target->relativeRel, *in.ppc64LongBranchTarget, *index * UINT64_C(8), 446 dest, addend + getPPC64GlobalEntryToLocalEntryOffset(dest.stOther), 447 target->symbolicRel, R_ABS); 448 } 449 } 450 }; 451 452 class PPC64PDLongBranchThunk final : public PPC64LongBranchThunk { 453 public: 454 PPC64PDLongBranchThunk(Symbol &dest, int64_t addend) 455 : PPC64LongBranchThunk(dest, addend) { 456 in.ppc64LongBranchTarget->addEntry(&dest, addend); 457 } 458 }; 459 460 } // end anonymous namespace 461 462 Defined *Thunk::addSymbol(StringRef name, uint8_t type, uint64_t value, 463 InputSectionBase §ion) { 464 Defined *d = addSyntheticLocal(name, type, value, /*size=*/0, section); 465 syms.push_back(d); 466 return d; 467 } 468 469 void Thunk::setOffset(uint64_t newOffset) { 470 for (Defined *d : syms) 471 d->value = d->value - offset + newOffset; 472 offset = newOffset; 473 } 474 475 // AArch64 long range Thunks 476 477 static uint64_t getAArch64ThunkDestVA(const Symbol &s, int64_t a) { 478 uint64_t v = s.isInPlt() ? s.getPltVA() : s.getVA(a); 479 return v; 480 } 481 482 void AArch64ABSLongThunk::writeTo(uint8_t *buf) { 483 const uint8_t data[] = { 484 0x50, 0x00, 0x00, 0x58, // ldr x16, L0 485 0x00, 0x02, 0x1f, 0xd6, // br x16 486 0x00, 0x00, 0x00, 0x00, // L0: .xword S 487 0x00, 0x00, 0x00, 0x00, 488 }; 489 uint64_t s = getAArch64ThunkDestVA(destination, addend); 490 memcpy(buf, data, sizeof(data)); 491 target->relocateNoSym(buf + 8, R_AARCH64_ABS64, s); 492 } 493 494 void AArch64ABSLongThunk::addSymbols(ThunkSection &isec) { 495 addSymbol(saver().save("__AArch64AbsLongThunk_" + destination.getName()), 496 STT_FUNC, 0, isec); 497 addSymbol("$x", STT_NOTYPE, 0, isec); 498 addSymbol("$d", STT_NOTYPE, 8, isec); 499 } 500 501 // This Thunk has a maximum range of 4Gb, this is sufficient for all programs 502 // using the small code model, including pc-relative ones. At time of writing 503 // clang and gcc do not support the large code model for position independent 504 // code so it is safe to use this for position independent thunks without 505 // worrying about the destination being more than 4Gb away. 506 void AArch64ADRPThunk::writeTo(uint8_t *buf) { 507 const uint8_t data[] = { 508 0x10, 0x00, 0x00, 0x90, // adrp x16, Dest R_AARCH64_ADR_PREL_PG_HI21(Dest) 509 0x10, 0x02, 0x00, 0x91, // add x16, x16, R_AARCH64_ADD_ABS_LO12_NC(Dest) 510 0x00, 0x02, 0x1f, 0xd6, // br x16 511 }; 512 uint64_t s = getAArch64ThunkDestVA(destination, addend); 513 uint64_t p = getThunkTargetSym()->getVA(); 514 memcpy(buf, data, sizeof(data)); 515 target->relocateNoSym(buf, R_AARCH64_ADR_PREL_PG_HI21, 516 getAArch64Page(s) - getAArch64Page(p)); 517 target->relocateNoSym(buf + 4, R_AARCH64_ADD_ABS_LO12_NC, s); 518 } 519 520 void AArch64ADRPThunk::addSymbols(ThunkSection &isec) { 521 addSymbol(saver().save("__AArch64ADRPThunk_" + destination.getName()), 522 STT_FUNC, 0, isec); 523 addSymbol("$x", STT_NOTYPE, 0, isec); 524 } 525 526 // ARM Target Thunks 527 static uint64_t getARMThunkDestVA(const Symbol &s) { 528 uint64_t v = s.isInPlt() ? s.getPltVA() : s.getVA(); 529 return SignExtend64<32>(v); 530 } 531 532 // This function returns true if the target is not Thumb and is within 2^26, and 533 // it has not previously returned false (see comment for mayUseShortThunk). 534 bool ARMThunk::getMayUseShortThunk() { 535 if (!mayUseShortThunk) 536 return false; 537 uint64_t s = getARMThunkDestVA(destination); 538 if (s & 1) { 539 mayUseShortThunk = false; 540 return false; 541 } 542 uint64_t p = getThunkTargetSym()->getVA(); 543 int64_t offset = s - p - 8; 544 mayUseShortThunk = llvm::isInt<26>(offset); 545 return mayUseShortThunk; 546 } 547 548 void ARMThunk::writeTo(uint8_t *buf) { 549 if (!getMayUseShortThunk()) { 550 writeLong(buf); 551 return; 552 } 553 554 uint64_t s = getARMThunkDestVA(destination); 555 uint64_t p = getThunkTargetSym()->getVA(); 556 int64_t offset = s - p - 8; 557 const uint8_t data[] = { 558 0x00, 0x00, 0x00, 0xea, // b S 559 }; 560 memcpy(buf, data, sizeof(data)); 561 target->relocateNoSym(buf, R_ARM_JUMP24, offset); 562 } 563 564 bool ARMThunk::isCompatibleWith(const InputSection &isec, 565 const Relocation &rel) const { 566 // v4T does not have BLX, so also deny R_ARM_THM_CALL 567 if (!config->armHasBlx && rel.type == R_ARM_THM_CALL) 568 return false; 569 570 // Thumb branch relocations can't use BLX 571 return rel.type != R_ARM_THM_JUMP19 && rel.type != R_ARM_THM_JUMP24; 572 } 573 574 // This function returns true if: 575 // the target is Thumb 576 // && is within branch range 577 // && this function has not previously returned false 578 // (see comment for mayUseShortThunk) 579 // && the arch supports Thumb branch range extension. 580 bool ThumbThunk::getMayUseShortThunk() { 581 if (!mayUseShortThunk || !config->armJ1J2BranchEncoding) 582 return false; 583 uint64_t s = getARMThunkDestVA(destination); 584 if ((s & 1) == 0) { 585 mayUseShortThunk = false; 586 return false; 587 } 588 uint64_t p = getThunkTargetSym()->getVA() & ~1; 589 int64_t offset = s - p - 4; 590 mayUseShortThunk = llvm::isInt<25>(offset); 591 return mayUseShortThunk; 592 } 593 594 void ThumbThunk::writeTo(uint8_t *buf) { 595 if (!getMayUseShortThunk()) { 596 writeLong(buf); 597 return; 598 } 599 600 uint64_t s = getARMThunkDestVA(destination); 601 uint64_t p = getThunkTargetSym()->getVA(); 602 int64_t offset = s - p - 4; 603 const uint8_t data[] = { 604 0x00, 0xf0, 0x00, 0xb0, // b.w S 605 }; 606 memcpy(buf, data, sizeof(data)); 607 target->relocateNoSym(buf, R_ARM_THM_JUMP24, offset); 608 } 609 610 bool ThumbThunk::isCompatibleWith(const InputSection &isec, 611 const Relocation &rel) const { 612 // v4T does not have BLX, so also deny R_ARM_CALL 613 if (!config->armHasBlx && rel.type == R_ARM_CALL) 614 return false; 615 616 // ARM branch relocations can't use BLX 617 return rel.type != R_ARM_JUMP24 && rel.type != R_ARM_PC24 && rel.type != R_ARM_PLT32; 618 } 619 620 void ARMV7ABSLongThunk::writeLong(uint8_t *buf) { 621 const uint8_t data[] = { 622 0x00, 0xc0, 0x00, 0xe3, // movw ip,:lower16:S 623 0x00, 0xc0, 0x40, 0xe3, // movt ip,:upper16:S 624 0x1c, 0xff, 0x2f, 0xe1, // bx ip 625 }; 626 uint64_t s = getARMThunkDestVA(destination); 627 memcpy(buf, data, sizeof(data)); 628 target->relocateNoSym(buf, R_ARM_MOVW_ABS_NC, s); 629 target->relocateNoSym(buf + 4, R_ARM_MOVT_ABS, s); 630 } 631 632 void ARMV7ABSLongThunk::addSymbols(ThunkSection &isec) { 633 addSymbol(saver().save("__ARMv7ABSLongThunk_" + destination.getName()), 634 STT_FUNC, 0, isec); 635 addSymbol("$a", STT_NOTYPE, 0, isec); 636 } 637 638 void ThumbV7ABSLongThunk::writeLong(uint8_t *buf) { 639 const uint8_t data[] = { 640 0x40, 0xf2, 0x00, 0x0c, // movw ip, :lower16:S 641 0xc0, 0xf2, 0x00, 0x0c, // movt ip, :upper16:S 642 0x60, 0x47, // bx ip 643 }; 644 uint64_t s = getARMThunkDestVA(destination); 645 memcpy(buf, data, sizeof(data)); 646 target->relocateNoSym(buf, R_ARM_THM_MOVW_ABS_NC, s); 647 target->relocateNoSym(buf + 4, R_ARM_THM_MOVT_ABS, s); 648 } 649 650 void ThumbV7ABSLongThunk::addSymbols(ThunkSection &isec) { 651 addSymbol(saver().save("__Thumbv7ABSLongThunk_" + destination.getName()), 652 STT_FUNC, 1, isec); 653 addSymbol("$t", STT_NOTYPE, 0, isec); 654 } 655 656 void ARMV7PILongThunk::writeLong(uint8_t *buf) { 657 const uint8_t data[] = { 658 0xf0, 0xcf, 0x0f, 0xe3, // P: movw ip,:lower16:S - (P + (L1-P) + 8) 659 0x00, 0xc0, 0x40, 0xe3, // movt ip,:upper16:S - (P + (L1-P) + 8) 660 0x0f, 0xc0, 0x8c, 0xe0, // L1: add ip, ip, pc 661 0x1c, 0xff, 0x2f, 0xe1, // bx ip 662 }; 663 uint64_t s = getARMThunkDestVA(destination); 664 uint64_t p = getThunkTargetSym()->getVA(); 665 int64_t offset = s - p - 16; 666 memcpy(buf, data, sizeof(data)); 667 target->relocateNoSym(buf, R_ARM_MOVW_PREL_NC, offset); 668 target->relocateNoSym(buf + 4, R_ARM_MOVT_PREL, offset); 669 } 670 671 void ARMV7PILongThunk::addSymbols(ThunkSection &isec) { 672 addSymbol(saver().save("__ARMV7PILongThunk_" + destination.getName()), 673 STT_FUNC, 0, isec); 674 addSymbol("$a", STT_NOTYPE, 0, isec); 675 } 676 677 void ThumbV7PILongThunk::writeLong(uint8_t *buf) { 678 const uint8_t data[] = { 679 0x4f, 0xf6, 0xf4, 0x7c, // P: movw ip,:lower16:S - (P + (L1-P) + 4) 680 0xc0, 0xf2, 0x00, 0x0c, // movt ip,:upper16:S - (P + (L1-P) + 4) 681 0xfc, 0x44, // L1: add ip, pc 682 0x60, 0x47, // bx ip 683 }; 684 uint64_t s = getARMThunkDestVA(destination); 685 uint64_t p = getThunkTargetSym()->getVA() & ~0x1; 686 int64_t offset = s - p - 12; 687 memcpy(buf, data, sizeof(data)); 688 target->relocateNoSym(buf, R_ARM_THM_MOVW_PREL_NC, offset); 689 target->relocateNoSym(buf + 4, R_ARM_THM_MOVT_PREL, offset); 690 } 691 692 void ThumbV7PILongThunk::addSymbols(ThunkSection &isec) { 693 addSymbol(saver().save("__ThumbV7PILongThunk_" + destination.getName()), 694 STT_FUNC, 1, isec); 695 addSymbol("$t", STT_NOTYPE, 0, isec); 696 } 697 698 void ThumbV6MABSLongThunk::writeLong(uint8_t *buf) { 699 // Most Thumb instructions cannot access the high registers r8 - r15. As the 700 // only register we can corrupt is r12 we must instead spill a low register 701 // to the stack to use as a scratch register. We push r1 even though we 702 // don't need to get some space to use for the return address. 703 const uint8_t data[] = { 704 0x03, 0xb4, // push {r0, r1} ; Obtain scratch registers 705 0x01, 0x48, // ldr r0, [pc, #4] ; L1 706 0x01, 0x90, // str r0, [sp, #4] ; SP + 4 = S 707 0x01, 0xbd, // pop {r0, pc} ; restore r0 and branch to dest 708 0x00, 0x00, 0x00, 0x00 // L1: .word S 709 }; 710 uint64_t s = getARMThunkDestVA(destination); 711 memcpy(buf, data, sizeof(data)); 712 target->relocateNoSym(buf + 8, R_ARM_ABS32, s); 713 } 714 715 void ThumbV6MABSLongThunk::addSymbols(ThunkSection &isec) { 716 addSymbol(saver().save("__Thumbv6MABSLongThunk_" + destination.getName()), 717 STT_FUNC, 1, isec); 718 addSymbol("$t", STT_NOTYPE, 0, isec); 719 addSymbol("$d", STT_NOTYPE, 8, isec); 720 } 721 722 void ThumbV6MPILongThunk::writeLong(uint8_t *buf) { 723 // Most Thumb instructions cannot access the high registers r8 - r15. As the 724 // only register we can corrupt is ip (r12) we must instead spill a low 725 // register to the stack to use as a scratch register. 726 const uint8_t data[] = { 727 0x01, 0xb4, // P: push {r0} ; Obtain scratch register 728 0x02, 0x48, // ldr r0, [pc, #8] ; L2 729 0x84, 0x46, // mov ip, r0 ; high to low register 730 0x01, 0xbc, // pop {r0} ; restore scratch register 731 0xe7, 0x44, // L1: add pc, ip ; transfer control 732 0xc0, 0x46, // nop ; pad to 4-byte boundary 733 0x00, 0x00, 0x00, 0x00, // L2: .word S - (P + (L1 - P) + 4) 734 }; 735 uint64_t s = getARMThunkDestVA(destination); 736 uint64_t p = getThunkTargetSym()->getVA() & ~0x1; 737 memcpy(buf, data, sizeof(data)); 738 target->relocateNoSym(buf + 12, R_ARM_REL32, s - p - 12); 739 } 740 741 void ThumbV6MPILongThunk::addSymbols(ThunkSection &isec) { 742 addSymbol(saver().save("__Thumbv6MPILongThunk_" + destination.getName()), 743 STT_FUNC, 1, isec); 744 addSymbol("$t", STT_NOTYPE, 0, isec); 745 addSymbol("$d", STT_NOTYPE, 12, isec); 746 } 747 748 void ARMV5LongLdrPcThunk::writeLong(uint8_t *buf) { 749 const uint8_t data[] = { 750 0x04, 0xf0, 0x1f, 0xe5, // ldr pc, [pc,#-4] ; L1 751 0x00, 0x00, 0x00, 0x00, // L1: .word S 752 }; 753 memcpy(buf, data, sizeof(data)); 754 target->relocateNoSym(buf + 4, R_ARM_ABS32, getARMThunkDestVA(destination)); 755 } 756 757 void ARMV5LongLdrPcThunk::addSymbols(ThunkSection &isec) { 758 addSymbol(saver().save("__ARMv5LongLdrPcThunk_" + destination.getName()), 759 STT_FUNC, 0, isec); 760 addSymbol("$a", STT_NOTYPE, 0, isec); 761 addSymbol("$d", STT_NOTYPE, 4, isec); 762 } 763 764 void ARMV4ABSLongBXThunk::writeLong(uint8_t *buf) { 765 const uint8_t data[] = { 766 0x00, 0xc0, 0x9f, 0xe5, // ldr r12, [pc] ; L1 767 0x1c, 0xff, 0x2f, 0xe1, // bx r12 768 0x00, 0x00, 0x00, 0x00, // L1: .word S 769 }; 770 memcpy(buf, data, sizeof(data)); 771 target->relocateNoSym(buf + 8, R_ARM_ABS32, getARMThunkDestVA(destination)); 772 } 773 774 void ARMV4ABSLongBXThunk::addSymbols(ThunkSection &isec) { 775 addSymbol(saver().save("__ARMv4ABSLongBXThunk_" + destination.getName()), 776 STT_FUNC, 0, isec); 777 addSymbol("$a", STT_NOTYPE, 0, isec); 778 addSymbol("$d", STT_NOTYPE, 8, isec); 779 } 780 781 void ThumbV4ABSLongBXThunk::writeLong(uint8_t *buf) { 782 const uint8_t data[] = { 783 0x78, 0x47, // bx pc 784 0xfd, 0xe7, // b #-6 ; Arm recommended sequence to follow bx pc 785 0x04, 0xf0, 0x1f, 0xe5, // ldr pc, [pc, #-4] ; L1 786 0x00, 0x00, 0x00, 0x00, // L1: .word S 787 }; 788 memcpy(buf, data, sizeof(data)); 789 target->relocateNoSym(buf + 8, R_ARM_ABS32, getARMThunkDestVA(destination)); 790 } 791 792 void ThumbV4ABSLongBXThunk::addSymbols(ThunkSection &isec) { 793 addSymbol(saver().save("__Thumbv4ABSLongBXThunk_" + destination.getName()), 794 STT_FUNC, 1, isec); 795 addSymbol("$t", STT_NOTYPE, 0, isec); 796 addSymbol("$a", STT_NOTYPE, 4, isec); 797 addSymbol("$d", STT_NOTYPE, 8, isec); 798 } 799 800 void ThumbV4ABSLongThunk::writeLong(uint8_t *buf) { 801 const uint8_t data[] = { 802 0x78, 0x47, // bx pc 803 0xfd, 0xe7, // b #-6 ; Arm recommended sequence to follow bx pc 804 0x00, 0xc0, 0x9f, 0xe5, // ldr r12, [pc] ; L1 805 0x1c, 0xff, 0x2f, 0xe1, // bx r12 806 0x00, 0x00, 0x00, 0x00, // L1: .word S 807 }; 808 memcpy(buf, data, sizeof(data)); 809 target->relocateNoSym(buf + 12, R_ARM_ABS32, getARMThunkDestVA(destination)); 810 } 811 812 void ThumbV4ABSLongThunk::addSymbols(ThunkSection &isec) { 813 addSymbol(saver().save("__Thumbv4ABSLongThunk_" + destination.getName()), 814 STT_FUNC, 1, isec); 815 addSymbol("$t", STT_NOTYPE, 0, isec); 816 addSymbol("$a", STT_NOTYPE, 4, isec); 817 addSymbol("$d", STT_NOTYPE, 12, isec); 818 } 819 820 void ARMV4PILongBXThunk::writeLong(uint8_t *buf) { 821 const uint8_t data[] = { 822 0x04, 0xc0, 0x9f, 0xe5, // P: ldr ip, [pc,#4] ; L2 823 0x0c, 0xc0, 0x8f, 0xe0, // L1: add ip, pc, ip 824 0x1c, 0xff, 0x2f, 0xe1, // bx ip 825 0x00, 0x00, 0x00, 0x00, // L2: .word S - (P + (L1 - P) + 8) 826 }; 827 uint64_t s = getARMThunkDestVA(destination); 828 uint64_t p = getThunkTargetSym()->getVA() & ~0x1; 829 memcpy(buf, data, sizeof(data)); 830 target->relocateNoSym(buf + 12, R_ARM_REL32, s - p - 12); 831 } 832 833 void ARMV4PILongBXThunk::addSymbols(ThunkSection &isec) { 834 addSymbol(saver().save("__ARMv4PILongBXThunk_" + destination.getName()), 835 STT_FUNC, 0, isec); 836 addSymbol("$a", STT_NOTYPE, 0, isec); 837 addSymbol("$d", STT_NOTYPE, 12, isec); 838 } 839 840 void ARMV4PILongThunk::writeLong(uint8_t *buf) { 841 const uint8_t data[] = { 842 0x00, 0xc0, 0x9f, 0xe5, // P: ldr ip, [pc] ; L2 843 0x0c, 0xf0, 0x8f, 0xe0, // L1: add pc, pc, r12 844 0x00, 0x00, 0x00, 0x00, // L2: .word S - (P + (L1 - P) + 8) 845 }; 846 uint64_t s = getARMThunkDestVA(destination); 847 uint64_t p = getThunkTargetSym()->getVA() & ~0x1; 848 memcpy(buf, data, sizeof(data)); 849 target->relocateNoSym(buf + 8, R_ARM_REL32, s - p - 12); 850 } 851 852 void ARMV4PILongThunk::addSymbols(ThunkSection &isec) { 853 addSymbol(saver().save("__ARMv4PILongThunk_" + destination.getName()), 854 STT_FUNC, 0, isec); 855 addSymbol("$a", STT_NOTYPE, 0, isec); 856 addSymbol("$d", STT_NOTYPE, 8, isec); 857 } 858 859 void ThumbV4PILongBXThunk::writeLong(uint8_t *buf) { 860 const uint8_t data[] = { 861 0x78, 0x47, // P: bx pc 862 0xfd, 0xe7, // b #-6 ; Arm recommended sequence to follow bx pc 863 0x00, 0xc0, 0x9f, 0xe5, // ldr r12, [pc] ; L2 864 0x0f, 0xf0, 0x8c, 0xe0, // L1: add pc, r12, pc 865 0x00, 0x00, 0x00, 0x00, // L2: .word S - (P + (L1 - P) + 8) 866 }; 867 uint64_t s = getARMThunkDestVA(destination); 868 uint64_t p = getThunkTargetSym()->getVA() & ~0x1; 869 memcpy(buf, data, sizeof(data)); 870 target->relocateNoSym(buf + 12, R_ARM_REL32, s - p - 16); 871 } 872 873 void ThumbV4PILongBXThunk::addSymbols(ThunkSection &isec) { 874 addSymbol(saver().save("__Thumbv4PILongBXThunk_" + destination.getName()), 875 STT_FUNC, 1, isec); 876 addSymbol("$t", STT_NOTYPE, 0, isec); 877 addSymbol("$a", STT_NOTYPE, 4, isec); 878 addSymbol("$d", STT_NOTYPE, 12, isec); 879 } 880 881 void ThumbV4PILongThunk::writeLong(uint8_t *buf) { 882 const uint8_t data[] = { 883 0x78, 0x47, // P: bx pc 884 0xfd, 0xe7, // b #-6 ; Arm recommended sequence to follow bx pc 885 0x04, 0xc0, 0x9f, 0xe5, // ldr ip, [pc,#4] ; L2 886 0x0c, 0xc0, 0x8f, 0xe0, // L1: add ip, pc, ip 887 0x1c, 0xff, 0x2f, 0xe1, // bx ip 888 0x00, 0x00, 0x00, 0x00, // L2: .word S - (P + (L1 - P) + 8) 889 }; 890 uint64_t s = getARMThunkDestVA(destination); 891 uint64_t p = getThunkTargetSym()->getVA() & ~0x1; 892 memcpy(buf, data, sizeof(data)); 893 target->relocateNoSym(buf + 16, R_ARM_REL32, s - p - 16); 894 } 895 896 void ThumbV4PILongThunk::addSymbols(ThunkSection &isec) { 897 addSymbol(saver().save("__Thumbv4PILongThunk_" + destination.getName()), 898 STT_FUNC, 1, isec); 899 addSymbol("$t", STT_NOTYPE, 0, isec); 900 addSymbol("$a", STT_NOTYPE, 4, isec); 901 addSymbol("$d", STT_NOTYPE, 16, isec); 902 } 903 904 // Write MIPS LA25 thunk code to call PIC function from the non-PIC one. 905 void MipsThunk::writeTo(uint8_t *buf) { 906 uint64_t s = destination.getVA(); 907 write32(buf, 0x3c190000); // lui $25, %hi(func) 908 write32(buf + 4, 0x08000000 | (s >> 2)); // j func 909 write32(buf + 8, 0x27390000); // addiu $25, $25, %lo(func) 910 write32(buf + 12, 0x00000000); // nop 911 target->relocateNoSym(buf, R_MIPS_HI16, s); 912 target->relocateNoSym(buf + 8, R_MIPS_LO16, s); 913 } 914 915 void MipsThunk::addSymbols(ThunkSection &isec) { 916 addSymbol(saver().save("__LA25Thunk_" + destination.getName()), STT_FUNC, 0, 917 isec); 918 } 919 920 InputSection *MipsThunk::getTargetInputSection() const { 921 auto &dr = cast<Defined>(destination); 922 return dyn_cast<InputSection>(dr.section); 923 } 924 925 // Write microMIPS R2-R5 LA25 thunk code 926 // to call PIC function from the non-PIC one. 927 void MicroMipsThunk::writeTo(uint8_t *buf) { 928 uint64_t s = destination.getVA(); 929 write16(buf, 0x41b9); // lui $25, %hi(func) 930 write16(buf + 4, 0xd400); // j func 931 write16(buf + 8, 0x3339); // addiu $25, $25, %lo(func) 932 write16(buf + 12, 0x0c00); // nop 933 target->relocateNoSym(buf, R_MICROMIPS_HI16, s); 934 target->relocateNoSym(buf + 4, R_MICROMIPS_26_S1, s); 935 target->relocateNoSym(buf + 8, R_MICROMIPS_LO16, s); 936 } 937 938 void MicroMipsThunk::addSymbols(ThunkSection &isec) { 939 Defined *d = 940 addSymbol(saver().save("__microLA25Thunk_" + destination.getName()), 941 STT_FUNC, 0, isec); 942 d->stOther |= STO_MIPS_MICROMIPS; 943 } 944 945 InputSection *MicroMipsThunk::getTargetInputSection() const { 946 auto &dr = cast<Defined>(destination); 947 return dyn_cast<InputSection>(dr.section); 948 } 949 950 // Write microMIPS R6 LA25 thunk code 951 // to call PIC function from the non-PIC one. 952 void MicroMipsR6Thunk::writeTo(uint8_t *buf) { 953 uint64_t s = destination.getVA(); 954 uint64_t p = getThunkTargetSym()->getVA(); 955 write16(buf, 0x1320); // lui $25, %hi(func) 956 write16(buf + 4, 0x3339); // addiu $25, $25, %lo(func) 957 write16(buf + 8, 0x9400); // bc func 958 target->relocateNoSym(buf, R_MICROMIPS_HI16, s); 959 target->relocateNoSym(buf + 4, R_MICROMIPS_LO16, s); 960 target->relocateNoSym(buf + 8, R_MICROMIPS_PC26_S1, s - p - 12); 961 } 962 963 void MicroMipsR6Thunk::addSymbols(ThunkSection &isec) { 964 Defined *d = 965 addSymbol(saver().save("__microLA25Thunk_" + destination.getName()), 966 STT_FUNC, 0, isec); 967 d->stOther |= STO_MIPS_MICROMIPS; 968 } 969 970 InputSection *MicroMipsR6Thunk::getTargetInputSection() const { 971 auto &dr = cast<Defined>(destination); 972 return dyn_cast<InputSection>(dr.section); 973 } 974 975 void elf::writePPC32PltCallStub(uint8_t *buf, uint64_t gotPltVA, 976 const InputFile *file, int64_t addend) { 977 if (!config->isPic) { 978 write32(buf + 0, 0x3d600000 | (gotPltVA + 0x8000) >> 16); // lis r11,ha 979 write32(buf + 4, 0x816b0000 | (uint16_t)gotPltVA); // lwz r11,l(r11) 980 write32(buf + 8, 0x7d6903a6); // mtctr r11 981 write32(buf + 12, 0x4e800420); // bctr 982 return; 983 } 984 uint32_t offset; 985 if (addend >= 0x8000) { 986 // The stub loads an address relative to r30 (.got2+Addend). Addend is 987 // almost always 0x8000. The address of .got2 is different in another object 988 // file, so a stub cannot be shared. 989 offset = gotPltVA - 990 (in.ppc32Got2->getParent()->getVA() + 991 (file->ppc32Got2 ? file->ppc32Got2->outSecOff : 0) + addend); 992 } else { 993 // The stub loads an address relative to _GLOBAL_OFFSET_TABLE_ (which is 994 // currently the address of .got). 995 offset = gotPltVA - in.got->getVA(); 996 } 997 uint16_t ha = (offset + 0x8000) >> 16, l = (uint16_t)offset; 998 if (ha == 0) { 999 write32(buf + 0, 0x817e0000 | l); // lwz r11,l(r30) 1000 write32(buf + 4, 0x7d6903a6); // mtctr r11 1001 write32(buf + 8, 0x4e800420); // bctr 1002 write32(buf + 12, 0x60000000); // nop 1003 } else { 1004 write32(buf + 0, 0x3d7e0000 | ha); // addis r11,r30,ha 1005 write32(buf + 4, 0x816b0000 | l); // lwz r11,l(r11) 1006 write32(buf + 8, 0x7d6903a6); // mtctr r11 1007 write32(buf + 12, 0x4e800420); // bctr 1008 } 1009 } 1010 1011 void PPC32PltCallStub::writeTo(uint8_t *buf) { 1012 writePPC32PltCallStub(buf, destination.getGotPltVA(), file, addend); 1013 } 1014 1015 void PPC32PltCallStub::addSymbols(ThunkSection &isec) { 1016 std::string buf; 1017 raw_string_ostream os(buf); 1018 os << format_hex_no_prefix(addend, 8); 1019 if (!config->isPic) 1020 os << ".plt_call32."; 1021 else if (addend >= 0x8000) 1022 os << ".got2.plt_pic32."; 1023 else 1024 os << ".plt_pic32."; 1025 os << destination.getName(); 1026 addSymbol(saver().save(os.str()), STT_FUNC, 0, isec); 1027 } 1028 1029 bool PPC32PltCallStub::isCompatibleWith(const InputSection &isec, 1030 const Relocation &rel) const { 1031 return !config->isPic || (isec.file == file && rel.addend == addend); 1032 } 1033 1034 void PPC32LongThunk::addSymbols(ThunkSection &isec) { 1035 addSymbol(saver().save("__LongThunk_" + destination.getName()), STT_FUNC, 0, 1036 isec); 1037 } 1038 1039 void PPC32LongThunk::writeTo(uint8_t *buf) { 1040 auto ha = [](uint32_t v) -> uint16_t { return (v + 0x8000) >> 16; }; 1041 auto lo = [](uint32_t v) -> uint16_t { return v; }; 1042 uint32_t d = destination.getVA(addend); 1043 if (config->isPic) { 1044 uint32_t off = d - (getThunkTargetSym()->getVA() + 8); 1045 write32(buf + 0, 0x7c0802a6); // mflr r12,0 1046 write32(buf + 4, 0x429f0005); // bcl r20,r31,.+4 1047 write32(buf + 8, 0x7d8802a6); // mtctr r12 1048 write32(buf + 12, 0x3d8c0000 | ha(off)); // addis r12,r12,off@ha 1049 write32(buf + 16, 0x398c0000 | lo(off)); // addi r12,r12,off@l 1050 write32(buf + 20, 0x7c0803a6); // mtlr r0 1051 buf += 24; 1052 } else { 1053 write32(buf + 0, 0x3d800000 | ha(d)); // lis r12,d@ha 1054 write32(buf + 4, 0x398c0000 | lo(d)); // addi r12,r12,d@l 1055 buf += 8; 1056 } 1057 write32(buf + 0, 0x7d8903a6); // mtctr r12 1058 write32(buf + 4, 0x4e800420); // bctr 1059 } 1060 1061 void elf::writePPC64LoadAndBranch(uint8_t *buf, int64_t offset) { 1062 uint16_t offHa = (offset + 0x8000) >> 16; 1063 uint16_t offLo = offset & 0xffff; 1064 1065 write32(buf + 0, 0x3d820000 | offHa); // addis r12, r2, OffHa 1066 write32(buf + 4, 0xe98c0000 | offLo); // ld r12, OffLo(r12) 1067 write32(buf + 8, 0x7d8903a6); // mtctr r12 1068 write32(buf + 12, 0x4e800420); // bctr 1069 } 1070 1071 void PPC64PltCallStub::writeTo(uint8_t *buf) { 1072 int64_t offset = destination.getGotPltVA() - getPPC64TocBase(); 1073 // Save the TOC pointer to the save-slot reserved in the call frame. 1074 write32(buf + 0, 0xf8410018); // std r2,24(r1) 1075 writePPC64LoadAndBranch(buf + 4, offset); 1076 } 1077 1078 void PPC64PltCallStub::addSymbols(ThunkSection &isec) { 1079 Defined *s = addSymbol(saver().save("__plt_" + destination.getName()), 1080 STT_FUNC, 0, isec); 1081 s->needsTocRestore = true; 1082 s->file = destination.file; 1083 } 1084 1085 bool PPC64PltCallStub::isCompatibleWith(const InputSection &isec, 1086 const Relocation &rel) const { 1087 return rel.type == R_PPC64_REL24 || rel.type == R_PPC64_REL14; 1088 } 1089 1090 void PPC64R2SaveStub::writeTo(uint8_t *buf) { 1091 const int64_t offset = computeOffset(); 1092 write32(buf + 0, 0xf8410018); // std r2,24(r1) 1093 // The branch offset needs to fit in 26 bits. 1094 if (getMayUseShortThunk()) { 1095 write32(buf + 4, 0x48000000 | (offset & 0x03fffffc)); // b <offset> 1096 } else if (isInt<34>(offset)) { 1097 int nextInstOffset; 1098 uint64_t tocOffset = destination.getVA() - getPPC64TocBase(); 1099 if (tocOffset >> 16 > 0) { 1100 const uint64_t addi = ADDI_R12_TO_R12_NO_DISP | (tocOffset & 0xffff); 1101 const uint64_t addis = 1102 ADDIS_R12_TO_R2_NO_DISP | ((tocOffset >> 16) & 0xffff); 1103 write32(buf + 4, addis); // addis r12, r2 , top of offset 1104 write32(buf + 8, addi); // addi r12, r12, bottom of offset 1105 nextInstOffset = 12; 1106 } else { 1107 const uint64_t addi = ADDI_R12_TO_R2_NO_DISP | (tocOffset & 0xffff); 1108 write32(buf + 4, addi); // addi r12, r2, offset 1109 nextInstOffset = 8; 1110 } 1111 write32(buf + nextInstOffset, MTCTR_R12); // mtctr r12 1112 write32(buf + nextInstOffset + 4, BCTR); // bctr 1113 } else { 1114 in.ppc64LongBranchTarget->addEntry(&destination, addend); 1115 const int64_t offsetFromTOC = 1116 in.ppc64LongBranchTarget->getEntryVA(&destination, addend) - 1117 getPPC64TocBase(); 1118 writePPC64LoadAndBranch(buf + 4, offsetFromTOC); 1119 } 1120 } 1121 1122 void PPC64R2SaveStub::addSymbols(ThunkSection &isec) { 1123 Defined *s = addSymbol(saver().save("__toc_save_" + destination.getName()), 1124 STT_FUNC, 0, isec); 1125 s->needsTocRestore = true; 1126 } 1127 1128 bool PPC64R2SaveStub::isCompatibleWith(const InputSection &isec, 1129 const Relocation &rel) const { 1130 return rel.type == R_PPC64_REL24 || rel.type == R_PPC64_REL14; 1131 } 1132 1133 void PPC64R12SetupStub::writeTo(uint8_t *buf) { 1134 int64_t offset = destination.getVA() - getThunkTargetSym()->getVA(); 1135 if (!isInt<34>(offset)) 1136 reportRangeError(buf, offset, 34, destination, "R12 setup stub offset"); 1137 1138 int nextInstOffset; 1139 if (!config->power10Stubs) { 1140 uint32_t off = destination.getVA(addend) - getThunkTargetSym()->getVA() - 8; 1141 write32(buf + 0, 0x7c0802a6); // mflr r12 1142 write32(buf + 4, 0x429f0005); // bcl 20,31,.+4 1143 write32(buf + 8, 0x7d6802a6); // mflr r11 1144 write32(buf + 12, 0x7d8803a6); // mtlr r12 1145 write32(buf + 16, 0x3d8b0000 | computeHiBits(off));// addis r12,r11,off@ha 1146 write32(buf + 20, 0x398c0000 | (off & 0xffff)); // addi r12,r12,off@l 1147 nextInstOffset = 24; 1148 } else { 1149 uint64_t paddi = PADDI_R12_NO_DISP | (((offset >> 16) & 0x3ffff) << 32) | 1150 (offset & 0xffff); 1151 writePrefixedInstruction(buf + 0, paddi); // paddi r12, 0, func@pcrel, 1 1152 nextInstOffset = 8; 1153 } 1154 write32(buf + nextInstOffset, MTCTR_R12); // mtctr r12 1155 write32(buf + nextInstOffset + 4, BCTR); // bctr 1156 } 1157 1158 void PPC64R12SetupStub::addSymbols(ThunkSection &isec) { 1159 addSymbol(saver().save("__gep_setup_" + destination.getName()), STT_FUNC, 0, 1160 isec); 1161 } 1162 1163 bool PPC64R12SetupStub::isCompatibleWith(const InputSection &isec, 1164 const Relocation &rel) const { 1165 return rel.type == R_PPC64_REL24_NOTOC; 1166 } 1167 1168 void PPC64PCRelPLTStub::writeTo(uint8_t *buf) { 1169 int nextInstOffset = 0; 1170 int64_t offset = destination.getGotPltVA() - getThunkTargetSym()->getVA(); 1171 1172 if (config->power10Stubs) { 1173 if (!isInt<34>(offset)) 1174 reportRangeError(buf, offset, 34, destination, 1175 "PC-relative PLT stub offset"); 1176 const uint64_t pld = PLD_R12_NO_DISP | (((offset >> 16) & 0x3ffff) << 32) | 1177 (offset & 0xffff); 1178 writePrefixedInstruction(buf + 0, pld); // pld r12, func@plt@pcrel 1179 nextInstOffset = 8; 1180 } else { 1181 uint32_t off = destination.getVA(addend) - getThunkTargetSym()->getVA() - 8; 1182 write32(buf + 0, 0x7c0802a6); // mflr r12 1183 write32(buf + 4, 0x429f0005); // bcl 20,31,.+4 1184 write32(buf + 8, 0x7d6802a6); // mflr r11 1185 write32(buf + 12, 0x7d8803a6); // mtlr r12 1186 write32(buf + 16, 0x3d8b0000 | computeHiBits(off)); // addis r12,r11,off@ha 1187 write32(buf + 20, 0x398c0000 | (off & 0xffff)); // addi r12,r12,off@l 1188 nextInstOffset = 24; 1189 } 1190 write32(buf + nextInstOffset, MTCTR_R12); // mtctr r12 1191 write32(buf + nextInstOffset + 4, BCTR); // bctr 1192 } 1193 1194 void PPC64PCRelPLTStub::addSymbols(ThunkSection &isec) { 1195 addSymbol(saver().save("__plt_pcrel_" + destination.getName()), STT_FUNC, 0, 1196 isec); 1197 } 1198 1199 bool PPC64PCRelPLTStub::isCompatibleWith(const InputSection &isec, 1200 const Relocation &rel) const { 1201 return rel.type == R_PPC64_REL24_NOTOC; 1202 } 1203 1204 void PPC64LongBranchThunk::writeTo(uint8_t *buf) { 1205 int64_t offset = in.ppc64LongBranchTarget->getEntryVA(&destination, addend) - 1206 getPPC64TocBase(); 1207 writePPC64LoadAndBranch(buf, offset); 1208 } 1209 1210 void PPC64LongBranchThunk::addSymbols(ThunkSection &isec) { 1211 addSymbol(saver().save("__long_branch_" + destination.getName()), STT_FUNC, 0, 1212 isec); 1213 } 1214 1215 bool PPC64LongBranchThunk::isCompatibleWith(const InputSection &isec, 1216 const Relocation &rel) const { 1217 return rel.type == R_PPC64_REL24 || rel.type == R_PPC64_REL14; 1218 } 1219 1220 Thunk::Thunk(Symbol &d, int64_t a) : destination(d), addend(a), offset(0) {} 1221 1222 Thunk::~Thunk() = default; 1223 1224 static Thunk *addThunkAArch64(RelType type, Symbol &s, int64_t a) { 1225 if (type != R_AARCH64_CALL26 && type != R_AARCH64_JUMP26 && 1226 type != R_AARCH64_PLT32) 1227 fatal("unrecognized relocation type"); 1228 if (config->picThunk) 1229 return make<AArch64ADRPThunk>(s, a); 1230 return make<AArch64ABSLongThunk>(s, a); 1231 } 1232 1233 // Creates a thunk for long branches or Thumb-ARM interworking. 1234 // Arm Architectures v4t does not support Thumb2 technology, and does not 1235 // support BLX or LDR Arm/Thumb state switching. This means that 1236 // - MOVT and MOVW instructions cannot be used. 1237 // - We can't rewrite BL in place to BLX. We will need thunks. 1238 // 1239 // TODO: use B for short Thumb->Arm thunks instead of LDR (this doesn't work for 1240 // Arm->Thumb, as in Arm state no BX PC trick; it doesn't switch state). 1241 static Thunk *addThunkArmv4(RelType reloc, Symbol &s, int64_t a) { 1242 bool thumb_target = s.getVA(a) & 1; 1243 1244 switch (reloc) { 1245 case R_ARM_PC24: 1246 case R_ARM_PLT32: 1247 case R_ARM_JUMP24: 1248 case R_ARM_CALL: 1249 if (config->picThunk) { 1250 if (thumb_target) 1251 return make<ARMV4PILongBXThunk>(s, a); 1252 return make<ARMV4PILongThunk>(s, a); 1253 } 1254 if (thumb_target) 1255 return make<ARMV4ABSLongBXThunk>(s, a); 1256 return make<ARMV5LongLdrPcThunk>(s, a); 1257 case R_ARM_THM_CALL: 1258 if (config->picThunk) { 1259 if (thumb_target) 1260 return make<ThumbV4PILongThunk>(s, a); 1261 return make<ThumbV4PILongBXThunk>(s, a); 1262 } 1263 if (thumb_target) 1264 return make<ThumbV4ABSLongThunk>(s, a); 1265 return make<ThumbV4ABSLongBXThunk>(s, a); 1266 } 1267 fatal("relocation " + toString(reloc) + " to " + toString(s) + 1268 " not supported for Armv4 or Armv4T target"); 1269 } 1270 1271 // Creates a thunk for Thumb-ARM interworking compatible with Armv5 and Armv6. 1272 // Arm Architectures v5 and v6 do not support Thumb2 technology. This means that 1273 // - MOVT and MOVW instructions cannot be used 1274 // - Only Thumb relocation that can generate a Thunk is a BL, this can always 1275 // be transformed into a BLX 1276 static Thunk *addThunkArmv5v6(RelType reloc, Symbol &s, int64_t a) { 1277 switch (reloc) { 1278 case R_ARM_PC24: 1279 case R_ARM_PLT32: 1280 case R_ARM_JUMP24: 1281 case R_ARM_CALL: 1282 case R_ARM_THM_CALL: 1283 if (config->picThunk) 1284 return make<ARMV4PILongBXThunk>(s, a); 1285 return make<ARMV5LongLdrPcThunk>(s, a); 1286 } 1287 fatal("relocation " + toString(reloc) + " to " + toString(s) + 1288 " not supported for Armv5 or Armv6 targets"); 1289 } 1290 1291 // Create a thunk for Thumb long branch on V6-M. 1292 // Arm Architecture v6-M only supports Thumb instructions. This means 1293 // - MOVT and MOVW instructions cannot be used. 1294 // - Only a limited number of instructions can access registers r8 and above 1295 // - No interworking support is needed (all Thumb). 1296 static Thunk *addThunkV6M(RelType reloc, Symbol &s, int64_t a) { 1297 switch (reloc) { 1298 case R_ARM_THM_JUMP19: 1299 case R_ARM_THM_JUMP24: 1300 case R_ARM_THM_CALL: 1301 if (config->isPic) 1302 return make<ThumbV6MPILongThunk>(s, a); 1303 return make<ThumbV6MABSLongThunk>(s, a); 1304 } 1305 fatal("relocation " + toString(reloc) + " to " + toString(s) + 1306 " not supported for Armv6-M targets"); 1307 } 1308 1309 // Creates a thunk for Thumb-ARM interworking or branch range extension. 1310 static Thunk *addThunkArm(RelType reloc, Symbol &s, int64_t a) { 1311 // Decide which Thunk is needed based on: 1312 // Available instruction set 1313 // - An Arm Thunk can only be used if Arm state is available. 1314 // - A Thumb Thunk can only be used if Thumb state is available. 1315 // - Can only use a Thunk if it uses instructions that the Target supports. 1316 // Relocation is branch or branch and link 1317 // - Branch instructions cannot change state, can only select Thunk that 1318 // starts in the same state as the caller. 1319 // - Branch and link relocations can change state, can select Thunks from 1320 // either Arm or Thumb. 1321 // Position independent Thunks if we require position independent code. 1322 1323 // Handle architectures that have restrictions on the instructions that they 1324 // can use in Thunks. The flags below are set by reading the BuildAttributes 1325 // of the input objects. InputFiles.cpp contains the mapping from ARM 1326 // architecture to flag. 1327 if (!config->armHasMovtMovw) { 1328 if (config->armJ1J2BranchEncoding) 1329 return addThunkV6M(reloc, s, a); 1330 if (config->armHasBlx) 1331 return addThunkArmv5v6(reloc, s, a); 1332 return addThunkArmv4(reloc, s, a); 1333 } 1334 1335 switch (reloc) { 1336 case R_ARM_PC24: 1337 case R_ARM_PLT32: 1338 case R_ARM_JUMP24: 1339 case R_ARM_CALL: 1340 if (config->picThunk) 1341 return make<ARMV7PILongThunk>(s, a); 1342 return make<ARMV7ABSLongThunk>(s, a); 1343 case R_ARM_THM_JUMP19: 1344 case R_ARM_THM_JUMP24: 1345 case R_ARM_THM_CALL: 1346 if (config->picThunk) 1347 return make<ThumbV7PILongThunk>(s, a); 1348 return make<ThumbV7ABSLongThunk>(s, a); 1349 } 1350 fatal("unrecognized relocation type"); 1351 } 1352 1353 static Thunk *addThunkMips(RelType type, Symbol &s) { 1354 if ((s.stOther & STO_MIPS_MICROMIPS) && isMipsR6()) 1355 return make<MicroMipsR6Thunk>(s); 1356 if (s.stOther & STO_MIPS_MICROMIPS) 1357 return make<MicroMipsThunk>(s); 1358 return make<MipsThunk>(s); 1359 } 1360 1361 static Thunk *addThunkPPC32(const InputSection &isec, const Relocation &rel, 1362 Symbol &s) { 1363 assert((rel.type == R_PPC_LOCAL24PC || rel.type == R_PPC_REL24 || 1364 rel.type == R_PPC_PLTREL24) && 1365 "unexpected relocation type for thunk"); 1366 if (s.isInPlt()) 1367 return make<PPC32PltCallStub>(isec, rel, s); 1368 return make<PPC32LongThunk>(s, rel.addend); 1369 } 1370 1371 static Thunk *addThunkPPC64(RelType type, Symbol &s, int64_t a) { 1372 assert((type == R_PPC64_REL14 || type == R_PPC64_REL24 || 1373 type == R_PPC64_REL24_NOTOC) && 1374 "unexpected relocation type for thunk"); 1375 if (s.isInPlt()) 1376 return type == R_PPC64_REL24_NOTOC ? (Thunk *)make<PPC64PCRelPLTStub>(s) 1377 : (Thunk *)make<PPC64PltCallStub>(s); 1378 1379 // This check looks at the st_other bits of the callee. If the value is 1 1380 // then the callee clobbers the TOC and we need an R2 save stub when RelType 1381 // is R_PPC64_REL14 or R_PPC64_REL24. 1382 if ((type == R_PPC64_REL14 || type == R_PPC64_REL24) && (s.stOther >> 5) == 1) 1383 return make<PPC64R2SaveStub>(s, a); 1384 1385 if (type == R_PPC64_REL24_NOTOC) 1386 return make<PPC64R12SetupStub>(s); 1387 1388 if (config->picThunk) 1389 return make<PPC64PILongBranchThunk>(s, a); 1390 1391 return make<PPC64PDLongBranchThunk>(s, a); 1392 } 1393 1394 Thunk *elf::addThunk(const InputSection &isec, Relocation &rel) { 1395 Symbol &s = *rel.sym; 1396 int64_t a = rel.addend; 1397 1398 if (config->emachine == EM_AARCH64) 1399 return addThunkAArch64(rel.type, s, a); 1400 1401 if (config->emachine == EM_ARM) 1402 return addThunkArm(rel.type, s, a); 1403 1404 if (config->emachine == EM_MIPS) 1405 return addThunkMips(rel.type, s); 1406 1407 if (config->emachine == EM_PPC) 1408 return addThunkPPC32(isec, rel, s); 1409 1410 if (config->emachine == EM_PPC64) 1411 return addThunkPPC64(rel.type, s, a); 1412 1413 llvm_unreachable("add Thunk only supported for ARM, Mips and PowerPC"); 1414 } 1415