10b57cec5SDimitry Andric //===- AMDGPU.cpp ---------------------------------------------------------===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric 90b57cec5SDimitry Andric #include "InputFiles.h" 100b57cec5SDimitry Andric #include "Symbols.h" 110b57cec5SDimitry Andric #include "Target.h" 120b57cec5SDimitry Andric #include "lld/Common/ErrorHandler.h" 13*81ad6265SDimitry Andric #include "llvm/BinaryFormat/ELF.h" 140b57cec5SDimitry Andric #include "llvm/Support/Endian.h" 150b57cec5SDimitry Andric 160b57cec5SDimitry Andric using namespace llvm; 170b57cec5SDimitry Andric using namespace llvm::object; 180b57cec5SDimitry Andric using namespace llvm::support::endian; 190b57cec5SDimitry Andric using namespace llvm::ELF; 205ffd83dbSDimitry Andric using namespace lld; 215ffd83dbSDimitry Andric using namespace lld::elf; 220b57cec5SDimitry Andric 230b57cec5SDimitry Andric namespace { 240b57cec5SDimitry Andric class AMDGPU final : public TargetInfo { 25fe6060f1SDimitry Andric private: 26fe6060f1SDimitry Andric uint32_t calcEFlagsV3() const; 27fe6060f1SDimitry Andric uint32_t calcEFlagsV4() const; 28fe6060f1SDimitry Andric 290b57cec5SDimitry Andric public: 300b57cec5SDimitry Andric AMDGPU(); 310b57cec5SDimitry Andric uint32_t calcEFlags() const override; 325ffd83dbSDimitry Andric void relocate(uint8_t *loc, const Relocation &rel, 335ffd83dbSDimitry Andric uint64_t val) const override; 340b57cec5SDimitry Andric RelExpr getRelExpr(RelType type, const Symbol &s, 350b57cec5SDimitry Andric const uint8_t *loc) const override; 360b57cec5SDimitry Andric RelType getDynRel(RelType type) const override; 370b57cec5SDimitry Andric }; 380b57cec5SDimitry Andric } // namespace 390b57cec5SDimitry Andric 400b57cec5SDimitry Andric AMDGPU::AMDGPU() { 410b57cec5SDimitry Andric relativeRel = R_AMDGPU_RELATIVE64; 420b57cec5SDimitry Andric gotRel = R_AMDGPU_ABS64; 430b57cec5SDimitry Andric symbolicRel = R_AMDGPU_ABS64; 440b57cec5SDimitry Andric } 450b57cec5SDimitry Andric 460b57cec5SDimitry Andric static uint32_t getEFlags(InputFile *file) { 47e8d8bef9SDimitry Andric return cast<ObjFile<ELF64LE>>(file)->getObj().getHeader().e_flags; 480b57cec5SDimitry Andric } 490b57cec5SDimitry Andric 50fe6060f1SDimitry Andric uint32_t AMDGPU::calcEFlagsV3() const { 51*81ad6265SDimitry Andric uint32_t ret = getEFlags(ctx->objectFiles[0]); 520b57cec5SDimitry Andric 530b57cec5SDimitry Andric // Verify that all input files have the same e_flags. 54*81ad6265SDimitry Andric for (InputFile *f : makeArrayRef(ctx->objectFiles).slice(1)) { 550b57cec5SDimitry Andric if (ret == getEFlags(f)) 560b57cec5SDimitry Andric continue; 570b57cec5SDimitry Andric error("incompatible e_flags: " + toString(f)); 580b57cec5SDimitry Andric return 0; 590b57cec5SDimitry Andric } 600b57cec5SDimitry Andric return ret; 610b57cec5SDimitry Andric } 620b57cec5SDimitry Andric 63fe6060f1SDimitry Andric uint32_t AMDGPU::calcEFlagsV4() const { 64*81ad6265SDimitry Andric uint32_t retMach = getEFlags(ctx->objectFiles[0]) & EF_AMDGPU_MACH; 65*81ad6265SDimitry Andric uint32_t retXnack = 66*81ad6265SDimitry Andric getEFlags(ctx->objectFiles[0]) & EF_AMDGPU_FEATURE_XNACK_V4; 67fe6060f1SDimitry Andric uint32_t retSramEcc = 68*81ad6265SDimitry Andric getEFlags(ctx->objectFiles[0]) & EF_AMDGPU_FEATURE_SRAMECC_V4; 69fe6060f1SDimitry Andric 70fe6060f1SDimitry Andric // Verify that all input files have compatible e_flags (same mach, all 71fe6060f1SDimitry Andric // features in the same category are either ANY, ANY and ON, or ANY and OFF). 72*81ad6265SDimitry Andric for (InputFile *f : makeArrayRef(ctx->objectFiles).slice(1)) { 73fe6060f1SDimitry Andric if (retMach != (getEFlags(f) & EF_AMDGPU_MACH)) { 74fe6060f1SDimitry Andric error("incompatible mach: " + toString(f)); 75fe6060f1SDimitry Andric return 0; 76fe6060f1SDimitry Andric } 77fe6060f1SDimitry Andric 78fe6060f1SDimitry Andric if (retXnack == EF_AMDGPU_FEATURE_XNACK_UNSUPPORTED_V4 || 79fe6060f1SDimitry Andric (retXnack != EF_AMDGPU_FEATURE_XNACK_ANY_V4 && 80fe6060f1SDimitry Andric (getEFlags(f) & EF_AMDGPU_FEATURE_XNACK_V4) 81fe6060f1SDimitry Andric != EF_AMDGPU_FEATURE_XNACK_ANY_V4)) { 82fe6060f1SDimitry Andric if (retXnack != (getEFlags(f) & EF_AMDGPU_FEATURE_XNACK_V4)) { 83fe6060f1SDimitry Andric error("incompatible xnack: " + toString(f)); 84fe6060f1SDimitry Andric return 0; 85fe6060f1SDimitry Andric } 86fe6060f1SDimitry Andric } else { 87fe6060f1SDimitry Andric if (retXnack == EF_AMDGPU_FEATURE_XNACK_ANY_V4) 88fe6060f1SDimitry Andric retXnack = getEFlags(f) & EF_AMDGPU_FEATURE_XNACK_V4; 89fe6060f1SDimitry Andric } 90fe6060f1SDimitry Andric 91fe6060f1SDimitry Andric if (retSramEcc == EF_AMDGPU_FEATURE_SRAMECC_UNSUPPORTED_V4 || 92fe6060f1SDimitry Andric (retSramEcc != EF_AMDGPU_FEATURE_SRAMECC_ANY_V4 && 93fe6060f1SDimitry Andric (getEFlags(f) & EF_AMDGPU_FEATURE_SRAMECC_V4) != 94fe6060f1SDimitry Andric EF_AMDGPU_FEATURE_SRAMECC_ANY_V4)) { 95fe6060f1SDimitry Andric if (retSramEcc != (getEFlags(f) & EF_AMDGPU_FEATURE_SRAMECC_V4)) { 96fe6060f1SDimitry Andric error("incompatible sramecc: " + toString(f)); 97fe6060f1SDimitry Andric return 0; 98fe6060f1SDimitry Andric } 99fe6060f1SDimitry Andric } else { 100fe6060f1SDimitry Andric if (retSramEcc == EF_AMDGPU_FEATURE_SRAMECC_ANY_V4) 101fe6060f1SDimitry Andric retSramEcc = getEFlags(f) & EF_AMDGPU_FEATURE_SRAMECC_V4; 102fe6060f1SDimitry Andric } 103fe6060f1SDimitry Andric } 104fe6060f1SDimitry Andric 105fe6060f1SDimitry Andric return retMach | retXnack | retSramEcc; 106fe6060f1SDimitry Andric } 107fe6060f1SDimitry Andric 108fe6060f1SDimitry Andric uint32_t AMDGPU::calcEFlags() const { 109*81ad6265SDimitry Andric if (ctx->objectFiles.empty()) 110*81ad6265SDimitry Andric return 0; 111fe6060f1SDimitry Andric 112*81ad6265SDimitry Andric uint8_t abiVersion = cast<ObjFile<ELF64LE>>(ctx->objectFiles[0]) 113*81ad6265SDimitry Andric ->getObj() 114*81ad6265SDimitry Andric .getHeader() 115*81ad6265SDimitry Andric .e_ident[EI_ABIVERSION]; 116fe6060f1SDimitry Andric switch (abiVersion) { 117fe6060f1SDimitry Andric case ELFABIVERSION_AMDGPU_HSA_V2: 118fe6060f1SDimitry Andric case ELFABIVERSION_AMDGPU_HSA_V3: 119fe6060f1SDimitry Andric return calcEFlagsV3(); 120fe6060f1SDimitry Andric case ELFABIVERSION_AMDGPU_HSA_V4: 121*81ad6265SDimitry Andric case ELFABIVERSION_AMDGPU_HSA_V5: 122fe6060f1SDimitry Andric return calcEFlagsV4(); 123fe6060f1SDimitry Andric default: 124fe6060f1SDimitry Andric error("unknown abi version: " + Twine(abiVersion)); 125fe6060f1SDimitry Andric return 0; 126fe6060f1SDimitry Andric } 127fe6060f1SDimitry Andric } 128fe6060f1SDimitry Andric 1295ffd83dbSDimitry Andric void AMDGPU::relocate(uint8_t *loc, const Relocation &rel, uint64_t val) const { 1305ffd83dbSDimitry Andric switch (rel.type) { 1310b57cec5SDimitry Andric case R_AMDGPU_ABS32: 1320b57cec5SDimitry Andric case R_AMDGPU_GOTPCREL: 1330b57cec5SDimitry Andric case R_AMDGPU_GOTPCREL32_LO: 1340b57cec5SDimitry Andric case R_AMDGPU_REL32: 1350b57cec5SDimitry Andric case R_AMDGPU_REL32_LO: 1360b57cec5SDimitry Andric write32le(loc, val); 1370b57cec5SDimitry Andric break; 1380b57cec5SDimitry Andric case R_AMDGPU_ABS64: 1390b57cec5SDimitry Andric case R_AMDGPU_REL64: 1400b57cec5SDimitry Andric write64le(loc, val); 1410b57cec5SDimitry Andric break; 1420b57cec5SDimitry Andric case R_AMDGPU_GOTPCREL32_HI: 1430b57cec5SDimitry Andric case R_AMDGPU_REL32_HI: 1440b57cec5SDimitry Andric write32le(loc, val >> 32); 1450b57cec5SDimitry Andric break; 146fe6060f1SDimitry Andric case R_AMDGPU_REL16: { 147fe6060f1SDimitry Andric int64_t simm = (static_cast<int64_t>(val) - 4) / 4; 148fe6060f1SDimitry Andric checkInt(loc, simm, 16, rel); 149fe6060f1SDimitry Andric write16le(loc, simm); 150fe6060f1SDimitry Andric break; 151fe6060f1SDimitry Andric } 1520b57cec5SDimitry Andric default: 1530b57cec5SDimitry Andric llvm_unreachable("unknown relocation"); 1540b57cec5SDimitry Andric } 1550b57cec5SDimitry Andric } 1560b57cec5SDimitry Andric 1570b57cec5SDimitry Andric RelExpr AMDGPU::getRelExpr(RelType type, const Symbol &s, 1580b57cec5SDimitry Andric const uint8_t *loc) const { 1590b57cec5SDimitry Andric switch (type) { 1600b57cec5SDimitry Andric case R_AMDGPU_ABS32: 1610b57cec5SDimitry Andric case R_AMDGPU_ABS64: 1620b57cec5SDimitry Andric return R_ABS; 1630b57cec5SDimitry Andric case R_AMDGPU_REL32: 1640b57cec5SDimitry Andric case R_AMDGPU_REL32_LO: 1650b57cec5SDimitry Andric case R_AMDGPU_REL32_HI: 1660b57cec5SDimitry Andric case R_AMDGPU_REL64: 167fe6060f1SDimitry Andric case R_AMDGPU_REL16: 1680b57cec5SDimitry Andric return R_PC; 1690b57cec5SDimitry Andric case R_AMDGPU_GOTPCREL: 1700b57cec5SDimitry Andric case R_AMDGPU_GOTPCREL32_LO: 1710b57cec5SDimitry Andric case R_AMDGPU_GOTPCREL32_HI: 1720b57cec5SDimitry Andric return R_GOT_PC; 1730b57cec5SDimitry Andric default: 1740b57cec5SDimitry Andric error(getErrorLocation(loc) + "unknown relocation (" + Twine(type) + 1750b57cec5SDimitry Andric ") against symbol " + toString(s)); 1760b57cec5SDimitry Andric return R_NONE; 1770b57cec5SDimitry Andric } 1780b57cec5SDimitry Andric } 1790b57cec5SDimitry Andric 1800b57cec5SDimitry Andric RelType AMDGPU::getDynRel(RelType type) const { 1810b57cec5SDimitry Andric if (type == R_AMDGPU_ABS64) 1820b57cec5SDimitry Andric return type; 1830b57cec5SDimitry Andric return R_AMDGPU_NONE; 1840b57cec5SDimitry Andric } 1850b57cec5SDimitry Andric 1865ffd83dbSDimitry Andric TargetInfo *elf::getAMDGPUTargetInfo() { 1870b57cec5SDimitry Andric static AMDGPU target; 1880b57cec5SDimitry Andric return ⌖ 1890b57cec5SDimitry Andric } 190