1*0b57cec5SDimitry Andric //===- ELF.cpp - ELF object file implementation ---------------------------===// 2*0b57cec5SDimitry Andric // 3*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 5*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6*0b57cec5SDimitry Andric // 7*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 8*0b57cec5SDimitry Andric 9*0b57cec5SDimitry Andric #include "llvm/Object/ELF.h" 10*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELF.h" 11*0b57cec5SDimitry Andric #include "llvm/Support/LEB128.h" 12*0b57cec5SDimitry Andric 13*0b57cec5SDimitry Andric using namespace llvm; 14*0b57cec5SDimitry Andric using namespace object; 15*0b57cec5SDimitry Andric 16*0b57cec5SDimitry Andric #define STRINGIFY_ENUM_CASE(ns, name) \ 17*0b57cec5SDimitry Andric case ns::name: \ 18*0b57cec5SDimitry Andric return #name; 19*0b57cec5SDimitry Andric 20*0b57cec5SDimitry Andric #define ELF_RELOC(name, value) STRINGIFY_ENUM_CASE(ELF, name) 21*0b57cec5SDimitry Andric 22*0b57cec5SDimitry Andric StringRef llvm::object::getELFRelocationTypeName(uint32_t Machine, 23*0b57cec5SDimitry Andric uint32_t Type) { 24*0b57cec5SDimitry Andric switch (Machine) { 25*0b57cec5SDimitry Andric case ELF::EM_X86_64: 26*0b57cec5SDimitry Andric switch (Type) { 27*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/x86_64.def" 28*0b57cec5SDimitry Andric default: 29*0b57cec5SDimitry Andric break; 30*0b57cec5SDimitry Andric } 31*0b57cec5SDimitry Andric break; 32*0b57cec5SDimitry Andric case ELF::EM_386: 33*0b57cec5SDimitry Andric case ELF::EM_IAMCU: 34*0b57cec5SDimitry Andric switch (Type) { 35*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/i386.def" 36*0b57cec5SDimitry Andric default: 37*0b57cec5SDimitry Andric break; 38*0b57cec5SDimitry Andric } 39*0b57cec5SDimitry Andric break; 40*0b57cec5SDimitry Andric case ELF::EM_MIPS: 41*0b57cec5SDimitry Andric switch (Type) { 42*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Mips.def" 43*0b57cec5SDimitry Andric default: 44*0b57cec5SDimitry Andric break; 45*0b57cec5SDimitry Andric } 46*0b57cec5SDimitry Andric break; 47*0b57cec5SDimitry Andric case ELF::EM_AARCH64: 48*0b57cec5SDimitry Andric switch (Type) { 49*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/AArch64.def" 50*0b57cec5SDimitry Andric default: 51*0b57cec5SDimitry Andric break; 52*0b57cec5SDimitry Andric } 53*0b57cec5SDimitry Andric break; 54*0b57cec5SDimitry Andric case ELF::EM_ARM: 55*0b57cec5SDimitry Andric switch (Type) { 56*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/ARM.def" 57*0b57cec5SDimitry Andric default: 58*0b57cec5SDimitry Andric break; 59*0b57cec5SDimitry Andric } 60*0b57cec5SDimitry Andric break; 61*0b57cec5SDimitry Andric case ELF::EM_ARC_COMPACT: 62*0b57cec5SDimitry Andric case ELF::EM_ARC_COMPACT2: 63*0b57cec5SDimitry Andric switch (Type) { 64*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/ARC.def" 65*0b57cec5SDimitry Andric default: 66*0b57cec5SDimitry Andric break; 67*0b57cec5SDimitry Andric } 68*0b57cec5SDimitry Andric break; 69*0b57cec5SDimitry Andric case ELF::EM_AVR: 70*0b57cec5SDimitry Andric switch (Type) { 71*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/AVR.def" 72*0b57cec5SDimitry Andric default: 73*0b57cec5SDimitry Andric break; 74*0b57cec5SDimitry Andric } 75*0b57cec5SDimitry Andric break; 76*0b57cec5SDimitry Andric case ELF::EM_HEXAGON: 77*0b57cec5SDimitry Andric switch (Type) { 78*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Hexagon.def" 79*0b57cec5SDimitry Andric default: 80*0b57cec5SDimitry Andric break; 81*0b57cec5SDimitry Andric } 82*0b57cec5SDimitry Andric break; 83*0b57cec5SDimitry Andric case ELF::EM_LANAI: 84*0b57cec5SDimitry Andric switch (Type) { 85*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Lanai.def" 86*0b57cec5SDimitry Andric default: 87*0b57cec5SDimitry Andric break; 88*0b57cec5SDimitry Andric } 89*0b57cec5SDimitry Andric break; 90*0b57cec5SDimitry Andric case ELF::EM_PPC: 91*0b57cec5SDimitry Andric switch (Type) { 92*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/PowerPC.def" 93*0b57cec5SDimitry Andric default: 94*0b57cec5SDimitry Andric break; 95*0b57cec5SDimitry Andric } 96*0b57cec5SDimitry Andric break; 97*0b57cec5SDimitry Andric case ELF::EM_PPC64: 98*0b57cec5SDimitry Andric switch (Type) { 99*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/PowerPC64.def" 100*0b57cec5SDimitry Andric default: 101*0b57cec5SDimitry Andric break; 102*0b57cec5SDimitry Andric } 103*0b57cec5SDimitry Andric break; 104*0b57cec5SDimitry Andric case ELF::EM_RISCV: 105*0b57cec5SDimitry Andric switch (Type) { 106*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/RISCV.def" 107*0b57cec5SDimitry Andric default: 108*0b57cec5SDimitry Andric break; 109*0b57cec5SDimitry Andric } 110*0b57cec5SDimitry Andric break; 111*0b57cec5SDimitry Andric case ELF::EM_S390: 112*0b57cec5SDimitry Andric switch (Type) { 113*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/SystemZ.def" 114*0b57cec5SDimitry Andric default: 115*0b57cec5SDimitry Andric break; 116*0b57cec5SDimitry Andric } 117*0b57cec5SDimitry Andric break; 118*0b57cec5SDimitry Andric case ELF::EM_SPARC: 119*0b57cec5SDimitry Andric case ELF::EM_SPARC32PLUS: 120*0b57cec5SDimitry Andric case ELF::EM_SPARCV9: 121*0b57cec5SDimitry Andric switch (Type) { 122*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Sparc.def" 123*0b57cec5SDimitry Andric default: 124*0b57cec5SDimitry Andric break; 125*0b57cec5SDimitry Andric } 126*0b57cec5SDimitry Andric break; 127*0b57cec5SDimitry Andric case ELF::EM_AMDGPU: 128*0b57cec5SDimitry Andric switch (Type) { 129*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/AMDGPU.def" 130*0b57cec5SDimitry Andric default: 131*0b57cec5SDimitry Andric break; 132*0b57cec5SDimitry Andric } 133*0b57cec5SDimitry Andric break; 134*0b57cec5SDimitry Andric case ELF::EM_BPF: 135*0b57cec5SDimitry Andric switch (Type) { 136*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/BPF.def" 137*0b57cec5SDimitry Andric default: 138*0b57cec5SDimitry Andric break; 139*0b57cec5SDimitry Andric } 140*0b57cec5SDimitry Andric break; 141*0b57cec5SDimitry Andric case ELF::EM_MSP430: 142*0b57cec5SDimitry Andric switch (Type) { 143*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/MSP430.def" 144*0b57cec5SDimitry Andric default: 145*0b57cec5SDimitry Andric break; 146*0b57cec5SDimitry Andric } 147*0b57cec5SDimitry Andric break; 148*0b57cec5SDimitry Andric default: 149*0b57cec5SDimitry Andric break; 150*0b57cec5SDimitry Andric } 151*0b57cec5SDimitry Andric return "Unknown"; 152*0b57cec5SDimitry Andric } 153*0b57cec5SDimitry Andric 154*0b57cec5SDimitry Andric #undef ELF_RELOC 155*0b57cec5SDimitry Andric 156*0b57cec5SDimitry Andric uint32_t llvm::object::getELFRelativeRelocationType(uint32_t Machine) { 157*0b57cec5SDimitry Andric switch (Machine) { 158*0b57cec5SDimitry Andric case ELF::EM_X86_64: 159*0b57cec5SDimitry Andric return ELF::R_X86_64_RELATIVE; 160*0b57cec5SDimitry Andric case ELF::EM_386: 161*0b57cec5SDimitry Andric case ELF::EM_IAMCU: 162*0b57cec5SDimitry Andric return ELF::R_386_RELATIVE; 163*0b57cec5SDimitry Andric case ELF::EM_MIPS: 164*0b57cec5SDimitry Andric break; 165*0b57cec5SDimitry Andric case ELF::EM_AARCH64: 166*0b57cec5SDimitry Andric return ELF::R_AARCH64_RELATIVE; 167*0b57cec5SDimitry Andric case ELF::EM_ARM: 168*0b57cec5SDimitry Andric return ELF::R_ARM_RELATIVE; 169*0b57cec5SDimitry Andric case ELF::EM_ARC_COMPACT: 170*0b57cec5SDimitry Andric case ELF::EM_ARC_COMPACT2: 171*0b57cec5SDimitry Andric return ELF::R_ARC_RELATIVE; 172*0b57cec5SDimitry Andric case ELF::EM_AVR: 173*0b57cec5SDimitry Andric break; 174*0b57cec5SDimitry Andric case ELF::EM_HEXAGON: 175*0b57cec5SDimitry Andric return ELF::R_HEX_RELATIVE; 176*0b57cec5SDimitry Andric case ELF::EM_LANAI: 177*0b57cec5SDimitry Andric break; 178*0b57cec5SDimitry Andric case ELF::EM_PPC: 179*0b57cec5SDimitry Andric break; 180*0b57cec5SDimitry Andric case ELF::EM_PPC64: 181*0b57cec5SDimitry Andric return ELF::R_PPC64_RELATIVE; 182*0b57cec5SDimitry Andric case ELF::EM_RISCV: 183*0b57cec5SDimitry Andric return ELF::R_RISCV_RELATIVE; 184*0b57cec5SDimitry Andric case ELF::EM_S390: 185*0b57cec5SDimitry Andric return ELF::R_390_RELATIVE; 186*0b57cec5SDimitry Andric case ELF::EM_SPARC: 187*0b57cec5SDimitry Andric case ELF::EM_SPARC32PLUS: 188*0b57cec5SDimitry Andric case ELF::EM_SPARCV9: 189*0b57cec5SDimitry Andric return ELF::R_SPARC_RELATIVE; 190*0b57cec5SDimitry Andric case ELF::EM_AMDGPU: 191*0b57cec5SDimitry Andric break; 192*0b57cec5SDimitry Andric case ELF::EM_BPF: 193*0b57cec5SDimitry Andric break; 194*0b57cec5SDimitry Andric default: 195*0b57cec5SDimitry Andric break; 196*0b57cec5SDimitry Andric } 197*0b57cec5SDimitry Andric return 0; 198*0b57cec5SDimitry Andric } 199*0b57cec5SDimitry Andric 200*0b57cec5SDimitry Andric StringRef llvm::object::getELFSectionTypeName(uint32_t Machine, unsigned Type) { 201*0b57cec5SDimitry Andric switch (Machine) { 202*0b57cec5SDimitry Andric case ELF::EM_ARM: 203*0b57cec5SDimitry Andric switch (Type) { 204*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_ARM_EXIDX); 205*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_ARM_PREEMPTMAP); 206*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_ARM_ATTRIBUTES); 207*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_ARM_DEBUGOVERLAY); 208*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_ARM_OVERLAYSECTION); 209*0b57cec5SDimitry Andric } 210*0b57cec5SDimitry Andric break; 211*0b57cec5SDimitry Andric case ELF::EM_HEXAGON: 212*0b57cec5SDimitry Andric switch (Type) { STRINGIFY_ENUM_CASE(ELF, SHT_HEX_ORDERED); } 213*0b57cec5SDimitry Andric break; 214*0b57cec5SDimitry Andric case ELF::EM_X86_64: 215*0b57cec5SDimitry Andric switch (Type) { STRINGIFY_ENUM_CASE(ELF, SHT_X86_64_UNWIND); } 216*0b57cec5SDimitry Andric break; 217*0b57cec5SDimitry Andric case ELF::EM_MIPS: 218*0b57cec5SDimitry Andric case ELF::EM_MIPS_RS3_LE: 219*0b57cec5SDimitry Andric switch (Type) { 220*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_REGINFO); 221*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_OPTIONS); 222*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_DWARF); 223*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_ABIFLAGS); 224*0b57cec5SDimitry Andric } 225*0b57cec5SDimitry Andric break; 226*0b57cec5SDimitry Andric default: 227*0b57cec5SDimitry Andric break; 228*0b57cec5SDimitry Andric } 229*0b57cec5SDimitry Andric 230*0b57cec5SDimitry Andric switch (Type) { 231*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_NULL); 232*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_PROGBITS); 233*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_SYMTAB); 234*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_STRTAB); 235*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_RELA); 236*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_HASH); 237*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_DYNAMIC); 238*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_NOTE); 239*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_NOBITS); 240*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_REL); 241*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_SHLIB); 242*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_DYNSYM); 243*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_INIT_ARRAY); 244*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_FINI_ARRAY); 245*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_PREINIT_ARRAY); 246*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_GROUP); 247*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_SYMTAB_SHNDX); 248*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_RELR); 249*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_ANDROID_REL); 250*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_ANDROID_RELA); 251*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_ANDROID_RELR); 252*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_ODRTAB); 253*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_LINKER_OPTIONS); 254*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_CALL_GRAPH_PROFILE); 255*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_ADDRSIG); 256*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_DEPENDENT_LIBRARIES); 257*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_SYMPART); 258*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_GNU_ATTRIBUTES); 259*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_GNU_HASH); 260*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_GNU_verdef); 261*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_GNU_verneed); 262*0b57cec5SDimitry Andric STRINGIFY_ENUM_CASE(ELF, SHT_GNU_versym); 263*0b57cec5SDimitry Andric default: 264*0b57cec5SDimitry Andric return "Unknown"; 265*0b57cec5SDimitry Andric } 266*0b57cec5SDimitry Andric } 267*0b57cec5SDimitry Andric 268*0b57cec5SDimitry Andric template <class ELFT> 269*0b57cec5SDimitry Andric Expected<std::vector<typename ELFT::Rela>> 270*0b57cec5SDimitry Andric ELFFile<ELFT>::decode_relrs(Elf_Relr_Range relrs) const { 271*0b57cec5SDimitry Andric // This function decodes the contents of an SHT_RELR packed relocation 272*0b57cec5SDimitry Andric // section. 273*0b57cec5SDimitry Andric // 274*0b57cec5SDimitry Andric // Proposal for adding SHT_RELR sections to generic-abi is here: 275*0b57cec5SDimitry Andric // https://groups.google.com/forum/#!topic/generic-abi/bX460iggiKg 276*0b57cec5SDimitry Andric // 277*0b57cec5SDimitry Andric // The encoded sequence of Elf64_Relr entries in a SHT_RELR section looks 278*0b57cec5SDimitry Andric // like [ AAAAAAAA BBBBBBB1 BBBBBBB1 ... AAAAAAAA BBBBBB1 ... ] 279*0b57cec5SDimitry Andric // 280*0b57cec5SDimitry Andric // i.e. start with an address, followed by any number of bitmaps. The address 281*0b57cec5SDimitry Andric // entry encodes 1 relocation. The subsequent bitmap entries encode up to 63 282*0b57cec5SDimitry Andric // relocations each, at subsequent offsets following the last address entry. 283*0b57cec5SDimitry Andric // 284*0b57cec5SDimitry Andric // The bitmap entries must have 1 in the least significant bit. The assumption 285*0b57cec5SDimitry Andric // here is that an address cannot have 1 in lsb. Odd addresses are not 286*0b57cec5SDimitry Andric // supported. 287*0b57cec5SDimitry Andric // 288*0b57cec5SDimitry Andric // Excluding the least significant bit in the bitmap, each non-zero bit in 289*0b57cec5SDimitry Andric // the bitmap represents a relocation to be applied to a corresponding machine 290*0b57cec5SDimitry Andric // word that follows the base address word. The second least significant bit 291*0b57cec5SDimitry Andric // represents the machine word immediately following the initial address, and 292*0b57cec5SDimitry Andric // each bit that follows represents the next word, in linear order. As such, 293*0b57cec5SDimitry Andric // a single bitmap can encode up to 31 relocations in a 32-bit object, and 294*0b57cec5SDimitry Andric // 63 relocations in a 64-bit object. 295*0b57cec5SDimitry Andric // 296*0b57cec5SDimitry Andric // This encoding has a couple of interesting properties: 297*0b57cec5SDimitry Andric // 1. Looking at any entry, it is clear whether it's an address or a bitmap: 298*0b57cec5SDimitry Andric // even means address, odd means bitmap. 299*0b57cec5SDimitry Andric // 2. Just a simple list of addresses is a valid encoding. 300*0b57cec5SDimitry Andric 301*0b57cec5SDimitry Andric Elf_Rela Rela; 302*0b57cec5SDimitry Andric Rela.r_info = 0; 303*0b57cec5SDimitry Andric Rela.r_addend = 0; 304*0b57cec5SDimitry Andric Rela.setType(getRelativeRelocationType(), false); 305*0b57cec5SDimitry Andric std::vector<Elf_Rela> Relocs; 306*0b57cec5SDimitry Andric 307*0b57cec5SDimitry Andric // Word type: uint32_t for Elf32, and uint64_t for Elf64. 308*0b57cec5SDimitry Andric typedef typename ELFT::uint Word; 309*0b57cec5SDimitry Andric 310*0b57cec5SDimitry Andric // Word size in number of bytes. 311*0b57cec5SDimitry Andric const size_t WordSize = sizeof(Word); 312*0b57cec5SDimitry Andric 313*0b57cec5SDimitry Andric // Number of bits used for the relocation offsets bitmap. 314*0b57cec5SDimitry Andric // These many relative relocations can be encoded in a single entry. 315*0b57cec5SDimitry Andric const size_t NBits = 8*WordSize - 1; 316*0b57cec5SDimitry Andric 317*0b57cec5SDimitry Andric Word Base = 0; 318*0b57cec5SDimitry Andric for (const Elf_Relr &R : relrs) { 319*0b57cec5SDimitry Andric Word Entry = R; 320*0b57cec5SDimitry Andric if ((Entry&1) == 0) { 321*0b57cec5SDimitry Andric // Even entry: encodes the offset for next relocation. 322*0b57cec5SDimitry Andric Rela.r_offset = Entry; 323*0b57cec5SDimitry Andric Relocs.push_back(Rela); 324*0b57cec5SDimitry Andric // Set base offset for subsequent bitmap entries. 325*0b57cec5SDimitry Andric Base = Entry + WordSize; 326*0b57cec5SDimitry Andric continue; 327*0b57cec5SDimitry Andric } 328*0b57cec5SDimitry Andric 329*0b57cec5SDimitry Andric // Odd entry: encodes bitmap for relocations starting at base. 330*0b57cec5SDimitry Andric Word Offset = Base; 331*0b57cec5SDimitry Andric while (Entry != 0) { 332*0b57cec5SDimitry Andric Entry >>= 1; 333*0b57cec5SDimitry Andric if ((Entry&1) != 0) { 334*0b57cec5SDimitry Andric Rela.r_offset = Offset; 335*0b57cec5SDimitry Andric Relocs.push_back(Rela); 336*0b57cec5SDimitry Andric } 337*0b57cec5SDimitry Andric Offset += WordSize; 338*0b57cec5SDimitry Andric } 339*0b57cec5SDimitry Andric 340*0b57cec5SDimitry Andric // Advance base offset by NBits words. 341*0b57cec5SDimitry Andric Base += NBits * WordSize; 342*0b57cec5SDimitry Andric } 343*0b57cec5SDimitry Andric 344*0b57cec5SDimitry Andric return Relocs; 345*0b57cec5SDimitry Andric } 346*0b57cec5SDimitry Andric 347*0b57cec5SDimitry Andric template <class ELFT> 348*0b57cec5SDimitry Andric Expected<std::vector<typename ELFT::Rela>> 349*0b57cec5SDimitry Andric ELFFile<ELFT>::android_relas(const Elf_Shdr *Sec) const { 350*0b57cec5SDimitry Andric // This function reads relocations in Android's packed relocation format, 351*0b57cec5SDimitry Andric // which is based on SLEB128 and delta encoding. 352*0b57cec5SDimitry Andric Expected<ArrayRef<uint8_t>> ContentsOrErr = getSectionContents(Sec); 353*0b57cec5SDimitry Andric if (!ContentsOrErr) 354*0b57cec5SDimitry Andric return ContentsOrErr.takeError(); 355*0b57cec5SDimitry Andric const uint8_t *Cur = ContentsOrErr->begin(); 356*0b57cec5SDimitry Andric const uint8_t *End = ContentsOrErr->end(); 357*0b57cec5SDimitry Andric if (ContentsOrErr->size() < 4 || Cur[0] != 'A' || Cur[1] != 'P' || 358*0b57cec5SDimitry Andric Cur[2] != 'S' || Cur[3] != '2') 359*0b57cec5SDimitry Andric return createError("invalid packed relocation header"); 360*0b57cec5SDimitry Andric Cur += 4; 361*0b57cec5SDimitry Andric 362*0b57cec5SDimitry Andric const char *ErrStr = nullptr; 363*0b57cec5SDimitry Andric auto ReadSLEB = [&]() -> int64_t { 364*0b57cec5SDimitry Andric if (ErrStr) 365*0b57cec5SDimitry Andric return 0; 366*0b57cec5SDimitry Andric unsigned Len; 367*0b57cec5SDimitry Andric int64_t Result = decodeSLEB128(Cur, &Len, End, &ErrStr); 368*0b57cec5SDimitry Andric Cur += Len; 369*0b57cec5SDimitry Andric return Result; 370*0b57cec5SDimitry Andric }; 371*0b57cec5SDimitry Andric 372*0b57cec5SDimitry Andric uint64_t NumRelocs = ReadSLEB(); 373*0b57cec5SDimitry Andric uint64_t Offset = ReadSLEB(); 374*0b57cec5SDimitry Andric uint64_t Addend = 0; 375*0b57cec5SDimitry Andric 376*0b57cec5SDimitry Andric if (ErrStr) 377*0b57cec5SDimitry Andric return createError(ErrStr); 378*0b57cec5SDimitry Andric 379*0b57cec5SDimitry Andric std::vector<Elf_Rela> Relocs; 380*0b57cec5SDimitry Andric Relocs.reserve(NumRelocs); 381*0b57cec5SDimitry Andric while (NumRelocs) { 382*0b57cec5SDimitry Andric uint64_t NumRelocsInGroup = ReadSLEB(); 383*0b57cec5SDimitry Andric if (NumRelocsInGroup > NumRelocs) 384*0b57cec5SDimitry Andric return createError("relocation group unexpectedly large"); 385*0b57cec5SDimitry Andric NumRelocs -= NumRelocsInGroup; 386*0b57cec5SDimitry Andric 387*0b57cec5SDimitry Andric uint64_t GroupFlags = ReadSLEB(); 388*0b57cec5SDimitry Andric bool GroupedByInfo = GroupFlags & ELF::RELOCATION_GROUPED_BY_INFO_FLAG; 389*0b57cec5SDimitry Andric bool GroupedByOffsetDelta = GroupFlags & ELF::RELOCATION_GROUPED_BY_OFFSET_DELTA_FLAG; 390*0b57cec5SDimitry Andric bool GroupedByAddend = GroupFlags & ELF::RELOCATION_GROUPED_BY_ADDEND_FLAG; 391*0b57cec5SDimitry Andric bool GroupHasAddend = GroupFlags & ELF::RELOCATION_GROUP_HAS_ADDEND_FLAG; 392*0b57cec5SDimitry Andric 393*0b57cec5SDimitry Andric uint64_t GroupOffsetDelta; 394*0b57cec5SDimitry Andric if (GroupedByOffsetDelta) 395*0b57cec5SDimitry Andric GroupOffsetDelta = ReadSLEB(); 396*0b57cec5SDimitry Andric 397*0b57cec5SDimitry Andric uint64_t GroupRInfo; 398*0b57cec5SDimitry Andric if (GroupedByInfo) 399*0b57cec5SDimitry Andric GroupRInfo = ReadSLEB(); 400*0b57cec5SDimitry Andric 401*0b57cec5SDimitry Andric if (GroupedByAddend && GroupHasAddend) 402*0b57cec5SDimitry Andric Addend += ReadSLEB(); 403*0b57cec5SDimitry Andric 404*0b57cec5SDimitry Andric if (!GroupHasAddend) 405*0b57cec5SDimitry Andric Addend = 0; 406*0b57cec5SDimitry Andric 407*0b57cec5SDimitry Andric for (uint64_t I = 0; I != NumRelocsInGroup; ++I) { 408*0b57cec5SDimitry Andric Elf_Rela R; 409*0b57cec5SDimitry Andric Offset += GroupedByOffsetDelta ? GroupOffsetDelta : ReadSLEB(); 410*0b57cec5SDimitry Andric R.r_offset = Offset; 411*0b57cec5SDimitry Andric R.r_info = GroupedByInfo ? GroupRInfo : ReadSLEB(); 412*0b57cec5SDimitry Andric if (GroupHasAddend && !GroupedByAddend) 413*0b57cec5SDimitry Andric Addend += ReadSLEB(); 414*0b57cec5SDimitry Andric R.r_addend = Addend; 415*0b57cec5SDimitry Andric Relocs.push_back(R); 416*0b57cec5SDimitry Andric 417*0b57cec5SDimitry Andric if (ErrStr) 418*0b57cec5SDimitry Andric return createError(ErrStr); 419*0b57cec5SDimitry Andric } 420*0b57cec5SDimitry Andric 421*0b57cec5SDimitry Andric if (ErrStr) 422*0b57cec5SDimitry Andric return createError(ErrStr); 423*0b57cec5SDimitry Andric } 424*0b57cec5SDimitry Andric 425*0b57cec5SDimitry Andric return Relocs; 426*0b57cec5SDimitry Andric } 427*0b57cec5SDimitry Andric 428*0b57cec5SDimitry Andric template <class ELFT> 429*0b57cec5SDimitry Andric std::string ELFFile<ELFT>::getDynamicTagAsString(unsigned Arch, 430*0b57cec5SDimitry Andric uint64_t Type) const { 431*0b57cec5SDimitry Andric #define DYNAMIC_STRINGIFY_ENUM(tag, value) \ 432*0b57cec5SDimitry Andric case value: \ 433*0b57cec5SDimitry Andric return #tag; 434*0b57cec5SDimitry Andric 435*0b57cec5SDimitry Andric #define DYNAMIC_TAG(n, v) 436*0b57cec5SDimitry Andric switch (Arch) { 437*0b57cec5SDimitry Andric case ELF::EM_AARCH64: 438*0b57cec5SDimitry Andric switch (Type) { 439*0b57cec5SDimitry Andric #define AARCH64_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value) 440*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def" 441*0b57cec5SDimitry Andric #undef AARCH64_DYNAMIC_TAG 442*0b57cec5SDimitry Andric } 443*0b57cec5SDimitry Andric break; 444*0b57cec5SDimitry Andric 445*0b57cec5SDimitry Andric case ELF::EM_HEXAGON: 446*0b57cec5SDimitry Andric switch (Type) { 447*0b57cec5SDimitry Andric #define HEXAGON_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value) 448*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def" 449*0b57cec5SDimitry Andric #undef HEXAGON_DYNAMIC_TAG 450*0b57cec5SDimitry Andric } 451*0b57cec5SDimitry Andric break; 452*0b57cec5SDimitry Andric 453*0b57cec5SDimitry Andric case ELF::EM_MIPS: 454*0b57cec5SDimitry Andric switch (Type) { 455*0b57cec5SDimitry Andric #define MIPS_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value) 456*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def" 457*0b57cec5SDimitry Andric #undef MIPS_DYNAMIC_TAG 458*0b57cec5SDimitry Andric } 459*0b57cec5SDimitry Andric break; 460*0b57cec5SDimitry Andric 461*0b57cec5SDimitry Andric case ELF::EM_PPC64: 462*0b57cec5SDimitry Andric switch (Type) { 463*0b57cec5SDimitry Andric #define PPC64_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value) 464*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def" 465*0b57cec5SDimitry Andric #undef PPC64_DYNAMIC_TAG 466*0b57cec5SDimitry Andric } 467*0b57cec5SDimitry Andric break; 468*0b57cec5SDimitry Andric } 469*0b57cec5SDimitry Andric #undef DYNAMIC_TAG 470*0b57cec5SDimitry Andric switch (Type) { 471*0b57cec5SDimitry Andric // Now handle all dynamic tags except the architecture specific ones 472*0b57cec5SDimitry Andric #define AARCH64_DYNAMIC_TAG(name, value) 473*0b57cec5SDimitry Andric #define MIPS_DYNAMIC_TAG(name, value) 474*0b57cec5SDimitry Andric #define HEXAGON_DYNAMIC_TAG(name, value) 475*0b57cec5SDimitry Andric #define PPC64_DYNAMIC_TAG(name, value) 476*0b57cec5SDimitry Andric // Also ignore marker tags such as DT_HIOS (maps to DT_VERNEEDNUM), etc. 477*0b57cec5SDimitry Andric #define DYNAMIC_TAG_MARKER(name, value) 478*0b57cec5SDimitry Andric #define DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value) 479*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def" 480*0b57cec5SDimitry Andric #undef DYNAMIC_TAG 481*0b57cec5SDimitry Andric #undef AARCH64_DYNAMIC_TAG 482*0b57cec5SDimitry Andric #undef MIPS_DYNAMIC_TAG 483*0b57cec5SDimitry Andric #undef HEXAGON_DYNAMIC_TAG 484*0b57cec5SDimitry Andric #undef PPC64_DYNAMIC_TAG 485*0b57cec5SDimitry Andric #undef DYNAMIC_TAG_MARKER 486*0b57cec5SDimitry Andric #undef DYNAMIC_STRINGIFY_ENUM 487*0b57cec5SDimitry Andric default: 488*0b57cec5SDimitry Andric return "<unknown:>0x" + utohexstr(Type, true); 489*0b57cec5SDimitry Andric } 490*0b57cec5SDimitry Andric } 491*0b57cec5SDimitry Andric 492*0b57cec5SDimitry Andric template <class ELFT> 493*0b57cec5SDimitry Andric std::string ELFFile<ELFT>::getDynamicTagAsString(uint64_t Type) const { 494*0b57cec5SDimitry Andric return getDynamicTagAsString(getHeader()->e_machine, Type); 495*0b57cec5SDimitry Andric } 496*0b57cec5SDimitry Andric 497*0b57cec5SDimitry Andric template <class ELFT> 498*0b57cec5SDimitry Andric Expected<typename ELFT::DynRange> ELFFile<ELFT>::dynamicEntries() const { 499*0b57cec5SDimitry Andric ArrayRef<Elf_Dyn> Dyn; 500*0b57cec5SDimitry Andric size_t DynSecSize = 0; 501*0b57cec5SDimitry Andric 502*0b57cec5SDimitry Andric auto ProgramHeadersOrError = program_headers(); 503*0b57cec5SDimitry Andric if (!ProgramHeadersOrError) 504*0b57cec5SDimitry Andric return ProgramHeadersOrError.takeError(); 505*0b57cec5SDimitry Andric 506*0b57cec5SDimitry Andric for (const Elf_Phdr &Phdr : *ProgramHeadersOrError) { 507*0b57cec5SDimitry Andric if (Phdr.p_type == ELF::PT_DYNAMIC) { 508*0b57cec5SDimitry Andric Dyn = makeArrayRef( 509*0b57cec5SDimitry Andric reinterpret_cast<const Elf_Dyn *>(base() + Phdr.p_offset), 510*0b57cec5SDimitry Andric Phdr.p_filesz / sizeof(Elf_Dyn)); 511*0b57cec5SDimitry Andric DynSecSize = Phdr.p_filesz; 512*0b57cec5SDimitry Andric break; 513*0b57cec5SDimitry Andric } 514*0b57cec5SDimitry Andric } 515*0b57cec5SDimitry Andric 516*0b57cec5SDimitry Andric // If we can't find the dynamic section in the program headers, we just fall 517*0b57cec5SDimitry Andric // back on the sections. 518*0b57cec5SDimitry Andric if (Dyn.empty()) { 519*0b57cec5SDimitry Andric auto SectionsOrError = sections(); 520*0b57cec5SDimitry Andric if (!SectionsOrError) 521*0b57cec5SDimitry Andric return SectionsOrError.takeError(); 522*0b57cec5SDimitry Andric 523*0b57cec5SDimitry Andric for (const Elf_Shdr &Sec : *SectionsOrError) { 524*0b57cec5SDimitry Andric if (Sec.sh_type == ELF::SHT_DYNAMIC) { 525*0b57cec5SDimitry Andric Expected<ArrayRef<Elf_Dyn>> DynOrError = 526*0b57cec5SDimitry Andric getSectionContentsAsArray<Elf_Dyn>(&Sec); 527*0b57cec5SDimitry Andric if (!DynOrError) 528*0b57cec5SDimitry Andric return DynOrError.takeError(); 529*0b57cec5SDimitry Andric Dyn = *DynOrError; 530*0b57cec5SDimitry Andric DynSecSize = Sec.sh_size; 531*0b57cec5SDimitry Andric break; 532*0b57cec5SDimitry Andric } 533*0b57cec5SDimitry Andric } 534*0b57cec5SDimitry Andric 535*0b57cec5SDimitry Andric if (!Dyn.data()) 536*0b57cec5SDimitry Andric return ArrayRef<Elf_Dyn>(); 537*0b57cec5SDimitry Andric } 538*0b57cec5SDimitry Andric 539*0b57cec5SDimitry Andric if (Dyn.empty()) 540*0b57cec5SDimitry Andric // TODO: this error is untested. 541*0b57cec5SDimitry Andric return createError("invalid empty dynamic section"); 542*0b57cec5SDimitry Andric 543*0b57cec5SDimitry Andric if (DynSecSize % sizeof(Elf_Dyn) != 0) 544*0b57cec5SDimitry Andric // TODO: this error is untested. 545*0b57cec5SDimitry Andric return createError("malformed dynamic section"); 546*0b57cec5SDimitry Andric 547*0b57cec5SDimitry Andric if (Dyn.back().d_tag != ELF::DT_NULL) 548*0b57cec5SDimitry Andric // TODO: this error is untested. 549*0b57cec5SDimitry Andric return createError("dynamic sections must be DT_NULL terminated"); 550*0b57cec5SDimitry Andric 551*0b57cec5SDimitry Andric return Dyn; 552*0b57cec5SDimitry Andric } 553*0b57cec5SDimitry Andric 554*0b57cec5SDimitry Andric template <class ELFT> 555*0b57cec5SDimitry Andric Expected<const uint8_t *> ELFFile<ELFT>::toMappedAddr(uint64_t VAddr) const { 556*0b57cec5SDimitry Andric auto ProgramHeadersOrError = program_headers(); 557*0b57cec5SDimitry Andric if (!ProgramHeadersOrError) 558*0b57cec5SDimitry Andric return ProgramHeadersOrError.takeError(); 559*0b57cec5SDimitry Andric 560*0b57cec5SDimitry Andric llvm::SmallVector<Elf_Phdr *, 4> LoadSegments; 561*0b57cec5SDimitry Andric 562*0b57cec5SDimitry Andric for (const Elf_Phdr &Phdr : *ProgramHeadersOrError) 563*0b57cec5SDimitry Andric if (Phdr.p_type == ELF::PT_LOAD) 564*0b57cec5SDimitry Andric LoadSegments.push_back(const_cast<Elf_Phdr *>(&Phdr)); 565*0b57cec5SDimitry Andric 566*0b57cec5SDimitry Andric const Elf_Phdr *const *I = 567*0b57cec5SDimitry Andric std::upper_bound(LoadSegments.begin(), LoadSegments.end(), VAddr, 568*0b57cec5SDimitry Andric [](uint64_t VAddr, const Elf_Phdr_Impl<ELFT> *Phdr) { 569*0b57cec5SDimitry Andric return VAddr < Phdr->p_vaddr; 570*0b57cec5SDimitry Andric }); 571*0b57cec5SDimitry Andric 572*0b57cec5SDimitry Andric if (I == LoadSegments.begin()) 573*0b57cec5SDimitry Andric return createError("virtual address is not in any segment: 0x" + 574*0b57cec5SDimitry Andric Twine::utohexstr(VAddr)); 575*0b57cec5SDimitry Andric --I; 576*0b57cec5SDimitry Andric const Elf_Phdr &Phdr = **I; 577*0b57cec5SDimitry Andric uint64_t Delta = VAddr - Phdr.p_vaddr; 578*0b57cec5SDimitry Andric if (Delta >= Phdr.p_filesz) 579*0b57cec5SDimitry Andric return createError("virtual address is not in any segment: 0x" + 580*0b57cec5SDimitry Andric Twine::utohexstr(VAddr)); 581*0b57cec5SDimitry Andric return base() + Phdr.p_offset + Delta; 582*0b57cec5SDimitry Andric } 583*0b57cec5SDimitry Andric 584*0b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF32LE>; 585*0b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF32BE>; 586*0b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF64LE>; 587*0b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF64BE>; 588