xref: /freebsd/contrib/llvm-project/llvm/lib/Object/ELF.cpp (revision e8d8bef961a50d4dc22501cde4fb9fb0be1b2532)
10b57cec5SDimitry Andric //===- ELF.cpp - ELF object file implementation ---------------------------===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric 
90b57cec5SDimitry Andric #include "llvm/Object/ELF.h"
100b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELF.h"
110b57cec5SDimitry Andric #include "llvm/Support/LEB128.h"
120b57cec5SDimitry Andric 
130b57cec5SDimitry Andric using namespace llvm;
140b57cec5SDimitry Andric using namespace object;
150b57cec5SDimitry Andric 
160b57cec5SDimitry Andric #define STRINGIFY_ENUM_CASE(ns, name)                                          \
170b57cec5SDimitry Andric   case ns::name:                                                               \
180b57cec5SDimitry Andric     return #name;
190b57cec5SDimitry Andric 
200b57cec5SDimitry Andric #define ELF_RELOC(name, value) STRINGIFY_ENUM_CASE(ELF, name)
210b57cec5SDimitry Andric 
220b57cec5SDimitry Andric StringRef llvm::object::getELFRelocationTypeName(uint32_t Machine,
230b57cec5SDimitry Andric                                                  uint32_t Type) {
240b57cec5SDimitry Andric   switch (Machine) {
250b57cec5SDimitry Andric   case ELF::EM_X86_64:
260b57cec5SDimitry Andric     switch (Type) {
270b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/x86_64.def"
280b57cec5SDimitry Andric     default:
290b57cec5SDimitry Andric       break;
300b57cec5SDimitry Andric     }
310b57cec5SDimitry Andric     break;
320b57cec5SDimitry Andric   case ELF::EM_386:
330b57cec5SDimitry Andric   case ELF::EM_IAMCU:
340b57cec5SDimitry Andric     switch (Type) {
350b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/i386.def"
360b57cec5SDimitry Andric     default:
370b57cec5SDimitry Andric       break;
380b57cec5SDimitry Andric     }
390b57cec5SDimitry Andric     break;
400b57cec5SDimitry Andric   case ELF::EM_MIPS:
410b57cec5SDimitry Andric     switch (Type) {
420b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Mips.def"
430b57cec5SDimitry Andric     default:
440b57cec5SDimitry Andric       break;
450b57cec5SDimitry Andric     }
460b57cec5SDimitry Andric     break;
470b57cec5SDimitry Andric   case ELF::EM_AARCH64:
480b57cec5SDimitry Andric     switch (Type) {
490b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/AArch64.def"
500b57cec5SDimitry Andric     default:
510b57cec5SDimitry Andric       break;
520b57cec5SDimitry Andric     }
530b57cec5SDimitry Andric     break;
540b57cec5SDimitry Andric   case ELF::EM_ARM:
550b57cec5SDimitry Andric     switch (Type) {
560b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/ARM.def"
570b57cec5SDimitry Andric     default:
580b57cec5SDimitry Andric       break;
590b57cec5SDimitry Andric     }
600b57cec5SDimitry Andric     break;
610b57cec5SDimitry Andric   case ELF::EM_ARC_COMPACT:
620b57cec5SDimitry Andric   case ELF::EM_ARC_COMPACT2:
630b57cec5SDimitry Andric     switch (Type) {
640b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/ARC.def"
650b57cec5SDimitry Andric     default:
660b57cec5SDimitry Andric       break;
670b57cec5SDimitry Andric     }
680b57cec5SDimitry Andric     break;
690b57cec5SDimitry Andric   case ELF::EM_AVR:
700b57cec5SDimitry Andric     switch (Type) {
710b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/AVR.def"
720b57cec5SDimitry Andric     default:
730b57cec5SDimitry Andric       break;
740b57cec5SDimitry Andric     }
750b57cec5SDimitry Andric     break;
760b57cec5SDimitry Andric   case ELF::EM_HEXAGON:
770b57cec5SDimitry Andric     switch (Type) {
780b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Hexagon.def"
790b57cec5SDimitry Andric     default:
800b57cec5SDimitry Andric       break;
810b57cec5SDimitry Andric     }
820b57cec5SDimitry Andric     break;
830b57cec5SDimitry Andric   case ELF::EM_LANAI:
840b57cec5SDimitry Andric     switch (Type) {
850b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Lanai.def"
860b57cec5SDimitry Andric     default:
870b57cec5SDimitry Andric       break;
880b57cec5SDimitry Andric     }
890b57cec5SDimitry Andric     break;
900b57cec5SDimitry Andric   case ELF::EM_PPC:
910b57cec5SDimitry Andric     switch (Type) {
920b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/PowerPC.def"
930b57cec5SDimitry Andric     default:
940b57cec5SDimitry Andric       break;
950b57cec5SDimitry Andric     }
960b57cec5SDimitry Andric     break;
970b57cec5SDimitry Andric   case ELF::EM_PPC64:
980b57cec5SDimitry Andric     switch (Type) {
990b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/PowerPC64.def"
1000b57cec5SDimitry Andric     default:
1010b57cec5SDimitry Andric       break;
1020b57cec5SDimitry Andric     }
1030b57cec5SDimitry Andric     break;
1040b57cec5SDimitry Andric   case ELF::EM_RISCV:
1050b57cec5SDimitry Andric     switch (Type) {
1060b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/RISCV.def"
1070b57cec5SDimitry Andric     default:
1080b57cec5SDimitry Andric       break;
1090b57cec5SDimitry Andric     }
1100b57cec5SDimitry Andric     break;
1110b57cec5SDimitry Andric   case ELF::EM_S390:
1120b57cec5SDimitry Andric     switch (Type) {
1130b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/SystemZ.def"
1140b57cec5SDimitry Andric     default:
1150b57cec5SDimitry Andric       break;
1160b57cec5SDimitry Andric     }
1170b57cec5SDimitry Andric     break;
1180b57cec5SDimitry Andric   case ELF::EM_SPARC:
1190b57cec5SDimitry Andric   case ELF::EM_SPARC32PLUS:
1200b57cec5SDimitry Andric   case ELF::EM_SPARCV9:
1210b57cec5SDimitry Andric     switch (Type) {
1220b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Sparc.def"
1230b57cec5SDimitry Andric     default:
1240b57cec5SDimitry Andric       break;
1250b57cec5SDimitry Andric     }
1260b57cec5SDimitry Andric     break;
1270b57cec5SDimitry Andric   case ELF::EM_AMDGPU:
1280b57cec5SDimitry Andric     switch (Type) {
1290b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/AMDGPU.def"
1300b57cec5SDimitry Andric     default:
1310b57cec5SDimitry Andric       break;
1320b57cec5SDimitry Andric     }
1330b57cec5SDimitry Andric     break;
1340b57cec5SDimitry Andric   case ELF::EM_BPF:
1350b57cec5SDimitry Andric     switch (Type) {
1360b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/BPF.def"
1370b57cec5SDimitry Andric     default:
1380b57cec5SDimitry Andric       break;
1390b57cec5SDimitry Andric     }
1400b57cec5SDimitry Andric     break;
1410b57cec5SDimitry Andric   case ELF::EM_MSP430:
1420b57cec5SDimitry Andric     switch (Type) {
1430b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/MSP430.def"
1440b57cec5SDimitry Andric     default:
1450b57cec5SDimitry Andric       break;
1460b57cec5SDimitry Andric     }
1470b57cec5SDimitry Andric     break;
1485ffd83dbSDimitry Andric   case ELF::EM_VE:
1495ffd83dbSDimitry Andric     switch (Type) {
1505ffd83dbSDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/VE.def"
1515ffd83dbSDimitry Andric     default:
1525ffd83dbSDimitry Andric       break;
1535ffd83dbSDimitry Andric     }
1545ffd83dbSDimitry Andric     break;
155*e8d8bef9SDimitry Andric   case ELF::EM_CSKY:
156*e8d8bef9SDimitry Andric     switch (Type) {
157*e8d8bef9SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/CSKY.def"
158*e8d8bef9SDimitry Andric     default:
159*e8d8bef9SDimitry Andric       break;
160*e8d8bef9SDimitry Andric     }
161*e8d8bef9SDimitry Andric     break;
1620b57cec5SDimitry Andric   default:
1630b57cec5SDimitry Andric     break;
1640b57cec5SDimitry Andric   }
1650b57cec5SDimitry Andric   return "Unknown";
1660b57cec5SDimitry Andric }
1670b57cec5SDimitry Andric 
1680b57cec5SDimitry Andric #undef ELF_RELOC
1690b57cec5SDimitry Andric 
1700b57cec5SDimitry Andric uint32_t llvm::object::getELFRelativeRelocationType(uint32_t Machine) {
1710b57cec5SDimitry Andric   switch (Machine) {
1720b57cec5SDimitry Andric   case ELF::EM_X86_64:
1730b57cec5SDimitry Andric     return ELF::R_X86_64_RELATIVE;
1740b57cec5SDimitry Andric   case ELF::EM_386:
1750b57cec5SDimitry Andric   case ELF::EM_IAMCU:
1760b57cec5SDimitry Andric     return ELF::R_386_RELATIVE;
1770b57cec5SDimitry Andric   case ELF::EM_MIPS:
1780b57cec5SDimitry Andric     break;
1790b57cec5SDimitry Andric   case ELF::EM_AARCH64:
1800b57cec5SDimitry Andric     return ELF::R_AARCH64_RELATIVE;
1810b57cec5SDimitry Andric   case ELF::EM_ARM:
1820b57cec5SDimitry Andric     return ELF::R_ARM_RELATIVE;
1830b57cec5SDimitry Andric   case ELF::EM_ARC_COMPACT:
1840b57cec5SDimitry Andric   case ELF::EM_ARC_COMPACT2:
1850b57cec5SDimitry Andric     return ELF::R_ARC_RELATIVE;
1860b57cec5SDimitry Andric   case ELF::EM_AVR:
1870b57cec5SDimitry Andric     break;
1880b57cec5SDimitry Andric   case ELF::EM_HEXAGON:
1890b57cec5SDimitry Andric     return ELF::R_HEX_RELATIVE;
1900b57cec5SDimitry Andric   case ELF::EM_LANAI:
1910b57cec5SDimitry Andric     break;
1920b57cec5SDimitry Andric   case ELF::EM_PPC:
1930b57cec5SDimitry Andric     break;
1940b57cec5SDimitry Andric   case ELF::EM_PPC64:
1950b57cec5SDimitry Andric     return ELF::R_PPC64_RELATIVE;
1960b57cec5SDimitry Andric   case ELF::EM_RISCV:
1970b57cec5SDimitry Andric     return ELF::R_RISCV_RELATIVE;
1980b57cec5SDimitry Andric   case ELF::EM_S390:
1990b57cec5SDimitry Andric     return ELF::R_390_RELATIVE;
2000b57cec5SDimitry Andric   case ELF::EM_SPARC:
2010b57cec5SDimitry Andric   case ELF::EM_SPARC32PLUS:
2020b57cec5SDimitry Andric   case ELF::EM_SPARCV9:
2030b57cec5SDimitry Andric     return ELF::R_SPARC_RELATIVE;
204*e8d8bef9SDimitry Andric   case ELF::EM_CSKY:
205*e8d8bef9SDimitry Andric     return ELF::R_CKCORE_RELATIVE;
2060b57cec5SDimitry Andric   case ELF::EM_AMDGPU:
2070b57cec5SDimitry Andric     break;
2080b57cec5SDimitry Andric   case ELF::EM_BPF:
2090b57cec5SDimitry Andric     break;
2100b57cec5SDimitry Andric   default:
2110b57cec5SDimitry Andric     break;
2120b57cec5SDimitry Andric   }
2130b57cec5SDimitry Andric   return 0;
2140b57cec5SDimitry Andric }
2150b57cec5SDimitry Andric 
2160b57cec5SDimitry Andric StringRef llvm::object::getELFSectionTypeName(uint32_t Machine, unsigned Type) {
2170b57cec5SDimitry Andric   switch (Machine) {
2180b57cec5SDimitry Andric   case ELF::EM_ARM:
2190b57cec5SDimitry Andric     switch (Type) {
2200b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_ARM_EXIDX);
2210b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_ARM_PREEMPTMAP);
2220b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_ARM_ATTRIBUTES);
2230b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_ARM_DEBUGOVERLAY);
2240b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_ARM_OVERLAYSECTION);
2250b57cec5SDimitry Andric     }
2260b57cec5SDimitry Andric     break;
2270b57cec5SDimitry Andric   case ELF::EM_HEXAGON:
2280b57cec5SDimitry Andric     switch (Type) { STRINGIFY_ENUM_CASE(ELF, SHT_HEX_ORDERED); }
2290b57cec5SDimitry Andric     break;
2300b57cec5SDimitry Andric   case ELF::EM_X86_64:
2310b57cec5SDimitry Andric     switch (Type) { STRINGIFY_ENUM_CASE(ELF, SHT_X86_64_UNWIND); }
2320b57cec5SDimitry Andric     break;
2330b57cec5SDimitry Andric   case ELF::EM_MIPS:
2340b57cec5SDimitry Andric   case ELF::EM_MIPS_RS3_LE:
2350b57cec5SDimitry Andric     switch (Type) {
2360b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_REGINFO);
2370b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_OPTIONS);
2380b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_DWARF);
2390b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_ABIFLAGS);
2400b57cec5SDimitry Andric     }
2410b57cec5SDimitry Andric     break;
2425ffd83dbSDimitry Andric   case ELF::EM_RISCV:
2435ffd83dbSDimitry Andric     switch (Type) { STRINGIFY_ENUM_CASE(ELF, SHT_RISCV_ATTRIBUTES); }
2445ffd83dbSDimitry Andric     break;
2450b57cec5SDimitry Andric   default:
2460b57cec5SDimitry Andric     break;
2470b57cec5SDimitry Andric   }
2480b57cec5SDimitry Andric 
2490b57cec5SDimitry Andric   switch (Type) {
2500b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_NULL);
2510b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_PROGBITS);
2520b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_SYMTAB);
2530b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_STRTAB);
2540b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_RELA);
2550b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_HASH);
2560b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_DYNAMIC);
2570b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_NOTE);
2580b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_NOBITS);
2590b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_REL);
2600b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_SHLIB);
2610b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_DYNSYM);
2620b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_INIT_ARRAY);
2630b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_FINI_ARRAY);
2640b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_PREINIT_ARRAY);
2650b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GROUP);
2660b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_SYMTAB_SHNDX);
2670b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_RELR);
2680b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_ANDROID_REL);
2690b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_ANDROID_RELA);
2700b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_ANDROID_RELR);
2710b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_ODRTAB);
2720b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_LINKER_OPTIONS);
2730b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_CALL_GRAPH_PROFILE);
2740b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_ADDRSIG);
2750b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_DEPENDENT_LIBRARIES);
2760b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_SYMPART);
2778bcb0991SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_PART_EHDR);
2788bcb0991SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_PART_PHDR);
279*e8d8bef9SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_BB_ADDR_MAP);
2800b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GNU_ATTRIBUTES);
2810b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GNU_HASH);
2820b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GNU_verdef);
2830b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GNU_verneed);
2840b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GNU_versym);
2850b57cec5SDimitry Andric   default:
2860b57cec5SDimitry Andric     return "Unknown";
2870b57cec5SDimitry Andric   }
2880b57cec5SDimitry Andric }
2890b57cec5SDimitry Andric 
2900b57cec5SDimitry Andric template <class ELFT>
291*e8d8bef9SDimitry Andric std::vector<typename ELFT::Rel>
2920b57cec5SDimitry Andric ELFFile<ELFT>::decode_relrs(Elf_Relr_Range relrs) const {
2930b57cec5SDimitry Andric   // This function decodes the contents of an SHT_RELR packed relocation
2940b57cec5SDimitry Andric   // section.
2950b57cec5SDimitry Andric   //
2960b57cec5SDimitry Andric   // Proposal for adding SHT_RELR sections to generic-abi is here:
2970b57cec5SDimitry Andric   //   https://groups.google.com/forum/#!topic/generic-abi/bX460iggiKg
2980b57cec5SDimitry Andric   //
2990b57cec5SDimitry Andric   // The encoded sequence of Elf64_Relr entries in a SHT_RELR section looks
3000b57cec5SDimitry Andric   // like [ AAAAAAAA BBBBBBB1 BBBBBBB1 ... AAAAAAAA BBBBBB1 ... ]
3010b57cec5SDimitry Andric   //
3020b57cec5SDimitry Andric   // i.e. start with an address, followed by any number of bitmaps. The address
3030b57cec5SDimitry Andric   // entry encodes 1 relocation. The subsequent bitmap entries encode up to 63
3040b57cec5SDimitry Andric   // relocations each, at subsequent offsets following the last address entry.
3050b57cec5SDimitry Andric   //
3060b57cec5SDimitry Andric   // The bitmap entries must have 1 in the least significant bit. The assumption
3070b57cec5SDimitry Andric   // here is that an address cannot have 1 in lsb. Odd addresses are not
3080b57cec5SDimitry Andric   // supported.
3090b57cec5SDimitry Andric   //
3100b57cec5SDimitry Andric   // Excluding the least significant bit in the bitmap, each non-zero bit in
3110b57cec5SDimitry Andric   // the bitmap represents a relocation to be applied to a corresponding machine
3120b57cec5SDimitry Andric   // word that follows the base address word. The second least significant bit
3130b57cec5SDimitry Andric   // represents the machine word immediately following the initial address, and
3140b57cec5SDimitry Andric   // each bit that follows represents the next word, in linear order. As such,
3150b57cec5SDimitry Andric   // a single bitmap can encode up to 31 relocations in a 32-bit object, and
3160b57cec5SDimitry Andric   // 63 relocations in a 64-bit object.
3170b57cec5SDimitry Andric   //
3180b57cec5SDimitry Andric   // This encoding has a couple of interesting properties:
3190b57cec5SDimitry Andric   // 1. Looking at any entry, it is clear whether it's an address or a bitmap:
3200b57cec5SDimitry Andric   //    even means address, odd means bitmap.
3210b57cec5SDimitry Andric   // 2. Just a simple list of addresses is a valid encoding.
3220b57cec5SDimitry Andric 
323*e8d8bef9SDimitry Andric   Elf_Rel Rel;
324*e8d8bef9SDimitry Andric   Rel.r_info = 0;
325*e8d8bef9SDimitry Andric   Rel.setType(getRelativeRelocationType(), false);
326*e8d8bef9SDimitry Andric   std::vector<Elf_Rel> Relocs;
3270b57cec5SDimitry Andric 
3280b57cec5SDimitry Andric   // Word type: uint32_t for Elf32, and uint64_t for Elf64.
3290b57cec5SDimitry Andric   typedef typename ELFT::uint Word;
3300b57cec5SDimitry Andric 
3310b57cec5SDimitry Andric   // Word size in number of bytes.
3320b57cec5SDimitry Andric   const size_t WordSize = sizeof(Word);
3330b57cec5SDimitry Andric 
3340b57cec5SDimitry Andric   // Number of bits used for the relocation offsets bitmap.
3350b57cec5SDimitry Andric   // These many relative relocations can be encoded in a single entry.
3360b57cec5SDimitry Andric   const size_t NBits = 8*WordSize - 1;
3370b57cec5SDimitry Andric 
3380b57cec5SDimitry Andric   Word Base = 0;
3390b57cec5SDimitry Andric   for (const Elf_Relr &R : relrs) {
3400b57cec5SDimitry Andric     Word Entry = R;
3410b57cec5SDimitry Andric     if ((Entry&1) == 0) {
3420b57cec5SDimitry Andric       // Even entry: encodes the offset for next relocation.
343*e8d8bef9SDimitry Andric       Rel.r_offset = Entry;
344*e8d8bef9SDimitry Andric       Relocs.push_back(Rel);
3450b57cec5SDimitry Andric       // Set base offset for subsequent bitmap entries.
3460b57cec5SDimitry Andric       Base = Entry + WordSize;
3470b57cec5SDimitry Andric       continue;
3480b57cec5SDimitry Andric     }
3490b57cec5SDimitry Andric 
3500b57cec5SDimitry Andric     // Odd entry: encodes bitmap for relocations starting at base.
3510b57cec5SDimitry Andric     Word Offset = Base;
3520b57cec5SDimitry Andric     while (Entry != 0) {
3530b57cec5SDimitry Andric       Entry >>= 1;
3540b57cec5SDimitry Andric       if ((Entry&1) != 0) {
355*e8d8bef9SDimitry Andric         Rel.r_offset = Offset;
356*e8d8bef9SDimitry Andric         Relocs.push_back(Rel);
3570b57cec5SDimitry Andric       }
3580b57cec5SDimitry Andric       Offset += WordSize;
3590b57cec5SDimitry Andric     }
3600b57cec5SDimitry Andric 
3610b57cec5SDimitry Andric     // Advance base offset by NBits words.
3620b57cec5SDimitry Andric     Base += NBits * WordSize;
3630b57cec5SDimitry Andric   }
3640b57cec5SDimitry Andric 
3650b57cec5SDimitry Andric   return Relocs;
3660b57cec5SDimitry Andric }
3670b57cec5SDimitry Andric 
3680b57cec5SDimitry Andric template <class ELFT>
3690b57cec5SDimitry Andric Expected<std::vector<typename ELFT::Rela>>
370*e8d8bef9SDimitry Andric ELFFile<ELFT>::android_relas(const Elf_Shdr &Sec) const {
3710b57cec5SDimitry Andric   // This function reads relocations in Android's packed relocation format,
3720b57cec5SDimitry Andric   // which is based on SLEB128 and delta encoding.
3730b57cec5SDimitry Andric   Expected<ArrayRef<uint8_t>> ContentsOrErr = getSectionContents(Sec);
3740b57cec5SDimitry Andric   if (!ContentsOrErr)
3750b57cec5SDimitry Andric     return ContentsOrErr.takeError();
3760b57cec5SDimitry Andric   const uint8_t *Cur = ContentsOrErr->begin();
3770b57cec5SDimitry Andric   const uint8_t *End = ContentsOrErr->end();
3780b57cec5SDimitry Andric   if (ContentsOrErr->size() < 4 || Cur[0] != 'A' || Cur[1] != 'P' ||
3790b57cec5SDimitry Andric       Cur[2] != 'S' || Cur[3] != '2')
3800b57cec5SDimitry Andric     return createError("invalid packed relocation header");
3810b57cec5SDimitry Andric   Cur += 4;
3820b57cec5SDimitry Andric 
3830b57cec5SDimitry Andric   const char *ErrStr = nullptr;
3840b57cec5SDimitry Andric   auto ReadSLEB = [&]() -> int64_t {
3850b57cec5SDimitry Andric     if (ErrStr)
3860b57cec5SDimitry Andric       return 0;
3870b57cec5SDimitry Andric     unsigned Len;
3880b57cec5SDimitry Andric     int64_t Result = decodeSLEB128(Cur, &Len, End, &ErrStr);
3890b57cec5SDimitry Andric     Cur += Len;
3900b57cec5SDimitry Andric     return Result;
3910b57cec5SDimitry Andric   };
3920b57cec5SDimitry Andric 
3930b57cec5SDimitry Andric   uint64_t NumRelocs = ReadSLEB();
3940b57cec5SDimitry Andric   uint64_t Offset = ReadSLEB();
3950b57cec5SDimitry Andric   uint64_t Addend = 0;
3960b57cec5SDimitry Andric 
3970b57cec5SDimitry Andric   if (ErrStr)
3980b57cec5SDimitry Andric     return createError(ErrStr);
3990b57cec5SDimitry Andric 
4000b57cec5SDimitry Andric   std::vector<Elf_Rela> Relocs;
4010b57cec5SDimitry Andric   Relocs.reserve(NumRelocs);
4020b57cec5SDimitry Andric   while (NumRelocs) {
4030b57cec5SDimitry Andric     uint64_t NumRelocsInGroup = ReadSLEB();
4040b57cec5SDimitry Andric     if (NumRelocsInGroup > NumRelocs)
4050b57cec5SDimitry Andric       return createError("relocation group unexpectedly large");
4060b57cec5SDimitry Andric     NumRelocs -= NumRelocsInGroup;
4070b57cec5SDimitry Andric 
4080b57cec5SDimitry Andric     uint64_t GroupFlags = ReadSLEB();
4090b57cec5SDimitry Andric     bool GroupedByInfo = GroupFlags & ELF::RELOCATION_GROUPED_BY_INFO_FLAG;
4100b57cec5SDimitry Andric     bool GroupedByOffsetDelta = GroupFlags & ELF::RELOCATION_GROUPED_BY_OFFSET_DELTA_FLAG;
4110b57cec5SDimitry Andric     bool GroupedByAddend = GroupFlags & ELF::RELOCATION_GROUPED_BY_ADDEND_FLAG;
4120b57cec5SDimitry Andric     bool GroupHasAddend = GroupFlags & ELF::RELOCATION_GROUP_HAS_ADDEND_FLAG;
4130b57cec5SDimitry Andric 
4140b57cec5SDimitry Andric     uint64_t GroupOffsetDelta;
4150b57cec5SDimitry Andric     if (GroupedByOffsetDelta)
4160b57cec5SDimitry Andric       GroupOffsetDelta = ReadSLEB();
4170b57cec5SDimitry Andric 
4180b57cec5SDimitry Andric     uint64_t GroupRInfo;
4190b57cec5SDimitry Andric     if (GroupedByInfo)
4200b57cec5SDimitry Andric       GroupRInfo = ReadSLEB();
4210b57cec5SDimitry Andric 
4220b57cec5SDimitry Andric     if (GroupedByAddend && GroupHasAddend)
4230b57cec5SDimitry Andric       Addend += ReadSLEB();
4240b57cec5SDimitry Andric 
4250b57cec5SDimitry Andric     if (!GroupHasAddend)
4260b57cec5SDimitry Andric       Addend = 0;
4270b57cec5SDimitry Andric 
4280b57cec5SDimitry Andric     for (uint64_t I = 0; I != NumRelocsInGroup; ++I) {
4290b57cec5SDimitry Andric       Elf_Rela R;
4300b57cec5SDimitry Andric       Offset += GroupedByOffsetDelta ? GroupOffsetDelta : ReadSLEB();
4310b57cec5SDimitry Andric       R.r_offset = Offset;
4320b57cec5SDimitry Andric       R.r_info = GroupedByInfo ? GroupRInfo : ReadSLEB();
4330b57cec5SDimitry Andric       if (GroupHasAddend && !GroupedByAddend)
4340b57cec5SDimitry Andric         Addend += ReadSLEB();
4350b57cec5SDimitry Andric       R.r_addend = Addend;
4360b57cec5SDimitry Andric       Relocs.push_back(R);
4370b57cec5SDimitry Andric 
4380b57cec5SDimitry Andric       if (ErrStr)
4390b57cec5SDimitry Andric         return createError(ErrStr);
4400b57cec5SDimitry Andric     }
4410b57cec5SDimitry Andric 
4420b57cec5SDimitry Andric     if (ErrStr)
4430b57cec5SDimitry Andric       return createError(ErrStr);
4440b57cec5SDimitry Andric   }
4450b57cec5SDimitry Andric 
4460b57cec5SDimitry Andric   return Relocs;
4470b57cec5SDimitry Andric }
4480b57cec5SDimitry Andric 
4490b57cec5SDimitry Andric template <class ELFT>
4500b57cec5SDimitry Andric std::string ELFFile<ELFT>::getDynamicTagAsString(unsigned Arch,
4510b57cec5SDimitry Andric                                                  uint64_t Type) const {
4520b57cec5SDimitry Andric #define DYNAMIC_STRINGIFY_ENUM(tag, value)                                     \
4530b57cec5SDimitry Andric   case value:                                                                  \
4540b57cec5SDimitry Andric     return #tag;
4550b57cec5SDimitry Andric 
4560b57cec5SDimitry Andric #define DYNAMIC_TAG(n, v)
4570b57cec5SDimitry Andric   switch (Arch) {
4580b57cec5SDimitry Andric   case ELF::EM_AARCH64:
4590b57cec5SDimitry Andric     switch (Type) {
4600b57cec5SDimitry Andric #define AARCH64_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value)
4610b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def"
4620b57cec5SDimitry Andric #undef AARCH64_DYNAMIC_TAG
4630b57cec5SDimitry Andric     }
4640b57cec5SDimitry Andric     break;
4650b57cec5SDimitry Andric 
4660b57cec5SDimitry Andric   case ELF::EM_HEXAGON:
4670b57cec5SDimitry Andric     switch (Type) {
4680b57cec5SDimitry Andric #define HEXAGON_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value)
4690b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def"
4700b57cec5SDimitry Andric #undef HEXAGON_DYNAMIC_TAG
4710b57cec5SDimitry Andric     }
4720b57cec5SDimitry Andric     break;
4730b57cec5SDimitry Andric 
4740b57cec5SDimitry Andric   case ELF::EM_MIPS:
4750b57cec5SDimitry Andric     switch (Type) {
4760b57cec5SDimitry Andric #define MIPS_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value)
4770b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def"
4780b57cec5SDimitry Andric #undef MIPS_DYNAMIC_TAG
4790b57cec5SDimitry Andric     }
4800b57cec5SDimitry Andric     break;
4810b57cec5SDimitry Andric 
4820b57cec5SDimitry Andric   case ELF::EM_PPC64:
4830b57cec5SDimitry Andric     switch (Type) {
4840b57cec5SDimitry Andric #define PPC64_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value)
4850b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def"
4860b57cec5SDimitry Andric #undef PPC64_DYNAMIC_TAG
4870b57cec5SDimitry Andric     }
4880b57cec5SDimitry Andric     break;
4890b57cec5SDimitry Andric   }
4900b57cec5SDimitry Andric #undef DYNAMIC_TAG
4910b57cec5SDimitry Andric   switch (Type) {
4920b57cec5SDimitry Andric // Now handle all dynamic tags except the architecture specific ones
4930b57cec5SDimitry Andric #define AARCH64_DYNAMIC_TAG(name, value)
4940b57cec5SDimitry Andric #define MIPS_DYNAMIC_TAG(name, value)
4950b57cec5SDimitry Andric #define HEXAGON_DYNAMIC_TAG(name, value)
4960b57cec5SDimitry Andric #define PPC64_DYNAMIC_TAG(name, value)
4970b57cec5SDimitry Andric // Also ignore marker tags such as DT_HIOS (maps to DT_VERNEEDNUM), etc.
4980b57cec5SDimitry Andric #define DYNAMIC_TAG_MARKER(name, value)
499480093f4SDimitry Andric #define DYNAMIC_TAG(name, value) case value: return #name;
5000b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def"
5010b57cec5SDimitry Andric #undef DYNAMIC_TAG
5020b57cec5SDimitry Andric #undef AARCH64_DYNAMIC_TAG
5030b57cec5SDimitry Andric #undef MIPS_DYNAMIC_TAG
5040b57cec5SDimitry Andric #undef HEXAGON_DYNAMIC_TAG
5050b57cec5SDimitry Andric #undef PPC64_DYNAMIC_TAG
5060b57cec5SDimitry Andric #undef DYNAMIC_TAG_MARKER
5070b57cec5SDimitry Andric #undef DYNAMIC_STRINGIFY_ENUM
5080b57cec5SDimitry Andric   default:
5090b57cec5SDimitry Andric     return "<unknown:>0x" + utohexstr(Type, true);
5100b57cec5SDimitry Andric   }
5110b57cec5SDimitry Andric }
5120b57cec5SDimitry Andric 
5130b57cec5SDimitry Andric template <class ELFT>
5140b57cec5SDimitry Andric std::string ELFFile<ELFT>::getDynamicTagAsString(uint64_t Type) const {
515*e8d8bef9SDimitry Andric   return getDynamicTagAsString(getHeader().e_machine, Type);
5160b57cec5SDimitry Andric }
5170b57cec5SDimitry Andric 
5180b57cec5SDimitry Andric template <class ELFT>
5190b57cec5SDimitry Andric Expected<typename ELFT::DynRange> ELFFile<ELFT>::dynamicEntries() const {
5200b57cec5SDimitry Andric   ArrayRef<Elf_Dyn> Dyn;
5210b57cec5SDimitry Andric 
5220b57cec5SDimitry Andric   auto ProgramHeadersOrError = program_headers();
5230b57cec5SDimitry Andric   if (!ProgramHeadersOrError)
5240b57cec5SDimitry Andric     return ProgramHeadersOrError.takeError();
5250b57cec5SDimitry Andric 
5260b57cec5SDimitry Andric   for (const Elf_Phdr &Phdr : *ProgramHeadersOrError) {
5270b57cec5SDimitry Andric     if (Phdr.p_type == ELF::PT_DYNAMIC) {
5280b57cec5SDimitry Andric       Dyn = makeArrayRef(
5290b57cec5SDimitry Andric           reinterpret_cast<const Elf_Dyn *>(base() + Phdr.p_offset),
5300b57cec5SDimitry Andric           Phdr.p_filesz / sizeof(Elf_Dyn));
5310b57cec5SDimitry Andric       break;
5320b57cec5SDimitry Andric     }
5330b57cec5SDimitry Andric   }
5340b57cec5SDimitry Andric 
5350b57cec5SDimitry Andric   // If we can't find the dynamic section in the program headers, we just fall
5360b57cec5SDimitry Andric   // back on the sections.
5370b57cec5SDimitry Andric   if (Dyn.empty()) {
5380b57cec5SDimitry Andric     auto SectionsOrError = sections();
5390b57cec5SDimitry Andric     if (!SectionsOrError)
5400b57cec5SDimitry Andric       return SectionsOrError.takeError();
5410b57cec5SDimitry Andric 
5420b57cec5SDimitry Andric     for (const Elf_Shdr &Sec : *SectionsOrError) {
5430b57cec5SDimitry Andric       if (Sec.sh_type == ELF::SHT_DYNAMIC) {
5440b57cec5SDimitry Andric         Expected<ArrayRef<Elf_Dyn>> DynOrError =
545*e8d8bef9SDimitry Andric             getSectionContentsAsArray<Elf_Dyn>(Sec);
5460b57cec5SDimitry Andric         if (!DynOrError)
5470b57cec5SDimitry Andric           return DynOrError.takeError();
5480b57cec5SDimitry Andric         Dyn = *DynOrError;
5490b57cec5SDimitry Andric         break;
5500b57cec5SDimitry Andric       }
5510b57cec5SDimitry Andric     }
5520b57cec5SDimitry Andric 
5530b57cec5SDimitry Andric     if (!Dyn.data())
5540b57cec5SDimitry Andric       return ArrayRef<Elf_Dyn>();
5550b57cec5SDimitry Andric   }
5560b57cec5SDimitry Andric 
5570b57cec5SDimitry Andric   if (Dyn.empty())
5580b57cec5SDimitry Andric     // TODO: this error is untested.
5590b57cec5SDimitry Andric     return createError("invalid empty dynamic section");
5600b57cec5SDimitry Andric 
5610b57cec5SDimitry Andric   if (Dyn.back().d_tag != ELF::DT_NULL)
5620b57cec5SDimitry Andric     // TODO: this error is untested.
5630b57cec5SDimitry Andric     return createError("dynamic sections must be DT_NULL terminated");
5640b57cec5SDimitry Andric 
5650b57cec5SDimitry Andric   return Dyn;
5660b57cec5SDimitry Andric }
5670b57cec5SDimitry Andric 
5680b57cec5SDimitry Andric template <class ELFT>
569*e8d8bef9SDimitry Andric Expected<const uint8_t *>
570*e8d8bef9SDimitry Andric ELFFile<ELFT>::toMappedAddr(uint64_t VAddr, WarningHandler WarnHandler) const {
5710b57cec5SDimitry Andric   auto ProgramHeadersOrError = program_headers();
5720b57cec5SDimitry Andric   if (!ProgramHeadersOrError)
5730b57cec5SDimitry Andric     return ProgramHeadersOrError.takeError();
5740b57cec5SDimitry Andric 
5750b57cec5SDimitry Andric   llvm::SmallVector<Elf_Phdr *, 4> LoadSegments;
5760b57cec5SDimitry Andric 
5770b57cec5SDimitry Andric   for (const Elf_Phdr &Phdr : *ProgramHeadersOrError)
5780b57cec5SDimitry Andric     if (Phdr.p_type == ELF::PT_LOAD)
5790b57cec5SDimitry Andric       LoadSegments.push_back(const_cast<Elf_Phdr *>(&Phdr));
5800b57cec5SDimitry Andric 
581*e8d8bef9SDimitry Andric   auto SortPred = [](const Elf_Phdr_Impl<ELFT> *A,
582*e8d8bef9SDimitry Andric                      const Elf_Phdr_Impl<ELFT> *B) {
583*e8d8bef9SDimitry Andric     return A->p_vaddr < B->p_vaddr;
584*e8d8bef9SDimitry Andric   };
585*e8d8bef9SDimitry Andric   if (!llvm::is_sorted(LoadSegments, SortPred)) {
586*e8d8bef9SDimitry Andric     if (Error E =
587*e8d8bef9SDimitry Andric             WarnHandler("loadable segments are unsorted by virtual address"))
588*e8d8bef9SDimitry Andric       return std::move(E);
589*e8d8bef9SDimitry Andric     llvm::stable_sort(LoadSegments, SortPred);
590*e8d8bef9SDimitry Andric   }
591*e8d8bef9SDimitry Andric 
592*e8d8bef9SDimitry Andric   const Elf_Phdr *const *I = llvm::upper_bound(
593*e8d8bef9SDimitry Andric       LoadSegments, VAddr, [](uint64_t VAddr, const Elf_Phdr_Impl<ELFT> *Phdr) {
5940b57cec5SDimitry Andric         return VAddr < Phdr->p_vaddr;
5950b57cec5SDimitry Andric       });
5960b57cec5SDimitry Andric 
5970b57cec5SDimitry Andric   if (I == LoadSegments.begin())
5980b57cec5SDimitry Andric     return createError("virtual address is not in any segment: 0x" +
5990b57cec5SDimitry Andric                        Twine::utohexstr(VAddr));
6000b57cec5SDimitry Andric   --I;
6010b57cec5SDimitry Andric   const Elf_Phdr &Phdr = **I;
6020b57cec5SDimitry Andric   uint64_t Delta = VAddr - Phdr.p_vaddr;
6030b57cec5SDimitry Andric   if (Delta >= Phdr.p_filesz)
6040b57cec5SDimitry Andric     return createError("virtual address is not in any segment: 0x" +
6050b57cec5SDimitry Andric                        Twine::utohexstr(VAddr));
6065ffd83dbSDimitry Andric 
6075ffd83dbSDimitry Andric   uint64_t Offset = Phdr.p_offset + Delta;
6085ffd83dbSDimitry Andric   if (Offset >= getBufSize())
6095ffd83dbSDimitry Andric     return createError("can't map virtual address 0x" +
6105ffd83dbSDimitry Andric                        Twine::utohexstr(VAddr) + " to the segment with index " +
6115ffd83dbSDimitry Andric                        Twine(&Phdr - (*ProgramHeadersOrError).data() + 1) +
6125ffd83dbSDimitry Andric                        ": the segment ends at 0x" +
6135ffd83dbSDimitry Andric                        Twine::utohexstr(Phdr.p_offset + Phdr.p_filesz) +
6145ffd83dbSDimitry Andric                        ", which is greater than the file size (0x" +
6155ffd83dbSDimitry Andric                        Twine::utohexstr(getBufSize()) + ")");
6165ffd83dbSDimitry Andric 
6175ffd83dbSDimitry Andric   return base() + Offset;
6180b57cec5SDimitry Andric }
6190b57cec5SDimitry Andric 
6200b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF32LE>;
6210b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF32BE>;
6220b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF64LE>;
6230b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF64BE>;
624