xref: /freebsd/contrib/llvm-project/llvm/lib/Object/ELF.cpp (revision 0b57cec536236d46e3dba9bd041533462f33dbb7)
1*0b57cec5SDimitry Andric //===- ELF.cpp - ELF object file implementation ---------------------------===//
2*0b57cec5SDimitry Andric //
3*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
5*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6*0b57cec5SDimitry Andric //
7*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
8*0b57cec5SDimitry Andric 
9*0b57cec5SDimitry Andric #include "llvm/Object/ELF.h"
10*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELF.h"
11*0b57cec5SDimitry Andric #include "llvm/Support/LEB128.h"
12*0b57cec5SDimitry Andric 
13*0b57cec5SDimitry Andric using namespace llvm;
14*0b57cec5SDimitry Andric using namespace object;
15*0b57cec5SDimitry Andric 
16*0b57cec5SDimitry Andric #define STRINGIFY_ENUM_CASE(ns, name)                                          \
17*0b57cec5SDimitry Andric   case ns::name:                                                               \
18*0b57cec5SDimitry Andric     return #name;
19*0b57cec5SDimitry Andric 
20*0b57cec5SDimitry Andric #define ELF_RELOC(name, value) STRINGIFY_ENUM_CASE(ELF, name)
21*0b57cec5SDimitry Andric 
22*0b57cec5SDimitry Andric StringRef llvm::object::getELFRelocationTypeName(uint32_t Machine,
23*0b57cec5SDimitry Andric                                                  uint32_t Type) {
24*0b57cec5SDimitry Andric   switch (Machine) {
25*0b57cec5SDimitry Andric   case ELF::EM_X86_64:
26*0b57cec5SDimitry Andric     switch (Type) {
27*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/x86_64.def"
28*0b57cec5SDimitry Andric     default:
29*0b57cec5SDimitry Andric       break;
30*0b57cec5SDimitry Andric     }
31*0b57cec5SDimitry Andric     break;
32*0b57cec5SDimitry Andric   case ELF::EM_386:
33*0b57cec5SDimitry Andric   case ELF::EM_IAMCU:
34*0b57cec5SDimitry Andric     switch (Type) {
35*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/i386.def"
36*0b57cec5SDimitry Andric     default:
37*0b57cec5SDimitry Andric       break;
38*0b57cec5SDimitry Andric     }
39*0b57cec5SDimitry Andric     break;
40*0b57cec5SDimitry Andric   case ELF::EM_MIPS:
41*0b57cec5SDimitry Andric     switch (Type) {
42*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Mips.def"
43*0b57cec5SDimitry Andric     default:
44*0b57cec5SDimitry Andric       break;
45*0b57cec5SDimitry Andric     }
46*0b57cec5SDimitry Andric     break;
47*0b57cec5SDimitry Andric   case ELF::EM_AARCH64:
48*0b57cec5SDimitry Andric     switch (Type) {
49*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/AArch64.def"
50*0b57cec5SDimitry Andric     default:
51*0b57cec5SDimitry Andric       break;
52*0b57cec5SDimitry Andric     }
53*0b57cec5SDimitry Andric     break;
54*0b57cec5SDimitry Andric   case ELF::EM_ARM:
55*0b57cec5SDimitry Andric     switch (Type) {
56*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/ARM.def"
57*0b57cec5SDimitry Andric     default:
58*0b57cec5SDimitry Andric       break;
59*0b57cec5SDimitry Andric     }
60*0b57cec5SDimitry Andric     break;
61*0b57cec5SDimitry Andric   case ELF::EM_ARC_COMPACT:
62*0b57cec5SDimitry Andric   case ELF::EM_ARC_COMPACT2:
63*0b57cec5SDimitry Andric     switch (Type) {
64*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/ARC.def"
65*0b57cec5SDimitry Andric     default:
66*0b57cec5SDimitry Andric       break;
67*0b57cec5SDimitry Andric     }
68*0b57cec5SDimitry Andric     break;
69*0b57cec5SDimitry Andric   case ELF::EM_AVR:
70*0b57cec5SDimitry Andric     switch (Type) {
71*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/AVR.def"
72*0b57cec5SDimitry Andric     default:
73*0b57cec5SDimitry Andric       break;
74*0b57cec5SDimitry Andric     }
75*0b57cec5SDimitry Andric     break;
76*0b57cec5SDimitry Andric   case ELF::EM_HEXAGON:
77*0b57cec5SDimitry Andric     switch (Type) {
78*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Hexagon.def"
79*0b57cec5SDimitry Andric     default:
80*0b57cec5SDimitry Andric       break;
81*0b57cec5SDimitry Andric     }
82*0b57cec5SDimitry Andric     break;
83*0b57cec5SDimitry Andric   case ELF::EM_LANAI:
84*0b57cec5SDimitry Andric     switch (Type) {
85*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Lanai.def"
86*0b57cec5SDimitry Andric     default:
87*0b57cec5SDimitry Andric       break;
88*0b57cec5SDimitry Andric     }
89*0b57cec5SDimitry Andric     break;
90*0b57cec5SDimitry Andric   case ELF::EM_PPC:
91*0b57cec5SDimitry Andric     switch (Type) {
92*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/PowerPC.def"
93*0b57cec5SDimitry Andric     default:
94*0b57cec5SDimitry Andric       break;
95*0b57cec5SDimitry Andric     }
96*0b57cec5SDimitry Andric     break;
97*0b57cec5SDimitry Andric   case ELF::EM_PPC64:
98*0b57cec5SDimitry Andric     switch (Type) {
99*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/PowerPC64.def"
100*0b57cec5SDimitry Andric     default:
101*0b57cec5SDimitry Andric       break;
102*0b57cec5SDimitry Andric     }
103*0b57cec5SDimitry Andric     break;
104*0b57cec5SDimitry Andric   case ELF::EM_RISCV:
105*0b57cec5SDimitry Andric     switch (Type) {
106*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/RISCV.def"
107*0b57cec5SDimitry Andric     default:
108*0b57cec5SDimitry Andric       break;
109*0b57cec5SDimitry Andric     }
110*0b57cec5SDimitry Andric     break;
111*0b57cec5SDimitry Andric   case ELF::EM_S390:
112*0b57cec5SDimitry Andric     switch (Type) {
113*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/SystemZ.def"
114*0b57cec5SDimitry Andric     default:
115*0b57cec5SDimitry Andric       break;
116*0b57cec5SDimitry Andric     }
117*0b57cec5SDimitry Andric     break;
118*0b57cec5SDimitry Andric   case ELF::EM_SPARC:
119*0b57cec5SDimitry Andric   case ELF::EM_SPARC32PLUS:
120*0b57cec5SDimitry Andric   case ELF::EM_SPARCV9:
121*0b57cec5SDimitry Andric     switch (Type) {
122*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/Sparc.def"
123*0b57cec5SDimitry Andric     default:
124*0b57cec5SDimitry Andric       break;
125*0b57cec5SDimitry Andric     }
126*0b57cec5SDimitry Andric     break;
127*0b57cec5SDimitry Andric   case ELF::EM_AMDGPU:
128*0b57cec5SDimitry Andric     switch (Type) {
129*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/AMDGPU.def"
130*0b57cec5SDimitry Andric     default:
131*0b57cec5SDimitry Andric       break;
132*0b57cec5SDimitry Andric     }
133*0b57cec5SDimitry Andric     break;
134*0b57cec5SDimitry Andric   case ELF::EM_BPF:
135*0b57cec5SDimitry Andric     switch (Type) {
136*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/BPF.def"
137*0b57cec5SDimitry Andric     default:
138*0b57cec5SDimitry Andric       break;
139*0b57cec5SDimitry Andric     }
140*0b57cec5SDimitry Andric     break;
141*0b57cec5SDimitry Andric   case ELF::EM_MSP430:
142*0b57cec5SDimitry Andric     switch (Type) {
143*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/ELFRelocs/MSP430.def"
144*0b57cec5SDimitry Andric     default:
145*0b57cec5SDimitry Andric       break;
146*0b57cec5SDimitry Andric     }
147*0b57cec5SDimitry Andric     break;
148*0b57cec5SDimitry Andric   default:
149*0b57cec5SDimitry Andric     break;
150*0b57cec5SDimitry Andric   }
151*0b57cec5SDimitry Andric   return "Unknown";
152*0b57cec5SDimitry Andric }
153*0b57cec5SDimitry Andric 
154*0b57cec5SDimitry Andric #undef ELF_RELOC
155*0b57cec5SDimitry Andric 
156*0b57cec5SDimitry Andric uint32_t llvm::object::getELFRelativeRelocationType(uint32_t Machine) {
157*0b57cec5SDimitry Andric   switch (Machine) {
158*0b57cec5SDimitry Andric   case ELF::EM_X86_64:
159*0b57cec5SDimitry Andric     return ELF::R_X86_64_RELATIVE;
160*0b57cec5SDimitry Andric   case ELF::EM_386:
161*0b57cec5SDimitry Andric   case ELF::EM_IAMCU:
162*0b57cec5SDimitry Andric     return ELF::R_386_RELATIVE;
163*0b57cec5SDimitry Andric   case ELF::EM_MIPS:
164*0b57cec5SDimitry Andric     break;
165*0b57cec5SDimitry Andric   case ELF::EM_AARCH64:
166*0b57cec5SDimitry Andric     return ELF::R_AARCH64_RELATIVE;
167*0b57cec5SDimitry Andric   case ELF::EM_ARM:
168*0b57cec5SDimitry Andric     return ELF::R_ARM_RELATIVE;
169*0b57cec5SDimitry Andric   case ELF::EM_ARC_COMPACT:
170*0b57cec5SDimitry Andric   case ELF::EM_ARC_COMPACT2:
171*0b57cec5SDimitry Andric     return ELF::R_ARC_RELATIVE;
172*0b57cec5SDimitry Andric   case ELF::EM_AVR:
173*0b57cec5SDimitry Andric     break;
174*0b57cec5SDimitry Andric   case ELF::EM_HEXAGON:
175*0b57cec5SDimitry Andric     return ELF::R_HEX_RELATIVE;
176*0b57cec5SDimitry Andric   case ELF::EM_LANAI:
177*0b57cec5SDimitry Andric     break;
178*0b57cec5SDimitry Andric   case ELF::EM_PPC:
179*0b57cec5SDimitry Andric     break;
180*0b57cec5SDimitry Andric   case ELF::EM_PPC64:
181*0b57cec5SDimitry Andric     return ELF::R_PPC64_RELATIVE;
182*0b57cec5SDimitry Andric   case ELF::EM_RISCV:
183*0b57cec5SDimitry Andric     return ELF::R_RISCV_RELATIVE;
184*0b57cec5SDimitry Andric   case ELF::EM_S390:
185*0b57cec5SDimitry Andric     return ELF::R_390_RELATIVE;
186*0b57cec5SDimitry Andric   case ELF::EM_SPARC:
187*0b57cec5SDimitry Andric   case ELF::EM_SPARC32PLUS:
188*0b57cec5SDimitry Andric   case ELF::EM_SPARCV9:
189*0b57cec5SDimitry Andric     return ELF::R_SPARC_RELATIVE;
190*0b57cec5SDimitry Andric   case ELF::EM_AMDGPU:
191*0b57cec5SDimitry Andric     break;
192*0b57cec5SDimitry Andric   case ELF::EM_BPF:
193*0b57cec5SDimitry Andric     break;
194*0b57cec5SDimitry Andric   default:
195*0b57cec5SDimitry Andric     break;
196*0b57cec5SDimitry Andric   }
197*0b57cec5SDimitry Andric   return 0;
198*0b57cec5SDimitry Andric }
199*0b57cec5SDimitry Andric 
200*0b57cec5SDimitry Andric StringRef llvm::object::getELFSectionTypeName(uint32_t Machine, unsigned Type) {
201*0b57cec5SDimitry Andric   switch (Machine) {
202*0b57cec5SDimitry Andric   case ELF::EM_ARM:
203*0b57cec5SDimitry Andric     switch (Type) {
204*0b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_ARM_EXIDX);
205*0b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_ARM_PREEMPTMAP);
206*0b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_ARM_ATTRIBUTES);
207*0b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_ARM_DEBUGOVERLAY);
208*0b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_ARM_OVERLAYSECTION);
209*0b57cec5SDimitry Andric     }
210*0b57cec5SDimitry Andric     break;
211*0b57cec5SDimitry Andric   case ELF::EM_HEXAGON:
212*0b57cec5SDimitry Andric     switch (Type) { STRINGIFY_ENUM_CASE(ELF, SHT_HEX_ORDERED); }
213*0b57cec5SDimitry Andric     break;
214*0b57cec5SDimitry Andric   case ELF::EM_X86_64:
215*0b57cec5SDimitry Andric     switch (Type) { STRINGIFY_ENUM_CASE(ELF, SHT_X86_64_UNWIND); }
216*0b57cec5SDimitry Andric     break;
217*0b57cec5SDimitry Andric   case ELF::EM_MIPS:
218*0b57cec5SDimitry Andric   case ELF::EM_MIPS_RS3_LE:
219*0b57cec5SDimitry Andric     switch (Type) {
220*0b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_REGINFO);
221*0b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_OPTIONS);
222*0b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_DWARF);
223*0b57cec5SDimitry Andric       STRINGIFY_ENUM_CASE(ELF, SHT_MIPS_ABIFLAGS);
224*0b57cec5SDimitry Andric     }
225*0b57cec5SDimitry Andric     break;
226*0b57cec5SDimitry Andric   default:
227*0b57cec5SDimitry Andric     break;
228*0b57cec5SDimitry Andric   }
229*0b57cec5SDimitry Andric 
230*0b57cec5SDimitry Andric   switch (Type) {
231*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_NULL);
232*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_PROGBITS);
233*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_SYMTAB);
234*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_STRTAB);
235*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_RELA);
236*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_HASH);
237*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_DYNAMIC);
238*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_NOTE);
239*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_NOBITS);
240*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_REL);
241*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_SHLIB);
242*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_DYNSYM);
243*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_INIT_ARRAY);
244*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_FINI_ARRAY);
245*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_PREINIT_ARRAY);
246*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GROUP);
247*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_SYMTAB_SHNDX);
248*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_RELR);
249*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_ANDROID_REL);
250*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_ANDROID_RELA);
251*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_ANDROID_RELR);
252*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_ODRTAB);
253*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_LINKER_OPTIONS);
254*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_CALL_GRAPH_PROFILE);
255*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_ADDRSIG);
256*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_DEPENDENT_LIBRARIES);
257*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_LLVM_SYMPART);
258*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GNU_ATTRIBUTES);
259*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GNU_HASH);
260*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GNU_verdef);
261*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GNU_verneed);
262*0b57cec5SDimitry Andric     STRINGIFY_ENUM_CASE(ELF, SHT_GNU_versym);
263*0b57cec5SDimitry Andric   default:
264*0b57cec5SDimitry Andric     return "Unknown";
265*0b57cec5SDimitry Andric   }
266*0b57cec5SDimitry Andric }
267*0b57cec5SDimitry Andric 
268*0b57cec5SDimitry Andric template <class ELFT>
269*0b57cec5SDimitry Andric Expected<std::vector<typename ELFT::Rela>>
270*0b57cec5SDimitry Andric ELFFile<ELFT>::decode_relrs(Elf_Relr_Range relrs) const {
271*0b57cec5SDimitry Andric   // This function decodes the contents of an SHT_RELR packed relocation
272*0b57cec5SDimitry Andric   // section.
273*0b57cec5SDimitry Andric   //
274*0b57cec5SDimitry Andric   // Proposal for adding SHT_RELR sections to generic-abi is here:
275*0b57cec5SDimitry Andric   //   https://groups.google.com/forum/#!topic/generic-abi/bX460iggiKg
276*0b57cec5SDimitry Andric   //
277*0b57cec5SDimitry Andric   // The encoded sequence of Elf64_Relr entries in a SHT_RELR section looks
278*0b57cec5SDimitry Andric   // like [ AAAAAAAA BBBBBBB1 BBBBBBB1 ... AAAAAAAA BBBBBB1 ... ]
279*0b57cec5SDimitry Andric   //
280*0b57cec5SDimitry Andric   // i.e. start with an address, followed by any number of bitmaps. The address
281*0b57cec5SDimitry Andric   // entry encodes 1 relocation. The subsequent bitmap entries encode up to 63
282*0b57cec5SDimitry Andric   // relocations each, at subsequent offsets following the last address entry.
283*0b57cec5SDimitry Andric   //
284*0b57cec5SDimitry Andric   // The bitmap entries must have 1 in the least significant bit. The assumption
285*0b57cec5SDimitry Andric   // here is that an address cannot have 1 in lsb. Odd addresses are not
286*0b57cec5SDimitry Andric   // supported.
287*0b57cec5SDimitry Andric   //
288*0b57cec5SDimitry Andric   // Excluding the least significant bit in the bitmap, each non-zero bit in
289*0b57cec5SDimitry Andric   // the bitmap represents a relocation to be applied to a corresponding machine
290*0b57cec5SDimitry Andric   // word that follows the base address word. The second least significant bit
291*0b57cec5SDimitry Andric   // represents the machine word immediately following the initial address, and
292*0b57cec5SDimitry Andric   // each bit that follows represents the next word, in linear order. As such,
293*0b57cec5SDimitry Andric   // a single bitmap can encode up to 31 relocations in a 32-bit object, and
294*0b57cec5SDimitry Andric   // 63 relocations in a 64-bit object.
295*0b57cec5SDimitry Andric   //
296*0b57cec5SDimitry Andric   // This encoding has a couple of interesting properties:
297*0b57cec5SDimitry Andric   // 1. Looking at any entry, it is clear whether it's an address or a bitmap:
298*0b57cec5SDimitry Andric   //    even means address, odd means bitmap.
299*0b57cec5SDimitry Andric   // 2. Just a simple list of addresses is a valid encoding.
300*0b57cec5SDimitry Andric 
301*0b57cec5SDimitry Andric   Elf_Rela Rela;
302*0b57cec5SDimitry Andric   Rela.r_info = 0;
303*0b57cec5SDimitry Andric   Rela.r_addend = 0;
304*0b57cec5SDimitry Andric   Rela.setType(getRelativeRelocationType(), false);
305*0b57cec5SDimitry Andric   std::vector<Elf_Rela> Relocs;
306*0b57cec5SDimitry Andric 
307*0b57cec5SDimitry Andric   // Word type: uint32_t for Elf32, and uint64_t for Elf64.
308*0b57cec5SDimitry Andric   typedef typename ELFT::uint Word;
309*0b57cec5SDimitry Andric 
310*0b57cec5SDimitry Andric   // Word size in number of bytes.
311*0b57cec5SDimitry Andric   const size_t WordSize = sizeof(Word);
312*0b57cec5SDimitry Andric 
313*0b57cec5SDimitry Andric   // Number of bits used for the relocation offsets bitmap.
314*0b57cec5SDimitry Andric   // These many relative relocations can be encoded in a single entry.
315*0b57cec5SDimitry Andric   const size_t NBits = 8*WordSize - 1;
316*0b57cec5SDimitry Andric 
317*0b57cec5SDimitry Andric   Word Base = 0;
318*0b57cec5SDimitry Andric   for (const Elf_Relr &R : relrs) {
319*0b57cec5SDimitry Andric     Word Entry = R;
320*0b57cec5SDimitry Andric     if ((Entry&1) == 0) {
321*0b57cec5SDimitry Andric       // Even entry: encodes the offset for next relocation.
322*0b57cec5SDimitry Andric       Rela.r_offset = Entry;
323*0b57cec5SDimitry Andric       Relocs.push_back(Rela);
324*0b57cec5SDimitry Andric       // Set base offset for subsequent bitmap entries.
325*0b57cec5SDimitry Andric       Base = Entry + WordSize;
326*0b57cec5SDimitry Andric       continue;
327*0b57cec5SDimitry Andric     }
328*0b57cec5SDimitry Andric 
329*0b57cec5SDimitry Andric     // Odd entry: encodes bitmap for relocations starting at base.
330*0b57cec5SDimitry Andric     Word Offset = Base;
331*0b57cec5SDimitry Andric     while (Entry != 0) {
332*0b57cec5SDimitry Andric       Entry >>= 1;
333*0b57cec5SDimitry Andric       if ((Entry&1) != 0) {
334*0b57cec5SDimitry Andric         Rela.r_offset = Offset;
335*0b57cec5SDimitry Andric         Relocs.push_back(Rela);
336*0b57cec5SDimitry Andric       }
337*0b57cec5SDimitry Andric       Offset += WordSize;
338*0b57cec5SDimitry Andric     }
339*0b57cec5SDimitry Andric 
340*0b57cec5SDimitry Andric     // Advance base offset by NBits words.
341*0b57cec5SDimitry Andric     Base += NBits * WordSize;
342*0b57cec5SDimitry Andric   }
343*0b57cec5SDimitry Andric 
344*0b57cec5SDimitry Andric   return Relocs;
345*0b57cec5SDimitry Andric }
346*0b57cec5SDimitry Andric 
347*0b57cec5SDimitry Andric template <class ELFT>
348*0b57cec5SDimitry Andric Expected<std::vector<typename ELFT::Rela>>
349*0b57cec5SDimitry Andric ELFFile<ELFT>::android_relas(const Elf_Shdr *Sec) const {
350*0b57cec5SDimitry Andric   // This function reads relocations in Android's packed relocation format,
351*0b57cec5SDimitry Andric   // which is based on SLEB128 and delta encoding.
352*0b57cec5SDimitry Andric   Expected<ArrayRef<uint8_t>> ContentsOrErr = getSectionContents(Sec);
353*0b57cec5SDimitry Andric   if (!ContentsOrErr)
354*0b57cec5SDimitry Andric     return ContentsOrErr.takeError();
355*0b57cec5SDimitry Andric   const uint8_t *Cur = ContentsOrErr->begin();
356*0b57cec5SDimitry Andric   const uint8_t *End = ContentsOrErr->end();
357*0b57cec5SDimitry Andric   if (ContentsOrErr->size() < 4 || Cur[0] != 'A' || Cur[1] != 'P' ||
358*0b57cec5SDimitry Andric       Cur[2] != 'S' || Cur[3] != '2')
359*0b57cec5SDimitry Andric     return createError("invalid packed relocation header");
360*0b57cec5SDimitry Andric   Cur += 4;
361*0b57cec5SDimitry Andric 
362*0b57cec5SDimitry Andric   const char *ErrStr = nullptr;
363*0b57cec5SDimitry Andric   auto ReadSLEB = [&]() -> int64_t {
364*0b57cec5SDimitry Andric     if (ErrStr)
365*0b57cec5SDimitry Andric       return 0;
366*0b57cec5SDimitry Andric     unsigned Len;
367*0b57cec5SDimitry Andric     int64_t Result = decodeSLEB128(Cur, &Len, End, &ErrStr);
368*0b57cec5SDimitry Andric     Cur += Len;
369*0b57cec5SDimitry Andric     return Result;
370*0b57cec5SDimitry Andric   };
371*0b57cec5SDimitry Andric 
372*0b57cec5SDimitry Andric   uint64_t NumRelocs = ReadSLEB();
373*0b57cec5SDimitry Andric   uint64_t Offset = ReadSLEB();
374*0b57cec5SDimitry Andric   uint64_t Addend = 0;
375*0b57cec5SDimitry Andric 
376*0b57cec5SDimitry Andric   if (ErrStr)
377*0b57cec5SDimitry Andric     return createError(ErrStr);
378*0b57cec5SDimitry Andric 
379*0b57cec5SDimitry Andric   std::vector<Elf_Rela> Relocs;
380*0b57cec5SDimitry Andric   Relocs.reserve(NumRelocs);
381*0b57cec5SDimitry Andric   while (NumRelocs) {
382*0b57cec5SDimitry Andric     uint64_t NumRelocsInGroup = ReadSLEB();
383*0b57cec5SDimitry Andric     if (NumRelocsInGroup > NumRelocs)
384*0b57cec5SDimitry Andric       return createError("relocation group unexpectedly large");
385*0b57cec5SDimitry Andric     NumRelocs -= NumRelocsInGroup;
386*0b57cec5SDimitry Andric 
387*0b57cec5SDimitry Andric     uint64_t GroupFlags = ReadSLEB();
388*0b57cec5SDimitry Andric     bool GroupedByInfo = GroupFlags & ELF::RELOCATION_GROUPED_BY_INFO_FLAG;
389*0b57cec5SDimitry Andric     bool GroupedByOffsetDelta = GroupFlags & ELF::RELOCATION_GROUPED_BY_OFFSET_DELTA_FLAG;
390*0b57cec5SDimitry Andric     bool GroupedByAddend = GroupFlags & ELF::RELOCATION_GROUPED_BY_ADDEND_FLAG;
391*0b57cec5SDimitry Andric     bool GroupHasAddend = GroupFlags & ELF::RELOCATION_GROUP_HAS_ADDEND_FLAG;
392*0b57cec5SDimitry Andric 
393*0b57cec5SDimitry Andric     uint64_t GroupOffsetDelta;
394*0b57cec5SDimitry Andric     if (GroupedByOffsetDelta)
395*0b57cec5SDimitry Andric       GroupOffsetDelta = ReadSLEB();
396*0b57cec5SDimitry Andric 
397*0b57cec5SDimitry Andric     uint64_t GroupRInfo;
398*0b57cec5SDimitry Andric     if (GroupedByInfo)
399*0b57cec5SDimitry Andric       GroupRInfo = ReadSLEB();
400*0b57cec5SDimitry Andric 
401*0b57cec5SDimitry Andric     if (GroupedByAddend && GroupHasAddend)
402*0b57cec5SDimitry Andric       Addend += ReadSLEB();
403*0b57cec5SDimitry Andric 
404*0b57cec5SDimitry Andric     if (!GroupHasAddend)
405*0b57cec5SDimitry Andric       Addend = 0;
406*0b57cec5SDimitry Andric 
407*0b57cec5SDimitry Andric     for (uint64_t I = 0; I != NumRelocsInGroup; ++I) {
408*0b57cec5SDimitry Andric       Elf_Rela R;
409*0b57cec5SDimitry Andric       Offset += GroupedByOffsetDelta ? GroupOffsetDelta : ReadSLEB();
410*0b57cec5SDimitry Andric       R.r_offset = Offset;
411*0b57cec5SDimitry Andric       R.r_info = GroupedByInfo ? GroupRInfo : ReadSLEB();
412*0b57cec5SDimitry Andric       if (GroupHasAddend && !GroupedByAddend)
413*0b57cec5SDimitry Andric         Addend += ReadSLEB();
414*0b57cec5SDimitry Andric       R.r_addend = Addend;
415*0b57cec5SDimitry Andric       Relocs.push_back(R);
416*0b57cec5SDimitry Andric 
417*0b57cec5SDimitry Andric       if (ErrStr)
418*0b57cec5SDimitry Andric         return createError(ErrStr);
419*0b57cec5SDimitry Andric     }
420*0b57cec5SDimitry Andric 
421*0b57cec5SDimitry Andric     if (ErrStr)
422*0b57cec5SDimitry Andric       return createError(ErrStr);
423*0b57cec5SDimitry Andric   }
424*0b57cec5SDimitry Andric 
425*0b57cec5SDimitry Andric   return Relocs;
426*0b57cec5SDimitry Andric }
427*0b57cec5SDimitry Andric 
428*0b57cec5SDimitry Andric template <class ELFT>
429*0b57cec5SDimitry Andric std::string ELFFile<ELFT>::getDynamicTagAsString(unsigned Arch,
430*0b57cec5SDimitry Andric                                                  uint64_t Type) const {
431*0b57cec5SDimitry Andric #define DYNAMIC_STRINGIFY_ENUM(tag, value)                                     \
432*0b57cec5SDimitry Andric   case value:                                                                  \
433*0b57cec5SDimitry Andric     return #tag;
434*0b57cec5SDimitry Andric 
435*0b57cec5SDimitry Andric #define DYNAMIC_TAG(n, v)
436*0b57cec5SDimitry Andric   switch (Arch) {
437*0b57cec5SDimitry Andric   case ELF::EM_AARCH64:
438*0b57cec5SDimitry Andric     switch (Type) {
439*0b57cec5SDimitry Andric #define AARCH64_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value)
440*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def"
441*0b57cec5SDimitry Andric #undef AARCH64_DYNAMIC_TAG
442*0b57cec5SDimitry Andric     }
443*0b57cec5SDimitry Andric     break;
444*0b57cec5SDimitry Andric 
445*0b57cec5SDimitry Andric   case ELF::EM_HEXAGON:
446*0b57cec5SDimitry Andric     switch (Type) {
447*0b57cec5SDimitry Andric #define HEXAGON_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value)
448*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def"
449*0b57cec5SDimitry Andric #undef HEXAGON_DYNAMIC_TAG
450*0b57cec5SDimitry Andric     }
451*0b57cec5SDimitry Andric     break;
452*0b57cec5SDimitry Andric 
453*0b57cec5SDimitry Andric   case ELF::EM_MIPS:
454*0b57cec5SDimitry Andric     switch (Type) {
455*0b57cec5SDimitry Andric #define MIPS_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value)
456*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def"
457*0b57cec5SDimitry Andric #undef MIPS_DYNAMIC_TAG
458*0b57cec5SDimitry Andric     }
459*0b57cec5SDimitry Andric     break;
460*0b57cec5SDimitry Andric 
461*0b57cec5SDimitry Andric   case ELF::EM_PPC64:
462*0b57cec5SDimitry Andric     switch (Type) {
463*0b57cec5SDimitry Andric #define PPC64_DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value)
464*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def"
465*0b57cec5SDimitry Andric #undef PPC64_DYNAMIC_TAG
466*0b57cec5SDimitry Andric     }
467*0b57cec5SDimitry Andric     break;
468*0b57cec5SDimitry Andric   }
469*0b57cec5SDimitry Andric #undef DYNAMIC_TAG
470*0b57cec5SDimitry Andric   switch (Type) {
471*0b57cec5SDimitry Andric // Now handle all dynamic tags except the architecture specific ones
472*0b57cec5SDimitry Andric #define AARCH64_DYNAMIC_TAG(name, value)
473*0b57cec5SDimitry Andric #define MIPS_DYNAMIC_TAG(name, value)
474*0b57cec5SDimitry Andric #define HEXAGON_DYNAMIC_TAG(name, value)
475*0b57cec5SDimitry Andric #define PPC64_DYNAMIC_TAG(name, value)
476*0b57cec5SDimitry Andric // Also ignore marker tags such as DT_HIOS (maps to DT_VERNEEDNUM), etc.
477*0b57cec5SDimitry Andric #define DYNAMIC_TAG_MARKER(name, value)
478*0b57cec5SDimitry Andric #define DYNAMIC_TAG(name, value) DYNAMIC_STRINGIFY_ENUM(name, value)
479*0b57cec5SDimitry Andric #include "llvm/BinaryFormat/DynamicTags.def"
480*0b57cec5SDimitry Andric #undef DYNAMIC_TAG
481*0b57cec5SDimitry Andric #undef AARCH64_DYNAMIC_TAG
482*0b57cec5SDimitry Andric #undef MIPS_DYNAMIC_TAG
483*0b57cec5SDimitry Andric #undef HEXAGON_DYNAMIC_TAG
484*0b57cec5SDimitry Andric #undef PPC64_DYNAMIC_TAG
485*0b57cec5SDimitry Andric #undef DYNAMIC_TAG_MARKER
486*0b57cec5SDimitry Andric #undef DYNAMIC_STRINGIFY_ENUM
487*0b57cec5SDimitry Andric   default:
488*0b57cec5SDimitry Andric     return "<unknown:>0x" + utohexstr(Type, true);
489*0b57cec5SDimitry Andric   }
490*0b57cec5SDimitry Andric }
491*0b57cec5SDimitry Andric 
492*0b57cec5SDimitry Andric template <class ELFT>
493*0b57cec5SDimitry Andric std::string ELFFile<ELFT>::getDynamicTagAsString(uint64_t Type) const {
494*0b57cec5SDimitry Andric   return getDynamicTagAsString(getHeader()->e_machine, Type);
495*0b57cec5SDimitry Andric }
496*0b57cec5SDimitry Andric 
497*0b57cec5SDimitry Andric template <class ELFT>
498*0b57cec5SDimitry Andric Expected<typename ELFT::DynRange> ELFFile<ELFT>::dynamicEntries() const {
499*0b57cec5SDimitry Andric   ArrayRef<Elf_Dyn> Dyn;
500*0b57cec5SDimitry Andric   size_t DynSecSize = 0;
501*0b57cec5SDimitry Andric 
502*0b57cec5SDimitry Andric   auto ProgramHeadersOrError = program_headers();
503*0b57cec5SDimitry Andric   if (!ProgramHeadersOrError)
504*0b57cec5SDimitry Andric     return ProgramHeadersOrError.takeError();
505*0b57cec5SDimitry Andric 
506*0b57cec5SDimitry Andric   for (const Elf_Phdr &Phdr : *ProgramHeadersOrError) {
507*0b57cec5SDimitry Andric     if (Phdr.p_type == ELF::PT_DYNAMIC) {
508*0b57cec5SDimitry Andric       Dyn = makeArrayRef(
509*0b57cec5SDimitry Andric           reinterpret_cast<const Elf_Dyn *>(base() + Phdr.p_offset),
510*0b57cec5SDimitry Andric           Phdr.p_filesz / sizeof(Elf_Dyn));
511*0b57cec5SDimitry Andric       DynSecSize = Phdr.p_filesz;
512*0b57cec5SDimitry Andric       break;
513*0b57cec5SDimitry Andric     }
514*0b57cec5SDimitry Andric   }
515*0b57cec5SDimitry Andric 
516*0b57cec5SDimitry Andric   // If we can't find the dynamic section in the program headers, we just fall
517*0b57cec5SDimitry Andric   // back on the sections.
518*0b57cec5SDimitry Andric   if (Dyn.empty()) {
519*0b57cec5SDimitry Andric     auto SectionsOrError = sections();
520*0b57cec5SDimitry Andric     if (!SectionsOrError)
521*0b57cec5SDimitry Andric       return SectionsOrError.takeError();
522*0b57cec5SDimitry Andric 
523*0b57cec5SDimitry Andric     for (const Elf_Shdr &Sec : *SectionsOrError) {
524*0b57cec5SDimitry Andric       if (Sec.sh_type == ELF::SHT_DYNAMIC) {
525*0b57cec5SDimitry Andric         Expected<ArrayRef<Elf_Dyn>> DynOrError =
526*0b57cec5SDimitry Andric             getSectionContentsAsArray<Elf_Dyn>(&Sec);
527*0b57cec5SDimitry Andric         if (!DynOrError)
528*0b57cec5SDimitry Andric           return DynOrError.takeError();
529*0b57cec5SDimitry Andric         Dyn = *DynOrError;
530*0b57cec5SDimitry Andric         DynSecSize = Sec.sh_size;
531*0b57cec5SDimitry Andric         break;
532*0b57cec5SDimitry Andric       }
533*0b57cec5SDimitry Andric     }
534*0b57cec5SDimitry Andric 
535*0b57cec5SDimitry Andric     if (!Dyn.data())
536*0b57cec5SDimitry Andric       return ArrayRef<Elf_Dyn>();
537*0b57cec5SDimitry Andric   }
538*0b57cec5SDimitry Andric 
539*0b57cec5SDimitry Andric   if (Dyn.empty())
540*0b57cec5SDimitry Andric     // TODO: this error is untested.
541*0b57cec5SDimitry Andric     return createError("invalid empty dynamic section");
542*0b57cec5SDimitry Andric 
543*0b57cec5SDimitry Andric   if (DynSecSize % sizeof(Elf_Dyn) != 0)
544*0b57cec5SDimitry Andric     // TODO: this error is untested.
545*0b57cec5SDimitry Andric     return createError("malformed dynamic section");
546*0b57cec5SDimitry Andric 
547*0b57cec5SDimitry Andric   if (Dyn.back().d_tag != ELF::DT_NULL)
548*0b57cec5SDimitry Andric     // TODO: this error is untested.
549*0b57cec5SDimitry Andric     return createError("dynamic sections must be DT_NULL terminated");
550*0b57cec5SDimitry Andric 
551*0b57cec5SDimitry Andric   return Dyn;
552*0b57cec5SDimitry Andric }
553*0b57cec5SDimitry Andric 
554*0b57cec5SDimitry Andric template <class ELFT>
555*0b57cec5SDimitry Andric Expected<const uint8_t *> ELFFile<ELFT>::toMappedAddr(uint64_t VAddr) const {
556*0b57cec5SDimitry Andric   auto ProgramHeadersOrError = program_headers();
557*0b57cec5SDimitry Andric   if (!ProgramHeadersOrError)
558*0b57cec5SDimitry Andric     return ProgramHeadersOrError.takeError();
559*0b57cec5SDimitry Andric 
560*0b57cec5SDimitry Andric   llvm::SmallVector<Elf_Phdr *, 4> LoadSegments;
561*0b57cec5SDimitry Andric 
562*0b57cec5SDimitry Andric   for (const Elf_Phdr &Phdr : *ProgramHeadersOrError)
563*0b57cec5SDimitry Andric     if (Phdr.p_type == ELF::PT_LOAD)
564*0b57cec5SDimitry Andric       LoadSegments.push_back(const_cast<Elf_Phdr *>(&Phdr));
565*0b57cec5SDimitry Andric 
566*0b57cec5SDimitry Andric   const Elf_Phdr *const *I =
567*0b57cec5SDimitry Andric       std::upper_bound(LoadSegments.begin(), LoadSegments.end(), VAddr,
568*0b57cec5SDimitry Andric                        [](uint64_t VAddr, const Elf_Phdr_Impl<ELFT> *Phdr) {
569*0b57cec5SDimitry Andric                          return VAddr < Phdr->p_vaddr;
570*0b57cec5SDimitry Andric                        });
571*0b57cec5SDimitry Andric 
572*0b57cec5SDimitry Andric   if (I == LoadSegments.begin())
573*0b57cec5SDimitry Andric     return createError("virtual address is not in any segment: 0x" +
574*0b57cec5SDimitry Andric                        Twine::utohexstr(VAddr));
575*0b57cec5SDimitry Andric   --I;
576*0b57cec5SDimitry Andric   const Elf_Phdr &Phdr = **I;
577*0b57cec5SDimitry Andric   uint64_t Delta = VAddr - Phdr.p_vaddr;
578*0b57cec5SDimitry Andric   if (Delta >= Phdr.p_filesz)
579*0b57cec5SDimitry Andric     return createError("virtual address is not in any segment: 0x" +
580*0b57cec5SDimitry Andric                        Twine::utohexstr(VAddr));
581*0b57cec5SDimitry Andric   return base() + Phdr.p_offset + Delta;
582*0b57cec5SDimitry Andric }
583*0b57cec5SDimitry Andric 
584*0b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF32LE>;
585*0b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF32BE>;
586*0b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF64LE>;
587*0b57cec5SDimitry Andric template class llvm::object::ELFFile<ELF64BE>;
588