xref: /freebsd/contrib/llvm-project/lld/ELF/EhFrame.cpp (revision e3f4a63af63bea70bc86b6c790b14aa5ee99fcd0)
1 //===- EhFrame.cpp -------------------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // .eh_frame section contains information on how to unwind the stack when
10 // an exception is thrown. The section consists of sequence of CIE and FDE
11 // records. The linker needs to merge CIEs and associate FDEs to CIEs.
12 // That means the linker has to understand the format of the section.
13 //
14 // This file contains a few utility functions to read .eh_frame contents.
15 //
16 //===----------------------------------------------------------------------===//
17 
18 #include "EhFrame.h"
19 #include "Config.h"
20 #include "InputFiles.h"
21 #include "InputSection.h"
22 #include "Relocations.h"
23 #include "Target.h"
24 #include "llvm/BinaryFormat/Dwarf.h"
25 
26 using namespace llvm;
27 using namespace llvm::ELF;
28 using namespace llvm::dwarf;
29 using namespace llvm::object;
30 using namespace lld;
31 using namespace lld::elf;
32 
33 namespace {
34 class EhReader {
35 public:
36   EhReader(InputSectionBase *s, ArrayRef<uint8_t> d) : isec(s), d(d) {}
37   uint8_t getFdeEncoding();
38   bool hasLSDA();
39 
40 private:
41   template <class P> void errOn(const P *loc, const Twine &msg) {
42     Ctx &ctx = isec->file->ctx;
43     Err(ctx) << "corrupted .eh_frame: " << msg << "\n>>> defined in "
44              << isec->getObjMsg((const uint8_t *)loc - isec->content().data());
45   }
46 
47   uint8_t readByte();
48   void skipBytes(size_t count);
49   StringRef readString();
50   void skipLeb128();
51   void skipAugP();
52   StringRef getAugmentation();
53 
54   InputSectionBase *isec;
55   ArrayRef<uint8_t> d;
56 };
57 }
58 
59 // Read a byte and advance D by one byte.
60 uint8_t EhReader::readByte() {
61   if (d.empty()) {
62     errOn(d.data(), "unexpected end of CIE");
63     return 0;
64   }
65   uint8_t b = d.front();
66   d = d.slice(1);
67   return b;
68 }
69 
70 void EhReader::skipBytes(size_t count) {
71   if (d.size() < count)
72     errOn(d.data(), "CIE is too small");
73   else
74     d = d.slice(count);
75 }
76 
77 // Read a null-terminated string.
78 StringRef EhReader::readString() {
79   const uint8_t *end = llvm::find(d, '\0');
80   if (end == d.end()) {
81     errOn(d.data(), "corrupted CIE (failed to read string)");
82     return {};
83   }
84   StringRef s = toStringRef(d.slice(0, end - d.begin()));
85   d = d.slice(s.size() + 1);
86   return s;
87 }
88 
89 // Skip an integer encoded in the LEB128 format.
90 // Actual number is not of interest because only the runtime needs it.
91 // But we need to be at least able to skip it so that we can read
92 // the field that follows a LEB128 number.
93 void EhReader::skipLeb128() {
94   const uint8_t *errPos = d.data();
95   while (!d.empty()) {
96     uint8_t val = d.front();
97     d = d.slice(1);
98     if ((val & 0x80) == 0)
99       return;
100   }
101   errOn(errPos, "corrupted CIE (failed to read LEB128)");
102 }
103 
104 static size_t getAugPSize(Ctx &ctx, unsigned enc) {
105   switch (enc & 0x0f) {
106   case DW_EH_PE_absptr:
107   case DW_EH_PE_signed:
108     return ctx.arg.wordsize;
109   case DW_EH_PE_udata2:
110   case DW_EH_PE_sdata2:
111     return 2;
112   case DW_EH_PE_udata4:
113   case DW_EH_PE_sdata4:
114     return 4;
115   case DW_EH_PE_udata8:
116   case DW_EH_PE_sdata8:
117     return 8;
118   }
119   return 0;
120 }
121 
122 void EhReader::skipAugP() {
123   uint8_t enc = readByte();
124   if ((enc & 0xf0) == DW_EH_PE_aligned)
125     return errOn(d.data() - 1, "DW_EH_PE_aligned encoding is not supported");
126   size_t size = getAugPSize(isec->getCtx(), enc);
127   if (size == 0)
128     return errOn(d.data() - 1, "unknown FDE encoding");
129   if (size >= d.size())
130     return errOn(d.data() - 1, "corrupted CIE");
131   d = d.slice(size);
132 }
133 
134 uint8_t elf::getFdeEncoding(EhSectionPiece *p) {
135   return EhReader(p->sec, p->data()).getFdeEncoding();
136 }
137 
138 bool elf::hasLSDA(const EhSectionPiece &p) {
139   return EhReader(p.sec, p.data()).hasLSDA();
140 }
141 
142 StringRef EhReader::getAugmentation() {
143   skipBytes(8);
144   int version = readByte();
145   if (version != 1 && version != 3) {
146     errOn(d.data() - 1,
147           "FDE version 1 or 3 expected, but got " + Twine(version));
148     return {};
149   }
150 
151   StringRef aug = readString();
152 
153   // Skip code and data alignment factors.
154   skipLeb128();
155   skipLeb128();
156 
157   // Skip the return address register. In CIE version 1 this is a single
158   // byte. In CIE version 3 this is an unsigned LEB128.
159   if (version == 1)
160     readByte();
161   else
162     skipLeb128();
163   return aug;
164 }
165 
166 uint8_t EhReader::getFdeEncoding() {
167   // We only care about an 'R' value, but other records may precede an 'R'
168   // record. Unfortunately records are not in TLV (type-length-value) format,
169   // so we need to teach the linker how to skip records for each type.
170   StringRef aug = getAugmentation();
171   for (char c : aug) {
172     if (c == 'R')
173       return readByte();
174     if (c == 'z')
175       skipLeb128();
176     else if (c == 'L')
177       readByte();
178     else if (c == 'P')
179       skipAugP();
180     else if (c != 'B' && c != 'S' && c != 'G') {
181       errOn(aug.data(), "unknown .eh_frame augmentation string: " + aug);
182       break;
183     }
184   }
185   return DW_EH_PE_absptr;
186 }
187 
188 bool EhReader::hasLSDA() {
189   StringRef aug = getAugmentation();
190   for (char c : aug) {
191     if (c == 'L')
192       return true;
193     if (c == 'z')
194       skipLeb128();
195     else if (c == 'P')
196       skipAugP();
197     else if (c == 'R')
198       readByte();
199     else if (c != 'B' && c != 'S' && c != 'G') {
200       errOn(aug.data(), "unknown .eh_frame augmentation string: " + aug);
201       break;
202     }
203   }
204   return false;
205 }
206