xref: /freebsd/contrib/llvm-project/llvm/tools/llvm-readobj/ARMWinEHPrinter.cpp (revision b64c5a0ace59af62eff52bfe110a521dc73c937b)
1 //===-- ARMWinEHPrinter.cpp - Windows on ARM EH Data Printer ----*- C++ -*-===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 // Windows on ARM uses a series of serialised data structures (RuntimeFunction)
10 // to create a table of information for unwinding.  In order to conserve space,
11 // there are two different ways that this data is represented.
12 //
13 // For functions with canonical forms for the prologue and epilogue, the data
14 // can be stored in a "packed" form.  In this case, the data is packed into the
15 // RuntimeFunction's remaining 30-bits and can fully describe the entire frame.
16 //
17 //        +---------------------------------------+
18 //        |         Function Entry Address        |
19 //        +---------------------------------------+
20 //        |           Packed Form Data            |
21 //        +---------------------------------------+
22 //
23 // This layout is parsed by Decoder::dumpPackedEntry.  No unwind bytecode is
24 // associated with such a frame as they can be derived from the provided data.
25 // The decoder does not synthesize this data as it is unnecessary for the
26 // purposes of validation, with the synthesis being required only by a proper
27 // unwinder.
28 //
29 // For functions that are large or do not match canonical forms, the data is
30 // split up into two portions, with the actual data residing in the "exception
31 // data" table (.xdata) with a reference to the entry from the "procedure data"
32 // (.pdata) entry.
33 //
34 // The exception data contains information about the frame setup, all of the
35 // epilogue scopes (for functions for which there are multiple exit points) and
36 // the associated exception handler.  Additionally, the entry contains byte-code
37 // describing how to unwind the function (c.f. Decoder::decodeOpcodes).
38 //
39 //        +---------------------------------------+
40 //        |         Function Entry Address        |
41 //        +---------------------------------------+
42 //        |      Exception Data Entry Address     |
43 //        +---------------------------------------+
44 //
45 // This layout is parsed by Decoder::dumpUnpackedEntry.  Such an entry must
46 // first resolve the exception data entry address.  This structure
47 // (ExceptionDataRecord) has a variable sized header
48 // (c.f. ARM::WinEH::HeaderWords) and encodes most of the same information as
49 // the packed form.  However, because this information is insufficient to
50 // synthesize the unwinding, there are associated unwinding bytecode which make
51 // up the bulk of the Decoder.
52 //
53 // The decoder itself is table-driven, using the first byte to determine the
54 // opcode and dispatching to the associated printing routine.  The bytecode
55 // itself is a variable length instruction encoding that can fully describe the
56 // state of the stack and the necessary operations for unwinding to the
57 // beginning of the frame.
58 //
59 // The byte-code maintains a 1-1 instruction mapping, indicating both the width
60 // of the instruction (Thumb2 instructions are variable length, 16 or 32 bits
61 // wide) allowing the program to unwind from any point in the prologue, body, or
62 // epilogue of the function.
63 
64 #include "ARMWinEHPrinter.h"
65 #include "llvm/ADT/STLExtras.h"
66 #include "llvm/ADT/StringExtras.h"
67 #include "llvm/Support/ARMWinEH.h"
68 #include "llvm/Support/Format.h"
69 
70 using namespace llvm;
71 using namespace llvm::object;
72 using namespace llvm::support;
73 
74 namespace llvm {
75 raw_ostream &operator<<(raw_ostream &OS, const ARM::WinEH::ReturnType &RT) {
76   switch (RT) {
77   case ARM::WinEH::ReturnType::RT_POP:
78     OS << "pop {pc}";
79     break;
80   case ARM::WinEH::ReturnType::RT_B:
81     OS << "bx <reg>";
82     break;
83   case ARM::WinEH::ReturnType::RT_BW:
84     OS << "b.w <target>";
85     break;
86   case ARM::WinEH::ReturnType::RT_NoEpilogue:
87     OS << "(no epilogue)";
88     break;
89   }
90   return OS;
91 }
92 }
93 
94 static std::string formatSymbol(StringRef Name, uint64_t Address,
95                                 uint64_t Offset = 0) {
96   std::string Buffer;
97   raw_string_ostream OS(Buffer);
98 
99   if (!Name.empty())
100     OS << Name << " ";
101 
102   if (Offset)
103     OS << format("+0x%" PRIX64 " (0x%" PRIX64 ")", Offset, Address);
104   else if (!Name.empty())
105     OS << format("(0x%" PRIX64 ")", Address);
106   else
107     OS << format("0x%" PRIX64, Address);
108 
109   return OS.str();
110 }
111 
112 namespace llvm {
113 namespace ARM {
114 namespace WinEH {
115 const size_t Decoder::PDataEntrySize = sizeof(RuntimeFunction);
116 
117 // TODO name the uops more appropriately
118 const Decoder::RingEntry Decoder::Ring[] = {
119   { 0x80, 0x00, 1, &Decoder::opcode_0xxxxxxx },  // UOP_STACK_FREE (16-bit)
120   { 0xc0, 0x80, 2, &Decoder::opcode_10Lxxxxx },  // UOP_POP (32-bit)
121   { 0xf0, 0xc0, 1, &Decoder::opcode_1100xxxx },  // UOP_STACK_SAVE (16-bit)
122   { 0xf8, 0xd0, 1, &Decoder::opcode_11010Lxx },  // UOP_POP (16-bit)
123   { 0xf8, 0xd8, 1, &Decoder::opcode_11011Lxx },  // UOP_POP (32-bit)
124   { 0xf8, 0xe0, 1, &Decoder::opcode_11100xxx },  // UOP_VPOP (32-bit)
125   { 0xfc, 0xe8, 2, &Decoder::opcode_111010xx },  // UOP_STACK_FREE (32-bit)
126   { 0xfe, 0xec, 2, &Decoder::opcode_1110110L },  // UOP_POP (16-bit)
127   { 0xff, 0xee, 2, &Decoder::opcode_11101110 },  // UOP_MICROSOFT_SPECIFIC (16-bit)
128                                               // UOP_PUSH_MACHINE_FRAME
129                                               // UOP_PUSH_CONTEXT
130                                               // UOP_PUSH_TRAP_FRAME
131                                               // UOP_REDZONE_RESTORE_LR
132   { 0xff, 0xef, 2, &Decoder::opcode_11101111 },  // UOP_LDRPC_POSTINC (32-bit)
133   { 0xff, 0xf5, 2, &Decoder::opcode_11110101 },  // UOP_VPOP (32-bit)
134   { 0xff, 0xf6, 2, &Decoder::opcode_11110110 },  // UOP_VPOP (32-bit)
135   { 0xff, 0xf7, 3, &Decoder::opcode_11110111 },  // UOP_STACK_RESTORE (16-bit)
136   { 0xff, 0xf8, 4, &Decoder::opcode_11111000 },  // UOP_STACK_RESTORE (16-bit)
137   { 0xff, 0xf9, 3, &Decoder::opcode_11111001 },  // UOP_STACK_RESTORE (32-bit)
138   { 0xff, 0xfa, 4, &Decoder::opcode_11111010 },  // UOP_STACK_RESTORE (32-bit)
139   { 0xff, 0xfb, 1, &Decoder::opcode_11111011 },  // UOP_NOP (16-bit)
140   { 0xff, 0xfc, 1, &Decoder::opcode_11111100 },  // UOP_NOP (32-bit)
141   { 0xff, 0xfd, 1, &Decoder::opcode_11111101 },  // UOP_NOP (16-bit) / END
142   { 0xff, 0xfe, 1, &Decoder::opcode_11111110 },  // UOP_NOP (32-bit) / END
143   { 0xff, 0xff, 1, &Decoder::opcode_11111111 },  // UOP_END
144 };
145 
146 // Unwind opcodes for ARM64.
147 // https://docs.microsoft.com/en-us/cpp/build/arm64-exception-handling
148 const Decoder::RingEntry Decoder::Ring64[] = {
149     {0xe0, 0x00, 1, &Decoder::opcode_alloc_s},
150     {0xe0, 0x20, 1, &Decoder::opcode_save_r19r20_x},
151     {0xc0, 0x40, 1, &Decoder::opcode_save_fplr},
152     {0xc0, 0x80, 1, &Decoder::opcode_save_fplr_x},
153     {0xf8, 0xc0, 2, &Decoder::opcode_alloc_m},
154     {0xfc, 0xc8, 2, &Decoder::opcode_save_regp},
155     {0xfc, 0xcc, 2, &Decoder::opcode_save_regp_x},
156     {0xfc, 0xd0, 2, &Decoder::opcode_save_reg},
157     {0xfe, 0xd4, 2, &Decoder::opcode_save_reg_x},
158     {0xfe, 0xd6, 2, &Decoder::opcode_save_lrpair},
159     {0xfe, 0xd8, 2, &Decoder::opcode_save_fregp},
160     {0xfe, 0xda, 2, &Decoder::opcode_save_fregp_x},
161     {0xfe, 0xdc, 2, &Decoder::opcode_save_freg},
162     {0xff, 0xde, 2, &Decoder::opcode_save_freg_x},
163     {0xff, 0xe0, 4, &Decoder::opcode_alloc_l},
164     {0xff, 0xe1, 1, &Decoder::opcode_setfp},
165     {0xff, 0xe2, 2, &Decoder::opcode_addfp},
166     {0xff, 0xe3, 1, &Decoder::opcode_nop},
167     {0xff, 0xe4, 1, &Decoder::opcode_end},
168     {0xff, 0xe5, 1, &Decoder::opcode_end_c},
169     {0xff, 0xe6, 1, &Decoder::opcode_save_next},
170     {0xff, 0xe7, 3, &Decoder::opcode_save_any_reg},
171     {0xff, 0xe8, 1, &Decoder::opcode_trap_frame},
172     {0xff, 0xe9, 1, &Decoder::opcode_machine_frame},
173     {0xff, 0xea, 1, &Decoder::opcode_context},
174     {0xff, 0xeb, 1, &Decoder::opcode_ec_context},
175     {0xff, 0xec, 1, &Decoder::opcode_clear_unwound_to_call},
176     {0xff, 0xfc, 1, &Decoder::opcode_pac_sign_lr},
177 };
178 
179 static void printRange(raw_ostream &OS, ListSeparator &LS, unsigned First,
180                        unsigned Last, char Letter) {
181   if (First == Last)
182     OS << LS << Letter << First;
183   else
184     OS << LS << Letter << First << "-" << Letter << Last;
185 }
186 
187 static void printRange(raw_ostream &OS, uint32_t Mask, ListSeparator &LS,
188                        unsigned Start, unsigned End, char Letter) {
189   int First = -1;
190   for (unsigned RI = Start; RI <= End; ++RI) {
191     if (Mask & (1 << RI)) {
192       if (First < 0)
193         First = RI;
194     } else {
195       if (First >= 0) {
196         printRange(OS, LS, First, RI - 1, Letter);
197         First = -1;
198       }
199     }
200   }
201   if (First >= 0)
202     printRange(OS, LS, First, End, Letter);
203 }
204 
205 void Decoder::printGPRMask(uint16_t GPRMask) {
206   OS << '{';
207   ListSeparator LS;
208   printRange(OS, GPRMask, LS, 0, 12, 'r');
209   if (GPRMask & (1 << 14))
210     OS << LS << "lr";
211   if (GPRMask & (1 << 15))
212     OS << LS << "pc";
213   OS << '}';
214 }
215 
216 void Decoder::printVFPMask(uint32_t VFPMask) {
217   OS << '{';
218   ListSeparator LS;
219   printRange(OS, VFPMask, LS, 0, 31, 'd');
220   OS << '}';
221 }
222 
223 ErrorOr<object::SectionRef>
224 Decoder::getSectionContaining(const COFFObjectFile &COFF, uint64_t VA) {
225   for (const auto &Section : COFF.sections()) {
226     uint64_t Address = Section.getAddress();
227     uint64_t Size = Section.getSize();
228 
229     if (VA >= Address && (VA - Address) <= Size)
230       return Section;
231   }
232   return inconvertibleErrorCode();
233 }
234 
235 ErrorOr<object::SymbolRef> Decoder::getSymbol(const COFFObjectFile &COFF,
236                                               uint64_t VA, bool FunctionOnly) {
237   for (const auto &Symbol : COFF.symbols()) {
238     Expected<SymbolRef::Type> Type = Symbol.getType();
239     if (!Type)
240       return errorToErrorCode(Type.takeError());
241     if (FunctionOnly && *Type != SymbolRef::ST_Function)
242       continue;
243 
244     Expected<uint64_t> Address = Symbol.getAddress();
245     if (!Address)
246       return errorToErrorCode(Address.takeError());
247     if (*Address == VA)
248       return Symbol;
249   }
250   return inconvertibleErrorCode();
251 }
252 
253 ErrorOr<SymbolRef> Decoder::getRelocatedSymbol(const COFFObjectFile &,
254                                                const SectionRef &Section,
255                                                uint64_t Offset) {
256   for (const auto &Relocation : Section.relocations()) {
257     uint64_t RelocationOffset = Relocation.getOffset();
258     if (RelocationOffset == Offset)
259       return *Relocation.getSymbol();
260   }
261   return inconvertibleErrorCode();
262 }
263 
264 SymbolRef Decoder::getPreferredSymbol(const COFFObjectFile &COFF, SymbolRef Sym,
265                                       uint64_t &SymbolOffset) {
266   // The symbol resolved by getRelocatedSymbol can be any internal
267   // nondescriptive symbol; try to resolve a more descriptive one.
268   COFFSymbolRef CoffSym = COFF.getCOFFSymbol(Sym);
269   if (CoffSym.getStorageClass() != COFF::IMAGE_SYM_CLASS_LABEL &&
270       CoffSym.getSectionDefinition() == nullptr)
271     return Sym;
272   for (const auto &S : COFF.symbols()) {
273     COFFSymbolRef CS = COFF.getCOFFSymbol(S);
274     if (CS.getSectionNumber() == CoffSym.getSectionNumber() &&
275         CS.getValue() <= CoffSym.getValue() + SymbolOffset &&
276         CS.getStorageClass() != COFF::IMAGE_SYM_CLASS_LABEL &&
277         CS.getSectionDefinition() == nullptr) {
278       uint32_t Offset = CoffSym.getValue() + SymbolOffset - CS.getValue();
279       if (Offset <= SymbolOffset) {
280         SymbolOffset = Offset;
281         Sym = S;
282         CoffSym = CS;
283         if (CS.isExternal() && SymbolOffset == 0)
284           return Sym;
285       }
286     }
287   }
288   return Sym;
289 }
290 
291 ErrorOr<SymbolRef> Decoder::getSymbolForLocation(
292     const COFFObjectFile &COFF, const SectionRef &Section,
293     uint64_t OffsetInSection, uint64_t ImmediateOffset, uint64_t &SymbolAddress,
294     uint64_t &SymbolOffset, bool FunctionOnly) {
295   // Try to locate a relocation that points at the offset in the section
296   ErrorOr<SymbolRef> SymOrErr =
297       getRelocatedSymbol(COFF, Section, OffsetInSection);
298   if (SymOrErr) {
299     // We found a relocation symbol; the immediate offset needs to be added
300     // to the symbol address.
301     SymbolOffset = ImmediateOffset;
302 
303     Expected<uint64_t> AddressOrErr = SymOrErr->getAddress();
304     if (!AddressOrErr) {
305       std::string Buf;
306       llvm::raw_string_ostream OS(Buf);
307       logAllUnhandledErrors(AddressOrErr.takeError(), OS);
308       report_fatal_error(Twine(OS.str()));
309     }
310     // We apply SymbolOffset here directly. We return it separately to allow
311     // the caller to print it as an offset on the symbol name.
312     SymbolAddress = *AddressOrErr + SymbolOffset;
313 
314     if (FunctionOnly) // Resolve label/section symbols into function names.
315       SymOrErr = getPreferredSymbol(COFF, *SymOrErr, SymbolOffset);
316   } else {
317     // No matching relocation found; operating on a linked image. Try to
318     // find a descriptive symbol if possible. The immediate offset contains
319     // the image relative address, and we shouldn't add any offset to the
320     // symbol.
321     SymbolAddress = COFF.getImageBase() + ImmediateOffset;
322     SymbolOffset = 0;
323     SymOrErr = getSymbol(COFF, SymbolAddress, FunctionOnly);
324   }
325   return SymOrErr;
326 }
327 
328 bool Decoder::opcode_0xxxxxxx(const uint8_t *OC, unsigned &Offset,
329                               unsigned Length, bool Prologue) {
330   uint8_t Imm = OC[Offset] & 0x7f;
331   SW.startLine() << format("0x%02x                ; %s sp, #(%u * 4)\n",
332                            OC[Offset],
333                            static_cast<const char *>(Prologue ? "sub" : "add"),
334                            Imm);
335   ++Offset;
336   return false;
337 }
338 
339 bool Decoder::opcode_10Lxxxxx(const uint8_t *OC, unsigned &Offset,
340                               unsigned Length, bool Prologue) {
341   unsigned Link = (OC[Offset] & 0x20) >> 5;
342   uint16_t RegisterMask = (Link << (Prologue ? 14 : 15))
343                         | ((OC[Offset + 0] & 0x1f) << 8)
344                         | ((OC[Offset + 1] & 0xff) << 0);
345   assert((~RegisterMask & (1 << 13)) && "sp must not be set");
346   assert((~RegisterMask & (1 << (Prologue ? 15 : 14))) && "pc must not be set");
347 
348   SW.startLine() << format("0x%02x 0x%02x           ; %s.w ",
349                            OC[Offset + 0], OC[Offset + 1],
350                            Prologue ? "push" : "pop");
351   printGPRMask(RegisterMask);
352   OS << '\n';
353 
354   Offset += 2;
355   return false;
356 }
357 
358 bool Decoder::opcode_1100xxxx(const uint8_t *OC, unsigned &Offset,
359                               unsigned Length, bool Prologue) {
360   if (Prologue)
361     SW.startLine() << format("0x%02x                ; mov r%u, sp\n",
362                              OC[Offset], OC[Offset] & 0xf);
363   else
364     SW.startLine() << format("0x%02x                ; mov sp, r%u\n",
365                              OC[Offset], OC[Offset] & 0xf);
366   ++Offset;
367   return false;
368 }
369 
370 bool Decoder::opcode_11010Lxx(const uint8_t *OC, unsigned &Offset,
371                               unsigned Length, bool Prologue) {
372   unsigned Link = (OC[Offset] & 0x4) >> 2;
373   unsigned Count = (OC[Offset] & 0x3);
374 
375   uint16_t GPRMask = (Link << (Prologue ? 14 : 15))
376                    | (((1 << (Count + 1)) - 1) << 4);
377 
378   SW.startLine() << format("0x%02x                ; %s ", OC[Offset],
379                            Prologue ? "push" : "pop");
380   printGPRMask(GPRMask);
381   OS << '\n';
382 
383   ++Offset;
384   return false;
385 }
386 
387 bool Decoder::opcode_11011Lxx(const uint8_t *OC, unsigned &Offset,
388                               unsigned Length, bool Prologue) {
389   unsigned Link = (OC[Offset] & 0x4) >> 2;
390   unsigned Count = (OC[Offset] & 0x3) + 4;
391 
392   uint16_t GPRMask = (Link << (Prologue ? 14 : 15))
393                    | (((1 << (Count + 1)) - 1) << 4);
394 
395   SW.startLine() << format("0x%02x                ; %s.w ", OC[Offset],
396                            Prologue ? "push" : "pop");
397   printGPRMask(GPRMask);
398   OS << '\n';
399 
400   ++Offset;
401   return false;
402 }
403 
404 bool Decoder::opcode_11100xxx(const uint8_t *OC, unsigned &Offset,
405                               unsigned Length, bool Prologue) {
406   unsigned High = (OC[Offset] & 0x7);
407   uint32_t VFPMask = (((1 << (High + 1)) - 1) << 8);
408 
409   SW.startLine() << format("0x%02x                ; %s ", OC[Offset],
410                            Prologue ? "vpush" : "vpop");
411   printVFPMask(VFPMask);
412   OS << '\n';
413 
414   ++Offset;
415   return false;
416 }
417 
418 bool Decoder::opcode_111010xx(const uint8_t *OC, unsigned &Offset,
419                               unsigned Length, bool Prologue) {
420   uint16_t Imm = ((OC[Offset + 0] & 0x03) << 8) | ((OC[Offset + 1] & 0xff) << 0);
421 
422   SW.startLine() << format("0x%02x 0x%02x           ; %s.w sp, #(%u * 4)\n",
423                            OC[Offset + 0], OC[Offset + 1],
424                            static_cast<const char *>(Prologue ? "sub" : "add"),
425                            Imm);
426 
427   Offset += 2;
428   return false;
429 }
430 
431 bool Decoder::opcode_1110110L(const uint8_t *OC, unsigned &Offset,
432                               unsigned Length, bool Prologue) {
433   uint16_t GPRMask = ((OC[Offset + 0] & 0x01) << (Prologue ? 14 : 15))
434                    | ((OC[Offset + 1] & 0xff) << 0);
435 
436   SW.startLine() << format("0x%02x 0x%02x           ; %s ", OC[Offset + 0],
437                            OC[Offset + 1], Prologue ? "push" : "pop");
438   printGPRMask(GPRMask);
439   OS << '\n';
440 
441   Offset += 2;
442   return false;
443 }
444 
445 bool Decoder::opcode_11101110(const uint8_t *OC, unsigned &Offset,
446                               unsigned Length, bool Prologue) {
447   assert(!Prologue && "may not be used in prologue");
448 
449   if (OC[Offset + 1] & 0xf0)
450     SW.startLine() << format("0x%02x 0x%02x           ; reserved\n",
451                              OC[Offset + 0], OC[Offset +  1]);
452   else
453     SW.startLine()
454       << format("0x%02x 0x%02x           ; microsoft-specific (type: %u)\n",
455                 OC[Offset + 0], OC[Offset + 1], OC[Offset + 1] & 0x0f);
456 
457   Offset += 2;
458   return false;
459 }
460 
461 bool Decoder::opcode_11101111(const uint8_t *OC, unsigned &Offset,
462                               unsigned Length, bool Prologue) {
463   if (OC[Offset + 1] & 0xf0)
464     SW.startLine() << format("0x%02x 0x%02x           ; reserved\n",
465                              OC[Offset + 0], OC[Offset +  1]);
466   else if (Prologue)
467     SW.startLine()
468       << format("0x%02x 0x%02x           ; str.w lr, [sp, #-%u]!\n",
469                 OC[Offset + 0], OC[Offset + 1], OC[Offset + 1] << 2);
470   else
471     SW.startLine()
472       << format("0x%02x 0x%02x           ; ldr.w lr, [sp], #%u\n",
473                 OC[Offset + 0], OC[Offset + 1], OC[Offset + 1] << 2);
474 
475   Offset += 2;
476   return false;
477 }
478 
479 bool Decoder::opcode_11110101(const uint8_t *OC, unsigned &Offset,
480                               unsigned Length, bool Prologue) {
481   unsigned Start = (OC[Offset + 1] & 0xf0) >> 4;
482   unsigned End = (OC[Offset + 1] & 0x0f) >> 0;
483   uint32_t VFPMask = ((1 << (End + 1 - Start)) - 1) << Start;
484 
485   SW.startLine() << format("0x%02x 0x%02x           ; %s ", OC[Offset + 0],
486                            OC[Offset + 1], Prologue ? "vpush" : "vpop");
487   printVFPMask(VFPMask);
488   OS << '\n';
489 
490   Offset += 2;
491   return false;
492 }
493 
494 bool Decoder::opcode_11110110(const uint8_t *OC, unsigned &Offset,
495                               unsigned Length, bool Prologue) {
496   unsigned Start = (OC[Offset + 1] & 0xf0) >> 4;
497   unsigned End = (OC[Offset + 1] & 0x0f) >> 0;
498   uint32_t VFPMask = ((1 << (End + 1 - Start)) - 1) << (16 + Start);
499 
500   SW.startLine() << format("0x%02x 0x%02x           ; %s ", OC[Offset + 0],
501                            OC[Offset + 1], Prologue ? "vpush" : "vpop");
502   printVFPMask(VFPMask);
503   OS << '\n';
504 
505   Offset += 2;
506   return false;
507 }
508 
509 bool Decoder::opcode_11110111(const uint8_t *OC, unsigned &Offset,
510                               unsigned Length, bool Prologue) {
511   uint32_t Imm = (OC[Offset + 1] << 8) | (OC[Offset + 2] << 0);
512 
513   SW.startLine() << format("0x%02x 0x%02x 0x%02x      ; %s sp, sp, #(%u * 4)\n",
514                            OC[Offset + 0], OC[Offset + 1], OC[Offset + 2],
515                            static_cast<const char *>(Prologue ? "sub" : "add"),
516                            Imm);
517 
518   Offset += 3;
519   return false;
520 }
521 
522 bool Decoder::opcode_11111000(const uint8_t *OC, unsigned &Offset,
523                               unsigned Length, bool Prologue) {
524   uint32_t Imm = (OC[Offset + 1] << 16)
525                | (OC[Offset + 2] << 8)
526                | (OC[Offset + 3] << 0);
527 
528   SW.startLine()
529     << format("0x%02x 0x%02x 0x%02x 0x%02x ; %s sp, sp, #(%u * 4)\n",
530               OC[Offset + 0], OC[Offset + 1], OC[Offset + 2], OC[Offset + 3],
531               static_cast<const char *>(Prologue ? "sub" : "add"), Imm);
532 
533   Offset += 4;
534   return false;
535 }
536 
537 bool Decoder::opcode_11111001(const uint8_t *OC, unsigned &Offset,
538                               unsigned Length, bool Prologue) {
539   uint32_t Imm = (OC[Offset + 1] << 8) | (OC[Offset + 2] << 0);
540 
541   SW.startLine()
542     << format("0x%02x 0x%02x 0x%02x      ; %s.w sp, sp, #(%u * 4)\n",
543               OC[Offset + 0], OC[Offset + 1], OC[Offset + 2],
544               static_cast<const char *>(Prologue ? "sub" : "add"), Imm);
545 
546   Offset += 3;
547   return false;
548 }
549 
550 bool Decoder::opcode_11111010(const uint8_t *OC, unsigned &Offset,
551                               unsigned Length, bool Prologue) {
552   uint32_t Imm = (OC[Offset + 1] << 16)
553                | (OC[Offset + 2] << 8)
554                | (OC[Offset + 3] << 0);
555 
556   SW.startLine()
557     << format("0x%02x 0x%02x 0x%02x 0x%02x ; %s.w sp, sp, #(%u * 4)\n",
558               OC[Offset + 0], OC[Offset + 1], OC[Offset + 2], OC[Offset + 3],
559               static_cast<const char *>(Prologue ? "sub" : "add"), Imm);
560 
561   Offset += 4;
562   return false;
563 }
564 
565 bool Decoder::opcode_11111011(const uint8_t *OC, unsigned &Offset,
566                               unsigned Length, bool Prologue) {
567   SW.startLine() << format("0x%02x                ; nop\n", OC[Offset]);
568   ++Offset;
569   return false;
570 }
571 
572 bool Decoder::opcode_11111100(const uint8_t *OC, unsigned &Offset,
573                               unsigned Length, bool Prologue) {
574   SW.startLine() << format("0x%02x                ; nop.w\n", OC[Offset]);
575   ++Offset;
576   return false;
577 }
578 
579 bool Decoder::opcode_11111101(const uint8_t *OC, unsigned &Offset,
580                               unsigned Length, bool Prologue) {
581   SW.startLine() << format("0x%02x                ; bx <reg>\n", OC[Offset]);
582   ++Offset;
583   return true;
584 }
585 
586 bool Decoder::opcode_11111110(const uint8_t *OC, unsigned &Offset,
587                               unsigned Length, bool Prologue) {
588   SW.startLine() << format("0x%02x                ; b.w <target>\n", OC[Offset]);
589   ++Offset;
590   return true;
591 }
592 
593 bool Decoder::opcode_11111111(const uint8_t *OC, unsigned &Offset,
594                               unsigned Length, bool Prologue) {
595   ++Offset;
596   return true;
597 }
598 
599 // ARM64 unwind codes start here.
600 bool Decoder::opcode_alloc_s(const uint8_t *OC, unsigned &Offset,
601                              unsigned Length, bool Prologue) {
602   uint32_t NumBytes = (OC[Offset] & 0x1F) << 4;
603   SW.startLine() << format("0x%02x                ; %s sp, #%u\n", OC[Offset],
604                            static_cast<const char *>(Prologue ? "sub" : "add"),
605                            NumBytes);
606   ++Offset;
607   return false;
608 }
609 
610 bool Decoder::opcode_save_r19r20_x(const uint8_t *OC, unsigned &Offset,
611                                    unsigned Length, bool Prologue) {
612   uint32_t Off = (OC[Offset] & 0x1F) << 3;
613   if (Prologue)
614     SW.startLine() << format(
615         "0x%02x                ; stp x19, x20, [sp, #-%u]!\n", OC[Offset], Off);
616   else
617     SW.startLine() << format(
618         "0x%02x                ; ldp x19, x20, [sp], #%u\n", OC[Offset], Off);
619   ++Offset;
620   return false;
621 }
622 
623 bool Decoder::opcode_save_fplr(const uint8_t *OC, unsigned &Offset,
624                                unsigned Length, bool Prologue) {
625   uint32_t Off = (OC[Offset] & 0x3F) << 3;
626   SW.startLine() << format(
627       "0x%02x                ; %s x29, x30, [sp, #%u]\n", OC[Offset],
628       static_cast<const char *>(Prologue ? "stp" : "ldp"), Off);
629   ++Offset;
630   return false;
631 }
632 
633 bool Decoder::opcode_save_fplr_x(const uint8_t *OC, unsigned &Offset,
634                                  unsigned Length, bool Prologue) {
635   uint32_t Off = ((OC[Offset] & 0x3F) + 1) << 3;
636   if (Prologue)
637     SW.startLine() << format(
638         "0x%02x                ; stp x29, x30, [sp, #-%u]!\n", OC[Offset], Off);
639   else
640     SW.startLine() << format(
641         "0x%02x                ; ldp x29, x30, [sp], #%u\n", OC[Offset], Off);
642   ++Offset;
643   return false;
644 }
645 
646 bool Decoder::opcode_alloc_m(const uint8_t *OC, unsigned &Offset,
647                              unsigned Length, bool Prologue) {
648   uint32_t NumBytes = ((OC[Offset] & 0x07) << 8);
649   NumBytes |= (OC[Offset + 1] & 0xFF);
650   NumBytes <<= 4;
651   SW.startLine() << format("0x%02x%02x              ; %s sp, #%u\n",
652                            OC[Offset], OC[Offset + 1],
653                            static_cast<const char *>(Prologue ? "sub" : "add"),
654                            NumBytes);
655   Offset += 2;
656   return false;
657 }
658 
659 bool Decoder::opcode_save_regp(const uint8_t *OC, unsigned &Offset,
660                                unsigned Length, bool Prologue) {
661   uint32_t Reg = ((OC[Offset] & 0x03) << 8);
662   Reg |= (OC[Offset + 1] & 0xC0);
663   Reg >>= 6;
664   Reg += 19;
665   uint32_t Off = (OC[Offset + 1] & 0x3F) << 3;
666   SW.startLine() << format(
667       "0x%02x%02x              ; %s x%u, x%u, [sp, #%u]\n",
668       OC[Offset], OC[Offset + 1],
669       static_cast<const char *>(Prologue ? "stp" : "ldp"), Reg, Reg + 1, Off);
670   Offset += 2;
671   return false;
672 }
673 
674 bool Decoder::opcode_save_regp_x(const uint8_t *OC, unsigned &Offset,
675                                  unsigned Length, bool Prologue) {
676   uint32_t Reg = ((OC[Offset] & 0x03) << 8);
677   Reg |= (OC[Offset + 1] & 0xC0);
678   Reg >>= 6;
679   Reg += 19;
680   uint32_t Off = ((OC[Offset + 1] & 0x3F) + 1) << 3;
681   if (Prologue)
682     SW.startLine() << format(
683         "0x%02x%02x              ; stp x%u, x%u, [sp, #-%u]!\n",
684         OC[Offset], OC[Offset + 1], Reg,
685         Reg + 1, Off);
686   else
687     SW.startLine() << format(
688         "0x%02x%02x              ; ldp x%u, x%u, [sp], #%u\n",
689         OC[Offset], OC[Offset + 1], Reg,
690         Reg + 1, Off);
691   Offset += 2;
692   return false;
693 }
694 
695 bool Decoder::opcode_save_reg(const uint8_t *OC, unsigned &Offset,
696                               unsigned Length, bool Prologue) {
697   uint32_t Reg = (OC[Offset] & 0x03) << 8;
698   Reg |= (OC[Offset + 1] & 0xC0);
699   Reg >>= 6;
700   Reg += 19;
701   uint32_t Off = (OC[Offset + 1] & 0x3F) << 3;
702   SW.startLine() << format("0x%02x%02x              ; %s x%u, [sp, #%u]\n",
703                            OC[Offset], OC[Offset + 1],
704                            static_cast<const char *>(Prologue ? "str" : "ldr"),
705                            Reg, Off);
706   Offset += 2;
707   return false;
708 }
709 
710 bool Decoder::opcode_save_reg_x(const uint8_t *OC, unsigned &Offset,
711                                 unsigned Length, bool Prologue) {
712   uint32_t Reg = (OC[Offset] & 0x01) << 8;
713   Reg |= (OC[Offset + 1] & 0xE0);
714   Reg >>= 5;
715   Reg += 19;
716   uint32_t Off = ((OC[Offset + 1] & 0x1F) + 1) << 3;
717   if (Prologue)
718     SW.startLine() << format("0x%02x%02x              ; str x%u, [sp, #-%u]!\n",
719                              OC[Offset], OC[Offset + 1], Reg, Off);
720   else
721     SW.startLine() << format("0x%02x%02x              ; ldr x%u, [sp], #%u\n",
722                              OC[Offset], OC[Offset + 1], Reg, Off);
723   Offset += 2;
724   return false;
725 }
726 
727 bool Decoder::opcode_save_lrpair(const uint8_t *OC, unsigned &Offset,
728                                  unsigned Length, bool Prologue) {
729   uint32_t Reg = (OC[Offset] & 0x01) << 8;
730   Reg |= (OC[Offset + 1] & 0xC0);
731   Reg >>= 6;
732   Reg *= 2;
733   Reg += 19;
734   uint32_t Off = (OC[Offset + 1] & 0x3F) << 3;
735   SW.startLine() << format("0x%02x%02x              ; %s x%u, lr, [sp, #%u]\n",
736                            OC[Offset], OC[Offset + 1],
737                            static_cast<const char *>(Prologue ? "stp" : "ldp"),
738                            Reg, Off);
739   Offset += 2;
740   return false;
741 }
742 
743 bool Decoder::opcode_save_fregp(const uint8_t *OC, unsigned &Offset,
744                                 unsigned Length, bool Prologue) {
745   uint32_t Reg = (OC[Offset] & 0x01) << 8;
746   Reg |= (OC[Offset + 1] & 0xC0);
747   Reg >>= 6;
748   Reg += 8;
749   uint32_t Off = (OC[Offset + 1] & 0x3F) << 3;
750   SW.startLine() << format("0x%02x%02x              ; %s d%u, d%u, [sp, #%u]\n",
751                            OC[Offset], OC[Offset + 1],
752                            static_cast<const char *>(Prologue ? "stp" : "ldp"),
753                            Reg, Reg + 1, Off);
754   Offset += 2;
755   return false;
756 }
757 
758 bool Decoder::opcode_save_fregp_x(const uint8_t *OC, unsigned &Offset,
759                                   unsigned Length, bool Prologue) {
760   uint32_t Reg = (OC[Offset] & 0x01) << 8;
761   Reg |= (OC[Offset + 1] & 0xC0);
762   Reg >>= 6;
763   Reg += 8;
764   uint32_t Off = ((OC[Offset + 1] & 0x3F) + 1) << 3;
765   if (Prologue)
766     SW.startLine() << format(
767         "0x%02x%02x              ; stp d%u, d%u, [sp, #-%u]!\n", OC[Offset],
768         OC[Offset + 1], Reg, Reg + 1, Off);
769   else
770     SW.startLine() << format(
771         "0x%02x%02x              ; ldp d%u, d%u, [sp], #%u\n", OC[Offset],
772         OC[Offset + 1], Reg, Reg + 1, Off);
773   Offset += 2;
774   return false;
775 }
776 
777 bool Decoder::opcode_save_freg(const uint8_t *OC, unsigned &Offset,
778                                unsigned Length, bool Prologue) {
779   uint32_t Reg = (OC[Offset] & 0x01) << 8;
780   Reg |= (OC[Offset + 1] & 0xC0);
781   Reg >>= 6;
782   Reg += 8;
783   uint32_t Off = (OC[Offset + 1] & 0x3F) << 3;
784   SW.startLine() << format("0x%02x%02x              ; %s d%u, [sp, #%u]\n",
785                            OC[Offset], OC[Offset + 1],
786                            static_cast<const char *>(Prologue ? "str" : "ldr"),
787                            Reg, Off);
788   Offset += 2;
789   return false;
790 }
791 
792 bool Decoder::opcode_save_freg_x(const uint8_t *OC, unsigned &Offset,
793                                  unsigned Length, bool Prologue) {
794   uint32_t Reg = ((OC[Offset + 1] & 0xE0) >> 5) + 8;
795   uint32_t Off = ((OC[Offset + 1] & 0x1F) + 1) << 3;
796   if (Prologue)
797     SW.startLine() << format(
798         "0x%02x%02x              ; str d%u, [sp, #-%u]!\n", OC[Offset],
799         OC[Offset + 1], Reg, Off);
800   else
801     SW.startLine() << format(
802         "0x%02x%02x              ; ldr d%u, [sp], #%u\n", OC[Offset],
803         OC[Offset + 1], Reg, Off);
804   Offset += 2;
805   return false;
806 }
807 
808 bool Decoder::opcode_alloc_l(const uint8_t *OC, unsigned &Offset,
809                              unsigned Length, bool Prologue) {
810   unsigned Off =
811       (OC[Offset + 1] << 16) | (OC[Offset + 2] << 8) | (OC[Offset + 3] << 0);
812   Off <<= 4;
813   SW.startLine() << format(
814       "0x%02x%02x%02x%02x          ; %s sp, #%u\n", OC[Offset], OC[Offset + 1],
815       OC[Offset + 2], OC[Offset + 3],
816       static_cast<const char *>(Prologue ? "sub" : "add"), Off);
817   Offset += 4;
818   return false;
819 }
820 
821 bool Decoder::opcode_setfp(const uint8_t *OC, unsigned &Offset, unsigned Length,
822                            bool Prologue) {
823   SW.startLine() << format("0x%02x                ; mov %s, %s\n", OC[Offset],
824                            static_cast<const char *>(Prologue ? "fp" : "sp"),
825                            static_cast<const char *>(Prologue ? "sp" : "fp"));
826   ++Offset;
827   return false;
828 }
829 
830 bool Decoder::opcode_addfp(const uint8_t *OC, unsigned &Offset, unsigned Length,
831                            bool Prologue) {
832   unsigned NumBytes = OC[Offset + 1] << 3;
833   SW.startLine() << format(
834       "0x%02x%02x              ; %s %s, %s, #%u\n", OC[Offset], OC[Offset + 1],
835       static_cast<const char *>(Prologue ? "add" : "sub"),
836       static_cast<const char *>(Prologue ? "fp" : "sp"),
837       static_cast<const char *>(Prologue ? "sp" : "fp"), NumBytes);
838   Offset += 2;
839   return false;
840 }
841 
842 bool Decoder::opcode_nop(const uint8_t *OC, unsigned &Offset, unsigned Length,
843                          bool Prologue) {
844   SW.startLine() << format("0x%02x                ; nop\n", OC[Offset]);
845   ++Offset;
846   return false;
847 }
848 
849 bool Decoder::opcode_end(const uint8_t *OC, unsigned &Offset, unsigned Length,
850                          bool Prologue) {
851   SW.startLine() << format("0x%02x                ; end\n", OC[Offset]);
852   ++Offset;
853   return true;
854 }
855 
856 bool Decoder::opcode_end_c(const uint8_t *OC, unsigned &Offset, unsigned Length,
857                            bool Prologue) {
858   SW.startLine() << format("0x%02x                ; end_c\n", OC[Offset]);
859   ++Offset;
860   return false;
861 }
862 
863 bool Decoder::opcode_save_next(const uint8_t *OC, unsigned &Offset,
864                                unsigned Length, bool Prologue) {
865   if (Prologue)
866     SW.startLine() << format("0x%02x                ; save next\n", OC[Offset]);
867   else
868     SW.startLine() << format("0x%02x                ; restore next\n",
869                              OC[Offset]);
870   ++Offset;
871   return false;
872 }
873 
874 bool Decoder::opcode_save_any_reg(const uint8_t *OC, unsigned &Offset,
875                                   unsigned Length, bool Prologue) {
876   // Whether the instruction has writeback
877   bool Writeback = (OC[Offset + 1] & 0x20) == 0x20;
878   // Whether the instruction is paired.  (Paired instructions are required
879   // to save/restore adjacent registers.)
880   bool Paired = (OC[Offset + 1] & 0x40) == 0x40;
881   // The kind of register saved:
882   // - 0 is an x register
883   // - 1 is the low half of a q register
884   // - 2 is a whole q register
885   int RegKind = (OC[Offset + 2] & 0xC0) >> 6;
886   // Encoded register name (0 -> x0/q0, 1 -> x1/q1, etc.)
887   int Reg = OC[Offset + 1] & 0x1F;
888   // Encoded stack offset of load/store instruction; decoding varies by mode.
889   int StackOffset = OC[Offset + 2] & 0x3F;
890   if (Writeback)
891     StackOffset++;
892   if (!Writeback && !Paired && RegKind != 2)
893     StackOffset *= 8;
894   else
895     StackOffset *= 16;
896 
897   SW.startLine() << format("0x%02x%02x%02x            ; ", OC[Offset],
898                            OC[Offset + 1], OC[Offset + 2]);
899 
900   // Verify the encoding is in a form we understand.  The high bit of the first
901   // byte, and mode 3 for the register kind are apparently reserved.  The
902   // encoded register must refer to a valid register.
903   int MaxReg = 0x1F;
904   if (Paired)
905     --MaxReg;
906   if (RegKind == 0)
907     --MaxReg;
908   if ((OC[Offset + 1] & 0x80) == 0x80 || RegKind == 3 || Reg > MaxReg) {
909     SW.getOStream() << "invalid save_any_reg encoding\n";
910     Offset += 3;
911     return false;
912   }
913 
914   if (Paired) {
915     if (Prologue)
916       SW.getOStream() << "stp ";
917     else
918       SW.getOStream() << "ldp ";
919   } else {
920     if (Prologue)
921       SW.getOStream() << "str ";
922     else
923       SW.getOStream() << "ldr ";
924   }
925 
926   char RegChar = 'x';
927   if (RegKind == 1) {
928     RegChar = 'd';
929   } else if (RegKind == 2) {
930     RegChar = 'q';
931   }
932 
933   if (Paired)
934     SW.getOStream() << format("%c%d, %c%d, ", RegChar, Reg, RegChar, Reg + 1);
935   else
936     SW.getOStream() << format("%c%d, ", RegChar, Reg);
937 
938   if (Writeback) {
939     if (Prologue)
940       SW.getOStream() << format("[sp, #-%d]!\n", StackOffset);
941     else
942       SW.getOStream() << format("[sp], #%d\n", StackOffset);
943   } else {
944     SW.getOStream() << format("[sp, #%d]\n", StackOffset);
945   }
946 
947   Offset += 3;
948   return false;
949 }
950 
951 bool Decoder::opcode_trap_frame(const uint8_t *OC, unsigned &Offset,
952                                 unsigned Length, bool Prologue) {
953   SW.startLine() << format("0x%02x                ; trap frame\n", OC[Offset]);
954   ++Offset;
955   return false;
956 }
957 
958 bool Decoder::opcode_machine_frame(const uint8_t *OC, unsigned &Offset,
959                                    unsigned Length, bool Prologue) {
960   SW.startLine() << format("0x%02x                ; machine frame\n",
961                            OC[Offset]);
962   ++Offset;
963   return false;
964 }
965 
966 bool Decoder::opcode_context(const uint8_t *OC, unsigned &Offset,
967                              unsigned Length, bool Prologue) {
968   SW.startLine() << format("0x%02x                ; context\n", OC[Offset]);
969   ++Offset;
970   return false;
971 }
972 
973 bool Decoder::opcode_ec_context(const uint8_t *OC, unsigned &Offset,
974                                 unsigned Length, bool Prologue) {
975   SW.startLine() << format("0x%02x                ; EC context\n", OC[Offset]);
976   ++Offset;
977   return false;
978 }
979 
980 bool Decoder::opcode_clear_unwound_to_call(const uint8_t *OC, unsigned &Offset,
981                                            unsigned Length, bool Prologue) {
982   SW.startLine() << format("0x%02x                ; clear unwound to call\n",
983                            OC[Offset]);
984   ++Offset;
985   return false;
986 }
987 
988 bool Decoder::opcode_pac_sign_lr(const uint8_t *OC, unsigned &Offset,
989                                  unsigned Length, bool Prologue) {
990   if (Prologue)
991     SW.startLine() << format("0x%02x                ; pacibsp\n", OC[Offset]);
992   else
993     SW.startLine() << format("0x%02x                ; autibsp\n", OC[Offset]);
994   ++Offset;
995   return false;
996 }
997 
998 void Decoder::decodeOpcodes(ArrayRef<uint8_t> Opcodes, unsigned Offset,
999                             bool Prologue) {
1000   assert((!Prologue || Offset == 0) && "prologue should always use offset 0");
1001   const RingEntry* DecodeRing = isAArch64 ? Ring64 : Ring;
1002   bool Terminated = false;
1003   for (unsigned OI = Offset, OE = Opcodes.size(); !Terminated && OI < OE; ) {
1004     for (unsigned DI = 0;; ++DI) {
1005       if ((isAArch64 && (DI >= std::size(Ring64))) ||
1006           (!isAArch64 && (DI >= std::size(Ring)))) {
1007         SW.startLine() << format("0x%02x                ; Bad opcode!\n",
1008                                  Opcodes.data()[OI]);
1009         ++OI;
1010         break;
1011       }
1012 
1013       if ((Opcodes[OI] & DecodeRing[DI].Mask) == DecodeRing[DI].Value) {
1014         if (OI + DecodeRing[DI].Length > OE) {
1015           SW.startLine() << format("Opcode 0x%02x goes past the unwind data\n",
1016                                     Opcodes[OI]);
1017           OI += DecodeRing[DI].Length;
1018           break;
1019         }
1020         Terminated =
1021             (this->*DecodeRing[DI].Routine)(Opcodes.data(), OI, 0, Prologue);
1022         break;
1023       }
1024     }
1025   }
1026 }
1027 
1028 bool Decoder::dumpXDataRecord(const COFFObjectFile &COFF,
1029                               const SectionRef &Section,
1030                               uint64_t FunctionAddress, uint64_t VA) {
1031   ArrayRef<uint8_t> Contents;
1032   if (COFF.getSectionContents(COFF.getCOFFSection(Section), Contents))
1033     return false;
1034 
1035   uint64_t SectionVA = Section.getAddress();
1036   uint64_t Offset = VA - SectionVA;
1037   const ulittle32_t *Data =
1038     reinterpret_cast<const ulittle32_t *>(Contents.data() + Offset);
1039 
1040   // Sanity check to ensure that the .xdata header is present.
1041   // A header is one or two words, followed by at least one word to describe
1042   // the unwind codes. Applicable to both ARM and AArch64.
1043   if (Contents.size() - Offset < 8)
1044     report_fatal_error(".xdata must be at least 8 bytes in size");
1045 
1046   const ExceptionDataRecord XData(Data, isAArch64);
1047   DictScope XRS(SW, "ExceptionData");
1048   SW.printNumber("FunctionLength",
1049                  isAArch64 ? XData.FunctionLengthInBytesAArch64() :
1050                  XData.FunctionLengthInBytesARM());
1051   SW.printNumber("Version", XData.Vers());
1052   SW.printBoolean("ExceptionData", XData.X());
1053   SW.printBoolean("EpiloguePacked", XData.E());
1054   if (!isAArch64)
1055     SW.printBoolean("Fragment", XData.F());
1056   SW.printNumber(XData.E() ? "EpilogueOffset" : "EpilogueScopes",
1057                  XData.EpilogueCount());
1058   uint64_t ByteCodeLength = XData.CodeWords() * sizeof(uint32_t);
1059   SW.printNumber("ByteCodeLength", ByteCodeLength);
1060 
1061   if ((int64_t)(Contents.size() - Offset - 4 * HeaderWords(XData) -
1062                 (XData.E() ? 0 : XData.EpilogueCount() * 4) -
1063                 (XData.X() ? 8 : 0)) < (int64_t)ByteCodeLength) {
1064     SW.flush();
1065     report_fatal_error("Malformed unwind data");
1066   }
1067 
1068   if (XData.E()) {
1069     ArrayRef<uint8_t> UC = XData.UnwindByteCode();
1070     {
1071       ListScope PS(SW, "Prologue");
1072       decodeOpcodes(UC, 0, /*Prologue=*/true);
1073     }
1074     if (XData.EpilogueCount()) {
1075       ListScope ES(SW, "Epilogue");
1076       decodeOpcodes(UC, XData.EpilogueCount(), /*Prologue=*/false);
1077     }
1078   } else {
1079     {
1080       ListScope PS(SW, "Prologue");
1081       decodeOpcodes(XData.UnwindByteCode(), 0, /*Prologue=*/true);
1082     }
1083     ArrayRef<ulittle32_t> EpilogueScopes = XData.EpilogueScopes();
1084     ListScope ESS(SW, "EpilogueScopes");
1085     for (const EpilogueScope ES : EpilogueScopes) {
1086       DictScope ESES(SW, "EpilogueScope");
1087       SW.printNumber("StartOffset", ES.EpilogueStartOffset());
1088       if (!isAArch64)
1089         SW.printNumber("Condition", ES.Condition());
1090       SW.printNumber("EpilogueStartIndex",
1091                      isAArch64 ? ES.EpilogueStartIndexAArch64()
1092                                : ES.EpilogueStartIndexARM());
1093       unsigned ReservedMask = isAArch64 ? 0xF : 0x3;
1094       if ((ES.ES >> 18) & ReservedMask)
1095         SW.printNumber("ReservedBits", (ES.ES >> 18) & ReservedMask);
1096 
1097       ListScope Opcodes(SW, "Opcodes");
1098       decodeOpcodes(XData.UnwindByteCode(),
1099                     isAArch64 ? ES.EpilogueStartIndexAArch64()
1100                               : ES.EpilogueStartIndexARM(),
1101                     /*Prologue=*/false);
1102     }
1103   }
1104 
1105   if (XData.X()) {
1106     const uint32_t Parameter = XData.ExceptionHandlerParameter();
1107     const size_t HandlerOffset = HeaderWords(XData) +
1108                                  (XData.E() ? 0 : XData.EpilogueCount()) +
1109                                  XData.CodeWords();
1110 
1111     uint64_t Address, SymbolOffset;
1112     ErrorOr<SymbolRef> Symbol = getSymbolForLocation(
1113         COFF, Section, Offset + HandlerOffset * sizeof(uint32_t),
1114         XData.ExceptionHandlerRVA(), Address, SymbolOffset,
1115         /*FunctionOnly=*/true);
1116     if (!Symbol) {
1117       ListScope EHS(SW, "ExceptionHandler");
1118       SW.printHex("Routine", Address);
1119       SW.printHex("Parameter", Parameter);
1120       return true;
1121     }
1122 
1123     Expected<StringRef> Name = Symbol->getName();
1124     if (!Name) {
1125       std::string Buf;
1126       llvm::raw_string_ostream OS(Buf);
1127       logAllUnhandledErrors(Name.takeError(), OS);
1128       report_fatal_error(Twine(OS.str()));
1129     }
1130 
1131     ListScope EHS(SW, "ExceptionHandler");
1132     SW.printString("Routine", formatSymbol(*Name, Address, SymbolOffset));
1133     SW.printHex("Parameter", Parameter);
1134   }
1135 
1136   return true;
1137 }
1138 
1139 bool Decoder::dumpUnpackedEntry(const COFFObjectFile &COFF,
1140                                 const SectionRef Section, uint64_t Offset,
1141                                 unsigned Index, const RuntimeFunction &RF) {
1142   assert(RF.Flag() == RuntimeFunctionFlag::RFF_Unpacked &&
1143          "packed entry cannot be treated as an unpacked entry");
1144 
1145   uint64_t FunctionAddress, FunctionOffset;
1146   ErrorOr<SymbolRef> Function = getSymbolForLocation(
1147       COFF, Section, Offset, RF.BeginAddress, FunctionAddress, FunctionOffset,
1148       /*FunctionOnly=*/true);
1149 
1150   uint64_t XDataAddress, XDataOffset;
1151   ErrorOr<SymbolRef> XDataRecord = getSymbolForLocation(
1152       COFF, Section, Offset + 4, RF.ExceptionInformationRVA(), XDataAddress,
1153       XDataOffset);
1154 
1155   if (!RF.BeginAddress && !Function)
1156     return false;
1157   if (!RF.UnwindData && !XDataRecord)
1158     return false;
1159 
1160   StringRef FunctionName;
1161   if (Function) {
1162     Expected<StringRef> FunctionNameOrErr = Function->getName();
1163     if (!FunctionNameOrErr) {
1164       std::string Buf;
1165       llvm::raw_string_ostream OS(Buf);
1166       logAllUnhandledErrors(FunctionNameOrErr.takeError(), OS);
1167       report_fatal_error(Twine(OS.str()));
1168     }
1169     FunctionName = *FunctionNameOrErr;
1170   }
1171 
1172   SW.printString("Function",
1173                  formatSymbol(FunctionName, FunctionAddress, FunctionOffset));
1174 
1175   if (XDataRecord) {
1176     Expected<StringRef> Name = XDataRecord->getName();
1177     if (!Name) {
1178       std::string Buf;
1179       llvm::raw_string_ostream OS(Buf);
1180       logAllUnhandledErrors(Name.takeError(), OS);
1181       report_fatal_error(Twine(OS.str()));
1182     }
1183 
1184     SW.printString("ExceptionRecord",
1185                    formatSymbol(*Name, XDataAddress, XDataOffset));
1186 
1187     Expected<section_iterator> SIOrErr = XDataRecord->getSection();
1188     if (!SIOrErr) {
1189       // TODO: Actually report errors helpfully.
1190       consumeError(SIOrErr.takeError());
1191       return false;
1192     }
1193     section_iterator SI = *SIOrErr;
1194 
1195     return dumpXDataRecord(COFF, *SI, FunctionAddress, XDataAddress);
1196   } else {
1197     SW.printString("ExceptionRecord", formatSymbol("", XDataAddress));
1198 
1199     ErrorOr<SectionRef> Section = getSectionContaining(COFF, XDataAddress);
1200     if (!Section)
1201       return false;
1202 
1203     return dumpXDataRecord(COFF, *Section, FunctionAddress, XDataAddress);
1204   }
1205 }
1206 
1207 bool Decoder::dumpPackedEntry(const object::COFFObjectFile &COFF,
1208                               const SectionRef Section, uint64_t Offset,
1209                               unsigned Index, const RuntimeFunction &RF) {
1210   assert((RF.Flag() == RuntimeFunctionFlag::RFF_Packed ||
1211           RF.Flag() == RuntimeFunctionFlag::RFF_PackedFragment) &&
1212          "unpacked entry cannot be treated as a packed entry");
1213 
1214   uint64_t FunctionAddress, FunctionOffset;
1215   ErrorOr<SymbolRef> Function = getSymbolForLocation(
1216       COFF, Section, Offset, RF.BeginAddress, FunctionAddress, FunctionOffset,
1217       /*FunctionOnly=*/true);
1218 
1219   StringRef FunctionName;
1220   if (Function) {
1221     Expected<StringRef> FunctionNameOrErr = Function->getName();
1222     if (!FunctionNameOrErr) {
1223       std::string Buf;
1224       llvm::raw_string_ostream OS(Buf);
1225       logAllUnhandledErrors(FunctionNameOrErr.takeError(), OS);
1226       report_fatal_error(Twine(OS.str()));
1227     }
1228     FunctionName = *FunctionNameOrErr;
1229   }
1230 
1231   SW.printString("Function",
1232                  formatSymbol(FunctionName, FunctionAddress, FunctionOffset));
1233   SW.printBoolean("Fragment",
1234                   RF.Flag() == RuntimeFunctionFlag::RFF_PackedFragment);
1235   SW.printNumber("FunctionLength", RF.FunctionLength());
1236   SW.startLine() << "ReturnType: " << RF.Ret() << '\n';
1237   SW.printBoolean("HomedParameters", RF.H());
1238   SW.printNumber("Reg", RF.Reg());
1239   SW.printNumber("R", RF.R());
1240   SW.printBoolean("LinkRegister", RF.L());
1241   SW.printBoolean("Chaining", RF.C());
1242   SW.printNumber("StackAdjustment", StackAdjustment(RF) << 2);
1243 
1244   {
1245     ListScope PS(SW, "Prologue");
1246 
1247     uint16_t GPRMask, VFPMask;
1248     std::tie(GPRMask, VFPMask) = SavedRegisterMask(RF, /*Prologue=*/true);
1249 
1250     if (StackAdjustment(RF) && !PrologueFolding(RF))
1251       SW.startLine() << "sub sp, sp, #" << StackAdjustment(RF) * 4 << "\n";
1252     if (VFPMask) {
1253       SW.startLine() << "vpush ";
1254       printVFPMask(VFPMask);
1255       OS << "\n";
1256     }
1257     if (RF.C()) {
1258       // Count the number of registers pushed below R11
1259       int FpOffset = 4 * llvm::popcount(GPRMask & ((1U << 11) - 1));
1260       if (FpOffset)
1261         SW.startLine() << "add.w r11, sp, #" << FpOffset << "\n";
1262       else
1263         SW.startLine() << "mov r11, sp\n";
1264     }
1265     if (GPRMask) {
1266       SW.startLine() << "push ";
1267       printGPRMask(GPRMask);
1268       OS << "\n";
1269     }
1270     if (RF.H())
1271       SW.startLine() << "push {r0-r3}\n";
1272   }
1273 
1274   if (RF.Ret() != ReturnType::RT_NoEpilogue) {
1275     ListScope PS(SW, "Epilogue");
1276 
1277     uint16_t GPRMask, VFPMask;
1278     std::tie(GPRMask, VFPMask) = SavedRegisterMask(RF, /*Prologue=*/false);
1279 
1280     if (StackAdjustment(RF) && !EpilogueFolding(RF))
1281       SW.startLine() << "add sp, sp, #" << StackAdjustment(RF) * 4 << "\n";
1282     if (VFPMask) {
1283       SW.startLine() << "vpop ";
1284       printVFPMask(VFPMask);
1285       OS << "\n";
1286     }
1287     if (GPRMask) {
1288       SW.startLine() << "pop ";
1289       printGPRMask(GPRMask);
1290       OS << "\n";
1291     }
1292     if (RF.H()) {
1293       if (RF.L() == 0 || RF.Ret() != ReturnType::RT_POP)
1294         SW.startLine() << "add sp, sp, #16\n";
1295       else
1296         SW.startLine() << "ldr pc, [sp], #20\n";
1297     }
1298     if (RF.Ret() != ReturnType::RT_POP)
1299       SW.startLine() << RF.Ret() << '\n';
1300   }
1301 
1302   return true;
1303 }
1304 
1305 bool Decoder::dumpPackedARM64Entry(const object::COFFObjectFile &COFF,
1306                                    const SectionRef Section, uint64_t Offset,
1307                                    unsigned Index,
1308                                    const RuntimeFunctionARM64 &RF) {
1309   assert((RF.Flag() == RuntimeFunctionFlag::RFF_Packed ||
1310           RF.Flag() == RuntimeFunctionFlag::RFF_PackedFragment) &&
1311          "unpacked entry cannot be treated as a packed entry");
1312 
1313   uint64_t FunctionAddress, FunctionOffset;
1314   ErrorOr<SymbolRef> Function = getSymbolForLocation(
1315       COFF, Section, Offset, RF.BeginAddress, FunctionAddress, FunctionOffset,
1316       /*FunctionOnly=*/true);
1317 
1318   StringRef FunctionName;
1319   if (Function) {
1320     Expected<StringRef> FunctionNameOrErr = Function->getName();
1321     if (!FunctionNameOrErr) {
1322       std::string Buf;
1323       llvm::raw_string_ostream OS(Buf);
1324       logAllUnhandledErrors(FunctionNameOrErr.takeError(), OS);
1325       report_fatal_error(Twine(OS.str()));
1326     }
1327     FunctionName = *FunctionNameOrErr;
1328   }
1329 
1330   SW.printString("Function",
1331                  formatSymbol(FunctionName, FunctionAddress, FunctionOffset));
1332   SW.printBoolean("Fragment",
1333                   RF.Flag() == RuntimeFunctionFlag::RFF_PackedFragment);
1334   SW.printNumber("FunctionLength", RF.FunctionLength());
1335   SW.printNumber("RegF", RF.RegF());
1336   SW.printNumber("RegI", RF.RegI());
1337   SW.printBoolean("HomedParameters", RF.H());
1338   SW.printNumber("CR", RF.CR());
1339   SW.printNumber("FrameSize", RF.FrameSize() << 4);
1340   ListScope PS(SW, "Prologue");
1341 
1342   // Synthesize the equivalent prologue according to the documentation
1343   // at https://docs.microsoft.com/en-us/cpp/build/arm64-exception-handling,
1344   // printed in reverse order compared to the docs, to match how prologues
1345   // are printed for the non-packed case.
1346   int IntSZ = 8 * RF.RegI();
1347   if (RF.CR() == 1)
1348     IntSZ += 8;
1349   int FpSZ = 8 * RF.RegF();
1350   if (RF.RegF())
1351     FpSZ += 8;
1352   int SavSZ = (IntSZ + FpSZ + 8 * 8 * RF.H() + 0xf) & ~0xf;
1353   int LocSZ = (RF.FrameSize() << 4) - SavSZ;
1354 
1355   if (RF.CR() == 2 || RF.CR() == 3) {
1356     SW.startLine() << "mov x29, sp\n";
1357     if (LocSZ <= 512) {
1358       SW.startLine() << format("stp x29, lr, [sp, #-%d]!\n", LocSZ);
1359     } else {
1360       SW.startLine() << "stp x29, lr, [sp, #0]\n";
1361     }
1362   }
1363   if (LocSZ > 4080) {
1364     SW.startLine() << format("sub sp, sp, #%d\n", LocSZ - 4080);
1365     SW.startLine() << "sub sp, sp, #4080\n";
1366   } else if ((RF.CR() != 3 && RF.CR() != 2 && LocSZ > 0) || LocSZ > 512) {
1367     SW.startLine() << format("sub sp, sp, #%d\n", LocSZ);
1368   }
1369   if (RF.H()) {
1370     SW.startLine() << format("stp x6, x7, [sp, #%d]\n", SavSZ - 16);
1371     SW.startLine() << format("stp x4, x5, [sp, #%d]\n", SavSZ - 32);
1372     SW.startLine() << format("stp x2, x3, [sp, #%d]\n", SavSZ - 48);
1373     if (RF.RegI() > 0 || RF.RegF() > 0 || RF.CR() == 1) {
1374       SW.startLine() << format("stp x0, x1, [sp, #%d]\n", SavSZ - 64);
1375     } else {
1376       // This case isn't documented; if neither RegI nor RegF nor CR=1
1377       // have decremented the stack pointer by SavSZ, we need to do it here
1378       // (as the final stack adjustment of LocSZ excludes SavSZ).
1379       SW.startLine() << format("stp x0, x1, [sp, #-%d]!\n", SavSZ);
1380     }
1381   }
1382   int FloatRegs = RF.RegF() > 0 ? RF.RegF() + 1 : 0;
1383   for (int I = (FloatRegs + 1) / 2 - 1; I >= 0; I--) {
1384     if (I == (FloatRegs + 1) / 2 - 1 && FloatRegs % 2 == 1) {
1385       // The last register, an odd register without a pair
1386       SW.startLine() << format("str d%d, [sp, #%d]\n", 8 + 2 * I,
1387                                IntSZ + 16 * I);
1388     } else if (I == 0 && RF.RegI() == 0 && RF.CR() != 1) {
1389       SW.startLine() << format("stp d%d, d%d, [sp, #-%d]!\n", 8 + 2 * I,
1390                                8 + 2 * I + 1, SavSZ);
1391     } else {
1392       SW.startLine() << format("stp d%d, d%d, [sp, #%d]\n", 8 + 2 * I,
1393                                8 + 2 * I + 1, IntSZ + 16 * I);
1394     }
1395   }
1396   if (RF.CR() == 1 && (RF.RegI() % 2) == 0) {
1397     if (RF.RegI() == 0)
1398       SW.startLine() << format("str lr, [sp, #-%d]!\n", SavSZ);
1399     else
1400       SW.startLine() << format("str lr, [sp, #%d]\n", IntSZ - 8);
1401   }
1402   for (int I = (RF.RegI() + 1) / 2 - 1; I >= 0; I--) {
1403     if (I == (RF.RegI() + 1) / 2 - 1 && RF.RegI() % 2 == 1) {
1404       // The last register, an odd register without a pair
1405       if (RF.CR() == 1) {
1406         if (I == 0) { // If this is the only register pair
1407           // CR=1 combined with RegI=1 doesn't map to a documented case;
1408           // it doesn't map to any regular unwind info opcode, and the
1409           // actual unwinder doesn't support it.
1410           SW.startLine() << "INVALID!\n";
1411         } else
1412           SW.startLine() << format("stp x%d, lr, [sp, #%d]\n", 19 + 2 * I,
1413                                    16 * I);
1414       } else {
1415         if (I == 0)
1416           SW.startLine() << format("str x%d, [sp, #-%d]!\n", 19 + 2 * I, SavSZ);
1417         else
1418           SW.startLine() << format("str x%d, [sp, #%d]\n", 19 + 2 * I, 16 * I);
1419       }
1420     } else if (I == 0) {
1421       // The first register pair
1422       SW.startLine() << format("stp x19, x20, [sp, #-%d]!\n", SavSZ);
1423     } else {
1424       SW.startLine() << format("stp x%d, x%d, [sp, #%d]\n", 19 + 2 * I,
1425                                19 + 2 * I + 1, 16 * I);
1426     }
1427   }
1428   // CR=2 is yet undocumented, see
1429   // https://github.com/MicrosoftDocs/cpp-docs/pull/4202 for upstream
1430   // progress on getting it documented.
1431   if (RF.CR() == 2)
1432     SW.startLine() << "pacibsp\n";
1433   SW.startLine() << "end\n";
1434 
1435   return true;
1436 }
1437 
1438 bool Decoder::dumpProcedureDataEntry(const COFFObjectFile &COFF,
1439                                      const SectionRef Section, unsigned Index,
1440                                      ArrayRef<uint8_t> Contents) {
1441   uint64_t Offset = PDataEntrySize * Index;
1442   const ulittle32_t *Data =
1443     reinterpret_cast<const ulittle32_t *>(Contents.data() + Offset);
1444 
1445   const RuntimeFunction Entry(Data);
1446   DictScope RFS(SW, "RuntimeFunction");
1447   if (Entry.Flag() == RuntimeFunctionFlag::RFF_Unpacked)
1448     return dumpUnpackedEntry(COFF, Section, Offset, Index, Entry);
1449   if (isAArch64) {
1450     const RuntimeFunctionARM64 EntryARM64(Data);
1451     return dumpPackedARM64Entry(COFF, Section, Offset, Index, EntryARM64);
1452   }
1453   return dumpPackedEntry(COFF, Section, Offset, Index, Entry);
1454 }
1455 
1456 void Decoder::dumpProcedureData(const COFFObjectFile &COFF,
1457                                 const SectionRef Section) {
1458   ArrayRef<uint8_t> Contents;
1459   if (COFF.getSectionContents(COFF.getCOFFSection(Section), Contents))
1460     return;
1461 
1462   if (Contents.size() % PDataEntrySize) {
1463     errs() << ".pdata content is not " << PDataEntrySize << "-byte aligned\n";
1464     return;
1465   }
1466 
1467   for (unsigned EI = 0, EE = Contents.size() / PDataEntrySize; EI < EE; ++EI)
1468     if (!dumpProcedureDataEntry(COFF, Section, EI, Contents))
1469       break;
1470 }
1471 
1472 Error Decoder::dumpProcedureData(const COFFObjectFile &COFF) {
1473   for (const auto &Section : COFF.sections()) {
1474     Expected<StringRef> NameOrErr =
1475         COFF.getSectionName(COFF.getCOFFSection(Section));
1476     if (!NameOrErr)
1477       return NameOrErr.takeError();
1478 
1479     if (NameOrErr->starts_with(".pdata"))
1480       dumpProcedureData(COFF, Section);
1481   }
1482   return Error::success();
1483 }
1484 }
1485 }
1486 }
1487