xref: /freebsd/contrib/llvm-project/llvm/lib/DebugInfo/DWARF/DWARFAcceleratorTable.cpp (revision 6580f5c38dd5b01aeeaed16b370f1a12423437f0)
1 //===- DWARFAcceleratorTable.cpp ------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #include "llvm/DebugInfo/DWARF/DWARFAcceleratorTable.h"
10 
11 #include "llvm/ADT/SmallVector.h"
12 #include "llvm/BinaryFormat/Dwarf.h"
13 #include "llvm/Support/Compiler.h"
14 #include "llvm/Support/DJB.h"
15 #include "llvm/Support/Errc.h"
16 #include "llvm/Support/Format.h"
17 #include "llvm/Support/FormatVariadic.h"
18 #include "llvm/Support/ScopedPrinter.h"
19 #include "llvm/Support/raw_ostream.h"
20 #include <cstddef>
21 #include <cstdint>
22 #include <utility>
23 
24 using namespace llvm;
25 
26 namespace {
27 struct Atom {
28   unsigned Value;
29 };
30 
31 static raw_ostream &operator<<(raw_ostream &OS, const Atom &A) {
32   StringRef Str = dwarf::AtomTypeString(A.Value);
33   if (!Str.empty())
34     return OS << Str;
35   return OS << "DW_ATOM_unknown_" << format("%x", A.Value);
36 }
37 } // namespace
38 
39 static Atom formatAtom(unsigned Atom) { return {Atom}; }
40 
41 DWARFAcceleratorTable::~DWARFAcceleratorTable() = default;
42 
43 Error AppleAcceleratorTable::extract() {
44   uint64_t Offset = 0;
45 
46   // Check that we can at least read the header.
47   if (!AccelSection.isValidOffset(offsetof(Header, HeaderDataLength) + 4))
48     return createStringError(errc::illegal_byte_sequence,
49                              "Section too small: cannot read header.");
50 
51   Hdr.Magic = AccelSection.getU32(&Offset);
52   Hdr.Version = AccelSection.getU16(&Offset);
53   Hdr.HashFunction = AccelSection.getU16(&Offset);
54   Hdr.BucketCount = AccelSection.getU32(&Offset);
55   Hdr.HashCount = AccelSection.getU32(&Offset);
56   Hdr.HeaderDataLength = AccelSection.getU32(&Offset);
57   FormParams = {Hdr.Version, 0, dwarf::DwarfFormat::DWARF32};
58 
59   // Check that we can read all the hashes and offsets from the
60   // section (see SourceLevelDebugging.rst for the structure of the index).
61   if (!AccelSection.isValidOffset(getIthBucketBase(Hdr.BucketCount - 1)))
62     return createStringError(
63         errc::illegal_byte_sequence,
64         "Section too small: cannot read buckets and hashes.");
65 
66   HdrData.DIEOffsetBase = AccelSection.getU32(&Offset);
67   uint32_t NumAtoms = AccelSection.getU32(&Offset);
68 
69   HashDataEntryLength = 0;
70   auto MakeUnsupportedFormError = [](dwarf::Form Form) {
71     return createStringError(errc::not_supported,
72                              "Unsupported form:" +
73                                  dwarf::FormEncodingString(Form));
74   };
75 
76   for (unsigned i = 0; i < NumAtoms; ++i) {
77     uint16_t AtomType = AccelSection.getU16(&Offset);
78     auto AtomForm = static_cast<dwarf::Form>(AccelSection.getU16(&Offset));
79     HdrData.Atoms.push_back(std::make_pair(AtomType, AtomForm));
80 
81     std::optional<uint8_t> FormSize =
82         dwarf::getFixedFormByteSize(AtomForm, FormParams);
83     if (!FormSize)
84       return MakeUnsupportedFormError(AtomForm);
85     HashDataEntryLength += *FormSize;
86   }
87 
88   IsValid = true;
89   return Error::success();
90 }
91 
92 uint32_t AppleAcceleratorTable::getNumBuckets() const {
93   return Hdr.BucketCount;
94 }
95 uint32_t AppleAcceleratorTable::getNumHashes() const { return Hdr.HashCount; }
96 uint32_t AppleAcceleratorTable::getSizeHdr() const { return sizeof(Hdr); }
97 uint32_t AppleAcceleratorTable::getHeaderDataLength() const {
98   return Hdr.HeaderDataLength;
99 }
100 
101 ArrayRef<std::pair<AppleAcceleratorTable::HeaderData::AtomType,
102                    AppleAcceleratorTable::HeaderData::Form>>
103 AppleAcceleratorTable::getAtomsDesc() {
104   return HdrData.Atoms;
105 }
106 
107 bool AppleAcceleratorTable::validateForms() {
108   for (auto Atom : getAtomsDesc()) {
109     DWARFFormValue FormValue(Atom.second);
110     switch (Atom.first) {
111     case dwarf::DW_ATOM_die_offset:
112     case dwarf::DW_ATOM_die_tag:
113     case dwarf::DW_ATOM_type_flags:
114       if ((!FormValue.isFormClass(DWARFFormValue::FC_Constant) &&
115            !FormValue.isFormClass(DWARFFormValue::FC_Flag)) ||
116           FormValue.getForm() == dwarf::DW_FORM_sdata)
117         return false;
118       break;
119     default:
120       break;
121     }
122   }
123   return true;
124 }
125 
126 std::pair<uint64_t, dwarf::Tag>
127 AppleAcceleratorTable::readAtoms(uint64_t *HashDataOffset) {
128   uint64_t DieOffset = dwarf::DW_INVALID_OFFSET;
129   dwarf::Tag DieTag = dwarf::DW_TAG_null;
130 
131   for (auto Atom : getAtomsDesc()) {
132     DWARFFormValue FormValue(Atom.second);
133     FormValue.extractValue(AccelSection, HashDataOffset, FormParams);
134     switch (Atom.first) {
135     case dwarf::DW_ATOM_die_offset:
136       DieOffset = *FormValue.getAsUnsignedConstant();
137       break;
138     case dwarf::DW_ATOM_die_tag:
139       DieTag = (dwarf::Tag)*FormValue.getAsUnsignedConstant();
140       break;
141     default:
142       break;
143     }
144   }
145   return {DieOffset, DieTag};
146 }
147 
148 void AppleAcceleratorTable::Header::dump(ScopedPrinter &W) const {
149   DictScope HeaderScope(W, "Header");
150   W.printHex("Magic", Magic);
151   W.printHex("Version", Version);
152   W.printHex("Hash function", HashFunction);
153   W.printNumber("Bucket count", BucketCount);
154   W.printNumber("Hashes count", HashCount);
155   W.printNumber("HeaderData length", HeaderDataLength);
156 }
157 
158 std::optional<uint64_t> AppleAcceleratorTable::HeaderData::extractOffset(
159     std::optional<DWARFFormValue> Value) const {
160   if (!Value)
161     return std::nullopt;
162 
163   switch (Value->getForm()) {
164   case dwarf::DW_FORM_ref1:
165   case dwarf::DW_FORM_ref2:
166   case dwarf::DW_FORM_ref4:
167   case dwarf::DW_FORM_ref8:
168   case dwarf::DW_FORM_ref_udata:
169     return Value->getRawUValue() + DIEOffsetBase;
170   default:
171     return Value->getAsSectionOffset();
172   }
173 }
174 
175 bool AppleAcceleratorTable::dumpName(ScopedPrinter &W,
176                                      SmallVectorImpl<DWARFFormValue> &AtomForms,
177                                      uint64_t *DataOffset) const {
178   uint64_t NameOffset = *DataOffset;
179   if (!AccelSection.isValidOffsetForDataOfSize(*DataOffset, 4)) {
180     W.printString("Incorrectly terminated list.");
181     return false;
182   }
183   uint64_t StringOffset = AccelSection.getRelocatedValue(4, DataOffset);
184   if (!StringOffset)
185     return false; // End of list
186 
187   DictScope NameScope(W, ("Name@0x" + Twine::utohexstr(NameOffset)).str());
188   W.startLine() << format("String: 0x%08" PRIx64, StringOffset);
189   W.getOStream() << " \"" << StringSection.getCStr(&StringOffset) << "\"\n";
190 
191   unsigned NumData = AccelSection.getU32(DataOffset);
192   for (unsigned Data = 0; Data < NumData; ++Data) {
193     ListScope DataScope(W, ("Data " + Twine(Data)).str());
194     unsigned i = 0;
195     for (auto &Atom : AtomForms) {
196       W.startLine() << format("Atom[%d]: ", i);
197       if (Atom.extractValue(AccelSection, DataOffset, FormParams)) {
198         Atom.dump(W.getOStream());
199         if (std::optional<uint64_t> Val = Atom.getAsUnsignedConstant()) {
200           StringRef Str = dwarf::AtomValueString(HdrData.Atoms[i].first, *Val);
201           if (!Str.empty())
202             W.getOStream() << " (" << Str << ")";
203         }
204       } else
205         W.getOStream() << "Error extracting the value";
206       W.getOStream() << "\n";
207       i++;
208     }
209   }
210   return true; // more entries follow
211 }
212 
213 LLVM_DUMP_METHOD void AppleAcceleratorTable::dump(raw_ostream &OS) const {
214   if (!IsValid)
215     return;
216 
217   ScopedPrinter W(OS);
218 
219   Hdr.dump(W);
220 
221   W.printNumber("DIE offset base", HdrData.DIEOffsetBase);
222   W.printNumber("Number of atoms", uint64_t(HdrData.Atoms.size()));
223   W.printNumber("Size of each hash data entry", getHashDataEntryLength());
224   SmallVector<DWARFFormValue, 3> AtomForms;
225   {
226     ListScope AtomsScope(W, "Atoms");
227     unsigned i = 0;
228     for (const auto &Atom : HdrData.Atoms) {
229       DictScope AtomScope(W, ("Atom " + Twine(i++)).str());
230       W.startLine() << "Type: " << formatAtom(Atom.first) << '\n';
231       W.startLine() << "Form: " << formatv("{0}", Atom.second) << '\n';
232       AtomForms.push_back(DWARFFormValue(Atom.second));
233     }
234   }
235 
236   // Now go through the actual tables and dump them.
237   uint64_t Offset = sizeof(Hdr) + Hdr.HeaderDataLength;
238   uint64_t HashesBase = Offset + Hdr.BucketCount * 4;
239   uint64_t OffsetsBase = HashesBase + Hdr.HashCount * 4;
240 
241   for (unsigned Bucket = 0; Bucket < Hdr.BucketCount; ++Bucket) {
242     unsigned Index = AccelSection.getU32(&Offset);
243 
244     ListScope BucketScope(W, ("Bucket " + Twine(Bucket)).str());
245     if (Index == UINT32_MAX) {
246       W.printString("EMPTY");
247       continue;
248     }
249 
250     for (unsigned HashIdx = Index; HashIdx < Hdr.HashCount; ++HashIdx) {
251       uint64_t HashOffset = HashesBase + HashIdx*4;
252       uint64_t OffsetsOffset = OffsetsBase + HashIdx*4;
253       uint32_t Hash = AccelSection.getU32(&HashOffset);
254 
255       if (Hash % Hdr.BucketCount != Bucket)
256         break;
257 
258       uint64_t DataOffset = AccelSection.getU32(&OffsetsOffset);
259       ListScope HashScope(W, ("Hash 0x" + Twine::utohexstr(Hash)).str());
260       if (!AccelSection.isValidOffset(DataOffset)) {
261         W.printString("Invalid section offset");
262         continue;
263       }
264       while (dumpName(W, AtomForms, &DataOffset))
265         /*empty*/;
266     }
267   }
268 }
269 
270 AppleAcceleratorTable::Entry::Entry(const AppleAcceleratorTable &Table)
271     : Table(Table) {
272   Values.reserve(Table.HdrData.Atoms.size());
273   for (const auto &Atom : Table.HdrData.Atoms)
274     Values.push_back(DWARFFormValue(Atom.second));
275 }
276 
277 void AppleAcceleratorTable::Entry::extract(uint64_t *Offset) {
278   for (auto &FormValue : Values)
279     FormValue.extractValue(Table.AccelSection, Offset, Table.FormParams);
280 }
281 
282 std::optional<DWARFFormValue>
283 AppleAcceleratorTable::Entry::lookup(HeaderData::AtomType AtomToFind) const {
284   for (auto [Atom, FormValue] : zip_equal(Table.HdrData.Atoms, Values))
285     if (Atom.first == AtomToFind)
286       return FormValue;
287   return std::nullopt;
288 }
289 
290 std::optional<uint64_t>
291 AppleAcceleratorTable::Entry::getDIESectionOffset() const {
292   return Table.HdrData.extractOffset(lookup(dwarf::DW_ATOM_die_offset));
293 }
294 
295 std::optional<uint64_t> AppleAcceleratorTable::Entry::getCUOffset() const {
296   return Table.HdrData.extractOffset(lookup(dwarf::DW_ATOM_cu_offset));
297 }
298 
299 std::optional<dwarf::Tag> AppleAcceleratorTable::Entry::getTag() const {
300   std::optional<DWARFFormValue> Tag = lookup(dwarf::DW_ATOM_die_tag);
301   if (!Tag)
302     return std::nullopt;
303   if (std::optional<uint64_t> Value = Tag->getAsUnsignedConstant())
304     return dwarf::Tag(*Value);
305   return std::nullopt;
306 }
307 
308 AppleAcceleratorTable::SameNameIterator::SameNameIterator(
309     const AppleAcceleratorTable &AccelTable, uint64_t DataOffset)
310     : Current(AccelTable), Offset(DataOffset) {}
311 
312 void AppleAcceleratorTable::Iterator::prepareNextEntryOrEnd() {
313   if (NumEntriesToCome == 0)
314     prepareNextStringOrEnd();
315   if (isEnd())
316     return;
317   uint64_t OffsetCopy = Offset;
318   Current.BaseEntry.extract(&OffsetCopy);
319   NumEntriesToCome--;
320   Offset += getTable().getHashDataEntryLength();
321 }
322 
323 void AppleAcceleratorTable::Iterator::prepareNextStringOrEnd() {
324   std::optional<uint32_t> StrOffset = getTable().readStringOffsetAt(Offset);
325   if (!StrOffset)
326     return setToEnd();
327 
328   // A zero denotes the end of the collision list. Read the next string
329   // again.
330   if (*StrOffset == 0)
331     return prepareNextStringOrEnd();
332   Current.StrOffset = *StrOffset;
333 
334   std::optional<uint32_t> MaybeNumEntries = getTable().readU32FromAccel(Offset);
335   if (!MaybeNumEntries || *MaybeNumEntries == 0)
336     return setToEnd();
337   NumEntriesToCome = *MaybeNumEntries;
338 }
339 
340 AppleAcceleratorTable::Iterator::Iterator(const AppleAcceleratorTable &Table,
341                                           bool SetEnd)
342     : Current(Table), Offset(Table.getEntriesBase()), NumEntriesToCome(0) {
343   if (SetEnd)
344     setToEnd();
345   else
346     prepareNextEntryOrEnd();
347 }
348 
349 iterator_range<AppleAcceleratorTable::SameNameIterator>
350 AppleAcceleratorTable::equal_range(StringRef Key) const {
351   const auto EmptyRange =
352       make_range(SameNameIterator(*this, 0), SameNameIterator(*this, 0));
353   if (!IsValid)
354     return EmptyRange;
355 
356   // Find the bucket.
357   uint32_t SearchHash = djbHash(Key);
358   uint32_t BucketIdx = hashToBucketIdx(SearchHash);
359   std::optional<uint32_t> HashIdx = idxOfHashInBucket(SearchHash, BucketIdx);
360   if (!HashIdx)
361     return EmptyRange;
362 
363   std::optional<uint64_t> MaybeDataOffset = readIthOffset(*HashIdx);
364   if (!MaybeDataOffset)
365     return EmptyRange;
366 
367   uint64_t DataOffset = *MaybeDataOffset;
368   if (DataOffset >= AccelSection.size())
369     return EmptyRange;
370 
371   std::optional<uint32_t> StrOffset = readStringOffsetAt(DataOffset);
372   // Valid input and still have strings in this hash.
373   while (StrOffset && *StrOffset) {
374     std::optional<StringRef> MaybeStr = readStringFromStrSection(*StrOffset);
375     std::optional<uint32_t> NumEntries = this->readU32FromAccel(DataOffset);
376     if (!MaybeStr || !NumEntries)
377       return EmptyRange;
378     uint64_t EndOffset = DataOffset + *NumEntries * getHashDataEntryLength();
379     if (Key == *MaybeStr)
380       return make_range({*this, DataOffset},
381                         SameNameIterator{*this, EndOffset});
382     DataOffset = EndOffset;
383     StrOffset = readStringOffsetAt(DataOffset);
384   }
385 
386   return EmptyRange;
387 }
388 
389 std::optional<uint32_t>
390 AppleAcceleratorTable::idxOfHashInBucket(uint32_t HashToFind,
391                                          uint32_t BucketIdx) const {
392   std::optional<uint32_t> HashStartIdx = readIthBucket(BucketIdx);
393   if (!HashStartIdx)
394     return std::nullopt;
395 
396   for (uint32_t HashIdx = *HashStartIdx; HashIdx < getNumHashes(); HashIdx++) {
397     std::optional<uint32_t> MaybeHash = readIthHash(HashIdx);
398     if (!MaybeHash || !wouldHashBeInBucket(*MaybeHash, BucketIdx))
399       break;
400     if (*MaybeHash == HashToFind)
401       return HashIdx;
402   }
403   return std::nullopt;
404 }
405 
406 std::optional<StringRef> AppleAcceleratorTable::readStringFromStrSection(
407     uint64_t StringSectionOffset) const {
408   Error E = Error::success();
409   StringRef Str = StringSection.getCStrRef(&StringSectionOffset, &E);
410   if (E) {
411     consumeError(std::move(E));
412     return std::nullopt;
413   }
414   return Str;
415 }
416 
417 std::optional<uint32_t>
418 AppleAcceleratorTable::readU32FromAccel(uint64_t &Offset,
419                                         bool UseRelocation) const {
420   Error E = Error::success();
421   uint32_t Data = UseRelocation
422                       ? AccelSection.getRelocatedValue(4, &Offset, nullptr, &E)
423                       : AccelSection.getU32(&Offset, &E);
424   if (E) {
425     consumeError(std::move(E));
426     return std::nullopt;
427   }
428   return Data;
429 }
430 
431 void DWARFDebugNames::Header::dump(ScopedPrinter &W) const {
432   DictScope HeaderScope(W, "Header");
433   W.printHex("Length", UnitLength);
434   W.printString("Format", dwarf::FormatString(Format));
435   W.printNumber("Version", Version);
436   W.printNumber("CU count", CompUnitCount);
437   W.printNumber("Local TU count", LocalTypeUnitCount);
438   W.printNumber("Foreign TU count", ForeignTypeUnitCount);
439   W.printNumber("Bucket count", BucketCount);
440   W.printNumber("Name count", NameCount);
441   W.printHex("Abbreviations table size", AbbrevTableSize);
442   W.startLine() << "Augmentation: '" << AugmentationString << "'\n";
443 }
444 
445 Error DWARFDebugNames::Header::extract(const DWARFDataExtractor &AS,
446                                              uint64_t *Offset) {
447   auto HeaderError = [Offset = *Offset](Error E) {
448     return createStringError(errc::illegal_byte_sequence,
449                              "parsing .debug_names header at 0x%" PRIx64 ": %s",
450                              Offset, toString(std::move(E)).c_str());
451   };
452 
453   DataExtractor::Cursor C(*Offset);
454   std::tie(UnitLength, Format) = AS.getInitialLength(C);
455 
456   Version = AS.getU16(C);
457   AS.skip(C, 2); // padding
458   CompUnitCount = AS.getU32(C);
459   LocalTypeUnitCount = AS.getU32(C);
460   ForeignTypeUnitCount = AS.getU32(C);
461   BucketCount = AS.getU32(C);
462   NameCount = AS.getU32(C);
463   AbbrevTableSize = AS.getU32(C);
464   AugmentationStringSize = alignTo(AS.getU32(C), 4);
465 
466   if (!C)
467     return HeaderError(C.takeError());
468 
469   if (!AS.isValidOffsetForDataOfSize(C.tell(), AugmentationStringSize))
470     return HeaderError(createStringError(errc::illegal_byte_sequence,
471                                          "cannot read header augmentation"));
472   AugmentationString.resize(AugmentationStringSize);
473   AS.getU8(C, reinterpret_cast<uint8_t *>(AugmentationString.data()),
474            AugmentationStringSize);
475   *Offset = C.tell();
476   return C.takeError();
477 }
478 
479 void DWARFDebugNames::Abbrev::dump(ScopedPrinter &W) const {
480   DictScope AbbrevScope(W, ("Abbreviation 0x" + Twine::utohexstr(Code)).str());
481   W.startLine() << formatv("Tag: {0}\n", Tag);
482 
483   for (const auto &Attr : Attributes)
484     W.startLine() << formatv("{0}: {1}\n", Attr.Index, Attr.Form);
485 }
486 
487 static constexpr DWARFDebugNames::AttributeEncoding sentinelAttrEnc() {
488   return {dwarf::Index(0), dwarf::Form(0)};
489 }
490 
491 static bool isSentinel(const DWARFDebugNames::AttributeEncoding &AE) {
492   return AE == sentinelAttrEnc();
493 }
494 
495 static DWARFDebugNames::Abbrev sentinelAbbrev() {
496   return DWARFDebugNames::Abbrev(0, dwarf::Tag(0), {});
497 }
498 
499 static bool isSentinel(const DWARFDebugNames::Abbrev &Abbr) {
500   return Abbr.Code == 0;
501 }
502 
503 DWARFDebugNames::Abbrev DWARFDebugNames::AbbrevMapInfo::getEmptyKey() {
504   return sentinelAbbrev();
505 }
506 
507 DWARFDebugNames::Abbrev DWARFDebugNames::AbbrevMapInfo::getTombstoneKey() {
508   return DWARFDebugNames::Abbrev(~0, dwarf::Tag(0), {});
509 }
510 
511 Expected<DWARFDebugNames::AttributeEncoding>
512 DWARFDebugNames::NameIndex::extractAttributeEncoding(uint64_t *Offset) {
513   if (*Offset >= EntriesBase) {
514     return createStringError(errc::illegal_byte_sequence,
515                              "Incorrectly terminated abbreviation table.");
516   }
517 
518   uint32_t Index = Section.AccelSection.getULEB128(Offset);
519   uint32_t Form = Section.AccelSection.getULEB128(Offset);
520   return AttributeEncoding(dwarf::Index(Index), dwarf::Form(Form));
521 }
522 
523 Expected<std::vector<DWARFDebugNames::AttributeEncoding>>
524 DWARFDebugNames::NameIndex::extractAttributeEncodings(uint64_t *Offset) {
525   std::vector<AttributeEncoding> Result;
526   for (;;) {
527     auto AttrEncOr = extractAttributeEncoding(Offset);
528     if (!AttrEncOr)
529       return AttrEncOr.takeError();
530     if (isSentinel(*AttrEncOr))
531       return std::move(Result);
532 
533     Result.emplace_back(*AttrEncOr);
534   }
535 }
536 
537 Expected<DWARFDebugNames::Abbrev>
538 DWARFDebugNames::NameIndex::extractAbbrev(uint64_t *Offset) {
539   if (*Offset >= EntriesBase) {
540     return createStringError(errc::illegal_byte_sequence,
541                              "Incorrectly terminated abbreviation table.");
542   }
543 
544   uint32_t Code = Section.AccelSection.getULEB128(Offset);
545   if (Code == 0)
546     return sentinelAbbrev();
547 
548   uint32_t Tag = Section.AccelSection.getULEB128(Offset);
549   auto AttrEncOr = extractAttributeEncodings(Offset);
550   if (!AttrEncOr)
551     return AttrEncOr.takeError();
552   return Abbrev(Code, dwarf::Tag(Tag), std::move(*AttrEncOr));
553 }
554 
555 Error DWARFDebugNames::NameIndex::extract() {
556   const DWARFDataExtractor &AS = Section.AccelSection;
557   uint64_t Offset = Base;
558   if (Error E = Hdr.extract(AS, &Offset))
559     return E;
560 
561   const unsigned SectionOffsetSize = dwarf::getDwarfOffsetByteSize(Hdr.Format);
562   CUsBase = Offset;
563   Offset += Hdr.CompUnitCount * SectionOffsetSize;
564   Offset += Hdr.LocalTypeUnitCount * SectionOffsetSize;
565   Offset += Hdr.ForeignTypeUnitCount * 8;
566   BucketsBase = Offset;
567   Offset += Hdr.BucketCount * 4;
568   HashesBase = Offset;
569   if (Hdr.BucketCount > 0)
570     Offset += Hdr.NameCount * 4;
571   StringOffsetsBase = Offset;
572   Offset += Hdr.NameCount * SectionOffsetSize;
573   EntryOffsetsBase = Offset;
574   Offset += Hdr.NameCount * SectionOffsetSize;
575 
576   if (!AS.isValidOffsetForDataOfSize(Offset, Hdr.AbbrevTableSize))
577     return createStringError(errc::illegal_byte_sequence,
578                              "Section too small: cannot read abbreviations.");
579 
580   EntriesBase = Offset + Hdr.AbbrevTableSize;
581 
582   for (;;) {
583     auto AbbrevOr = extractAbbrev(&Offset);
584     if (!AbbrevOr)
585       return AbbrevOr.takeError();
586     if (isSentinel(*AbbrevOr))
587       return Error::success();
588 
589     if (!Abbrevs.insert(std::move(*AbbrevOr)).second)
590       return createStringError(errc::invalid_argument,
591                                "Duplicate abbreviation code.");
592   }
593 }
594 
595 DWARFDebugNames::Entry::Entry(const NameIndex &NameIdx, const Abbrev &Abbr)
596     : NameIdx(&NameIdx), Abbr(&Abbr) {
597   // This merely creates form values. It is up to the caller
598   // (NameIndex::getEntry) to populate them.
599   Values.reserve(Abbr.Attributes.size());
600   for (const auto &Attr : Abbr.Attributes)
601     Values.emplace_back(Attr.Form);
602 }
603 
604 std::optional<DWARFFormValue>
605 DWARFDebugNames::Entry::lookup(dwarf::Index Index) const {
606   assert(Abbr->Attributes.size() == Values.size());
607   for (auto Tuple : zip_first(Abbr->Attributes, Values)) {
608     if (std::get<0>(Tuple).Index == Index)
609       return std::get<1>(Tuple);
610   }
611   return std::nullopt;
612 }
613 
614 std::optional<uint64_t> DWARFDebugNames::Entry::getDIEUnitOffset() const {
615   if (std::optional<DWARFFormValue> Off = lookup(dwarf::DW_IDX_die_offset))
616     return Off->getAsReferenceUVal();
617   return std::nullopt;
618 }
619 
620 std::optional<uint64_t> DWARFDebugNames::Entry::getCUIndex() const {
621   if (std::optional<DWARFFormValue> Off = lookup(dwarf::DW_IDX_compile_unit))
622     return Off->getAsUnsignedConstant();
623   // In a per-CU index, the entries without a DW_IDX_compile_unit attribute
624   // implicitly refer to the single CU, but only if we don't have a
625   // DW_IDX_type_unit.
626   if (lookup(dwarf::DW_IDX_type_unit).has_value())
627     return std::nullopt;
628   if (NameIdx->getCUCount() == 1)
629     return 0;
630   return std::nullopt;
631 }
632 
633 std::optional<uint64_t> DWARFDebugNames::Entry::getCUOffset() const {
634   std::optional<uint64_t> Index = getCUIndex();
635   if (!Index || *Index >= NameIdx->getCUCount())
636     return std::nullopt;
637   return NameIdx->getCUOffset(*Index);
638 }
639 
640 std::optional<uint64_t> DWARFDebugNames::Entry::getLocalTUOffset() const {
641   std::optional<uint64_t> Index = getLocalTUIndex();
642   if (!Index || *Index >= NameIdx->getLocalTUCount())
643     return std::nullopt;
644   return NameIdx->getLocalTUOffset(*Index);
645 }
646 
647 std::optional<uint64_t> DWARFDebugNames::Entry::getLocalTUIndex() const {
648   if (std::optional<DWARFFormValue> Off = lookup(dwarf::DW_IDX_type_unit))
649     return Off->getAsUnsignedConstant();
650   return std::nullopt;
651 }
652 
653 void DWARFDebugNames::Entry::dump(ScopedPrinter &W) const {
654   W.startLine() << formatv("Abbrev: {0:x}\n", Abbr->Code);
655   W.startLine() << formatv("Tag: {0}\n", Abbr->Tag);
656   assert(Abbr->Attributes.size() == Values.size());
657   for (auto Tuple : zip_first(Abbr->Attributes, Values)) {
658     W.startLine() << formatv("{0}: ", std::get<0>(Tuple).Index);
659     std::get<1>(Tuple).dump(W.getOStream());
660     W.getOStream() << '\n';
661   }
662 }
663 
664 char DWARFDebugNames::SentinelError::ID;
665 std::error_code DWARFDebugNames::SentinelError::convertToErrorCode() const {
666   return inconvertibleErrorCode();
667 }
668 
669 uint64_t DWARFDebugNames::NameIndex::getCUOffset(uint32_t CU) const {
670   assert(CU < Hdr.CompUnitCount);
671   const unsigned SectionOffsetSize = dwarf::getDwarfOffsetByteSize(Hdr.Format);
672   uint64_t Offset = CUsBase + SectionOffsetSize * CU;
673   return Section.AccelSection.getRelocatedValue(SectionOffsetSize, &Offset);
674 }
675 
676 uint64_t DWARFDebugNames::NameIndex::getLocalTUOffset(uint32_t TU) const {
677   assert(TU < Hdr.LocalTypeUnitCount);
678   const unsigned SectionOffsetSize = dwarf::getDwarfOffsetByteSize(Hdr.Format);
679   uint64_t Offset = CUsBase + SectionOffsetSize * (Hdr.CompUnitCount + TU);
680   return Section.AccelSection.getRelocatedValue(SectionOffsetSize, &Offset);
681 }
682 
683 uint64_t DWARFDebugNames::NameIndex::getForeignTUSignature(uint32_t TU) const {
684   assert(TU < Hdr.ForeignTypeUnitCount);
685   const unsigned SectionOffsetSize = dwarf::getDwarfOffsetByteSize(Hdr.Format);
686   uint64_t Offset =
687       CUsBase +
688       SectionOffsetSize * (Hdr.CompUnitCount + Hdr.LocalTypeUnitCount) + 8 * TU;
689   return Section.AccelSection.getU64(&Offset);
690 }
691 
692 Expected<DWARFDebugNames::Entry>
693 DWARFDebugNames::NameIndex::getEntry(uint64_t *Offset) const {
694   const DWARFDataExtractor &AS = Section.AccelSection;
695   if (!AS.isValidOffset(*Offset))
696     return createStringError(errc::illegal_byte_sequence,
697                              "Incorrectly terminated entry list.");
698 
699   uint32_t AbbrevCode = AS.getULEB128(Offset);
700   if (AbbrevCode == 0)
701     return make_error<SentinelError>();
702 
703   const auto AbbrevIt = Abbrevs.find_as(AbbrevCode);
704   if (AbbrevIt == Abbrevs.end())
705     return createStringError(errc::invalid_argument, "Invalid abbreviation.");
706 
707   Entry E(*this, *AbbrevIt);
708 
709   dwarf::FormParams FormParams = {Hdr.Version, 0, Hdr.Format};
710   for (auto &Value : E.Values) {
711     if (!Value.extractValue(AS, Offset, FormParams))
712       return createStringError(errc::io_error,
713                                "Error extracting index attribute values.");
714   }
715   return std::move(E);
716 }
717 
718 DWARFDebugNames::NameTableEntry
719 DWARFDebugNames::NameIndex::getNameTableEntry(uint32_t Index) const {
720   assert(0 < Index && Index <= Hdr.NameCount);
721   const unsigned SectionOffsetSize = dwarf::getDwarfOffsetByteSize(Hdr.Format);
722   uint64_t StringOffsetOffset =
723       StringOffsetsBase + SectionOffsetSize * (Index - 1);
724   uint64_t EntryOffsetOffset =
725       EntryOffsetsBase + SectionOffsetSize * (Index - 1);
726   const DWARFDataExtractor &AS = Section.AccelSection;
727 
728   uint64_t StringOffset =
729       AS.getRelocatedValue(SectionOffsetSize, &StringOffsetOffset);
730   uint64_t EntryOffset = AS.getUnsigned(&EntryOffsetOffset, SectionOffsetSize);
731   EntryOffset += EntriesBase;
732   return {Section.StringSection, Index, StringOffset, EntryOffset};
733 }
734 
735 uint32_t
736 DWARFDebugNames::NameIndex::getBucketArrayEntry(uint32_t Bucket) const {
737   assert(Bucket < Hdr.BucketCount);
738   uint64_t BucketOffset = BucketsBase + 4 * Bucket;
739   return Section.AccelSection.getU32(&BucketOffset);
740 }
741 
742 uint32_t DWARFDebugNames::NameIndex::getHashArrayEntry(uint32_t Index) const {
743   assert(0 < Index && Index <= Hdr.NameCount);
744   uint64_t HashOffset = HashesBase + 4 * (Index - 1);
745   return Section.AccelSection.getU32(&HashOffset);
746 }
747 
748 // Returns true if we should continue scanning for entries, false if this is the
749 // last (sentinel) entry). In case of a parsing error we also return false, as
750 // it's not possible to recover this entry list (but the other lists may still
751 // parse OK).
752 bool DWARFDebugNames::NameIndex::dumpEntry(ScopedPrinter &W,
753                                            uint64_t *Offset) const {
754   uint64_t EntryId = *Offset;
755   auto EntryOr = getEntry(Offset);
756   if (!EntryOr) {
757     handleAllErrors(EntryOr.takeError(), [](const SentinelError &) {},
758                     [&W](const ErrorInfoBase &EI) { EI.log(W.startLine()); });
759     return false;
760   }
761 
762   DictScope EntryScope(W, ("Entry @ 0x" + Twine::utohexstr(EntryId)).str());
763   EntryOr->dump(W);
764   return true;
765 }
766 
767 void DWARFDebugNames::NameIndex::dumpName(ScopedPrinter &W,
768                                           const NameTableEntry &NTE,
769                                           std::optional<uint32_t> Hash) const {
770   DictScope NameScope(W, ("Name " + Twine(NTE.getIndex())).str());
771   if (Hash)
772     W.printHex("Hash", *Hash);
773 
774   W.startLine() << format("String: 0x%08" PRIx64, NTE.getStringOffset());
775   W.getOStream() << " \"" << NTE.getString() << "\"\n";
776 
777   uint64_t EntryOffset = NTE.getEntryOffset();
778   while (dumpEntry(W, &EntryOffset))
779     /*empty*/;
780 }
781 
782 void DWARFDebugNames::NameIndex::dumpCUs(ScopedPrinter &W) const {
783   ListScope CUScope(W, "Compilation Unit offsets");
784   for (uint32_t CU = 0; CU < Hdr.CompUnitCount; ++CU)
785     W.startLine() << format("CU[%u]: 0x%08" PRIx64 "\n", CU, getCUOffset(CU));
786 }
787 
788 void DWARFDebugNames::NameIndex::dumpLocalTUs(ScopedPrinter &W) const {
789   if (Hdr.LocalTypeUnitCount == 0)
790     return;
791 
792   ListScope TUScope(W, "Local Type Unit offsets");
793   for (uint32_t TU = 0; TU < Hdr.LocalTypeUnitCount; ++TU)
794     W.startLine() << format("LocalTU[%u]: 0x%08" PRIx64 "\n", TU,
795                             getLocalTUOffset(TU));
796 }
797 
798 void DWARFDebugNames::NameIndex::dumpForeignTUs(ScopedPrinter &W) const {
799   if (Hdr.ForeignTypeUnitCount == 0)
800     return;
801 
802   ListScope TUScope(W, "Foreign Type Unit signatures");
803   for (uint32_t TU = 0; TU < Hdr.ForeignTypeUnitCount; ++TU) {
804     W.startLine() << format("ForeignTU[%u]: 0x%016" PRIx64 "\n", TU,
805                             getForeignTUSignature(TU));
806   }
807 }
808 
809 void DWARFDebugNames::NameIndex::dumpAbbreviations(ScopedPrinter &W) const {
810   ListScope AbbrevsScope(W, "Abbreviations");
811   for (const auto &Abbr : Abbrevs)
812     Abbr.dump(W);
813 }
814 
815 void DWARFDebugNames::NameIndex::dumpBucket(ScopedPrinter &W,
816                                             uint32_t Bucket) const {
817   ListScope BucketScope(W, ("Bucket " + Twine(Bucket)).str());
818   uint32_t Index = getBucketArrayEntry(Bucket);
819   if (Index == 0) {
820     W.printString("EMPTY");
821     return;
822   }
823   if (Index > Hdr.NameCount) {
824     W.printString("Name index is invalid");
825     return;
826   }
827 
828   for (; Index <= Hdr.NameCount; ++Index) {
829     uint32_t Hash = getHashArrayEntry(Index);
830     if (Hash % Hdr.BucketCount != Bucket)
831       break;
832 
833     dumpName(W, getNameTableEntry(Index), Hash);
834   }
835 }
836 
837 LLVM_DUMP_METHOD void DWARFDebugNames::NameIndex::dump(ScopedPrinter &W) const {
838   DictScope UnitScope(W, ("Name Index @ 0x" + Twine::utohexstr(Base)).str());
839   Hdr.dump(W);
840   dumpCUs(W);
841   dumpLocalTUs(W);
842   dumpForeignTUs(W);
843   dumpAbbreviations(W);
844 
845   if (Hdr.BucketCount > 0) {
846     for (uint32_t Bucket = 0; Bucket < Hdr.BucketCount; ++Bucket)
847       dumpBucket(W, Bucket);
848     return;
849   }
850 
851   W.startLine() << "Hash table not present\n";
852   for (const NameTableEntry &NTE : *this)
853     dumpName(W, NTE, std::nullopt);
854 }
855 
856 Error DWARFDebugNames::extract() {
857   uint64_t Offset = 0;
858   while (AccelSection.isValidOffset(Offset)) {
859     NameIndex Next(*this, Offset);
860     if (Error E = Next.extract())
861       return E;
862     Offset = Next.getNextUnitOffset();
863     NameIndices.push_back(std::move(Next));
864   }
865   return Error::success();
866 }
867 
868 iterator_range<DWARFDebugNames::ValueIterator>
869 DWARFDebugNames::NameIndex::equal_range(StringRef Key) const {
870   return make_range(ValueIterator(*this, Key), ValueIterator());
871 }
872 
873 LLVM_DUMP_METHOD void DWARFDebugNames::dump(raw_ostream &OS) const {
874   ScopedPrinter W(OS);
875   for (const NameIndex &NI : NameIndices)
876     NI.dump(W);
877 }
878 
879 std::optional<uint64_t>
880 DWARFDebugNames::ValueIterator::findEntryOffsetInCurrentIndex() {
881   const Header &Hdr = CurrentIndex->Hdr;
882   if (Hdr.BucketCount == 0) {
883     // No Hash Table, We need to search through all names in the Name Index.
884     for (const NameTableEntry &NTE : *CurrentIndex) {
885       if (NTE.getString() == Key)
886         return NTE.getEntryOffset();
887     }
888     return std::nullopt;
889   }
890 
891   // The Name Index has a Hash Table, so use that to speed up the search.
892   // Compute the Key Hash, if it has not been done already.
893   if (!Hash)
894     Hash = caseFoldingDjbHash(Key);
895   uint32_t Bucket = *Hash % Hdr.BucketCount;
896   uint32_t Index = CurrentIndex->getBucketArrayEntry(Bucket);
897   if (Index == 0)
898     return std::nullopt; // Empty bucket
899 
900   for (; Index <= Hdr.NameCount; ++Index) {
901     uint32_t Hash = CurrentIndex->getHashArrayEntry(Index);
902     if (Hash % Hdr.BucketCount != Bucket)
903       return std::nullopt; // End of bucket
904 
905     NameTableEntry NTE = CurrentIndex->getNameTableEntry(Index);
906     if (NTE.getString() == Key)
907       return NTE.getEntryOffset();
908   }
909   return std::nullopt;
910 }
911 
912 bool DWARFDebugNames::ValueIterator::getEntryAtCurrentOffset() {
913   auto EntryOr = CurrentIndex->getEntry(&DataOffset);
914   if (!EntryOr) {
915     consumeError(EntryOr.takeError());
916     return false;
917   }
918   CurrentEntry = std::move(*EntryOr);
919   return true;
920 }
921 
922 bool DWARFDebugNames::ValueIterator::findInCurrentIndex() {
923   std::optional<uint64_t> Offset = findEntryOffsetInCurrentIndex();
924   if (!Offset)
925     return false;
926   DataOffset = *Offset;
927   return getEntryAtCurrentOffset();
928 }
929 
930 void DWARFDebugNames::ValueIterator::searchFromStartOfCurrentIndex() {
931   for (const NameIndex *End = CurrentIndex->Section.NameIndices.end();
932        CurrentIndex != End; ++CurrentIndex) {
933     if (findInCurrentIndex())
934       return;
935   }
936   setEnd();
937 }
938 
939 void DWARFDebugNames::ValueIterator::next() {
940   assert(CurrentIndex && "Incrementing an end() iterator?");
941 
942   // First try the next entry in the current Index.
943   if (getEntryAtCurrentOffset())
944     return;
945 
946   // If we're a local iterator or we have reached the last Index, we're done.
947   if (IsLocal || CurrentIndex == &CurrentIndex->Section.NameIndices.back()) {
948     setEnd();
949     return;
950   }
951 
952   // Otherwise, try the next index.
953   ++CurrentIndex;
954   searchFromStartOfCurrentIndex();
955 }
956 
957 DWARFDebugNames::ValueIterator::ValueIterator(const DWARFDebugNames &AccelTable,
958                                               StringRef Key)
959     : CurrentIndex(AccelTable.NameIndices.begin()), IsLocal(false),
960       Key(std::string(Key)) {
961   searchFromStartOfCurrentIndex();
962 }
963 
964 DWARFDebugNames::ValueIterator::ValueIterator(
965     const DWARFDebugNames::NameIndex &NI, StringRef Key)
966     : CurrentIndex(&NI), IsLocal(true), Key(std::string(Key)) {
967   if (!findInCurrentIndex())
968     setEnd();
969 }
970 
971 iterator_range<DWARFDebugNames::ValueIterator>
972 DWARFDebugNames::equal_range(StringRef Key) const {
973   if (NameIndices.empty())
974     return make_range(ValueIterator(), ValueIterator());
975   return make_range(ValueIterator(*this, Key), ValueIterator());
976 }
977 
978 const DWARFDebugNames::NameIndex *
979 DWARFDebugNames::getCUNameIndex(uint64_t CUOffset) {
980   if (CUToNameIndex.size() == 0 && NameIndices.size() > 0) {
981     for (const auto &NI : *this) {
982       for (uint32_t CU = 0; CU < NI.getCUCount(); ++CU)
983         CUToNameIndex.try_emplace(NI.getCUOffset(CU), &NI);
984     }
985   }
986   return CUToNameIndex.lookup(CUOffset);
987 }
988 
989 static bool isObjCSelector(StringRef Name) {
990   return Name.size() > 2 && (Name[0] == '-' || Name[0] == '+') &&
991          (Name[1] == '[');
992 }
993 
994 std::optional<ObjCSelectorNames> llvm::getObjCNamesIfSelector(StringRef Name) {
995   if (!isObjCSelector(Name))
996     return std::nullopt;
997   // "-[Atom setMass:]"
998   StringRef ClassNameStart(Name.drop_front(2));
999   size_t FirstSpace = ClassNameStart.find(' ');
1000   if (FirstSpace == StringRef::npos)
1001     return std::nullopt;
1002 
1003   StringRef SelectorStart = ClassNameStart.drop_front(FirstSpace + 1);
1004   if (!SelectorStart.size())
1005     return std::nullopt;
1006 
1007   ObjCSelectorNames Ans;
1008   Ans.ClassName = ClassNameStart.take_front(FirstSpace);
1009   Ans.Selector = SelectorStart.drop_back(); // drop ']';
1010 
1011   // "-[Class(Category) selector :withArg ...]"
1012   if (Ans.ClassName.back() == ')') {
1013     size_t OpenParens = Ans.ClassName.find('(');
1014     if (OpenParens != StringRef::npos) {
1015       Ans.ClassNameNoCategory = Ans.ClassName.take_front(OpenParens);
1016 
1017       Ans.MethodNameNoCategory = Name.take_front(OpenParens + 2);
1018       // FIXME: The missing space here may be a bug, but dsymutil-classic also
1019       // does it this way.
1020       append_range(*Ans.MethodNameNoCategory, SelectorStart);
1021     }
1022   }
1023   return Ans;
1024 }
1025 
1026 std::optional<StringRef> llvm::StripTemplateParameters(StringRef Name) {
1027   // We are looking for template parameters to strip from Name. e.g.
1028   //
1029   //  operator<<B>
1030   //
1031   // We look for > at the end but if it does not contain any < then we
1032   // have something like operator>>. We check for the operator<=> case.
1033   if (!Name.ends_with(">") || Name.count("<") == 0 || Name.ends_with("<=>"))
1034     return {};
1035 
1036   // How many < until we have the start of the template parameters.
1037   size_t NumLeftAnglesToSkip = 1;
1038 
1039   // If we have operator<=> then we need to skip its < as well.
1040   NumLeftAnglesToSkip += Name.count("<=>");
1041 
1042   size_t RightAngleCount = Name.count('>');
1043   size_t LeftAngleCount = Name.count('<');
1044 
1045   // If we have more < than > we have operator< or operator<<
1046   // we to account for their < as well.
1047   if (LeftAngleCount > RightAngleCount)
1048     NumLeftAnglesToSkip += LeftAngleCount - RightAngleCount;
1049 
1050   size_t StartOfTemplate = 0;
1051   while (NumLeftAnglesToSkip--)
1052     StartOfTemplate = Name.find('<', StartOfTemplate) + 1;
1053 
1054   return Name.substr(0, StartOfTemplate - 1);
1055 }
1056