1 //=== DWARFLinker.cpp -----------------------------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 9 #include "llvm/DWARFLinker/Classic/DWARFLinker.h" 10 #include "llvm/ADT/ArrayRef.h" 11 #include "llvm/ADT/BitVector.h" 12 #include "llvm/ADT/STLExtras.h" 13 #include "llvm/ADT/StringExtras.h" 14 #include "llvm/CodeGen/NonRelocatableStringpool.h" 15 #include "llvm/DWARFLinker/Classic/DWARFLinkerDeclContext.h" 16 #include "llvm/DWARFLinker/Classic/DWARFStreamer.h" 17 #include "llvm/DWARFLinker/Utils.h" 18 #include "llvm/DebugInfo/DWARF/DWARFAbbreviationDeclaration.h" 19 #include "llvm/DebugInfo/DWARF/DWARFAcceleratorTable.h" 20 #include "llvm/DebugInfo/DWARF/DWARFContext.h" 21 #include "llvm/DebugInfo/DWARF/DWARFDataExtractor.h" 22 #include "llvm/DebugInfo/DWARF/DWARFDebugLine.h" 23 #include "llvm/DebugInfo/DWARF/DWARFDebugMacro.h" 24 #include "llvm/DebugInfo/DWARF/DWARFDebugRangeList.h" 25 #include "llvm/DebugInfo/DWARF/DWARFDie.h" 26 #include "llvm/DebugInfo/DWARF/DWARFExpression.h" 27 #include "llvm/DebugInfo/DWARF/DWARFFormValue.h" 28 #include "llvm/DebugInfo/DWARF/DWARFSection.h" 29 #include "llvm/DebugInfo/DWARF/DWARFUnit.h" 30 #include "llvm/MC/MCDwarf.h" 31 #include "llvm/Support/DataExtractor.h" 32 #include "llvm/Support/Error.h" 33 #include "llvm/Support/ErrorHandling.h" 34 #include "llvm/Support/ErrorOr.h" 35 #include "llvm/Support/FormatVariadic.h" 36 #include "llvm/Support/LEB128.h" 37 #include "llvm/Support/Path.h" 38 #include "llvm/Support/ThreadPool.h" 39 #include <vector> 40 41 namespace llvm { 42 43 using namespace dwarf_linker; 44 using namespace dwarf_linker::classic; 45 46 /// Hold the input and output of the debug info size in bytes. 47 struct DebugInfoSize { 48 uint64_t Input; 49 uint64_t Output; 50 }; 51 52 /// Compute the total size of the debug info. 53 static uint64_t getDebugInfoSize(DWARFContext &Dwarf) { 54 uint64_t Size = 0; 55 for (auto &Unit : Dwarf.compile_units()) { 56 Size += Unit->getLength(); 57 } 58 return Size; 59 } 60 61 /// Similar to DWARFUnitSection::getUnitForOffset(), but returning our 62 /// CompileUnit object instead. 63 static CompileUnit *getUnitForOffset(const UnitListTy &Units, uint64_t Offset) { 64 auto CU = llvm::upper_bound( 65 Units, Offset, [](uint64_t LHS, const std::unique_ptr<CompileUnit> &RHS) { 66 return LHS < RHS->getOrigUnit().getNextUnitOffset(); 67 }); 68 return CU != Units.end() ? CU->get() : nullptr; 69 } 70 71 /// Resolve the DIE attribute reference that has been extracted in \p RefValue. 72 /// The resulting DIE might be in another CompileUnit which is stored into \p 73 /// ReferencedCU. \returns null if resolving fails for any reason. 74 DWARFDie DWARFLinker::resolveDIEReference(const DWARFFile &File, 75 const UnitListTy &Units, 76 const DWARFFormValue &RefValue, 77 const DWARFDie &DIE, 78 CompileUnit *&RefCU) { 79 assert(RefValue.isFormClass(DWARFFormValue::FC_Reference)); 80 uint64_t RefOffset = *RefValue.getAsReference(); 81 if ((RefCU = getUnitForOffset(Units, RefOffset))) 82 if (const auto RefDie = RefCU->getOrigUnit().getDIEForOffset(RefOffset)) { 83 // In a file with broken references, an attribute might point to a NULL 84 // DIE. 85 if (!RefDie.isNULL()) 86 return RefDie; 87 } 88 89 reportWarning("could not find referenced DIE", File, &DIE); 90 return DWARFDie(); 91 } 92 93 /// \returns whether the passed \a Attr type might contain a DIE reference 94 /// suitable for ODR uniquing. 95 static bool isODRAttribute(uint16_t Attr) { 96 switch (Attr) { 97 default: 98 return false; 99 case dwarf::DW_AT_type: 100 case dwarf::DW_AT_containing_type: 101 case dwarf::DW_AT_specification: 102 case dwarf::DW_AT_abstract_origin: 103 case dwarf::DW_AT_import: 104 return true; 105 } 106 llvm_unreachable("Improper attribute."); 107 } 108 109 static bool isTypeTag(uint16_t Tag) { 110 switch (Tag) { 111 case dwarf::DW_TAG_array_type: 112 case dwarf::DW_TAG_class_type: 113 case dwarf::DW_TAG_enumeration_type: 114 case dwarf::DW_TAG_pointer_type: 115 case dwarf::DW_TAG_reference_type: 116 case dwarf::DW_TAG_string_type: 117 case dwarf::DW_TAG_structure_type: 118 case dwarf::DW_TAG_subroutine_type: 119 case dwarf::DW_TAG_typedef: 120 case dwarf::DW_TAG_union_type: 121 case dwarf::DW_TAG_ptr_to_member_type: 122 case dwarf::DW_TAG_set_type: 123 case dwarf::DW_TAG_subrange_type: 124 case dwarf::DW_TAG_base_type: 125 case dwarf::DW_TAG_const_type: 126 case dwarf::DW_TAG_constant: 127 case dwarf::DW_TAG_file_type: 128 case dwarf::DW_TAG_namelist: 129 case dwarf::DW_TAG_packed_type: 130 case dwarf::DW_TAG_volatile_type: 131 case dwarf::DW_TAG_restrict_type: 132 case dwarf::DW_TAG_atomic_type: 133 case dwarf::DW_TAG_interface_type: 134 case dwarf::DW_TAG_unspecified_type: 135 case dwarf::DW_TAG_shared_type: 136 case dwarf::DW_TAG_immutable_type: 137 return true; 138 default: 139 break; 140 } 141 return false; 142 } 143 144 bool DWARFLinker::DIECloner::getDIENames(const DWARFDie &Die, 145 AttributesInfo &Info, 146 OffsetsStringPool &StringPool, 147 bool StripTemplate) { 148 // This function will be called on DIEs having low_pcs and 149 // ranges. As getting the name might be more expansive, filter out 150 // blocks directly. 151 if (Die.getTag() == dwarf::DW_TAG_lexical_block) 152 return false; 153 154 if (!Info.MangledName) 155 if (const char *MangledName = Die.getLinkageName()) 156 Info.MangledName = StringPool.getEntry(MangledName); 157 158 if (!Info.Name) 159 if (const char *Name = Die.getShortName()) 160 Info.Name = StringPool.getEntry(Name); 161 162 if (!Info.MangledName) 163 Info.MangledName = Info.Name; 164 165 if (StripTemplate && Info.Name && Info.MangledName != Info.Name) { 166 StringRef Name = Info.Name.getString(); 167 if (std::optional<StringRef> StrippedName = StripTemplateParameters(Name)) 168 Info.NameWithoutTemplate = StringPool.getEntry(*StrippedName); 169 } 170 171 return Info.Name || Info.MangledName; 172 } 173 174 /// Resolve the relative path to a build artifact referenced by DWARF by 175 /// applying DW_AT_comp_dir. 176 static void resolveRelativeObjectPath(SmallVectorImpl<char> &Buf, DWARFDie CU) { 177 sys::path::append(Buf, dwarf::toString(CU.find(dwarf::DW_AT_comp_dir), "")); 178 } 179 180 /// Collect references to parseable Swift interfaces in imported 181 /// DW_TAG_module blocks. 182 static void analyzeImportedModule( 183 const DWARFDie &DIE, CompileUnit &CU, 184 DWARFLinkerBase::SwiftInterfacesMapTy *ParseableSwiftInterfaces, 185 std::function<void(const Twine &, const DWARFDie &)> ReportWarning) { 186 if (CU.getLanguage() != dwarf::DW_LANG_Swift) 187 return; 188 189 if (!ParseableSwiftInterfaces) 190 return; 191 192 StringRef Path = dwarf::toStringRef(DIE.find(dwarf::DW_AT_LLVM_include_path)); 193 if (!Path.ends_with(".swiftinterface")) 194 return; 195 // Don't track interfaces that are part of the SDK. 196 StringRef SysRoot = dwarf::toStringRef(DIE.find(dwarf::DW_AT_LLVM_sysroot)); 197 if (SysRoot.empty()) 198 SysRoot = CU.getSysRoot(); 199 if (!SysRoot.empty() && Path.starts_with(SysRoot)) 200 return; 201 // Don't track interfaces that are part of the toolchain. 202 // For example: Swift, _Concurrency, ... 203 SmallString<128> Toolchain = guessToolchainBaseDir(SysRoot); 204 if (!Toolchain.empty() && Path.starts_with(Toolchain)) 205 return; 206 std::optional<const char *> Name = 207 dwarf::toString(DIE.find(dwarf::DW_AT_name)); 208 if (!Name) 209 return; 210 auto &Entry = (*ParseableSwiftInterfaces)[*Name]; 211 // The prepend path is applied later when copying. 212 DWARFDie CUDie = CU.getOrigUnit().getUnitDIE(); 213 SmallString<128> ResolvedPath; 214 if (sys::path::is_relative(Path)) 215 resolveRelativeObjectPath(ResolvedPath, CUDie); 216 sys::path::append(ResolvedPath, Path); 217 if (!Entry.empty() && Entry != ResolvedPath) 218 ReportWarning(Twine("Conflicting parseable interfaces for Swift Module ") + 219 *Name + ": " + Entry + " and " + Path, 220 DIE); 221 Entry = std::string(ResolvedPath); 222 } 223 224 /// The distinct types of work performed by the work loop in 225 /// analyzeContextInfo. 226 enum class ContextWorklistItemType : uint8_t { 227 AnalyzeContextInfo, 228 UpdateChildPruning, 229 UpdatePruning, 230 }; 231 232 /// This class represents an item in the work list. The type defines what kind 233 /// of work needs to be performed when processing the current item. Everything 234 /// but the Type and Die fields are optional based on the type. 235 struct ContextWorklistItem { 236 DWARFDie Die; 237 unsigned ParentIdx; 238 union { 239 CompileUnit::DIEInfo *OtherInfo; 240 DeclContext *Context; 241 }; 242 ContextWorklistItemType Type; 243 bool InImportedModule; 244 245 ContextWorklistItem(DWARFDie Die, ContextWorklistItemType T, 246 CompileUnit::DIEInfo *OtherInfo = nullptr) 247 : Die(Die), ParentIdx(0), OtherInfo(OtherInfo), Type(T), 248 InImportedModule(false) {} 249 250 ContextWorklistItem(DWARFDie Die, DeclContext *Context, unsigned ParentIdx, 251 bool InImportedModule) 252 : Die(Die), ParentIdx(ParentIdx), Context(Context), 253 Type(ContextWorklistItemType::AnalyzeContextInfo), 254 InImportedModule(InImportedModule) {} 255 }; 256 257 static bool updatePruning(const DWARFDie &Die, CompileUnit &CU, 258 uint64_t ModulesEndOffset) { 259 CompileUnit::DIEInfo &Info = CU.getInfo(Die); 260 261 // Prune this DIE if it is either a forward declaration inside a 262 // DW_TAG_module or a DW_TAG_module that contains nothing but 263 // forward declarations. 264 Info.Prune &= (Die.getTag() == dwarf::DW_TAG_module) || 265 (isTypeTag(Die.getTag()) && 266 dwarf::toUnsigned(Die.find(dwarf::DW_AT_declaration), 0)); 267 268 // Only prune forward declarations inside a DW_TAG_module for which a 269 // definition exists elsewhere. 270 if (ModulesEndOffset == 0) 271 Info.Prune &= Info.Ctxt && Info.Ctxt->getCanonicalDIEOffset(); 272 else 273 Info.Prune &= Info.Ctxt && Info.Ctxt->getCanonicalDIEOffset() > 0 && 274 Info.Ctxt->getCanonicalDIEOffset() <= ModulesEndOffset; 275 276 return Info.Prune; 277 } 278 279 static void updateChildPruning(const DWARFDie &Die, CompileUnit &CU, 280 CompileUnit::DIEInfo &ChildInfo) { 281 CompileUnit::DIEInfo &Info = CU.getInfo(Die); 282 Info.Prune &= ChildInfo.Prune; 283 } 284 285 /// Recursive helper to build the global DeclContext information and 286 /// gather the child->parent relationships in the original compile unit. 287 /// 288 /// This function uses the same work list approach as lookForDIEsToKeep. 289 /// 290 /// \return true when this DIE and all of its children are only 291 /// forward declarations to types defined in external clang modules 292 /// (i.e., forward declarations that are children of a DW_TAG_module). 293 static void analyzeContextInfo( 294 const DWARFDie &DIE, unsigned ParentIdx, CompileUnit &CU, 295 DeclContext *CurrentDeclContext, DeclContextTree &Contexts, 296 uint64_t ModulesEndOffset, 297 DWARFLinkerBase::SwiftInterfacesMapTy *ParseableSwiftInterfaces, 298 std::function<void(const Twine &, const DWARFDie &)> ReportWarning) { 299 // LIFO work list. 300 std::vector<ContextWorklistItem> Worklist; 301 Worklist.emplace_back(DIE, CurrentDeclContext, ParentIdx, false); 302 303 while (!Worklist.empty()) { 304 ContextWorklistItem Current = Worklist.back(); 305 Worklist.pop_back(); 306 307 switch (Current.Type) { 308 case ContextWorklistItemType::UpdatePruning: 309 updatePruning(Current.Die, CU, ModulesEndOffset); 310 continue; 311 case ContextWorklistItemType::UpdateChildPruning: 312 updateChildPruning(Current.Die, CU, *Current.OtherInfo); 313 continue; 314 case ContextWorklistItemType::AnalyzeContextInfo: 315 break; 316 } 317 318 unsigned Idx = CU.getOrigUnit().getDIEIndex(Current.Die); 319 CompileUnit::DIEInfo &Info = CU.getInfo(Idx); 320 321 // Clang imposes an ODR on modules(!) regardless of the language: 322 // "The module-id should consist of only a single identifier, 323 // which provides the name of the module being defined. Each 324 // module shall have a single definition." 325 // 326 // This does not extend to the types inside the modules: 327 // "[I]n C, this implies that if two structs are defined in 328 // different submodules with the same name, those two types are 329 // distinct types (but may be compatible types if their 330 // definitions match)." 331 // 332 // We treat non-C++ modules like namespaces for this reason. 333 if (Current.Die.getTag() == dwarf::DW_TAG_module && 334 Current.ParentIdx == 0 && 335 dwarf::toString(Current.Die.find(dwarf::DW_AT_name), "") != 336 CU.getClangModuleName()) { 337 Current.InImportedModule = true; 338 analyzeImportedModule(Current.Die, CU, ParseableSwiftInterfaces, 339 ReportWarning); 340 } 341 342 Info.ParentIdx = Current.ParentIdx; 343 Info.InModuleScope = CU.isClangModule() || Current.InImportedModule; 344 if (CU.hasODR() || Info.InModuleScope) { 345 if (Current.Context) { 346 auto PtrInvalidPair = Contexts.getChildDeclContext( 347 *Current.Context, Current.Die, CU, Info.InModuleScope); 348 Current.Context = PtrInvalidPair.getPointer(); 349 Info.Ctxt = 350 PtrInvalidPair.getInt() ? nullptr : PtrInvalidPair.getPointer(); 351 if (Info.Ctxt) 352 Info.Ctxt->setDefinedInClangModule(Info.InModuleScope); 353 } else 354 Info.Ctxt = Current.Context = nullptr; 355 } 356 357 Info.Prune = Current.InImportedModule; 358 // Add children in reverse order to the worklist to effectively process 359 // them in order. 360 Worklist.emplace_back(Current.Die, ContextWorklistItemType::UpdatePruning); 361 for (auto Child : reverse(Current.Die.children())) { 362 CompileUnit::DIEInfo &ChildInfo = CU.getInfo(Child); 363 Worklist.emplace_back( 364 Current.Die, ContextWorklistItemType::UpdateChildPruning, &ChildInfo); 365 Worklist.emplace_back(Child, Current.Context, Idx, 366 Current.InImportedModule); 367 } 368 } 369 } 370 371 static bool dieNeedsChildrenToBeMeaningful(uint32_t Tag) { 372 switch (Tag) { 373 default: 374 return false; 375 case dwarf::DW_TAG_class_type: 376 case dwarf::DW_TAG_common_block: 377 case dwarf::DW_TAG_lexical_block: 378 case dwarf::DW_TAG_structure_type: 379 case dwarf::DW_TAG_subprogram: 380 case dwarf::DW_TAG_subroutine_type: 381 case dwarf::DW_TAG_union_type: 382 return true; 383 } 384 llvm_unreachable("Invalid Tag"); 385 } 386 387 void DWARFLinker::cleanupAuxiliarryData(LinkContext &Context) { 388 Context.clear(); 389 390 for (DIEBlock *I : DIEBlocks) 391 I->~DIEBlock(); 392 for (DIELoc *I : DIELocs) 393 I->~DIELoc(); 394 395 DIEBlocks.clear(); 396 DIELocs.clear(); 397 DIEAlloc.Reset(); 398 } 399 400 static bool isTlsAddressCode(uint8_t DW_OP_Code) { 401 return DW_OP_Code == dwarf::DW_OP_form_tls_address || 402 DW_OP_Code == dwarf::DW_OP_GNU_push_tls_address; 403 } 404 405 std::pair<bool, std::optional<int64_t>> 406 DWARFLinker::getVariableRelocAdjustment(AddressesMap &RelocMgr, 407 const DWARFDie &DIE) { 408 assert((DIE.getTag() == dwarf::DW_TAG_variable || 409 DIE.getTag() == dwarf::DW_TAG_constant) && 410 "Wrong type of input die"); 411 412 const auto *Abbrev = DIE.getAbbreviationDeclarationPtr(); 413 414 // Check if DIE has DW_AT_location attribute. 415 DWARFUnit *U = DIE.getDwarfUnit(); 416 std::optional<uint32_t> LocationIdx = 417 Abbrev->findAttributeIndex(dwarf::DW_AT_location); 418 if (!LocationIdx) 419 return std::make_pair(false, std::nullopt); 420 421 // Get offset to the DW_AT_location attribute. 422 uint64_t AttrOffset = 423 Abbrev->getAttributeOffsetFromIndex(*LocationIdx, DIE.getOffset(), *U); 424 425 // Get value of the DW_AT_location attribute. 426 std::optional<DWARFFormValue> LocationValue = 427 Abbrev->getAttributeValueFromOffset(*LocationIdx, AttrOffset, *U); 428 if (!LocationValue) 429 return std::make_pair(false, std::nullopt); 430 431 // Check that DW_AT_location attribute is of 'exprloc' class. 432 // Handling value of location expressions for attributes of 'loclist' 433 // class is not implemented yet. 434 std::optional<ArrayRef<uint8_t>> Expr = LocationValue->getAsBlock(); 435 if (!Expr) 436 return std::make_pair(false, std::nullopt); 437 438 // Parse 'exprloc' expression. 439 DataExtractor Data(toStringRef(*Expr), U->getContext().isLittleEndian(), 440 U->getAddressByteSize()); 441 DWARFExpression Expression(Data, U->getAddressByteSize(), 442 U->getFormParams().Format); 443 444 bool HasLocationAddress = false; 445 uint64_t CurExprOffset = 0; 446 for (DWARFExpression::iterator It = Expression.begin(); 447 It != Expression.end(); ++It) { 448 DWARFExpression::iterator NextIt = It; 449 ++NextIt; 450 451 const DWARFExpression::Operation &Op = *It; 452 switch (Op.getCode()) { 453 case dwarf::DW_OP_const2u: 454 case dwarf::DW_OP_const4u: 455 case dwarf::DW_OP_const8u: 456 case dwarf::DW_OP_const2s: 457 case dwarf::DW_OP_const4s: 458 case dwarf::DW_OP_const8s: 459 if (NextIt == Expression.end() || !isTlsAddressCode(NextIt->getCode())) 460 break; 461 [[fallthrough]]; 462 case dwarf::DW_OP_addr: { 463 HasLocationAddress = true; 464 // Check relocation for the address. 465 if (std::optional<int64_t> RelocAdjustment = 466 RelocMgr.getExprOpAddressRelocAdjustment( 467 *U, Op, AttrOffset + CurExprOffset, 468 AttrOffset + Op.getEndOffset(), Options.Verbose)) 469 return std::make_pair(HasLocationAddress, *RelocAdjustment); 470 } break; 471 case dwarf::DW_OP_constx: 472 case dwarf::DW_OP_addrx: { 473 HasLocationAddress = true; 474 if (std::optional<uint64_t> AddressOffset = 475 DIE.getDwarfUnit()->getIndexedAddressOffset( 476 Op.getRawOperand(0))) { 477 // Check relocation for the address. 478 if (std::optional<int64_t> RelocAdjustment = 479 RelocMgr.getExprOpAddressRelocAdjustment( 480 *U, Op, *AddressOffset, 481 *AddressOffset + DIE.getDwarfUnit()->getAddressByteSize(), 482 Options.Verbose)) 483 return std::make_pair(HasLocationAddress, *RelocAdjustment); 484 } 485 } break; 486 default: { 487 // Nothing to do. 488 } break; 489 } 490 CurExprOffset = Op.getEndOffset(); 491 } 492 493 return std::make_pair(HasLocationAddress, std::nullopt); 494 } 495 496 /// Check if a variable describing DIE should be kept. 497 /// \returns updated TraversalFlags. 498 unsigned DWARFLinker::shouldKeepVariableDIE(AddressesMap &RelocMgr, 499 const DWARFDie &DIE, 500 CompileUnit::DIEInfo &MyInfo, 501 unsigned Flags) { 502 const auto *Abbrev = DIE.getAbbreviationDeclarationPtr(); 503 504 // Global variables with constant value can always be kept. 505 if (!(Flags & TF_InFunctionScope) && 506 Abbrev->findAttributeIndex(dwarf::DW_AT_const_value)) { 507 MyInfo.InDebugMap = true; 508 return Flags | TF_Keep; 509 } 510 511 // See if there is a relocation to a valid debug map entry inside this 512 // variable's location. The order is important here. We want to always check 513 // if the variable has a valid relocation, so that the DIEInfo is filled. 514 // However, we don't want a static variable in a function to force us to keep 515 // the enclosing function, unless requested explicitly. 516 std::pair<bool, std::optional<int64_t>> LocExprAddrAndRelocAdjustment = 517 getVariableRelocAdjustment(RelocMgr, DIE); 518 519 if (LocExprAddrAndRelocAdjustment.first) 520 MyInfo.HasLocationExpressionAddr = true; 521 522 if (!LocExprAddrAndRelocAdjustment.second) 523 return Flags; 524 525 MyInfo.AddrAdjust = *LocExprAddrAndRelocAdjustment.second; 526 MyInfo.InDebugMap = true; 527 528 if (((Flags & TF_InFunctionScope) && 529 !LLVM_UNLIKELY(Options.KeepFunctionForStatic))) 530 return Flags; 531 532 if (Options.Verbose) { 533 outs() << "Keeping variable DIE:"; 534 DIDumpOptions DumpOpts; 535 DumpOpts.ChildRecurseDepth = 0; 536 DumpOpts.Verbose = Options.Verbose; 537 DIE.dump(outs(), 8 /* Indent */, DumpOpts); 538 } 539 540 return Flags | TF_Keep; 541 } 542 543 /// Check if a function describing DIE should be kept. 544 /// \returns updated TraversalFlags. 545 unsigned DWARFLinker::shouldKeepSubprogramDIE( 546 AddressesMap &RelocMgr, const DWARFDie &DIE, const DWARFFile &File, 547 CompileUnit &Unit, CompileUnit::DIEInfo &MyInfo, unsigned Flags) { 548 Flags |= TF_InFunctionScope; 549 550 auto LowPc = dwarf::toAddress(DIE.find(dwarf::DW_AT_low_pc)); 551 if (!LowPc) 552 return Flags; 553 554 assert(LowPc && "low_pc attribute is not an address."); 555 std::optional<int64_t> RelocAdjustment = 556 RelocMgr.getSubprogramRelocAdjustment(DIE, Options.Verbose); 557 if (!RelocAdjustment) 558 return Flags; 559 560 MyInfo.AddrAdjust = *RelocAdjustment; 561 MyInfo.InDebugMap = true; 562 563 if (Options.Verbose) { 564 outs() << "Keeping subprogram DIE:"; 565 DIDumpOptions DumpOpts; 566 DumpOpts.ChildRecurseDepth = 0; 567 DumpOpts.Verbose = Options.Verbose; 568 DIE.dump(outs(), 8 /* Indent */, DumpOpts); 569 } 570 571 if (DIE.getTag() == dwarf::DW_TAG_label) { 572 if (Unit.hasLabelAt(*LowPc)) 573 return Flags; 574 575 DWARFUnit &OrigUnit = Unit.getOrigUnit(); 576 // FIXME: dsymutil-classic compat. dsymutil-classic doesn't consider labels 577 // that don't fall into the CU's aranges. This is wrong IMO. Debug info 578 // generation bugs aside, this is really wrong in the case of labels, where 579 // a label marking the end of a function will have a PC == CU's high_pc. 580 if (dwarf::toAddress(OrigUnit.getUnitDIE().find(dwarf::DW_AT_high_pc)) 581 .value_or(UINT64_MAX) <= LowPc) 582 return Flags; 583 Unit.addLabelLowPc(*LowPc, MyInfo.AddrAdjust); 584 return Flags | TF_Keep; 585 } 586 587 Flags |= TF_Keep; 588 589 std::optional<uint64_t> HighPc = DIE.getHighPC(*LowPc); 590 if (!HighPc) { 591 reportWarning("Function without high_pc. Range will be discarded.\n", File, 592 &DIE); 593 return Flags; 594 } 595 if (*LowPc > *HighPc) { 596 reportWarning("low_pc greater than high_pc. Range will be discarded.\n", 597 File, &DIE); 598 return Flags; 599 } 600 601 // Replace the debug map range with a more accurate one. 602 Unit.addFunctionRange(*LowPc, *HighPc, MyInfo.AddrAdjust); 603 return Flags; 604 } 605 606 /// Check if a DIE should be kept. 607 /// \returns updated TraversalFlags. 608 unsigned DWARFLinker::shouldKeepDIE(AddressesMap &RelocMgr, const DWARFDie &DIE, 609 const DWARFFile &File, CompileUnit &Unit, 610 CompileUnit::DIEInfo &MyInfo, 611 unsigned Flags) { 612 switch (DIE.getTag()) { 613 case dwarf::DW_TAG_constant: 614 case dwarf::DW_TAG_variable: 615 return shouldKeepVariableDIE(RelocMgr, DIE, MyInfo, Flags); 616 case dwarf::DW_TAG_subprogram: 617 case dwarf::DW_TAG_label: 618 return shouldKeepSubprogramDIE(RelocMgr, DIE, File, Unit, MyInfo, Flags); 619 case dwarf::DW_TAG_base_type: 620 // DWARF Expressions may reference basic types, but scanning them 621 // is expensive. Basic types are tiny, so just keep all of them. 622 case dwarf::DW_TAG_imported_module: 623 case dwarf::DW_TAG_imported_declaration: 624 case dwarf::DW_TAG_imported_unit: 625 // We always want to keep these. 626 return Flags | TF_Keep; 627 default: 628 break; 629 } 630 631 return Flags; 632 } 633 634 /// Helper that updates the completeness of the current DIE based on the 635 /// completeness of one of its children. It depends on the incompleteness of 636 /// the children already being computed. 637 static void updateChildIncompleteness(const DWARFDie &Die, CompileUnit &CU, 638 CompileUnit::DIEInfo &ChildInfo) { 639 switch (Die.getTag()) { 640 case dwarf::DW_TAG_structure_type: 641 case dwarf::DW_TAG_class_type: 642 case dwarf::DW_TAG_union_type: 643 break; 644 default: 645 return; 646 } 647 648 CompileUnit::DIEInfo &MyInfo = CU.getInfo(Die); 649 650 if (ChildInfo.Incomplete || ChildInfo.Prune) 651 MyInfo.Incomplete = true; 652 } 653 654 /// Helper that updates the completeness of the current DIE based on the 655 /// completeness of the DIEs it references. It depends on the incompleteness of 656 /// the referenced DIE already being computed. 657 static void updateRefIncompleteness(const DWARFDie &Die, CompileUnit &CU, 658 CompileUnit::DIEInfo &RefInfo) { 659 switch (Die.getTag()) { 660 case dwarf::DW_TAG_typedef: 661 case dwarf::DW_TAG_member: 662 case dwarf::DW_TAG_reference_type: 663 case dwarf::DW_TAG_ptr_to_member_type: 664 case dwarf::DW_TAG_pointer_type: 665 break; 666 default: 667 return; 668 } 669 670 CompileUnit::DIEInfo &MyInfo = CU.getInfo(Die); 671 672 if (MyInfo.Incomplete) 673 return; 674 675 if (RefInfo.Incomplete) 676 MyInfo.Incomplete = true; 677 } 678 679 /// Look at the children of the given DIE and decide whether they should be 680 /// kept. 681 void DWARFLinker::lookForChildDIEsToKeep( 682 const DWARFDie &Die, CompileUnit &CU, unsigned Flags, 683 SmallVectorImpl<WorklistItem> &Worklist) { 684 // The TF_ParentWalk flag tells us that we are currently walking up the 685 // parent chain of a required DIE, and we don't want to mark all the children 686 // of the parents as kept (consider for example a DW_TAG_namespace node in 687 // the parent chain). There are however a set of DIE types for which we want 688 // to ignore that directive and still walk their children. 689 if (dieNeedsChildrenToBeMeaningful(Die.getTag())) 690 Flags &= ~DWARFLinker::TF_ParentWalk; 691 692 // We're finished if this DIE has no children or we're walking the parent 693 // chain. 694 if (!Die.hasChildren() || (Flags & DWARFLinker::TF_ParentWalk)) 695 return; 696 697 // Add children in reverse order to the worklist to effectively process them 698 // in order. 699 for (auto Child : reverse(Die.children())) { 700 // Add a worklist item before every child to calculate incompleteness right 701 // after the current child is processed. 702 CompileUnit::DIEInfo &ChildInfo = CU.getInfo(Child); 703 Worklist.emplace_back(Die, CU, WorklistItemType::UpdateChildIncompleteness, 704 &ChildInfo); 705 Worklist.emplace_back(Child, CU, Flags); 706 } 707 } 708 709 static bool isODRCanonicalCandidate(const DWARFDie &Die, CompileUnit &CU) { 710 CompileUnit::DIEInfo &Info = CU.getInfo(Die); 711 712 if (!Info.Ctxt || (Die.getTag() == dwarf::DW_TAG_namespace)) 713 return false; 714 715 if (!CU.hasODR() && !Info.InModuleScope) 716 return false; 717 718 return !Info.Incomplete && Info.Ctxt != CU.getInfo(Info.ParentIdx).Ctxt; 719 } 720 721 void DWARFLinker::markODRCanonicalDie(const DWARFDie &Die, CompileUnit &CU) { 722 CompileUnit::DIEInfo &Info = CU.getInfo(Die); 723 724 Info.ODRMarkingDone = true; 725 if (Info.Keep && isODRCanonicalCandidate(Die, CU) && 726 !Info.Ctxt->hasCanonicalDIE()) 727 Info.Ctxt->setHasCanonicalDIE(); 728 } 729 730 /// Look at DIEs referenced by the given DIE and decide whether they should be 731 /// kept. All DIEs referenced though attributes should be kept. 732 void DWARFLinker::lookForRefDIEsToKeep( 733 const DWARFDie &Die, CompileUnit &CU, unsigned Flags, 734 const UnitListTy &Units, const DWARFFile &File, 735 SmallVectorImpl<WorklistItem> &Worklist) { 736 bool UseOdr = (Flags & DWARFLinker::TF_DependencyWalk) 737 ? (Flags & DWARFLinker::TF_ODR) 738 : CU.hasODR(); 739 DWARFUnit &Unit = CU.getOrigUnit(); 740 DWARFDataExtractor Data = Unit.getDebugInfoExtractor(); 741 const auto *Abbrev = Die.getAbbreviationDeclarationPtr(); 742 uint64_t Offset = Die.getOffset() + getULEB128Size(Abbrev->getCode()); 743 744 SmallVector<std::pair<DWARFDie, CompileUnit &>, 4> ReferencedDIEs; 745 for (const auto &AttrSpec : Abbrev->attributes()) { 746 DWARFFormValue Val(AttrSpec.Form); 747 if (!Val.isFormClass(DWARFFormValue::FC_Reference) || 748 AttrSpec.Attr == dwarf::DW_AT_sibling) { 749 DWARFFormValue::skipValue(AttrSpec.Form, Data, &Offset, 750 Unit.getFormParams()); 751 continue; 752 } 753 754 Val.extractValue(Data, &Offset, Unit.getFormParams(), &Unit); 755 CompileUnit *ReferencedCU; 756 if (auto RefDie = 757 resolveDIEReference(File, Units, Val, Die, ReferencedCU)) { 758 CompileUnit::DIEInfo &Info = ReferencedCU->getInfo(RefDie); 759 // If the referenced DIE has a DeclContext that has already been 760 // emitted, then do not keep the one in this CU. We'll link to 761 // the canonical DIE in cloneDieReferenceAttribute. 762 // 763 // FIXME: compatibility with dsymutil-classic. UseODR shouldn't 764 // be necessary and could be advantageously replaced by 765 // ReferencedCU->hasODR() && CU.hasODR(). 766 // 767 // FIXME: compatibility with dsymutil-classic. There is no 768 // reason not to unique ref_addr references. 769 if (AttrSpec.Form != dwarf::DW_FORM_ref_addr && 770 isODRAttribute(AttrSpec.Attr) && Info.Ctxt && 771 Info.Ctxt->hasCanonicalDIE()) 772 continue; 773 774 // Keep a module forward declaration if there is no definition. 775 if (!(isODRAttribute(AttrSpec.Attr) && Info.Ctxt && 776 Info.Ctxt->hasCanonicalDIE())) 777 Info.Prune = false; 778 ReferencedDIEs.emplace_back(RefDie, *ReferencedCU); 779 } 780 } 781 782 unsigned ODRFlag = UseOdr ? DWARFLinker::TF_ODR : 0; 783 784 // Add referenced DIEs in reverse order to the worklist to effectively 785 // process them in order. 786 for (auto &P : reverse(ReferencedDIEs)) { 787 // Add a worklist item before every child to calculate incompleteness right 788 // after the current child is processed. 789 CompileUnit::DIEInfo &Info = P.second.getInfo(P.first); 790 Worklist.emplace_back(Die, CU, WorklistItemType::UpdateRefIncompleteness, 791 &Info); 792 Worklist.emplace_back(P.first, P.second, 793 DWARFLinker::TF_Keep | 794 DWARFLinker::TF_DependencyWalk | ODRFlag); 795 } 796 } 797 798 /// Look at the parent of the given DIE and decide whether they should be kept. 799 void DWARFLinker::lookForParentDIEsToKeep( 800 unsigned AncestorIdx, CompileUnit &CU, unsigned Flags, 801 SmallVectorImpl<WorklistItem> &Worklist) { 802 // Stop if we encounter an ancestor that's already marked as kept. 803 if (CU.getInfo(AncestorIdx).Keep) 804 return; 805 806 DWARFUnit &Unit = CU.getOrigUnit(); 807 DWARFDie ParentDIE = Unit.getDIEAtIndex(AncestorIdx); 808 Worklist.emplace_back(CU.getInfo(AncestorIdx).ParentIdx, CU, Flags); 809 Worklist.emplace_back(ParentDIE, CU, Flags); 810 } 811 812 /// Recursively walk the \p DIE tree and look for DIEs to keep. Store that 813 /// information in \p CU's DIEInfo. 814 /// 815 /// This function is the entry point of the DIE selection algorithm. It is 816 /// expected to walk the DIE tree in file order and (though the mediation of 817 /// its helper) call hasValidRelocation() on each DIE that might be a 'root 818 /// DIE' (See DwarfLinker class comment). 819 /// 820 /// While walking the dependencies of root DIEs, this function is also called, 821 /// but during these dependency walks the file order is not respected. The 822 /// TF_DependencyWalk flag tells us which kind of traversal we are currently 823 /// doing. 824 /// 825 /// The recursive algorithm is implemented iteratively as a work list because 826 /// very deep recursion could exhaust the stack for large projects. The work 827 /// list acts as a scheduler for different types of work that need to be 828 /// performed. 829 /// 830 /// The recursive nature of the algorithm is simulated by running the "main" 831 /// algorithm (LookForDIEsToKeep) followed by either looking at more DIEs 832 /// (LookForChildDIEsToKeep, LookForRefDIEsToKeep, LookForParentDIEsToKeep) or 833 /// fixing up a computed property (UpdateChildIncompleteness, 834 /// UpdateRefIncompleteness). 835 /// 836 /// The return value indicates whether the DIE is incomplete. 837 void DWARFLinker::lookForDIEsToKeep(AddressesMap &AddressesMap, 838 const UnitListTy &Units, 839 const DWARFDie &Die, const DWARFFile &File, 840 CompileUnit &Cu, unsigned Flags) { 841 // LIFO work list. 842 SmallVector<WorklistItem, 4> Worklist; 843 Worklist.emplace_back(Die, Cu, Flags); 844 845 while (!Worklist.empty()) { 846 WorklistItem Current = Worklist.pop_back_val(); 847 848 // Look at the worklist type to decide what kind of work to perform. 849 switch (Current.Type) { 850 case WorklistItemType::UpdateChildIncompleteness: 851 updateChildIncompleteness(Current.Die, Current.CU, *Current.OtherInfo); 852 continue; 853 case WorklistItemType::UpdateRefIncompleteness: 854 updateRefIncompleteness(Current.Die, Current.CU, *Current.OtherInfo); 855 continue; 856 case WorklistItemType::LookForChildDIEsToKeep: 857 lookForChildDIEsToKeep(Current.Die, Current.CU, Current.Flags, Worklist); 858 continue; 859 case WorklistItemType::LookForRefDIEsToKeep: 860 lookForRefDIEsToKeep(Current.Die, Current.CU, Current.Flags, Units, File, 861 Worklist); 862 continue; 863 case WorklistItemType::LookForParentDIEsToKeep: 864 lookForParentDIEsToKeep(Current.AncestorIdx, Current.CU, Current.Flags, 865 Worklist); 866 continue; 867 case WorklistItemType::MarkODRCanonicalDie: 868 markODRCanonicalDie(Current.Die, Current.CU); 869 continue; 870 case WorklistItemType::LookForDIEsToKeep: 871 break; 872 } 873 874 unsigned Idx = Current.CU.getOrigUnit().getDIEIndex(Current.Die); 875 CompileUnit::DIEInfo &MyInfo = Current.CU.getInfo(Idx); 876 877 if (MyInfo.Prune) { 878 // We're walking the dependencies of a module forward declaration that was 879 // kept because there is no definition. 880 if (Current.Flags & TF_DependencyWalk) 881 MyInfo.Prune = false; 882 else 883 continue; 884 } 885 886 // If the Keep flag is set, we are marking a required DIE's dependencies. 887 // If our target is already marked as kept, we're all set. 888 bool AlreadyKept = MyInfo.Keep; 889 if ((Current.Flags & TF_DependencyWalk) && AlreadyKept) 890 continue; 891 892 if (!(Current.Flags & TF_DependencyWalk)) 893 Current.Flags = shouldKeepDIE(AddressesMap, Current.Die, File, Current.CU, 894 MyInfo, Current.Flags); 895 896 // We need to mark context for the canonical die in the end of normal 897 // traversing(not TF_DependencyWalk) or after normal traversing if die 898 // was not marked as kept. 899 if (!(Current.Flags & TF_DependencyWalk) || 900 (MyInfo.ODRMarkingDone && !MyInfo.Keep)) { 901 if (Current.CU.hasODR() || MyInfo.InModuleScope) 902 Worklist.emplace_back(Current.Die, Current.CU, 903 WorklistItemType::MarkODRCanonicalDie); 904 } 905 906 // Finish by looking for child DIEs. Because of the LIFO worklist we need 907 // to schedule that work before any subsequent items are added to the 908 // worklist. 909 Worklist.emplace_back(Current.Die, Current.CU, Current.Flags, 910 WorklistItemType::LookForChildDIEsToKeep); 911 912 if (AlreadyKept || !(Current.Flags & TF_Keep)) 913 continue; 914 915 // If it is a newly kept DIE mark it as well as all its dependencies as 916 // kept. 917 MyInfo.Keep = true; 918 919 // We're looking for incomplete types. 920 MyInfo.Incomplete = 921 Current.Die.getTag() != dwarf::DW_TAG_subprogram && 922 Current.Die.getTag() != dwarf::DW_TAG_member && 923 dwarf::toUnsigned(Current.Die.find(dwarf::DW_AT_declaration), 0); 924 925 // After looking at the parent chain, look for referenced DIEs. Because of 926 // the LIFO worklist we need to schedule that work before any subsequent 927 // items are added to the worklist. 928 Worklist.emplace_back(Current.Die, Current.CU, Current.Flags, 929 WorklistItemType::LookForRefDIEsToKeep); 930 931 bool UseOdr = (Current.Flags & TF_DependencyWalk) ? (Current.Flags & TF_ODR) 932 : Current.CU.hasODR(); 933 unsigned ODRFlag = UseOdr ? TF_ODR : 0; 934 unsigned ParFlags = TF_ParentWalk | TF_Keep | TF_DependencyWalk | ODRFlag; 935 936 // Now schedule the parent walk. 937 Worklist.emplace_back(MyInfo.ParentIdx, Current.CU, ParFlags); 938 } 939 } 940 941 #ifndef NDEBUG 942 /// A broken link in the keep chain. By recording both the parent and the child 943 /// we can show only broken links for DIEs with multiple children. 944 struct BrokenLink { 945 BrokenLink(DWARFDie Parent, DWARFDie Child) : Parent(Parent), Child(Child) {} 946 DWARFDie Parent; 947 DWARFDie Child; 948 }; 949 950 /// Verify the keep chain by looking for DIEs that are kept but who's parent 951 /// isn't. 952 static void verifyKeepChain(CompileUnit &CU) { 953 std::vector<DWARFDie> Worklist; 954 Worklist.push_back(CU.getOrigUnit().getUnitDIE()); 955 956 // List of broken links. 957 std::vector<BrokenLink> BrokenLinks; 958 959 while (!Worklist.empty()) { 960 const DWARFDie Current = Worklist.back(); 961 Worklist.pop_back(); 962 963 const bool CurrentDieIsKept = CU.getInfo(Current).Keep; 964 965 for (DWARFDie Child : reverse(Current.children())) { 966 Worklist.push_back(Child); 967 968 const bool ChildDieIsKept = CU.getInfo(Child).Keep; 969 if (!CurrentDieIsKept && ChildDieIsKept) 970 BrokenLinks.emplace_back(Current, Child); 971 } 972 } 973 974 if (!BrokenLinks.empty()) { 975 for (BrokenLink Link : BrokenLinks) { 976 WithColor::error() << formatv( 977 "Found invalid link in keep chain between {0:x} and {1:x}\n", 978 Link.Parent.getOffset(), Link.Child.getOffset()); 979 980 errs() << "Parent:"; 981 Link.Parent.dump(errs(), 0, {}); 982 CU.getInfo(Link.Parent).dump(); 983 984 errs() << "Child:"; 985 Link.Child.dump(errs(), 2, {}); 986 CU.getInfo(Link.Child).dump(); 987 } 988 report_fatal_error("invalid keep chain"); 989 } 990 } 991 #endif 992 993 /// Assign an abbreviation number to \p Abbrev. 994 /// 995 /// Our DIEs get freed after every DebugMapObject has been processed, 996 /// thus the FoldingSet we use to unique DIEAbbrevs cannot refer to 997 /// the instances hold by the DIEs. When we encounter an abbreviation 998 /// that we don't know, we create a permanent copy of it. 999 void DWARFLinker::assignAbbrev(DIEAbbrev &Abbrev) { 1000 // Check the set for priors. 1001 FoldingSetNodeID ID; 1002 Abbrev.Profile(ID); 1003 void *InsertToken; 1004 DIEAbbrev *InSet = AbbreviationsSet.FindNodeOrInsertPos(ID, InsertToken); 1005 1006 // If it's newly added. 1007 if (InSet) { 1008 // Assign existing abbreviation number. 1009 Abbrev.setNumber(InSet->getNumber()); 1010 } else { 1011 // Add to abbreviation list. 1012 Abbreviations.push_back( 1013 std::make_unique<DIEAbbrev>(Abbrev.getTag(), Abbrev.hasChildren())); 1014 for (const auto &Attr : Abbrev.getData()) 1015 Abbreviations.back()->AddAttribute(Attr); 1016 AbbreviationsSet.InsertNode(Abbreviations.back().get(), InsertToken); 1017 // Assign the unique abbreviation number. 1018 Abbrev.setNumber(Abbreviations.size()); 1019 Abbreviations.back()->setNumber(Abbreviations.size()); 1020 } 1021 } 1022 1023 unsigned DWARFLinker::DIECloner::cloneStringAttribute(DIE &Die, 1024 AttributeSpec AttrSpec, 1025 const DWARFFormValue &Val, 1026 const DWARFUnit &U, 1027 AttributesInfo &Info) { 1028 std::optional<const char *> String = dwarf::toString(Val); 1029 if (!String) 1030 return 0; 1031 DwarfStringPoolEntryRef StringEntry; 1032 if (AttrSpec.Form == dwarf::DW_FORM_line_strp) { 1033 StringEntry = DebugLineStrPool.getEntry(*String); 1034 } else { 1035 StringEntry = DebugStrPool.getEntry(*String); 1036 1037 if (AttrSpec.Attr == dwarf::DW_AT_APPLE_origin) { 1038 Info.HasAppleOrigin = true; 1039 if (std::optional<StringRef> FileName = 1040 ObjFile.Addresses->getLibraryInstallName()) { 1041 StringEntry = DebugStrPool.getEntry(*FileName); 1042 } 1043 } 1044 1045 // Update attributes info. 1046 if (AttrSpec.Attr == dwarf::DW_AT_name) 1047 Info.Name = StringEntry; 1048 else if (AttrSpec.Attr == dwarf::DW_AT_MIPS_linkage_name || 1049 AttrSpec.Attr == dwarf::DW_AT_linkage_name) 1050 Info.MangledName = StringEntry; 1051 if (U.getVersion() >= 5) { 1052 // Switch everything to DW_FORM_strx strings. 1053 auto StringOffsetIndex = 1054 StringOffsetPool.getValueIndex(StringEntry.getOffset()); 1055 return Die 1056 .addValue(DIEAlloc, dwarf::Attribute(AttrSpec.Attr), 1057 dwarf::DW_FORM_strx, DIEInteger(StringOffsetIndex)) 1058 ->sizeOf(U.getFormParams()); 1059 } 1060 // Switch everything to out of line strings. 1061 AttrSpec.Form = dwarf::DW_FORM_strp; 1062 } 1063 Die.addValue(DIEAlloc, dwarf::Attribute(AttrSpec.Attr), AttrSpec.Form, 1064 DIEInteger(StringEntry.getOffset())); 1065 return 4; 1066 } 1067 1068 unsigned DWARFLinker::DIECloner::cloneDieReferenceAttribute( 1069 DIE &Die, const DWARFDie &InputDIE, AttributeSpec AttrSpec, 1070 unsigned AttrSize, const DWARFFormValue &Val, const DWARFFile &File, 1071 CompileUnit &Unit) { 1072 const DWARFUnit &U = Unit.getOrigUnit(); 1073 uint64_t Ref = *Val.getAsReference(); 1074 1075 DIE *NewRefDie = nullptr; 1076 CompileUnit *RefUnit = nullptr; 1077 1078 DWARFDie RefDie = 1079 Linker.resolveDIEReference(File, CompileUnits, Val, InputDIE, RefUnit); 1080 1081 // If the referenced DIE is not found, drop the attribute. 1082 if (!RefDie || AttrSpec.Attr == dwarf::DW_AT_sibling) 1083 return 0; 1084 1085 CompileUnit::DIEInfo &RefInfo = RefUnit->getInfo(RefDie); 1086 1087 // If we already have emitted an equivalent DeclContext, just point 1088 // at it. 1089 if (isODRAttribute(AttrSpec.Attr) && RefInfo.Ctxt && 1090 RefInfo.Ctxt->getCanonicalDIEOffset()) { 1091 assert(RefInfo.Ctxt->hasCanonicalDIE() && 1092 "Offset to canonical die is set, but context is not marked"); 1093 DIEInteger Attr(RefInfo.Ctxt->getCanonicalDIEOffset()); 1094 Die.addValue(DIEAlloc, dwarf::Attribute(AttrSpec.Attr), 1095 dwarf::DW_FORM_ref_addr, Attr); 1096 return U.getRefAddrByteSize(); 1097 } 1098 1099 if (!RefInfo.Clone) { 1100 // We haven't cloned this DIE yet. Just create an empty one and 1101 // store it. It'll get really cloned when we process it. 1102 RefInfo.UnclonedReference = true; 1103 RefInfo.Clone = DIE::get(DIEAlloc, dwarf::Tag(RefDie.getTag())); 1104 } 1105 NewRefDie = RefInfo.Clone; 1106 1107 if (AttrSpec.Form == dwarf::DW_FORM_ref_addr || 1108 (Unit.hasODR() && isODRAttribute(AttrSpec.Attr))) { 1109 // We cannot currently rely on a DIEEntry to emit ref_addr 1110 // references, because the implementation calls back to DwarfDebug 1111 // to find the unit offset. (We don't have a DwarfDebug) 1112 // FIXME: we should be able to design DIEEntry reliance on 1113 // DwarfDebug away. 1114 uint64_t Attr; 1115 if (Ref < InputDIE.getOffset() && !RefInfo.UnclonedReference) { 1116 // We have already cloned that DIE. 1117 uint32_t NewRefOffset = 1118 RefUnit->getStartOffset() + NewRefDie->getOffset(); 1119 Attr = NewRefOffset; 1120 Die.addValue(DIEAlloc, dwarf::Attribute(AttrSpec.Attr), 1121 dwarf::DW_FORM_ref_addr, DIEInteger(Attr)); 1122 } else { 1123 // A forward reference. Note and fixup later. 1124 Attr = 0xBADDEF; 1125 Unit.noteForwardReference( 1126 NewRefDie, RefUnit, RefInfo.Ctxt, 1127 Die.addValue(DIEAlloc, dwarf::Attribute(AttrSpec.Attr), 1128 dwarf::DW_FORM_ref_addr, DIEInteger(Attr))); 1129 } 1130 return U.getRefAddrByteSize(); 1131 } 1132 1133 Die.addValue(DIEAlloc, dwarf::Attribute(AttrSpec.Attr), 1134 dwarf::Form(AttrSpec.Form), DIEEntry(*NewRefDie)); 1135 1136 return AttrSize; 1137 } 1138 1139 void DWARFLinker::DIECloner::cloneExpression( 1140 DataExtractor &Data, DWARFExpression Expression, const DWARFFile &File, 1141 CompileUnit &Unit, SmallVectorImpl<uint8_t> &OutputBuffer, 1142 int64_t AddrRelocAdjustment, bool IsLittleEndian) { 1143 using Encoding = DWARFExpression::Operation::Encoding; 1144 1145 uint8_t OrigAddressByteSize = Unit.getOrigUnit().getAddressByteSize(); 1146 1147 uint64_t OpOffset = 0; 1148 for (auto &Op : Expression) { 1149 auto Desc = Op.getDescription(); 1150 // DW_OP_const_type is variable-length and has 3 1151 // operands. Thus far we only support 2. 1152 if ((Desc.Op.size() == 2 && Desc.Op[0] == Encoding::BaseTypeRef) || 1153 (Desc.Op.size() == 2 && Desc.Op[1] == Encoding::BaseTypeRef && 1154 Desc.Op[0] != Encoding::Size1)) 1155 Linker.reportWarning("Unsupported DW_OP encoding.", File); 1156 1157 if ((Desc.Op.size() == 1 && Desc.Op[0] == Encoding::BaseTypeRef) || 1158 (Desc.Op.size() == 2 && Desc.Op[1] == Encoding::BaseTypeRef && 1159 Desc.Op[0] == Encoding::Size1)) { 1160 // This code assumes that the other non-typeref operand fits into 1 byte. 1161 assert(OpOffset < Op.getEndOffset()); 1162 uint32_t ULEBsize = Op.getEndOffset() - OpOffset - 1; 1163 assert(ULEBsize <= 16); 1164 1165 // Copy over the operation. 1166 assert(!Op.getSubCode() && "SubOps not yet supported"); 1167 OutputBuffer.push_back(Op.getCode()); 1168 uint64_t RefOffset; 1169 if (Desc.Op.size() == 1) { 1170 RefOffset = Op.getRawOperand(0); 1171 } else { 1172 OutputBuffer.push_back(Op.getRawOperand(0)); 1173 RefOffset = Op.getRawOperand(1); 1174 } 1175 uint32_t Offset = 0; 1176 // Look up the base type. For DW_OP_convert, the operand may be 0 to 1177 // instead indicate the generic type. The same holds for 1178 // DW_OP_reinterpret, which is currently not supported. 1179 if (RefOffset > 0 || Op.getCode() != dwarf::DW_OP_convert) { 1180 RefOffset += Unit.getOrigUnit().getOffset(); 1181 auto RefDie = Unit.getOrigUnit().getDIEForOffset(RefOffset); 1182 CompileUnit::DIEInfo &Info = Unit.getInfo(RefDie); 1183 if (DIE *Clone = Info.Clone) 1184 Offset = Clone->getOffset(); 1185 else 1186 Linker.reportWarning( 1187 "base type ref doesn't point to DW_TAG_base_type.", File); 1188 } 1189 uint8_t ULEB[16]; 1190 unsigned RealSize = encodeULEB128(Offset, ULEB, ULEBsize); 1191 if (RealSize > ULEBsize) { 1192 // Emit the generic type as a fallback. 1193 RealSize = encodeULEB128(0, ULEB, ULEBsize); 1194 Linker.reportWarning("base type ref doesn't fit.", File); 1195 } 1196 assert(RealSize == ULEBsize && "padding failed"); 1197 ArrayRef<uint8_t> ULEBbytes(ULEB, ULEBsize); 1198 OutputBuffer.append(ULEBbytes.begin(), ULEBbytes.end()); 1199 } else if (!Linker.Options.Update && Op.getCode() == dwarf::DW_OP_addrx) { 1200 if (std::optional<object::SectionedAddress> SA = 1201 Unit.getOrigUnit().getAddrOffsetSectionItem( 1202 Op.getRawOperand(0))) { 1203 // DWARFLinker does not use addrx forms since it generates relocated 1204 // addresses. Replace DW_OP_addrx with DW_OP_addr here. 1205 // Argument of DW_OP_addrx should be relocated here as it is not 1206 // processed by applyValidRelocs. 1207 OutputBuffer.push_back(dwarf::DW_OP_addr); 1208 uint64_t LinkedAddress = SA->Address + AddrRelocAdjustment; 1209 if (IsLittleEndian != sys::IsLittleEndianHost) 1210 sys::swapByteOrder(LinkedAddress); 1211 ArrayRef<uint8_t> AddressBytes( 1212 reinterpret_cast<const uint8_t *>(&LinkedAddress), 1213 OrigAddressByteSize); 1214 OutputBuffer.append(AddressBytes.begin(), AddressBytes.end()); 1215 } else 1216 Linker.reportWarning("cannot read DW_OP_addrx operand.", File); 1217 } else if (!Linker.Options.Update && Op.getCode() == dwarf::DW_OP_constx) { 1218 if (std::optional<object::SectionedAddress> SA = 1219 Unit.getOrigUnit().getAddrOffsetSectionItem( 1220 Op.getRawOperand(0))) { 1221 // DWARFLinker does not use constx forms since it generates relocated 1222 // addresses. Replace DW_OP_constx with DW_OP_const[*]u here. 1223 // Argument of DW_OP_constx should be relocated here as it is not 1224 // processed by applyValidRelocs. 1225 std::optional<uint8_t> OutOperandKind; 1226 switch (OrigAddressByteSize) { 1227 case 4: 1228 OutOperandKind = dwarf::DW_OP_const4u; 1229 break; 1230 case 8: 1231 OutOperandKind = dwarf::DW_OP_const8u; 1232 break; 1233 default: 1234 Linker.reportWarning( 1235 formatv(("unsupported address size: {0}."), OrigAddressByteSize), 1236 File); 1237 break; 1238 } 1239 1240 if (OutOperandKind) { 1241 OutputBuffer.push_back(*OutOperandKind); 1242 uint64_t LinkedAddress = SA->Address + AddrRelocAdjustment; 1243 if (IsLittleEndian != sys::IsLittleEndianHost) 1244 sys::swapByteOrder(LinkedAddress); 1245 ArrayRef<uint8_t> AddressBytes( 1246 reinterpret_cast<const uint8_t *>(&LinkedAddress), 1247 OrigAddressByteSize); 1248 OutputBuffer.append(AddressBytes.begin(), AddressBytes.end()); 1249 } 1250 } else 1251 Linker.reportWarning("cannot read DW_OP_constx operand.", File); 1252 } else { 1253 // Copy over everything else unmodified. 1254 StringRef Bytes = Data.getData().slice(OpOffset, Op.getEndOffset()); 1255 OutputBuffer.append(Bytes.begin(), Bytes.end()); 1256 } 1257 OpOffset = Op.getEndOffset(); 1258 } 1259 } 1260 1261 unsigned DWARFLinker::DIECloner::cloneBlockAttribute( 1262 DIE &Die, const DWARFDie &InputDIE, const DWARFFile &File, 1263 CompileUnit &Unit, AttributeSpec AttrSpec, const DWARFFormValue &Val, 1264 bool IsLittleEndian) { 1265 DIEValueList *Attr; 1266 DIEValue Value; 1267 DIELoc *Loc = nullptr; 1268 DIEBlock *Block = nullptr; 1269 if (AttrSpec.Form == dwarf::DW_FORM_exprloc) { 1270 Loc = new (DIEAlloc) DIELoc; 1271 Linker.DIELocs.push_back(Loc); 1272 } else { 1273 Block = new (DIEAlloc) DIEBlock; 1274 Linker.DIEBlocks.push_back(Block); 1275 } 1276 Attr = Loc ? static_cast<DIEValueList *>(Loc) 1277 : static_cast<DIEValueList *>(Block); 1278 1279 DWARFUnit &OrigUnit = Unit.getOrigUnit(); 1280 // If the block is a DWARF Expression, clone it into the temporary 1281 // buffer using cloneExpression(), otherwise copy the data directly. 1282 SmallVector<uint8_t, 32> Buffer; 1283 ArrayRef<uint8_t> Bytes = *Val.getAsBlock(); 1284 if (DWARFAttribute::mayHaveLocationExpr(AttrSpec.Attr) && 1285 (Val.isFormClass(DWARFFormValue::FC_Block) || 1286 Val.isFormClass(DWARFFormValue::FC_Exprloc))) { 1287 DataExtractor Data(StringRef((const char *)Bytes.data(), Bytes.size()), 1288 IsLittleEndian, OrigUnit.getAddressByteSize()); 1289 DWARFExpression Expr(Data, OrigUnit.getAddressByteSize(), 1290 OrigUnit.getFormParams().Format); 1291 cloneExpression(Data, Expr, File, Unit, Buffer, 1292 Unit.getInfo(InputDIE).AddrAdjust, IsLittleEndian); 1293 Bytes = Buffer; 1294 } 1295 for (auto Byte : Bytes) 1296 Attr->addValue(DIEAlloc, static_cast<dwarf::Attribute>(0), 1297 dwarf::DW_FORM_data1, DIEInteger(Byte)); 1298 1299 // FIXME: If DIEBlock and DIELoc just reuses the Size field of 1300 // the DIE class, this "if" could be replaced by 1301 // Attr->setSize(Bytes.size()). 1302 if (Loc) 1303 Loc->setSize(Bytes.size()); 1304 else 1305 Block->setSize(Bytes.size()); 1306 1307 if (Loc) 1308 Value = DIEValue(dwarf::Attribute(AttrSpec.Attr), 1309 dwarf::Form(AttrSpec.Form), Loc); 1310 else { 1311 // The expression location data might be updated and exceed the original 1312 // size. Check whether the new data fits into the original form. 1313 if ((AttrSpec.Form == dwarf::DW_FORM_block1 && 1314 (Bytes.size() > UINT8_MAX)) || 1315 (AttrSpec.Form == dwarf::DW_FORM_block2 && 1316 (Bytes.size() > UINT16_MAX)) || 1317 (AttrSpec.Form == dwarf::DW_FORM_block4 && (Bytes.size() > UINT32_MAX))) 1318 AttrSpec.Form = dwarf::DW_FORM_block; 1319 1320 Value = DIEValue(dwarf::Attribute(AttrSpec.Attr), 1321 dwarf::Form(AttrSpec.Form), Block); 1322 } 1323 1324 return Die.addValue(DIEAlloc, Value)->sizeOf(OrigUnit.getFormParams()); 1325 } 1326 1327 unsigned DWARFLinker::DIECloner::cloneAddressAttribute( 1328 DIE &Die, const DWARFDie &InputDIE, AttributeSpec AttrSpec, 1329 unsigned AttrSize, const DWARFFormValue &Val, const CompileUnit &Unit, 1330 AttributesInfo &Info) { 1331 if (AttrSpec.Attr == dwarf::DW_AT_low_pc) 1332 Info.HasLowPc = true; 1333 1334 if (LLVM_UNLIKELY(Linker.Options.Update)) { 1335 Die.addValue(DIEAlloc, dwarf::Attribute(AttrSpec.Attr), 1336 dwarf::Form(AttrSpec.Form), DIEInteger(Val.getRawUValue())); 1337 return AttrSize; 1338 } 1339 1340 // Cloned Die may have address attributes relocated to a 1341 // totally unrelated value. This can happen: 1342 // - If high_pc is an address (Dwarf version == 2), then it might have been 1343 // relocated to a totally unrelated value (because the end address in the 1344 // object file might be start address of another function which got moved 1345 // independently by the linker). 1346 // - If address relocated in an inline_subprogram that happens at the 1347 // beginning of its inlining function. 1348 // To avoid above cases and to not apply relocation twice (in 1349 // applyValidRelocs and here), read address attribute from InputDIE and apply 1350 // Info.PCOffset here. 1351 1352 std::optional<DWARFFormValue> AddrAttribute = InputDIE.find(AttrSpec.Attr); 1353 if (!AddrAttribute) 1354 llvm_unreachable("Cann't find attribute."); 1355 1356 std::optional<uint64_t> Addr = AddrAttribute->getAsAddress(); 1357 if (!Addr) { 1358 Linker.reportWarning("Cann't read address attribute value.", ObjFile); 1359 return 0; 1360 } 1361 1362 if (InputDIE.getTag() == dwarf::DW_TAG_compile_unit && 1363 AttrSpec.Attr == dwarf::DW_AT_low_pc) { 1364 if (std::optional<uint64_t> LowPC = Unit.getLowPc()) 1365 Addr = *LowPC; 1366 else 1367 return 0; 1368 } else if (InputDIE.getTag() == dwarf::DW_TAG_compile_unit && 1369 AttrSpec.Attr == dwarf::DW_AT_high_pc) { 1370 if (uint64_t HighPc = Unit.getHighPc()) 1371 Addr = HighPc; 1372 else 1373 return 0; 1374 } else { 1375 *Addr += Info.PCOffset; 1376 } 1377 1378 if (AttrSpec.Form == dwarf::DW_FORM_addr) { 1379 Die.addValue(DIEAlloc, static_cast<dwarf::Attribute>(AttrSpec.Attr), 1380 AttrSpec.Form, DIEInteger(*Addr)); 1381 return Unit.getOrigUnit().getAddressByteSize(); 1382 } 1383 1384 auto AddrIndex = AddrPool.getValueIndex(*Addr); 1385 1386 return Die 1387 .addValue(DIEAlloc, static_cast<dwarf::Attribute>(AttrSpec.Attr), 1388 dwarf::Form::DW_FORM_addrx, DIEInteger(AddrIndex)) 1389 ->sizeOf(Unit.getOrigUnit().getFormParams()); 1390 } 1391 1392 unsigned DWARFLinker::DIECloner::cloneScalarAttribute( 1393 DIE &Die, const DWARFDie &InputDIE, const DWARFFile &File, 1394 CompileUnit &Unit, AttributeSpec AttrSpec, const DWARFFormValue &Val, 1395 unsigned AttrSize, AttributesInfo &Info) { 1396 uint64_t Value; 1397 1398 // Check for the offset to the macro table. If offset is incorrect then we 1399 // need to remove the attribute. 1400 if (AttrSpec.Attr == dwarf::DW_AT_macro_info) { 1401 if (std::optional<uint64_t> Offset = Val.getAsSectionOffset()) { 1402 const llvm::DWARFDebugMacro *Macro = File.Dwarf->getDebugMacinfo(); 1403 if (Macro == nullptr || !Macro->hasEntryForOffset(*Offset)) 1404 return 0; 1405 } 1406 } 1407 1408 if (AttrSpec.Attr == dwarf::DW_AT_macros) { 1409 if (std::optional<uint64_t> Offset = Val.getAsSectionOffset()) { 1410 const llvm::DWARFDebugMacro *Macro = File.Dwarf->getDebugMacro(); 1411 if (Macro == nullptr || !Macro->hasEntryForOffset(*Offset)) 1412 return 0; 1413 } 1414 } 1415 1416 if (AttrSpec.Attr == dwarf::DW_AT_str_offsets_base) { 1417 // DWARFLinker generates common .debug_str_offsets table used for all 1418 // compile units. The offset to the common .debug_str_offsets table is 8 on 1419 // DWARF32. 1420 Info.AttrStrOffsetBaseSeen = true; 1421 return Die 1422 .addValue(DIEAlloc, dwarf::DW_AT_str_offsets_base, 1423 dwarf::DW_FORM_sec_offset, DIEInteger(8)) 1424 ->sizeOf(Unit.getOrigUnit().getFormParams()); 1425 } 1426 1427 if (LLVM_UNLIKELY(Linker.Options.Update)) { 1428 if (auto OptionalValue = Val.getAsUnsignedConstant()) 1429 Value = *OptionalValue; 1430 else if (auto OptionalValue = Val.getAsSignedConstant()) 1431 Value = *OptionalValue; 1432 else if (auto OptionalValue = Val.getAsSectionOffset()) 1433 Value = *OptionalValue; 1434 else { 1435 Linker.reportWarning( 1436 "Unsupported scalar attribute form. Dropping attribute.", File, 1437 &InputDIE); 1438 return 0; 1439 } 1440 if (AttrSpec.Attr == dwarf::DW_AT_declaration && Value) 1441 Info.IsDeclaration = true; 1442 1443 if (AttrSpec.Form == dwarf::DW_FORM_loclistx) 1444 Die.addValue(DIEAlloc, dwarf::Attribute(AttrSpec.Attr), 1445 dwarf::Form(AttrSpec.Form), DIELocList(Value)); 1446 else 1447 Die.addValue(DIEAlloc, dwarf::Attribute(AttrSpec.Attr), 1448 dwarf::Form(AttrSpec.Form), DIEInteger(Value)); 1449 return AttrSize; 1450 } 1451 1452 [[maybe_unused]] dwarf::Form OriginalForm = AttrSpec.Form; 1453 if (AttrSpec.Form == dwarf::DW_FORM_rnglistx) { 1454 // DWARFLinker does not generate .debug_addr table. Thus we need to change 1455 // all "addrx" related forms to "addr" version. Change DW_FORM_rnglistx 1456 // to DW_FORM_sec_offset here. 1457 std::optional<uint64_t> Index = Val.getAsSectionOffset(); 1458 if (!Index) { 1459 Linker.reportWarning("Cannot read the attribute. Dropping.", File, 1460 &InputDIE); 1461 return 0; 1462 } 1463 std::optional<uint64_t> Offset = 1464 Unit.getOrigUnit().getRnglistOffset(*Index); 1465 if (!Offset) { 1466 Linker.reportWarning("Cannot read the attribute. Dropping.", File, 1467 &InputDIE); 1468 return 0; 1469 } 1470 1471 Value = *Offset; 1472 AttrSpec.Form = dwarf::DW_FORM_sec_offset; 1473 AttrSize = Unit.getOrigUnit().getFormParams().getDwarfOffsetByteSize(); 1474 } else if (AttrSpec.Form == dwarf::DW_FORM_loclistx) { 1475 // DWARFLinker does not generate .debug_addr table. Thus we need to change 1476 // all "addrx" related forms to "addr" version. Change DW_FORM_loclistx 1477 // to DW_FORM_sec_offset here. 1478 std::optional<uint64_t> Index = Val.getAsSectionOffset(); 1479 if (!Index) { 1480 Linker.reportWarning("Cannot read the attribute. Dropping.", File, 1481 &InputDIE); 1482 return 0; 1483 } 1484 std::optional<uint64_t> Offset = 1485 Unit.getOrigUnit().getLoclistOffset(*Index); 1486 if (!Offset) { 1487 Linker.reportWarning("Cannot read the attribute. Dropping.", File, 1488 &InputDIE); 1489 return 0; 1490 } 1491 1492 Value = *Offset; 1493 AttrSpec.Form = dwarf::DW_FORM_sec_offset; 1494 AttrSize = Unit.getOrigUnit().getFormParams().getDwarfOffsetByteSize(); 1495 } else if (AttrSpec.Attr == dwarf::DW_AT_high_pc && 1496 Die.getTag() == dwarf::DW_TAG_compile_unit) { 1497 std::optional<uint64_t> LowPC = Unit.getLowPc(); 1498 if (!LowPC) 1499 return 0; 1500 // Dwarf >= 4 high_pc is an size, not an address. 1501 Value = Unit.getHighPc() - *LowPC; 1502 } else if (AttrSpec.Form == dwarf::DW_FORM_sec_offset) 1503 Value = *Val.getAsSectionOffset(); 1504 else if (AttrSpec.Form == dwarf::DW_FORM_sdata) 1505 Value = *Val.getAsSignedConstant(); 1506 else if (auto OptionalValue = Val.getAsUnsignedConstant()) 1507 Value = *OptionalValue; 1508 else { 1509 Linker.reportWarning( 1510 "Unsupported scalar attribute form. Dropping attribute.", File, 1511 &InputDIE); 1512 return 0; 1513 } 1514 1515 DIE::value_iterator Patch = 1516 Die.addValue(DIEAlloc, dwarf::Attribute(AttrSpec.Attr), 1517 dwarf::Form(AttrSpec.Form), DIEInteger(Value)); 1518 if (AttrSpec.Attr == dwarf::DW_AT_ranges || 1519 AttrSpec.Attr == dwarf::DW_AT_start_scope) { 1520 Unit.noteRangeAttribute(Die, Patch); 1521 Info.HasRanges = true; 1522 } else if (DWARFAttribute::mayHaveLocationList(AttrSpec.Attr) && 1523 dwarf::doesFormBelongToClass(AttrSpec.Form, 1524 DWARFFormValue::FC_SectionOffset, 1525 Unit.getOrigUnit().getVersion())) { 1526 1527 CompileUnit::DIEInfo &LocationDieInfo = Unit.getInfo(InputDIE); 1528 Unit.noteLocationAttribute({Patch, LocationDieInfo.InDebugMap 1529 ? LocationDieInfo.AddrAdjust 1530 : Info.PCOffset}); 1531 } else if (AttrSpec.Attr == dwarf::DW_AT_declaration && Value) 1532 Info.IsDeclaration = true; 1533 1534 // check that all dwarf::DW_FORM_rnglistx are handled previously. 1535 assert((Info.HasRanges || (OriginalForm != dwarf::DW_FORM_rnglistx)) && 1536 "Unhandled DW_FORM_rnglistx attribute"); 1537 1538 return AttrSize; 1539 } 1540 1541 /// Clone \p InputDIE's attribute described by \p AttrSpec with 1542 /// value \p Val, and add it to \p Die. 1543 /// \returns the size of the cloned attribute. 1544 unsigned DWARFLinker::DIECloner::cloneAttribute( 1545 DIE &Die, const DWARFDie &InputDIE, const DWARFFile &File, 1546 CompileUnit &Unit, const DWARFFormValue &Val, const AttributeSpec AttrSpec, 1547 unsigned AttrSize, AttributesInfo &Info, bool IsLittleEndian) { 1548 const DWARFUnit &U = Unit.getOrigUnit(); 1549 1550 switch (AttrSpec.Form) { 1551 case dwarf::DW_FORM_strp: 1552 case dwarf::DW_FORM_line_strp: 1553 case dwarf::DW_FORM_string: 1554 case dwarf::DW_FORM_strx: 1555 case dwarf::DW_FORM_strx1: 1556 case dwarf::DW_FORM_strx2: 1557 case dwarf::DW_FORM_strx3: 1558 case dwarf::DW_FORM_strx4: 1559 return cloneStringAttribute(Die, AttrSpec, Val, U, Info); 1560 case dwarf::DW_FORM_ref_addr: 1561 case dwarf::DW_FORM_ref1: 1562 case dwarf::DW_FORM_ref2: 1563 case dwarf::DW_FORM_ref4: 1564 case dwarf::DW_FORM_ref8: 1565 return cloneDieReferenceAttribute(Die, InputDIE, AttrSpec, AttrSize, Val, 1566 File, Unit); 1567 case dwarf::DW_FORM_block: 1568 case dwarf::DW_FORM_block1: 1569 case dwarf::DW_FORM_block2: 1570 case dwarf::DW_FORM_block4: 1571 case dwarf::DW_FORM_exprloc: 1572 return cloneBlockAttribute(Die, InputDIE, File, Unit, AttrSpec, Val, 1573 IsLittleEndian); 1574 case dwarf::DW_FORM_addr: 1575 case dwarf::DW_FORM_addrx: 1576 case dwarf::DW_FORM_addrx1: 1577 case dwarf::DW_FORM_addrx2: 1578 case dwarf::DW_FORM_addrx3: 1579 case dwarf::DW_FORM_addrx4: 1580 return cloneAddressAttribute(Die, InputDIE, AttrSpec, AttrSize, Val, Unit, 1581 Info); 1582 case dwarf::DW_FORM_data1: 1583 case dwarf::DW_FORM_data2: 1584 case dwarf::DW_FORM_data4: 1585 case dwarf::DW_FORM_data8: 1586 case dwarf::DW_FORM_udata: 1587 case dwarf::DW_FORM_sdata: 1588 case dwarf::DW_FORM_sec_offset: 1589 case dwarf::DW_FORM_flag: 1590 case dwarf::DW_FORM_flag_present: 1591 case dwarf::DW_FORM_rnglistx: 1592 case dwarf::DW_FORM_loclistx: 1593 case dwarf::DW_FORM_implicit_const: 1594 return cloneScalarAttribute(Die, InputDIE, File, Unit, AttrSpec, Val, 1595 AttrSize, Info); 1596 default: 1597 Linker.reportWarning("Unsupported attribute form " + 1598 dwarf::FormEncodingString(AttrSpec.Form) + 1599 " in cloneAttribute. Dropping.", 1600 File, &InputDIE); 1601 } 1602 1603 return 0; 1604 } 1605 1606 void DWARFLinker::DIECloner::addObjCAccelerator(CompileUnit &Unit, 1607 const DIE *Die, 1608 DwarfStringPoolEntryRef Name, 1609 OffsetsStringPool &StringPool, 1610 bool SkipPubSection) { 1611 std::optional<ObjCSelectorNames> Names = 1612 getObjCNamesIfSelector(Name.getString()); 1613 if (!Names) 1614 return; 1615 Unit.addNameAccelerator(Die, StringPool.getEntry(Names->Selector), 1616 SkipPubSection); 1617 Unit.addObjCAccelerator(Die, StringPool.getEntry(Names->ClassName), 1618 SkipPubSection); 1619 if (Names->ClassNameNoCategory) 1620 Unit.addObjCAccelerator( 1621 Die, StringPool.getEntry(*Names->ClassNameNoCategory), SkipPubSection); 1622 if (Names->MethodNameNoCategory) 1623 Unit.addNameAccelerator( 1624 Die, StringPool.getEntry(*Names->MethodNameNoCategory), SkipPubSection); 1625 } 1626 1627 static bool 1628 shouldSkipAttribute(bool Update, 1629 DWARFAbbreviationDeclaration::AttributeSpec AttrSpec, 1630 bool SkipPC) { 1631 switch (AttrSpec.Attr) { 1632 default: 1633 return false; 1634 case dwarf::DW_AT_low_pc: 1635 case dwarf::DW_AT_high_pc: 1636 case dwarf::DW_AT_ranges: 1637 return !Update && SkipPC; 1638 case dwarf::DW_AT_rnglists_base: 1639 // In case !Update the .debug_addr table is not generated/preserved. 1640 // Thus instead of DW_FORM_rnglistx the DW_FORM_sec_offset is used. 1641 // Since DW_AT_rnglists_base is used for only DW_FORM_rnglistx the 1642 // DW_AT_rnglists_base is removed. 1643 return !Update; 1644 case dwarf::DW_AT_loclists_base: 1645 // In case !Update the .debug_addr table is not generated/preserved. 1646 // Thus instead of DW_FORM_loclistx the DW_FORM_sec_offset is used. 1647 // Since DW_AT_loclists_base is used for only DW_FORM_loclistx the 1648 // DW_AT_loclists_base is removed. 1649 return !Update; 1650 case dwarf::DW_AT_location: 1651 case dwarf::DW_AT_frame_base: 1652 return !Update && SkipPC; 1653 } 1654 } 1655 1656 struct AttributeLinkedOffsetFixup { 1657 int64_t LinkedOffsetFixupVal; 1658 uint64_t InputAttrStartOffset; 1659 uint64_t InputAttrEndOffset; 1660 }; 1661 1662 DIE *DWARFLinker::DIECloner::cloneDIE(const DWARFDie &InputDIE, 1663 const DWARFFile &File, CompileUnit &Unit, 1664 int64_t PCOffset, uint32_t OutOffset, 1665 unsigned Flags, bool IsLittleEndian, 1666 DIE *Die) { 1667 DWARFUnit &U = Unit.getOrigUnit(); 1668 unsigned Idx = U.getDIEIndex(InputDIE); 1669 CompileUnit::DIEInfo &Info = Unit.getInfo(Idx); 1670 1671 // Should the DIE appear in the output? 1672 if (!Unit.getInfo(Idx).Keep) 1673 return nullptr; 1674 1675 uint64_t Offset = InputDIE.getOffset(); 1676 assert(!(Die && Info.Clone) && "Can't supply a DIE and a cloned DIE"); 1677 if (!Die) { 1678 // The DIE might have been already created by a forward reference 1679 // (see cloneDieReferenceAttribute()). 1680 if (!Info.Clone) 1681 Info.Clone = DIE::get(DIEAlloc, dwarf::Tag(InputDIE.getTag())); 1682 Die = Info.Clone; 1683 } 1684 1685 assert(Die->getTag() == InputDIE.getTag()); 1686 Die->setOffset(OutOffset); 1687 if (isODRCanonicalCandidate(InputDIE, Unit) && Info.Ctxt && 1688 (Info.Ctxt->getCanonicalDIEOffset() == 0)) { 1689 if (!Info.Ctxt->hasCanonicalDIE()) 1690 Info.Ctxt->setHasCanonicalDIE(); 1691 // We are about to emit a DIE that is the root of its own valid 1692 // DeclContext tree. Make the current offset the canonical offset 1693 // for this context. 1694 Info.Ctxt->setCanonicalDIEOffset(OutOffset + Unit.getStartOffset()); 1695 } 1696 1697 // Extract and clone every attribute. 1698 DWARFDataExtractor Data = U.getDebugInfoExtractor(); 1699 // Point to the next DIE (generally there is always at least a NULL 1700 // entry after the current one). If this is a lone 1701 // DW_TAG_compile_unit without any children, point to the next unit. 1702 uint64_t NextOffset = (Idx + 1 < U.getNumDIEs()) 1703 ? U.getDIEAtIndex(Idx + 1).getOffset() 1704 : U.getNextUnitOffset(); 1705 AttributesInfo AttrInfo; 1706 1707 // We could copy the data only if we need to apply a relocation to it. After 1708 // testing, it seems there is no performance downside to doing the copy 1709 // unconditionally, and it makes the code simpler. 1710 SmallString<40> DIECopy(Data.getData().substr(Offset, NextOffset - Offset)); 1711 Data = 1712 DWARFDataExtractor(DIECopy, Data.isLittleEndian(), Data.getAddressSize()); 1713 1714 // Modify the copy with relocated addresses. 1715 ObjFile.Addresses->applyValidRelocs(DIECopy, Offset, Data.isLittleEndian()); 1716 1717 // Reset the Offset to 0 as we will be working on the local copy of 1718 // the data. 1719 Offset = 0; 1720 1721 const auto *Abbrev = InputDIE.getAbbreviationDeclarationPtr(); 1722 Offset += getULEB128Size(Abbrev->getCode()); 1723 1724 // We are entering a subprogram. Get and propagate the PCOffset. 1725 if (Die->getTag() == dwarf::DW_TAG_subprogram) 1726 PCOffset = Info.AddrAdjust; 1727 AttrInfo.PCOffset = PCOffset; 1728 1729 if (Abbrev->getTag() == dwarf::DW_TAG_subprogram) { 1730 Flags |= TF_InFunctionScope; 1731 if (!Info.InDebugMap && LLVM_LIKELY(!Update)) 1732 Flags |= TF_SkipPC; 1733 } else if (Abbrev->getTag() == dwarf::DW_TAG_variable) { 1734 // Function-local globals could be in the debug map even when the function 1735 // is not, e.g., inlined functions. 1736 if ((Flags & TF_InFunctionScope) && Info.InDebugMap) 1737 Flags &= ~TF_SkipPC; 1738 // Location expressions referencing an address which is not in debug map 1739 // should be deleted. 1740 else if (!Info.InDebugMap && Info.HasLocationExpressionAddr && 1741 LLVM_LIKELY(!Update)) 1742 Flags |= TF_SkipPC; 1743 } 1744 1745 std::optional<StringRef> LibraryInstallName = 1746 ObjFile.Addresses->getLibraryInstallName(); 1747 SmallVector<AttributeLinkedOffsetFixup> AttributesFixups; 1748 for (const auto &AttrSpec : Abbrev->attributes()) { 1749 if (shouldSkipAttribute(Update, AttrSpec, Flags & TF_SkipPC)) { 1750 DWARFFormValue::skipValue(AttrSpec.Form, Data, &Offset, 1751 U.getFormParams()); 1752 continue; 1753 } 1754 1755 AttributeLinkedOffsetFixup CurAttrFixup; 1756 CurAttrFixup.InputAttrStartOffset = InputDIE.getOffset() + Offset; 1757 CurAttrFixup.LinkedOffsetFixupVal = 1758 Unit.getStartOffset() + OutOffset - CurAttrFixup.InputAttrStartOffset; 1759 1760 DWARFFormValue Val = AttrSpec.getFormValue(); 1761 uint64_t AttrSize = Offset; 1762 Val.extractValue(Data, &Offset, U.getFormParams(), &U); 1763 CurAttrFixup.InputAttrEndOffset = InputDIE.getOffset() + Offset; 1764 AttrSize = Offset - AttrSize; 1765 1766 uint64_t FinalAttrSize = 1767 cloneAttribute(*Die, InputDIE, File, Unit, Val, AttrSpec, AttrSize, 1768 AttrInfo, IsLittleEndian); 1769 if (FinalAttrSize != 0 && ObjFile.Addresses->needToSaveValidRelocs()) 1770 AttributesFixups.push_back(CurAttrFixup); 1771 1772 OutOffset += FinalAttrSize; 1773 } 1774 1775 uint16_t Tag = InputDIE.getTag(); 1776 // Add the DW_AT_APPLE_origin attribute to Compile Unit die if we have 1777 // an install name and the DWARF doesn't have the attribute yet. 1778 const bool NeedsAppleOrigin = (Tag == dwarf::DW_TAG_compile_unit) && 1779 LibraryInstallName.has_value() && 1780 !AttrInfo.HasAppleOrigin; 1781 if (NeedsAppleOrigin) { 1782 auto StringEntry = DebugStrPool.getEntry(LibraryInstallName.value()); 1783 Die->addValue(DIEAlloc, dwarf::Attribute(dwarf::DW_AT_APPLE_origin), 1784 dwarf::DW_FORM_strp, DIEInteger(StringEntry.getOffset())); 1785 AttrInfo.Name = StringEntry; 1786 OutOffset += 4; 1787 } 1788 1789 // Look for accelerator entries. 1790 // FIXME: This is slightly wrong. An inline_subroutine without a 1791 // low_pc, but with AT_ranges might be interesting to get into the 1792 // accelerator tables too. For now stick with dsymutil's behavior. 1793 if ((Info.InDebugMap || AttrInfo.HasLowPc || AttrInfo.HasRanges) && 1794 Tag != dwarf::DW_TAG_compile_unit && 1795 getDIENames(InputDIE, AttrInfo, DebugStrPool, 1796 Tag != dwarf::DW_TAG_inlined_subroutine)) { 1797 if (AttrInfo.MangledName && AttrInfo.MangledName != AttrInfo.Name) 1798 Unit.addNameAccelerator(Die, AttrInfo.MangledName, 1799 Tag == dwarf::DW_TAG_inlined_subroutine); 1800 if (AttrInfo.Name) { 1801 if (AttrInfo.NameWithoutTemplate) 1802 Unit.addNameAccelerator(Die, AttrInfo.NameWithoutTemplate, 1803 /* SkipPubSection */ true); 1804 Unit.addNameAccelerator(Die, AttrInfo.Name, 1805 Tag == dwarf::DW_TAG_inlined_subroutine); 1806 } 1807 if (AttrInfo.Name) 1808 addObjCAccelerator(Unit, Die, AttrInfo.Name, DebugStrPool, 1809 /* SkipPubSection =*/true); 1810 1811 } else if (Tag == dwarf::DW_TAG_namespace) { 1812 if (!AttrInfo.Name) 1813 AttrInfo.Name = DebugStrPool.getEntry("(anonymous namespace)"); 1814 Unit.addNamespaceAccelerator(Die, AttrInfo.Name); 1815 } else if (Tag == dwarf::DW_TAG_imported_declaration && AttrInfo.Name) { 1816 Unit.addNamespaceAccelerator(Die, AttrInfo.Name); 1817 } else if (isTypeTag(Tag) && !AttrInfo.IsDeclaration && 1818 getDIENames(InputDIE, AttrInfo, DebugStrPool) && AttrInfo.Name && 1819 AttrInfo.Name.getString()[0]) { 1820 uint32_t Hash = hashFullyQualifiedName(InputDIE, Unit, File); 1821 uint64_t RuntimeLang = 1822 dwarf::toUnsigned(InputDIE.find(dwarf::DW_AT_APPLE_runtime_class)) 1823 .value_or(0); 1824 bool ObjCClassIsImplementation = 1825 (RuntimeLang == dwarf::DW_LANG_ObjC || 1826 RuntimeLang == dwarf::DW_LANG_ObjC_plus_plus) && 1827 dwarf::toUnsigned(InputDIE.find(dwarf::DW_AT_APPLE_objc_complete_type)) 1828 .value_or(0); 1829 Unit.addTypeAccelerator(Die, AttrInfo.Name, ObjCClassIsImplementation, 1830 Hash); 1831 } 1832 1833 // Determine whether there are any children that we want to keep. 1834 bool HasChildren = false; 1835 for (auto Child : InputDIE.children()) { 1836 unsigned Idx = U.getDIEIndex(Child); 1837 if (Unit.getInfo(Idx).Keep) { 1838 HasChildren = true; 1839 break; 1840 } 1841 } 1842 1843 if (Unit.getOrigUnit().getVersion() >= 5 && !AttrInfo.AttrStrOffsetBaseSeen && 1844 Die->getTag() == dwarf::DW_TAG_compile_unit) { 1845 // No DW_AT_str_offsets_base seen, add it to the DIE. 1846 Die->addValue(DIEAlloc, dwarf::DW_AT_str_offsets_base, 1847 dwarf::DW_FORM_sec_offset, DIEInteger(8)); 1848 OutOffset += 4; 1849 } 1850 1851 DIEAbbrev NewAbbrev = Die->generateAbbrev(); 1852 if (HasChildren) 1853 NewAbbrev.setChildrenFlag(dwarf::DW_CHILDREN_yes); 1854 // Assign a permanent abbrev number 1855 Linker.assignAbbrev(NewAbbrev); 1856 Die->setAbbrevNumber(NewAbbrev.getNumber()); 1857 1858 uint64_t AbbrevNumberSize = getULEB128Size(Die->getAbbrevNumber()); 1859 1860 // Add the size of the abbreviation number to the output offset. 1861 OutOffset += AbbrevNumberSize; 1862 1863 // Update fixups with the size of the abbreviation number 1864 for (AttributeLinkedOffsetFixup &F : AttributesFixups) 1865 F.LinkedOffsetFixupVal += AbbrevNumberSize; 1866 1867 for (AttributeLinkedOffsetFixup &F : AttributesFixups) 1868 ObjFile.Addresses->updateAndSaveValidRelocs( 1869 Unit.getOrigUnit().getVersion() >= 5, Unit.getOrigUnit().getOffset(), 1870 F.LinkedOffsetFixupVal, F.InputAttrStartOffset, F.InputAttrEndOffset); 1871 1872 if (!HasChildren) { 1873 // Update our size. 1874 Die->setSize(OutOffset - Die->getOffset()); 1875 return Die; 1876 } 1877 1878 // Recursively clone children. 1879 for (auto Child : InputDIE.children()) { 1880 if (DIE *Clone = cloneDIE(Child, File, Unit, PCOffset, OutOffset, Flags, 1881 IsLittleEndian)) { 1882 Die->addChild(Clone); 1883 OutOffset = Clone->getOffset() + Clone->getSize(); 1884 } 1885 } 1886 1887 // Account for the end of children marker. 1888 OutOffset += sizeof(int8_t); 1889 // Update our size. 1890 Die->setSize(OutOffset - Die->getOffset()); 1891 return Die; 1892 } 1893 1894 /// Patch the input object file relevant debug_ranges or debug_rnglists 1895 /// entries and emit them in the output file. Update the relevant attributes 1896 /// to point at the new entries. 1897 void DWARFLinker::generateUnitRanges(CompileUnit &Unit, const DWARFFile &File, 1898 DebugDieValuePool &AddrPool) const { 1899 if (LLVM_UNLIKELY(Options.Update)) 1900 return; 1901 1902 const auto &FunctionRanges = Unit.getFunctionRanges(); 1903 1904 // Build set of linked address ranges for unit function ranges. 1905 AddressRanges LinkedFunctionRanges; 1906 for (const AddressRangeValuePair &Range : FunctionRanges) 1907 LinkedFunctionRanges.insert( 1908 {Range.Range.start() + Range.Value, Range.Range.end() + Range.Value}); 1909 1910 // Emit LinkedFunctionRanges into .debug_aranges 1911 if (!LinkedFunctionRanges.empty()) 1912 TheDwarfEmitter->emitDwarfDebugArangesTable(Unit, LinkedFunctionRanges); 1913 1914 RngListAttributesTy AllRngListAttributes = Unit.getRangesAttributes(); 1915 std::optional<PatchLocation> UnitRngListAttribute = 1916 Unit.getUnitRangesAttribute(); 1917 1918 if (!AllRngListAttributes.empty() || UnitRngListAttribute) { 1919 std::optional<AddressRangeValuePair> CachedRange; 1920 MCSymbol *EndLabel = TheDwarfEmitter->emitDwarfDebugRangeListHeader(Unit); 1921 1922 // Read original address ranges, apply relocation value, emit linked address 1923 // ranges. 1924 for (PatchLocation &AttributePatch : AllRngListAttributes) { 1925 // Get ranges from the source DWARF corresponding to the current 1926 // attribute. 1927 AddressRanges LinkedRanges; 1928 if (Expected<DWARFAddressRangesVector> OriginalRanges = 1929 Unit.getOrigUnit().findRnglistFromOffset(AttributePatch.get())) { 1930 // Apply relocation adjustment. 1931 for (const auto &Range : *OriginalRanges) { 1932 if (!CachedRange || !CachedRange->Range.contains(Range.LowPC)) 1933 CachedRange = FunctionRanges.getRangeThatContains(Range.LowPC); 1934 1935 // All range entries should lie in the function range. 1936 if (!CachedRange) { 1937 reportWarning("inconsistent range data.", File); 1938 continue; 1939 } 1940 1941 // Store range for emiting. 1942 LinkedRanges.insert({Range.LowPC + CachedRange->Value, 1943 Range.HighPC + CachedRange->Value}); 1944 } 1945 } else { 1946 llvm::consumeError(OriginalRanges.takeError()); 1947 reportWarning("invalid range list ignored.", File); 1948 } 1949 1950 // Emit linked ranges. 1951 TheDwarfEmitter->emitDwarfDebugRangeListFragment( 1952 Unit, LinkedRanges, AttributePatch, AddrPool); 1953 } 1954 1955 // Emit ranges for Unit AT_ranges attribute. 1956 if (UnitRngListAttribute.has_value()) 1957 TheDwarfEmitter->emitDwarfDebugRangeListFragment( 1958 Unit, LinkedFunctionRanges, *UnitRngListAttribute, AddrPool); 1959 1960 // Emit ranges footer. 1961 TheDwarfEmitter->emitDwarfDebugRangeListFooter(Unit, EndLabel); 1962 } 1963 } 1964 1965 void DWARFLinker::DIECloner::generateUnitLocations( 1966 CompileUnit &Unit, const DWARFFile &File, 1967 ExpressionHandlerRef ExprHandler) { 1968 if (LLVM_UNLIKELY(Linker.Options.Update)) 1969 return; 1970 1971 const LocListAttributesTy &AllLocListAttributes = 1972 Unit.getLocationAttributes(); 1973 1974 if (AllLocListAttributes.empty()) 1975 return; 1976 1977 // Emit locations list table header. 1978 MCSymbol *EndLabel = Emitter->emitDwarfDebugLocListHeader(Unit); 1979 1980 for (auto &CurLocAttr : AllLocListAttributes) { 1981 // Get location expressions vector corresponding to the current attribute 1982 // from the source DWARF. 1983 Expected<DWARFLocationExpressionsVector> OriginalLocations = 1984 Unit.getOrigUnit().findLoclistFromOffset(CurLocAttr.get()); 1985 1986 if (!OriginalLocations) { 1987 llvm::consumeError(OriginalLocations.takeError()); 1988 Linker.reportWarning("Invalid location attribute ignored.", File); 1989 continue; 1990 } 1991 1992 DWARFLocationExpressionsVector LinkedLocationExpressions; 1993 for (DWARFLocationExpression &CurExpression : *OriginalLocations) { 1994 DWARFLocationExpression LinkedExpression; 1995 1996 if (CurExpression.Range) { 1997 // Relocate address range. 1998 LinkedExpression.Range = { 1999 CurExpression.Range->LowPC + CurLocAttr.RelocAdjustment, 2000 CurExpression.Range->HighPC + CurLocAttr.RelocAdjustment}; 2001 } 2002 2003 // Clone expression. 2004 LinkedExpression.Expr.reserve(CurExpression.Expr.size()); 2005 ExprHandler(CurExpression.Expr, LinkedExpression.Expr, 2006 CurLocAttr.RelocAdjustment); 2007 2008 LinkedLocationExpressions.push_back(LinkedExpression); 2009 } 2010 2011 // Emit locations list table fragment corresponding to the CurLocAttr. 2012 Emitter->emitDwarfDebugLocListFragment(Unit, LinkedLocationExpressions, 2013 CurLocAttr, AddrPool); 2014 } 2015 2016 // Emit locations list table footer. 2017 Emitter->emitDwarfDebugLocListFooter(Unit, EndLabel); 2018 } 2019 2020 static void patchAddrBase(DIE &Die, DIEInteger Offset) { 2021 for (auto &V : Die.values()) 2022 if (V.getAttribute() == dwarf::DW_AT_addr_base) { 2023 V = DIEValue(V.getAttribute(), V.getForm(), Offset); 2024 return; 2025 } 2026 2027 llvm_unreachable("Didn't find a DW_AT_addr_base in cloned DIE!"); 2028 } 2029 2030 void DWARFLinker::DIECloner::emitDebugAddrSection( 2031 CompileUnit &Unit, const uint16_t DwarfVersion) const { 2032 2033 if (LLVM_UNLIKELY(Linker.Options.Update)) 2034 return; 2035 2036 if (DwarfVersion < 5) 2037 return; 2038 2039 if (AddrPool.getValues().empty()) 2040 return; 2041 2042 MCSymbol *EndLabel = Emitter->emitDwarfDebugAddrsHeader(Unit); 2043 patchAddrBase(*Unit.getOutputUnitDIE(), 2044 DIEInteger(Emitter->getDebugAddrSectionSize())); 2045 Emitter->emitDwarfDebugAddrs(AddrPool.getValues(), 2046 Unit.getOrigUnit().getAddressByteSize()); 2047 Emitter->emitDwarfDebugAddrsFooter(Unit, EndLabel); 2048 } 2049 2050 /// Insert the new line info sequence \p Seq into the current 2051 /// set of already linked line info \p Rows. 2052 static void insertLineSequence(std::vector<DWARFDebugLine::Row> &Seq, 2053 std::vector<DWARFDebugLine::Row> &Rows) { 2054 if (Seq.empty()) 2055 return; 2056 2057 if (!Rows.empty() && Rows.back().Address < Seq.front().Address) { 2058 llvm::append_range(Rows, Seq); 2059 Seq.clear(); 2060 return; 2061 } 2062 2063 object::SectionedAddress Front = Seq.front().Address; 2064 auto InsertPoint = partition_point( 2065 Rows, [=](const DWARFDebugLine::Row &O) { return O.Address < Front; }); 2066 2067 // FIXME: this only removes the unneeded end_sequence if the 2068 // sequences have been inserted in order. Using a global sort like 2069 // described in generateLineTableForUnit() and delaying the end_sequene 2070 // elimination to emitLineTableForUnit() we can get rid of all of them. 2071 if (InsertPoint != Rows.end() && InsertPoint->Address == Front && 2072 InsertPoint->EndSequence) { 2073 *InsertPoint = Seq.front(); 2074 Rows.insert(InsertPoint + 1, Seq.begin() + 1, Seq.end()); 2075 } else { 2076 Rows.insert(InsertPoint, Seq.begin(), Seq.end()); 2077 } 2078 2079 Seq.clear(); 2080 } 2081 2082 static void patchStmtList(DIE &Die, DIEInteger Offset) { 2083 for (auto &V : Die.values()) 2084 if (V.getAttribute() == dwarf::DW_AT_stmt_list) { 2085 V = DIEValue(V.getAttribute(), V.getForm(), Offset); 2086 return; 2087 } 2088 2089 llvm_unreachable("Didn't find DW_AT_stmt_list in cloned DIE!"); 2090 } 2091 2092 void DWARFLinker::DIECloner::rememberUnitForMacroOffset(CompileUnit &Unit) { 2093 DWARFUnit &OrigUnit = Unit.getOrigUnit(); 2094 DWARFDie OrigUnitDie = OrigUnit.getUnitDIE(); 2095 2096 if (std::optional<uint64_t> MacroAttr = 2097 dwarf::toSectionOffset(OrigUnitDie.find(dwarf::DW_AT_macros))) { 2098 UnitMacroMap.insert(std::make_pair(*MacroAttr, &Unit)); 2099 return; 2100 } 2101 2102 if (std::optional<uint64_t> MacroAttr = 2103 dwarf::toSectionOffset(OrigUnitDie.find(dwarf::DW_AT_macro_info))) { 2104 UnitMacroMap.insert(std::make_pair(*MacroAttr, &Unit)); 2105 return; 2106 } 2107 } 2108 2109 void DWARFLinker::DIECloner::generateLineTableForUnit(CompileUnit &Unit) { 2110 if (LLVM_UNLIKELY(Emitter == nullptr)) 2111 return; 2112 2113 // Check whether DW_AT_stmt_list attribute is presented. 2114 DWARFDie CUDie = Unit.getOrigUnit().getUnitDIE(); 2115 auto StmtList = dwarf::toSectionOffset(CUDie.find(dwarf::DW_AT_stmt_list)); 2116 if (!StmtList) 2117 return; 2118 2119 // Update the cloned DW_AT_stmt_list with the correct debug_line offset. 2120 if (auto *OutputDIE = Unit.getOutputUnitDIE()) 2121 patchStmtList(*OutputDIE, DIEInteger(Emitter->getLineSectionSize())); 2122 2123 if (const DWARFDebugLine::LineTable *LT = 2124 ObjFile.Dwarf->getLineTableForUnit(&Unit.getOrigUnit())) { 2125 2126 DWARFDebugLine::LineTable LineTable; 2127 2128 // Set Line Table header. 2129 LineTable.Prologue = LT->Prologue; 2130 2131 // Set Line Table Rows. 2132 if (Linker.Options.Update) { 2133 LineTable.Rows = LT->Rows; 2134 // If all the line table contains is a DW_LNE_end_sequence, clear the line 2135 // table rows, it will be inserted again in the DWARFStreamer. 2136 if (LineTable.Rows.size() == 1 && LineTable.Rows[0].EndSequence) 2137 LineTable.Rows.clear(); 2138 2139 LineTable.Sequences = LT->Sequences; 2140 } else { 2141 // This vector is the output line table. 2142 std::vector<DWARFDebugLine::Row> NewRows; 2143 NewRows.reserve(LT->Rows.size()); 2144 2145 // Current sequence of rows being extracted, before being inserted 2146 // in NewRows. 2147 std::vector<DWARFDebugLine::Row> Seq; 2148 2149 const auto &FunctionRanges = Unit.getFunctionRanges(); 2150 std::optional<AddressRangeValuePair> CurrRange; 2151 2152 // FIXME: This logic is meant to generate exactly the same output as 2153 // Darwin's classic dsymutil. There is a nicer way to implement this 2154 // by simply putting all the relocated line info in NewRows and simply 2155 // sorting NewRows before passing it to emitLineTableForUnit. This 2156 // should be correct as sequences for a function should stay 2157 // together in the sorted output. There are a few corner cases that 2158 // look suspicious though, and that required to implement the logic 2159 // this way. Revisit that once initial validation is finished. 2160 2161 // Iterate over the object file line info and extract the sequences 2162 // that correspond to linked functions. 2163 for (DWARFDebugLine::Row Row : LT->Rows) { 2164 // Check whether we stepped out of the range. The range is 2165 // half-open, but consider accept the end address of the range if 2166 // it is marked as end_sequence in the input (because in that 2167 // case, the relocation offset is accurate and that entry won't 2168 // serve as the start of another function). 2169 if (!CurrRange || !CurrRange->Range.contains(Row.Address.Address)) { 2170 // We just stepped out of a known range. Insert a end_sequence 2171 // corresponding to the end of the range. 2172 uint64_t StopAddress = 2173 CurrRange ? CurrRange->Range.end() + CurrRange->Value : -1ULL; 2174 CurrRange = FunctionRanges.getRangeThatContains(Row.Address.Address); 2175 if (StopAddress != -1ULL && !Seq.empty()) { 2176 // Insert end sequence row with the computed end address, but 2177 // the same line as the previous one. 2178 auto NextLine = Seq.back(); 2179 NextLine.Address.Address = StopAddress; 2180 NextLine.EndSequence = 1; 2181 NextLine.PrologueEnd = 0; 2182 NextLine.BasicBlock = 0; 2183 NextLine.EpilogueBegin = 0; 2184 Seq.push_back(NextLine); 2185 insertLineSequence(Seq, NewRows); 2186 } 2187 2188 if (!CurrRange) 2189 continue; 2190 } 2191 2192 // Ignore empty sequences. 2193 if (Row.EndSequence && Seq.empty()) 2194 continue; 2195 2196 // Relocate row address and add it to the current sequence. 2197 Row.Address.Address += CurrRange->Value; 2198 Seq.emplace_back(Row); 2199 2200 if (Row.EndSequence) 2201 insertLineSequence(Seq, NewRows); 2202 } 2203 2204 LineTable.Rows = std::move(NewRows); 2205 } 2206 2207 Emitter->emitLineTableForUnit(LineTable, Unit, DebugStrPool, 2208 DebugLineStrPool); 2209 } else 2210 Linker.reportWarning("Cann't load line table.", ObjFile); 2211 } 2212 2213 void DWARFLinker::emitAcceleratorEntriesForUnit(CompileUnit &Unit) { 2214 for (AccelTableKind AccelTableKind : Options.AccelTables) { 2215 switch (AccelTableKind) { 2216 case AccelTableKind::Apple: { 2217 // Add namespaces. 2218 for (const auto &Namespace : Unit.getNamespaces()) 2219 AppleNamespaces.addName(Namespace.Name, Namespace.Die->getOffset() + 2220 Unit.getStartOffset()); 2221 // Add names. 2222 for (const auto &Pubname : Unit.getPubnames()) 2223 AppleNames.addName(Pubname.Name, 2224 Pubname.Die->getOffset() + Unit.getStartOffset()); 2225 // Add types. 2226 for (const auto &Pubtype : Unit.getPubtypes()) 2227 AppleTypes.addName( 2228 Pubtype.Name, Pubtype.Die->getOffset() + Unit.getStartOffset(), 2229 Pubtype.Die->getTag(), 2230 Pubtype.ObjcClassImplementation ? dwarf::DW_FLAG_type_implementation 2231 : 0, 2232 Pubtype.QualifiedNameHash); 2233 // Add ObjC names. 2234 for (const auto &ObjC : Unit.getObjC()) 2235 AppleObjc.addName(ObjC.Name, 2236 ObjC.Die->getOffset() + Unit.getStartOffset()); 2237 } break; 2238 case AccelTableKind::Pub: { 2239 TheDwarfEmitter->emitPubNamesForUnit(Unit); 2240 TheDwarfEmitter->emitPubTypesForUnit(Unit); 2241 } break; 2242 case AccelTableKind::DebugNames: { 2243 for (const auto &Namespace : Unit.getNamespaces()) 2244 DebugNames.addName( 2245 Namespace.Name, Namespace.Die->getOffset(), 2246 DWARF5AccelTableData::getDefiningParentDieOffset(*Namespace.Die), 2247 Namespace.Die->getTag(), Unit.getUniqueID()); 2248 for (const auto &Pubname : Unit.getPubnames()) 2249 DebugNames.addName( 2250 Pubname.Name, Pubname.Die->getOffset(), 2251 DWARF5AccelTableData::getDefiningParentDieOffset(*Pubname.Die), 2252 Pubname.Die->getTag(), Unit.getUniqueID()); 2253 for (const auto &Pubtype : Unit.getPubtypes()) 2254 DebugNames.addName( 2255 Pubtype.Name, Pubtype.Die->getOffset(), 2256 DWARF5AccelTableData::getDefiningParentDieOffset(*Pubtype.Die), 2257 Pubtype.Die->getTag(), Unit.getUniqueID()); 2258 } break; 2259 } 2260 } 2261 } 2262 2263 /// Read the frame info stored in the object, and emit the 2264 /// patched frame descriptions for the resulting file. 2265 /// 2266 /// This is actually pretty easy as the data of the CIEs and FDEs can 2267 /// be considered as black boxes and moved as is. The only thing to do 2268 /// is to patch the addresses in the headers. 2269 void DWARFLinker::patchFrameInfoForObject(LinkContext &Context) { 2270 DWARFContext &OrigDwarf = *Context.File.Dwarf; 2271 unsigned SrcAddrSize = OrigDwarf.getDWARFObj().getAddressSize(); 2272 2273 StringRef FrameData = OrigDwarf.getDWARFObj().getFrameSection().Data; 2274 if (FrameData.empty()) 2275 return; 2276 2277 RangesTy AllUnitsRanges; 2278 for (std::unique_ptr<CompileUnit> &Unit : Context.CompileUnits) { 2279 for (auto CurRange : Unit->getFunctionRanges()) 2280 AllUnitsRanges.insert(CurRange.Range, CurRange.Value); 2281 } 2282 2283 DataExtractor Data(FrameData, OrigDwarf.isLittleEndian(), 0); 2284 uint64_t InputOffset = 0; 2285 2286 // Store the data of the CIEs defined in this object, keyed by their 2287 // offsets. 2288 DenseMap<uint64_t, StringRef> LocalCIES; 2289 2290 while (Data.isValidOffset(InputOffset)) { 2291 uint64_t EntryOffset = InputOffset; 2292 uint32_t InitialLength = Data.getU32(&InputOffset); 2293 if (InitialLength == 0xFFFFFFFF) 2294 return reportWarning("Dwarf64 bits no supported", Context.File); 2295 2296 uint32_t CIEId = Data.getU32(&InputOffset); 2297 if (CIEId == 0xFFFFFFFF) { 2298 // This is a CIE, store it. 2299 StringRef CIEData = FrameData.substr(EntryOffset, InitialLength + 4); 2300 LocalCIES[EntryOffset] = CIEData; 2301 // The -4 is to account for the CIEId we just read. 2302 InputOffset += InitialLength - 4; 2303 continue; 2304 } 2305 2306 uint64_t Loc = Data.getUnsigned(&InputOffset, SrcAddrSize); 2307 2308 // Some compilers seem to emit frame info that doesn't start at 2309 // the function entry point, thus we can't just lookup the address 2310 // in the debug map. Use the AddressInfo's range map to see if the FDE 2311 // describes something that we can relocate. 2312 std::optional<AddressRangeValuePair> Range = 2313 AllUnitsRanges.getRangeThatContains(Loc); 2314 if (!Range) { 2315 // The +4 is to account for the size of the InitialLength field itself. 2316 InputOffset = EntryOffset + InitialLength + 4; 2317 continue; 2318 } 2319 2320 // This is an FDE, and we have a mapping. 2321 // Have we already emitted a corresponding CIE? 2322 StringRef CIEData = LocalCIES[CIEId]; 2323 if (CIEData.empty()) 2324 return reportWarning("Inconsistent debug_frame content. Dropping.", 2325 Context.File); 2326 2327 // Look if we already emitted a CIE that corresponds to the 2328 // referenced one (the CIE data is the key of that lookup). 2329 auto IteratorInserted = EmittedCIEs.insert( 2330 std::make_pair(CIEData, TheDwarfEmitter->getFrameSectionSize())); 2331 // If there is no CIE yet for this ID, emit it. 2332 if (IteratorInserted.second) { 2333 LastCIEOffset = TheDwarfEmitter->getFrameSectionSize(); 2334 IteratorInserted.first->getValue() = LastCIEOffset; 2335 TheDwarfEmitter->emitCIE(CIEData); 2336 } 2337 2338 // Emit the FDE with updated address and CIE pointer. 2339 // (4 + AddrSize) is the size of the CIEId + initial_location 2340 // fields that will get reconstructed by emitFDE(). 2341 unsigned FDERemainingBytes = InitialLength - (4 + SrcAddrSize); 2342 TheDwarfEmitter->emitFDE(IteratorInserted.first->getValue(), SrcAddrSize, 2343 Loc + Range->Value, 2344 FrameData.substr(InputOffset, FDERemainingBytes)); 2345 InputOffset += FDERemainingBytes; 2346 } 2347 } 2348 2349 uint32_t DWARFLinker::DIECloner::hashFullyQualifiedName(DWARFDie DIE, 2350 CompileUnit &U, 2351 const DWARFFile &File, 2352 int ChildRecurseDepth) { 2353 const char *Name = nullptr; 2354 DWARFUnit *OrigUnit = &U.getOrigUnit(); 2355 CompileUnit *CU = &U; 2356 std::optional<DWARFFormValue> Ref; 2357 2358 while (true) { 2359 if (const char *CurrentName = DIE.getName(DINameKind::ShortName)) 2360 Name = CurrentName; 2361 2362 if (!(Ref = DIE.find(dwarf::DW_AT_specification)) && 2363 !(Ref = DIE.find(dwarf::DW_AT_abstract_origin))) 2364 break; 2365 2366 if (!Ref->isFormClass(DWARFFormValue::FC_Reference)) 2367 break; 2368 2369 CompileUnit *RefCU; 2370 if (auto RefDIE = 2371 Linker.resolveDIEReference(File, CompileUnits, *Ref, DIE, RefCU)) { 2372 CU = RefCU; 2373 OrigUnit = &RefCU->getOrigUnit(); 2374 DIE = RefDIE; 2375 } 2376 } 2377 2378 unsigned Idx = OrigUnit->getDIEIndex(DIE); 2379 if (!Name && DIE.getTag() == dwarf::DW_TAG_namespace) 2380 Name = "(anonymous namespace)"; 2381 2382 if (CU->getInfo(Idx).ParentIdx == 0 || 2383 // FIXME: dsymutil-classic compatibility. Ignore modules. 2384 CU->getOrigUnit().getDIEAtIndex(CU->getInfo(Idx).ParentIdx).getTag() == 2385 dwarf::DW_TAG_module) 2386 return djbHash(Name ? Name : "", djbHash(ChildRecurseDepth ? "" : "::")); 2387 2388 DWARFDie Die = OrigUnit->getDIEAtIndex(CU->getInfo(Idx).ParentIdx); 2389 return djbHash( 2390 (Name ? Name : ""), 2391 djbHash((Name ? "::" : ""), 2392 hashFullyQualifiedName(Die, *CU, File, ++ChildRecurseDepth))); 2393 } 2394 2395 static uint64_t getDwoId(const DWARFDie &CUDie) { 2396 auto DwoId = dwarf::toUnsigned( 2397 CUDie.find({dwarf::DW_AT_dwo_id, dwarf::DW_AT_GNU_dwo_id})); 2398 if (DwoId) 2399 return *DwoId; 2400 return 0; 2401 } 2402 2403 static std::string 2404 remapPath(StringRef Path, 2405 const DWARFLinkerBase::ObjectPrefixMapTy &ObjectPrefixMap) { 2406 if (ObjectPrefixMap.empty()) 2407 return Path.str(); 2408 2409 SmallString<256> p = Path; 2410 for (const auto &Entry : ObjectPrefixMap) 2411 if (llvm::sys::path::replace_path_prefix(p, Entry.first, Entry.second)) 2412 break; 2413 return p.str().str(); 2414 } 2415 2416 static std::string 2417 getPCMFile(const DWARFDie &CUDie, 2418 const DWARFLinkerBase::ObjectPrefixMapTy *ObjectPrefixMap) { 2419 std::string PCMFile = dwarf::toString( 2420 CUDie.find({dwarf::DW_AT_dwo_name, dwarf::DW_AT_GNU_dwo_name}), ""); 2421 2422 if (PCMFile.empty()) 2423 return PCMFile; 2424 2425 if (ObjectPrefixMap) 2426 PCMFile = remapPath(PCMFile, *ObjectPrefixMap); 2427 2428 return PCMFile; 2429 } 2430 2431 std::pair<bool, bool> DWARFLinker::isClangModuleRef(const DWARFDie &CUDie, 2432 std::string &PCMFile, 2433 LinkContext &Context, 2434 unsigned Indent, 2435 bool Quiet) { 2436 if (PCMFile.empty()) 2437 return std::make_pair(false, false); 2438 2439 // Clang module DWARF skeleton CUs abuse this for the path to the module. 2440 uint64_t DwoId = getDwoId(CUDie); 2441 2442 std::string Name = dwarf::toString(CUDie.find(dwarf::DW_AT_name), ""); 2443 if (Name.empty()) { 2444 if (!Quiet) 2445 reportWarning("Anonymous module skeleton CU for " + PCMFile, 2446 Context.File); 2447 return std::make_pair(true, true); 2448 } 2449 2450 if (!Quiet && Options.Verbose) { 2451 outs().indent(Indent); 2452 outs() << "Found clang module reference " << PCMFile; 2453 } 2454 2455 auto Cached = ClangModules.find(PCMFile); 2456 if (Cached != ClangModules.end()) { 2457 // FIXME: Until PR27449 (https://llvm.org/bugs/show_bug.cgi?id=27449) is 2458 // fixed in clang, only warn about DWO_id mismatches in verbose mode. 2459 // ASTFileSignatures will change randomly when a module is rebuilt. 2460 if (!Quiet && Options.Verbose && (Cached->second != DwoId)) 2461 reportWarning(Twine("hash mismatch: this object file was built against a " 2462 "different version of the module ") + 2463 PCMFile, 2464 Context.File); 2465 if (!Quiet && Options.Verbose) 2466 outs() << " [cached].\n"; 2467 return std::make_pair(true, true); 2468 } 2469 2470 return std::make_pair(true, false); 2471 } 2472 2473 bool DWARFLinker::registerModuleReference(const DWARFDie &CUDie, 2474 LinkContext &Context, 2475 ObjFileLoaderTy Loader, 2476 CompileUnitHandlerTy OnCUDieLoaded, 2477 unsigned Indent) { 2478 std::string PCMFile = getPCMFile(CUDie, Options.ObjectPrefixMap); 2479 std::pair<bool, bool> IsClangModuleRef = 2480 isClangModuleRef(CUDie, PCMFile, Context, Indent, false); 2481 2482 if (!IsClangModuleRef.first) 2483 return false; 2484 2485 if (IsClangModuleRef.second) 2486 return true; 2487 2488 if (Options.Verbose) 2489 outs() << " ...\n"; 2490 2491 // Cyclic dependencies are disallowed by Clang, but we still 2492 // shouldn't run into an infinite loop, so mark it as processed now. 2493 ClangModules.insert({PCMFile, getDwoId(CUDie)}); 2494 2495 if (Error E = loadClangModule(Loader, CUDie, PCMFile, Context, OnCUDieLoaded, 2496 Indent + 2)) { 2497 consumeError(std::move(E)); 2498 return false; 2499 } 2500 return true; 2501 } 2502 2503 Error DWARFLinker::loadClangModule( 2504 ObjFileLoaderTy Loader, const DWARFDie &CUDie, const std::string &PCMFile, 2505 LinkContext &Context, CompileUnitHandlerTy OnCUDieLoaded, unsigned Indent) { 2506 2507 uint64_t DwoId = getDwoId(CUDie); 2508 std::string ModuleName = dwarf::toString(CUDie.find(dwarf::DW_AT_name), ""); 2509 2510 /// Using a SmallString<0> because loadClangModule() is recursive. 2511 SmallString<0> Path(Options.PrependPath); 2512 if (sys::path::is_relative(PCMFile)) 2513 resolveRelativeObjectPath(Path, CUDie); 2514 sys::path::append(Path, PCMFile); 2515 // Don't use the cached binary holder because we have no thread-safety 2516 // guarantee and the lifetime is limited. 2517 2518 if (Loader == nullptr) { 2519 reportError("Could not load clang module: loader is not specified.\n", 2520 Context.File); 2521 return Error::success(); 2522 } 2523 2524 auto ErrOrObj = Loader(Context.File.FileName, Path); 2525 if (!ErrOrObj) 2526 return Error::success(); 2527 2528 std::unique_ptr<CompileUnit> Unit; 2529 for (const auto &CU : ErrOrObj->Dwarf->compile_units()) { 2530 OnCUDieLoaded(*CU); 2531 // Recursively get all modules imported by this one. 2532 auto ChildCUDie = CU->getUnitDIE(); 2533 if (!ChildCUDie) 2534 continue; 2535 if (!registerModuleReference(ChildCUDie, Context, Loader, OnCUDieLoaded, 2536 Indent)) { 2537 if (Unit) { 2538 std::string Err = 2539 (PCMFile + 2540 ": Clang modules are expected to have exactly 1 compile unit.\n"); 2541 reportError(Err, Context.File); 2542 return make_error<StringError>(Err, inconvertibleErrorCode()); 2543 } 2544 // FIXME: Until PR27449 (https://llvm.org/bugs/show_bug.cgi?id=27449) is 2545 // fixed in clang, only warn about DWO_id mismatches in verbose mode. 2546 // ASTFileSignatures will change randomly when a module is rebuilt. 2547 uint64_t PCMDwoId = getDwoId(ChildCUDie); 2548 if (PCMDwoId != DwoId) { 2549 if (Options.Verbose) 2550 reportWarning( 2551 Twine("hash mismatch: this object file was built against a " 2552 "different version of the module ") + 2553 PCMFile, 2554 Context.File); 2555 // Update the cache entry with the DwoId of the module loaded from disk. 2556 ClangModules[PCMFile] = PCMDwoId; 2557 } 2558 2559 // Add this module. 2560 Unit = std::make_unique<CompileUnit>(*CU, UniqueUnitID++, !Options.NoODR, 2561 ModuleName); 2562 } 2563 } 2564 2565 if (Unit) 2566 Context.ModuleUnits.emplace_back(RefModuleUnit{*ErrOrObj, std::move(Unit)}); 2567 2568 return Error::success(); 2569 } 2570 2571 uint64_t DWARFLinker::DIECloner::cloneAllCompileUnits( 2572 DWARFContext &DwarfContext, const DWARFFile &File, bool IsLittleEndian) { 2573 uint64_t OutputDebugInfoSize = 2574 (Emitter == nullptr) ? 0 : Emitter->getDebugInfoSectionSize(); 2575 const uint64_t StartOutputDebugInfoSize = OutputDebugInfoSize; 2576 2577 for (auto &CurrentUnit : CompileUnits) { 2578 const uint16_t DwarfVersion = CurrentUnit->getOrigUnit().getVersion(); 2579 const uint32_t UnitHeaderSize = DwarfVersion >= 5 ? 12 : 11; 2580 auto InputDIE = CurrentUnit->getOrigUnit().getUnitDIE(); 2581 CurrentUnit->setStartOffset(OutputDebugInfoSize); 2582 if (!InputDIE) { 2583 OutputDebugInfoSize = CurrentUnit->computeNextUnitOffset(DwarfVersion); 2584 continue; 2585 } 2586 if (CurrentUnit->getInfo(0).Keep) { 2587 // Clone the InputDIE into your Unit DIE in our compile unit since it 2588 // already has a DIE inside of it. 2589 CurrentUnit->createOutputDIE(); 2590 rememberUnitForMacroOffset(*CurrentUnit); 2591 cloneDIE(InputDIE, File, *CurrentUnit, 0 /* PC offset */, UnitHeaderSize, 2592 0, IsLittleEndian, CurrentUnit->getOutputUnitDIE()); 2593 } 2594 2595 OutputDebugInfoSize = CurrentUnit->computeNextUnitOffset(DwarfVersion); 2596 2597 if (Emitter != nullptr) { 2598 2599 generateLineTableForUnit(*CurrentUnit); 2600 2601 Linker.emitAcceleratorEntriesForUnit(*CurrentUnit); 2602 2603 if (LLVM_UNLIKELY(Linker.Options.Update)) 2604 continue; 2605 2606 Linker.generateUnitRanges(*CurrentUnit, File, AddrPool); 2607 2608 auto ProcessExpr = [&](SmallVectorImpl<uint8_t> &SrcBytes, 2609 SmallVectorImpl<uint8_t> &OutBytes, 2610 int64_t RelocAdjustment) { 2611 DWARFUnit &OrigUnit = CurrentUnit->getOrigUnit(); 2612 DataExtractor Data(SrcBytes, IsLittleEndian, 2613 OrigUnit.getAddressByteSize()); 2614 cloneExpression(Data, 2615 DWARFExpression(Data, OrigUnit.getAddressByteSize(), 2616 OrigUnit.getFormParams().Format), 2617 File, *CurrentUnit, OutBytes, RelocAdjustment, 2618 IsLittleEndian); 2619 }; 2620 generateUnitLocations(*CurrentUnit, File, ProcessExpr); 2621 emitDebugAddrSection(*CurrentUnit, DwarfVersion); 2622 } 2623 AddrPool.clear(); 2624 } 2625 2626 if (Emitter != nullptr) { 2627 assert(Emitter); 2628 // Emit macro tables. 2629 Emitter->emitMacroTables(File.Dwarf.get(), UnitMacroMap, DebugStrPool); 2630 2631 // Emit all the compile unit's debug information. 2632 for (auto &CurrentUnit : CompileUnits) { 2633 CurrentUnit->fixupForwardReferences(); 2634 2635 if (!CurrentUnit->getOutputUnitDIE()) 2636 continue; 2637 2638 unsigned DwarfVersion = CurrentUnit->getOrigUnit().getVersion(); 2639 2640 assert(Emitter->getDebugInfoSectionSize() == 2641 CurrentUnit->getStartOffset()); 2642 Emitter->emitCompileUnitHeader(*CurrentUnit, DwarfVersion); 2643 Emitter->emitDIE(*CurrentUnit->getOutputUnitDIE()); 2644 assert(Emitter->getDebugInfoSectionSize() == 2645 CurrentUnit->computeNextUnitOffset(DwarfVersion)); 2646 } 2647 } 2648 2649 return OutputDebugInfoSize - StartOutputDebugInfoSize; 2650 } 2651 2652 void DWARFLinker::copyInvariantDebugSection(DWARFContext &Dwarf) { 2653 TheDwarfEmitter->emitSectionContents(Dwarf.getDWARFObj().getLocSection().Data, 2654 DebugSectionKind::DebugLoc); 2655 TheDwarfEmitter->emitSectionContents( 2656 Dwarf.getDWARFObj().getRangesSection().Data, 2657 DebugSectionKind::DebugRange); 2658 TheDwarfEmitter->emitSectionContents( 2659 Dwarf.getDWARFObj().getFrameSection().Data, DebugSectionKind::DebugFrame); 2660 TheDwarfEmitter->emitSectionContents(Dwarf.getDWARFObj().getArangesSection(), 2661 DebugSectionKind::DebugARanges); 2662 TheDwarfEmitter->emitSectionContents( 2663 Dwarf.getDWARFObj().getAddrSection().Data, DebugSectionKind::DebugAddr); 2664 TheDwarfEmitter->emitSectionContents( 2665 Dwarf.getDWARFObj().getRnglistsSection().Data, 2666 DebugSectionKind::DebugRngLists); 2667 TheDwarfEmitter->emitSectionContents( 2668 Dwarf.getDWARFObj().getLoclistsSection().Data, 2669 DebugSectionKind::DebugLocLists); 2670 } 2671 2672 void DWARFLinker::addObjectFile(DWARFFile &File, ObjFileLoaderTy Loader, 2673 CompileUnitHandlerTy OnCUDieLoaded) { 2674 ObjectContexts.emplace_back(LinkContext(File)); 2675 2676 if (ObjectContexts.back().File.Dwarf) { 2677 for (const std::unique_ptr<DWARFUnit> &CU : 2678 ObjectContexts.back().File.Dwarf->compile_units()) { 2679 DWARFDie CUDie = CU->getUnitDIE(); 2680 2681 if (!CUDie) 2682 continue; 2683 2684 OnCUDieLoaded(*CU); 2685 2686 if (!LLVM_UNLIKELY(Options.Update)) 2687 registerModuleReference(CUDie, ObjectContexts.back(), Loader, 2688 OnCUDieLoaded); 2689 } 2690 } 2691 } 2692 2693 Error DWARFLinker::link() { 2694 assert((Options.TargetDWARFVersion != 0) && 2695 "TargetDWARFVersion should be set"); 2696 2697 // First populate the data structure we need for each iteration of the 2698 // parallel loop. 2699 unsigned NumObjects = ObjectContexts.size(); 2700 2701 // This Dwarf string pool which is used for emission. It must be used 2702 // serially as the order of calling getStringOffset matters for 2703 // reproducibility. 2704 OffsetsStringPool DebugStrPool(StringsTranslator, true); 2705 OffsetsStringPool DebugLineStrPool(StringsTranslator, false); 2706 DebugDieValuePool StringOffsetPool; 2707 2708 // ODR Contexts for the optimize. 2709 DeclContextTree ODRContexts; 2710 2711 for (LinkContext &OptContext : ObjectContexts) { 2712 if (Options.Verbose) 2713 outs() << "DEBUG MAP OBJECT: " << OptContext.File.FileName << "\n"; 2714 2715 if (!OptContext.File.Dwarf) 2716 continue; 2717 2718 if (Options.VerifyInputDWARF) 2719 verifyInput(OptContext.File); 2720 2721 // Look for relocations that correspond to address map entries. 2722 2723 // there was findvalidrelocations previously ... probably we need to gather 2724 // info here 2725 if (LLVM_LIKELY(!Options.Update) && 2726 !OptContext.File.Addresses->hasValidRelocs()) { 2727 if (Options.Verbose) 2728 outs() << "No valid relocations found. Skipping.\n"; 2729 2730 // Set "Skip" flag as a signal to other loops that we should not 2731 // process this iteration. 2732 OptContext.Skip = true; 2733 continue; 2734 } 2735 2736 // Setup access to the debug info. 2737 if (!OptContext.File.Dwarf) 2738 continue; 2739 2740 // Check whether type units are presented. 2741 if (!OptContext.File.Dwarf->types_section_units().empty()) { 2742 reportWarning("type units are not currently supported: file will " 2743 "be skipped", 2744 OptContext.File); 2745 OptContext.Skip = true; 2746 continue; 2747 } 2748 2749 // Clone all the clang modules with requires extracting the DIE units. We 2750 // don't need the full debug info until the Analyze phase. 2751 OptContext.CompileUnits.reserve( 2752 OptContext.File.Dwarf->getNumCompileUnits()); 2753 for (const auto &CU : OptContext.File.Dwarf->compile_units()) { 2754 auto CUDie = CU->getUnitDIE(/*ExtractUnitDIEOnly=*/true); 2755 if (Options.Verbose) { 2756 outs() << "Input compilation unit:"; 2757 DIDumpOptions DumpOpts; 2758 DumpOpts.ChildRecurseDepth = 0; 2759 DumpOpts.Verbose = Options.Verbose; 2760 CUDie.dump(outs(), 0, DumpOpts); 2761 } 2762 } 2763 2764 for (auto &CU : OptContext.ModuleUnits) { 2765 if (Error Err = cloneModuleUnit(OptContext, CU, ODRContexts, DebugStrPool, 2766 DebugLineStrPool, StringOffsetPool)) 2767 reportWarning(toString(std::move(Err)), CU.File); 2768 } 2769 } 2770 2771 // At this point we know how much data we have emitted. We use this value to 2772 // compare canonical DIE offsets in analyzeContextInfo to see if a definition 2773 // is already emitted, without being affected by canonical die offsets set 2774 // later. This prevents undeterminism when analyze and clone execute 2775 // concurrently, as clone set the canonical DIE offset and analyze reads it. 2776 const uint64_t ModulesEndOffset = 2777 (TheDwarfEmitter == nullptr) ? 0 2778 : TheDwarfEmitter->getDebugInfoSectionSize(); 2779 2780 // These variables manage the list of processed object files. 2781 // The mutex and condition variable are to ensure that this is thread safe. 2782 std::mutex ProcessedFilesMutex; 2783 std::condition_variable ProcessedFilesConditionVariable; 2784 BitVector ProcessedFiles(NumObjects, false); 2785 2786 // Analyzing the context info is particularly expensive so it is executed in 2787 // parallel with emitting the previous compile unit. 2788 auto AnalyzeLambda = [&](size_t I) { 2789 auto &Context = ObjectContexts[I]; 2790 2791 if (Context.Skip || !Context.File.Dwarf) 2792 return; 2793 2794 for (const auto &CU : Context.File.Dwarf->compile_units()) { 2795 // Previously we only extracted the unit DIEs. We need the full debug info 2796 // now. 2797 auto CUDie = CU->getUnitDIE(/*ExtractUnitDIEOnly=*/false); 2798 std::string PCMFile = getPCMFile(CUDie, Options.ObjectPrefixMap); 2799 2800 if (!CUDie || LLVM_UNLIKELY(Options.Update) || 2801 !isClangModuleRef(CUDie, PCMFile, Context, 0, true).first) { 2802 Context.CompileUnits.push_back(std::make_unique<CompileUnit>( 2803 *CU, UniqueUnitID++, !Options.NoODR && !Options.Update, "")); 2804 } 2805 } 2806 2807 // Now build the DIE parent links that we will use during the next phase. 2808 for (auto &CurrentUnit : Context.CompileUnits) { 2809 auto CUDie = CurrentUnit->getOrigUnit().getUnitDIE(); 2810 if (!CUDie) 2811 continue; 2812 analyzeContextInfo(CurrentUnit->getOrigUnit().getUnitDIE(), 0, 2813 *CurrentUnit, &ODRContexts.getRoot(), ODRContexts, 2814 ModulesEndOffset, Options.ParseableSwiftInterfaces, 2815 [&](const Twine &Warning, const DWARFDie &DIE) { 2816 reportWarning(Warning, Context.File, &DIE); 2817 }); 2818 } 2819 }; 2820 2821 // For each object file map how many bytes were emitted. 2822 StringMap<DebugInfoSize> SizeByObject; 2823 2824 // And then the remaining work in serial again. 2825 // Note, although this loop runs in serial, it can run in parallel with 2826 // the analyzeContextInfo loop so long as we process files with indices >= 2827 // than those processed by analyzeContextInfo. 2828 auto CloneLambda = [&](size_t I) { 2829 auto &OptContext = ObjectContexts[I]; 2830 if (OptContext.Skip || !OptContext.File.Dwarf) 2831 return; 2832 2833 // Then mark all the DIEs that need to be present in the generated output 2834 // and collect some information about them. 2835 // Note that this loop can not be merged with the previous one because 2836 // cross-cu references require the ParentIdx to be setup for every CU in 2837 // the object file before calling this. 2838 if (LLVM_UNLIKELY(Options.Update)) { 2839 for (auto &CurrentUnit : OptContext.CompileUnits) 2840 CurrentUnit->markEverythingAsKept(); 2841 copyInvariantDebugSection(*OptContext.File.Dwarf); 2842 } else { 2843 for (auto &CurrentUnit : OptContext.CompileUnits) { 2844 lookForDIEsToKeep(*OptContext.File.Addresses, OptContext.CompileUnits, 2845 CurrentUnit->getOrigUnit().getUnitDIE(), 2846 OptContext.File, *CurrentUnit, 0); 2847 #ifndef NDEBUG 2848 verifyKeepChain(*CurrentUnit); 2849 #endif 2850 } 2851 } 2852 2853 // The calls to applyValidRelocs inside cloneDIE will walk the reloc 2854 // array again (in the same way findValidRelocsInDebugInfo() did). We 2855 // need to reset the NextValidReloc index to the beginning. 2856 if (OptContext.File.Addresses->hasValidRelocs() || 2857 LLVM_UNLIKELY(Options.Update)) { 2858 SizeByObject[OptContext.File.FileName].Input = 2859 getDebugInfoSize(*OptContext.File.Dwarf); 2860 SizeByObject[OptContext.File.FileName].Output = 2861 DIECloner(*this, TheDwarfEmitter, OptContext.File, DIEAlloc, 2862 OptContext.CompileUnits, Options.Update, DebugStrPool, 2863 DebugLineStrPool, StringOffsetPool) 2864 .cloneAllCompileUnits(*OptContext.File.Dwarf, OptContext.File, 2865 OptContext.File.Dwarf->isLittleEndian()); 2866 } 2867 if ((TheDwarfEmitter != nullptr) && !OptContext.CompileUnits.empty() && 2868 LLVM_LIKELY(!Options.Update)) 2869 patchFrameInfoForObject(OptContext); 2870 2871 // Clean-up before starting working on the next object. 2872 cleanupAuxiliarryData(OptContext); 2873 }; 2874 2875 auto EmitLambda = [&]() { 2876 // Emit everything that's global. 2877 if (TheDwarfEmitter != nullptr) { 2878 TheDwarfEmitter->emitAbbrevs(Abbreviations, Options.TargetDWARFVersion); 2879 TheDwarfEmitter->emitStrings(DebugStrPool); 2880 TheDwarfEmitter->emitStringOffsets(StringOffsetPool.getValues(), 2881 Options.TargetDWARFVersion); 2882 TheDwarfEmitter->emitLineStrings(DebugLineStrPool); 2883 for (AccelTableKind TableKind : Options.AccelTables) { 2884 switch (TableKind) { 2885 case AccelTableKind::Apple: 2886 TheDwarfEmitter->emitAppleNamespaces(AppleNamespaces); 2887 TheDwarfEmitter->emitAppleNames(AppleNames); 2888 TheDwarfEmitter->emitAppleTypes(AppleTypes); 2889 TheDwarfEmitter->emitAppleObjc(AppleObjc); 2890 break; 2891 case AccelTableKind::Pub: 2892 // Already emitted by emitAcceleratorEntriesForUnit. 2893 // Already emitted by emitAcceleratorEntriesForUnit. 2894 break; 2895 case AccelTableKind::DebugNames: 2896 TheDwarfEmitter->emitDebugNames(DebugNames); 2897 break; 2898 } 2899 } 2900 } 2901 }; 2902 2903 auto AnalyzeAll = [&]() { 2904 for (unsigned I = 0, E = NumObjects; I != E; ++I) { 2905 AnalyzeLambda(I); 2906 2907 std::unique_lock<std::mutex> LockGuard(ProcessedFilesMutex); 2908 ProcessedFiles.set(I); 2909 ProcessedFilesConditionVariable.notify_one(); 2910 } 2911 }; 2912 2913 auto CloneAll = [&]() { 2914 for (unsigned I = 0, E = NumObjects; I != E; ++I) { 2915 { 2916 std::unique_lock<std::mutex> LockGuard(ProcessedFilesMutex); 2917 if (!ProcessedFiles[I]) { 2918 ProcessedFilesConditionVariable.wait( 2919 LockGuard, [&]() { return ProcessedFiles[I]; }); 2920 } 2921 } 2922 2923 CloneLambda(I); 2924 } 2925 EmitLambda(); 2926 }; 2927 2928 // To limit memory usage in the single threaded case, analyze and clone are 2929 // run sequentially so the OptContext is freed after processing each object 2930 // in endDebugObject. 2931 if (Options.Threads == 1) { 2932 for (unsigned I = 0, E = NumObjects; I != E; ++I) { 2933 AnalyzeLambda(I); 2934 CloneLambda(I); 2935 } 2936 EmitLambda(); 2937 } else { 2938 ThreadPool Pool(hardware_concurrency(2)); 2939 Pool.async(AnalyzeAll); 2940 Pool.async(CloneAll); 2941 Pool.wait(); 2942 } 2943 2944 if (Options.Statistics) { 2945 // Create a vector sorted in descending order by output size. 2946 std::vector<std::pair<StringRef, DebugInfoSize>> Sorted; 2947 for (auto &E : SizeByObject) 2948 Sorted.emplace_back(E.first(), E.second); 2949 llvm::sort(Sorted, [](auto &LHS, auto &RHS) { 2950 return LHS.second.Output > RHS.second.Output; 2951 }); 2952 2953 auto ComputePercentange = [](int64_t Input, int64_t Output) -> float { 2954 const float Difference = Output - Input; 2955 const float Sum = Input + Output; 2956 if (Sum == 0) 2957 return 0; 2958 return (Difference / (Sum / 2)); 2959 }; 2960 2961 int64_t InputTotal = 0; 2962 int64_t OutputTotal = 0; 2963 const char *FormatStr = "{0,-45} {1,10}b {2,10}b {3,8:P}\n"; 2964 2965 // Print header. 2966 outs() << ".debug_info section size (in bytes)\n"; 2967 outs() << "----------------------------------------------------------------" 2968 "---------------\n"; 2969 outs() << "Filename Object " 2970 " dSYM Change\n"; 2971 outs() << "----------------------------------------------------------------" 2972 "---------------\n"; 2973 2974 // Print body. 2975 for (auto &E : Sorted) { 2976 InputTotal += E.second.Input; 2977 OutputTotal += E.second.Output; 2978 llvm::outs() << formatv( 2979 FormatStr, sys::path::filename(E.first).take_back(45), E.second.Input, 2980 E.second.Output, ComputePercentange(E.second.Input, E.second.Output)); 2981 } 2982 // Print total and footer. 2983 outs() << "----------------------------------------------------------------" 2984 "---------------\n"; 2985 llvm::outs() << formatv(FormatStr, "Total", InputTotal, OutputTotal, 2986 ComputePercentange(InputTotal, OutputTotal)); 2987 outs() << "----------------------------------------------------------------" 2988 "---------------\n\n"; 2989 } 2990 2991 return Error::success(); 2992 } 2993 2994 Error DWARFLinker::cloneModuleUnit(LinkContext &Context, RefModuleUnit &Unit, 2995 DeclContextTree &ODRContexts, 2996 OffsetsStringPool &DebugStrPool, 2997 OffsetsStringPool &DebugLineStrPool, 2998 DebugDieValuePool &StringOffsetPool, 2999 unsigned Indent) { 3000 assert(Unit.Unit.get() != nullptr); 3001 3002 if (!Unit.Unit->getOrigUnit().getUnitDIE().hasChildren()) 3003 return Error::success(); 3004 3005 if (Options.Verbose) { 3006 outs().indent(Indent); 3007 outs() << "cloning .debug_info from " << Unit.File.FileName << "\n"; 3008 } 3009 3010 // Analyze context for the module. 3011 analyzeContextInfo(Unit.Unit->getOrigUnit().getUnitDIE(), 0, *(Unit.Unit), 3012 &ODRContexts.getRoot(), ODRContexts, 0, 3013 Options.ParseableSwiftInterfaces, 3014 [&](const Twine &Warning, const DWARFDie &DIE) { 3015 reportWarning(Warning, Context.File, &DIE); 3016 }); 3017 // Keep everything. 3018 Unit.Unit->markEverythingAsKept(); 3019 3020 // Clone unit. 3021 UnitListTy CompileUnits; 3022 CompileUnits.emplace_back(std::move(Unit.Unit)); 3023 assert(TheDwarfEmitter); 3024 DIECloner(*this, TheDwarfEmitter, Unit.File, DIEAlloc, CompileUnits, 3025 Options.Update, DebugStrPool, DebugLineStrPool, StringOffsetPool) 3026 .cloneAllCompileUnits(*Unit.File.Dwarf, Unit.File, 3027 Unit.File.Dwarf->isLittleEndian()); 3028 return Error::success(); 3029 } 3030 3031 void DWARFLinker::verifyInput(const DWARFFile &File) { 3032 assert(File.Dwarf); 3033 3034 std::string Buffer; 3035 raw_string_ostream OS(Buffer); 3036 DIDumpOptions DumpOpts; 3037 if (!File.Dwarf->verify(OS, DumpOpts.noImplicitRecursion())) { 3038 if (Options.InputVerificationHandler) 3039 Options.InputVerificationHandler(File, OS.str()); 3040 } 3041 } 3042 3043 } // namespace llvm 3044