1 //===- MetadataLoader.cpp - Internal BitcodeReader implementation ---------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 9 #include "MetadataLoader.h" 10 #include "ValueList.h" 11 12 #include "llvm/ADT/APInt.h" 13 #include "llvm/ADT/ArrayRef.h" 14 #include "llvm/ADT/BitmaskEnum.h" 15 #include "llvm/ADT/DenseMap.h" 16 #include "llvm/ADT/DenseSet.h" 17 #include "llvm/ADT/STLFunctionalExtras.h" 18 #include "llvm/ADT/SetVector.h" 19 #include "llvm/ADT/SmallString.h" 20 #include "llvm/ADT/SmallVector.h" 21 #include "llvm/ADT/Statistic.h" 22 #include "llvm/ADT/StringRef.h" 23 #include "llvm/ADT/Twine.h" 24 #include "llvm/ADT/ilist_iterator.h" 25 #include "llvm/ADT/iterator_range.h" 26 #include "llvm/BinaryFormat/Dwarf.h" 27 #include "llvm/Bitcode/BitcodeReader.h" 28 #include "llvm/Bitcode/LLVMBitCodes.h" 29 #include "llvm/Bitstream/BitstreamReader.h" 30 #include "llvm/IR/AutoUpgrade.h" 31 #include "llvm/IR/BasicBlock.h" 32 #include "llvm/IR/Constants.h" 33 #include "llvm/IR/DebugInfoMetadata.h" 34 #include "llvm/IR/Function.h" 35 #include "llvm/IR/GlobalObject.h" 36 #include "llvm/IR/GlobalVariable.h" 37 #include "llvm/IR/Instruction.h" 38 #include "llvm/IR/IntrinsicInst.h" 39 #include "llvm/IR/LLVMContext.h" 40 #include "llvm/IR/Metadata.h" 41 #include "llvm/IR/Module.h" 42 #include "llvm/IR/TrackingMDRef.h" 43 #include "llvm/IR/Type.h" 44 #include "llvm/Support/Casting.h" 45 #include "llvm/Support/CommandLine.h" 46 #include "llvm/Support/Compiler.h" 47 #include "llvm/Support/ErrorHandling.h" 48 #include "llvm/Support/type_traits.h" 49 50 #include <algorithm> 51 #include <cassert> 52 #include <cstddef> 53 #include <cstdint> 54 #include <deque> 55 #include <iterator> 56 #include <limits> 57 #include <map> 58 #include <optional> 59 #include <string> 60 #include <tuple> 61 #include <type_traits> 62 #include <utility> 63 #include <vector> 64 namespace llvm { 65 class Argument; 66 } 67 68 using namespace llvm; 69 70 #define DEBUG_TYPE "bitcode-reader" 71 72 STATISTIC(NumMDStringLoaded, "Number of MDStrings loaded"); 73 STATISTIC(NumMDNodeTemporary, "Number of MDNode::Temporary created"); 74 STATISTIC(NumMDRecordLoaded, "Number of Metadata records loaded"); 75 76 /// Flag whether we need to import full type definitions for ThinLTO. 77 /// Currently needed for Darwin and LLDB. 78 static cl::opt<bool> ImportFullTypeDefinitions( 79 "import-full-type-definitions", cl::init(false), cl::Hidden, 80 cl::desc("Import full type definitions for ThinLTO.")); 81 82 static cl::opt<bool> DisableLazyLoading( 83 "disable-ondemand-mds-loading", cl::init(false), cl::Hidden, 84 cl::desc("Force disable the lazy-loading on-demand of metadata when " 85 "loading bitcode for importing.")); 86 87 namespace { 88 89 static int64_t unrotateSign(uint64_t U) { return (U & 1) ? ~(U >> 1) : U >> 1; } 90 91 class BitcodeReaderMetadataList { 92 /// Array of metadata references. 93 /// 94 /// Don't use std::vector here. Some versions of libc++ copy (instead of 95 /// move) on resize, and TrackingMDRef is very expensive to copy. 96 SmallVector<TrackingMDRef, 1> MetadataPtrs; 97 98 /// The set of indices in MetadataPtrs above of forward references that were 99 /// generated. 100 SmallDenseSet<unsigned, 1> ForwardReference; 101 102 /// The set of indices in MetadataPtrs above of Metadata that need to be 103 /// resolved. 104 SmallDenseSet<unsigned, 1> UnresolvedNodes; 105 106 /// Structures for resolving old type refs. 107 struct { 108 SmallDenseMap<MDString *, TempMDTuple, 1> Unknown; 109 SmallDenseMap<MDString *, DICompositeType *, 1> Final; 110 SmallDenseMap<MDString *, DICompositeType *, 1> FwdDecls; 111 SmallVector<std::pair<TrackingMDRef, TempMDTuple>, 1> Arrays; 112 } OldTypeRefs; 113 114 LLVMContext &Context; 115 116 /// Maximum number of valid references. Forward references exceeding the 117 /// maximum must be invalid. 118 unsigned RefsUpperBound; 119 120 public: 121 BitcodeReaderMetadataList(LLVMContext &C, size_t RefsUpperBound) 122 : Context(C), 123 RefsUpperBound(std::min((size_t)std::numeric_limits<unsigned>::max(), 124 RefsUpperBound)) {} 125 126 // vector compatibility methods 127 unsigned size() const { return MetadataPtrs.size(); } 128 void resize(unsigned N) { MetadataPtrs.resize(N); } 129 void push_back(Metadata *MD) { MetadataPtrs.emplace_back(MD); } 130 void clear() { MetadataPtrs.clear(); } 131 Metadata *back() const { return MetadataPtrs.back(); } 132 void pop_back() { MetadataPtrs.pop_back(); } 133 bool empty() const { return MetadataPtrs.empty(); } 134 135 Metadata *operator[](unsigned i) const { 136 assert(i < MetadataPtrs.size()); 137 return MetadataPtrs[i]; 138 } 139 140 Metadata *lookup(unsigned I) const { 141 if (I < MetadataPtrs.size()) 142 return MetadataPtrs[I]; 143 return nullptr; 144 } 145 146 void shrinkTo(unsigned N) { 147 assert(N <= size() && "Invalid shrinkTo request!"); 148 assert(ForwardReference.empty() && "Unexpected forward refs"); 149 assert(UnresolvedNodes.empty() && "Unexpected unresolved node"); 150 MetadataPtrs.resize(N); 151 } 152 153 /// Return the given metadata, creating a replaceable forward reference if 154 /// necessary. 155 Metadata *getMetadataFwdRef(unsigned Idx); 156 157 /// Return the given metadata only if it is fully resolved. 158 /// 159 /// Gives the same result as \a lookup(), unless \a MDNode::isResolved() 160 /// would give \c false. 161 Metadata *getMetadataIfResolved(unsigned Idx); 162 163 MDNode *getMDNodeFwdRefOrNull(unsigned Idx); 164 void assignValue(Metadata *MD, unsigned Idx); 165 void tryToResolveCycles(); 166 bool hasFwdRefs() const { return !ForwardReference.empty(); } 167 int getNextFwdRef() { 168 assert(hasFwdRefs()); 169 return *ForwardReference.begin(); 170 } 171 172 /// Upgrade a type that had an MDString reference. 173 void addTypeRef(MDString &UUID, DICompositeType &CT); 174 175 /// Upgrade a type that had an MDString reference. 176 Metadata *upgradeTypeRef(Metadata *MaybeUUID); 177 178 /// Upgrade a type ref array that may have MDString references. 179 Metadata *upgradeTypeRefArray(Metadata *MaybeTuple); 180 181 private: 182 Metadata *resolveTypeRefArray(Metadata *MaybeTuple); 183 }; 184 185 void BitcodeReaderMetadataList::assignValue(Metadata *MD, unsigned Idx) { 186 if (auto *MDN = dyn_cast<MDNode>(MD)) 187 if (!MDN->isResolved()) 188 UnresolvedNodes.insert(Idx); 189 190 if (Idx == size()) { 191 push_back(MD); 192 return; 193 } 194 195 if (Idx >= size()) 196 resize(Idx + 1); 197 198 TrackingMDRef &OldMD = MetadataPtrs[Idx]; 199 if (!OldMD) { 200 OldMD.reset(MD); 201 return; 202 } 203 204 // If there was a forward reference to this value, replace it. 205 TempMDTuple PrevMD(cast<MDTuple>(OldMD.get())); 206 PrevMD->replaceAllUsesWith(MD); 207 ForwardReference.erase(Idx); 208 } 209 210 Metadata *BitcodeReaderMetadataList::getMetadataFwdRef(unsigned Idx) { 211 // Bail out for a clearly invalid value. 212 if (Idx >= RefsUpperBound) 213 return nullptr; 214 215 if (Idx >= size()) 216 resize(Idx + 1); 217 218 if (Metadata *MD = MetadataPtrs[Idx]) 219 return MD; 220 221 // Track forward refs to be resolved later. 222 ForwardReference.insert(Idx); 223 224 // Create and return a placeholder, which will later be RAUW'd. 225 ++NumMDNodeTemporary; 226 Metadata *MD = MDNode::getTemporary(Context, std::nullopt).release(); 227 MetadataPtrs[Idx].reset(MD); 228 return MD; 229 } 230 231 Metadata *BitcodeReaderMetadataList::getMetadataIfResolved(unsigned Idx) { 232 Metadata *MD = lookup(Idx); 233 if (auto *N = dyn_cast_or_null<MDNode>(MD)) 234 if (!N->isResolved()) 235 return nullptr; 236 return MD; 237 } 238 239 MDNode *BitcodeReaderMetadataList::getMDNodeFwdRefOrNull(unsigned Idx) { 240 return dyn_cast_or_null<MDNode>(getMetadataFwdRef(Idx)); 241 } 242 243 void BitcodeReaderMetadataList::tryToResolveCycles() { 244 if (!ForwardReference.empty()) 245 // Still forward references... can't resolve cycles. 246 return; 247 248 // Give up on finding a full definition for any forward decls that remain. 249 for (const auto &Ref : OldTypeRefs.FwdDecls) 250 OldTypeRefs.Final.insert(Ref); 251 OldTypeRefs.FwdDecls.clear(); 252 253 // Upgrade from old type ref arrays. In strange cases, this could add to 254 // OldTypeRefs.Unknown. 255 for (const auto &Array : OldTypeRefs.Arrays) 256 Array.second->replaceAllUsesWith(resolveTypeRefArray(Array.first.get())); 257 OldTypeRefs.Arrays.clear(); 258 259 // Replace old string-based type refs with the resolved node, if possible. 260 // If we haven't seen the node, leave it to the verifier to complain about 261 // the invalid string reference. 262 for (const auto &Ref : OldTypeRefs.Unknown) { 263 if (DICompositeType *CT = OldTypeRefs.Final.lookup(Ref.first)) 264 Ref.second->replaceAllUsesWith(CT); 265 else 266 Ref.second->replaceAllUsesWith(Ref.first); 267 } 268 OldTypeRefs.Unknown.clear(); 269 270 if (UnresolvedNodes.empty()) 271 // Nothing to do. 272 return; 273 274 // Resolve any cycles. 275 for (unsigned I : UnresolvedNodes) { 276 auto &MD = MetadataPtrs[I]; 277 auto *N = dyn_cast_or_null<MDNode>(MD); 278 if (!N) 279 continue; 280 281 assert(!N->isTemporary() && "Unexpected forward reference"); 282 N->resolveCycles(); 283 } 284 285 // Make sure we return early again until there's another unresolved ref. 286 UnresolvedNodes.clear(); 287 } 288 289 void BitcodeReaderMetadataList::addTypeRef(MDString &UUID, 290 DICompositeType &CT) { 291 assert(CT.getRawIdentifier() == &UUID && "Mismatched UUID"); 292 if (CT.isForwardDecl()) 293 OldTypeRefs.FwdDecls.insert(std::make_pair(&UUID, &CT)); 294 else 295 OldTypeRefs.Final.insert(std::make_pair(&UUID, &CT)); 296 } 297 298 Metadata *BitcodeReaderMetadataList::upgradeTypeRef(Metadata *MaybeUUID) { 299 auto *UUID = dyn_cast_or_null<MDString>(MaybeUUID); 300 if (LLVM_LIKELY(!UUID)) 301 return MaybeUUID; 302 303 if (auto *CT = OldTypeRefs.Final.lookup(UUID)) 304 return CT; 305 306 auto &Ref = OldTypeRefs.Unknown[UUID]; 307 if (!Ref) 308 Ref = MDNode::getTemporary(Context, std::nullopt); 309 return Ref.get(); 310 } 311 312 Metadata *BitcodeReaderMetadataList::upgradeTypeRefArray(Metadata *MaybeTuple) { 313 auto *Tuple = dyn_cast_or_null<MDTuple>(MaybeTuple); 314 if (!Tuple || Tuple->isDistinct()) 315 return MaybeTuple; 316 317 // Look through the array immediately if possible. 318 if (!Tuple->isTemporary()) 319 return resolveTypeRefArray(Tuple); 320 321 // Create and return a placeholder to use for now. Eventually 322 // resolveTypeRefArrays() will be resolve this forward reference. 323 OldTypeRefs.Arrays.emplace_back( 324 std::piecewise_construct, std::forward_as_tuple(Tuple), 325 std::forward_as_tuple(MDTuple::getTemporary(Context, std::nullopt))); 326 return OldTypeRefs.Arrays.back().second.get(); 327 } 328 329 Metadata *BitcodeReaderMetadataList::resolveTypeRefArray(Metadata *MaybeTuple) { 330 auto *Tuple = dyn_cast_or_null<MDTuple>(MaybeTuple); 331 if (!Tuple || Tuple->isDistinct()) 332 return MaybeTuple; 333 334 // Look through the DITypeRefArray, upgrading each DIType *. 335 SmallVector<Metadata *, 32> Ops; 336 Ops.reserve(Tuple->getNumOperands()); 337 for (Metadata *MD : Tuple->operands()) 338 Ops.push_back(upgradeTypeRef(MD)); 339 340 return MDTuple::get(Context, Ops); 341 } 342 343 namespace { 344 345 class PlaceholderQueue { 346 // Placeholders would thrash around when moved, so store in a std::deque 347 // instead of some sort of vector. 348 std::deque<DistinctMDOperandPlaceholder> PHs; 349 350 public: 351 ~PlaceholderQueue() { 352 assert(empty() && 353 "PlaceholderQueue hasn't been flushed before being destroyed"); 354 } 355 bool empty() const { return PHs.empty(); } 356 DistinctMDOperandPlaceholder &getPlaceholderOp(unsigned ID); 357 void flush(BitcodeReaderMetadataList &MetadataList); 358 359 /// Return the list of temporaries nodes in the queue, these need to be 360 /// loaded before we can flush the queue. 361 void getTemporaries(BitcodeReaderMetadataList &MetadataList, 362 DenseSet<unsigned> &Temporaries) { 363 for (auto &PH : PHs) { 364 auto ID = PH.getID(); 365 auto *MD = MetadataList.lookup(ID); 366 if (!MD) { 367 Temporaries.insert(ID); 368 continue; 369 } 370 auto *N = dyn_cast_or_null<MDNode>(MD); 371 if (N && N->isTemporary()) 372 Temporaries.insert(ID); 373 } 374 } 375 }; 376 377 } // end anonymous namespace 378 379 DistinctMDOperandPlaceholder &PlaceholderQueue::getPlaceholderOp(unsigned ID) { 380 PHs.emplace_back(ID); 381 return PHs.back(); 382 } 383 384 void PlaceholderQueue::flush(BitcodeReaderMetadataList &MetadataList) { 385 while (!PHs.empty()) { 386 auto *MD = MetadataList.lookup(PHs.front().getID()); 387 assert(MD && "Flushing placeholder on unassigned MD"); 388 #ifndef NDEBUG 389 if (auto *MDN = dyn_cast<MDNode>(MD)) 390 assert(MDN->isResolved() && 391 "Flushing Placeholder while cycles aren't resolved"); 392 #endif 393 PHs.front().replaceUseWith(MD); 394 PHs.pop_front(); 395 } 396 } 397 398 } // anonymous namespace 399 400 static Error error(const Twine &Message) { 401 return make_error<StringError>( 402 Message, make_error_code(BitcodeError::CorruptedBitcode)); 403 } 404 405 class MetadataLoader::MetadataLoaderImpl { 406 BitcodeReaderMetadataList MetadataList; 407 BitcodeReaderValueList &ValueList; 408 BitstreamCursor &Stream; 409 LLVMContext &Context; 410 Module &TheModule; 411 MetadataLoaderCallbacks Callbacks; 412 413 /// Cursor associated with the lazy-loading of Metadata. This is the easy way 414 /// to keep around the right "context" (Abbrev list) to be able to jump in 415 /// the middle of the metadata block and load any record. 416 BitstreamCursor IndexCursor; 417 418 /// Index that keeps track of MDString values. 419 std::vector<StringRef> MDStringRef; 420 421 /// On-demand loading of a single MDString. Requires the index above to be 422 /// populated. 423 MDString *lazyLoadOneMDString(unsigned Idx); 424 425 /// Index that keeps track of where to find a metadata record in the stream. 426 std::vector<uint64_t> GlobalMetadataBitPosIndex; 427 428 /// Cursor position of the start of the global decl attachments, to enable 429 /// loading using the index built for lazy loading, instead of forward 430 /// references. 431 uint64_t GlobalDeclAttachmentPos = 0; 432 433 #ifndef NDEBUG 434 /// Baisic correctness check that we end up parsing all of the global decl 435 /// attachments. 436 unsigned NumGlobalDeclAttachSkipped = 0; 437 unsigned NumGlobalDeclAttachParsed = 0; 438 #endif 439 440 /// Load the global decl attachments, using the index built for lazy loading. 441 Expected<bool> loadGlobalDeclAttachments(); 442 443 /// Populate the index above to enable lazily loading of metadata, and load 444 /// the named metadata as well as the transitively referenced global 445 /// Metadata. 446 Expected<bool> lazyLoadModuleMetadataBlock(); 447 448 /// On-demand loading of a single metadata. Requires the index above to be 449 /// populated. 450 void lazyLoadOneMetadata(unsigned Idx, PlaceholderQueue &Placeholders); 451 452 // Keep mapping of seens pair of old-style CU <-> SP, and update pointers to 453 // point from SP to CU after a block is completly parsed. 454 std::vector<std::pair<DICompileUnit *, Metadata *>> CUSubprograms; 455 456 /// Functions that need to be matched with subprograms when upgrading old 457 /// metadata. 458 SmallDenseMap<Function *, DISubprogram *, 16> FunctionsWithSPs; 459 460 // Map the bitcode's custom MDKind ID to the Module's MDKind ID. 461 DenseMap<unsigned, unsigned> MDKindMap; 462 463 bool StripTBAA = false; 464 bool HasSeenOldLoopTags = false; 465 bool NeedUpgradeToDIGlobalVariableExpression = false; 466 bool NeedDeclareExpressionUpgrade = false; 467 468 /// Map DILocalScope to the enclosing DISubprogram, if any. 469 DenseMap<DILocalScope *, DISubprogram *> ParentSubprogram; 470 471 /// True if metadata is being parsed for a module being ThinLTO imported. 472 bool IsImporting = false; 473 474 Error parseOneMetadata(SmallVectorImpl<uint64_t> &Record, unsigned Code, 475 PlaceholderQueue &Placeholders, StringRef Blob, 476 unsigned &NextMetadataNo); 477 Error parseMetadataStrings(ArrayRef<uint64_t> Record, StringRef Blob, 478 function_ref<void(StringRef)> CallBack); 479 Error parseGlobalObjectAttachment(GlobalObject &GO, 480 ArrayRef<uint64_t> Record); 481 Error parseMetadataKindRecord(SmallVectorImpl<uint64_t> &Record); 482 483 void resolveForwardRefsAndPlaceholders(PlaceholderQueue &Placeholders); 484 485 /// Upgrade old-style CU <-> SP pointers to point from SP to CU. 486 void upgradeCUSubprograms() { 487 for (auto CU_SP : CUSubprograms) 488 if (auto *SPs = dyn_cast_or_null<MDTuple>(CU_SP.second)) 489 for (auto &Op : SPs->operands()) 490 if (auto *SP = dyn_cast_or_null<DISubprogram>(Op)) 491 SP->replaceUnit(CU_SP.first); 492 CUSubprograms.clear(); 493 } 494 495 /// Upgrade old-style bare DIGlobalVariables to DIGlobalVariableExpressions. 496 void upgradeCUVariables() { 497 if (!NeedUpgradeToDIGlobalVariableExpression) 498 return; 499 500 // Upgrade list of variables attached to the CUs. 501 if (NamedMDNode *CUNodes = TheModule.getNamedMetadata("llvm.dbg.cu")) 502 for (unsigned I = 0, E = CUNodes->getNumOperands(); I != E; ++I) { 503 auto *CU = cast<DICompileUnit>(CUNodes->getOperand(I)); 504 if (auto *GVs = dyn_cast_or_null<MDTuple>(CU->getRawGlobalVariables())) 505 for (unsigned I = 0; I < GVs->getNumOperands(); I++) 506 if (auto *GV = 507 dyn_cast_or_null<DIGlobalVariable>(GVs->getOperand(I))) { 508 auto *DGVE = DIGlobalVariableExpression::getDistinct( 509 Context, GV, DIExpression::get(Context, {})); 510 GVs->replaceOperandWith(I, DGVE); 511 } 512 } 513 514 // Upgrade variables attached to globals. 515 for (auto &GV : TheModule.globals()) { 516 SmallVector<MDNode *, 1> MDs; 517 GV.getMetadata(LLVMContext::MD_dbg, MDs); 518 GV.eraseMetadata(LLVMContext::MD_dbg); 519 for (auto *MD : MDs) 520 if (auto *DGV = dyn_cast<DIGlobalVariable>(MD)) { 521 auto *DGVE = DIGlobalVariableExpression::getDistinct( 522 Context, DGV, DIExpression::get(Context, {})); 523 GV.addMetadata(LLVMContext::MD_dbg, *DGVE); 524 } else 525 GV.addMetadata(LLVMContext::MD_dbg, *MD); 526 } 527 } 528 529 DISubprogram *findEnclosingSubprogram(DILocalScope *S) { 530 if (!S) 531 return nullptr; 532 if (auto *SP = ParentSubprogram[S]) { 533 return SP; 534 } 535 536 DILocalScope *InitialScope = S; 537 DenseSet<DILocalScope *> Visited; 538 while (S && !isa<DISubprogram>(S)) { 539 S = dyn_cast_or_null<DILocalScope>(S->getScope()); 540 if (Visited.contains(S)) 541 break; 542 Visited.insert(S); 543 } 544 ParentSubprogram[InitialScope] = llvm::dyn_cast_or_null<DISubprogram>(S); 545 546 return ParentSubprogram[InitialScope]; 547 } 548 549 /// Move local imports from DICompileUnit's 'imports' field to 550 /// DISubprogram's retainedNodes. 551 void upgradeCULocals() { 552 if (NamedMDNode *CUNodes = TheModule.getNamedMetadata("llvm.dbg.cu")) { 553 for (unsigned I = 0, E = CUNodes->getNumOperands(); I != E; ++I) { 554 auto *CU = dyn_cast<DICompileUnit>(CUNodes->getOperand(I)); 555 if (!CU) 556 continue; 557 558 if (auto *RawImported = CU->getRawImportedEntities()) { 559 // Collect a set of imported entities to be moved. 560 SetVector<Metadata *> EntitiesToRemove; 561 for (Metadata *Op : CU->getImportedEntities()->operands()) { 562 auto *IE = cast<DIImportedEntity>(Op); 563 if (auto *S = dyn_cast_or_null<DILocalScope>(IE->getScope())) { 564 EntitiesToRemove.insert(IE); 565 } 566 } 567 568 if (!EntitiesToRemove.empty()) { 569 // Make a new list of CU's 'imports'. 570 SmallVector<Metadata *> NewImports; 571 for (Metadata *Op : CU->getImportedEntities()->operands()) { 572 if (!EntitiesToRemove.contains(cast<DIImportedEntity>(Op))) { 573 NewImports.push_back(Op); 574 } 575 } 576 577 // Find DISubprogram corresponding to each entity. 578 std::map<DISubprogram *, SmallVector<Metadata *>> SPToEntities; 579 for (auto *I : EntitiesToRemove) { 580 auto *Entity = cast<DIImportedEntity>(I); 581 if (auto *SP = findEnclosingSubprogram( 582 cast<DILocalScope>(Entity->getScope()))) { 583 SPToEntities[SP].push_back(Entity); 584 } 585 } 586 587 // Update DISubprograms' retainedNodes. 588 for (auto I = SPToEntities.begin(); I != SPToEntities.end(); ++I) { 589 auto *SP = I->first; 590 auto RetainedNodes = SP->getRetainedNodes(); 591 SmallVector<Metadata *> MDs(RetainedNodes.begin(), 592 RetainedNodes.end()); 593 MDs.append(I->second); 594 SP->replaceRetainedNodes(MDNode::get(Context, MDs)); 595 } 596 597 // Remove entities with local scope from CU. 598 CU->replaceImportedEntities(MDTuple::get(Context, NewImports)); 599 } 600 } 601 } 602 } 603 604 ParentSubprogram.clear(); 605 } 606 607 /// Remove a leading DW_OP_deref from DIExpressions in a dbg.declare that 608 /// describes a function argument. 609 void upgradeDeclareExpressions(Function &F) { 610 if (!NeedDeclareExpressionUpgrade) 611 return; 612 613 for (auto &BB : F) 614 for (auto &I : BB) 615 if (auto *DDI = dyn_cast<DbgDeclareInst>(&I)) 616 if (auto *DIExpr = DDI->getExpression()) 617 if (DIExpr->startsWithDeref() && 618 isa_and_nonnull<Argument>(DDI->getAddress())) { 619 SmallVector<uint64_t, 8> Ops; 620 Ops.append(std::next(DIExpr->elements_begin()), 621 DIExpr->elements_end()); 622 DDI->setExpression(DIExpression::get(Context, Ops)); 623 } 624 } 625 626 /// Upgrade the expression from previous versions. 627 Error upgradeDIExpression(uint64_t FromVersion, 628 MutableArrayRef<uint64_t> &Expr, 629 SmallVectorImpl<uint64_t> &Buffer) { 630 auto N = Expr.size(); 631 switch (FromVersion) { 632 default: 633 return error("Invalid record"); 634 case 0: 635 if (N >= 3 && Expr[N - 3] == dwarf::DW_OP_bit_piece) 636 Expr[N - 3] = dwarf::DW_OP_LLVM_fragment; 637 [[fallthrough]]; 638 case 1: 639 // Move DW_OP_deref to the end. 640 if (N && Expr[0] == dwarf::DW_OP_deref) { 641 auto End = Expr.end(); 642 if (Expr.size() >= 3 && 643 *std::prev(End, 3) == dwarf::DW_OP_LLVM_fragment) 644 End = std::prev(End, 3); 645 std::move(std::next(Expr.begin()), End, Expr.begin()); 646 *std::prev(End) = dwarf::DW_OP_deref; 647 } 648 NeedDeclareExpressionUpgrade = true; 649 [[fallthrough]]; 650 case 2: { 651 // Change DW_OP_plus to DW_OP_plus_uconst. 652 // Change DW_OP_minus to DW_OP_uconst, DW_OP_minus 653 auto SubExpr = ArrayRef<uint64_t>(Expr); 654 while (!SubExpr.empty()) { 655 // Skip past other operators with their operands 656 // for this version of the IR, obtained from 657 // from historic DIExpression::ExprOperand::getSize(). 658 size_t HistoricSize; 659 switch (SubExpr.front()) { 660 default: 661 HistoricSize = 1; 662 break; 663 case dwarf::DW_OP_constu: 664 case dwarf::DW_OP_minus: 665 case dwarf::DW_OP_plus: 666 HistoricSize = 2; 667 break; 668 case dwarf::DW_OP_LLVM_fragment: 669 HistoricSize = 3; 670 break; 671 } 672 673 // If the expression is malformed, make sure we don't 674 // copy more elements than we should. 675 HistoricSize = std::min(SubExpr.size(), HistoricSize); 676 ArrayRef<uint64_t> Args = SubExpr.slice(1, HistoricSize - 1); 677 678 switch (SubExpr.front()) { 679 case dwarf::DW_OP_plus: 680 Buffer.push_back(dwarf::DW_OP_plus_uconst); 681 Buffer.append(Args.begin(), Args.end()); 682 break; 683 case dwarf::DW_OP_minus: 684 Buffer.push_back(dwarf::DW_OP_constu); 685 Buffer.append(Args.begin(), Args.end()); 686 Buffer.push_back(dwarf::DW_OP_minus); 687 break; 688 default: 689 Buffer.push_back(*SubExpr.begin()); 690 Buffer.append(Args.begin(), Args.end()); 691 break; 692 } 693 694 // Continue with remaining elements. 695 SubExpr = SubExpr.slice(HistoricSize); 696 } 697 Expr = MutableArrayRef<uint64_t>(Buffer); 698 [[fallthrough]]; 699 } 700 case 3: 701 // Up-to-date! 702 break; 703 } 704 705 return Error::success(); 706 } 707 708 void upgradeDebugInfo() { 709 upgradeCUSubprograms(); 710 upgradeCUVariables(); 711 upgradeCULocals(); 712 } 713 714 void callMDTypeCallback(Metadata **Val, unsigned TypeID); 715 716 public: 717 MetadataLoaderImpl(BitstreamCursor &Stream, Module &TheModule, 718 BitcodeReaderValueList &ValueList, 719 MetadataLoaderCallbacks Callbacks, bool IsImporting) 720 : MetadataList(TheModule.getContext(), Stream.SizeInBytes()), 721 ValueList(ValueList), Stream(Stream), Context(TheModule.getContext()), 722 TheModule(TheModule), Callbacks(std::move(Callbacks)), 723 IsImporting(IsImporting) {} 724 725 Error parseMetadata(bool ModuleLevel); 726 727 bool hasFwdRefs() const { return MetadataList.hasFwdRefs(); } 728 729 Metadata *getMetadataFwdRefOrLoad(unsigned ID) { 730 if (ID < MDStringRef.size()) 731 return lazyLoadOneMDString(ID); 732 if (auto *MD = MetadataList.lookup(ID)) 733 return MD; 734 // If lazy-loading is enabled, we try recursively to load the operand 735 // instead of creating a temporary. 736 if (ID < (MDStringRef.size() + GlobalMetadataBitPosIndex.size())) { 737 PlaceholderQueue Placeholders; 738 lazyLoadOneMetadata(ID, Placeholders); 739 resolveForwardRefsAndPlaceholders(Placeholders); 740 return MetadataList.lookup(ID); 741 } 742 return MetadataList.getMetadataFwdRef(ID); 743 } 744 745 DISubprogram *lookupSubprogramForFunction(Function *F) { 746 return FunctionsWithSPs.lookup(F); 747 } 748 749 bool hasSeenOldLoopTags() const { return HasSeenOldLoopTags; } 750 751 Error parseMetadataAttachment(Function &F, 752 ArrayRef<Instruction *> InstructionList); 753 754 Error parseMetadataKinds(); 755 756 void setStripTBAA(bool Value) { StripTBAA = Value; } 757 bool isStrippingTBAA() const { return StripTBAA; } 758 759 unsigned size() const { return MetadataList.size(); } 760 void shrinkTo(unsigned N) { MetadataList.shrinkTo(N); } 761 void upgradeDebugIntrinsics(Function &F) { upgradeDeclareExpressions(F); } 762 }; 763 764 Expected<bool> 765 MetadataLoader::MetadataLoaderImpl::lazyLoadModuleMetadataBlock() { 766 IndexCursor = Stream; 767 SmallVector<uint64_t, 64> Record; 768 GlobalDeclAttachmentPos = 0; 769 // Get the abbrevs, and preload record positions to make them lazy-loadable. 770 while (true) { 771 uint64_t SavedPos = IndexCursor.GetCurrentBitNo(); 772 BitstreamEntry Entry; 773 if (Error E = 774 IndexCursor 775 .advanceSkippingSubblocks(BitstreamCursor::AF_DontPopBlockAtEnd) 776 .moveInto(Entry)) 777 return std::move(E); 778 779 switch (Entry.Kind) { 780 case BitstreamEntry::SubBlock: // Handled for us already. 781 case BitstreamEntry::Error: 782 return error("Malformed block"); 783 case BitstreamEntry::EndBlock: { 784 return true; 785 } 786 case BitstreamEntry::Record: { 787 // The interesting case. 788 ++NumMDRecordLoaded; 789 uint64_t CurrentPos = IndexCursor.GetCurrentBitNo(); 790 unsigned Code; 791 if (Error E = IndexCursor.skipRecord(Entry.ID).moveInto(Code)) 792 return std::move(E); 793 switch (Code) { 794 case bitc::METADATA_STRINGS: { 795 // Rewind and parse the strings. 796 if (Error Err = IndexCursor.JumpToBit(CurrentPos)) 797 return std::move(Err); 798 StringRef Blob; 799 Record.clear(); 800 if (Expected<unsigned> MaybeRecord = 801 IndexCursor.readRecord(Entry.ID, Record, &Blob)) 802 ; 803 else 804 return MaybeRecord.takeError(); 805 unsigned NumStrings = Record[0]; 806 MDStringRef.reserve(NumStrings); 807 auto IndexNextMDString = [&](StringRef Str) { 808 MDStringRef.push_back(Str); 809 }; 810 if (auto Err = parseMetadataStrings(Record, Blob, IndexNextMDString)) 811 return std::move(Err); 812 break; 813 } 814 case bitc::METADATA_INDEX_OFFSET: { 815 // This is the offset to the index, when we see this we skip all the 816 // records and load only an index to these. 817 if (Error Err = IndexCursor.JumpToBit(CurrentPos)) 818 return std::move(Err); 819 Record.clear(); 820 if (Expected<unsigned> MaybeRecord = 821 IndexCursor.readRecord(Entry.ID, Record)) 822 ; 823 else 824 return MaybeRecord.takeError(); 825 if (Record.size() != 2) 826 return error("Invalid record"); 827 auto Offset = Record[0] + (Record[1] << 32); 828 auto BeginPos = IndexCursor.GetCurrentBitNo(); 829 if (Error Err = IndexCursor.JumpToBit(BeginPos + Offset)) 830 return std::move(Err); 831 Expected<BitstreamEntry> MaybeEntry = 832 IndexCursor.advanceSkippingSubblocks( 833 BitstreamCursor::AF_DontPopBlockAtEnd); 834 if (!MaybeEntry) 835 return MaybeEntry.takeError(); 836 Entry = MaybeEntry.get(); 837 assert(Entry.Kind == BitstreamEntry::Record && 838 "Corrupted bitcode: Expected `Record` when trying to find the " 839 "Metadata index"); 840 Record.clear(); 841 if (Expected<unsigned> MaybeCode = 842 IndexCursor.readRecord(Entry.ID, Record)) 843 assert(MaybeCode.get() == bitc::METADATA_INDEX && 844 "Corrupted bitcode: Expected `METADATA_INDEX` when trying to " 845 "find the Metadata index"); 846 else 847 return MaybeCode.takeError(); 848 // Delta unpack 849 auto CurrentValue = BeginPos; 850 GlobalMetadataBitPosIndex.reserve(Record.size()); 851 for (auto &Elt : Record) { 852 CurrentValue += Elt; 853 GlobalMetadataBitPosIndex.push_back(CurrentValue); 854 } 855 break; 856 } 857 case bitc::METADATA_INDEX: 858 // We don't expect to get there, the Index is loaded when we encounter 859 // the offset. 860 return error("Corrupted Metadata block"); 861 case bitc::METADATA_NAME: { 862 // Named metadata need to be materialized now and aren't deferred. 863 if (Error Err = IndexCursor.JumpToBit(CurrentPos)) 864 return std::move(Err); 865 Record.clear(); 866 867 unsigned Code; 868 if (Expected<unsigned> MaybeCode = 869 IndexCursor.readRecord(Entry.ID, Record)) { 870 Code = MaybeCode.get(); 871 assert(Code == bitc::METADATA_NAME); 872 } else 873 return MaybeCode.takeError(); 874 875 // Read name of the named metadata. 876 SmallString<8> Name(Record.begin(), Record.end()); 877 if (Expected<unsigned> MaybeCode = IndexCursor.ReadCode()) 878 Code = MaybeCode.get(); 879 else 880 return MaybeCode.takeError(); 881 882 // Named Metadata comes in two parts, we expect the name to be followed 883 // by the node 884 Record.clear(); 885 if (Expected<unsigned> MaybeNextBitCode = 886 IndexCursor.readRecord(Code, Record)) 887 assert(MaybeNextBitCode.get() == bitc::METADATA_NAMED_NODE); 888 else 889 return MaybeNextBitCode.takeError(); 890 891 // Read named metadata elements. 892 unsigned Size = Record.size(); 893 NamedMDNode *NMD = TheModule.getOrInsertNamedMetadata(Name); 894 for (unsigned i = 0; i != Size; ++i) { 895 // FIXME: We could use a placeholder here, however NamedMDNode are 896 // taking MDNode as operand and not using the Metadata infrastructure. 897 // It is acknowledged by 'TODO: Inherit from Metadata' in the 898 // NamedMDNode class definition. 899 MDNode *MD = MetadataList.getMDNodeFwdRefOrNull(Record[i]); 900 assert(MD && "Invalid metadata: expect fwd ref to MDNode"); 901 NMD->addOperand(MD); 902 } 903 break; 904 } 905 case bitc::METADATA_GLOBAL_DECL_ATTACHMENT: { 906 if (!GlobalDeclAttachmentPos) 907 GlobalDeclAttachmentPos = SavedPos; 908 #ifndef NDEBUG 909 NumGlobalDeclAttachSkipped++; 910 #endif 911 break; 912 } 913 case bitc::METADATA_KIND: 914 case bitc::METADATA_STRING_OLD: 915 case bitc::METADATA_OLD_FN_NODE: 916 case bitc::METADATA_OLD_NODE: 917 case bitc::METADATA_VALUE: 918 case bitc::METADATA_DISTINCT_NODE: 919 case bitc::METADATA_NODE: 920 case bitc::METADATA_LOCATION: 921 case bitc::METADATA_GENERIC_DEBUG: 922 case bitc::METADATA_SUBRANGE: 923 case bitc::METADATA_ENUMERATOR: 924 case bitc::METADATA_BASIC_TYPE: 925 case bitc::METADATA_STRING_TYPE: 926 case bitc::METADATA_DERIVED_TYPE: 927 case bitc::METADATA_COMPOSITE_TYPE: 928 case bitc::METADATA_SUBROUTINE_TYPE: 929 case bitc::METADATA_MODULE: 930 case bitc::METADATA_FILE: 931 case bitc::METADATA_COMPILE_UNIT: 932 case bitc::METADATA_SUBPROGRAM: 933 case bitc::METADATA_LEXICAL_BLOCK: 934 case bitc::METADATA_LEXICAL_BLOCK_FILE: 935 case bitc::METADATA_NAMESPACE: 936 case bitc::METADATA_COMMON_BLOCK: 937 case bitc::METADATA_MACRO: 938 case bitc::METADATA_MACRO_FILE: 939 case bitc::METADATA_TEMPLATE_TYPE: 940 case bitc::METADATA_TEMPLATE_VALUE: 941 case bitc::METADATA_GLOBAL_VAR: 942 case bitc::METADATA_LOCAL_VAR: 943 case bitc::METADATA_ASSIGN_ID: 944 case bitc::METADATA_LABEL: 945 case bitc::METADATA_EXPRESSION: 946 case bitc::METADATA_OBJC_PROPERTY: 947 case bitc::METADATA_IMPORTED_ENTITY: 948 case bitc::METADATA_GLOBAL_VAR_EXPR: 949 case bitc::METADATA_GENERIC_SUBRANGE: 950 // We don't expect to see any of these, if we see one, give up on 951 // lazy-loading and fallback. 952 MDStringRef.clear(); 953 GlobalMetadataBitPosIndex.clear(); 954 return false; 955 } 956 break; 957 } 958 } 959 } 960 } 961 962 // Load the global decl attachments after building the lazy loading index. 963 // We don't load them "lazily" - all global decl attachments must be 964 // parsed since they aren't materialized on demand. However, by delaying 965 // their parsing until after the index is created, we can use the index 966 // instead of creating temporaries. 967 Expected<bool> MetadataLoader::MetadataLoaderImpl::loadGlobalDeclAttachments() { 968 // Nothing to do if we didn't find any of these metadata records. 969 if (!GlobalDeclAttachmentPos) 970 return true; 971 // Use a temporary cursor so that we don't mess up the main Stream cursor or 972 // the lazy loading IndexCursor (which holds the necessary abbrev ids). 973 BitstreamCursor TempCursor = Stream; 974 SmallVector<uint64_t, 64> Record; 975 // Jump to the position before the first global decl attachment, so we can 976 // scan for the first BitstreamEntry record. 977 if (Error Err = TempCursor.JumpToBit(GlobalDeclAttachmentPos)) 978 return std::move(Err); 979 while (true) { 980 BitstreamEntry Entry; 981 if (Error E = 982 TempCursor 983 .advanceSkippingSubblocks(BitstreamCursor::AF_DontPopBlockAtEnd) 984 .moveInto(Entry)) 985 return std::move(E); 986 987 switch (Entry.Kind) { 988 case BitstreamEntry::SubBlock: // Handled for us already. 989 case BitstreamEntry::Error: 990 return error("Malformed block"); 991 case BitstreamEntry::EndBlock: 992 // Check that we parsed them all. 993 assert(NumGlobalDeclAttachSkipped == NumGlobalDeclAttachParsed); 994 return true; 995 case BitstreamEntry::Record: 996 break; 997 } 998 uint64_t CurrentPos = TempCursor.GetCurrentBitNo(); 999 Expected<unsigned> MaybeCode = TempCursor.skipRecord(Entry.ID); 1000 if (!MaybeCode) 1001 return MaybeCode.takeError(); 1002 if (MaybeCode.get() != bitc::METADATA_GLOBAL_DECL_ATTACHMENT) { 1003 // Anything other than a global decl attachment signals the end of 1004 // these records. Check that we parsed them all. 1005 assert(NumGlobalDeclAttachSkipped == NumGlobalDeclAttachParsed); 1006 return true; 1007 } 1008 #ifndef NDEBUG 1009 NumGlobalDeclAttachParsed++; 1010 #endif 1011 // FIXME: we need to do this early because we don't materialize global 1012 // value explicitly. 1013 if (Error Err = TempCursor.JumpToBit(CurrentPos)) 1014 return std::move(Err); 1015 Record.clear(); 1016 if (Expected<unsigned> MaybeRecord = 1017 TempCursor.readRecord(Entry.ID, Record)) 1018 ; 1019 else 1020 return MaybeRecord.takeError(); 1021 if (Record.size() % 2 == 0) 1022 return error("Invalid record"); 1023 unsigned ValueID = Record[0]; 1024 if (ValueID >= ValueList.size()) 1025 return error("Invalid record"); 1026 if (auto *GO = dyn_cast<GlobalObject>(ValueList[ValueID])) { 1027 // Need to save and restore the current position since 1028 // parseGlobalObjectAttachment will resolve all forward references which 1029 // would require parsing from locations stored in the index. 1030 CurrentPos = TempCursor.GetCurrentBitNo(); 1031 if (Error Err = parseGlobalObjectAttachment( 1032 *GO, ArrayRef<uint64_t>(Record).slice(1))) 1033 return std::move(Err); 1034 if (Error Err = TempCursor.JumpToBit(CurrentPos)) 1035 return std::move(Err); 1036 } 1037 } 1038 } 1039 1040 void MetadataLoader::MetadataLoaderImpl::callMDTypeCallback(Metadata **Val, 1041 unsigned TypeID) { 1042 if (Callbacks.MDType) { 1043 (*Callbacks.MDType)(Val, TypeID, Callbacks.GetTypeByID, 1044 Callbacks.GetContainedTypeID); 1045 } 1046 } 1047 1048 /// Parse a METADATA_BLOCK. If ModuleLevel is true then we are parsing 1049 /// module level metadata. 1050 Error MetadataLoader::MetadataLoaderImpl::parseMetadata(bool ModuleLevel) { 1051 if (!ModuleLevel && MetadataList.hasFwdRefs()) 1052 return error("Invalid metadata: fwd refs into function blocks"); 1053 1054 // Record the entry position so that we can jump back here and efficiently 1055 // skip the whole block in case we lazy-load. 1056 auto EntryPos = Stream.GetCurrentBitNo(); 1057 1058 if (Error Err = Stream.EnterSubBlock(bitc::METADATA_BLOCK_ID)) 1059 return Err; 1060 1061 SmallVector<uint64_t, 64> Record; 1062 PlaceholderQueue Placeholders; 1063 1064 // We lazy-load module-level metadata: we build an index for each record, and 1065 // then load individual record as needed, starting with the named metadata. 1066 if (ModuleLevel && IsImporting && MetadataList.empty() && 1067 !DisableLazyLoading) { 1068 auto SuccessOrErr = lazyLoadModuleMetadataBlock(); 1069 if (!SuccessOrErr) 1070 return SuccessOrErr.takeError(); 1071 if (SuccessOrErr.get()) { 1072 // An index was successfully created and we will be able to load metadata 1073 // on-demand. 1074 MetadataList.resize(MDStringRef.size() + 1075 GlobalMetadataBitPosIndex.size()); 1076 1077 // Now that we have built the index, load the global decl attachments 1078 // that were deferred during that process. This avoids creating 1079 // temporaries. 1080 SuccessOrErr = loadGlobalDeclAttachments(); 1081 if (!SuccessOrErr) 1082 return SuccessOrErr.takeError(); 1083 assert(SuccessOrErr.get()); 1084 1085 // Reading the named metadata created forward references and/or 1086 // placeholders, that we flush here. 1087 resolveForwardRefsAndPlaceholders(Placeholders); 1088 upgradeDebugInfo(); 1089 // Return at the beginning of the block, since it is easy to skip it 1090 // entirely from there. 1091 Stream.ReadBlockEnd(); // Pop the abbrev block context. 1092 if (Error Err = IndexCursor.JumpToBit(EntryPos)) 1093 return Err; 1094 if (Error Err = Stream.SkipBlock()) { 1095 // FIXME this drops the error on the floor, which 1096 // ThinLTO/X86/debuginfo-cu-import.ll relies on. 1097 consumeError(std::move(Err)); 1098 return Error::success(); 1099 } 1100 return Error::success(); 1101 } 1102 // Couldn't load an index, fallback to loading all the block "old-style". 1103 } 1104 1105 unsigned NextMetadataNo = MetadataList.size(); 1106 1107 // Read all the records. 1108 while (true) { 1109 BitstreamEntry Entry; 1110 if (Error E = Stream.advanceSkippingSubblocks().moveInto(Entry)) 1111 return E; 1112 1113 switch (Entry.Kind) { 1114 case BitstreamEntry::SubBlock: // Handled for us already. 1115 case BitstreamEntry::Error: 1116 return error("Malformed block"); 1117 case BitstreamEntry::EndBlock: 1118 resolveForwardRefsAndPlaceholders(Placeholders); 1119 upgradeDebugInfo(); 1120 return Error::success(); 1121 case BitstreamEntry::Record: 1122 // The interesting case. 1123 break; 1124 } 1125 1126 // Read a record. 1127 Record.clear(); 1128 StringRef Blob; 1129 ++NumMDRecordLoaded; 1130 if (Expected<unsigned> MaybeCode = 1131 Stream.readRecord(Entry.ID, Record, &Blob)) { 1132 if (Error Err = parseOneMetadata(Record, MaybeCode.get(), Placeholders, 1133 Blob, NextMetadataNo)) 1134 return Err; 1135 } else 1136 return MaybeCode.takeError(); 1137 } 1138 } 1139 1140 MDString *MetadataLoader::MetadataLoaderImpl::lazyLoadOneMDString(unsigned ID) { 1141 ++NumMDStringLoaded; 1142 if (Metadata *MD = MetadataList.lookup(ID)) 1143 return cast<MDString>(MD); 1144 auto MDS = MDString::get(Context, MDStringRef[ID]); 1145 MetadataList.assignValue(MDS, ID); 1146 return MDS; 1147 } 1148 1149 void MetadataLoader::MetadataLoaderImpl::lazyLoadOneMetadata( 1150 unsigned ID, PlaceholderQueue &Placeholders) { 1151 assert(ID < (MDStringRef.size()) + GlobalMetadataBitPosIndex.size()); 1152 assert(ID >= MDStringRef.size() && "Unexpected lazy-loading of MDString"); 1153 // Lookup first if the metadata hasn't already been loaded. 1154 if (auto *MD = MetadataList.lookup(ID)) { 1155 auto *N = cast<MDNode>(MD); 1156 if (!N->isTemporary()) 1157 return; 1158 } 1159 SmallVector<uint64_t, 64> Record; 1160 StringRef Blob; 1161 if (Error Err = IndexCursor.JumpToBit( 1162 GlobalMetadataBitPosIndex[ID - MDStringRef.size()])) 1163 report_fatal_error("lazyLoadOneMetadata failed jumping: " + 1164 Twine(toString(std::move(Err)))); 1165 BitstreamEntry Entry; 1166 if (Error E = IndexCursor.advanceSkippingSubblocks().moveInto(Entry)) 1167 // FIXME this drops the error on the floor. 1168 report_fatal_error("lazyLoadOneMetadata failed advanceSkippingSubblocks: " + 1169 Twine(toString(std::move(E)))); 1170 ++NumMDRecordLoaded; 1171 if (Expected<unsigned> MaybeCode = 1172 IndexCursor.readRecord(Entry.ID, Record, &Blob)) { 1173 if (Error Err = 1174 parseOneMetadata(Record, MaybeCode.get(), Placeholders, Blob, ID)) 1175 report_fatal_error("Can't lazyload MD, parseOneMetadata: " + 1176 Twine(toString(std::move(Err)))); 1177 } else 1178 report_fatal_error("Can't lazyload MD: " + 1179 Twine(toString(MaybeCode.takeError()))); 1180 } 1181 1182 /// Ensure that all forward-references and placeholders are resolved. 1183 /// Iteratively lazy-loading metadata on-demand if needed. 1184 void MetadataLoader::MetadataLoaderImpl::resolveForwardRefsAndPlaceholders( 1185 PlaceholderQueue &Placeholders) { 1186 DenseSet<unsigned> Temporaries; 1187 while (true) { 1188 // Populate Temporaries with the placeholders that haven't been loaded yet. 1189 Placeholders.getTemporaries(MetadataList, Temporaries); 1190 1191 // If we don't have any temporary, or FwdReference, we're done! 1192 if (Temporaries.empty() && !MetadataList.hasFwdRefs()) 1193 break; 1194 1195 // First, load all the temporaries. This can add new placeholders or 1196 // forward references. 1197 for (auto ID : Temporaries) 1198 lazyLoadOneMetadata(ID, Placeholders); 1199 Temporaries.clear(); 1200 1201 // Second, load the forward-references. This can also add new placeholders 1202 // or forward references. 1203 while (MetadataList.hasFwdRefs()) 1204 lazyLoadOneMetadata(MetadataList.getNextFwdRef(), Placeholders); 1205 } 1206 // At this point we don't have any forward reference remaining, or temporary 1207 // that haven't been loaded. We can safely drop RAUW support and mark cycles 1208 // as resolved. 1209 MetadataList.tryToResolveCycles(); 1210 1211 // Finally, everything is in place, we can replace the placeholders operands 1212 // with the final node they refer to. 1213 Placeholders.flush(MetadataList); 1214 } 1215 1216 Error MetadataLoader::MetadataLoaderImpl::parseOneMetadata( 1217 SmallVectorImpl<uint64_t> &Record, unsigned Code, 1218 PlaceholderQueue &Placeholders, StringRef Blob, unsigned &NextMetadataNo) { 1219 1220 bool IsDistinct = false; 1221 auto getMD = [&](unsigned ID) -> Metadata * { 1222 if (ID < MDStringRef.size()) 1223 return lazyLoadOneMDString(ID); 1224 if (!IsDistinct) { 1225 if (auto *MD = MetadataList.lookup(ID)) 1226 return MD; 1227 // If lazy-loading is enabled, we try recursively to load the operand 1228 // instead of creating a temporary. 1229 if (ID < (MDStringRef.size() + GlobalMetadataBitPosIndex.size())) { 1230 // Create a temporary for the node that is referencing the operand we 1231 // will lazy-load. It is needed before recursing in case there are 1232 // uniquing cycles. 1233 MetadataList.getMetadataFwdRef(NextMetadataNo); 1234 lazyLoadOneMetadata(ID, Placeholders); 1235 return MetadataList.lookup(ID); 1236 } 1237 // Return a temporary. 1238 return MetadataList.getMetadataFwdRef(ID); 1239 } 1240 if (auto *MD = MetadataList.getMetadataIfResolved(ID)) 1241 return MD; 1242 return &Placeholders.getPlaceholderOp(ID); 1243 }; 1244 auto getMDOrNull = [&](unsigned ID) -> Metadata * { 1245 if (ID) 1246 return getMD(ID - 1); 1247 return nullptr; 1248 }; 1249 auto getMDOrNullWithoutPlaceholders = [&](unsigned ID) -> Metadata * { 1250 if (ID) 1251 return MetadataList.getMetadataFwdRef(ID - 1); 1252 return nullptr; 1253 }; 1254 auto getMDString = [&](unsigned ID) -> MDString * { 1255 // This requires that the ID is not really a forward reference. In 1256 // particular, the MDString must already have been resolved. 1257 auto MDS = getMDOrNull(ID); 1258 return cast_or_null<MDString>(MDS); 1259 }; 1260 1261 // Support for old type refs. 1262 auto getDITypeRefOrNull = [&](unsigned ID) { 1263 return MetadataList.upgradeTypeRef(getMDOrNull(ID)); 1264 }; 1265 1266 #define GET_OR_DISTINCT(CLASS, ARGS) \ 1267 (IsDistinct ? CLASS::getDistinct ARGS : CLASS::get ARGS) 1268 1269 switch (Code) { 1270 default: // Default behavior: ignore. 1271 break; 1272 case bitc::METADATA_NAME: { 1273 // Read name of the named metadata. 1274 SmallString<8> Name(Record.begin(), Record.end()); 1275 Record.clear(); 1276 if (Error E = Stream.ReadCode().moveInto(Code)) 1277 return E; 1278 1279 ++NumMDRecordLoaded; 1280 if (Expected<unsigned> MaybeNextBitCode = Stream.readRecord(Code, Record)) { 1281 if (MaybeNextBitCode.get() != bitc::METADATA_NAMED_NODE) 1282 return error("METADATA_NAME not followed by METADATA_NAMED_NODE"); 1283 } else 1284 return MaybeNextBitCode.takeError(); 1285 1286 // Read named metadata elements. 1287 unsigned Size = Record.size(); 1288 NamedMDNode *NMD = TheModule.getOrInsertNamedMetadata(Name); 1289 for (unsigned i = 0; i != Size; ++i) { 1290 MDNode *MD = MetadataList.getMDNodeFwdRefOrNull(Record[i]); 1291 if (!MD) 1292 return error("Invalid named metadata: expect fwd ref to MDNode"); 1293 NMD->addOperand(MD); 1294 } 1295 break; 1296 } 1297 case bitc::METADATA_OLD_FN_NODE: { 1298 // Deprecated, but still needed to read old bitcode files. 1299 // This is a LocalAsMetadata record, the only type of function-local 1300 // metadata. 1301 if (Record.size() % 2 == 1) 1302 return error("Invalid record"); 1303 1304 // If this isn't a LocalAsMetadata record, we're dropping it. This used 1305 // to be legal, but there's no upgrade path. 1306 auto dropRecord = [&] { 1307 MetadataList.assignValue(MDNode::get(Context, std::nullopt), 1308 NextMetadataNo); 1309 NextMetadataNo++; 1310 }; 1311 if (Record.size() != 2) { 1312 dropRecord(); 1313 break; 1314 } 1315 1316 unsigned TyID = Record[0]; 1317 Type *Ty = Callbacks.GetTypeByID(TyID); 1318 if (Ty->isMetadataTy() || Ty->isVoidTy()) { 1319 dropRecord(); 1320 break; 1321 } 1322 1323 Value *V = ValueList.getValueFwdRef(Record[1], Ty, TyID, 1324 /*ConstExprInsertBB*/ nullptr); 1325 if (!V) 1326 return error("Invalid value reference from old fn metadata"); 1327 1328 MetadataList.assignValue(LocalAsMetadata::get(V), NextMetadataNo); 1329 NextMetadataNo++; 1330 break; 1331 } 1332 case bitc::METADATA_OLD_NODE: { 1333 // Deprecated, but still needed to read old bitcode files. 1334 if (Record.size() % 2 == 1) 1335 return error("Invalid record"); 1336 1337 unsigned Size = Record.size(); 1338 SmallVector<Metadata *, 8> Elts; 1339 for (unsigned i = 0; i != Size; i += 2) { 1340 unsigned TyID = Record[i]; 1341 Type *Ty = Callbacks.GetTypeByID(TyID); 1342 if (!Ty) 1343 return error("Invalid record"); 1344 if (Ty->isMetadataTy()) 1345 Elts.push_back(getMD(Record[i + 1])); 1346 else if (!Ty->isVoidTy()) { 1347 Value *V = ValueList.getValueFwdRef(Record[i + 1], Ty, TyID, 1348 /*ConstExprInsertBB*/ nullptr); 1349 if (!V) 1350 return error("Invalid value reference from old metadata"); 1351 Metadata *MD = ValueAsMetadata::get(V); 1352 assert(isa<ConstantAsMetadata>(MD) && 1353 "Expected non-function-local metadata"); 1354 callMDTypeCallback(&MD, TyID); 1355 Elts.push_back(MD); 1356 } else 1357 Elts.push_back(nullptr); 1358 } 1359 MetadataList.assignValue(MDNode::get(Context, Elts), NextMetadataNo); 1360 NextMetadataNo++; 1361 break; 1362 } 1363 case bitc::METADATA_VALUE: { 1364 if (Record.size() != 2) 1365 return error("Invalid record"); 1366 1367 unsigned TyID = Record[0]; 1368 Type *Ty = Callbacks.GetTypeByID(TyID); 1369 if (Ty->isMetadataTy() || Ty->isVoidTy()) 1370 return error("Invalid record"); 1371 1372 Value *V = ValueList.getValueFwdRef(Record[1], Ty, TyID, 1373 /*ConstExprInsertBB*/ nullptr); 1374 if (!V) 1375 return error("Invalid value reference from metadata"); 1376 1377 Metadata *MD = ValueAsMetadata::get(V); 1378 callMDTypeCallback(&MD, TyID); 1379 MetadataList.assignValue(MD, NextMetadataNo); 1380 NextMetadataNo++; 1381 break; 1382 } 1383 case bitc::METADATA_DISTINCT_NODE: 1384 IsDistinct = true; 1385 [[fallthrough]]; 1386 case bitc::METADATA_NODE: { 1387 SmallVector<Metadata *, 8> Elts; 1388 Elts.reserve(Record.size()); 1389 for (unsigned ID : Record) 1390 Elts.push_back(getMDOrNull(ID)); 1391 MetadataList.assignValue(IsDistinct ? MDNode::getDistinct(Context, Elts) 1392 : MDNode::get(Context, Elts), 1393 NextMetadataNo); 1394 NextMetadataNo++; 1395 break; 1396 } 1397 case bitc::METADATA_LOCATION: { 1398 if (Record.size() != 5 && Record.size() != 6) 1399 return error("Invalid record"); 1400 1401 IsDistinct = Record[0]; 1402 unsigned Line = Record[1]; 1403 unsigned Column = Record[2]; 1404 Metadata *Scope = getMD(Record[3]); 1405 Metadata *InlinedAt = getMDOrNull(Record[4]); 1406 bool ImplicitCode = Record.size() == 6 && Record[5]; 1407 MetadataList.assignValue( 1408 GET_OR_DISTINCT(DILocation, (Context, Line, Column, Scope, InlinedAt, 1409 ImplicitCode)), 1410 NextMetadataNo); 1411 NextMetadataNo++; 1412 break; 1413 } 1414 case bitc::METADATA_GENERIC_DEBUG: { 1415 if (Record.size() < 4) 1416 return error("Invalid record"); 1417 1418 IsDistinct = Record[0]; 1419 unsigned Tag = Record[1]; 1420 unsigned Version = Record[2]; 1421 1422 if (Tag >= 1u << 16 || Version != 0) 1423 return error("Invalid record"); 1424 1425 auto *Header = getMDString(Record[3]); 1426 SmallVector<Metadata *, 8> DwarfOps; 1427 for (unsigned I = 4, E = Record.size(); I != E; ++I) 1428 DwarfOps.push_back(getMDOrNull(Record[I])); 1429 MetadataList.assignValue( 1430 GET_OR_DISTINCT(GenericDINode, (Context, Tag, Header, DwarfOps)), 1431 NextMetadataNo); 1432 NextMetadataNo++; 1433 break; 1434 } 1435 case bitc::METADATA_SUBRANGE: { 1436 Metadata *Val = nullptr; 1437 // Operand 'count' is interpreted as: 1438 // - Signed integer (version 0) 1439 // - Metadata node (version 1) 1440 // Operand 'lowerBound' is interpreted as: 1441 // - Signed integer (version 0 and 1) 1442 // - Metadata node (version 2) 1443 // Operands 'upperBound' and 'stride' are interpreted as: 1444 // - Metadata node (version 2) 1445 switch (Record[0] >> 1) { 1446 case 0: 1447 Val = GET_OR_DISTINCT(DISubrange, 1448 (Context, Record[1], unrotateSign(Record[2]))); 1449 break; 1450 case 1: 1451 Val = GET_OR_DISTINCT(DISubrange, (Context, getMDOrNull(Record[1]), 1452 unrotateSign(Record[2]))); 1453 break; 1454 case 2: 1455 Val = GET_OR_DISTINCT( 1456 DISubrange, (Context, getMDOrNull(Record[1]), getMDOrNull(Record[2]), 1457 getMDOrNull(Record[3]), getMDOrNull(Record[4]))); 1458 break; 1459 default: 1460 return error("Invalid record: Unsupported version of DISubrange"); 1461 } 1462 1463 MetadataList.assignValue(Val, NextMetadataNo); 1464 IsDistinct = Record[0] & 1; 1465 NextMetadataNo++; 1466 break; 1467 } 1468 case bitc::METADATA_GENERIC_SUBRANGE: { 1469 Metadata *Val = nullptr; 1470 Val = GET_OR_DISTINCT(DIGenericSubrange, 1471 (Context, getMDOrNull(Record[1]), 1472 getMDOrNull(Record[2]), getMDOrNull(Record[3]), 1473 getMDOrNull(Record[4]))); 1474 1475 MetadataList.assignValue(Val, NextMetadataNo); 1476 IsDistinct = Record[0] & 1; 1477 NextMetadataNo++; 1478 break; 1479 } 1480 case bitc::METADATA_ENUMERATOR: { 1481 if (Record.size() < 3) 1482 return error("Invalid record"); 1483 1484 IsDistinct = Record[0] & 1; 1485 bool IsUnsigned = Record[0] & 2; 1486 bool IsBigInt = Record[0] & 4; 1487 APInt Value; 1488 1489 if (IsBigInt) { 1490 const uint64_t BitWidth = Record[1]; 1491 const size_t NumWords = Record.size() - 3; 1492 Value = readWideAPInt(ArrayRef(&Record[3], NumWords), BitWidth); 1493 } else 1494 Value = APInt(64, unrotateSign(Record[1]), !IsUnsigned); 1495 1496 MetadataList.assignValue( 1497 GET_OR_DISTINCT(DIEnumerator, 1498 (Context, Value, IsUnsigned, getMDString(Record[2]))), 1499 NextMetadataNo); 1500 NextMetadataNo++; 1501 break; 1502 } 1503 case bitc::METADATA_BASIC_TYPE: { 1504 if (Record.size() < 6 || Record.size() > 7) 1505 return error("Invalid record"); 1506 1507 IsDistinct = Record[0]; 1508 DINode::DIFlags Flags = (Record.size() > 6) 1509 ? static_cast<DINode::DIFlags>(Record[6]) 1510 : DINode::FlagZero; 1511 1512 MetadataList.assignValue( 1513 GET_OR_DISTINCT(DIBasicType, 1514 (Context, Record[1], getMDString(Record[2]), Record[3], 1515 Record[4], Record[5], Flags)), 1516 NextMetadataNo); 1517 NextMetadataNo++; 1518 break; 1519 } 1520 case bitc::METADATA_STRING_TYPE: { 1521 if (Record.size() > 9 || Record.size() < 8) 1522 return error("Invalid record"); 1523 1524 IsDistinct = Record[0]; 1525 bool SizeIs8 = Record.size() == 8; 1526 // StringLocationExp (i.e. Record[5]) is added at a later time 1527 // than the other fields. The code here enables backward compatibility. 1528 Metadata *StringLocationExp = SizeIs8 ? nullptr : getMDOrNull(Record[5]); 1529 unsigned Offset = SizeIs8 ? 5 : 6; 1530 MetadataList.assignValue( 1531 GET_OR_DISTINCT(DIStringType, 1532 (Context, Record[1], getMDString(Record[2]), 1533 getMDOrNull(Record[3]), getMDOrNull(Record[4]), 1534 StringLocationExp, Record[Offset], Record[Offset + 1], 1535 Record[Offset + 2])), 1536 NextMetadataNo); 1537 NextMetadataNo++; 1538 break; 1539 } 1540 case bitc::METADATA_DERIVED_TYPE: { 1541 if (Record.size() < 12 || Record.size() > 14) 1542 return error("Invalid record"); 1543 1544 // DWARF address space is encoded as N->getDWARFAddressSpace() + 1. 0 means 1545 // that there is no DWARF address space associated with DIDerivedType. 1546 std::optional<unsigned> DWARFAddressSpace; 1547 if (Record.size() > 12 && Record[12]) 1548 DWARFAddressSpace = Record[12] - 1; 1549 1550 Metadata *Annotations = nullptr; 1551 if (Record.size() > 13 && Record[13]) 1552 Annotations = getMDOrNull(Record[13]); 1553 1554 IsDistinct = Record[0]; 1555 DINode::DIFlags Flags = static_cast<DINode::DIFlags>(Record[10]); 1556 MetadataList.assignValue( 1557 GET_OR_DISTINCT(DIDerivedType, 1558 (Context, Record[1], getMDString(Record[2]), 1559 getMDOrNull(Record[3]), Record[4], 1560 getDITypeRefOrNull(Record[5]), 1561 getDITypeRefOrNull(Record[6]), Record[7], Record[8], 1562 Record[9], DWARFAddressSpace, Flags, 1563 getDITypeRefOrNull(Record[11]), Annotations)), 1564 NextMetadataNo); 1565 NextMetadataNo++; 1566 break; 1567 } 1568 case bitc::METADATA_COMPOSITE_TYPE: { 1569 if (Record.size() < 16 || Record.size() > 22) 1570 return error("Invalid record"); 1571 1572 // If we have a UUID and this is not a forward declaration, lookup the 1573 // mapping. 1574 IsDistinct = Record[0] & 0x1; 1575 bool IsNotUsedInTypeRef = Record[0] >= 2; 1576 unsigned Tag = Record[1]; 1577 MDString *Name = getMDString(Record[2]); 1578 Metadata *File = getMDOrNull(Record[3]); 1579 unsigned Line = Record[4]; 1580 Metadata *Scope = getDITypeRefOrNull(Record[5]); 1581 Metadata *BaseType = nullptr; 1582 uint64_t SizeInBits = Record[7]; 1583 if (Record[8] > (uint64_t)std::numeric_limits<uint32_t>::max()) 1584 return error("Alignment value is too large"); 1585 uint32_t AlignInBits = Record[8]; 1586 uint64_t OffsetInBits = 0; 1587 DINode::DIFlags Flags = static_cast<DINode::DIFlags>(Record[10]); 1588 Metadata *Elements = nullptr; 1589 unsigned RuntimeLang = Record[12]; 1590 Metadata *VTableHolder = nullptr; 1591 Metadata *TemplateParams = nullptr; 1592 Metadata *Discriminator = nullptr; 1593 Metadata *DataLocation = nullptr; 1594 Metadata *Associated = nullptr; 1595 Metadata *Allocated = nullptr; 1596 Metadata *Rank = nullptr; 1597 Metadata *Annotations = nullptr; 1598 auto *Identifier = getMDString(Record[15]); 1599 // If this module is being parsed so that it can be ThinLTO imported 1600 // into another module, composite types only need to be imported 1601 // as type declarations (unless full type definitions requested). 1602 // Create type declarations up front to save memory. Also, buildODRType 1603 // handles the case where this is type ODRed with a definition needed 1604 // by the importing module, in which case the existing definition is 1605 // used. 1606 if (IsImporting && !ImportFullTypeDefinitions && Identifier && 1607 (Tag == dwarf::DW_TAG_enumeration_type || 1608 Tag == dwarf::DW_TAG_class_type || 1609 Tag == dwarf::DW_TAG_structure_type || 1610 Tag == dwarf::DW_TAG_union_type)) { 1611 Flags = Flags | DINode::FlagFwdDecl; 1612 if (Name) { 1613 // This is a hack around preserving template parameters for simplified 1614 // template names - it should probably be replaced with a 1615 // DICompositeType flag specifying whether template parameters are 1616 // required on declarations of this type. 1617 StringRef NameStr = Name->getString(); 1618 if (!NameStr.contains('<') || NameStr.startswith("_STN|")) 1619 TemplateParams = getMDOrNull(Record[14]); 1620 } 1621 } else { 1622 BaseType = getDITypeRefOrNull(Record[6]); 1623 OffsetInBits = Record[9]; 1624 Elements = getMDOrNull(Record[11]); 1625 VTableHolder = getDITypeRefOrNull(Record[13]); 1626 TemplateParams = getMDOrNull(Record[14]); 1627 if (Record.size() > 16) 1628 Discriminator = getMDOrNull(Record[16]); 1629 if (Record.size() > 17) 1630 DataLocation = getMDOrNull(Record[17]); 1631 if (Record.size() > 19) { 1632 Associated = getMDOrNull(Record[18]); 1633 Allocated = getMDOrNull(Record[19]); 1634 } 1635 if (Record.size() > 20) { 1636 Rank = getMDOrNull(Record[20]); 1637 } 1638 if (Record.size() > 21) { 1639 Annotations = getMDOrNull(Record[21]); 1640 } 1641 } 1642 DICompositeType *CT = nullptr; 1643 if (Identifier) 1644 CT = DICompositeType::buildODRType( 1645 Context, *Identifier, Tag, Name, File, Line, Scope, BaseType, 1646 SizeInBits, AlignInBits, OffsetInBits, Flags, Elements, RuntimeLang, 1647 VTableHolder, TemplateParams, Discriminator, DataLocation, Associated, 1648 Allocated, Rank, Annotations); 1649 1650 // Create a node if we didn't get a lazy ODR type. 1651 if (!CT) 1652 CT = GET_OR_DISTINCT(DICompositeType, 1653 (Context, Tag, Name, File, Line, Scope, BaseType, 1654 SizeInBits, AlignInBits, OffsetInBits, Flags, 1655 Elements, RuntimeLang, VTableHolder, TemplateParams, 1656 Identifier, Discriminator, DataLocation, Associated, 1657 Allocated, Rank, Annotations)); 1658 if (!IsNotUsedInTypeRef && Identifier) 1659 MetadataList.addTypeRef(*Identifier, *cast<DICompositeType>(CT)); 1660 1661 MetadataList.assignValue(CT, NextMetadataNo); 1662 NextMetadataNo++; 1663 break; 1664 } 1665 case bitc::METADATA_SUBROUTINE_TYPE: { 1666 if (Record.size() < 3 || Record.size() > 4) 1667 return error("Invalid record"); 1668 bool IsOldTypeRefArray = Record[0] < 2; 1669 unsigned CC = (Record.size() > 3) ? Record[3] : 0; 1670 1671 IsDistinct = Record[0] & 0x1; 1672 DINode::DIFlags Flags = static_cast<DINode::DIFlags>(Record[1]); 1673 Metadata *Types = getMDOrNull(Record[2]); 1674 if (LLVM_UNLIKELY(IsOldTypeRefArray)) 1675 Types = MetadataList.upgradeTypeRefArray(Types); 1676 1677 MetadataList.assignValue( 1678 GET_OR_DISTINCT(DISubroutineType, (Context, Flags, CC, Types)), 1679 NextMetadataNo); 1680 NextMetadataNo++; 1681 break; 1682 } 1683 1684 case bitc::METADATA_MODULE: { 1685 if (Record.size() < 5 || Record.size() > 9) 1686 return error("Invalid record"); 1687 1688 unsigned Offset = Record.size() >= 8 ? 2 : 1; 1689 IsDistinct = Record[0]; 1690 MetadataList.assignValue( 1691 GET_OR_DISTINCT( 1692 DIModule, 1693 (Context, Record.size() >= 8 ? getMDOrNull(Record[1]) : nullptr, 1694 getMDOrNull(Record[0 + Offset]), getMDString(Record[1 + Offset]), 1695 getMDString(Record[2 + Offset]), getMDString(Record[3 + Offset]), 1696 getMDString(Record[4 + Offset]), 1697 Record.size() <= 7 ? 0 : Record[7], 1698 Record.size() <= 8 ? false : Record[8])), 1699 NextMetadataNo); 1700 NextMetadataNo++; 1701 break; 1702 } 1703 1704 case bitc::METADATA_FILE: { 1705 if (Record.size() != 3 && Record.size() != 5 && Record.size() != 6) 1706 return error("Invalid record"); 1707 1708 IsDistinct = Record[0]; 1709 std::optional<DIFile::ChecksumInfo<MDString *>> Checksum; 1710 // The BitcodeWriter writes null bytes into Record[3:4] when the Checksum 1711 // is not present. This matches up with the old internal representation, 1712 // and the old encoding for CSK_None in the ChecksumKind. The new 1713 // representation reserves the value 0 in the ChecksumKind to continue to 1714 // encode None in a backwards-compatible way. 1715 if (Record.size() > 4 && Record[3] && Record[4]) 1716 Checksum.emplace(static_cast<DIFile::ChecksumKind>(Record[3]), 1717 getMDString(Record[4])); 1718 MetadataList.assignValue( 1719 GET_OR_DISTINCT(DIFile, 1720 (Context, getMDString(Record[1]), 1721 getMDString(Record[2]), Checksum, 1722 Record.size() > 5 ? getMDString(Record[5]) : nullptr)), 1723 NextMetadataNo); 1724 NextMetadataNo++; 1725 break; 1726 } 1727 case bitc::METADATA_COMPILE_UNIT: { 1728 if (Record.size() < 14 || Record.size() > 22) 1729 return error("Invalid record"); 1730 1731 // Ignore Record[0], which indicates whether this compile unit is 1732 // distinct. It's always distinct. 1733 IsDistinct = true; 1734 auto *CU = DICompileUnit::getDistinct( 1735 Context, Record[1], getMDOrNull(Record[2]), getMDString(Record[3]), 1736 Record[4], getMDString(Record[5]), Record[6], getMDString(Record[7]), 1737 Record[8], getMDOrNull(Record[9]), getMDOrNull(Record[10]), 1738 getMDOrNull(Record[12]), getMDOrNull(Record[13]), 1739 Record.size() <= 15 ? nullptr : getMDOrNull(Record[15]), 1740 Record.size() <= 14 ? 0 : Record[14], 1741 Record.size() <= 16 ? true : Record[16], 1742 Record.size() <= 17 ? false : Record[17], 1743 Record.size() <= 18 ? 0 : Record[18], 1744 Record.size() <= 19 ? false : Record[19], 1745 Record.size() <= 20 ? nullptr : getMDString(Record[20]), 1746 Record.size() <= 21 ? nullptr : getMDString(Record[21])); 1747 1748 MetadataList.assignValue(CU, NextMetadataNo); 1749 NextMetadataNo++; 1750 1751 // Move the Upgrade the list of subprograms. 1752 if (Metadata *SPs = getMDOrNullWithoutPlaceholders(Record[11])) 1753 CUSubprograms.push_back({CU, SPs}); 1754 break; 1755 } 1756 case bitc::METADATA_SUBPROGRAM: { 1757 if (Record.size() < 18 || Record.size() > 21) 1758 return error("Invalid record"); 1759 1760 bool HasSPFlags = Record[0] & 4; 1761 1762 DINode::DIFlags Flags; 1763 DISubprogram::DISPFlags SPFlags; 1764 if (!HasSPFlags) 1765 Flags = static_cast<DINode::DIFlags>(Record[11 + 2]); 1766 else { 1767 Flags = static_cast<DINode::DIFlags>(Record[11]); 1768 SPFlags = static_cast<DISubprogram::DISPFlags>(Record[9]); 1769 } 1770 1771 // Support for old metadata when 1772 // subprogram specific flags are placed in DIFlags. 1773 const unsigned DIFlagMainSubprogram = 1 << 21; 1774 bool HasOldMainSubprogramFlag = Flags & DIFlagMainSubprogram; 1775 if (HasOldMainSubprogramFlag) 1776 // Remove old DIFlagMainSubprogram from DIFlags. 1777 // Note: This assumes that any future use of bit 21 defaults to it 1778 // being 0. 1779 Flags &= ~static_cast<DINode::DIFlags>(DIFlagMainSubprogram); 1780 1781 if (HasOldMainSubprogramFlag && HasSPFlags) 1782 SPFlags |= DISubprogram::SPFlagMainSubprogram; 1783 else if (!HasSPFlags) 1784 SPFlags = DISubprogram::toSPFlags( 1785 /*IsLocalToUnit=*/Record[7], /*IsDefinition=*/Record[8], 1786 /*IsOptimized=*/Record[14], /*Virtuality=*/Record[11], 1787 /*IsMainSubprogram=*/HasOldMainSubprogramFlag); 1788 1789 // All definitions should be distinct. 1790 IsDistinct = (Record[0] & 1) || (SPFlags & DISubprogram::SPFlagDefinition); 1791 // Version 1 has a Function as Record[15]. 1792 // Version 2 has removed Record[15]. 1793 // Version 3 has the Unit as Record[15]. 1794 // Version 4 added thisAdjustment. 1795 // Version 5 repacked flags into DISPFlags, changing many element numbers. 1796 bool HasUnit = Record[0] & 2; 1797 if (!HasSPFlags && HasUnit && Record.size() < 19) 1798 return error("Invalid record"); 1799 if (HasSPFlags && !HasUnit) 1800 return error("Invalid record"); 1801 // Accommodate older formats. 1802 bool HasFn = false; 1803 bool HasThisAdj = true; 1804 bool HasThrownTypes = true; 1805 bool HasAnnotations = false; 1806 bool HasTargetFuncName = false; 1807 unsigned OffsetA = 0; 1808 unsigned OffsetB = 0; 1809 if (!HasSPFlags) { 1810 OffsetA = 2; 1811 OffsetB = 2; 1812 if (Record.size() >= 19) { 1813 HasFn = !HasUnit; 1814 OffsetB++; 1815 } 1816 HasThisAdj = Record.size() >= 20; 1817 HasThrownTypes = Record.size() >= 21; 1818 } else { 1819 HasAnnotations = Record.size() >= 19; 1820 HasTargetFuncName = Record.size() >= 20; 1821 } 1822 Metadata *CUorFn = getMDOrNull(Record[12 + OffsetB]); 1823 DISubprogram *SP = GET_OR_DISTINCT( 1824 DISubprogram, 1825 (Context, 1826 getDITypeRefOrNull(Record[1]), // scope 1827 getMDString(Record[2]), // name 1828 getMDString(Record[3]), // linkageName 1829 getMDOrNull(Record[4]), // file 1830 Record[5], // line 1831 getMDOrNull(Record[6]), // type 1832 Record[7 + OffsetA], // scopeLine 1833 getDITypeRefOrNull(Record[8 + OffsetA]), // containingType 1834 Record[10 + OffsetA], // virtualIndex 1835 HasThisAdj ? Record[16 + OffsetB] : 0, // thisAdjustment 1836 Flags, // flags 1837 SPFlags, // SPFlags 1838 HasUnit ? CUorFn : nullptr, // unit 1839 getMDOrNull(Record[13 + OffsetB]), // templateParams 1840 getMDOrNull(Record[14 + OffsetB]), // declaration 1841 getMDOrNull(Record[15 + OffsetB]), // retainedNodes 1842 HasThrownTypes ? getMDOrNull(Record[17 + OffsetB]) 1843 : nullptr, // thrownTypes 1844 HasAnnotations ? getMDOrNull(Record[18 + OffsetB]) 1845 : nullptr, // annotations 1846 HasTargetFuncName ? getMDString(Record[19 + OffsetB]) 1847 : nullptr // targetFuncName 1848 )); 1849 MetadataList.assignValue(SP, NextMetadataNo); 1850 NextMetadataNo++; 1851 1852 // Upgrade sp->function mapping to function->sp mapping. 1853 if (HasFn) { 1854 if (auto *CMD = dyn_cast_or_null<ConstantAsMetadata>(CUorFn)) 1855 if (auto *F = dyn_cast<Function>(CMD->getValue())) { 1856 if (F->isMaterializable()) 1857 // Defer until materialized; unmaterialized functions may not have 1858 // metadata. 1859 FunctionsWithSPs[F] = SP; 1860 else if (!F->empty()) 1861 F->setSubprogram(SP); 1862 } 1863 } 1864 break; 1865 } 1866 case bitc::METADATA_LEXICAL_BLOCK: { 1867 if (Record.size() != 5) 1868 return error("Invalid record"); 1869 1870 IsDistinct = Record[0]; 1871 MetadataList.assignValue( 1872 GET_OR_DISTINCT(DILexicalBlock, 1873 (Context, getMDOrNull(Record[1]), 1874 getMDOrNull(Record[2]), Record[3], Record[4])), 1875 NextMetadataNo); 1876 NextMetadataNo++; 1877 break; 1878 } 1879 case bitc::METADATA_LEXICAL_BLOCK_FILE: { 1880 if (Record.size() != 4) 1881 return error("Invalid record"); 1882 1883 IsDistinct = Record[0]; 1884 MetadataList.assignValue( 1885 GET_OR_DISTINCT(DILexicalBlockFile, 1886 (Context, getMDOrNull(Record[1]), 1887 getMDOrNull(Record[2]), Record[3])), 1888 NextMetadataNo); 1889 NextMetadataNo++; 1890 break; 1891 } 1892 case bitc::METADATA_COMMON_BLOCK: { 1893 IsDistinct = Record[0] & 1; 1894 MetadataList.assignValue( 1895 GET_OR_DISTINCT(DICommonBlock, 1896 (Context, getMDOrNull(Record[1]), 1897 getMDOrNull(Record[2]), getMDString(Record[3]), 1898 getMDOrNull(Record[4]), Record[5])), 1899 NextMetadataNo); 1900 NextMetadataNo++; 1901 break; 1902 } 1903 case bitc::METADATA_NAMESPACE: { 1904 // Newer versions of DINamespace dropped file and line. 1905 MDString *Name; 1906 if (Record.size() == 3) 1907 Name = getMDString(Record[2]); 1908 else if (Record.size() == 5) 1909 Name = getMDString(Record[3]); 1910 else 1911 return error("Invalid record"); 1912 1913 IsDistinct = Record[0] & 1; 1914 bool ExportSymbols = Record[0] & 2; 1915 MetadataList.assignValue( 1916 GET_OR_DISTINCT(DINamespace, 1917 (Context, getMDOrNull(Record[1]), Name, ExportSymbols)), 1918 NextMetadataNo); 1919 NextMetadataNo++; 1920 break; 1921 } 1922 case bitc::METADATA_MACRO: { 1923 if (Record.size() != 5) 1924 return error("Invalid record"); 1925 1926 IsDistinct = Record[0]; 1927 MetadataList.assignValue( 1928 GET_OR_DISTINCT(DIMacro, 1929 (Context, Record[1], Record[2], getMDString(Record[3]), 1930 getMDString(Record[4]))), 1931 NextMetadataNo); 1932 NextMetadataNo++; 1933 break; 1934 } 1935 case bitc::METADATA_MACRO_FILE: { 1936 if (Record.size() != 5) 1937 return error("Invalid record"); 1938 1939 IsDistinct = Record[0]; 1940 MetadataList.assignValue( 1941 GET_OR_DISTINCT(DIMacroFile, 1942 (Context, Record[1], Record[2], getMDOrNull(Record[3]), 1943 getMDOrNull(Record[4]))), 1944 NextMetadataNo); 1945 NextMetadataNo++; 1946 break; 1947 } 1948 case bitc::METADATA_TEMPLATE_TYPE: { 1949 if (Record.size() < 3 || Record.size() > 4) 1950 return error("Invalid record"); 1951 1952 IsDistinct = Record[0]; 1953 MetadataList.assignValue( 1954 GET_OR_DISTINCT(DITemplateTypeParameter, 1955 (Context, getMDString(Record[1]), 1956 getDITypeRefOrNull(Record[2]), 1957 (Record.size() == 4) ? getMDOrNull(Record[3]) 1958 : getMDOrNull(false))), 1959 NextMetadataNo); 1960 NextMetadataNo++; 1961 break; 1962 } 1963 case bitc::METADATA_TEMPLATE_VALUE: { 1964 if (Record.size() < 5 || Record.size() > 6) 1965 return error("Invalid record"); 1966 1967 IsDistinct = Record[0]; 1968 1969 MetadataList.assignValue( 1970 GET_OR_DISTINCT( 1971 DITemplateValueParameter, 1972 (Context, Record[1], getMDString(Record[2]), 1973 getDITypeRefOrNull(Record[3]), 1974 (Record.size() == 6) ? getMDOrNull(Record[4]) : getMDOrNull(false), 1975 (Record.size() == 6) ? getMDOrNull(Record[5]) 1976 : getMDOrNull(Record[4]))), 1977 NextMetadataNo); 1978 NextMetadataNo++; 1979 break; 1980 } 1981 case bitc::METADATA_GLOBAL_VAR: { 1982 if (Record.size() < 11 || Record.size() > 13) 1983 return error("Invalid record"); 1984 1985 IsDistinct = Record[0] & 1; 1986 unsigned Version = Record[0] >> 1; 1987 1988 if (Version == 2) { 1989 Metadata *Annotations = nullptr; 1990 if (Record.size() > 12) 1991 Annotations = getMDOrNull(Record[12]); 1992 1993 MetadataList.assignValue( 1994 GET_OR_DISTINCT(DIGlobalVariable, 1995 (Context, getMDOrNull(Record[1]), 1996 getMDString(Record[2]), getMDString(Record[3]), 1997 getMDOrNull(Record[4]), Record[5], 1998 getDITypeRefOrNull(Record[6]), Record[7], Record[8], 1999 getMDOrNull(Record[9]), getMDOrNull(Record[10]), 2000 Record[11], Annotations)), 2001 NextMetadataNo); 2002 2003 NextMetadataNo++; 2004 } else if (Version == 1) { 2005 // No upgrade necessary. A null field will be introduced to indicate 2006 // that no parameter information is available. 2007 MetadataList.assignValue( 2008 GET_OR_DISTINCT( 2009 DIGlobalVariable, 2010 (Context, getMDOrNull(Record[1]), getMDString(Record[2]), 2011 getMDString(Record[3]), getMDOrNull(Record[4]), Record[5], 2012 getDITypeRefOrNull(Record[6]), Record[7], Record[8], 2013 getMDOrNull(Record[10]), nullptr, Record[11], nullptr)), 2014 NextMetadataNo); 2015 2016 NextMetadataNo++; 2017 } else if (Version == 0) { 2018 // Upgrade old metadata, which stored a global variable reference or a 2019 // ConstantInt here. 2020 NeedUpgradeToDIGlobalVariableExpression = true; 2021 Metadata *Expr = getMDOrNull(Record[9]); 2022 uint32_t AlignInBits = 0; 2023 if (Record.size() > 11) { 2024 if (Record[11] > (uint64_t)std::numeric_limits<uint32_t>::max()) 2025 return error("Alignment value is too large"); 2026 AlignInBits = Record[11]; 2027 } 2028 GlobalVariable *Attach = nullptr; 2029 if (auto *CMD = dyn_cast_or_null<ConstantAsMetadata>(Expr)) { 2030 if (auto *GV = dyn_cast<GlobalVariable>(CMD->getValue())) { 2031 Attach = GV; 2032 Expr = nullptr; 2033 } else if (auto *CI = dyn_cast<ConstantInt>(CMD->getValue())) { 2034 Expr = DIExpression::get(Context, 2035 {dwarf::DW_OP_constu, CI->getZExtValue(), 2036 dwarf::DW_OP_stack_value}); 2037 } else { 2038 Expr = nullptr; 2039 } 2040 } 2041 DIGlobalVariable *DGV = GET_OR_DISTINCT( 2042 DIGlobalVariable, 2043 (Context, getMDOrNull(Record[1]), getMDString(Record[2]), 2044 getMDString(Record[3]), getMDOrNull(Record[4]), Record[5], 2045 getDITypeRefOrNull(Record[6]), Record[7], Record[8], 2046 getMDOrNull(Record[10]), nullptr, AlignInBits, nullptr)); 2047 2048 DIGlobalVariableExpression *DGVE = nullptr; 2049 if (Attach || Expr) 2050 DGVE = DIGlobalVariableExpression::getDistinct( 2051 Context, DGV, Expr ? Expr : DIExpression::get(Context, {})); 2052 if (Attach) 2053 Attach->addDebugInfo(DGVE); 2054 2055 auto *MDNode = Expr ? cast<Metadata>(DGVE) : cast<Metadata>(DGV); 2056 MetadataList.assignValue(MDNode, NextMetadataNo); 2057 NextMetadataNo++; 2058 } else 2059 return error("Invalid record"); 2060 2061 break; 2062 } 2063 case bitc::METADATA_ASSIGN_ID: { 2064 if (Record.size() != 1) 2065 return error("Invalid DIAssignID record."); 2066 2067 IsDistinct = Record[0] & 1; 2068 if (!IsDistinct) 2069 return error("Invalid DIAssignID record. Must be distinct"); 2070 2071 MetadataList.assignValue(DIAssignID::getDistinct(Context), NextMetadataNo); 2072 NextMetadataNo++; 2073 break; 2074 } 2075 case bitc::METADATA_LOCAL_VAR: { 2076 // 10th field is for the obseleted 'inlinedAt:' field. 2077 if (Record.size() < 8 || Record.size() > 10) 2078 return error("Invalid record"); 2079 2080 IsDistinct = Record[0] & 1; 2081 bool HasAlignment = Record[0] & 2; 2082 // 2nd field used to be an artificial tag, either DW_TAG_auto_variable or 2083 // DW_TAG_arg_variable, if we have alignment flag encoded it means, that 2084 // this is newer version of record which doesn't have artificial tag. 2085 bool HasTag = !HasAlignment && Record.size() > 8; 2086 DINode::DIFlags Flags = static_cast<DINode::DIFlags>(Record[7 + HasTag]); 2087 uint32_t AlignInBits = 0; 2088 Metadata *Annotations = nullptr; 2089 if (HasAlignment) { 2090 if (Record[8] > (uint64_t)std::numeric_limits<uint32_t>::max()) 2091 return error("Alignment value is too large"); 2092 AlignInBits = Record[8]; 2093 if (Record.size() > 9) 2094 Annotations = getMDOrNull(Record[9]); 2095 } 2096 2097 MetadataList.assignValue( 2098 GET_OR_DISTINCT(DILocalVariable, 2099 (Context, getMDOrNull(Record[1 + HasTag]), 2100 getMDString(Record[2 + HasTag]), 2101 getMDOrNull(Record[3 + HasTag]), Record[4 + HasTag], 2102 getDITypeRefOrNull(Record[5 + HasTag]), 2103 Record[6 + HasTag], Flags, AlignInBits, Annotations)), 2104 NextMetadataNo); 2105 NextMetadataNo++; 2106 break; 2107 } 2108 case bitc::METADATA_LABEL: { 2109 if (Record.size() != 5) 2110 return error("Invalid record"); 2111 2112 IsDistinct = Record[0] & 1; 2113 MetadataList.assignValue( 2114 GET_OR_DISTINCT(DILabel, (Context, getMDOrNull(Record[1]), 2115 getMDString(Record[2]), 2116 getMDOrNull(Record[3]), Record[4])), 2117 NextMetadataNo); 2118 NextMetadataNo++; 2119 break; 2120 } 2121 case bitc::METADATA_EXPRESSION: { 2122 if (Record.size() < 1) 2123 return error("Invalid record"); 2124 2125 IsDistinct = Record[0] & 1; 2126 uint64_t Version = Record[0] >> 1; 2127 auto Elts = MutableArrayRef<uint64_t>(Record).slice(1); 2128 2129 SmallVector<uint64_t, 6> Buffer; 2130 if (Error Err = upgradeDIExpression(Version, Elts, Buffer)) 2131 return Err; 2132 2133 MetadataList.assignValue(GET_OR_DISTINCT(DIExpression, (Context, Elts)), 2134 NextMetadataNo); 2135 NextMetadataNo++; 2136 break; 2137 } 2138 case bitc::METADATA_GLOBAL_VAR_EXPR: { 2139 if (Record.size() != 3) 2140 return error("Invalid record"); 2141 2142 IsDistinct = Record[0]; 2143 Metadata *Expr = getMDOrNull(Record[2]); 2144 if (!Expr) 2145 Expr = DIExpression::get(Context, {}); 2146 MetadataList.assignValue( 2147 GET_OR_DISTINCT(DIGlobalVariableExpression, 2148 (Context, getMDOrNull(Record[1]), Expr)), 2149 NextMetadataNo); 2150 NextMetadataNo++; 2151 break; 2152 } 2153 case bitc::METADATA_OBJC_PROPERTY: { 2154 if (Record.size() != 8) 2155 return error("Invalid record"); 2156 2157 IsDistinct = Record[0]; 2158 MetadataList.assignValue( 2159 GET_OR_DISTINCT(DIObjCProperty, 2160 (Context, getMDString(Record[1]), 2161 getMDOrNull(Record[2]), Record[3], 2162 getMDString(Record[4]), getMDString(Record[5]), 2163 Record[6], getDITypeRefOrNull(Record[7]))), 2164 NextMetadataNo); 2165 NextMetadataNo++; 2166 break; 2167 } 2168 case bitc::METADATA_IMPORTED_ENTITY: { 2169 if (Record.size() < 6 || Record.size() > 8) 2170 return error("Invalid DIImportedEntity record"); 2171 2172 IsDistinct = Record[0]; 2173 bool HasFile = (Record.size() >= 7); 2174 bool HasElements = (Record.size() >= 8); 2175 MetadataList.assignValue( 2176 GET_OR_DISTINCT(DIImportedEntity, 2177 (Context, Record[1], getMDOrNull(Record[2]), 2178 getDITypeRefOrNull(Record[3]), 2179 HasFile ? getMDOrNull(Record[6]) : nullptr, 2180 HasFile ? Record[4] : 0, getMDString(Record[5]), 2181 HasElements ? getMDOrNull(Record[7]) : nullptr)), 2182 NextMetadataNo); 2183 NextMetadataNo++; 2184 break; 2185 } 2186 case bitc::METADATA_STRING_OLD: { 2187 std::string String(Record.begin(), Record.end()); 2188 2189 // Test for upgrading !llvm.loop. 2190 HasSeenOldLoopTags |= mayBeOldLoopAttachmentTag(String); 2191 ++NumMDStringLoaded; 2192 Metadata *MD = MDString::get(Context, String); 2193 MetadataList.assignValue(MD, NextMetadataNo); 2194 NextMetadataNo++; 2195 break; 2196 } 2197 case bitc::METADATA_STRINGS: { 2198 auto CreateNextMDString = [&](StringRef Str) { 2199 ++NumMDStringLoaded; 2200 MetadataList.assignValue(MDString::get(Context, Str), NextMetadataNo); 2201 NextMetadataNo++; 2202 }; 2203 if (Error Err = parseMetadataStrings(Record, Blob, CreateNextMDString)) 2204 return Err; 2205 break; 2206 } 2207 case bitc::METADATA_GLOBAL_DECL_ATTACHMENT: { 2208 if (Record.size() % 2 == 0) 2209 return error("Invalid record"); 2210 unsigned ValueID = Record[0]; 2211 if (ValueID >= ValueList.size()) 2212 return error("Invalid record"); 2213 if (auto *GO = dyn_cast<GlobalObject>(ValueList[ValueID])) 2214 if (Error Err = parseGlobalObjectAttachment( 2215 *GO, ArrayRef<uint64_t>(Record).slice(1))) 2216 return Err; 2217 break; 2218 } 2219 case bitc::METADATA_KIND: { 2220 // Support older bitcode files that had METADATA_KIND records in a 2221 // block with METADATA_BLOCK_ID. 2222 if (Error Err = parseMetadataKindRecord(Record)) 2223 return Err; 2224 break; 2225 } 2226 case bitc::METADATA_ARG_LIST: { 2227 SmallVector<ValueAsMetadata *, 4> Elts; 2228 Elts.reserve(Record.size()); 2229 for (uint64_t Elt : Record) { 2230 Metadata *MD = getMD(Elt); 2231 if (isa<MDNode>(MD) && cast<MDNode>(MD)->isTemporary()) 2232 return error( 2233 "Invalid record: DIArgList should not contain forward refs"); 2234 if (!isa<ValueAsMetadata>(MD)) 2235 return error("Invalid record"); 2236 Elts.push_back(cast<ValueAsMetadata>(MD)); 2237 } 2238 2239 MetadataList.assignValue(DIArgList::get(Context, Elts), NextMetadataNo); 2240 NextMetadataNo++; 2241 break; 2242 } 2243 } 2244 return Error::success(); 2245 #undef GET_OR_DISTINCT 2246 } 2247 2248 Error MetadataLoader::MetadataLoaderImpl::parseMetadataStrings( 2249 ArrayRef<uint64_t> Record, StringRef Blob, 2250 function_ref<void(StringRef)> CallBack) { 2251 // All the MDStrings in the block are emitted together in a single 2252 // record. The strings are concatenated and stored in a blob along with 2253 // their sizes. 2254 if (Record.size() != 2) 2255 return error("Invalid record: metadata strings layout"); 2256 2257 unsigned NumStrings = Record[0]; 2258 unsigned StringsOffset = Record[1]; 2259 if (!NumStrings) 2260 return error("Invalid record: metadata strings with no strings"); 2261 if (StringsOffset > Blob.size()) 2262 return error("Invalid record: metadata strings corrupt offset"); 2263 2264 StringRef Lengths = Blob.slice(0, StringsOffset); 2265 SimpleBitstreamCursor R(Lengths); 2266 2267 StringRef Strings = Blob.drop_front(StringsOffset); 2268 do { 2269 if (R.AtEndOfStream()) 2270 return error("Invalid record: metadata strings bad length"); 2271 2272 uint32_t Size; 2273 if (Error E = R.ReadVBR(6).moveInto(Size)) 2274 return E; 2275 if (Strings.size() < Size) 2276 return error("Invalid record: metadata strings truncated chars"); 2277 2278 CallBack(Strings.slice(0, Size)); 2279 Strings = Strings.drop_front(Size); 2280 } while (--NumStrings); 2281 2282 return Error::success(); 2283 } 2284 2285 Error MetadataLoader::MetadataLoaderImpl::parseGlobalObjectAttachment( 2286 GlobalObject &GO, ArrayRef<uint64_t> Record) { 2287 assert(Record.size() % 2 == 0); 2288 for (unsigned I = 0, E = Record.size(); I != E; I += 2) { 2289 auto K = MDKindMap.find(Record[I]); 2290 if (K == MDKindMap.end()) 2291 return error("Invalid ID"); 2292 MDNode *MD = 2293 dyn_cast_or_null<MDNode>(getMetadataFwdRefOrLoad(Record[I + 1])); 2294 if (!MD) 2295 return error("Invalid metadata attachment: expect fwd ref to MDNode"); 2296 GO.addMetadata(K->second, *MD); 2297 } 2298 return Error::success(); 2299 } 2300 2301 /// Parse metadata attachments. 2302 Error MetadataLoader::MetadataLoaderImpl::parseMetadataAttachment( 2303 Function &F, ArrayRef<Instruction *> InstructionList) { 2304 if (Error Err = Stream.EnterSubBlock(bitc::METADATA_ATTACHMENT_ID)) 2305 return Err; 2306 2307 SmallVector<uint64_t, 64> Record; 2308 PlaceholderQueue Placeholders; 2309 2310 while (true) { 2311 BitstreamEntry Entry; 2312 if (Error E = Stream.advanceSkippingSubblocks().moveInto(Entry)) 2313 return E; 2314 2315 switch (Entry.Kind) { 2316 case BitstreamEntry::SubBlock: // Handled for us already. 2317 case BitstreamEntry::Error: 2318 return error("Malformed block"); 2319 case BitstreamEntry::EndBlock: 2320 resolveForwardRefsAndPlaceholders(Placeholders); 2321 return Error::success(); 2322 case BitstreamEntry::Record: 2323 // The interesting case. 2324 break; 2325 } 2326 2327 // Read a metadata attachment record. 2328 Record.clear(); 2329 ++NumMDRecordLoaded; 2330 Expected<unsigned> MaybeRecord = Stream.readRecord(Entry.ID, Record); 2331 if (!MaybeRecord) 2332 return MaybeRecord.takeError(); 2333 switch (MaybeRecord.get()) { 2334 default: // Default behavior: ignore. 2335 break; 2336 case bitc::METADATA_ATTACHMENT: { 2337 unsigned RecordLength = Record.size(); 2338 if (Record.empty()) 2339 return error("Invalid record"); 2340 if (RecordLength % 2 == 0) { 2341 // A function attachment. 2342 if (Error Err = parseGlobalObjectAttachment(F, Record)) 2343 return Err; 2344 continue; 2345 } 2346 2347 // An instruction attachment. 2348 Instruction *Inst = InstructionList[Record[0]]; 2349 for (unsigned i = 1; i != RecordLength; i = i + 2) { 2350 unsigned Kind = Record[i]; 2351 DenseMap<unsigned, unsigned>::iterator I = MDKindMap.find(Kind); 2352 if (I == MDKindMap.end()) 2353 return error("Invalid ID"); 2354 if (I->second == LLVMContext::MD_tbaa && StripTBAA) 2355 continue; 2356 2357 auto Idx = Record[i + 1]; 2358 if (Idx < (MDStringRef.size() + GlobalMetadataBitPosIndex.size()) && 2359 !MetadataList.lookup(Idx)) { 2360 // Load the attachment if it is in the lazy-loadable range and hasn't 2361 // been loaded yet. 2362 lazyLoadOneMetadata(Idx, Placeholders); 2363 resolveForwardRefsAndPlaceholders(Placeholders); 2364 } 2365 2366 Metadata *Node = MetadataList.getMetadataFwdRef(Idx); 2367 if (isa<LocalAsMetadata>(Node)) 2368 // Drop the attachment. This used to be legal, but there's no 2369 // upgrade path. 2370 break; 2371 MDNode *MD = dyn_cast_or_null<MDNode>(Node); 2372 if (!MD) 2373 return error("Invalid metadata attachment"); 2374 2375 if (HasSeenOldLoopTags && I->second == LLVMContext::MD_loop) 2376 MD = upgradeInstructionLoopAttachment(*MD); 2377 2378 if (I->second == LLVMContext::MD_tbaa) { 2379 assert(!MD->isTemporary() && "should load MDs before attachments"); 2380 MD = UpgradeTBAANode(*MD); 2381 } 2382 Inst->setMetadata(I->second, MD); 2383 } 2384 break; 2385 } 2386 } 2387 } 2388 } 2389 2390 /// Parse a single METADATA_KIND record, inserting result in MDKindMap. 2391 Error MetadataLoader::MetadataLoaderImpl::parseMetadataKindRecord( 2392 SmallVectorImpl<uint64_t> &Record) { 2393 if (Record.size() < 2) 2394 return error("Invalid record"); 2395 2396 unsigned Kind = Record[0]; 2397 SmallString<8> Name(Record.begin() + 1, Record.end()); 2398 2399 unsigned NewKind = TheModule.getMDKindID(Name.str()); 2400 if (!MDKindMap.insert(std::make_pair(Kind, NewKind)).second) 2401 return error("Conflicting METADATA_KIND records"); 2402 return Error::success(); 2403 } 2404 2405 /// Parse the metadata kinds out of the METADATA_KIND_BLOCK. 2406 Error MetadataLoader::MetadataLoaderImpl::parseMetadataKinds() { 2407 if (Error Err = Stream.EnterSubBlock(bitc::METADATA_KIND_BLOCK_ID)) 2408 return Err; 2409 2410 SmallVector<uint64_t, 64> Record; 2411 2412 // Read all the records. 2413 while (true) { 2414 BitstreamEntry Entry; 2415 if (Error E = Stream.advanceSkippingSubblocks().moveInto(Entry)) 2416 return E; 2417 2418 switch (Entry.Kind) { 2419 case BitstreamEntry::SubBlock: // Handled for us already. 2420 case BitstreamEntry::Error: 2421 return error("Malformed block"); 2422 case BitstreamEntry::EndBlock: 2423 return Error::success(); 2424 case BitstreamEntry::Record: 2425 // The interesting case. 2426 break; 2427 } 2428 2429 // Read a record. 2430 Record.clear(); 2431 ++NumMDRecordLoaded; 2432 Expected<unsigned> MaybeCode = Stream.readRecord(Entry.ID, Record); 2433 if (!MaybeCode) 2434 return MaybeCode.takeError(); 2435 switch (MaybeCode.get()) { 2436 default: // Default behavior: ignore. 2437 break; 2438 case bitc::METADATA_KIND: { 2439 if (Error Err = parseMetadataKindRecord(Record)) 2440 return Err; 2441 break; 2442 } 2443 } 2444 } 2445 } 2446 2447 MetadataLoader &MetadataLoader::operator=(MetadataLoader &&RHS) { 2448 Pimpl = std::move(RHS.Pimpl); 2449 return *this; 2450 } 2451 MetadataLoader::MetadataLoader(MetadataLoader &&RHS) 2452 : Pimpl(std::move(RHS.Pimpl)) {} 2453 2454 MetadataLoader::~MetadataLoader() = default; 2455 MetadataLoader::MetadataLoader(BitstreamCursor &Stream, Module &TheModule, 2456 BitcodeReaderValueList &ValueList, 2457 bool IsImporting, 2458 MetadataLoaderCallbacks Callbacks) 2459 : Pimpl(std::make_unique<MetadataLoaderImpl>( 2460 Stream, TheModule, ValueList, std::move(Callbacks), IsImporting)) {} 2461 2462 Error MetadataLoader::parseMetadata(bool ModuleLevel) { 2463 return Pimpl->parseMetadata(ModuleLevel); 2464 } 2465 2466 bool MetadataLoader::hasFwdRefs() const { return Pimpl->hasFwdRefs(); } 2467 2468 /// Return the given metadata, creating a replaceable forward reference if 2469 /// necessary. 2470 Metadata *MetadataLoader::getMetadataFwdRefOrLoad(unsigned Idx) { 2471 return Pimpl->getMetadataFwdRefOrLoad(Idx); 2472 } 2473 2474 DISubprogram *MetadataLoader::lookupSubprogramForFunction(Function *F) { 2475 return Pimpl->lookupSubprogramForFunction(F); 2476 } 2477 2478 Error MetadataLoader::parseMetadataAttachment( 2479 Function &F, ArrayRef<Instruction *> InstructionList) { 2480 return Pimpl->parseMetadataAttachment(F, InstructionList); 2481 } 2482 2483 Error MetadataLoader::parseMetadataKinds() { 2484 return Pimpl->parseMetadataKinds(); 2485 } 2486 2487 void MetadataLoader::setStripTBAA(bool StripTBAA) { 2488 return Pimpl->setStripTBAA(StripTBAA); 2489 } 2490 2491 bool MetadataLoader::isStrippingTBAA() { return Pimpl->isStrippingTBAA(); } 2492 2493 unsigned MetadataLoader::size() const { return Pimpl->size(); } 2494 void MetadataLoader::shrinkTo(unsigned N) { return Pimpl->shrinkTo(N); } 2495 2496 void MetadataLoader::upgradeDebugIntrinsics(Function &F) { 2497 return Pimpl->upgradeDebugIntrinsics(F); 2498 } 2499