1 //===- InstrRefBasedImpl.h - Tracking Debug Value MIs ---------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 9 #ifndef LLVM_LIB_CODEGEN_LIVEDEBUGVALUES_INSTRREFBASEDLDV_H 10 #define LLVM_LIB_CODEGEN_LIVEDEBUGVALUES_INSTRREFBASEDLDV_H 11 12 #include "llvm/ADT/DenseMap.h" 13 #include "llvm/ADT/IndexedMap.h" 14 #include "llvm/ADT/SmallPtrSet.h" 15 #include "llvm/ADT/SmallVector.h" 16 #include "llvm/ADT/UniqueVector.h" 17 #include "llvm/CodeGen/LexicalScopes.h" 18 #include "llvm/CodeGen/MachineBasicBlock.h" 19 #include "llvm/CodeGen/MachineInstr.h" 20 #include "llvm/CodeGen/TargetRegisterInfo.h" 21 #include "llvm/IR/DebugInfoMetadata.h" 22 #include "llvm/Support/Compiler.h" 23 #include <optional> 24 25 #include "LiveDebugValues.h" 26 27 class TransferTracker; 28 29 // Forward dec of unit test class, so that we can peer into the LDV object. 30 class InstrRefLDVTest; 31 32 namespace LiveDebugValues { 33 34 class MLocTracker; 35 class DbgOpIDMap; 36 37 using namespace llvm; 38 39 using DebugVariableID = unsigned; 40 using VarAndLoc = std::pair<DebugVariable, const DILocation *>; 41 42 /// Mapping from DebugVariable to/from a unique identifying number. Each 43 /// DebugVariable consists of three pointers, and after a small amount of 44 /// work to identify overlapping fragments of variables we mostly only use 45 /// DebugVariables as identities of variables. It's much more compile-time 46 /// efficient to use an ID number instead, which this class provides. 47 class DebugVariableMap { 48 DenseMap<DebugVariable, unsigned> VarToIdx; 49 SmallVector<VarAndLoc> IdxToVar; 50 51 public: 52 DebugVariableID getDVID(const DebugVariable &Var) const { 53 auto It = VarToIdx.find(Var); 54 assert(It != VarToIdx.end()); 55 return It->second; 56 } 57 58 DebugVariableID insertDVID(DebugVariable &Var, const DILocation *Loc) { 59 unsigned Size = VarToIdx.size(); 60 auto ItPair = VarToIdx.insert({Var, Size}); 61 if (ItPair.second) { 62 IdxToVar.push_back({Var, Loc}); 63 return Size; 64 } 65 66 return ItPair.first->second; 67 } 68 69 const VarAndLoc &lookupDVID(DebugVariableID ID) const { return IdxToVar[ID]; } 70 71 void clear() { 72 VarToIdx.clear(); 73 IdxToVar.clear(); 74 } 75 }; 76 77 /// Handle-class for a particular "location". This value-type uniquely 78 /// symbolises a register or stack location, allowing manipulation of locations 79 /// without concern for where that location is. Practically, this allows us to 80 /// treat the state of the machine at a particular point as an array of values, 81 /// rather than a map of values. 82 class LocIdx { 83 unsigned Location; 84 85 // Default constructor is private, initializing to an illegal location number. 86 // Use only for "not an entry" elements in IndexedMaps. 87 LocIdx() : Location(UINT_MAX) {} 88 89 public: 90 #define NUM_LOC_BITS 24 91 LocIdx(unsigned L) : Location(L) { 92 assert(L < (1 << NUM_LOC_BITS) && "Machine locations must fit in 24 bits"); 93 } 94 95 static LocIdx MakeIllegalLoc() { return LocIdx(); } 96 static LocIdx MakeTombstoneLoc() { 97 LocIdx L = LocIdx(); 98 --L.Location; 99 return L; 100 } 101 102 bool isIllegal() const { return Location == UINT_MAX; } 103 104 uint64_t asU64() const { return Location; } 105 106 bool operator==(unsigned L) const { return Location == L; } 107 108 bool operator==(const LocIdx &L) const { return Location == L.Location; } 109 110 bool operator!=(unsigned L) const { return !(*this == L); } 111 112 bool operator!=(const LocIdx &L) const { return !(*this == L); } 113 114 bool operator<(const LocIdx &Other) const { 115 return Location < Other.Location; 116 } 117 }; 118 119 // The location at which a spilled value resides. It consists of a register and 120 // an offset. 121 struct SpillLoc { 122 unsigned SpillBase; 123 StackOffset SpillOffset; 124 bool operator==(const SpillLoc &Other) const { 125 return std::make_pair(SpillBase, SpillOffset) == 126 std::make_pair(Other.SpillBase, Other.SpillOffset); 127 } 128 bool operator<(const SpillLoc &Other) const { 129 return std::make_tuple(SpillBase, SpillOffset.getFixed(), 130 SpillOffset.getScalable()) < 131 std::make_tuple(Other.SpillBase, Other.SpillOffset.getFixed(), 132 Other.SpillOffset.getScalable()); 133 } 134 }; 135 136 /// Unique identifier for a value defined by an instruction, as a value type. 137 /// Casts back and forth to a uint64_t. Probably replacable with something less 138 /// bit-constrained. Each value identifies the instruction and machine location 139 /// where the value is defined, although there may be no corresponding machine 140 /// operand for it (ex: regmasks clobbering values). The instructions are 141 /// one-based, and definitions that are PHIs have instruction number zero. 142 /// 143 /// The obvious limits of a 1M block function or 1M instruction blocks are 144 /// problematic; but by that point we should probably have bailed out of 145 /// trying to analyse the function. 146 class ValueIDNum { 147 union { 148 struct { 149 uint64_t BlockNo : 20; /// The block where the def happens. 150 uint64_t InstNo : 20; /// The Instruction where the def happens. 151 /// One based, is distance from start of block. 152 uint64_t LocNo 153 : NUM_LOC_BITS; /// The machine location where the def happens. 154 } s; 155 uint64_t Value; 156 } u; 157 158 static_assert(sizeof(u) == 8, "Badly packed ValueIDNum?"); 159 160 public: 161 // Default-initialize to EmptyValue. This is necessary to make IndexedMaps 162 // of values to work. 163 ValueIDNum() { u.Value = EmptyValue.asU64(); } 164 165 ValueIDNum(uint64_t Block, uint64_t Inst, uint64_t Loc) { 166 u.s = {Block, Inst, Loc}; 167 } 168 169 ValueIDNum(uint64_t Block, uint64_t Inst, LocIdx Loc) { 170 u.s = {Block, Inst, Loc.asU64()}; 171 } 172 173 uint64_t getBlock() const { return u.s.BlockNo; } 174 uint64_t getInst() const { return u.s.InstNo; } 175 uint64_t getLoc() const { return u.s.LocNo; } 176 bool isPHI() const { return u.s.InstNo == 0; } 177 178 uint64_t asU64() const { return u.Value; } 179 180 static ValueIDNum fromU64(uint64_t v) { 181 ValueIDNum Val; 182 Val.u.Value = v; 183 return Val; 184 } 185 186 bool operator<(const ValueIDNum &Other) const { 187 return asU64() < Other.asU64(); 188 } 189 190 bool operator==(const ValueIDNum &Other) const { 191 return u.Value == Other.u.Value; 192 } 193 194 bool operator!=(const ValueIDNum &Other) const { return !(*this == Other); } 195 196 std::string asString(const std::string &mlocname) const { 197 return Twine("Value{bb: ") 198 .concat(Twine(u.s.BlockNo) 199 .concat(Twine(", inst: ") 200 .concat((u.s.InstNo ? Twine(u.s.InstNo) 201 : Twine("live-in")) 202 .concat(Twine(", loc: ").concat( 203 Twine(mlocname))) 204 .concat(Twine("}"))))) 205 .str(); 206 } 207 208 LLVM_ABI_FOR_TEST static ValueIDNum EmptyValue; 209 LLVM_ABI_FOR_TEST static ValueIDNum TombstoneValue; 210 }; 211 212 } // End namespace LiveDebugValues 213 214 namespace llvm { 215 using namespace LiveDebugValues; 216 217 template <> struct DenseMapInfo<LocIdx> { 218 static inline LocIdx getEmptyKey() { return LocIdx::MakeIllegalLoc(); } 219 static inline LocIdx getTombstoneKey() { return LocIdx::MakeTombstoneLoc(); } 220 221 static unsigned getHashValue(const LocIdx &Loc) { return Loc.asU64(); } 222 223 static bool isEqual(const LocIdx &A, const LocIdx &B) { return A == B; } 224 }; 225 226 template <> struct DenseMapInfo<ValueIDNum> { 227 static inline ValueIDNum getEmptyKey() { return ValueIDNum::EmptyValue; } 228 static inline ValueIDNum getTombstoneKey() { 229 return ValueIDNum::TombstoneValue; 230 } 231 232 static unsigned getHashValue(const ValueIDNum &Val) { 233 return hash_value(Val.asU64()); 234 } 235 236 static bool isEqual(const ValueIDNum &A, const ValueIDNum &B) { 237 return A == B; 238 } 239 }; 240 241 } // end namespace llvm 242 243 namespace LiveDebugValues { 244 using namespace llvm; 245 246 /// Type for a table of values in a block. 247 using ValueTable = SmallVector<ValueIDNum, 0>; 248 249 /// A collection of ValueTables, one per BB in a function, with convenient 250 /// accessor methods. 251 struct FuncValueTable { 252 FuncValueTable(int NumBBs, int NumLocs) { 253 Storage.reserve(NumBBs); 254 for (int i = 0; i != NumBBs; ++i) 255 Storage.push_back( 256 std::make_unique<ValueTable>(NumLocs, ValueIDNum::EmptyValue)); 257 } 258 259 /// Returns the ValueTable associated with MBB. 260 ValueTable &operator[](const MachineBasicBlock &MBB) const { 261 return (*this)[MBB.getNumber()]; 262 } 263 264 /// Returns the ValueTable associated with the MachineBasicBlock whose number 265 /// is MBBNum. 266 ValueTable &operator[](int MBBNum) const { 267 auto &TablePtr = Storage[MBBNum]; 268 assert(TablePtr && "Trying to access a deleted table"); 269 return *TablePtr; 270 } 271 272 /// Returns the ValueTable associated with the entry MachineBasicBlock. 273 ValueTable &tableForEntryMBB() const { return (*this)[0]; } 274 275 /// Returns true if the ValueTable associated with MBB has not been freed. 276 bool hasTableFor(MachineBasicBlock &MBB) const { 277 return Storage[MBB.getNumber()] != nullptr; 278 } 279 280 /// Frees the memory of the ValueTable associated with MBB. 281 void ejectTableForBlock(const MachineBasicBlock &MBB) { 282 Storage[MBB.getNumber()].reset(); 283 } 284 285 private: 286 /// ValueTables are stored as unique_ptrs to allow for deallocation during 287 /// LDV; this was measured to have a significant impact on compiler memory 288 /// usage. 289 SmallVector<std::unique_ptr<ValueTable>, 0> Storage; 290 }; 291 292 /// Thin wrapper around an integer -- designed to give more type safety to 293 /// spill location numbers. 294 class SpillLocationNo { 295 public: 296 explicit SpillLocationNo(unsigned SpillNo) : SpillNo(SpillNo) {} 297 unsigned SpillNo; 298 unsigned id() const { return SpillNo; } 299 300 bool operator<(const SpillLocationNo &Other) const { 301 return SpillNo < Other.SpillNo; 302 } 303 304 bool operator==(const SpillLocationNo &Other) const { 305 return SpillNo == Other.SpillNo; 306 } 307 bool operator!=(const SpillLocationNo &Other) const { 308 return !(*this == Other); 309 } 310 }; 311 312 /// Meta qualifiers for a value. Pair of whatever expression is used to qualify 313 /// the value, and Boolean of whether or not it's indirect. 314 class DbgValueProperties { 315 public: 316 DbgValueProperties(const DIExpression *DIExpr, bool Indirect, bool IsVariadic) 317 : DIExpr(DIExpr), Indirect(Indirect), IsVariadic(IsVariadic) {} 318 319 /// Extract properties from an existing DBG_VALUE instruction. 320 DbgValueProperties(const MachineInstr &MI) { 321 assert(MI.isDebugValue()); 322 assert(MI.getDebugExpression()->getNumLocationOperands() == 0 || 323 MI.isDebugValueList() || MI.isUndefDebugValue()); 324 IsVariadic = MI.isDebugValueList(); 325 DIExpr = MI.getDebugExpression(); 326 Indirect = MI.isDebugOffsetImm(); 327 } 328 329 bool isJoinable(const DbgValueProperties &Other) const { 330 return DIExpression::isEqualExpression(DIExpr, Indirect, Other.DIExpr, 331 Other.Indirect); 332 } 333 334 bool operator==(const DbgValueProperties &Other) const { 335 return std::tie(DIExpr, Indirect, IsVariadic) == 336 std::tie(Other.DIExpr, Other.Indirect, Other.IsVariadic); 337 } 338 339 bool operator!=(const DbgValueProperties &Other) const { 340 return !(*this == Other); 341 } 342 343 unsigned getLocationOpCount() const { 344 return IsVariadic ? DIExpr->getNumLocationOperands() : 1; 345 } 346 347 const DIExpression *DIExpr; 348 bool Indirect; 349 bool IsVariadic; 350 }; 351 352 /// TODO: Might pack better if we changed this to a Struct of Arrays, since 353 /// MachineOperand is width 32, making this struct width 33. We could also 354 /// potentially avoid storing the whole MachineOperand (sizeof=32), instead 355 /// choosing to store just the contents portion (sizeof=8) and a Kind enum, 356 /// since we already know it is some type of immediate value. 357 /// Stores a single debug operand, which can either be a MachineOperand for 358 /// directly storing immediate values, or a ValueIDNum representing some value 359 /// computed at some point in the program. IsConst is used as a discriminator. 360 struct DbgOp { 361 union { 362 ValueIDNum ID; 363 MachineOperand MO; 364 }; 365 bool IsConst; 366 367 DbgOp() : ID(ValueIDNum::EmptyValue), IsConst(false) {} 368 DbgOp(ValueIDNum ID) : ID(ID), IsConst(false) {} 369 DbgOp(MachineOperand MO) : MO(MO), IsConst(true) {} 370 371 bool isUndef() const { return !IsConst && ID == ValueIDNum::EmptyValue; } 372 373 #ifndef NDEBUG 374 void dump(const MLocTracker *MTrack) const; 375 #endif 376 }; 377 378 /// A DbgOp whose ID (if any) has resolved to an actual location, LocIdx. Used 379 /// when working with concrete debug values, i.e. when joining MLocs and VLocs 380 /// in the TransferTracker or emitting DBG_VALUE/DBG_VALUE_LIST instructions in 381 /// the MLocTracker. 382 struct ResolvedDbgOp { 383 union { 384 LocIdx Loc; 385 MachineOperand MO; 386 }; 387 bool IsConst; 388 389 ResolvedDbgOp(LocIdx Loc) : Loc(Loc), IsConst(false) {} 390 ResolvedDbgOp(MachineOperand MO) : MO(MO), IsConst(true) {} 391 392 bool operator==(const ResolvedDbgOp &Other) const { 393 if (IsConst != Other.IsConst) 394 return false; 395 if (IsConst) 396 return MO.isIdenticalTo(Other.MO); 397 return Loc == Other.Loc; 398 } 399 400 #ifndef NDEBUG 401 void dump(const MLocTracker *MTrack) const; 402 #endif 403 }; 404 405 /// An ID used in the DbgOpIDMap (below) to lookup a stored DbgOp. This is used 406 /// in place of actual DbgOps inside of a DbgValue to reduce its size, as 407 /// DbgValue is very frequently used and passed around, and the actual DbgOp is 408 /// over 8x larger than this class, due to storing a MachineOperand. This ID 409 /// should be equal for all equal DbgOps, and also encodes whether the mapped 410 /// DbgOp is a constant, meaning that for simple equality or const-ness checks 411 /// it is not necessary to lookup this ID. 412 struct DbgOpID { 413 struct IsConstIndexPair { 414 uint32_t IsConst : 1; 415 uint32_t Index : 31; 416 }; 417 418 union { 419 struct IsConstIndexPair ID; 420 uint32_t RawID; 421 }; 422 423 DbgOpID() : RawID(UndefID.RawID) { 424 static_assert(sizeof(DbgOpID) == 4, "DbgOpID should fit within 4 bytes."); 425 } 426 DbgOpID(uint32_t RawID) : RawID(RawID) {} 427 DbgOpID(bool IsConst, uint32_t Index) : ID({IsConst, Index}) {} 428 429 LLVM_ABI_FOR_TEST static DbgOpID UndefID; 430 431 bool operator==(const DbgOpID &Other) const { return RawID == Other.RawID; } 432 bool operator!=(const DbgOpID &Other) const { return !(*this == Other); } 433 434 uint32_t asU32() const { return RawID; } 435 436 bool isUndef() const { return *this == UndefID; } 437 bool isConst() const { return ID.IsConst && !isUndef(); } 438 uint32_t getIndex() const { return ID.Index; } 439 440 #ifndef NDEBUG 441 void dump(const MLocTracker *MTrack, const DbgOpIDMap *OpStore) const; 442 #endif 443 }; 444 445 /// Class storing the complete set of values that are observed by DbgValues 446 /// within the current function. Allows 2-way lookup, with `find` returning the 447 /// Op for a given ID and `insert` returning the ID for a given Op (creating one 448 /// if none exists). 449 class DbgOpIDMap { 450 451 SmallVector<ValueIDNum, 0> ValueOps; 452 SmallVector<MachineOperand, 0> ConstOps; 453 454 DenseMap<ValueIDNum, DbgOpID> ValueOpToID; 455 DenseMap<MachineOperand, DbgOpID> ConstOpToID; 456 457 public: 458 /// If \p Op does not already exist in this map, it is inserted and the 459 /// corresponding DbgOpID is returned. If Op already exists in this map, then 460 /// no change is made and the existing ID for Op is returned. 461 /// Calling this with the undef DbgOp will always return DbgOpID::UndefID. 462 DbgOpID insert(DbgOp Op) { 463 if (Op.isUndef()) 464 return DbgOpID::UndefID; 465 if (Op.IsConst) 466 return insertConstOp(Op.MO); 467 return insertValueOp(Op.ID); 468 } 469 /// Returns the DbgOp associated with \p ID. Should only be used for IDs 470 /// returned from calling `insert` from this map or DbgOpID::UndefID. 471 DbgOp find(DbgOpID ID) const { 472 if (ID == DbgOpID::UndefID) 473 return DbgOp(); 474 if (ID.isConst()) 475 return DbgOp(ConstOps[ID.getIndex()]); 476 return DbgOp(ValueOps[ID.getIndex()]); 477 } 478 479 void clear() { 480 ValueOps.clear(); 481 ConstOps.clear(); 482 ValueOpToID.clear(); 483 ConstOpToID.clear(); 484 } 485 486 private: 487 DbgOpID insertConstOp(MachineOperand &MO) { 488 auto [It, Inserted] = ConstOpToID.try_emplace(MO, true, ConstOps.size()); 489 if (Inserted) 490 ConstOps.push_back(MO); 491 return It->second; 492 } 493 DbgOpID insertValueOp(ValueIDNum VID) { 494 auto [It, Inserted] = ValueOpToID.try_emplace(VID, false, ValueOps.size()); 495 if (Inserted) 496 ValueOps.push_back(VID); 497 return It->second; 498 } 499 }; 500 501 // We set the maximum number of operands that we will handle to keep DbgValue 502 // within a reasonable size (64 bytes), as we store and pass a lot of them 503 // around. 504 #define MAX_DBG_OPS 8 505 506 /// Class recording the (high level) _value_ of a variable. Identifies the value 507 /// of the variable as a list of ValueIDNums and constant MachineOperands, or as 508 /// an empty list for undef debug values or VPHI values which we have not found 509 /// valid locations for. 510 /// This class also stores meta-information about how the value is qualified. 511 /// Used to reason about variable values when performing the second 512 /// (DebugVariable specific) dataflow analysis. 513 class DbgValue { 514 private: 515 /// If Kind is Def or VPHI, the set of IDs corresponding to the DbgOps that 516 /// are used. VPHIs set every ID to EmptyID when we have not found a valid 517 /// machine-value for every operand, and sets them to the corresponding 518 /// machine-values when we have found all of them. 519 DbgOpID DbgOps[MAX_DBG_OPS]; 520 unsigned OpCount; 521 522 public: 523 /// For a NoVal or VPHI DbgValue, which block it was generated in. 524 int BlockNo; 525 526 /// Qualifiers for the ValueIDNum above. 527 DbgValueProperties Properties; 528 529 typedef enum { 530 Undef, // Represents a DBG_VALUE $noreg in the transfer function only. 531 Def, // This value is defined by some combination of constants, 532 // instructions, or PHI values. 533 VPHI, // Incoming values to BlockNo differ, those values must be joined by 534 // a PHI in this block. 535 NoVal, // Empty DbgValue indicating an unknown value. Used as initializer, 536 // before dominating blocks values are propagated in. 537 } KindT; 538 /// Discriminator for whether this is a constant or an in-program value. 539 KindT Kind; 540 541 DbgValue(ArrayRef<DbgOpID> DbgOps, const DbgValueProperties &Prop) 542 : OpCount(DbgOps.size()), BlockNo(0), Properties(Prop), Kind(Def) { 543 static_assert(sizeof(DbgValue) <= 64, 544 "DbgValue should fit within 64 bytes."); 545 assert(DbgOps.size() == Prop.getLocationOpCount()); 546 if (DbgOps.size() > MAX_DBG_OPS || 547 any_of(DbgOps, [](DbgOpID ID) { return ID.isUndef(); })) { 548 Kind = Undef; 549 OpCount = 0; 550 #define DEBUG_TYPE "LiveDebugValues" 551 if (DbgOps.size() > MAX_DBG_OPS) { 552 LLVM_DEBUG(dbgs() << "Found DbgValue with more than maximum allowed " 553 "operands.\n"); 554 } 555 #undef DEBUG_TYPE 556 } else { 557 for (unsigned Idx = 0; Idx < DbgOps.size(); ++Idx) 558 this->DbgOps[Idx] = DbgOps[Idx]; 559 } 560 } 561 562 DbgValue(unsigned BlockNo, const DbgValueProperties &Prop, KindT Kind) 563 : OpCount(0), BlockNo(BlockNo), Properties(Prop), Kind(Kind) { 564 assert(Kind == NoVal || Kind == VPHI); 565 } 566 567 DbgValue(const DbgValueProperties &Prop, KindT Kind) 568 : OpCount(0), BlockNo(0), Properties(Prop), Kind(Kind) { 569 assert(Kind == Undef && 570 "Empty DbgValue constructor must pass in Undef kind"); 571 } 572 573 #ifndef NDEBUG 574 void dump(const MLocTracker *MTrack = nullptr, 575 const DbgOpIDMap *OpStore = nullptr) const; 576 #endif 577 578 bool operator==(const DbgValue &Other) const { 579 if (std::tie(Kind, Properties) != std::tie(Other.Kind, Other.Properties)) 580 return false; 581 else if (Kind == Def && !equal(getDbgOpIDs(), Other.getDbgOpIDs())) 582 return false; 583 else if (Kind == NoVal && BlockNo != Other.BlockNo) 584 return false; 585 else if (Kind == VPHI && BlockNo != Other.BlockNo) 586 return false; 587 else if (Kind == VPHI && !equal(getDbgOpIDs(), Other.getDbgOpIDs())) 588 return false; 589 590 return true; 591 } 592 593 bool operator!=(const DbgValue &Other) const { return !(*this == Other); } 594 595 // Returns an array of all the machine values used to calculate this variable 596 // value, or an empty list for an Undef or unjoined VPHI. 597 ArrayRef<DbgOpID> getDbgOpIDs() const { return {DbgOps, OpCount}; } 598 599 // Returns either DbgOps[Index] if this DbgValue has Debug Operands, or 600 // the ID for ValueIDNum::EmptyValue otherwise (i.e. if this is an Undef, 601 // NoVal, or an unjoined VPHI). 602 DbgOpID getDbgOpID(unsigned Index) const { 603 if (!OpCount) 604 return DbgOpID::UndefID; 605 assert(Index < OpCount); 606 return DbgOps[Index]; 607 } 608 // Replaces this DbgValue's existing DbgOpIDs (if any) with the contents of 609 // \p NewIDs. The number of DbgOpIDs passed must be equal to the number of 610 // arguments expected by this DbgValue's properties (the return value of 611 // `getLocationOpCount()`). 612 void setDbgOpIDs(ArrayRef<DbgOpID> NewIDs) { 613 // We can go from no ops to some ops, but not from some ops to no ops. 614 assert(NewIDs.size() == getLocationOpCount() && 615 "Incorrect number of Debug Operands for this DbgValue."); 616 OpCount = NewIDs.size(); 617 for (unsigned Idx = 0; Idx < NewIDs.size(); ++Idx) 618 DbgOps[Idx] = NewIDs[Idx]; 619 } 620 621 // The number of debug operands expected by this DbgValue's expression. 622 // getDbgOpIDs() should return an array of this length, unless this is an 623 // Undef or an unjoined VPHI. 624 unsigned getLocationOpCount() const { 625 return Properties.getLocationOpCount(); 626 } 627 628 // Returns true if this or Other are unjoined PHIs, which do not have defined 629 // Loc Ops, or if the `n`th Loc Op for this has a different constness to the 630 // `n`th Loc Op for Other. 631 bool hasJoinableLocOps(const DbgValue &Other) const { 632 if (isUnjoinedPHI() || Other.isUnjoinedPHI()) 633 return true; 634 for (unsigned Idx = 0; Idx < getLocationOpCount(); ++Idx) { 635 if (getDbgOpID(Idx).isConst() != Other.getDbgOpID(Idx).isConst()) 636 return false; 637 } 638 return true; 639 } 640 641 bool isUnjoinedPHI() const { return Kind == VPHI && OpCount == 0; } 642 643 bool hasIdenticalValidLocOps(const DbgValue &Other) const { 644 if (!OpCount) 645 return false; 646 return equal(getDbgOpIDs(), Other.getDbgOpIDs()); 647 } 648 }; 649 650 class LocIdxToIndexFunctor { 651 public: 652 using argument_type = LocIdx; 653 unsigned operator()(const LocIdx &L) const { return L.asU64(); } 654 }; 655 656 /// Tracker for what values are in machine locations. Listens to the Things 657 /// being Done by various instructions, and maintains a table of what machine 658 /// locations have what values (as defined by a ValueIDNum). 659 /// 660 /// There are potentially a much larger number of machine locations on the 661 /// target machine than the actual working-set size of the function. On x86 for 662 /// example, we're extremely unlikely to want to track values through control 663 /// or debug registers. To avoid doing so, MLocTracker has several layers of 664 /// indirection going on, described below, to avoid unnecessarily tracking 665 /// any location. 666 /// 667 /// Here's a sort of diagram of the indexes, read from the bottom up: 668 /// 669 /// Size on stack Offset on stack 670 /// \ / 671 /// Stack Idx (Where in slot is this?) 672 /// / 673 /// / 674 /// Slot Num (%stack.0) / 675 /// FrameIdx => SpillNum / 676 /// \ / 677 /// SpillID (int) Register number (int) 678 /// \ / 679 /// LocationID => LocIdx 680 /// | 681 /// LocIdx => ValueIDNum 682 /// 683 /// The aim here is that the LocIdx => ValueIDNum vector is just an array of 684 /// values in numbered locations, so that later analyses can ignore whether the 685 /// location is a register or otherwise. To map a register / spill location to 686 /// a LocIdx, you have to use the (sparse) LocationID => LocIdx map. And to 687 /// build a LocationID for a stack slot, you need to combine identifiers for 688 /// which stack slot it is and where within that slot is being described. 689 /// 690 /// Register mask operands cause trouble by technically defining every register; 691 /// various hacks are used to avoid tracking registers that are never read and 692 /// only written by regmasks. 693 class MLocTracker { 694 public: 695 MachineFunction &MF; 696 const TargetInstrInfo &TII; 697 const TargetRegisterInfo &TRI; 698 const TargetLowering &TLI; 699 700 /// IndexedMap type, mapping from LocIdx to ValueIDNum. 701 using LocToValueType = IndexedMap<ValueIDNum, LocIdxToIndexFunctor>; 702 703 /// Map of LocIdxes to the ValueIDNums that they store. This is tightly 704 /// packed, entries only exist for locations that are being tracked. 705 LocToValueType LocIdxToIDNum; 706 707 /// "Map" of machine location IDs (i.e., raw register or spill number) to the 708 /// LocIdx key / number for that location. There are always at least as many 709 /// as the number of registers on the target -- if the value in the register 710 /// is not being tracked, then the LocIdx value will be zero. New entries are 711 /// appended if a new spill slot begins being tracked. 712 /// This, and the corresponding reverse map persist for the analysis of the 713 /// whole function, and is necessarying for decoding various vectors of 714 /// values. 715 std::vector<LocIdx> LocIDToLocIdx; 716 717 /// Inverse map of LocIDToLocIdx. 718 IndexedMap<unsigned, LocIdxToIndexFunctor> LocIdxToLocID; 719 720 /// When clobbering register masks, we chose to not believe the machine model 721 /// and don't clobber SP. Do the same for SP aliases, and for efficiency, 722 /// keep a set of them here. 723 SmallSet<Register, 8> SPAliases; 724 725 /// Unique-ification of spill. Used to number them -- their LocID number is 726 /// the index in SpillLocs minus one plus NumRegs. 727 UniqueVector<SpillLoc> SpillLocs; 728 729 // If we discover a new machine location, assign it an mphi with this 730 // block number. 731 unsigned CurBB = -1; 732 733 /// Cached local copy of the number of registers the target has. 734 unsigned NumRegs; 735 736 /// Number of slot indexes the target has -- distinct segments of a stack 737 /// slot that can take on the value of a subregister, when a super-register 738 /// is written to the stack. 739 unsigned NumSlotIdxes; 740 741 /// Collection of register mask operands that have been observed. Second part 742 /// of pair indicates the instruction that they happened in. Used to 743 /// reconstruct where defs happened if we start tracking a location later 744 /// on. 745 SmallVector<std::pair<const MachineOperand *, unsigned>, 32> Masks; 746 747 /// Pair for describing a position within a stack slot -- first the size in 748 /// bits, then the offset. 749 typedef std::pair<unsigned short, unsigned short> StackSlotPos; 750 751 /// Map from a size/offset pair describing a position in a stack slot, to a 752 /// numeric identifier for that position. Allows easier identification of 753 /// individual positions. 754 DenseMap<StackSlotPos, unsigned> StackSlotIdxes; 755 756 /// Inverse of StackSlotIdxes. 757 DenseMap<unsigned, StackSlotPos> StackIdxesToPos; 758 759 /// Iterator for locations and the values they contain. Dereferencing 760 /// produces a struct/pair containing the LocIdx key for this location, 761 /// and a reference to the value currently stored. Simplifies the process 762 /// of seeking a particular location. 763 class MLocIterator { 764 LocToValueType &ValueMap; 765 LocIdx Idx; 766 767 public: 768 class value_type { 769 public: 770 value_type(LocIdx Idx, ValueIDNum &Value) : Idx(Idx), Value(Value) {} 771 const LocIdx Idx; /// Read-only index of this location. 772 ValueIDNum &Value; /// Reference to the stored value at this location. 773 }; 774 775 MLocIterator(LocToValueType &ValueMap, LocIdx Idx) 776 : ValueMap(ValueMap), Idx(Idx) {} 777 778 bool operator==(const MLocIterator &Other) const { 779 assert(&ValueMap == &Other.ValueMap); 780 return Idx == Other.Idx; 781 } 782 783 bool operator!=(const MLocIterator &Other) const { 784 return !(*this == Other); 785 } 786 787 void operator++() { Idx = LocIdx(Idx.asU64() + 1); } 788 789 value_type operator*() { return value_type(Idx, ValueMap[LocIdx(Idx)]); } 790 }; 791 792 LLVM_ABI_FOR_TEST MLocTracker(MachineFunction &MF, const TargetInstrInfo &TII, 793 const TargetRegisterInfo &TRI, 794 const TargetLowering &TLI); 795 796 /// Produce location ID number for a Register. Provides some small amount of 797 /// type safety. 798 /// \param Reg The register we're looking up. 799 unsigned getLocID(Register Reg) { return Reg.id(); } 800 801 /// Produce location ID number for a spill position. 802 /// \param Spill The number of the spill we're fetching the location for. 803 /// \param SpillSubReg Subregister within the spill we're addressing. 804 unsigned getLocID(SpillLocationNo Spill, unsigned SpillSubReg) { 805 unsigned short Size = TRI.getSubRegIdxSize(SpillSubReg); 806 unsigned short Offs = TRI.getSubRegIdxOffset(SpillSubReg); 807 return getLocID(Spill, {Size, Offs}); 808 } 809 810 /// Produce location ID number for a spill position. 811 /// \param Spill The number of the spill we're fetching the location for. 812 /// \apram SpillIdx size/offset within the spill slot to be addressed. 813 unsigned getLocID(SpillLocationNo Spill, StackSlotPos Idx) { 814 unsigned SlotNo = Spill.id() - 1; 815 SlotNo *= NumSlotIdxes; 816 assert(StackSlotIdxes.contains(Idx)); 817 SlotNo += StackSlotIdxes[Idx]; 818 SlotNo += NumRegs; 819 return SlotNo; 820 } 821 822 /// Given a spill number, and a slot within the spill, calculate the ID number 823 /// for that location. 824 unsigned getSpillIDWithIdx(SpillLocationNo Spill, unsigned Idx) { 825 unsigned SlotNo = Spill.id() - 1; 826 SlotNo *= NumSlotIdxes; 827 SlotNo += Idx; 828 SlotNo += NumRegs; 829 return SlotNo; 830 } 831 832 /// Return the spill number that a location ID corresponds to. 833 SpillLocationNo locIDToSpill(unsigned ID) const { 834 assert(ID >= NumRegs); 835 ID -= NumRegs; 836 // Truncate away the index part, leaving only the spill number. 837 ID /= NumSlotIdxes; 838 return SpillLocationNo(ID + 1); // The UniqueVector is one-based. 839 } 840 841 /// Returns the spill-slot size/offs that a location ID corresponds to. 842 StackSlotPos locIDToSpillIdx(unsigned ID) const { 843 assert(ID >= NumRegs); 844 ID -= NumRegs; 845 unsigned Idx = ID % NumSlotIdxes; 846 return StackIdxesToPos.find(Idx)->second; 847 } 848 849 unsigned getNumLocs() const { return LocIdxToIDNum.size(); } 850 851 /// Reset all locations to contain a PHI value at the designated block. Used 852 /// sometimes for actual PHI values, othertimes to indicate the block entry 853 /// value (before any more information is known). 854 void setMPhis(unsigned NewCurBB) { 855 CurBB = NewCurBB; 856 for (auto Location : locations()) 857 Location.Value = {CurBB, 0, Location.Idx}; 858 } 859 860 /// Load values for each location from array of ValueIDNums. Take current 861 /// bbnum just in case we read a value from a hitherto untouched register. 862 void loadFromArray(ValueTable &Locs, unsigned NewCurBB) { 863 CurBB = NewCurBB; 864 // Iterate over all tracked locations, and load each locations live-in 865 // value into our local index. 866 for (auto Location : locations()) 867 Location.Value = Locs[Location.Idx.asU64()]; 868 } 869 870 /// Wipe any un-necessary location records after traversing a block. 871 void reset() { 872 // We could reset all the location values too; however either loadFromArray 873 // or setMPhis should be called before this object is re-used. Just 874 // clear Masks, they're definitely not needed. 875 Masks.clear(); 876 } 877 878 /// Clear all data. Destroys the LocID <=> LocIdx map, which makes most of 879 /// the information in this pass uninterpretable. 880 void clear() { 881 reset(); 882 LocIDToLocIdx.clear(); 883 LocIdxToLocID.clear(); 884 LocIdxToIDNum.clear(); 885 // SpillLocs.reset(); XXX UniqueVector::reset assumes a SpillLoc casts from 886 // 0 887 SpillLocs = decltype(SpillLocs)(); 888 StackSlotIdxes.clear(); 889 StackIdxesToPos.clear(); 890 891 LocIDToLocIdx.resize(NumRegs, LocIdx::MakeIllegalLoc()); 892 } 893 894 /// Set a locaiton to a certain value. 895 void setMLoc(LocIdx L, ValueIDNum Num) { 896 assert(L.asU64() < LocIdxToIDNum.size()); 897 LocIdxToIDNum[L] = Num; 898 } 899 900 /// Read the value of a particular location 901 ValueIDNum readMLoc(LocIdx L) { 902 assert(L.asU64() < LocIdxToIDNum.size()); 903 return LocIdxToIDNum[L]; 904 } 905 906 /// Create a LocIdx for an untracked register ID. Initialize it to either an 907 /// mphi value representing a live-in, or a recent register mask clobber. 908 LLVM_ABI_FOR_TEST LocIdx trackRegister(unsigned ID); 909 910 LocIdx lookupOrTrackRegister(unsigned ID) { 911 LocIdx &Index = LocIDToLocIdx[ID]; 912 if (Index.isIllegal()) 913 Index = trackRegister(ID); 914 return Index; 915 } 916 917 /// Is register R currently tracked by MLocTracker? 918 bool isRegisterTracked(Register R) { 919 LocIdx &Index = LocIDToLocIdx[R]; 920 return !Index.isIllegal(); 921 } 922 923 /// Record a definition of the specified register at the given block / inst. 924 /// This doesn't take a ValueIDNum, because the definition and its location 925 /// are synonymous. 926 void defReg(Register R, unsigned BB, unsigned Inst) { 927 unsigned ID = getLocID(R); 928 LocIdx Idx = lookupOrTrackRegister(ID); 929 ValueIDNum ValueID = {BB, Inst, Idx}; 930 LocIdxToIDNum[Idx] = ValueID; 931 } 932 933 /// Set a register to a value number. To be used if the value number is 934 /// known in advance. 935 void setReg(Register R, ValueIDNum ValueID) { 936 unsigned ID = getLocID(R); 937 LocIdx Idx = lookupOrTrackRegister(ID); 938 LocIdxToIDNum[Idx] = ValueID; 939 } 940 941 ValueIDNum readReg(Register R) { 942 unsigned ID = getLocID(R); 943 LocIdx Idx = lookupOrTrackRegister(ID); 944 return LocIdxToIDNum[Idx]; 945 } 946 947 /// Reset a register value to zero / empty. Needed to replicate the 948 /// VarLoc implementation where a copy to/from a register effectively 949 /// clears the contents of the source register. (Values can only have one 950 /// machine location in VarLocBasedImpl). 951 void wipeRegister(Register R) { 952 unsigned ID = getLocID(R); 953 LocIdx Idx = LocIDToLocIdx[ID]; 954 LocIdxToIDNum[Idx] = ValueIDNum::EmptyValue; 955 } 956 957 /// Determine the LocIdx of an existing register. 958 LocIdx getRegMLoc(Register R) { 959 unsigned ID = getLocID(R); 960 assert(ID < LocIDToLocIdx.size()); 961 assert(LocIDToLocIdx[ID] != UINT_MAX); // Sentinel for IndexedMap. 962 return LocIDToLocIdx[ID]; 963 } 964 965 /// Record a RegMask operand being executed. Defs any register we currently 966 /// track, stores a pointer to the mask in case we have to account for it 967 /// later. 968 void writeRegMask(const MachineOperand *MO, unsigned CurBB, unsigned InstID); 969 970 /// Find LocIdx for SpillLoc \p L, creating a new one if it's not tracked. 971 /// Returns std::nullopt when in scenarios where a spill slot could be 972 /// tracked, but we would likely run into resource limitations. 973 LLVM_ABI_FOR_TEST std::optional<SpillLocationNo> 974 getOrTrackSpillLoc(SpillLoc L); 975 976 // Get LocIdx of a spill ID. 977 LocIdx getSpillMLoc(unsigned SpillID) { 978 assert(LocIDToLocIdx[SpillID] != UINT_MAX); // Sentinel for IndexedMap. 979 return LocIDToLocIdx[SpillID]; 980 } 981 982 /// Return true if Idx is a spill machine location. 983 bool isSpill(LocIdx Idx) const { return LocIdxToLocID[Idx] >= NumRegs; } 984 985 /// How large is this location (aka, how wide is a value defined there?). 986 unsigned getLocSizeInBits(LocIdx L) const { 987 unsigned ID = LocIdxToLocID[L]; 988 if (!isSpill(L)) { 989 return TRI.getRegSizeInBits(Register(ID), MF.getRegInfo()); 990 } else { 991 // The slot location on the stack is uninteresting, we care about the 992 // position of the value within the slot (which comes with a size). 993 StackSlotPos Pos = locIDToSpillIdx(ID); 994 return Pos.first; 995 } 996 } 997 998 MLocIterator begin() { return MLocIterator(LocIdxToIDNum, 0); } 999 1000 MLocIterator end() { 1001 return MLocIterator(LocIdxToIDNum, LocIdxToIDNum.size()); 1002 } 1003 1004 /// Return a range over all locations currently tracked. 1005 iterator_range<MLocIterator> locations() { 1006 return llvm::make_range(begin(), end()); 1007 } 1008 1009 std::string LocIdxToName(LocIdx Idx) const; 1010 1011 std::string IDAsString(const ValueIDNum &Num) const; 1012 1013 #ifndef NDEBUG 1014 LLVM_DUMP_METHOD void dump(); 1015 1016 LLVM_DUMP_METHOD void dump_mloc_map(); 1017 #endif 1018 1019 /// Create a DBG_VALUE based on debug operands \p DbgOps. Qualify it with the 1020 /// information in \pProperties, for variable Var. Don't insert it anywhere, 1021 /// just return the builder for it. 1022 MachineInstrBuilder emitLoc(const SmallVectorImpl<ResolvedDbgOp> &DbgOps, 1023 const DebugVariable &Var, const DILocation *DILoc, 1024 const DbgValueProperties &Properties); 1025 }; 1026 1027 /// Types for recording sets of variable fragments that overlap. For a given 1028 /// local variable, we record all other fragments of that variable that could 1029 /// overlap it, to reduce search time. 1030 using FragmentOfVar = 1031 std::pair<const DILocalVariable *, DIExpression::FragmentInfo>; 1032 using OverlapMap = 1033 DenseMap<FragmentOfVar, SmallVector<DIExpression::FragmentInfo, 1>>; 1034 1035 /// Collection of DBG_VALUEs observed when traversing a block. Records each 1036 /// variable and the value the DBG_VALUE refers to. Requires the machine value 1037 /// location dataflow algorithm to have run already, so that values can be 1038 /// identified. 1039 class VLocTracker { 1040 public: 1041 /// Ref to function-wide map of DebugVariable <=> ID-numbers. 1042 DebugVariableMap &DVMap; 1043 /// Map DebugVariable to the latest Value it's defined to have. 1044 /// Needs to be a MapVector because we determine order-in-the-input-MIR from 1045 /// the order in this container. (FIXME: likely no longer true as the ordering 1046 /// is now provided by DebugVariableMap). 1047 /// We only retain the last DbgValue in each block for each variable, to 1048 /// determine the blocks live-out variable value. The Vars container forms the 1049 /// transfer function for this block, as part of the dataflow analysis. The 1050 /// movement of values between locations inside of a block is handled at a 1051 /// much later stage, in the TransferTracker class. 1052 SmallMapVector<DebugVariableID, DbgValue, 8> Vars; 1053 SmallDenseMap<DebugVariableID, const DILocation *, 8> Scopes; 1054 MachineBasicBlock *MBB = nullptr; 1055 const OverlapMap &OverlappingFragments; 1056 DbgValueProperties EmptyProperties; 1057 1058 public: 1059 VLocTracker(DebugVariableMap &DVMap, const OverlapMap &O, 1060 const DIExpression *EmptyExpr) 1061 : DVMap(DVMap), OverlappingFragments(O), 1062 EmptyProperties(EmptyExpr, false, false) {} 1063 1064 void defVar(const MachineInstr &MI, const DbgValueProperties &Properties, 1065 const SmallVectorImpl<DbgOpID> &DebugOps) { 1066 assert(MI.isDebugValueLike()); 1067 DebugVariable Var(MI.getDebugVariable(), MI.getDebugExpression(), 1068 MI.getDebugLoc()->getInlinedAt()); 1069 // Either insert or fetch an ID number for this variable. 1070 DebugVariableID VarID = DVMap.insertDVID(Var, MI.getDebugLoc().get()); 1071 DbgValue Rec = (DebugOps.size() > 0) 1072 ? DbgValue(DebugOps, Properties) 1073 : DbgValue(Properties, DbgValue::Undef); 1074 1075 // Attempt insertion; overwrite if it's already mapped. 1076 Vars.insert_or_assign(VarID, Rec); 1077 Scopes[VarID] = MI.getDebugLoc().get(); 1078 1079 considerOverlaps(Var, MI.getDebugLoc().get()); 1080 } 1081 1082 void considerOverlaps(const DebugVariable &Var, const DILocation *Loc) { 1083 auto Overlaps = OverlappingFragments.find( 1084 {Var.getVariable(), Var.getFragmentOrDefault()}); 1085 if (Overlaps == OverlappingFragments.end()) 1086 return; 1087 1088 // Otherwise: terminate any overlapped variable locations. 1089 for (auto FragmentInfo : Overlaps->second) { 1090 // The "empty" fragment is stored as DebugVariable::DefaultFragment, so 1091 // that it overlaps with everything, however its cannonical representation 1092 // in a DebugVariable is as "None". 1093 std::optional<DIExpression::FragmentInfo> OptFragmentInfo = FragmentInfo; 1094 if (DebugVariable::isDefaultFragment(FragmentInfo)) 1095 OptFragmentInfo = std::nullopt; 1096 1097 DebugVariable Overlapped(Var.getVariable(), OptFragmentInfo, 1098 Var.getInlinedAt()); 1099 // Produce an ID number for this overlapping fragment of a variable. 1100 DebugVariableID OverlappedID = DVMap.insertDVID(Overlapped, Loc); 1101 DbgValue Rec = DbgValue(EmptyProperties, DbgValue::Undef); 1102 1103 // Attempt insertion; overwrite if it's already mapped. 1104 Vars.insert_or_assign(OverlappedID, Rec); 1105 Scopes[OverlappedID] = Loc; 1106 } 1107 } 1108 1109 void clear() { 1110 Vars.clear(); 1111 Scopes.clear(); 1112 } 1113 }; 1114 1115 // XXX XXX docs 1116 class InstrRefBasedLDV : public LDVImpl { 1117 public: 1118 friend class ::InstrRefLDVTest; 1119 1120 using FragmentInfo = DIExpression::FragmentInfo; 1121 using OptFragmentInfo = std::optional<DIExpression::FragmentInfo>; 1122 1123 // Helper while building OverlapMap, a map of all fragments seen for a given 1124 // DILocalVariable. 1125 using VarToFragments = 1126 DenseMap<const DILocalVariable *, SmallSet<FragmentInfo, 4>>; 1127 1128 /// Machine location/value transfer function, a mapping of which locations 1129 /// are assigned which new values. 1130 using MLocTransferMap = SmallDenseMap<LocIdx, ValueIDNum>; 1131 1132 /// Live in/out structure for the variable values: a per-block map of 1133 /// variables to their values. 1134 using LiveIdxT = SmallDenseMap<const MachineBasicBlock *, DbgValue *, 16>; 1135 1136 using VarAndLoc = std::pair<DebugVariableID, DbgValue>; 1137 1138 /// Type for a live-in value: the predecessor block, and its value. 1139 using InValueT = std::pair<MachineBasicBlock *, DbgValue *>; 1140 1141 /// Vector (per block) of a collection (inner smallvector) of live-ins. 1142 /// Used as the result type for the variable value dataflow problem. 1143 using LiveInsT = SmallVector<SmallVector<VarAndLoc, 8>, 8>; 1144 1145 /// Mapping from lexical scopes to a DILocation in that scope. 1146 using ScopeToDILocT = DenseMap<const LexicalScope *, const DILocation *>; 1147 1148 /// Mapping from lexical scopes to variables in that scope. 1149 using ScopeToVarsT = 1150 DenseMap<const LexicalScope *, SmallSet<DebugVariableID, 4>>; 1151 1152 /// Mapping from lexical scopes to blocks where variables in that scope are 1153 /// assigned. Such blocks aren't necessarily "in" the lexical scope, it's 1154 /// just a block where an assignment happens. 1155 using ScopeToAssignBlocksT = DenseMap<const LexicalScope *, SmallPtrSet<MachineBasicBlock *, 4>>; 1156 1157 private: 1158 MachineDominatorTree *DomTree; 1159 const TargetRegisterInfo *TRI; 1160 const MachineRegisterInfo *MRI; 1161 const TargetInstrInfo *TII; 1162 const TargetFrameLowering *TFI; 1163 const MachineFrameInfo *MFI; 1164 BitVector CalleeSavedRegs; 1165 LexicalScopes LS; 1166 1167 // An empty DIExpression. Used default / placeholder DbgValueProperties 1168 // objects, as we can't have null expressions. 1169 const DIExpression *EmptyExpr; 1170 1171 /// Object to track machine locations as we step through a block. Could 1172 /// probably be a field rather than a pointer, as it's always used. 1173 MLocTracker *MTracker = nullptr; 1174 1175 /// Number of the current block LiveDebugValues is stepping through. 1176 unsigned CurBB = -1; 1177 1178 /// Number of the current instruction LiveDebugValues is evaluating. 1179 unsigned CurInst; 1180 1181 /// Variable tracker -- listens to DBG_VALUEs occurring as InstrRefBasedImpl 1182 /// steps through a block. Reads the values at each location from the 1183 /// MLocTracker object. 1184 VLocTracker *VTracker = nullptr; 1185 1186 /// Tracker for transfers, listens to DBG_VALUEs and transfers of values 1187 /// between locations during stepping, creates new DBG_VALUEs when values move 1188 /// location. 1189 TransferTracker *TTracker = nullptr; 1190 1191 /// Blocks which are artificial, i.e. blocks which exclusively contain 1192 /// instructions without DebugLocs, or with line 0 locations. 1193 SmallPtrSet<MachineBasicBlock *, 16> ArtificialBlocks; 1194 1195 // Mapping of blocks to and from their RPOT order. 1196 SmallVector<MachineBasicBlock *> OrderToBB; 1197 DenseMap<const MachineBasicBlock *, unsigned int> BBToOrder; 1198 DenseMap<unsigned, unsigned> BBNumToRPO; 1199 1200 /// Pair of MachineInstr, and its 1-based offset into the containing block. 1201 using InstAndNum = std::pair<const MachineInstr *, unsigned>; 1202 /// Map from debug instruction number to the MachineInstr labelled with that 1203 /// number, and its location within the function. Used to transform 1204 /// instruction numbers in DBG_INSTR_REFs into machine value numbers. 1205 std::map<uint64_t, InstAndNum> DebugInstrNumToInstr; 1206 1207 /// Record of where we observed a DBG_PHI instruction. 1208 class DebugPHIRecord { 1209 public: 1210 /// Instruction number of this DBG_PHI. 1211 uint64_t InstrNum; 1212 /// Block where DBG_PHI occurred. 1213 MachineBasicBlock *MBB; 1214 /// The value number read by the DBG_PHI -- or std::nullopt if it didn't 1215 /// refer to a value. 1216 std::optional<ValueIDNum> ValueRead; 1217 /// Register/Stack location the DBG_PHI reads -- or std::nullopt if it 1218 /// referred to something unexpected. 1219 std::optional<LocIdx> ReadLoc; 1220 1221 operator unsigned() const { return InstrNum; } 1222 }; 1223 1224 /// Map from instruction numbers defined by DBG_PHIs to a record of what that 1225 /// DBG_PHI read and where. Populated and edited during the machine value 1226 /// location problem -- we use LLVMs SSA Updater to fix changes by 1227 /// optimizations that destroy PHI instructions. 1228 SmallVector<DebugPHIRecord, 32> DebugPHINumToValue; 1229 1230 // Map of overlapping variable fragments. 1231 OverlapMap OverlapFragments; 1232 VarToFragments SeenFragments; 1233 1234 /// Mapping of DBG_INSTR_REF instructions to their values, for those 1235 /// DBG_INSTR_REFs that call resolveDbgPHIs. These variable references solve 1236 /// a mini SSA problem caused by DBG_PHIs being cloned, this collection caches 1237 /// the result. 1238 DenseMap<std::pair<MachineInstr *, unsigned>, std::optional<ValueIDNum>> 1239 SeenDbgPHIs; 1240 1241 DbgOpIDMap DbgOpStore; 1242 1243 /// Mapping between DebugVariables and unique ID numbers. This is a more 1244 /// efficient way to represent the identity of a variable, versus a plain 1245 /// DebugVariable. 1246 DebugVariableMap DVMap; 1247 1248 /// True if we need to examine call instructions for stack clobbers. We 1249 /// normally assume that they don't clobber SP, but stack probes on Windows 1250 /// do. 1251 bool AdjustsStackInCalls = false; 1252 1253 /// If AdjustsStackInCalls is true, this holds the name of the target's stack 1254 /// probe function, which is the function we expect will alter the stack 1255 /// pointer. 1256 StringRef StackProbeSymbolName; 1257 1258 /// Tests whether this instruction is a spill to a stack slot. 1259 std::optional<SpillLocationNo> isSpillInstruction(const MachineInstr &MI, 1260 MachineFunction *MF); 1261 1262 /// Decide if @MI is a spill instruction and return true if it is. We use 2 1263 /// criteria to make this decision: 1264 /// - Is this instruction a store to a spill slot? 1265 /// - Is there a register operand that is both used and killed? 1266 /// TODO: Store optimization can fold spills into other stores (including 1267 /// other spills). We do not handle this yet (more than one memory operand). 1268 bool isLocationSpill(const MachineInstr &MI, MachineFunction *MF, 1269 unsigned &Reg); 1270 1271 /// If a given instruction is identified as a spill, return the spill slot 1272 /// and set \p Reg to the spilled register. 1273 std::optional<SpillLocationNo> isRestoreInstruction(const MachineInstr &MI, 1274 MachineFunction *MF, 1275 unsigned &Reg); 1276 1277 /// Given a spill instruction, extract the spill slot information, ensure it's 1278 /// tracked, and return the spill number. 1279 std::optional<SpillLocationNo> 1280 extractSpillBaseRegAndOffset(const MachineInstr &MI); 1281 1282 /// For an instruction reference given by \p InstNo and \p OpNo in instruction 1283 /// \p MI returns the Value pointed to by that instruction reference if any 1284 /// exists, otherwise returns std::nullopt. 1285 std::optional<ValueIDNum> getValueForInstrRef(unsigned InstNo, unsigned OpNo, 1286 MachineInstr &MI, 1287 const FuncValueTable *MLiveOuts, 1288 const FuncValueTable *MLiveIns); 1289 1290 /// Observe a single instruction while stepping through a block. 1291 void process(MachineInstr &MI, const FuncValueTable *MLiveOuts, 1292 const FuncValueTable *MLiveIns); 1293 1294 /// Examines whether \p MI is a DBG_VALUE and notifies trackers. 1295 /// \returns true if MI was recognized and processed. 1296 bool transferDebugValue(const MachineInstr &MI); 1297 1298 /// Examines whether \p MI is a DBG_INSTR_REF and notifies trackers. 1299 /// \returns true if MI was recognized and processed. 1300 bool transferDebugInstrRef(MachineInstr &MI, const FuncValueTable *MLiveOuts, 1301 const FuncValueTable *MLiveIns); 1302 1303 /// Stores value-information about where this PHI occurred, and what 1304 /// instruction number is associated with it. 1305 /// \returns true if MI was recognized and processed. 1306 bool transferDebugPHI(MachineInstr &MI); 1307 1308 /// Examines whether \p MI is copy instruction, and notifies trackers. 1309 /// \returns true if MI was recognized and processed. 1310 bool transferRegisterCopy(MachineInstr &MI); 1311 1312 /// Examines whether \p MI is stack spill or restore instruction, and 1313 /// notifies trackers. \returns true if MI was recognized and processed. 1314 bool transferSpillOrRestoreInst(MachineInstr &MI); 1315 1316 /// Examines \p MI for any registers that it defines, and notifies trackers. 1317 void transferRegisterDef(MachineInstr &MI); 1318 1319 /// Copy one location to the other, accounting for movement of subregisters 1320 /// too. 1321 void performCopy(Register Src, Register Dst); 1322 1323 void accumulateFragmentMap(MachineInstr &MI); 1324 1325 /// Determine the machine value number referred to by (potentially several) 1326 /// DBG_PHI instructions. Block duplication and tail folding can duplicate 1327 /// DBG_PHIs, shifting the position where values in registers merge, and 1328 /// forming another mini-ssa problem to solve. 1329 /// \p Here the position of a DBG_INSTR_REF seeking a machine value number 1330 /// \p InstrNum Debug instruction number defined by DBG_PHI instructions. 1331 /// \returns The machine value number at position Here, or std::nullopt. 1332 std::optional<ValueIDNum> resolveDbgPHIs(MachineFunction &MF, 1333 const FuncValueTable &MLiveOuts, 1334 const FuncValueTable &MLiveIns, 1335 MachineInstr &Here, 1336 uint64_t InstrNum); 1337 1338 std::optional<ValueIDNum> resolveDbgPHIsImpl(MachineFunction &MF, 1339 const FuncValueTable &MLiveOuts, 1340 const FuncValueTable &MLiveIns, 1341 MachineInstr &Here, 1342 uint64_t InstrNum); 1343 1344 /// Step through the function, recording register definitions and movements 1345 /// in an MLocTracker. Convert the observations into a per-block transfer 1346 /// function in \p MLocTransfer, suitable for using with the machine value 1347 /// location dataflow problem. 1348 LLVM_ABI_FOR_TEST void 1349 produceMLocTransferFunction(MachineFunction &MF, 1350 SmallVectorImpl<MLocTransferMap> &MLocTransfer, 1351 unsigned MaxNumBlocks); 1352 1353 /// Solve the machine value location dataflow problem. Takes as input the 1354 /// transfer functions in \p MLocTransfer. Writes the output live-in and 1355 /// live-out arrays to the (initialized to zero) multidimensional arrays in 1356 /// \p MInLocs and \p MOutLocs. The outer dimension is indexed by block 1357 /// number, the inner by LocIdx. 1358 LLVM_ABI_FOR_TEST void 1359 buildMLocValueMap(MachineFunction &MF, FuncValueTable &MInLocs, 1360 FuncValueTable &MOutLocs, 1361 SmallVectorImpl<MLocTransferMap> &MLocTransfer); 1362 1363 /// Examine the stack indexes (i.e. offsets within the stack) to find the 1364 /// basic units of interference -- like reg units, but for the stack. 1365 void findStackIndexInterference(SmallVectorImpl<unsigned> &Slots); 1366 1367 /// Install PHI values into the live-in array for each block, according to 1368 /// the IDF of each register. 1369 LLVM_ABI_FOR_TEST void placeMLocPHIs( 1370 MachineFunction &MF, SmallPtrSetImpl<MachineBasicBlock *> &AllBlocks, 1371 FuncValueTable &MInLocs, SmallVectorImpl<MLocTransferMap> &MLocTransfer); 1372 1373 /// Propagate variable values to blocks in the common case where there's 1374 /// only one value assigned to the variable. This function has better 1375 /// performance as it doesn't have to find the dominance frontier between 1376 /// different assignments. 1377 void placePHIsForSingleVarDefinition( 1378 const SmallPtrSetImpl<MachineBasicBlock *> &InScopeBlocks, 1379 MachineBasicBlock *MBB, SmallVectorImpl<VLocTracker> &AllTheVLocs, 1380 DebugVariableID Var, LiveInsT &Output); 1381 1382 /// Calculate the iterated-dominance-frontier for a set of defs, using the 1383 /// existing LLVM facilities for this. Works for a single "value" or 1384 /// machine/variable location. 1385 /// \p AllBlocks Set of blocks where we might consume the value. 1386 /// \p DefBlocks Set of blocks where the value/location is defined. 1387 /// \p PHIBlocks Output set of blocks where PHIs must be placed. 1388 void BlockPHIPlacement(const SmallPtrSetImpl<MachineBasicBlock *> &AllBlocks, 1389 const SmallPtrSetImpl<MachineBasicBlock *> &DefBlocks, 1390 SmallVectorImpl<MachineBasicBlock *> &PHIBlocks); 1391 1392 /// Perform a control flow join (lattice value meet) of the values in machine 1393 /// locations at \p MBB. Follows the algorithm described in the file-comment, 1394 /// reading live-outs of predecessors from \p OutLocs, the current live ins 1395 /// from \p InLocs, and assigning the newly computed live ins back into 1396 /// \p InLocs. \returns two bools -- the first indicates whether a change 1397 /// was made, the second whether a lattice downgrade occurred. If the latter 1398 /// is true, revisiting this block is necessary. 1399 bool mlocJoin(MachineBasicBlock &MBB, 1400 SmallPtrSet<const MachineBasicBlock *, 16> &Visited, 1401 FuncValueTable &OutLocs, ValueTable &InLocs); 1402 1403 /// Produce a set of blocks that are in the current lexical scope. This means 1404 /// those blocks that contain instructions "in" the scope, blocks where 1405 /// assignments to variables in scope occur, and artificial blocks that are 1406 /// successors to any of the earlier blocks. See https://llvm.org/PR48091 for 1407 /// more commentry on what "in scope" means. 1408 /// \p DILoc A location in the scope that we're fetching blocks for. 1409 /// \p Output Set to put in-scope-blocks into. 1410 /// \p AssignBlocks Blocks known to contain assignments of variables in scope. 1411 void 1412 getBlocksForScope(const DILocation *DILoc, 1413 SmallPtrSetImpl<const MachineBasicBlock *> &Output, 1414 const SmallPtrSetImpl<MachineBasicBlock *> &AssignBlocks); 1415 1416 /// Solve the variable value dataflow problem, for a single lexical scope. 1417 /// Uses the algorithm from the file comment to resolve control flow joins 1418 /// using PHI placement and value propagation. Reads the locations of machine 1419 /// values from the \p MInLocs and \p MOutLocs arrays (see buildMLocValueMap) 1420 /// and reads the variable values transfer function from \p AllTheVlocs. 1421 /// Live-in and Live-out variable values are stored locally, with the live-ins 1422 /// permanently stored to \p Output once a fixedpoint is reached. 1423 /// \p VarsWeCareAbout contains a collection of the variables in \p Scope 1424 /// that we should be tracking. 1425 /// \p AssignBlocks contains the set of blocks that aren't in \p DILoc's 1426 /// scope, but which do contain DBG_VALUEs, which VarLocBasedImpl tracks 1427 /// locations through. 1428 LLVM_ABI_FOR_TEST void 1429 buildVLocValueMap(const DILocation *DILoc, 1430 const SmallSet<DebugVariableID, 4> &VarsWeCareAbout, 1431 SmallPtrSetImpl<MachineBasicBlock *> &AssignBlocks, 1432 LiveInsT &Output, FuncValueTable &MOutLocs, 1433 FuncValueTable &MInLocs, 1434 SmallVectorImpl<VLocTracker> &AllTheVLocs); 1435 1436 /// Attempt to eliminate un-necessary PHIs on entry to a block. Examines the 1437 /// live-in values coming from predecessors live-outs, and replaces any PHIs 1438 /// already present in this blocks live-ins with a live-through value if the 1439 /// PHI isn't needed. 1440 /// \p LiveIn Old live-in value, overwritten with new one if live-in changes. 1441 /// \returns true if any live-ins change value, either from value propagation 1442 /// or PHI elimination. 1443 LLVM_ABI_FOR_TEST bool 1444 vlocJoin(MachineBasicBlock &MBB, LiveIdxT &VLOCOutLocs, 1445 SmallPtrSet<const MachineBasicBlock *, 8> &BlocksToExplore, 1446 DbgValue &LiveIn); 1447 1448 /// For the given block and live-outs feeding into it, try to find 1449 /// machine locations for each debug operand where all the values feeding 1450 /// into that operand join together. 1451 /// \returns true if a joined location was found for every value that needed 1452 /// to be joined. 1453 LLVM_ABI_FOR_TEST bool 1454 pickVPHILoc(SmallVectorImpl<DbgOpID> &OutValues, const MachineBasicBlock &MBB, 1455 const LiveIdxT &LiveOuts, FuncValueTable &MOutLocs, 1456 const SmallVectorImpl<const MachineBasicBlock *> &BlockOrders); 1457 1458 std::optional<ValueIDNum> pickOperandPHILoc( 1459 unsigned DbgOpIdx, const MachineBasicBlock &MBB, const LiveIdxT &LiveOuts, 1460 FuncValueTable &MOutLocs, 1461 const SmallVectorImpl<const MachineBasicBlock *> &BlockOrders); 1462 1463 /// Take collections of DBG_VALUE instructions stored in TTracker, and 1464 /// install them into their output blocks. 1465 bool emitTransfers(); 1466 1467 /// Boilerplate computation of some initial sets, artifical blocks and 1468 /// RPOT block ordering. 1469 LLVM_ABI_FOR_TEST void initialSetup(MachineFunction &MF); 1470 1471 /// Produce a map of the last lexical scope that uses a block, using the 1472 /// scopes DFSOut number. Mapping is block-number to DFSOut. 1473 /// \p EjectionMap Pre-allocated vector in which to install the built ma. 1474 /// \p ScopeToDILocation Mapping of LexicalScopes to their DILocations. 1475 /// \p AssignBlocks Map of blocks where assignments happen for a scope. 1476 void makeDepthFirstEjectionMap(SmallVectorImpl<unsigned> &EjectionMap, 1477 const ScopeToDILocT &ScopeToDILocation, 1478 ScopeToAssignBlocksT &AssignBlocks); 1479 1480 /// When determining per-block variable values and emitting to DBG_VALUEs, 1481 /// this function explores by lexical scope depth. Doing so means that per 1482 /// block information can be fully computed before exploration finishes, 1483 /// allowing us to emit it and free data structures earlier than otherwise. 1484 /// It's also good for locality. 1485 bool depthFirstVLocAndEmit( 1486 unsigned MaxNumBlocks, const ScopeToDILocT &ScopeToDILocation, 1487 const ScopeToVarsT &ScopeToVars, ScopeToAssignBlocksT &ScopeToBlocks, 1488 LiveInsT &Output, FuncValueTable &MOutLocs, FuncValueTable &MInLocs, 1489 SmallVectorImpl<VLocTracker> &AllTheVLocs, MachineFunction &MF, 1490 bool ShouldEmitDebugEntryValues); 1491 1492 bool ExtendRanges(MachineFunction &MF, MachineDominatorTree *DomTree, 1493 bool ShouldEmitDebugEntryValues, unsigned InputBBLimit, 1494 unsigned InputDbgValLimit) override; 1495 1496 public: 1497 /// Default construct and initialize the pass. 1498 LLVM_ABI_FOR_TEST InstrRefBasedLDV(); 1499 1500 LLVM_DUMP_METHOD 1501 void dump_mloc_transfer(const MLocTransferMap &mloc_transfer) const; 1502 1503 bool isCalleeSaved(LocIdx L) const; 1504 bool isCalleeSavedReg(Register R) const; 1505 1506 bool hasFoldedStackStore(const MachineInstr &MI) { 1507 // Instruction must have a memory operand that's a stack slot, and isn't 1508 // aliased, meaning it's a spill from regalloc instead of a variable. 1509 // If it's aliased, we can't guarantee its value. 1510 if (!MI.hasOneMemOperand()) 1511 return false; 1512 auto *MemOperand = *MI.memoperands_begin(); 1513 return MemOperand->isStore() && 1514 MemOperand->getPseudoValue() && 1515 MemOperand->getPseudoValue()->kind() == PseudoSourceValue::FixedStack 1516 && !MemOperand->getPseudoValue()->isAliased(MFI); 1517 } 1518 1519 std::optional<LocIdx> findLocationForMemOperand(const MachineInstr &MI); 1520 1521 // Utility for unit testing, don't use directly. 1522 DebugVariableMap &getDVMap() { 1523 return DVMap; 1524 } 1525 }; 1526 1527 } // namespace LiveDebugValues 1528 1529 #endif /* LLVM_LIB_CODEGEN_LIVEDEBUGVALUES_INSTRREFBASEDLDV_H */ 1530