1 //==- RegAllocGreedy.h ------- greedy register allocator ----------*-C++-*-==// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // This file defines the RAGreedy function pass for register allocation in 9 // optimized builds. 10 //===----------------------------------------------------------------------===// 11 12 #ifndef LLVM_CODEGEN_REGALLOCGREEDY_H_ 13 #define LLVM_CODEGEN_REGALLOCGREEDY_H_ 14 15 #include "InterferenceCache.h" 16 #include "RegAllocBase.h" 17 #include "RegAllocEvictionAdvisor.h" 18 #include "SpillPlacement.h" 19 #include "SplitKit.h" 20 #include "llvm/ADT/ArrayRef.h" 21 #include "llvm/ADT/BitVector.h" 22 #include "llvm/ADT/DenseMap.h" 23 #include "llvm/ADT/IndexedMap.h" 24 #include "llvm/ADT/SetVector.h" 25 #include "llvm/ADT/SmallPtrSet.h" 26 #include "llvm/ADT/SmallVector.h" 27 #include "llvm/ADT/StringRef.h" 28 #include "llvm/CodeGen/CalcSpillWeights.h" 29 #include "llvm/CodeGen/LiveInterval.h" 30 #include "llvm/CodeGen/LiveRangeEdit.h" 31 #include "llvm/CodeGen/MachineFunction.h" 32 #include "llvm/CodeGen/MachineFunctionPass.h" 33 #include "llvm/CodeGen/RegisterClassInfo.h" 34 #include "llvm/CodeGen/Spiller.h" 35 #include "llvm/CodeGen/TargetRegisterInfo.h" 36 #include <algorithm> 37 #include <cstdint> 38 #include <memory> 39 #include <queue> 40 #include <utility> 41 42 namespace llvm { 43 class AllocationOrder; 44 class AnalysisUsage; 45 class EdgeBundles; 46 class LiveDebugVariables; 47 class LiveIntervals; 48 class LiveRegMatrix; 49 class MachineBasicBlock; 50 class MachineBlockFrequencyInfo; 51 class MachineDominatorTree; 52 class MachineLoop; 53 class MachineLoopInfo; 54 class MachineOptimizationRemarkEmitter; 55 class MachineOptimizationRemarkMissed; 56 class SlotIndexes; 57 class TargetInstrInfo; 58 class VirtRegMap; 59 60 class LLVM_LIBRARY_VISIBILITY RAGreedy : public MachineFunctionPass, 61 public RegAllocBase, 62 private LiveRangeEdit::Delegate { 63 // Interface to eviction advisers 64 public: 65 /// Track allocation stage and eviction loop prevention during allocation. 66 class ExtraRegInfo final { 67 // RegInfo - Keep additional information about each live range. 68 struct RegInfo { 69 LiveRangeStage Stage = RS_New; 70 71 // Cascade - Eviction loop prevention. See 72 // canEvictInterferenceBasedOnCost(). 73 unsigned Cascade = 0; 74 75 RegInfo() = default; 76 }; 77 78 IndexedMap<RegInfo, VirtReg2IndexFunctor> Info; 79 unsigned NextCascade = 1; 80 81 public: 82 ExtraRegInfo() = default; 83 ExtraRegInfo(const ExtraRegInfo &) = delete; 84 85 LiveRangeStage getStage(Register Reg) const { return Info[Reg].Stage; } 86 87 LiveRangeStage getStage(const LiveInterval &VirtReg) const { 88 return getStage(VirtReg.reg()); 89 } 90 91 void setStage(Register Reg, LiveRangeStage Stage) { 92 Info.grow(Reg.id()); 93 Info[Reg].Stage = Stage; 94 } 95 96 void setStage(const LiveInterval &VirtReg, LiveRangeStage Stage) { 97 setStage(VirtReg.reg(), Stage); 98 } 99 100 /// Return the current stage of the register, if present, otherwise 101 /// initialize it and return that. 102 LiveRangeStage getOrInitStage(Register Reg) { 103 Info.grow(Reg.id()); 104 return getStage(Reg); 105 } 106 107 unsigned getCascade(Register Reg) const { return Info[Reg].Cascade; } 108 109 void setCascade(Register Reg, unsigned Cascade) { 110 Info.grow(Reg.id()); 111 Info[Reg].Cascade = Cascade; 112 } 113 114 unsigned getOrAssignNewCascade(Register Reg) { 115 unsigned Cascade = getCascade(Reg); 116 if (!Cascade) { 117 Cascade = NextCascade++; 118 setCascade(Reg, Cascade); 119 } 120 return Cascade; 121 } 122 123 unsigned getCascadeOrCurrentNext(Register Reg) const { 124 unsigned Cascade = getCascade(Reg); 125 if (!Cascade) 126 Cascade = NextCascade; 127 return Cascade; 128 } 129 130 template <typename Iterator> 131 void setStage(Iterator Begin, Iterator End, LiveRangeStage NewStage) { 132 for (; Begin != End; ++Begin) { 133 Register Reg = *Begin; 134 Info.grow(Reg.id()); 135 if (Info[Reg].Stage == RS_New) 136 Info[Reg].Stage = NewStage; 137 } 138 } 139 void LRE_DidCloneVirtReg(Register New, Register Old); 140 }; 141 142 LiveRegMatrix *getInterferenceMatrix() const { return Matrix; } 143 LiveIntervals *getLiveIntervals() const { return LIS; } 144 VirtRegMap *getVirtRegMap() const { return VRM; } 145 const RegisterClassInfo &getRegClassInfo() const { return RegClassInfo; } 146 const ExtraRegInfo &getExtraInfo() const { return *ExtraInfo; } 147 size_t getQueueSize() const { return Queue.size(); } 148 // end (interface to eviction advisers) 149 150 private: 151 // Convenient shortcuts. 152 using PQueue = std::priority_queue<std::pair<unsigned, unsigned>>; 153 using SmallLISet = SmallPtrSet<const LiveInterval *, 4>; 154 155 // We need to track all tentative recolorings so we can roll back any 156 // successful and unsuccessful recoloring attempts. 157 using RecoloringStack = 158 SmallVector<std::pair<const LiveInterval *, MCRegister>, 8>; 159 160 // context 161 MachineFunction *MF; 162 163 // Shortcuts to some useful interface. 164 const TargetInstrInfo *TII; 165 166 // analyses 167 SlotIndexes *Indexes; 168 MachineBlockFrequencyInfo *MBFI; 169 MachineDominatorTree *DomTree; 170 MachineLoopInfo *Loops; 171 MachineOptimizationRemarkEmitter *ORE; 172 EdgeBundles *Bundles; 173 SpillPlacement *SpillPlacer; 174 LiveDebugVariables *DebugVars; 175 176 // state 177 std::unique_ptr<Spiller> SpillerInstance; 178 PQueue Queue; 179 std::unique_ptr<VirtRegAuxInfo> VRAI; 180 Optional<ExtraRegInfo> ExtraInfo; 181 std::unique_ptr<RegAllocEvictionAdvisor> EvictAdvisor; 182 183 // Enum CutOffStage to keep a track whether the register allocation failed 184 // because of the cutoffs encountered in last chance recoloring. 185 // Note: This is used as bitmask. New value should be next power of 2. 186 enum CutOffStage { 187 // No cutoffs encountered 188 CO_None = 0, 189 190 // lcr-max-depth cutoff encountered 191 CO_Depth = 1, 192 193 // lcr-max-interf cutoff encountered 194 CO_Interf = 2 195 }; 196 197 uint8_t CutOffInfo; 198 199 #ifndef NDEBUG 200 static const char *const StageName[]; 201 #endif 202 203 // splitting state. 204 std::unique_ptr<SplitAnalysis> SA; 205 std::unique_ptr<SplitEditor> SE; 206 207 /// Cached per-block interference maps 208 InterferenceCache IntfCache; 209 210 /// All basic blocks where the current register has uses. 211 SmallVector<SpillPlacement::BlockConstraint, 8> SplitConstraints; 212 213 /// Global live range splitting candidate info. 214 struct GlobalSplitCandidate { 215 // Register intended for assignment, or 0. 216 MCRegister PhysReg; 217 218 // SplitKit interval index for this candidate. 219 unsigned IntvIdx; 220 221 // Interference for PhysReg. 222 InterferenceCache::Cursor Intf; 223 224 // Bundles where this candidate should be live. 225 BitVector LiveBundles; 226 SmallVector<unsigned, 8> ActiveBlocks; 227 228 void reset(InterferenceCache &Cache, MCRegister Reg) { 229 PhysReg = Reg; 230 IntvIdx = 0; 231 Intf.setPhysReg(Cache, Reg); 232 LiveBundles.clear(); 233 ActiveBlocks.clear(); 234 } 235 236 // Set B[I] = C for every live bundle where B[I] was NoCand. 237 unsigned getBundles(SmallVectorImpl<unsigned> &B, unsigned C) { 238 unsigned Count = 0; 239 for (unsigned I : LiveBundles.set_bits()) 240 if (B[I] == NoCand) { 241 B[I] = C; 242 Count++; 243 } 244 return Count; 245 } 246 }; 247 248 /// Candidate info for each PhysReg in AllocationOrder. 249 /// This vector never shrinks, but grows to the size of the largest register 250 /// class. 251 SmallVector<GlobalSplitCandidate, 32> GlobalCand; 252 253 enum : unsigned { NoCand = ~0u }; 254 255 /// Candidate map. Each edge bundle is assigned to a GlobalCand entry, or to 256 /// NoCand which indicates the stack interval. 257 SmallVector<unsigned, 32> BundleCand; 258 259 /// Callee-save register cost, calculated once per machine function. 260 BlockFrequency CSRCost; 261 262 /// Set of broken hints that may be reconciled later because of eviction. 263 SmallSetVector<const LiveInterval *, 8> SetOfBrokenHints; 264 265 /// The register cost values. This list will be recreated for each Machine 266 /// Function 267 ArrayRef<uint8_t> RegCosts; 268 269 /// Flags for the live range priority calculation, determined once per 270 /// machine function. 271 bool RegClassPriorityTrumpsGlobalness; 272 273 bool ReverseLocalAssignment; 274 275 public: 276 RAGreedy(const RegClassFilterFunc F = allocateAllRegClasses); 277 278 /// Return the pass name. 279 StringRef getPassName() const override { return "Greedy Register Allocator"; } 280 281 /// RAGreedy analysis usage. 282 void getAnalysisUsage(AnalysisUsage &AU) const override; 283 void releaseMemory() override; 284 Spiller &spiller() override { return *SpillerInstance; } 285 void enqueueImpl(const LiveInterval *LI) override; 286 const LiveInterval *dequeue() override; 287 MCRegister selectOrSplit(const LiveInterval &, 288 SmallVectorImpl<Register> &) override; 289 void aboutToRemoveInterval(const LiveInterval &) override; 290 291 /// Perform register allocation. 292 bool runOnMachineFunction(MachineFunction &mf) override; 293 294 MachineFunctionProperties getRequiredProperties() const override { 295 return MachineFunctionProperties().set( 296 MachineFunctionProperties::Property::NoPHIs); 297 } 298 299 MachineFunctionProperties getClearedProperties() const override { 300 return MachineFunctionProperties().set( 301 MachineFunctionProperties::Property::IsSSA); 302 } 303 304 static char ID; 305 306 private: 307 MCRegister selectOrSplitImpl(const LiveInterval &, 308 SmallVectorImpl<Register> &, SmallVirtRegSet &, 309 RecoloringStack &, unsigned = 0); 310 311 bool LRE_CanEraseVirtReg(Register) override; 312 void LRE_WillShrinkVirtReg(Register) override; 313 void LRE_DidCloneVirtReg(Register, Register) override; 314 void enqueue(PQueue &CurQueue, const LiveInterval *LI); 315 const LiveInterval *dequeue(PQueue &CurQueue); 316 317 bool hasVirtRegAlloc(); 318 BlockFrequency calcSpillCost(); 319 bool addSplitConstraints(InterferenceCache::Cursor, BlockFrequency &); 320 bool addThroughConstraints(InterferenceCache::Cursor, ArrayRef<unsigned>); 321 bool growRegion(GlobalSplitCandidate &Cand); 322 BlockFrequency calcGlobalSplitCost(GlobalSplitCandidate &, 323 const AllocationOrder &Order); 324 bool calcCompactRegion(GlobalSplitCandidate &); 325 void splitAroundRegion(LiveRangeEdit &, ArrayRef<unsigned>); 326 void calcGapWeights(MCRegister, SmallVectorImpl<float> &); 327 void evictInterference(const LiveInterval &, MCRegister, 328 SmallVectorImpl<Register> &); 329 bool mayRecolorAllInterferences(MCRegister PhysReg, 330 const LiveInterval &VirtReg, 331 SmallLISet &RecoloringCandidates, 332 const SmallVirtRegSet &FixedRegisters); 333 334 MCRegister tryAssign(const LiveInterval &, AllocationOrder &, 335 SmallVectorImpl<Register> &, const SmallVirtRegSet &); 336 MCRegister tryEvict(const LiveInterval &, AllocationOrder &, 337 SmallVectorImpl<Register> &, uint8_t, 338 const SmallVirtRegSet &); 339 MCRegister tryRegionSplit(const LiveInterval &, AllocationOrder &, 340 SmallVectorImpl<Register> &); 341 /// Calculate cost of region splitting. 342 unsigned calculateRegionSplitCost(const LiveInterval &VirtReg, 343 AllocationOrder &Order, 344 BlockFrequency &BestCost, 345 unsigned &NumCands, bool IgnoreCSR); 346 /// Perform region splitting. 347 unsigned doRegionSplit(const LiveInterval &VirtReg, unsigned BestCand, 348 bool HasCompact, SmallVectorImpl<Register> &NewVRegs); 349 /// Check other options before using a callee-saved register for the first 350 /// time. 351 MCRegister tryAssignCSRFirstTime(const LiveInterval &VirtReg, 352 AllocationOrder &Order, MCRegister PhysReg, 353 uint8_t &CostPerUseLimit, 354 SmallVectorImpl<Register> &NewVRegs); 355 void initializeCSRCost(); 356 unsigned tryBlockSplit(const LiveInterval &, AllocationOrder &, 357 SmallVectorImpl<Register> &); 358 unsigned tryInstructionSplit(const LiveInterval &, AllocationOrder &, 359 SmallVectorImpl<Register> &); 360 unsigned tryLocalSplit(const LiveInterval &, AllocationOrder &, 361 SmallVectorImpl<Register> &); 362 unsigned trySplit(const LiveInterval &, AllocationOrder &, 363 SmallVectorImpl<Register> &, const SmallVirtRegSet &); 364 unsigned tryLastChanceRecoloring(const LiveInterval &, AllocationOrder &, 365 SmallVectorImpl<Register> &, 366 SmallVirtRegSet &, RecoloringStack &, 367 unsigned); 368 bool tryRecoloringCandidates(PQueue &, SmallVectorImpl<Register> &, 369 SmallVirtRegSet &, RecoloringStack &, unsigned); 370 void tryHintRecoloring(const LiveInterval &); 371 void tryHintsRecoloring(); 372 373 /// Model the information carried by one end of a copy. 374 struct HintInfo { 375 /// The frequency of the copy. 376 BlockFrequency Freq; 377 /// The virtual register or physical register. 378 Register Reg; 379 /// Its currently assigned register. 380 /// In case of a physical register Reg == PhysReg. 381 MCRegister PhysReg; 382 383 HintInfo(BlockFrequency Freq, Register Reg, MCRegister PhysReg) 384 : Freq(Freq), Reg(Reg), PhysReg(PhysReg) {} 385 }; 386 using HintsInfo = SmallVector<HintInfo, 4>; 387 388 BlockFrequency getBrokenHintFreq(const HintsInfo &, MCRegister); 389 void collectHintInfo(Register, HintsInfo &); 390 391 /// Greedy RA statistic to remark. 392 struct RAGreedyStats { 393 unsigned Reloads = 0; 394 unsigned FoldedReloads = 0; 395 unsigned ZeroCostFoldedReloads = 0; 396 unsigned Spills = 0; 397 unsigned FoldedSpills = 0; 398 unsigned Copies = 0; 399 float ReloadsCost = 0.0f; 400 float FoldedReloadsCost = 0.0f; 401 float SpillsCost = 0.0f; 402 float FoldedSpillsCost = 0.0f; 403 float CopiesCost = 0.0f; 404 405 bool isEmpty() { 406 return !(Reloads || FoldedReloads || Spills || FoldedSpills || 407 ZeroCostFoldedReloads || Copies); 408 } 409 410 void add(RAGreedyStats other) { 411 Reloads += other.Reloads; 412 FoldedReloads += other.FoldedReloads; 413 ZeroCostFoldedReloads += other.ZeroCostFoldedReloads; 414 Spills += other.Spills; 415 FoldedSpills += other.FoldedSpills; 416 Copies += other.Copies; 417 ReloadsCost += other.ReloadsCost; 418 FoldedReloadsCost += other.FoldedReloadsCost; 419 SpillsCost += other.SpillsCost; 420 FoldedSpillsCost += other.FoldedSpillsCost; 421 CopiesCost += other.CopiesCost; 422 } 423 424 void report(MachineOptimizationRemarkMissed &R); 425 }; 426 427 /// Compute statistic for a basic block. 428 RAGreedyStats computeStats(MachineBasicBlock &MBB); 429 430 /// Compute and report statistic through a remark. 431 RAGreedyStats reportStats(MachineLoop *L); 432 433 /// Report the statistic for each loop. 434 void reportStats(); 435 }; 436 } // namespace llvm 437 #endif // #ifndef LLVM_CODEGEN_REGALLOCGREEDY_H_ 438