1 //===- SIAnnotateControlFlow.cpp ------------------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 /// \file 10 /// Annotates the control flow with hardware specific intrinsics. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "AMDGPU.h" 15 #include "GCNSubtarget.h" 16 #include "llvm/Analysis/LoopInfo.h" 17 #include "llvm/Analysis/UniformityAnalysis.h" 18 #include "llvm/CodeGen/TargetPassConfig.h" 19 #include "llvm/IR/BasicBlock.h" 20 #include "llvm/IR/Constants.h" 21 #include "llvm/IR/Dominators.h" 22 #include "llvm/IR/IRBuilder.h" 23 #include "llvm/IR/IntrinsicsAMDGPU.h" 24 #include "llvm/InitializePasses.h" 25 #include "llvm/Target/TargetMachine.h" 26 #include "llvm/Transforms/Utils/BasicBlockUtils.h" 27 #include "llvm/Transforms/Utils/Local.h" 28 29 using namespace llvm; 30 31 #define DEBUG_TYPE "si-annotate-control-flow" 32 33 namespace { 34 35 // Complex types used in this pass 36 using StackEntry = std::pair<BasicBlock *, Value *>; 37 using StackVector = SmallVector<StackEntry, 16>; 38 39 class SIAnnotateControlFlow : public FunctionPass { 40 UniformityInfo *UA; 41 42 Type *Boolean; 43 Type *Void; 44 Type *IntMask; 45 Type *ReturnStruct; 46 47 ConstantInt *BoolTrue; 48 ConstantInt *BoolFalse; 49 UndefValue *BoolUndef; 50 Constant *IntMaskZero; 51 52 Function *If; 53 Function *Else; 54 Function *IfBreak; 55 Function *Loop; 56 Function *EndCf; 57 58 DominatorTree *DT; 59 StackVector Stack; 60 61 LoopInfo *LI; 62 63 void initialize(Module &M, const GCNSubtarget &ST); 64 65 bool isUniform(BranchInst *T); 66 67 bool isTopOfStack(BasicBlock *BB); 68 69 Value *popSaved(); 70 71 void push(BasicBlock *BB, Value *Saved); 72 73 bool isElse(PHINode *Phi); 74 75 bool hasKill(const BasicBlock *BB); 76 77 bool eraseIfUnused(PHINode *Phi); 78 79 bool openIf(BranchInst *Term); 80 81 bool insertElse(BranchInst *Term); 82 83 Value * 84 handleLoopCondition(Value *Cond, PHINode *Broken, llvm::Loop *L, 85 BranchInst *Term); 86 87 bool handleLoop(BranchInst *Term); 88 89 bool closeControlFlow(BasicBlock *BB); 90 91 public: 92 static char ID; 93 94 SIAnnotateControlFlow() : FunctionPass(ID) {} 95 96 bool runOnFunction(Function &F) override; 97 98 StringRef getPassName() const override { return "SI annotate control flow"; } 99 100 void getAnalysisUsage(AnalysisUsage &AU) const override { 101 AU.addRequired<LoopInfoWrapperPass>(); 102 AU.addRequired<DominatorTreeWrapperPass>(); 103 AU.addRequired<UniformityInfoWrapperPass>(); 104 AU.addPreserved<LoopInfoWrapperPass>(); 105 AU.addPreserved<DominatorTreeWrapperPass>(); 106 AU.addRequired<TargetPassConfig>(); 107 FunctionPass::getAnalysisUsage(AU); 108 } 109 }; 110 111 } // end anonymous namespace 112 113 INITIALIZE_PASS_BEGIN(SIAnnotateControlFlow, DEBUG_TYPE, 114 "Annotate SI Control Flow", false, false) 115 INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass) 116 INITIALIZE_PASS_DEPENDENCY(UniformityInfoWrapperPass) 117 INITIALIZE_PASS_DEPENDENCY(TargetPassConfig) 118 INITIALIZE_PASS_END(SIAnnotateControlFlow, DEBUG_TYPE, 119 "Annotate SI Control Flow", false, false) 120 121 char SIAnnotateControlFlow::ID = 0; 122 123 /// Initialize all the types and constants used in the pass 124 void SIAnnotateControlFlow::initialize(Module &M, const GCNSubtarget &ST) { 125 LLVMContext &Context = M.getContext(); 126 127 Void = Type::getVoidTy(Context); 128 Boolean = Type::getInt1Ty(Context); 129 IntMask = ST.isWave32() ? Type::getInt32Ty(Context) 130 : Type::getInt64Ty(Context); 131 ReturnStruct = StructType::get(Boolean, IntMask); 132 133 BoolTrue = ConstantInt::getTrue(Context); 134 BoolFalse = ConstantInt::getFalse(Context); 135 BoolUndef = PoisonValue::get(Boolean); 136 IntMaskZero = ConstantInt::get(IntMask, 0); 137 138 If = Intrinsic::getDeclaration(&M, Intrinsic::amdgcn_if, { IntMask }); 139 Else = Intrinsic::getDeclaration(&M, Intrinsic::amdgcn_else, 140 { IntMask, IntMask }); 141 IfBreak = Intrinsic::getDeclaration(&M, Intrinsic::amdgcn_if_break, 142 { IntMask }); 143 Loop = Intrinsic::getDeclaration(&M, Intrinsic::amdgcn_loop, { IntMask }); 144 EndCf = Intrinsic::getDeclaration(&M, Intrinsic::amdgcn_end_cf, { IntMask }); 145 } 146 147 /// Is the branch condition uniform or did the StructurizeCFG pass 148 /// consider it as such? 149 bool SIAnnotateControlFlow::isUniform(BranchInst *T) { 150 return UA->isUniform(T) || T->hasMetadata("structurizecfg.uniform"); 151 } 152 153 /// Is BB the last block saved on the stack ? 154 bool SIAnnotateControlFlow::isTopOfStack(BasicBlock *BB) { 155 return !Stack.empty() && Stack.back().first == BB; 156 } 157 158 /// Pop the last saved value from the control flow stack 159 Value *SIAnnotateControlFlow::popSaved() { 160 return Stack.pop_back_val().second; 161 } 162 163 /// Push a BB and saved value to the control flow stack 164 void SIAnnotateControlFlow::push(BasicBlock *BB, Value *Saved) { 165 Stack.push_back(std::pair(BB, Saved)); 166 } 167 168 /// Can the condition represented by this PHI node treated like 169 /// an "Else" block? 170 bool SIAnnotateControlFlow::isElse(PHINode *Phi) { 171 BasicBlock *IDom = DT->getNode(Phi->getParent())->getIDom()->getBlock(); 172 for (unsigned i = 0, e = Phi->getNumIncomingValues(); i != e; ++i) { 173 if (Phi->getIncomingBlock(i) == IDom) { 174 175 if (Phi->getIncomingValue(i) != BoolTrue) 176 return false; 177 178 } else { 179 if (Phi->getIncomingValue(i) != BoolFalse) 180 return false; 181 182 } 183 } 184 return true; 185 } 186 187 bool SIAnnotateControlFlow::hasKill(const BasicBlock *BB) { 188 for (const Instruction &I : *BB) { 189 if (const CallInst *CI = dyn_cast<CallInst>(&I)) 190 if (CI->getIntrinsicID() == Intrinsic::amdgcn_kill) 191 return true; 192 } 193 return false; 194 } 195 196 // Erase "Phi" if it is not used any more. Return true if any change was made. 197 bool SIAnnotateControlFlow::eraseIfUnused(PHINode *Phi) { 198 bool Changed = RecursivelyDeleteDeadPHINode(Phi); 199 if (Changed) 200 LLVM_DEBUG(dbgs() << "Erased unused condition phi\n"); 201 return Changed; 202 } 203 204 /// Open a new "If" block 205 bool SIAnnotateControlFlow::openIf(BranchInst *Term) { 206 if (isUniform(Term)) 207 return false; 208 209 IRBuilder<> IRB(Term); 210 Value *IfCall = IRB.CreateCall(If, {Term->getCondition()}); 211 Value *Cond = IRB.CreateExtractValue(IfCall, {0}); 212 Value *Mask = IRB.CreateExtractValue(IfCall, {1}); 213 Term->setCondition(Cond); 214 push(Term->getSuccessor(1), Mask); 215 return true; 216 } 217 218 /// Close the last "If" block and open a new "Else" block 219 bool SIAnnotateControlFlow::insertElse(BranchInst *Term) { 220 if (isUniform(Term)) { 221 return false; 222 } 223 224 IRBuilder<> IRB(Term); 225 Value *ElseCall = IRB.CreateCall(Else, {popSaved()}); 226 Value *Cond = IRB.CreateExtractValue(ElseCall, {0}); 227 Value *Mask = IRB.CreateExtractValue(ElseCall, {1}); 228 Term->setCondition(Cond); 229 push(Term->getSuccessor(1), Mask); 230 return true; 231 } 232 233 /// Recursively handle the condition leading to a loop 234 Value *SIAnnotateControlFlow::handleLoopCondition( 235 Value *Cond, PHINode *Broken, llvm::Loop *L, BranchInst *Term) { 236 237 auto CreateBreak = [this, Cond, Broken](Instruction *I) -> CallInst * { 238 return IRBuilder<>(I).CreateCall(IfBreak, {Cond, Broken}); 239 }; 240 241 if (Instruction *Inst = dyn_cast<Instruction>(Cond)) { 242 BasicBlock *Parent = Inst->getParent(); 243 Instruction *Insert; 244 if (L->contains(Inst)) { 245 Insert = Parent->getTerminator(); 246 } else { 247 Insert = L->getHeader()->getFirstNonPHIOrDbgOrLifetime(); 248 } 249 250 return CreateBreak(Insert); 251 } 252 253 // Insert IfBreak in the loop header TERM for constant COND other than true. 254 if (isa<Constant>(Cond)) { 255 Instruction *Insert = Cond == BoolTrue ? 256 Term : L->getHeader()->getTerminator(); 257 258 return CreateBreak(Insert); 259 } 260 261 if (isa<Argument>(Cond)) { 262 Instruction *Insert = L->getHeader()->getFirstNonPHIOrDbgOrLifetime(); 263 return CreateBreak(Insert); 264 } 265 266 llvm_unreachable("Unhandled loop condition!"); 267 } 268 269 /// Handle a back edge (loop) 270 bool SIAnnotateControlFlow::handleLoop(BranchInst *Term) { 271 if (isUniform(Term)) 272 return false; 273 274 BasicBlock *BB = Term->getParent(); 275 llvm::Loop *L = LI->getLoopFor(BB); 276 if (!L) 277 return false; 278 279 BasicBlock *Target = Term->getSuccessor(1); 280 PHINode *Broken = PHINode::Create(IntMask, 0, "phi.broken"); 281 Broken->insertBefore(Target->begin()); 282 283 Value *Cond = Term->getCondition(); 284 Term->setCondition(BoolTrue); 285 Value *Arg = handleLoopCondition(Cond, Broken, L, Term); 286 287 for (BasicBlock *Pred : predecessors(Target)) { 288 Value *PHIValue = IntMaskZero; 289 if (Pred == BB) // Remember the value of the previous iteration. 290 PHIValue = Arg; 291 // If the backedge from Pred to Target could be executed before the exit 292 // of the loop at BB, it should not reset or change "Broken", which keeps 293 // track of the number of threads exited the loop at BB. 294 else if (L->contains(Pred) && DT->dominates(Pred, BB)) 295 PHIValue = Broken; 296 Broken->addIncoming(PHIValue, Pred); 297 } 298 299 CallInst *LoopCall = IRBuilder<>(Term).CreateCall(Loop, {Arg}); 300 Term->setCondition(LoopCall); 301 302 push(Term->getSuccessor(0), Arg); 303 304 return true; 305 } 306 307 /// Close the last opened control flow 308 bool SIAnnotateControlFlow::closeControlFlow(BasicBlock *BB) { 309 llvm::Loop *L = LI->getLoopFor(BB); 310 311 assert(Stack.back().first == BB); 312 313 if (L && L->getHeader() == BB) { 314 // We can't insert an EndCF call into a loop header, because it will 315 // get executed on every iteration of the loop, when it should be 316 // executed only once before the loop. 317 SmallVector <BasicBlock *, 8> Latches; 318 L->getLoopLatches(Latches); 319 320 SmallVector<BasicBlock *, 2> Preds; 321 for (BasicBlock *Pred : predecessors(BB)) { 322 if (!is_contained(Latches, Pred)) 323 Preds.push_back(Pred); 324 } 325 326 BB = SplitBlockPredecessors(BB, Preds, "endcf.split", DT, LI, nullptr, 327 false); 328 } 329 330 Value *Exec = popSaved(); 331 BasicBlock::iterator FirstInsertionPt = BB->getFirstInsertionPt(); 332 if (!isa<UndefValue>(Exec) && !isa<UnreachableInst>(FirstInsertionPt)) { 333 Instruction *ExecDef = cast<Instruction>(Exec); 334 BasicBlock *DefBB = ExecDef->getParent(); 335 if (!DT->dominates(DefBB, BB)) { 336 // Split edge to make Def dominate Use 337 FirstInsertionPt = SplitEdge(DefBB, BB, DT, LI)->getFirstInsertionPt(); 338 } 339 IRBuilder<> IRB(FirstInsertionPt->getParent(), FirstInsertionPt); 340 // TODO: StructurizeCFG 'Flow' blocks have debug locations from the 341 // condition, for now just avoid copying these DebugLocs so that stepping 342 // out of the then/else block in a debugger doesn't step to the condition. 343 IRB.SetCurrentDebugLocation(DebugLoc()); 344 IRB.CreateCall(EndCf, {Exec}); 345 } 346 347 return true; 348 } 349 350 /// Annotate the control flow with intrinsics so the backend can 351 /// recognize if/then/else and loops. 352 bool SIAnnotateControlFlow::runOnFunction(Function &F) { 353 DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree(); 354 LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo(); 355 UA = &getAnalysis<UniformityInfoWrapperPass>().getUniformityInfo(); 356 TargetPassConfig &TPC = getAnalysis<TargetPassConfig>(); 357 const TargetMachine &TM = TPC.getTM<TargetMachine>(); 358 359 bool Changed = false; 360 initialize(*F.getParent(), TM.getSubtarget<GCNSubtarget>(F)); 361 for (df_iterator<BasicBlock *> I = df_begin(&F.getEntryBlock()), 362 E = df_end(&F.getEntryBlock()); I != E; ++I) { 363 BasicBlock *BB = *I; 364 BranchInst *Term = dyn_cast<BranchInst>(BB->getTerminator()); 365 366 if (!Term || Term->isUnconditional()) { 367 if (isTopOfStack(BB)) 368 Changed |= closeControlFlow(BB); 369 370 continue; 371 } 372 373 if (I.nodeVisited(Term->getSuccessor(1))) { 374 if (isTopOfStack(BB)) 375 Changed |= closeControlFlow(BB); 376 377 if (DT->dominates(Term->getSuccessor(1), BB)) 378 Changed |= handleLoop(Term); 379 continue; 380 } 381 382 if (isTopOfStack(BB)) { 383 PHINode *Phi = dyn_cast<PHINode>(Term->getCondition()); 384 if (Phi && Phi->getParent() == BB && isElse(Phi) && !hasKill(BB)) { 385 Changed |= insertElse(Term); 386 Changed |= eraseIfUnused(Phi); 387 continue; 388 } 389 390 Changed |= closeControlFlow(BB); 391 } 392 393 Changed |= openIf(Term); 394 } 395 396 if (!Stack.empty()) { 397 // CFG was probably not structured. 398 report_fatal_error("failed to annotate CFG"); 399 } 400 401 return Changed; 402 } 403 404 /// Create the annotation pass 405 FunctionPass *llvm::createSIAnnotateControlFlowPass() { 406 return new SIAnnotateControlFlow(); 407 } 408