1 //===- CodeMoverUtils.cpp - CodeMover Utilities ----------------------------==// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This family of functions perform movements on basic blocks, and instructions 10 // contained within a function. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "llvm/Transforms/Utils/CodeMoverUtils.h" 15 #include "llvm/ADT/Optional.h" 16 #include "llvm/ADT/Statistic.h" 17 #include "llvm/Analysis/DependenceAnalysis.h" 18 #include "llvm/Analysis/PostDominators.h" 19 #include "llvm/Analysis/ValueTracking.h" 20 #include "llvm/IR/Dominators.h" 21 22 using namespace llvm; 23 24 #define DEBUG_TYPE "codemover-utils" 25 26 STATISTIC(HasDependences, 27 "Cannot move across instructions that has memory dependences"); 28 STATISTIC(MayThrowException, "Cannot move across instructions that may throw"); 29 STATISTIC(NotControlFlowEquivalent, 30 "Instructions are not control flow equivalent"); 31 STATISTIC(NotMovedPHINode, "Movement of PHINodes are not supported"); 32 STATISTIC(NotMovedTerminator, "Movement of Terminator are not supported"); 33 34 namespace { 35 /// Represent a control condition. A control condition is a condition of a 36 /// terminator to decide which successors to execute. The pointer field 37 /// represents the address of the condition of the terminator. The integer field 38 /// is a bool, it is true when the basic block is executed when V is true. For 39 /// example, `br %cond, bb0, bb1` %cond is a control condition of bb0 with the 40 /// integer field equals to true, while %cond is a control condition of bb1 with 41 /// the integer field equals to false. 42 using ControlCondition = PointerIntPair<Value *, 1, bool>; 43 #ifndef NDEBUG 44 raw_ostream &operator<<(raw_ostream &OS, const ControlCondition &C) { 45 OS << "[" << *C.getPointer() << ", " << (C.getInt() ? "true" : "false") 46 << "]"; 47 return OS; 48 } 49 #endif 50 51 /// Represent a set of control conditions required to execute ToBB from FromBB. 52 class ControlConditions { 53 using ConditionVectorTy = SmallVector<ControlCondition, 6>; 54 55 /// A SmallVector of control conditions. 56 ConditionVectorTy Conditions; 57 58 public: 59 /// Return a ControlConditions which stores all conditions required to execute 60 /// \p BB from \p Dominator. If \p MaxLookup is non-zero, it limits the 61 /// number of conditions to collect. Return None if not all conditions are 62 /// collected successfully, or we hit the limit. 63 static const Optional<ControlConditions> 64 collectControlConditions(const BasicBlock &BB, const BasicBlock &Dominator, 65 const DominatorTree &DT, 66 const PostDominatorTree &PDT, 67 unsigned MaxLookup = 6); 68 69 /// Return true if there exists no control conditions required to execute ToBB 70 /// from FromBB. 71 bool isUnconditional() const { return Conditions.empty(); } 72 73 /// Return a constant reference of Conditions. 74 const ConditionVectorTy &getControlConditions() const { return Conditions; } 75 76 /// Add \p V as one of the ControlCondition in Condition with IsTrueCondition 77 /// equals to \p True. Return true if inserted successfully. 78 bool addControlCondition(ControlCondition C); 79 80 /// Return true if for all control conditions in Conditions, there exists an 81 /// equivalent control condition in \p Other.Conditions. 82 bool isEquivalent(const ControlConditions &Other) const; 83 84 /// Return true if \p C1 and \p C2 are equivalent. 85 static bool isEquivalent(const ControlCondition &C1, 86 const ControlCondition &C2); 87 88 private: 89 ControlConditions() = default; 90 91 static bool isEquivalent(const Value &V1, const Value &V2); 92 static bool isInverse(const Value &V1, const Value &V2); 93 }; 94 } // namespace 95 96 static bool domTreeLevelBefore(DominatorTree *DT, const Instruction *InstA, 97 const Instruction *InstB) { 98 // Use ordered basic block in case the 2 instructions are in the same 99 // block. 100 if (InstA->getParent() == InstB->getParent()) 101 return InstA->comesBefore(InstB); 102 103 DomTreeNode *DA = DT->getNode(InstA->getParent()); 104 DomTreeNode *DB = DT->getNode(InstB->getParent()); 105 return DA->getLevel() < DB->getLevel(); 106 } 107 108 const Optional<ControlConditions> ControlConditions::collectControlConditions( 109 const BasicBlock &BB, const BasicBlock &Dominator, const DominatorTree &DT, 110 const PostDominatorTree &PDT, unsigned MaxLookup) { 111 assert(DT.dominates(&Dominator, &BB) && "Expecting Dominator to dominate BB"); 112 113 ControlConditions Conditions; 114 unsigned NumConditions = 0; 115 116 // BB is executed unconditional from itself. 117 if (&Dominator == &BB) 118 return Conditions; 119 120 const BasicBlock *CurBlock = &BB; 121 // Walk up the dominator tree from the associated DT node for BB to the 122 // associated DT node for Dominator. 123 do { 124 assert(DT.getNode(CurBlock) && "Expecting a valid DT node for CurBlock"); 125 BasicBlock *IDom = DT.getNode(CurBlock)->getIDom()->getBlock(); 126 assert(DT.dominates(&Dominator, IDom) && 127 "Expecting Dominator to dominate IDom"); 128 129 // Limitation: can only handle branch instruction currently. 130 const BranchInst *BI = dyn_cast<BranchInst>(IDom->getTerminator()); 131 if (!BI) 132 return None; 133 134 bool Inserted = false; 135 if (PDT.dominates(CurBlock, IDom)) { 136 LLVM_DEBUG(dbgs() << CurBlock->getName() 137 << " is executed unconditionally from " 138 << IDom->getName() << "\n"); 139 } else if (PDT.dominates(CurBlock, BI->getSuccessor(0))) { 140 LLVM_DEBUG(dbgs() << CurBlock->getName() << " is executed when \"" 141 << *BI->getCondition() << "\" is true from " 142 << IDom->getName() << "\n"); 143 Inserted = Conditions.addControlCondition( 144 ControlCondition(BI->getCondition(), true)); 145 } else if (PDT.dominates(CurBlock, BI->getSuccessor(1))) { 146 LLVM_DEBUG(dbgs() << CurBlock->getName() << " is executed when \"" 147 << *BI->getCondition() << "\" is false from " 148 << IDom->getName() << "\n"); 149 Inserted = Conditions.addControlCondition( 150 ControlCondition(BI->getCondition(), false)); 151 } else 152 return None; 153 154 if (Inserted) 155 ++NumConditions; 156 157 if (MaxLookup != 0 && NumConditions > MaxLookup) 158 return None; 159 160 CurBlock = IDom; 161 } while (CurBlock != &Dominator); 162 163 return Conditions; 164 } 165 166 bool ControlConditions::addControlCondition(ControlCondition C) { 167 bool Inserted = false; 168 if (none_of(Conditions, [&](ControlCondition &Exists) { 169 return ControlConditions::isEquivalent(C, Exists); 170 })) { 171 Conditions.push_back(C); 172 Inserted = true; 173 } 174 175 LLVM_DEBUG(dbgs() << (Inserted ? "Inserted " : "Not inserted ") << C << "\n"); 176 return Inserted; 177 } 178 179 bool ControlConditions::isEquivalent(const ControlConditions &Other) const { 180 if (Conditions.empty() && Other.Conditions.empty()) 181 return true; 182 183 if (Conditions.size() != Other.Conditions.size()) 184 return false; 185 186 return all_of(Conditions, [&](const ControlCondition &C) { 187 return any_of(Other.Conditions, [&](const ControlCondition &OtherC) { 188 return ControlConditions::isEquivalent(C, OtherC); 189 }); 190 }); 191 } 192 193 bool ControlConditions::isEquivalent(const ControlCondition &C1, 194 const ControlCondition &C2) { 195 if (C1.getInt() == C2.getInt()) { 196 if (isEquivalent(*C1.getPointer(), *C2.getPointer())) 197 return true; 198 } else if (isInverse(*C1.getPointer(), *C2.getPointer())) 199 return true; 200 201 return false; 202 } 203 204 // FIXME: Use SCEV and reuse GVN/CSE logic to check for equivalence between 205 // Values. 206 // Currently, isEquivalent rely on other passes to ensure equivalent conditions 207 // have the same value, e.g. GVN. 208 bool ControlConditions::isEquivalent(const Value &V1, const Value &V2) { 209 return &V1 == &V2; 210 } 211 212 bool ControlConditions::isInverse(const Value &V1, const Value &V2) { 213 if (const CmpInst *Cmp1 = dyn_cast<CmpInst>(&V1)) 214 if (const CmpInst *Cmp2 = dyn_cast<CmpInst>(&V2)) { 215 if (Cmp1->getPredicate() == Cmp2->getInversePredicate() && 216 Cmp1->getOperand(0) == Cmp2->getOperand(0) && 217 Cmp1->getOperand(1) == Cmp2->getOperand(1)) 218 return true; 219 220 if (Cmp1->getPredicate() == 221 CmpInst::getSwappedPredicate(Cmp2->getInversePredicate()) && 222 Cmp1->getOperand(0) == Cmp2->getOperand(1) && 223 Cmp1->getOperand(1) == Cmp2->getOperand(0)) 224 return true; 225 } 226 return false; 227 } 228 229 bool llvm::isControlFlowEquivalent(const Instruction &I0, const Instruction &I1, 230 const DominatorTree &DT, 231 const PostDominatorTree &PDT) { 232 return isControlFlowEquivalent(*I0.getParent(), *I1.getParent(), DT, PDT); 233 } 234 235 bool llvm::isControlFlowEquivalent(const BasicBlock &BB0, const BasicBlock &BB1, 236 const DominatorTree &DT, 237 const PostDominatorTree &PDT) { 238 if (&BB0 == &BB1) 239 return true; 240 241 if ((DT.dominates(&BB0, &BB1) && PDT.dominates(&BB1, &BB0)) || 242 (PDT.dominates(&BB0, &BB1) && DT.dominates(&BB1, &BB0))) 243 return true; 244 245 // If the set of conditions required to execute BB0 and BB1 from their common 246 // dominator are the same, then BB0 and BB1 are control flow equivalent. 247 const BasicBlock *CommonDominator = DT.findNearestCommonDominator(&BB0, &BB1); 248 LLVM_DEBUG(dbgs() << "The nearest common dominator of " << BB0.getName() 249 << " and " << BB1.getName() << " is " 250 << CommonDominator->getName() << "\n"); 251 252 const Optional<ControlConditions> BB0Conditions = 253 ControlConditions::collectControlConditions(BB0, *CommonDominator, DT, 254 PDT); 255 if (BB0Conditions == None) 256 return false; 257 258 const Optional<ControlConditions> BB1Conditions = 259 ControlConditions::collectControlConditions(BB1, *CommonDominator, DT, 260 PDT); 261 if (BB1Conditions == None) 262 return false; 263 264 return BB0Conditions->isEquivalent(*BB1Conditions); 265 } 266 267 static bool reportInvalidCandidate(const Instruction &I, 268 llvm::Statistic &Stat) { 269 ++Stat; 270 LLVM_DEBUG(dbgs() << "Unable to move instruction: " << I << ". " 271 << Stat.getDesc()); 272 return false; 273 } 274 275 /// Collect all instructions in between \p StartInst and \p EndInst, and store 276 /// them in \p InBetweenInsts. 277 static void 278 collectInstructionsInBetween(Instruction &StartInst, const Instruction &EndInst, 279 SmallPtrSetImpl<Instruction *> &InBetweenInsts) { 280 assert(InBetweenInsts.empty() && "Expecting InBetweenInsts to be empty"); 281 282 /// Get the next instructions of \p I, and push them to \p WorkList. 283 auto getNextInsts = [](Instruction &I, 284 SmallPtrSetImpl<Instruction *> &WorkList) { 285 if (Instruction *NextInst = I.getNextNode()) 286 WorkList.insert(NextInst); 287 else { 288 assert(I.isTerminator() && "Expecting a terminator instruction"); 289 for (BasicBlock *Succ : successors(&I)) 290 WorkList.insert(&Succ->front()); 291 } 292 }; 293 294 SmallPtrSet<Instruction *, 10> WorkList; 295 getNextInsts(StartInst, WorkList); 296 while (!WorkList.empty()) { 297 Instruction *CurInst = *WorkList.begin(); 298 WorkList.erase(CurInst); 299 300 if (CurInst == &EndInst) 301 continue; 302 303 if (!InBetweenInsts.insert(CurInst).second) 304 continue; 305 306 getNextInsts(*CurInst, WorkList); 307 } 308 } 309 310 bool llvm::isSafeToMoveBefore(Instruction &I, Instruction &InsertPoint, 311 DominatorTree &DT, const PostDominatorTree *PDT, 312 DependenceInfo *DI) { 313 // Skip tests when we don't have PDT or DI 314 if (!PDT || !DI) 315 return false; 316 317 // Cannot move itself before itself. 318 if (&I == &InsertPoint) 319 return false; 320 321 // Not moved. 322 if (I.getNextNode() == &InsertPoint) 323 return true; 324 325 if (isa<PHINode>(I) || isa<PHINode>(InsertPoint)) 326 return reportInvalidCandidate(I, NotMovedPHINode); 327 328 if (I.isTerminator()) 329 return reportInvalidCandidate(I, NotMovedTerminator); 330 331 // TODO remove this limitation. 332 if (!isControlFlowEquivalent(I, InsertPoint, DT, *PDT)) 333 return reportInvalidCandidate(I, NotControlFlowEquivalent); 334 335 if (!DT.dominates(&InsertPoint, &I)) 336 for (const Use &U : I.uses()) 337 if (auto *UserInst = dyn_cast<Instruction>(U.getUser())) 338 if (UserInst != &InsertPoint && !DT.dominates(&InsertPoint, U)) 339 return false; 340 if (!DT.dominates(&I, &InsertPoint)) 341 for (const Value *Op : I.operands()) 342 if (auto *OpInst = dyn_cast<Instruction>(Op)) 343 if (&InsertPoint == OpInst || !DT.dominates(OpInst, &InsertPoint)) 344 return false; 345 346 DT.updateDFSNumbers(); 347 const bool MoveForward = domTreeLevelBefore(&DT, &I, &InsertPoint); 348 Instruction &StartInst = (MoveForward ? I : InsertPoint); 349 Instruction &EndInst = (MoveForward ? InsertPoint : I); 350 SmallPtrSet<Instruction *, 10> InstsToCheck; 351 collectInstructionsInBetween(StartInst, EndInst, InstsToCheck); 352 if (!MoveForward) 353 InstsToCheck.insert(&InsertPoint); 354 355 // Check if there exists instructions which may throw, may synchonize, or may 356 // never return, from I to InsertPoint. 357 if (!isSafeToSpeculativelyExecute(&I)) 358 if (llvm::any_of(InstsToCheck, [](Instruction *I) { 359 if (I->mayThrow()) 360 return true; 361 362 const CallBase *CB = dyn_cast<CallBase>(I); 363 if (!CB) 364 return false; 365 if (!CB->hasFnAttr(Attribute::WillReturn)) 366 return true; 367 if (!CB->hasFnAttr(Attribute::NoSync)) 368 return true; 369 370 return false; 371 })) { 372 return reportInvalidCandidate(I, MayThrowException); 373 } 374 375 // Check if I has any output/flow/anti dependences with instructions from \p 376 // StartInst to \p EndInst. 377 if (llvm::any_of(InstsToCheck, [&DI, &I](Instruction *CurInst) { 378 auto DepResult = DI->depends(&I, CurInst, true); 379 if (DepResult && (DepResult->isOutput() || DepResult->isFlow() || 380 DepResult->isAnti())) 381 return true; 382 return false; 383 })) 384 return reportInvalidCandidate(I, HasDependences); 385 386 return true; 387 } 388 389 bool llvm::isSafeToMoveBefore(BasicBlock &BB, Instruction &InsertPoint, 390 DominatorTree &DT, const PostDominatorTree *PDT, 391 DependenceInfo *DI) { 392 return llvm::all_of(BB, [&](Instruction &I) { 393 if (BB.getTerminator() == &I) 394 return true; 395 396 return isSafeToMoveBefore(I, InsertPoint, DT, PDT, DI); 397 }); 398 } 399 400 void llvm::moveInstructionsToTheBeginning(BasicBlock &FromBB, BasicBlock &ToBB, 401 DominatorTree &DT, 402 const PostDominatorTree &PDT, 403 DependenceInfo &DI) { 404 for (auto It = ++FromBB.rbegin(); It != FromBB.rend();) { 405 Instruction *MovePos = ToBB.getFirstNonPHIOrDbg(); 406 Instruction &I = *It; 407 // Increment the iterator before modifying FromBB. 408 ++It; 409 410 if (isSafeToMoveBefore(I, *MovePos, DT, &PDT, &DI)) 411 I.moveBefore(MovePos); 412 } 413 } 414 415 void llvm::moveInstructionsToTheEnd(BasicBlock &FromBB, BasicBlock &ToBB, 416 DominatorTree &DT, 417 const PostDominatorTree &PDT, 418 DependenceInfo &DI) { 419 Instruction *MovePos = ToBB.getTerminator(); 420 while (FromBB.size() > 1) { 421 Instruction &I = FromBB.front(); 422 if (isSafeToMoveBefore(I, *MovePos, DT, &PDT, &DI)) 423 I.moveBefore(MovePos); 424 } 425 } 426