1 //===- LoopVersioningLICM.cpp - LICM Loop Versioning ----------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // When alias analysis is uncertain about the aliasing between any two accesses, 10 // it will return MayAlias. This uncertainty from alias analysis restricts LICM 11 // from proceeding further. In cases where alias analysis is uncertain we might 12 // use loop versioning as an alternative. 13 // 14 // Loop Versioning will create a version of the loop with aggressive aliasing 15 // assumptions in addition to the original with conservative (default) aliasing 16 // assumptions. The version of the loop making aggressive aliasing assumptions 17 // will have all the memory accesses marked as no-alias. These two versions of 18 // loop will be preceded by a memory runtime check. This runtime check consists 19 // of bound checks for all unique memory accessed in loop, and it ensures the 20 // lack of memory aliasing. The result of the runtime check determines which of 21 // the loop versions is executed: If the runtime check detects any memory 22 // aliasing, then the original loop is executed. Otherwise, the version with 23 // aggressive aliasing assumptions is used. 24 // 25 // Following are the top level steps: 26 // 27 // a) Perform LoopVersioningLICM's feasibility check. 28 // b) If loop is a candidate for versioning then create a memory bound check, 29 // by considering all the memory accesses in loop body. 30 // c) Clone original loop and set all memory accesses as no-alias in new loop. 31 // d) Set original loop & versioned loop as a branch target of the runtime check 32 // result. 33 // 34 // It transforms loop as shown below: 35 // 36 // +----------------+ 37 // |Runtime Memcheck| 38 // +----------------+ 39 // | 40 // +----------+----------------+----------+ 41 // | | 42 // +---------+----------+ +-----------+----------+ 43 // |Orig Loop Preheader | |Cloned Loop Preheader | 44 // +--------------------+ +----------------------+ 45 // | | 46 // +--------------------+ +----------------------+ 47 // |Orig Loop Body | |Cloned Loop Body | 48 // +--------------------+ +----------------------+ 49 // | | 50 // +--------------------+ +----------------------+ 51 // |Orig Loop Exit Block| |Cloned Loop Exit Block| 52 // +--------------------+ +-----------+----------+ 53 // | | 54 // +----------+--------------+-----------+ 55 // | 56 // +-----+----+ 57 // |Join Block| 58 // +----------+ 59 // 60 //===----------------------------------------------------------------------===// 61 62 #include "llvm/Transforms/Scalar/LoopVersioningLICM.h" 63 #include "llvm/ADT/SmallVector.h" 64 #include "llvm/ADT/StringRef.h" 65 #include "llvm/Analysis/AliasAnalysis.h" 66 #include "llvm/Analysis/AliasSetTracker.h" 67 #include "llvm/Analysis/GlobalsModRef.h" 68 #include "llvm/Analysis/LoopAccessAnalysis.h" 69 #include "llvm/Analysis/LoopInfo.h" 70 #include "llvm/Analysis/LoopPass.h" 71 #include "llvm/Analysis/OptimizationRemarkEmitter.h" 72 #include "llvm/Analysis/ScalarEvolution.h" 73 #include "llvm/IR/Constants.h" 74 #include "llvm/IR/Dominators.h" 75 #include "llvm/IR/Instruction.h" 76 #include "llvm/IR/Instructions.h" 77 #include "llvm/IR/LLVMContext.h" 78 #include "llvm/IR/MDBuilder.h" 79 #include "llvm/IR/Metadata.h" 80 #include "llvm/IR/Type.h" 81 #include "llvm/IR/Value.h" 82 #include "llvm/InitializePasses.h" 83 #include "llvm/Pass.h" 84 #include "llvm/Support/Casting.h" 85 #include "llvm/Support/CommandLine.h" 86 #include "llvm/Support/Debug.h" 87 #include "llvm/Support/raw_ostream.h" 88 #include "llvm/Transforms/Scalar.h" 89 #include "llvm/Transforms/Utils.h" 90 #include "llvm/Transforms/Utils/LoopUtils.h" 91 #include "llvm/Transforms/Utils/LoopVersioning.h" 92 #include <cassert> 93 #include <memory> 94 95 using namespace llvm; 96 97 #define DEBUG_TYPE "loop-versioning-licm" 98 99 static const char *LICMVersioningMetaData = "llvm.loop.licm_versioning.disable"; 100 101 /// Threshold minimum allowed percentage for possible 102 /// invariant instructions in a loop. 103 static cl::opt<float> 104 LVInvarThreshold("licm-versioning-invariant-threshold", 105 cl::desc("LoopVersioningLICM's minimum allowed percentage" 106 "of possible invariant instructions per loop"), 107 cl::init(25), cl::Hidden); 108 109 /// Threshold for maximum allowed loop nest/depth 110 static cl::opt<unsigned> LVLoopDepthThreshold( 111 "licm-versioning-max-depth-threshold", 112 cl::desc( 113 "LoopVersioningLICM's threshold for maximum allowed loop nest/depth"), 114 cl::init(2), cl::Hidden); 115 116 namespace { 117 118 struct LoopVersioningLICMLegacyPass : public LoopPass { 119 static char ID; 120 121 LoopVersioningLICMLegacyPass() : LoopPass(ID) { 122 initializeLoopVersioningLICMLegacyPassPass( 123 *PassRegistry::getPassRegistry()); 124 } 125 126 bool runOnLoop(Loop *L, LPPassManager &LPM) override; 127 128 StringRef getPassName() const override { return "Loop Versioning for LICM"; } 129 130 void getAnalysisUsage(AnalysisUsage &AU) const override { 131 AU.setPreservesCFG(); 132 AU.addRequired<AAResultsWrapperPass>(); 133 AU.addRequired<DominatorTreeWrapperPass>(); 134 AU.addRequiredID(LCSSAID); 135 AU.addRequired<LoopAccessLegacyAnalysis>(); 136 AU.addRequired<LoopInfoWrapperPass>(); 137 AU.addRequiredID(LoopSimplifyID); 138 AU.addRequired<ScalarEvolutionWrapperPass>(); 139 AU.addPreserved<AAResultsWrapperPass>(); 140 AU.addPreserved<GlobalsAAWrapperPass>(); 141 AU.addRequired<OptimizationRemarkEmitterWrapperPass>(); 142 } 143 }; 144 145 struct LoopVersioningLICM { 146 // We don't explicitly pass in LoopAccessInfo to the constructor since the 147 // loop versioning might return early due to instructions that are not safe 148 // for versioning. By passing the proxy instead the construction of 149 // LoopAccessInfo will take place only when it's necessary. 150 LoopVersioningLICM(AliasAnalysis *AA, ScalarEvolution *SE, 151 OptimizationRemarkEmitter *ORE, 152 function_ref<const LoopAccessInfo &(Loop *)> GetLAI) 153 : AA(AA), SE(SE), GetLAI(GetLAI), 154 LoopDepthThreshold(LVLoopDepthThreshold), 155 InvariantThreshold(LVInvarThreshold), ORE(ORE) {} 156 157 bool runOnLoop(Loop *L, LoopInfo *LI, DominatorTree *DT); 158 159 void reset() { 160 AA = nullptr; 161 SE = nullptr; 162 CurLoop = nullptr; 163 LoadAndStoreCounter = 0; 164 InvariantCounter = 0; 165 IsReadOnlyLoop = true; 166 ORE = nullptr; 167 CurAST.reset(); 168 } 169 170 class AutoResetter { 171 public: 172 AutoResetter(LoopVersioningLICM &LVLICM) : LVLICM(LVLICM) {} 173 ~AutoResetter() { LVLICM.reset(); } 174 175 private: 176 LoopVersioningLICM &LVLICM; 177 }; 178 179 private: 180 // Current AliasAnalysis information 181 AliasAnalysis *AA = nullptr; 182 183 // Current ScalarEvolution 184 ScalarEvolution *SE = nullptr; 185 186 // Current Loop's LoopAccessInfo 187 const LoopAccessInfo *LAI = nullptr; 188 189 // Proxy for retrieving LoopAccessInfo. 190 function_ref<const LoopAccessInfo &(Loop *)> GetLAI; 191 192 // The current loop we are working on. 193 Loop *CurLoop = nullptr; 194 195 // AliasSet information for the current loop. 196 std::unique_ptr<AliasSetTracker> CurAST; 197 198 // Maximum loop nest threshold 199 unsigned LoopDepthThreshold; 200 201 // Minimum invariant threshold 202 float InvariantThreshold; 203 204 // Counter to track num of load & store 205 unsigned LoadAndStoreCounter = 0; 206 207 // Counter to track num of invariant 208 unsigned InvariantCounter = 0; 209 210 // Read only loop marker. 211 bool IsReadOnlyLoop = true; 212 213 // OptimizationRemarkEmitter 214 OptimizationRemarkEmitter *ORE; 215 216 bool isLegalForVersioning(); 217 bool legalLoopStructure(); 218 bool legalLoopInstructions(); 219 bool legalLoopMemoryAccesses(); 220 bool isLoopAlreadyVisited(); 221 void setNoAliasToLoop(Loop *VerLoop); 222 bool instructionSafeForVersioning(Instruction *I); 223 }; 224 225 } // end anonymous namespace 226 227 /// Check loop structure and confirms it's good for LoopVersioningLICM. 228 bool LoopVersioningLICM::legalLoopStructure() { 229 // Loop must be in loop simplify form. 230 if (!CurLoop->isLoopSimplifyForm()) { 231 LLVM_DEBUG(dbgs() << " loop is not in loop-simplify form.\n"); 232 return false; 233 } 234 // Loop should be innermost loop, if not return false. 235 if (!CurLoop->getSubLoops().empty()) { 236 LLVM_DEBUG(dbgs() << " loop is not innermost\n"); 237 return false; 238 } 239 // Loop should have a single backedge, if not return false. 240 if (CurLoop->getNumBackEdges() != 1) { 241 LLVM_DEBUG(dbgs() << " loop has multiple backedges\n"); 242 return false; 243 } 244 // Loop must have a single exiting block, if not return false. 245 if (!CurLoop->getExitingBlock()) { 246 LLVM_DEBUG(dbgs() << " loop has multiple exiting block\n"); 247 return false; 248 } 249 // We only handle bottom-tested loop, i.e. loop in which the condition is 250 // checked at the end of each iteration. With that we can assume that all 251 // instructions in the loop are executed the same number of times. 252 if (CurLoop->getExitingBlock() != CurLoop->getLoopLatch()) { 253 LLVM_DEBUG(dbgs() << " loop is not bottom tested\n"); 254 return false; 255 } 256 // Parallel loops must not have aliasing loop-invariant memory accesses. 257 // Hence we don't need to version anything in this case. 258 if (CurLoop->isAnnotatedParallel()) { 259 LLVM_DEBUG(dbgs() << " Parallel loop is not worth versioning\n"); 260 return false; 261 } 262 // Loop depth more then LoopDepthThreshold are not allowed 263 if (CurLoop->getLoopDepth() > LoopDepthThreshold) { 264 LLVM_DEBUG(dbgs() << " loop depth is more then threshold\n"); 265 return false; 266 } 267 // We need to be able to compute the loop trip count in order 268 // to generate the bound checks. 269 const SCEV *ExitCount = SE->getBackedgeTakenCount(CurLoop); 270 if (isa<SCEVCouldNotCompute>(ExitCount)) { 271 LLVM_DEBUG(dbgs() << " loop does not has trip count\n"); 272 return false; 273 } 274 return true; 275 } 276 277 /// Check memory accesses in loop and confirms it's good for 278 /// LoopVersioningLICM. 279 bool LoopVersioningLICM::legalLoopMemoryAccesses() { 280 bool HasMayAlias = false; 281 bool TypeSafety = false; 282 bool HasMod = false; 283 // Memory check: 284 // Transform phase will generate a versioned loop and also a runtime check to 285 // ensure the pointers are independent and they don’t alias. 286 // In version variant of loop, alias meta data asserts that all access are 287 // mutually independent. 288 // 289 // Pointers aliasing in alias domain are avoided because with multiple 290 // aliasing domains we may not be able to hoist potential loop invariant 291 // access out of the loop. 292 // 293 // Iterate over alias tracker sets, and confirm AliasSets doesn't have any 294 // must alias set. 295 for (const auto &I : *CurAST) { 296 const AliasSet &AS = I; 297 // Skip Forward Alias Sets, as this should be ignored as part of 298 // the AliasSetTracker object. 299 if (AS.isForwardingAliasSet()) 300 continue; 301 // With MustAlias its not worth adding runtime bound check. 302 if (AS.isMustAlias()) 303 return false; 304 Value *SomePtr = AS.begin()->getValue(); 305 bool TypeCheck = true; 306 // Check for Mod & MayAlias 307 HasMayAlias |= AS.isMayAlias(); 308 HasMod |= AS.isMod(); 309 for (const auto &A : AS) { 310 Value *Ptr = A.getValue(); 311 // Alias tracker should have pointers of same data type. 312 TypeCheck = (TypeCheck && (SomePtr->getType() == Ptr->getType())); 313 } 314 // At least one alias tracker should have pointers of same data type. 315 TypeSafety |= TypeCheck; 316 } 317 // Ensure types should be of same type. 318 if (!TypeSafety) { 319 LLVM_DEBUG(dbgs() << " Alias tracker type safety failed!\n"); 320 return false; 321 } 322 // Ensure loop body shouldn't be read only. 323 if (!HasMod) { 324 LLVM_DEBUG(dbgs() << " No memory modified in loop body\n"); 325 return false; 326 } 327 // Make sure alias set has may alias case. 328 // If there no alias memory ambiguity, return false. 329 if (!HasMayAlias) { 330 LLVM_DEBUG(dbgs() << " No ambiguity in memory access.\n"); 331 return false; 332 } 333 return true; 334 } 335 336 /// Check loop instructions safe for Loop versioning. 337 /// It returns true if it's safe else returns false. 338 /// Consider following: 339 /// 1) Check all load store in loop body are non atomic & non volatile. 340 /// 2) Check function call safety, by ensuring its not accessing memory. 341 /// 3) Loop body shouldn't have any may throw instruction. 342 /// 4) Loop body shouldn't have any convergent or noduplicate instructions. 343 bool LoopVersioningLICM::instructionSafeForVersioning(Instruction *I) { 344 assert(I != nullptr && "Null instruction found!"); 345 // Check function call safety 346 if (auto *Call = dyn_cast<CallBase>(I)) { 347 if (Call->isConvergent() || Call->cannotDuplicate()) { 348 LLVM_DEBUG(dbgs() << " Convergent call site found.\n"); 349 return false; 350 } 351 352 if (!AA->doesNotAccessMemory(Call)) { 353 LLVM_DEBUG(dbgs() << " Unsafe call site found.\n"); 354 return false; 355 } 356 } 357 358 // Avoid loops with possiblity of throw 359 if (I->mayThrow()) { 360 LLVM_DEBUG(dbgs() << " May throw instruction found in loop body\n"); 361 return false; 362 } 363 // If current instruction is load instructions 364 // make sure it's a simple load (non atomic & non volatile) 365 if (I->mayReadFromMemory()) { 366 LoadInst *Ld = dyn_cast<LoadInst>(I); 367 if (!Ld || !Ld->isSimple()) { 368 LLVM_DEBUG(dbgs() << " Found a non-simple load.\n"); 369 return false; 370 } 371 LoadAndStoreCounter++; 372 Value *Ptr = Ld->getPointerOperand(); 373 // Check loop invariant. 374 if (SE->isLoopInvariant(SE->getSCEV(Ptr), CurLoop)) 375 InvariantCounter++; 376 } 377 // If current instruction is store instruction 378 // make sure it's a simple store (non atomic & non volatile) 379 else if (I->mayWriteToMemory()) { 380 StoreInst *St = dyn_cast<StoreInst>(I); 381 if (!St || !St->isSimple()) { 382 LLVM_DEBUG(dbgs() << " Found a non-simple store.\n"); 383 return false; 384 } 385 LoadAndStoreCounter++; 386 Value *Ptr = St->getPointerOperand(); 387 // Check loop invariant. 388 if (SE->isLoopInvariant(SE->getSCEV(Ptr), CurLoop)) 389 InvariantCounter++; 390 391 IsReadOnlyLoop = false; 392 } 393 return true; 394 } 395 396 /// Check loop instructions and confirms it's good for 397 /// LoopVersioningLICM. 398 bool LoopVersioningLICM::legalLoopInstructions() { 399 // Resetting counters. 400 LoadAndStoreCounter = 0; 401 InvariantCounter = 0; 402 IsReadOnlyLoop = true; 403 using namespace ore; 404 // Iterate over loop blocks and instructions of each block and check 405 // instruction safety. 406 for (auto *Block : CurLoop->getBlocks()) 407 for (auto &Inst : *Block) { 408 // If instruction is unsafe just return false. 409 if (!instructionSafeForVersioning(&Inst)) { 410 ORE->emit([&]() { 411 return OptimizationRemarkMissed(DEBUG_TYPE, "IllegalLoopInst", &Inst) 412 << " Unsafe Loop Instruction"; 413 }); 414 return false; 415 } 416 } 417 // Get LoopAccessInfo from current loop via the proxy. 418 LAI = &GetLAI(CurLoop); 419 // Check LoopAccessInfo for need of runtime check. 420 if (LAI->getRuntimePointerChecking()->getChecks().empty()) { 421 LLVM_DEBUG(dbgs() << " LAA: Runtime check not found !!\n"); 422 return false; 423 } 424 // Number of runtime-checks should be less then RuntimeMemoryCheckThreshold 425 if (LAI->getNumRuntimePointerChecks() > 426 VectorizerParams::RuntimeMemoryCheckThreshold) { 427 LLVM_DEBUG( 428 dbgs() << " LAA: Runtime checks are more than threshold !!\n"); 429 ORE->emit([&]() { 430 return OptimizationRemarkMissed(DEBUG_TYPE, "RuntimeCheck", 431 CurLoop->getStartLoc(), 432 CurLoop->getHeader()) 433 << "Number of runtime checks " 434 << NV("RuntimeChecks", LAI->getNumRuntimePointerChecks()) 435 << " exceeds threshold " 436 << NV("Threshold", VectorizerParams::RuntimeMemoryCheckThreshold); 437 }); 438 return false; 439 } 440 // Loop should have at least one invariant load or store instruction. 441 if (!InvariantCounter) { 442 LLVM_DEBUG(dbgs() << " Invariant not found !!\n"); 443 return false; 444 } 445 // Read only loop not allowed. 446 if (IsReadOnlyLoop) { 447 LLVM_DEBUG(dbgs() << " Found a read-only loop!\n"); 448 return false; 449 } 450 // Profitablity check: 451 // Check invariant threshold, should be in limit. 452 if (InvariantCounter * 100 < InvariantThreshold * LoadAndStoreCounter) { 453 LLVM_DEBUG( 454 dbgs() 455 << " Invariant load & store are less then defined threshold\n"); 456 LLVM_DEBUG(dbgs() << " Invariant loads & stores: " 457 << ((InvariantCounter * 100) / LoadAndStoreCounter) 458 << "%\n"); 459 LLVM_DEBUG(dbgs() << " Invariant loads & store threshold: " 460 << InvariantThreshold << "%\n"); 461 ORE->emit([&]() { 462 return OptimizationRemarkMissed(DEBUG_TYPE, "InvariantThreshold", 463 CurLoop->getStartLoc(), 464 CurLoop->getHeader()) 465 << "Invariant load & store " 466 << NV("LoadAndStoreCounter", 467 ((InvariantCounter * 100) / LoadAndStoreCounter)) 468 << " are less then defined threshold " 469 << NV("Threshold", InvariantThreshold); 470 }); 471 return false; 472 } 473 return true; 474 } 475 476 /// It checks loop is already visited or not. 477 /// check loop meta data, if loop revisited return true 478 /// else false. 479 bool LoopVersioningLICM::isLoopAlreadyVisited() { 480 // Check LoopVersioningLICM metadata into loop 481 if (findStringMetadataForLoop(CurLoop, LICMVersioningMetaData)) { 482 return true; 483 } 484 return false; 485 } 486 487 /// Checks legality for LoopVersioningLICM by considering following: 488 /// a) loop structure legality b) loop instruction legality 489 /// c) loop memory access legality. 490 /// Return true if legal else returns false. 491 bool LoopVersioningLICM::isLegalForVersioning() { 492 using namespace ore; 493 LLVM_DEBUG(dbgs() << "Loop: " << *CurLoop); 494 // Make sure not re-visiting same loop again. 495 if (isLoopAlreadyVisited()) { 496 LLVM_DEBUG( 497 dbgs() << " Revisiting loop in LoopVersioningLICM not allowed.\n\n"); 498 return false; 499 } 500 // Check loop structure leagality. 501 if (!legalLoopStructure()) { 502 LLVM_DEBUG( 503 dbgs() << " Loop structure not suitable for LoopVersioningLICM\n\n"); 504 ORE->emit([&]() { 505 return OptimizationRemarkMissed(DEBUG_TYPE, "IllegalLoopStruct", 506 CurLoop->getStartLoc(), 507 CurLoop->getHeader()) 508 << " Unsafe Loop structure"; 509 }); 510 return false; 511 } 512 // Check loop instruction leagality. 513 if (!legalLoopInstructions()) { 514 LLVM_DEBUG( 515 dbgs() 516 << " Loop instructions not suitable for LoopVersioningLICM\n\n"); 517 return false; 518 } 519 // Check loop memory access leagality. 520 if (!legalLoopMemoryAccesses()) { 521 LLVM_DEBUG( 522 dbgs() 523 << " Loop memory access not suitable for LoopVersioningLICM\n\n"); 524 ORE->emit([&]() { 525 return OptimizationRemarkMissed(DEBUG_TYPE, "IllegalLoopMemoryAccess", 526 CurLoop->getStartLoc(), 527 CurLoop->getHeader()) 528 << " Unsafe Loop memory access"; 529 }); 530 return false; 531 } 532 // Loop versioning is feasible, return true. 533 LLVM_DEBUG(dbgs() << " Loop Versioning found to be beneficial\n\n"); 534 ORE->emit([&]() { 535 return OptimizationRemark(DEBUG_TYPE, "IsLegalForVersioning", 536 CurLoop->getStartLoc(), CurLoop->getHeader()) 537 << " Versioned loop for LICM." 538 << " Number of runtime checks we had to insert " 539 << NV("RuntimeChecks", LAI->getNumRuntimePointerChecks()); 540 }); 541 return true; 542 } 543 544 /// Update loop with aggressive aliasing assumptions. 545 /// It marks no-alias to any pairs of memory operations by assuming 546 /// loop should not have any must-alias memory accesses pairs. 547 /// During LoopVersioningLICM legality we ignore loops having must 548 /// aliasing memory accesses. 549 void LoopVersioningLICM::setNoAliasToLoop(Loop *VerLoop) { 550 // Get latch terminator instruction. 551 Instruction *I = VerLoop->getLoopLatch()->getTerminator(); 552 // Create alias scope domain. 553 MDBuilder MDB(I->getContext()); 554 MDNode *NewDomain = MDB.createAnonymousAliasScopeDomain("LVDomain"); 555 StringRef Name = "LVAliasScope"; 556 MDNode *NewScope = MDB.createAnonymousAliasScope(NewDomain, Name); 557 SmallVector<Metadata *, 4> Scopes{NewScope}, NoAliases{NewScope}; 558 // Iterate over each instruction of loop. 559 // set no-alias for all load & store instructions. 560 for (auto *Block : CurLoop->getBlocks()) { 561 for (auto &Inst : *Block) { 562 // Only interested in instruction that may modify or read memory. 563 if (!Inst.mayReadFromMemory() && !Inst.mayWriteToMemory()) 564 continue; 565 // Set no-alias for current instruction. 566 Inst.setMetadata( 567 LLVMContext::MD_noalias, 568 MDNode::concatenate(Inst.getMetadata(LLVMContext::MD_noalias), 569 MDNode::get(Inst.getContext(), NoAliases))); 570 // set alias-scope for current instruction. 571 Inst.setMetadata( 572 LLVMContext::MD_alias_scope, 573 MDNode::concatenate(Inst.getMetadata(LLVMContext::MD_alias_scope), 574 MDNode::get(Inst.getContext(), Scopes))); 575 } 576 } 577 } 578 579 bool LoopVersioningLICMLegacyPass::runOnLoop(Loop *L, LPPassManager &LPM) { 580 if (skipLoop(L)) 581 return false; 582 583 AliasAnalysis *AA = &getAnalysis<AAResultsWrapperPass>().getAAResults(); 584 ScalarEvolution *SE = &getAnalysis<ScalarEvolutionWrapperPass>().getSE(); 585 OptimizationRemarkEmitter *ORE = 586 &getAnalysis<OptimizationRemarkEmitterWrapperPass>().getORE(); 587 LoopInfo *LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo(); 588 DominatorTree *DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree(); 589 590 auto GetLAI = [&](Loop *L) -> const LoopAccessInfo & { 591 return getAnalysis<LoopAccessLegacyAnalysis>().getInfo(L); 592 }; 593 594 return LoopVersioningLICM(AA, SE, ORE, GetLAI).runOnLoop(L, LI, DT); 595 } 596 597 bool LoopVersioningLICM::runOnLoop(Loop *L, LoopInfo *LI, DominatorTree *DT) { 598 // This will automatically release all resources hold by the current 599 // LoopVersioningLICM object. 600 AutoResetter Resetter(*this); 601 602 // Do not do the transformation if disabled by metadata. 603 if (hasLICMVersioningTransformation(L) & TM_Disable) 604 return false; 605 606 // Set Current Loop 607 CurLoop = L; 608 CurAST.reset(new AliasSetTracker(*AA)); 609 610 // Loop over the body of this loop, construct AST. 611 for (auto *Block : L->getBlocks()) { 612 if (LI->getLoopFor(Block) == L) // Ignore blocks in subloop. 613 CurAST->add(*Block); // Incorporate the specified basic block 614 } 615 616 bool Changed = false; 617 618 // Check feasiblity of LoopVersioningLICM. 619 // If versioning found to be feasible and beneficial then proceed 620 // else simply return, by cleaning up memory. 621 if (isLegalForVersioning()) { 622 // Do loop versioning. 623 // Create memcheck for memory accessed inside loop. 624 // Clone original loop, and set blocks properly. 625 LoopVersioning LVer(*LAI, LAI->getRuntimePointerChecking()->getChecks(), 626 CurLoop, LI, DT, SE); 627 LVer.versionLoop(); 628 // Set Loop Versioning metaData for original loop. 629 addStringMetadataToLoop(LVer.getNonVersionedLoop(), LICMVersioningMetaData); 630 // Set Loop Versioning metaData for version loop. 631 addStringMetadataToLoop(LVer.getVersionedLoop(), LICMVersioningMetaData); 632 // Set "llvm.mem.parallel_loop_access" metaData to versioned loop. 633 // FIXME: "llvm.mem.parallel_loop_access" annotates memory access 634 // instructions, not loops. 635 addStringMetadataToLoop(LVer.getVersionedLoop(), 636 "llvm.mem.parallel_loop_access"); 637 // Update version loop with aggressive aliasing assumption. 638 setNoAliasToLoop(LVer.getVersionedLoop()); 639 Changed = true; 640 } 641 return Changed; 642 } 643 644 char LoopVersioningLICMLegacyPass::ID = 0; 645 646 INITIALIZE_PASS_BEGIN(LoopVersioningLICMLegacyPass, "loop-versioning-licm", 647 "Loop Versioning For LICM", false, false) 648 INITIALIZE_PASS_DEPENDENCY(AAResultsWrapperPass) 649 INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass) 650 INITIALIZE_PASS_DEPENDENCY(GlobalsAAWrapperPass) 651 INITIALIZE_PASS_DEPENDENCY(LCSSAWrapperPass) 652 INITIALIZE_PASS_DEPENDENCY(LoopAccessLegacyAnalysis) 653 INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass) 654 INITIALIZE_PASS_DEPENDENCY(LoopSimplify) 655 INITIALIZE_PASS_DEPENDENCY(ScalarEvolutionWrapperPass) 656 INITIALIZE_PASS_DEPENDENCY(OptimizationRemarkEmitterWrapperPass) 657 INITIALIZE_PASS_END(LoopVersioningLICMLegacyPass, "loop-versioning-licm", 658 "Loop Versioning For LICM", false, false) 659 660 Pass *llvm::createLoopVersioningLICMPass() { 661 return new LoopVersioningLICMLegacyPass(); 662 } 663 664 namespace llvm { 665 666 PreservedAnalyses LoopVersioningLICMPass::run(Loop &L, LoopAnalysisManager &AM, 667 LoopStandardAnalysisResults &LAR, 668 LPMUpdater &U) { 669 AliasAnalysis *AA = &LAR.AA; 670 ScalarEvolution *SE = &LAR.SE; 671 DominatorTree *DT = &LAR.DT; 672 LoopInfo *LI = &LAR.LI; 673 const Function *F = L.getHeader()->getParent(); 674 OptimizationRemarkEmitter ORE(F); 675 676 auto GetLAI = [&](Loop *L) -> const LoopAccessInfo & { 677 return AM.getResult<LoopAccessAnalysis>(*L, LAR); 678 }; 679 680 if (!LoopVersioningLICM(AA, SE, &ORE, GetLAI).runOnLoop(&L, LI, DT)) 681 return PreservedAnalyses::all(); 682 return getLoopPassPreservedAnalyses(); 683 } 684 } // namespace llvm 685