10b57cec5SDimitry Andric //===- BranchProbabilityInfo.cpp - Branch Probability Analysis ------------===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric // 90b57cec5SDimitry Andric // Loops should be simplified before this analysis. 100b57cec5SDimitry Andric // 110b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 120b57cec5SDimitry Andric 130b57cec5SDimitry Andric #include "llvm/Analysis/BranchProbabilityInfo.h" 140b57cec5SDimitry Andric #include "llvm/ADT/PostOrderIterator.h" 150b57cec5SDimitry Andric #include "llvm/ADT/SCCIterator.h" 160b57cec5SDimitry Andric #include "llvm/ADT/STLExtras.h" 170b57cec5SDimitry Andric #include "llvm/ADT/SmallVector.h" 180b57cec5SDimitry Andric #include "llvm/Analysis/LoopInfo.h" 19480093f4SDimitry Andric #include "llvm/Analysis/PostDominators.h" 200b57cec5SDimitry Andric #include "llvm/Analysis/TargetLibraryInfo.h" 210b57cec5SDimitry Andric #include "llvm/IR/Attributes.h" 220b57cec5SDimitry Andric #include "llvm/IR/BasicBlock.h" 230b57cec5SDimitry Andric #include "llvm/IR/CFG.h" 240b57cec5SDimitry Andric #include "llvm/IR/Constants.h" 250b57cec5SDimitry Andric #include "llvm/IR/Dominators.h" 260b57cec5SDimitry Andric #include "llvm/IR/Function.h" 270b57cec5SDimitry Andric #include "llvm/IR/InstrTypes.h" 280b57cec5SDimitry Andric #include "llvm/IR/Instruction.h" 290b57cec5SDimitry Andric #include "llvm/IR/Instructions.h" 300b57cec5SDimitry Andric #include "llvm/IR/LLVMContext.h" 310b57cec5SDimitry Andric #include "llvm/IR/Metadata.h" 320b57cec5SDimitry Andric #include "llvm/IR/PassManager.h" 330b57cec5SDimitry Andric #include "llvm/IR/Type.h" 340b57cec5SDimitry Andric #include "llvm/IR/Value.h" 35480093f4SDimitry Andric #include "llvm/InitializePasses.h" 360b57cec5SDimitry Andric #include "llvm/Pass.h" 370b57cec5SDimitry Andric #include "llvm/Support/BranchProbability.h" 380b57cec5SDimitry Andric #include "llvm/Support/Casting.h" 39480093f4SDimitry Andric #include "llvm/Support/CommandLine.h" 400b57cec5SDimitry Andric #include "llvm/Support/Debug.h" 410b57cec5SDimitry Andric #include "llvm/Support/raw_ostream.h" 420b57cec5SDimitry Andric #include <cassert> 430b57cec5SDimitry Andric #include <cstdint> 440b57cec5SDimitry Andric #include <iterator> 4504eeddc0SDimitry Andric #include <map> 460b57cec5SDimitry Andric #include <utility> 470b57cec5SDimitry Andric 480b57cec5SDimitry Andric using namespace llvm; 490b57cec5SDimitry Andric 500b57cec5SDimitry Andric #define DEBUG_TYPE "branch-prob" 510b57cec5SDimitry Andric 520b57cec5SDimitry Andric static cl::opt<bool> PrintBranchProb( 530b57cec5SDimitry Andric "print-bpi", cl::init(false), cl::Hidden, 540b57cec5SDimitry Andric cl::desc("Print the branch probability info.")); 550b57cec5SDimitry Andric 560b57cec5SDimitry Andric cl::opt<std::string> PrintBranchProbFuncName( 570b57cec5SDimitry Andric "print-bpi-func-name", cl::Hidden, 580b57cec5SDimitry Andric cl::desc("The option to specify the name of the function " 590b57cec5SDimitry Andric "whose branch probability info is printed.")); 600b57cec5SDimitry Andric 610b57cec5SDimitry Andric INITIALIZE_PASS_BEGIN(BranchProbabilityInfoWrapperPass, "branch-prob", 620b57cec5SDimitry Andric "Branch Probability Analysis", false, true) 630b57cec5SDimitry Andric INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass) 640b57cec5SDimitry Andric INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfoWrapperPass) 65e8d8bef9SDimitry Andric INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass) 665ffd83dbSDimitry Andric INITIALIZE_PASS_DEPENDENCY(PostDominatorTreeWrapperPass) 670b57cec5SDimitry Andric INITIALIZE_PASS_END(BranchProbabilityInfoWrapperPass, "branch-prob", 680b57cec5SDimitry Andric "Branch Probability Analysis", false, true) 690b57cec5SDimitry Andric 70480093f4SDimitry Andric BranchProbabilityInfoWrapperPass::BranchProbabilityInfoWrapperPass() 71480093f4SDimitry Andric : FunctionPass(ID) { 72480093f4SDimitry Andric initializeBranchProbabilityInfoWrapperPassPass( 73480093f4SDimitry Andric *PassRegistry::getPassRegistry()); 74480093f4SDimitry Andric } 75480093f4SDimitry Andric 760b57cec5SDimitry Andric char BranchProbabilityInfoWrapperPass::ID = 0; 770b57cec5SDimitry Andric 780b57cec5SDimitry Andric // Weights are for internal use only. They are used by heuristics to help to 790b57cec5SDimitry Andric // estimate edges' probability. Example: 800b57cec5SDimitry Andric // 810b57cec5SDimitry Andric // Using "Loop Branch Heuristics" we predict weights of edges for the 820b57cec5SDimitry Andric // block BB2. 830b57cec5SDimitry Andric // ... 840b57cec5SDimitry Andric // | 850b57cec5SDimitry Andric // V 860b57cec5SDimitry Andric // BB1<-+ 870b57cec5SDimitry Andric // | | 880b57cec5SDimitry Andric // | | (Weight = 124) 890b57cec5SDimitry Andric // V | 900b57cec5SDimitry Andric // BB2--+ 910b57cec5SDimitry Andric // | 920b57cec5SDimitry Andric // | (Weight = 4) 930b57cec5SDimitry Andric // V 940b57cec5SDimitry Andric // BB3 950b57cec5SDimitry Andric // 960b57cec5SDimitry Andric // Probability of the edge BB2->BB1 = 124 / (124 + 4) = 0.96875 970b57cec5SDimitry Andric // Probability of the edge BB2->BB3 = 4 / (124 + 4) = 0.03125 980b57cec5SDimitry Andric static const uint32_t LBH_TAKEN_WEIGHT = 124; 990b57cec5SDimitry Andric static const uint32_t LBH_NONTAKEN_WEIGHT = 4; 1000b57cec5SDimitry Andric 1010b57cec5SDimitry Andric /// Unreachable-terminating branch taken probability. 1020b57cec5SDimitry Andric /// 1030b57cec5SDimitry Andric /// This is the probability for a branch being taken to a block that terminates 1040b57cec5SDimitry Andric /// (eventually) in unreachable. These are predicted as unlikely as possible. 1055ffd83dbSDimitry Andric /// All reachable probability will proportionally share the remaining part. 1060b57cec5SDimitry Andric static const BranchProbability UR_TAKEN_PROB = BranchProbability::getRaw(1); 1070b57cec5SDimitry Andric 1084824e7fdSDimitry Andric /// Heuristics and lookup tables for non-loop branches: 1094824e7fdSDimitry Andric /// Pointer Heuristics (PH) 1100b57cec5SDimitry Andric static const uint32_t PH_TAKEN_WEIGHT = 20; 1110b57cec5SDimitry Andric static const uint32_t PH_NONTAKEN_WEIGHT = 12; 1124824e7fdSDimitry Andric static const BranchProbability 1134824e7fdSDimitry Andric PtrTakenProb(PH_TAKEN_WEIGHT, PH_TAKEN_WEIGHT + PH_NONTAKEN_WEIGHT); 1144824e7fdSDimitry Andric static const BranchProbability 1154824e7fdSDimitry Andric PtrUntakenProb(PH_NONTAKEN_WEIGHT, PH_TAKEN_WEIGHT + PH_NONTAKEN_WEIGHT); 1160b57cec5SDimitry Andric 1174824e7fdSDimitry Andric using ProbabilityList = SmallVector<BranchProbability>; 1184824e7fdSDimitry Andric using ProbabilityTable = std::map<CmpInst::Predicate, ProbabilityList>; 1194824e7fdSDimitry Andric 1204824e7fdSDimitry Andric /// Pointer comparisons: 1214824e7fdSDimitry Andric static const ProbabilityTable PointerTable{ 1224824e7fdSDimitry Andric {ICmpInst::ICMP_NE, {PtrTakenProb, PtrUntakenProb}}, /// p != q -> Likely 1234824e7fdSDimitry Andric {ICmpInst::ICMP_EQ, {PtrUntakenProb, PtrTakenProb}}, /// p == q -> Unlikely 1244824e7fdSDimitry Andric }; 1254824e7fdSDimitry Andric 1264824e7fdSDimitry Andric /// Zero Heuristics (ZH) 1270b57cec5SDimitry Andric static const uint32_t ZH_TAKEN_WEIGHT = 20; 1280b57cec5SDimitry Andric static const uint32_t ZH_NONTAKEN_WEIGHT = 12; 1294824e7fdSDimitry Andric static const BranchProbability 1304824e7fdSDimitry Andric ZeroTakenProb(ZH_TAKEN_WEIGHT, ZH_TAKEN_WEIGHT + ZH_NONTAKEN_WEIGHT); 1314824e7fdSDimitry Andric static const BranchProbability 1324824e7fdSDimitry Andric ZeroUntakenProb(ZH_NONTAKEN_WEIGHT, ZH_TAKEN_WEIGHT + ZH_NONTAKEN_WEIGHT); 1330b57cec5SDimitry Andric 1344824e7fdSDimitry Andric /// Integer compares with 0: 1354824e7fdSDimitry Andric static const ProbabilityTable ICmpWithZeroTable{ 1364824e7fdSDimitry Andric {CmpInst::ICMP_EQ, {ZeroUntakenProb, ZeroTakenProb}}, /// X == 0 -> Unlikely 1374824e7fdSDimitry Andric {CmpInst::ICMP_NE, {ZeroTakenProb, ZeroUntakenProb}}, /// X != 0 -> Likely 1384824e7fdSDimitry Andric {CmpInst::ICMP_SLT, {ZeroUntakenProb, ZeroTakenProb}}, /// X < 0 -> Unlikely 1394824e7fdSDimitry Andric {CmpInst::ICMP_SGT, {ZeroTakenProb, ZeroUntakenProb}}, /// X > 0 -> Likely 1404824e7fdSDimitry Andric }; 1414824e7fdSDimitry Andric 1424824e7fdSDimitry Andric /// Integer compares with -1: 1434824e7fdSDimitry Andric static const ProbabilityTable ICmpWithMinusOneTable{ 1444824e7fdSDimitry Andric {CmpInst::ICMP_EQ, {ZeroUntakenProb, ZeroTakenProb}}, /// X == -1 -> Unlikely 1454824e7fdSDimitry Andric {CmpInst::ICMP_NE, {ZeroTakenProb, ZeroUntakenProb}}, /// X != -1 -> Likely 1464824e7fdSDimitry Andric // InstCombine canonicalizes X >= 0 into X > -1 1474824e7fdSDimitry Andric {CmpInst::ICMP_SGT, {ZeroTakenProb, ZeroUntakenProb}}, /// X >= 0 -> Likely 1484824e7fdSDimitry Andric }; 1494824e7fdSDimitry Andric 1504824e7fdSDimitry Andric /// Integer compares with 1: 1514824e7fdSDimitry Andric static const ProbabilityTable ICmpWithOneTable{ 1524824e7fdSDimitry Andric // InstCombine canonicalizes X <= 0 into X < 1 1534824e7fdSDimitry Andric {CmpInst::ICMP_SLT, {ZeroUntakenProb, ZeroTakenProb}}, /// X <= 0 -> Unlikely 1544824e7fdSDimitry Andric }; 1554824e7fdSDimitry Andric 1564824e7fdSDimitry Andric /// strcmp and similar functions return zero, negative, or positive, if the 1574824e7fdSDimitry Andric /// first string is equal, less, or greater than the second. We consider it 1584824e7fdSDimitry Andric /// likely that the strings are not equal, so a comparison with zero is 1594824e7fdSDimitry Andric /// probably false, but also a comparison with any other number is also 1604824e7fdSDimitry Andric /// probably false given that what exactly is returned for nonzero values is 1614824e7fdSDimitry Andric /// not specified. Any kind of comparison other than equality we know 1624824e7fdSDimitry Andric /// nothing about. 1634824e7fdSDimitry Andric static const ProbabilityTable ICmpWithLibCallTable{ 1644824e7fdSDimitry Andric {CmpInst::ICMP_EQ, {ZeroUntakenProb, ZeroTakenProb}}, 1654824e7fdSDimitry Andric {CmpInst::ICMP_NE, {ZeroTakenProb, ZeroUntakenProb}}, 1664824e7fdSDimitry Andric }; 1674824e7fdSDimitry Andric 1684824e7fdSDimitry Andric // Floating-Point Heuristics (FPH) 1690b57cec5SDimitry Andric static const uint32_t FPH_TAKEN_WEIGHT = 20; 1700b57cec5SDimitry Andric static const uint32_t FPH_NONTAKEN_WEIGHT = 12; 1710b57cec5SDimitry Andric 1728bcb0991SDimitry Andric /// This is the probability for an ordered floating point comparison. 1738bcb0991SDimitry Andric static const uint32_t FPH_ORD_WEIGHT = 1024 * 1024 - 1; 1748bcb0991SDimitry Andric /// This is the probability for an unordered floating point comparison, it means 1758bcb0991SDimitry Andric /// one or two of the operands are NaN. Usually it is used to test for an 1768bcb0991SDimitry Andric /// exceptional case, so the result is unlikely. 1778bcb0991SDimitry Andric static const uint32_t FPH_UNO_WEIGHT = 1; 1788bcb0991SDimitry Andric 1794824e7fdSDimitry Andric static const BranchProbability FPOrdTakenProb(FPH_ORD_WEIGHT, 1804824e7fdSDimitry Andric FPH_ORD_WEIGHT + FPH_UNO_WEIGHT); 1814824e7fdSDimitry Andric static const BranchProbability 1824824e7fdSDimitry Andric FPOrdUntakenProb(FPH_UNO_WEIGHT, FPH_ORD_WEIGHT + FPH_UNO_WEIGHT); 1834824e7fdSDimitry Andric static const BranchProbability 1844824e7fdSDimitry Andric FPTakenProb(FPH_TAKEN_WEIGHT, FPH_TAKEN_WEIGHT + FPH_NONTAKEN_WEIGHT); 1854824e7fdSDimitry Andric static const BranchProbability 1864824e7fdSDimitry Andric FPUntakenProb(FPH_NONTAKEN_WEIGHT, FPH_TAKEN_WEIGHT + FPH_NONTAKEN_WEIGHT); 1874824e7fdSDimitry Andric 1884824e7fdSDimitry Andric /// Floating-Point compares: 1894824e7fdSDimitry Andric static const ProbabilityTable FCmpTable{ 1904824e7fdSDimitry Andric {FCmpInst::FCMP_ORD, {FPOrdTakenProb, FPOrdUntakenProb}}, /// !isnan -> Likely 1914824e7fdSDimitry Andric {FCmpInst::FCMP_UNO, {FPOrdUntakenProb, FPOrdTakenProb}}, /// isnan -> Unlikely 1924824e7fdSDimitry Andric }; 1934824e7fdSDimitry Andric 194e8d8bef9SDimitry Andric /// Set of dedicated "absolute" execution weights for a block. These weights are 195e8d8bef9SDimitry Andric /// meaningful relative to each other and their derivatives only. 196e8d8bef9SDimitry Andric enum class BlockExecWeight : std::uint32_t { 197e8d8bef9SDimitry Andric /// Special weight used for cases with exact zero probability. 198e8d8bef9SDimitry Andric ZERO = 0x0, 199e8d8bef9SDimitry Andric /// Minimal possible non zero weight. 200e8d8bef9SDimitry Andric LOWEST_NON_ZERO = 0x1, 201e8d8bef9SDimitry Andric /// Weight to an 'unreachable' block. 202e8d8bef9SDimitry Andric UNREACHABLE = ZERO, 203e8d8bef9SDimitry Andric /// Weight to a block containing non returning call. 204e8d8bef9SDimitry Andric NORETURN = LOWEST_NON_ZERO, 205e8d8bef9SDimitry Andric /// Weight to 'unwind' block of an invoke instruction. 206e8d8bef9SDimitry Andric UNWIND = LOWEST_NON_ZERO, 207e8d8bef9SDimitry Andric /// Weight to a 'cold' block. Cold blocks are the ones containing calls marked 208e8d8bef9SDimitry Andric /// with attribute 'cold'. 209e8d8bef9SDimitry Andric COLD = 0xffff, 210e8d8bef9SDimitry Andric /// Default weight is used in cases when there is no dedicated execution 211e8d8bef9SDimitry Andric /// weight set. It is not propagated through the domination line either. 212e8d8bef9SDimitry Andric DEFAULT = 0xfffff 213e8d8bef9SDimitry Andric }; 2140b57cec5SDimitry Andric 215e8d8bef9SDimitry Andric BranchProbabilityInfo::SccInfo::SccInfo(const Function &F) { 216e8d8bef9SDimitry Andric // Record SCC numbers of blocks in the CFG to identify irreducible loops. 217e8d8bef9SDimitry Andric // FIXME: We could only calculate this if the CFG is known to be irreducible 218e8d8bef9SDimitry Andric // (perhaps cache this info in LoopInfo if we can easily calculate it there?). 219e8d8bef9SDimitry Andric int SccNum = 0; 220e8d8bef9SDimitry Andric for (scc_iterator<const Function *> It = scc_begin(&F); !It.isAtEnd(); 221e8d8bef9SDimitry Andric ++It, ++SccNum) { 222e8d8bef9SDimitry Andric // Ignore single-block SCCs since they either aren't loops or LoopInfo will 223e8d8bef9SDimitry Andric // catch them. 224e8d8bef9SDimitry Andric const std::vector<const BasicBlock *> &Scc = *It; 225e8d8bef9SDimitry Andric if (Scc.size() == 1) 226480093f4SDimitry Andric continue; 227e8d8bef9SDimitry Andric 228e8d8bef9SDimitry Andric LLVM_DEBUG(dbgs() << "BPI: SCC " << SccNum << ":"); 229e8d8bef9SDimitry Andric for (const auto *BB : Scc) { 230e8d8bef9SDimitry Andric LLVM_DEBUG(dbgs() << " " << BB->getName()); 231e8d8bef9SDimitry Andric SccNums[BB] = SccNum; 232e8d8bef9SDimitry Andric calculateSccBlockType(BB, SccNum); 233480093f4SDimitry Andric } 234e8d8bef9SDimitry Andric LLVM_DEBUG(dbgs() << "\n"); 235e8d8bef9SDimitry Andric } 236e8d8bef9SDimitry Andric } 237e8d8bef9SDimitry Andric 238e8d8bef9SDimitry Andric int BranchProbabilityInfo::SccInfo::getSCCNum(const BasicBlock *BB) const { 239e8d8bef9SDimitry Andric auto SccIt = SccNums.find(BB); 240e8d8bef9SDimitry Andric if (SccIt == SccNums.end()) 241e8d8bef9SDimitry Andric return -1; 242e8d8bef9SDimitry Andric return SccIt->second; 243e8d8bef9SDimitry Andric } 244e8d8bef9SDimitry Andric 245e8d8bef9SDimitry Andric void BranchProbabilityInfo::SccInfo::getSccEnterBlocks( 246e8d8bef9SDimitry Andric int SccNum, SmallVectorImpl<BasicBlock *> &Enters) const { 247e8d8bef9SDimitry Andric 248e8d8bef9SDimitry Andric for (auto MapIt : SccBlocks[SccNum]) { 249e8d8bef9SDimitry Andric const auto *BB = MapIt.first; 250e8d8bef9SDimitry Andric if (isSCCHeader(BB, SccNum)) 251e8d8bef9SDimitry Andric for (const auto *Pred : predecessors(BB)) 252e8d8bef9SDimitry Andric if (getSCCNum(Pred) != SccNum) 253e8d8bef9SDimitry Andric Enters.push_back(const_cast<BasicBlock *>(BB)); 254e8d8bef9SDimitry Andric } 255e8d8bef9SDimitry Andric } 256e8d8bef9SDimitry Andric 257e8d8bef9SDimitry Andric void BranchProbabilityInfo::SccInfo::getSccExitBlocks( 258e8d8bef9SDimitry Andric int SccNum, SmallVectorImpl<BasicBlock *> &Exits) const { 259e8d8bef9SDimitry Andric for (auto MapIt : SccBlocks[SccNum]) { 260e8d8bef9SDimitry Andric const auto *BB = MapIt.first; 261e8d8bef9SDimitry Andric if (isSCCExitingBlock(BB, SccNum)) 262e8d8bef9SDimitry Andric for (const auto *Succ : successors(BB)) 263e8d8bef9SDimitry Andric if (getSCCNum(Succ) != SccNum) 264349cc55cSDimitry Andric Exits.push_back(const_cast<BasicBlock *>(Succ)); 265e8d8bef9SDimitry Andric } 266e8d8bef9SDimitry Andric } 267e8d8bef9SDimitry Andric 268e8d8bef9SDimitry Andric uint32_t BranchProbabilityInfo::SccInfo::getSccBlockType(const BasicBlock *BB, 269e8d8bef9SDimitry Andric int SccNum) const { 270e8d8bef9SDimitry Andric assert(getSCCNum(BB) == SccNum); 271e8d8bef9SDimitry Andric 272e8d8bef9SDimitry Andric assert(SccBlocks.size() > static_cast<unsigned>(SccNum) && "Unknown SCC"); 273e8d8bef9SDimitry Andric const auto &SccBlockTypes = SccBlocks[SccNum]; 274e8d8bef9SDimitry Andric 275e8d8bef9SDimitry Andric auto It = SccBlockTypes.find(BB); 276e8d8bef9SDimitry Andric if (It != SccBlockTypes.end()) { 277e8d8bef9SDimitry Andric return It->second; 278e8d8bef9SDimitry Andric } 279e8d8bef9SDimitry Andric return Inner; 280e8d8bef9SDimitry Andric } 281e8d8bef9SDimitry Andric 282e8d8bef9SDimitry Andric void BranchProbabilityInfo::SccInfo::calculateSccBlockType(const BasicBlock *BB, 283e8d8bef9SDimitry Andric int SccNum) { 284e8d8bef9SDimitry Andric assert(getSCCNum(BB) == SccNum); 285e8d8bef9SDimitry Andric uint32_t BlockType = Inner; 286e8d8bef9SDimitry Andric 287e8d8bef9SDimitry Andric if (llvm::any_of(predecessors(BB), [&](const BasicBlock *Pred) { 288e8d8bef9SDimitry Andric // Consider any block that is an entry point to the SCC as 289e8d8bef9SDimitry Andric // a header. 290e8d8bef9SDimitry Andric return getSCCNum(Pred) != SccNum; 291480093f4SDimitry Andric })) 292e8d8bef9SDimitry Andric BlockType |= Header; 2930b57cec5SDimitry Andric 294e8d8bef9SDimitry Andric if (llvm::any_of(successors(BB), [&](const BasicBlock *Succ) { 295e8d8bef9SDimitry Andric return getSCCNum(Succ) != SccNum; 296480093f4SDimitry Andric })) 297e8d8bef9SDimitry Andric BlockType |= Exiting; 298e8d8bef9SDimitry Andric 299e8d8bef9SDimitry Andric // Lazily compute the set of headers for a given SCC and cache the results 300e8d8bef9SDimitry Andric // in the SccHeaderMap. 301e8d8bef9SDimitry Andric if (SccBlocks.size() <= static_cast<unsigned>(SccNum)) 302e8d8bef9SDimitry Andric SccBlocks.resize(SccNum + 1); 303e8d8bef9SDimitry Andric auto &SccBlockTypes = SccBlocks[SccNum]; 304e8d8bef9SDimitry Andric 305e8d8bef9SDimitry Andric if (BlockType != Inner) { 306e8d8bef9SDimitry Andric bool IsInserted; 307e8d8bef9SDimitry Andric std::tie(std::ignore, IsInserted) = 308e8d8bef9SDimitry Andric SccBlockTypes.insert(std::make_pair(BB, BlockType)); 309e8d8bef9SDimitry Andric assert(IsInserted && "Duplicated block in SCC"); 3100b57cec5SDimitry Andric } 3110b57cec5SDimitry Andric } 3120b57cec5SDimitry Andric 313e8d8bef9SDimitry Andric BranchProbabilityInfo::LoopBlock::LoopBlock(const BasicBlock *BB, 314e8d8bef9SDimitry Andric const LoopInfo &LI, 315e8d8bef9SDimitry Andric const SccInfo &SccI) 316e8d8bef9SDimitry Andric : BB(BB) { 317e8d8bef9SDimitry Andric LD.first = LI.getLoopFor(BB); 318e8d8bef9SDimitry Andric if (!LD.first) { 319e8d8bef9SDimitry Andric LD.second = SccI.getSCCNum(BB); 320e8d8bef9SDimitry Andric } 3210b57cec5SDimitry Andric } 3220b57cec5SDimitry Andric 323e8d8bef9SDimitry Andric bool BranchProbabilityInfo::isLoopEnteringEdge(const LoopEdge &Edge) const { 324e8d8bef9SDimitry Andric const auto &SrcBlock = Edge.first; 325e8d8bef9SDimitry Andric const auto &DstBlock = Edge.second; 326e8d8bef9SDimitry Andric return (DstBlock.getLoop() && 327e8d8bef9SDimitry Andric !DstBlock.getLoop()->contains(SrcBlock.getLoop())) || 328e8d8bef9SDimitry Andric // Assume that SCCs can't be nested. 329e8d8bef9SDimitry Andric (DstBlock.getSccNum() != -1 && 330e8d8bef9SDimitry Andric SrcBlock.getSccNum() != DstBlock.getSccNum()); 331e8d8bef9SDimitry Andric } 3320b57cec5SDimitry Andric 333e8d8bef9SDimitry Andric bool BranchProbabilityInfo::isLoopExitingEdge(const LoopEdge &Edge) const { 334e8d8bef9SDimitry Andric return isLoopEnteringEdge({Edge.second, Edge.first}); 335e8d8bef9SDimitry Andric } 3360b57cec5SDimitry Andric 337e8d8bef9SDimitry Andric bool BranchProbabilityInfo::isLoopEnteringExitingEdge( 338e8d8bef9SDimitry Andric const LoopEdge &Edge) const { 339e8d8bef9SDimitry Andric return isLoopEnteringEdge(Edge) || isLoopExitingEdge(Edge); 340e8d8bef9SDimitry Andric } 341e8d8bef9SDimitry Andric 342e8d8bef9SDimitry Andric bool BranchProbabilityInfo::isLoopBackEdge(const LoopEdge &Edge) const { 343e8d8bef9SDimitry Andric const auto &SrcBlock = Edge.first; 344e8d8bef9SDimitry Andric const auto &DstBlock = Edge.second; 345e8d8bef9SDimitry Andric return SrcBlock.belongsToSameLoop(DstBlock) && 346e8d8bef9SDimitry Andric ((DstBlock.getLoop() && 347e8d8bef9SDimitry Andric DstBlock.getLoop()->getHeader() == DstBlock.getBlock()) || 348e8d8bef9SDimitry Andric (DstBlock.getSccNum() != -1 && 349e8d8bef9SDimitry Andric SccI->isSCCHeader(DstBlock.getBlock(), DstBlock.getSccNum()))); 350e8d8bef9SDimitry Andric } 351e8d8bef9SDimitry Andric 352e8d8bef9SDimitry Andric void BranchProbabilityInfo::getLoopEnterBlocks( 353e8d8bef9SDimitry Andric const LoopBlock &LB, SmallVectorImpl<BasicBlock *> &Enters) const { 354e8d8bef9SDimitry Andric if (LB.getLoop()) { 355e8d8bef9SDimitry Andric auto *Header = LB.getLoop()->getHeader(); 356e8d8bef9SDimitry Andric Enters.append(pred_begin(Header), pred_end(Header)); 357e8d8bef9SDimitry Andric } else { 358e8d8bef9SDimitry Andric assert(LB.getSccNum() != -1 && "LB doesn't belong to any loop?"); 359e8d8bef9SDimitry Andric SccI->getSccEnterBlocks(LB.getSccNum(), Enters); 360e8d8bef9SDimitry Andric } 361e8d8bef9SDimitry Andric } 362e8d8bef9SDimitry Andric 363e8d8bef9SDimitry Andric void BranchProbabilityInfo::getLoopExitBlocks( 364e8d8bef9SDimitry Andric const LoopBlock &LB, SmallVectorImpl<BasicBlock *> &Exits) const { 365e8d8bef9SDimitry Andric if (LB.getLoop()) { 366e8d8bef9SDimitry Andric LB.getLoop()->getExitBlocks(Exits); 367e8d8bef9SDimitry Andric } else { 368e8d8bef9SDimitry Andric assert(LB.getSccNum() != -1 && "LB doesn't belong to any loop?"); 369e8d8bef9SDimitry Andric SccI->getSccExitBlocks(LB.getSccNum(), Exits); 370e8d8bef9SDimitry Andric } 3710b57cec5SDimitry Andric } 3720b57cec5SDimitry Andric 3730b57cec5SDimitry Andric // Propagate existing explicit probabilities from either profile data or 3740b57cec5SDimitry Andric // 'expect' intrinsic processing. Examine metadata against unreachable 3750b57cec5SDimitry Andric // heuristic. The probability of the edge coming to unreachable block is 3760b57cec5SDimitry Andric // set to min of metadata and unreachable heuristic. 3770b57cec5SDimitry Andric bool BranchProbabilityInfo::calcMetadataWeights(const BasicBlock *BB) { 3780b57cec5SDimitry Andric const Instruction *TI = BB->getTerminator(); 3790b57cec5SDimitry Andric assert(TI->getNumSuccessors() > 1 && "expected more than one successor!"); 3805ffd83dbSDimitry Andric if (!(isa<BranchInst>(TI) || isa<SwitchInst>(TI) || isa<IndirectBrInst>(TI) || 3815ffd83dbSDimitry Andric isa<InvokeInst>(TI))) 3820b57cec5SDimitry Andric return false; 3830b57cec5SDimitry Andric 3840b57cec5SDimitry Andric MDNode *WeightsNode = TI->getMetadata(LLVMContext::MD_prof); 3850b57cec5SDimitry Andric if (!WeightsNode) 3860b57cec5SDimitry Andric return false; 3870b57cec5SDimitry Andric 3880b57cec5SDimitry Andric // Check that the number of successors is manageable. 3890b57cec5SDimitry Andric assert(TI->getNumSuccessors() < UINT32_MAX && "Too many successors"); 3900b57cec5SDimitry Andric 3910b57cec5SDimitry Andric // Ensure there are weights for all of the successors. Note that the first 3920b57cec5SDimitry Andric // operand to the metadata node is a name, not a weight. 3930b57cec5SDimitry Andric if (WeightsNode->getNumOperands() != TI->getNumSuccessors() + 1) 3940b57cec5SDimitry Andric return false; 3950b57cec5SDimitry Andric 3960b57cec5SDimitry Andric // Build up the final weights that will be used in a temporary buffer. 3970b57cec5SDimitry Andric // Compute the sum of all weights to later decide whether they need to 3980b57cec5SDimitry Andric // be scaled to fit in 32 bits. 3990b57cec5SDimitry Andric uint64_t WeightSum = 0; 4000b57cec5SDimitry Andric SmallVector<uint32_t, 2> Weights; 4010b57cec5SDimitry Andric SmallVector<unsigned, 2> UnreachableIdxs; 4020b57cec5SDimitry Andric SmallVector<unsigned, 2> ReachableIdxs; 4030b57cec5SDimitry Andric Weights.reserve(TI->getNumSuccessors()); 4045ffd83dbSDimitry Andric for (unsigned I = 1, E = WeightsNode->getNumOperands(); I != E; ++I) { 4050b57cec5SDimitry Andric ConstantInt *Weight = 4065ffd83dbSDimitry Andric mdconst::dyn_extract<ConstantInt>(WeightsNode->getOperand(I)); 4070b57cec5SDimitry Andric if (!Weight) 4080b57cec5SDimitry Andric return false; 4090b57cec5SDimitry Andric assert(Weight->getValue().getActiveBits() <= 32 && 4100b57cec5SDimitry Andric "Too many bits for uint32_t"); 4110b57cec5SDimitry Andric Weights.push_back(Weight->getZExtValue()); 4120b57cec5SDimitry Andric WeightSum += Weights.back(); 413e8d8bef9SDimitry Andric const LoopBlock SrcLoopBB = getLoopBlock(BB); 414e8d8bef9SDimitry Andric const LoopBlock DstLoopBB = getLoopBlock(TI->getSuccessor(I - 1)); 415e8d8bef9SDimitry Andric auto EstimatedWeight = getEstimatedEdgeWeight({SrcLoopBB, DstLoopBB}); 416e8d8bef9SDimitry Andric if (EstimatedWeight && 417*81ad6265SDimitry Andric *EstimatedWeight <= static_cast<uint32_t>(BlockExecWeight::UNREACHABLE)) 4185ffd83dbSDimitry Andric UnreachableIdxs.push_back(I - 1); 4190b57cec5SDimitry Andric else 4205ffd83dbSDimitry Andric ReachableIdxs.push_back(I - 1); 4210b57cec5SDimitry Andric } 4220b57cec5SDimitry Andric assert(Weights.size() == TI->getNumSuccessors() && "Checked above"); 4230b57cec5SDimitry Andric 4240b57cec5SDimitry Andric // If the sum of weights does not fit in 32 bits, scale every weight down 4250b57cec5SDimitry Andric // accordingly. 4260b57cec5SDimitry Andric uint64_t ScalingFactor = 4270b57cec5SDimitry Andric (WeightSum > UINT32_MAX) ? WeightSum / UINT32_MAX + 1 : 1; 4280b57cec5SDimitry Andric 4290b57cec5SDimitry Andric if (ScalingFactor > 1) { 4300b57cec5SDimitry Andric WeightSum = 0; 4315ffd83dbSDimitry Andric for (unsigned I = 0, E = TI->getNumSuccessors(); I != E; ++I) { 4325ffd83dbSDimitry Andric Weights[I] /= ScalingFactor; 4335ffd83dbSDimitry Andric WeightSum += Weights[I]; 4340b57cec5SDimitry Andric } 4350b57cec5SDimitry Andric } 4360b57cec5SDimitry Andric assert(WeightSum <= UINT32_MAX && 4370b57cec5SDimitry Andric "Expected weights to scale down to 32 bits"); 4380b57cec5SDimitry Andric 4390b57cec5SDimitry Andric if (WeightSum == 0 || ReachableIdxs.size() == 0) { 4405ffd83dbSDimitry Andric for (unsigned I = 0, E = TI->getNumSuccessors(); I != E; ++I) 4415ffd83dbSDimitry Andric Weights[I] = 1; 4420b57cec5SDimitry Andric WeightSum = TI->getNumSuccessors(); 4430b57cec5SDimitry Andric } 4440b57cec5SDimitry Andric 4450b57cec5SDimitry Andric // Set the probability. 4460b57cec5SDimitry Andric SmallVector<BranchProbability, 2> BP; 4475ffd83dbSDimitry Andric for (unsigned I = 0, E = TI->getNumSuccessors(); I != E; ++I) 4485ffd83dbSDimitry Andric BP.push_back({ Weights[I], static_cast<uint32_t>(WeightSum) }); 4490b57cec5SDimitry Andric 4500b57cec5SDimitry Andric // Examine the metadata against unreachable heuristic. 4510b57cec5SDimitry Andric // If the unreachable heuristic is more strong then we use it for this edge. 4525ffd83dbSDimitry Andric if (UnreachableIdxs.size() == 0 || ReachableIdxs.size() == 0) { 4535ffd83dbSDimitry Andric setEdgeProbability(BB, BP); 4545ffd83dbSDimitry Andric return true; 4555ffd83dbSDimitry Andric } 4565ffd83dbSDimitry Andric 4570b57cec5SDimitry Andric auto UnreachableProb = UR_TAKEN_PROB; 4585ffd83dbSDimitry Andric for (auto I : UnreachableIdxs) 4595ffd83dbSDimitry Andric if (UnreachableProb < BP[I]) { 4605ffd83dbSDimitry Andric BP[I] = UnreachableProb; 4610b57cec5SDimitry Andric } 4620b57cec5SDimitry Andric 4635ffd83dbSDimitry Andric // Sum of all edge probabilities must be 1.0. If we modified the probability 4645ffd83dbSDimitry Andric // of some edges then we must distribute the introduced difference over the 4655ffd83dbSDimitry Andric // reachable blocks. 4665ffd83dbSDimitry Andric // 4675ffd83dbSDimitry Andric // Proportional distribution: the relation between probabilities of the 4685ffd83dbSDimitry Andric // reachable edges is kept unchanged. That is for any reachable edges i and j: 4695ffd83dbSDimitry Andric // newBP[i] / newBP[j] == oldBP[i] / oldBP[j] => 4705ffd83dbSDimitry Andric // newBP[i] / oldBP[i] == newBP[j] / oldBP[j] == K 4715ffd83dbSDimitry Andric // Where K is independent of i,j. 4725ffd83dbSDimitry Andric // newBP[i] == oldBP[i] * K 4735ffd83dbSDimitry Andric // We need to find K. 4745ffd83dbSDimitry Andric // Make sum of all reachables of the left and right parts: 4755ffd83dbSDimitry Andric // sum_of_reachable(newBP) == K * sum_of_reachable(oldBP) 4765ffd83dbSDimitry Andric // Sum of newBP must be equal to 1.0: 4775ffd83dbSDimitry Andric // sum_of_reachable(newBP) + sum_of_unreachable(newBP) == 1.0 => 4785ffd83dbSDimitry Andric // sum_of_reachable(newBP) = 1.0 - sum_of_unreachable(newBP) 4795ffd83dbSDimitry Andric // Where sum_of_unreachable(newBP) is what has been just changed. 4805ffd83dbSDimitry Andric // Finally: 4815ffd83dbSDimitry Andric // K == sum_of_reachable(newBP) / sum_of_reachable(oldBP) => 4825ffd83dbSDimitry Andric // K == (1.0 - sum_of_unreachable(newBP)) / sum_of_reachable(oldBP) 4835ffd83dbSDimitry Andric BranchProbability NewUnreachableSum = BranchProbability::getZero(); 4845ffd83dbSDimitry Andric for (auto I : UnreachableIdxs) 4855ffd83dbSDimitry Andric NewUnreachableSum += BP[I]; 4865ffd83dbSDimitry Andric 4875ffd83dbSDimitry Andric BranchProbability NewReachableSum = 4885ffd83dbSDimitry Andric BranchProbability::getOne() - NewUnreachableSum; 4895ffd83dbSDimitry Andric 4905ffd83dbSDimitry Andric BranchProbability OldReachableSum = BranchProbability::getZero(); 4915ffd83dbSDimitry Andric for (auto I : ReachableIdxs) 4925ffd83dbSDimitry Andric OldReachableSum += BP[I]; 4935ffd83dbSDimitry Andric 4945ffd83dbSDimitry Andric if (OldReachableSum != NewReachableSum) { // Anything to dsitribute? 4955ffd83dbSDimitry Andric if (OldReachableSum.isZero()) { 4965ffd83dbSDimitry Andric // If all oldBP[i] are zeroes then the proportional distribution results 4975ffd83dbSDimitry Andric // in all zero probabilities and the error stays big. In this case we 4985ffd83dbSDimitry Andric // evenly spread NewReachableSum over the reachable edges. 4995ffd83dbSDimitry Andric BranchProbability PerEdge = NewReachableSum / ReachableIdxs.size(); 5005ffd83dbSDimitry Andric for (auto I : ReachableIdxs) 5015ffd83dbSDimitry Andric BP[I] = PerEdge; 5025ffd83dbSDimitry Andric } else { 5035ffd83dbSDimitry Andric for (auto I : ReachableIdxs) { 5045ffd83dbSDimitry Andric // We use uint64_t to avoid double rounding error of the following 5055ffd83dbSDimitry Andric // calculation: BP[i] = BP[i] * NewReachableSum / OldReachableSum 5065ffd83dbSDimitry Andric // The formula is taken from the private constructor 5075ffd83dbSDimitry Andric // BranchProbability(uint32_t Numerator, uint32_t Denominator) 5085ffd83dbSDimitry Andric uint64_t Mul = static_cast<uint64_t>(NewReachableSum.getNumerator()) * 5095ffd83dbSDimitry Andric BP[I].getNumerator(); 5105ffd83dbSDimitry Andric uint32_t Div = static_cast<uint32_t>( 5115ffd83dbSDimitry Andric divideNearest(Mul, OldReachableSum.getNumerator())); 5125ffd83dbSDimitry Andric BP[I] = BranchProbability::getRaw(Div); 5135ffd83dbSDimitry Andric } 5140b57cec5SDimitry Andric } 5150b57cec5SDimitry Andric } 5160b57cec5SDimitry Andric 5175ffd83dbSDimitry Andric setEdgeProbability(BB, BP); 5180b57cec5SDimitry Andric 5190b57cec5SDimitry Andric return true; 5200b57cec5SDimitry Andric } 5210b57cec5SDimitry Andric 5220b57cec5SDimitry Andric // Calculate Edge Weights using "Pointer Heuristics". Predict a comparison 5230b57cec5SDimitry Andric // between two pointer or pointer and NULL will fail. 5240b57cec5SDimitry Andric bool BranchProbabilityInfo::calcPointerHeuristics(const BasicBlock *BB) { 5250b57cec5SDimitry Andric const BranchInst *BI = dyn_cast<BranchInst>(BB->getTerminator()); 5260b57cec5SDimitry Andric if (!BI || !BI->isConditional()) 5270b57cec5SDimitry Andric return false; 5280b57cec5SDimitry Andric 5290b57cec5SDimitry Andric Value *Cond = BI->getCondition(); 5300b57cec5SDimitry Andric ICmpInst *CI = dyn_cast<ICmpInst>(Cond); 5310b57cec5SDimitry Andric if (!CI || !CI->isEquality()) 5320b57cec5SDimitry Andric return false; 5330b57cec5SDimitry Andric 5340b57cec5SDimitry Andric Value *LHS = CI->getOperand(0); 5350b57cec5SDimitry Andric 5360b57cec5SDimitry Andric if (!LHS->getType()->isPointerTy()) 5370b57cec5SDimitry Andric return false; 5380b57cec5SDimitry Andric 5390b57cec5SDimitry Andric assert(CI->getOperand(1)->getType()->isPointerTy()); 5400b57cec5SDimitry Andric 5414824e7fdSDimitry Andric auto Search = PointerTable.find(CI->getPredicate()); 5424824e7fdSDimitry Andric if (Search == PointerTable.end()) 5434824e7fdSDimitry Andric return false; 5444824e7fdSDimitry Andric setEdgeProbability(BB, Search->second); 5450b57cec5SDimitry Andric return true; 5460b57cec5SDimitry Andric } 5470b57cec5SDimitry Andric 5480b57cec5SDimitry Andric // Compute the unlikely successors to the block BB in the loop L, specifically 5490b57cec5SDimitry Andric // those that are unlikely because this is a loop, and add them to the 5500b57cec5SDimitry Andric // UnlikelyBlocks set. 5510b57cec5SDimitry Andric static void 5520b57cec5SDimitry Andric computeUnlikelySuccessors(const BasicBlock *BB, Loop *L, 5530b57cec5SDimitry Andric SmallPtrSetImpl<const BasicBlock*> &UnlikelyBlocks) { 5540b57cec5SDimitry Andric // Sometimes in a loop we have a branch whose condition is made false by 5550b57cec5SDimitry Andric // taking it. This is typically something like 5560b57cec5SDimitry Andric // int n = 0; 5570b57cec5SDimitry Andric // while (...) { 5580b57cec5SDimitry Andric // if (++n >= MAX) { 5590b57cec5SDimitry Andric // n = 0; 5600b57cec5SDimitry Andric // } 5610b57cec5SDimitry Andric // } 5620b57cec5SDimitry Andric // In this sort of situation taking the branch means that at the very least it 5630b57cec5SDimitry Andric // won't be taken again in the next iteration of the loop, so we should 5640b57cec5SDimitry Andric // consider it less likely than a typical branch. 5650b57cec5SDimitry Andric // 5660b57cec5SDimitry Andric // We detect this by looking back through the graph of PHI nodes that sets the 5670b57cec5SDimitry Andric // value that the condition depends on, and seeing if we can reach a successor 5680b57cec5SDimitry Andric // block which can be determined to make the condition false. 5690b57cec5SDimitry Andric // 5700b57cec5SDimitry Andric // FIXME: We currently consider unlikely blocks to be half as likely as other 5710b57cec5SDimitry Andric // blocks, but if we consider the example above the likelyhood is actually 5720b57cec5SDimitry Andric // 1/MAX. We could therefore be more precise in how unlikely we consider 5730b57cec5SDimitry Andric // blocks to be, but it would require more careful examination of the form 5740b57cec5SDimitry Andric // of the comparison expression. 5750b57cec5SDimitry Andric const BranchInst *BI = dyn_cast<BranchInst>(BB->getTerminator()); 5760b57cec5SDimitry Andric if (!BI || !BI->isConditional()) 5770b57cec5SDimitry Andric return; 5780b57cec5SDimitry Andric 5790b57cec5SDimitry Andric // Check if the branch is based on an instruction compared with a constant 5800b57cec5SDimitry Andric CmpInst *CI = dyn_cast<CmpInst>(BI->getCondition()); 5810b57cec5SDimitry Andric if (!CI || !isa<Instruction>(CI->getOperand(0)) || 5820b57cec5SDimitry Andric !isa<Constant>(CI->getOperand(1))) 5830b57cec5SDimitry Andric return; 5840b57cec5SDimitry Andric 5850b57cec5SDimitry Andric // Either the instruction must be a PHI, or a chain of operations involving 5860b57cec5SDimitry Andric // constants that ends in a PHI which we can then collapse into a single value 5870b57cec5SDimitry Andric // if the PHI value is known. 5880b57cec5SDimitry Andric Instruction *CmpLHS = dyn_cast<Instruction>(CI->getOperand(0)); 5890b57cec5SDimitry Andric PHINode *CmpPHI = dyn_cast<PHINode>(CmpLHS); 5900b57cec5SDimitry Andric Constant *CmpConst = dyn_cast<Constant>(CI->getOperand(1)); 5910b57cec5SDimitry Andric // Collect the instructions until we hit a PHI 5920b57cec5SDimitry Andric SmallVector<BinaryOperator *, 1> InstChain; 5930b57cec5SDimitry Andric while (!CmpPHI && CmpLHS && isa<BinaryOperator>(CmpLHS) && 5940b57cec5SDimitry Andric isa<Constant>(CmpLHS->getOperand(1))) { 5950b57cec5SDimitry Andric // Stop if the chain extends outside of the loop 5960b57cec5SDimitry Andric if (!L->contains(CmpLHS)) 5970b57cec5SDimitry Andric return; 5980b57cec5SDimitry Andric InstChain.push_back(cast<BinaryOperator>(CmpLHS)); 5990b57cec5SDimitry Andric CmpLHS = dyn_cast<Instruction>(CmpLHS->getOperand(0)); 6000b57cec5SDimitry Andric if (CmpLHS) 6010b57cec5SDimitry Andric CmpPHI = dyn_cast<PHINode>(CmpLHS); 6020b57cec5SDimitry Andric } 6030b57cec5SDimitry Andric if (!CmpPHI || !L->contains(CmpPHI)) 6040b57cec5SDimitry Andric return; 6050b57cec5SDimitry Andric 6060b57cec5SDimitry Andric // Trace the phi node to find all values that come from successors of BB 6070b57cec5SDimitry Andric SmallPtrSet<PHINode*, 8> VisitedInsts; 6080b57cec5SDimitry Andric SmallVector<PHINode*, 8> WorkList; 6090b57cec5SDimitry Andric WorkList.push_back(CmpPHI); 6100b57cec5SDimitry Andric VisitedInsts.insert(CmpPHI); 6110b57cec5SDimitry Andric while (!WorkList.empty()) { 612fe6060f1SDimitry Andric PHINode *P = WorkList.pop_back_val(); 6130b57cec5SDimitry Andric for (BasicBlock *B : P->blocks()) { 6140b57cec5SDimitry Andric // Skip blocks that aren't part of the loop 6150b57cec5SDimitry Andric if (!L->contains(B)) 6160b57cec5SDimitry Andric continue; 6170b57cec5SDimitry Andric Value *V = P->getIncomingValueForBlock(B); 6180b57cec5SDimitry Andric // If the source is a PHI add it to the work list if we haven't 6190b57cec5SDimitry Andric // already visited it. 6200b57cec5SDimitry Andric if (PHINode *PN = dyn_cast<PHINode>(V)) { 6210b57cec5SDimitry Andric if (VisitedInsts.insert(PN).second) 6220b57cec5SDimitry Andric WorkList.push_back(PN); 6230b57cec5SDimitry Andric continue; 6240b57cec5SDimitry Andric } 6250b57cec5SDimitry Andric // If this incoming value is a constant and B is a successor of BB, then 6260b57cec5SDimitry Andric // we can constant-evaluate the compare to see if it makes the branch be 6270b57cec5SDimitry Andric // taken or not. 6280b57cec5SDimitry Andric Constant *CmpLHSConst = dyn_cast<Constant>(V); 629e8d8bef9SDimitry Andric if (!CmpLHSConst || !llvm::is_contained(successors(BB), B)) 6300b57cec5SDimitry Andric continue; 6310b57cec5SDimitry Andric // First collapse InstChain 6320b57cec5SDimitry Andric for (Instruction *I : llvm::reverse(InstChain)) { 6330b57cec5SDimitry Andric CmpLHSConst = ConstantExpr::get(I->getOpcode(), CmpLHSConst, 6340b57cec5SDimitry Andric cast<Constant>(I->getOperand(1)), true); 6350b57cec5SDimitry Andric if (!CmpLHSConst) 6360b57cec5SDimitry Andric break; 6370b57cec5SDimitry Andric } 6380b57cec5SDimitry Andric if (!CmpLHSConst) 6390b57cec5SDimitry Andric continue; 6400b57cec5SDimitry Andric // Now constant-evaluate the compare 6410b57cec5SDimitry Andric Constant *Result = ConstantExpr::getCompare(CI->getPredicate(), 6420b57cec5SDimitry Andric CmpLHSConst, CmpConst, true); 6430b57cec5SDimitry Andric // If the result means we don't branch to the block then that block is 6440b57cec5SDimitry Andric // unlikely. 6450b57cec5SDimitry Andric if (Result && 6460b57cec5SDimitry Andric ((Result->isZeroValue() && B == BI->getSuccessor(0)) || 6470b57cec5SDimitry Andric (Result->isOneValue() && B == BI->getSuccessor(1)))) 6480b57cec5SDimitry Andric UnlikelyBlocks.insert(B); 6490b57cec5SDimitry Andric } 6500b57cec5SDimitry Andric } 6510b57cec5SDimitry Andric } 6520b57cec5SDimitry Andric 653e8d8bef9SDimitry Andric Optional<uint32_t> 654e8d8bef9SDimitry Andric BranchProbabilityInfo::getEstimatedBlockWeight(const BasicBlock *BB) const { 655e8d8bef9SDimitry Andric auto WeightIt = EstimatedBlockWeight.find(BB); 656e8d8bef9SDimitry Andric if (WeightIt == EstimatedBlockWeight.end()) 657e8d8bef9SDimitry Andric return None; 658e8d8bef9SDimitry Andric return WeightIt->second; 6590b57cec5SDimitry Andric } 6600b57cec5SDimitry Andric 661e8d8bef9SDimitry Andric Optional<uint32_t> 662e8d8bef9SDimitry Andric BranchProbabilityInfo::getEstimatedLoopWeight(const LoopData &L) const { 663e8d8bef9SDimitry Andric auto WeightIt = EstimatedLoopWeight.find(L); 664e8d8bef9SDimitry Andric if (WeightIt == EstimatedLoopWeight.end()) 665e8d8bef9SDimitry Andric return None; 666e8d8bef9SDimitry Andric return WeightIt->second; 667e8d8bef9SDimitry Andric } 668e8d8bef9SDimitry Andric 669e8d8bef9SDimitry Andric Optional<uint32_t> 670e8d8bef9SDimitry Andric BranchProbabilityInfo::getEstimatedEdgeWeight(const LoopEdge &Edge) const { 671e8d8bef9SDimitry Andric // For edges entering a loop take weight of a loop rather than an individual 672e8d8bef9SDimitry Andric // block in the loop. 673e8d8bef9SDimitry Andric return isLoopEnteringEdge(Edge) 674e8d8bef9SDimitry Andric ? getEstimatedLoopWeight(Edge.second.getLoopData()) 675e8d8bef9SDimitry Andric : getEstimatedBlockWeight(Edge.second.getBlock()); 676e8d8bef9SDimitry Andric } 677e8d8bef9SDimitry Andric 678e8d8bef9SDimitry Andric template <class IterT> 679e8d8bef9SDimitry Andric Optional<uint32_t> BranchProbabilityInfo::getMaxEstimatedEdgeWeight( 680e8d8bef9SDimitry Andric const LoopBlock &SrcLoopBB, iterator_range<IterT> Successors) const { 681e8d8bef9SDimitry Andric SmallVector<uint32_t, 4> Weights; 682e8d8bef9SDimitry Andric Optional<uint32_t> MaxWeight; 683e8d8bef9SDimitry Andric for (const BasicBlock *DstBB : Successors) { 684e8d8bef9SDimitry Andric const LoopBlock DstLoopBB = getLoopBlock(DstBB); 685e8d8bef9SDimitry Andric auto Weight = getEstimatedEdgeWeight({SrcLoopBB, DstLoopBB}); 686e8d8bef9SDimitry Andric 687e8d8bef9SDimitry Andric if (!Weight) 688e8d8bef9SDimitry Andric return None; 689e8d8bef9SDimitry Andric 690*81ad6265SDimitry Andric if (!MaxWeight || *MaxWeight < *Weight) 691e8d8bef9SDimitry Andric MaxWeight = Weight; 692e8d8bef9SDimitry Andric } 693e8d8bef9SDimitry Andric 694e8d8bef9SDimitry Andric return MaxWeight; 695e8d8bef9SDimitry Andric } 696e8d8bef9SDimitry Andric 697e8d8bef9SDimitry Andric // Updates \p LoopBB's weight and returns true. If \p LoopBB has already 698e8d8bef9SDimitry Andric // an associated weight it is unchanged and false is returned. 699e8d8bef9SDimitry Andric // 700e8d8bef9SDimitry Andric // Please note by the algorithm the weight is not expected to change once set 701e8d8bef9SDimitry Andric // thus 'false' status is used to track visited blocks. 702e8d8bef9SDimitry Andric bool BranchProbabilityInfo::updateEstimatedBlockWeight( 703e8d8bef9SDimitry Andric LoopBlock &LoopBB, uint32_t BBWeight, 704e8d8bef9SDimitry Andric SmallVectorImpl<BasicBlock *> &BlockWorkList, 705e8d8bef9SDimitry Andric SmallVectorImpl<LoopBlock> &LoopWorkList) { 706e8d8bef9SDimitry Andric BasicBlock *BB = LoopBB.getBlock(); 707e8d8bef9SDimitry Andric 708e8d8bef9SDimitry Andric // In general, weight is assigned to a block when it has final value and 709e8d8bef9SDimitry Andric // can't/shouldn't be changed. However, there are cases when a block 710e8d8bef9SDimitry Andric // inherently has several (possibly "contradicting") weights. For example, 711e8d8bef9SDimitry Andric // "unwind" block may also contain "cold" call. In that case the first 712e8d8bef9SDimitry Andric // set weight is favored and all consequent weights are ignored. 713e8d8bef9SDimitry Andric if (!EstimatedBlockWeight.insert({BB, BBWeight}).second) 714e8d8bef9SDimitry Andric return false; 715e8d8bef9SDimitry Andric 716e8d8bef9SDimitry Andric for (BasicBlock *PredBlock : predecessors(BB)) { 717e8d8bef9SDimitry Andric LoopBlock PredLoop = getLoopBlock(PredBlock); 718e8d8bef9SDimitry Andric // Add affected block/loop to a working list. 719e8d8bef9SDimitry Andric if (isLoopExitingEdge({PredLoop, LoopBB})) { 720e8d8bef9SDimitry Andric if (!EstimatedLoopWeight.count(PredLoop.getLoopData())) 721e8d8bef9SDimitry Andric LoopWorkList.push_back(PredLoop); 722e8d8bef9SDimitry Andric } else if (!EstimatedBlockWeight.count(PredBlock)) 723e8d8bef9SDimitry Andric BlockWorkList.push_back(PredBlock); 724e8d8bef9SDimitry Andric } 725e8d8bef9SDimitry Andric return true; 726e8d8bef9SDimitry Andric } 727e8d8bef9SDimitry Andric 728e8d8bef9SDimitry Andric // Starting from \p BB traverse through dominator blocks and assign \p BBWeight 729e8d8bef9SDimitry Andric // to all such blocks that are post dominated by \BB. In other words to all 730e8d8bef9SDimitry Andric // blocks that the one is executed if and only if another one is executed. 731e8d8bef9SDimitry Andric // Importantly, we skip loops here for two reasons. First weights of blocks in 732e8d8bef9SDimitry Andric // a loop should be scaled by trip count (yet possibly unknown). Second there is 733e8d8bef9SDimitry Andric // no any value in doing that because that doesn't give any additional 734e8d8bef9SDimitry Andric // information regarding distribution of probabilities inside the loop. 735e8d8bef9SDimitry Andric // Exception is loop 'enter' and 'exit' edges that are handled in a special way 736e8d8bef9SDimitry Andric // at calcEstimatedHeuristics. 737e8d8bef9SDimitry Andric // 738e8d8bef9SDimitry Andric // In addition, \p WorkList is populated with basic blocks if at leas one 739e8d8bef9SDimitry Andric // successor has updated estimated weight. 740e8d8bef9SDimitry Andric void BranchProbabilityInfo::propagateEstimatedBlockWeight( 741e8d8bef9SDimitry Andric const LoopBlock &LoopBB, DominatorTree *DT, PostDominatorTree *PDT, 742e8d8bef9SDimitry Andric uint32_t BBWeight, SmallVectorImpl<BasicBlock *> &BlockWorkList, 743e8d8bef9SDimitry Andric SmallVectorImpl<LoopBlock> &LoopWorkList) { 744e8d8bef9SDimitry Andric const BasicBlock *BB = LoopBB.getBlock(); 745e8d8bef9SDimitry Andric const auto *DTStartNode = DT->getNode(BB); 746e8d8bef9SDimitry Andric const auto *PDTStartNode = PDT->getNode(BB); 747e8d8bef9SDimitry Andric 748e8d8bef9SDimitry Andric // TODO: Consider propagating weight down the domination line as well. 749e8d8bef9SDimitry Andric for (const auto *DTNode = DTStartNode; DTNode != nullptr; 750e8d8bef9SDimitry Andric DTNode = DTNode->getIDom()) { 751e8d8bef9SDimitry Andric auto *DomBB = DTNode->getBlock(); 752e8d8bef9SDimitry Andric // Consider blocks which lie on one 'line'. 753e8d8bef9SDimitry Andric if (!PDT->dominates(PDTStartNode, PDT->getNode(DomBB))) 754e8d8bef9SDimitry Andric // If BB doesn't post dominate DomBB it will not post dominate dominators 755e8d8bef9SDimitry Andric // of DomBB as well. 756e8d8bef9SDimitry Andric break; 757e8d8bef9SDimitry Andric 758e8d8bef9SDimitry Andric LoopBlock DomLoopBB = getLoopBlock(DomBB); 759e8d8bef9SDimitry Andric const LoopEdge Edge{DomLoopBB, LoopBB}; 760e8d8bef9SDimitry Andric // Don't propagate weight to blocks belonging to different loops. 761e8d8bef9SDimitry Andric if (!isLoopEnteringExitingEdge(Edge)) { 762e8d8bef9SDimitry Andric if (!updateEstimatedBlockWeight(DomLoopBB, BBWeight, BlockWorkList, 763e8d8bef9SDimitry Andric LoopWorkList)) 764e8d8bef9SDimitry Andric // If DomBB has weight set then all it's predecessors are already 765e8d8bef9SDimitry Andric // processed (since we propagate weight up to the top of IR each time). 766e8d8bef9SDimitry Andric break; 767e8d8bef9SDimitry Andric } else if (isLoopExitingEdge(Edge)) { 768e8d8bef9SDimitry Andric LoopWorkList.push_back(DomLoopBB); 769e8d8bef9SDimitry Andric } 770e8d8bef9SDimitry Andric } 771e8d8bef9SDimitry Andric } 772e8d8bef9SDimitry Andric 773e8d8bef9SDimitry Andric Optional<uint32_t> BranchProbabilityInfo::getInitialEstimatedBlockWeight( 774e8d8bef9SDimitry Andric const BasicBlock *BB) { 775e8d8bef9SDimitry Andric // Returns true if \p BB has call marked with "NoReturn" attribute. 776e8d8bef9SDimitry Andric auto hasNoReturn = [&](const BasicBlock *BB) { 777e8d8bef9SDimitry Andric for (const auto &I : reverse(*BB)) 778e8d8bef9SDimitry Andric if (const CallInst *CI = dyn_cast<CallInst>(&I)) 779e8d8bef9SDimitry Andric if (CI->hasFnAttr(Attribute::NoReturn)) 780e8d8bef9SDimitry Andric return true; 781e8d8bef9SDimitry Andric 782e8d8bef9SDimitry Andric return false; 783e8d8bef9SDimitry Andric }; 784e8d8bef9SDimitry Andric 785e8d8bef9SDimitry Andric // Important note regarding the order of checks. They are ordered by weight 786e8d8bef9SDimitry Andric // from lowest to highest. Doing that allows to avoid "unstable" results 787e8d8bef9SDimitry Andric // when several conditions heuristics can be applied simultaneously. 788e8d8bef9SDimitry Andric if (isa<UnreachableInst>(BB->getTerminator()) || 789e8d8bef9SDimitry Andric // If this block is terminated by a call to 790e8d8bef9SDimitry Andric // @llvm.experimental.deoptimize then treat it like an unreachable 791e8d8bef9SDimitry Andric // since it is expected to practically never execute. 792e8d8bef9SDimitry Andric // TODO: Should we actually treat as never returning call? 793e8d8bef9SDimitry Andric BB->getTerminatingDeoptimizeCall()) 794e8d8bef9SDimitry Andric return hasNoReturn(BB) 795e8d8bef9SDimitry Andric ? static_cast<uint32_t>(BlockExecWeight::NORETURN) 796e8d8bef9SDimitry Andric : static_cast<uint32_t>(BlockExecWeight::UNREACHABLE); 797e8d8bef9SDimitry Andric 798e8d8bef9SDimitry Andric // Check if the block is 'unwind' handler of some invoke instruction. 799e8d8bef9SDimitry Andric for (const auto *Pred : predecessors(BB)) 800e8d8bef9SDimitry Andric if (Pred) 801e8d8bef9SDimitry Andric if (const auto *II = dyn_cast<InvokeInst>(Pred->getTerminator())) 802e8d8bef9SDimitry Andric if (II->getUnwindDest() == BB) 803e8d8bef9SDimitry Andric return static_cast<uint32_t>(BlockExecWeight::UNWIND); 804e8d8bef9SDimitry Andric 805e8d8bef9SDimitry Andric // Check if the block contains 'cold' call. 806e8d8bef9SDimitry Andric for (const auto &I : *BB) 807e8d8bef9SDimitry Andric if (const CallInst *CI = dyn_cast<CallInst>(&I)) 808e8d8bef9SDimitry Andric if (CI->hasFnAttr(Attribute::Cold)) 809e8d8bef9SDimitry Andric return static_cast<uint32_t>(BlockExecWeight::COLD); 810e8d8bef9SDimitry Andric 811e8d8bef9SDimitry Andric return None; 812e8d8bef9SDimitry Andric } 813e8d8bef9SDimitry Andric 814e8d8bef9SDimitry Andric // Does RPO traversal over all blocks in \p F and assigns weights to 815e8d8bef9SDimitry Andric // 'unreachable', 'noreturn', 'cold', 'unwind' blocks. In addition it does its 816e8d8bef9SDimitry Andric // best to propagate the weight to up/down the IR. 817e8d8bef9SDimitry Andric void BranchProbabilityInfo::computeEestimateBlockWeight( 818e8d8bef9SDimitry Andric const Function &F, DominatorTree *DT, PostDominatorTree *PDT) { 819e8d8bef9SDimitry Andric SmallVector<BasicBlock *, 8> BlockWorkList; 820e8d8bef9SDimitry Andric SmallVector<LoopBlock, 8> LoopWorkList; 821e8d8bef9SDimitry Andric 822e8d8bef9SDimitry Andric // By doing RPO we make sure that all predecessors already have weights 823e8d8bef9SDimitry Andric // calculated before visiting theirs successors. 824e8d8bef9SDimitry Andric ReversePostOrderTraversal<const Function *> RPOT(&F); 825e8d8bef9SDimitry Andric for (const auto *BB : RPOT) 826e8d8bef9SDimitry Andric if (auto BBWeight = getInitialEstimatedBlockWeight(BB)) 827e8d8bef9SDimitry Andric // If we were able to find estimated weight for the block set it to this 828e8d8bef9SDimitry Andric // block and propagate up the IR. 829e8d8bef9SDimitry Andric propagateEstimatedBlockWeight(getLoopBlock(BB), DT, PDT, 830e8d8bef9SDimitry Andric BBWeight.getValue(), BlockWorkList, 831e8d8bef9SDimitry Andric LoopWorkList); 832e8d8bef9SDimitry Andric 833e8d8bef9SDimitry Andric // BlockWorklist/LoopWorkList contains blocks/loops with at least one 834e8d8bef9SDimitry Andric // successor/exit having estimated weight. Try to propagate weight to such 835e8d8bef9SDimitry Andric // blocks/loops from successors/exits. 836e8d8bef9SDimitry Andric // Process loops and blocks. Order is not important. 837e8d8bef9SDimitry Andric do { 838e8d8bef9SDimitry Andric while (!LoopWorkList.empty()) { 839e8d8bef9SDimitry Andric const LoopBlock LoopBB = LoopWorkList.pop_back_val(); 840e8d8bef9SDimitry Andric 841e8d8bef9SDimitry Andric if (EstimatedLoopWeight.count(LoopBB.getLoopData())) 842e8d8bef9SDimitry Andric continue; 843e8d8bef9SDimitry Andric 844e8d8bef9SDimitry Andric SmallVector<BasicBlock *, 4> Exits; 845e8d8bef9SDimitry Andric getLoopExitBlocks(LoopBB, Exits); 846e8d8bef9SDimitry Andric auto LoopWeight = getMaxEstimatedEdgeWeight( 847e8d8bef9SDimitry Andric LoopBB, make_range(Exits.begin(), Exits.end())); 848e8d8bef9SDimitry Andric 849e8d8bef9SDimitry Andric if (LoopWeight) { 850e8d8bef9SDimitry Andric // If we never exit the loop then we can enter it once at maximum. 851e8d8bef9SDimitry Andric if (LoopWeight <= static_cast<uint32_t>(BlockExecWeight::UNREACHABLE)) 852e8d8bef9SDimitry Andric LoopWeight = static_cast<uint32_t>(BlockExecWeight::LOWEST_NON_ZERO); 853e8d8bef9SDimitry Andric 854*81ad6265SDimitry Andric EstimatedLoopWeight.insert({LoopBB.getLoopData(), *LoopWeight}); 855e8d8bef9SDimitry Andric // Add all blocks entering the loop into working list. 856e8d8bef9SDimitry Andric getLoopEnterBlocks(LoopBB, BlockWorkList); 857e8d8bef9SDimitry Andric } 858e8d8bef9SDimitry Andric } 859e8d8bef9SDimitry Andric 860e8d8bef9SDimitry Andric while (!BlockWorkList.empty()) { 861e8d8bef9SDimitry Andric // We can reach here only if BlockWorkList is not empty. 862e8d8bef9SDimitry Andric const BasicBlock *BB = BlockWorkList.pop_back_val(); 863e8d8bef9SDimitry Andric if (EstimatedBlockWeight.count(BB)) 864e8d8bef9SDimitry Andric continue; 865e8d8bef9SDimitry Andric 866e8d8bef9SDimitry Andric // We take maximum over all weights of successors. In other words we take 867e8d8bef9SDimitry Andric // weight of "hot" path. In theory we can probably find a better function 868e8d8bef9SDimitry Andric // which gives higher accuracy results (comparing to "maximum") but I 869e8d8bef9SDimitry Andric // can't 870e8d8bef9SDimitry Andric // think of any right now. And I doubt it will make any difference in 871e8d8bef9SDimitry Andric // practice. 872e8d8bef9SDimitry Andric const LoopBlock LoopBB = getLoopBlock(BB); 873e8d8bef9SDimitry Andric auto MaxWeight = getMaxEstimatedEdgeWeight(LoopBB, successors(BB)); 874e8d8bef9SDimitry Andric 875e8d8bef9SDimitry Andric if (MaxWeight) 876*81ad6265SDimitry Andric propagateEstimatedBlockWeight(LoopBB, DT, PDT, *MaxWeight, 877e8d8bef9SDimitry Andric BlockWorkList, LoopWorkList); 878e8d8bef9SDimitry Andric } 879e8d8bef9SDimitry Andric } while (!BlockWorkList.empty() || !LoopWorkList.empty()); 880e8d8bef9SDimitry Andric } 881e8d8bef9SDimitry Andric 882e8d8bef9SDimitry Andric // Calculate edge probabilities based on block's estimated weight. 883e8d8bef9SDimitry Andric // Note that gathered weights were not scaled for loops. Thus edges entering 884e8d8bef9SDimitry Andric // and exiting loops requires special processing. 885e8d8bef9SDimitry Andric bool BranchProbabilityInfo::calcEstimatedHeuristics(const BasicBlock *BB) { 886e8d8bef9SDimitry Andric assert(BB->getTerminator()->getNumSuccessors() > 1 && 887e8d8bef9SDimitry Andric "expected more than one successor!"); 888e8d8bef9SDimitry Andric 889e8d8bef9SDimitry Andric const LoopBlock LoopBB = getLoopBlock(BB); 890e8d8bef9SDimitry Andric 8910b57cec5SDimitry Andric SmallPtrSet<const BasicBlock *, 8> UnlikelyBlocks; 892e8d8bef9SDimitry Andric uint32_t TC = LBH_TAKEN_WEIGHT / LBH_NONTAKEN_WEIGHT; 893e8d8bef9SDimitry Andric if (LoopBB.getLoop()) 894e8d8bef9SDimitry Andric computeUnlikelySuccessors(BB, LoopBB.getLoop(), UnlikelyBlocks); 8950b57cec5SDimitry Andric 896e8d8bef9SDimitry Andric // Changed to 'true' if at least one successor has estimated weight. 897e8d8bef9SDimitry Andric bool FoundEstimatedWeight = false; 898e8d8bef9SDimitry Andric SmallVector<uint32_t, 4> SuccWeights; 899e8d8bef9SDimitry Andric uint64_t TotalWeight = 0; 900e8d8bef9SDimitry Andric // Go over all successors of BB and put their weights into SuccWeights. 901fe6060f1SDimitry Andric for (const BasicBlock *SuccBB : successors(BB)) { 902e8d8bef9SDimitry Andric Optional<uint32_t> Weight; 903e8d8bef9SDimitry Andric const LoopBlock SuccLoopBB = getLoopBlock(SuccBB); 904e8d8bef9SDimitry Andric const LoopEdge Edge{LoopBB, SuccLoopBB}; 905e8d8bef9SDimitry Andric 906e8d8bef9SDimitry Andric Weight = getEstimatedEdgeWeight(Edge); 907e8d8bef9SDimitry Andric 908e8d8bef9SDimitry Andric if (isLoopExitingEdge(Edge) && 909e8d8bef9SDimitry Andric // Avoid adjustment of ZERO weight since it should remain unchanged. 910e8d8bef9SDimitry Andric Weight != static_cast<uint32_t>(BlockExecWeight::ZERO)) { 911e8d8bef9SDimitry Andric // Scale down loop exiting weight by trip count. 912e8d8bef9SDimitry Andric Weight = std::max( 913e8d8bef9SDimitry Andric static_cast<uint32_t>(BlockExecWeight::LOWEST_NON_ZERO), 914*81ad6265SDimitry Andric Weight.value_or(static_cast<uint32_t>(BlockExecWeight::DEFAULT)) / 915e8d8bef9SDimitry Andric TC); 9160b57cec5SDimitry Andric } 917e8d8bef9SDimitry Andric bool IsUnlikelyEdge = LoopBB.getLoop() && UnlikelyBlocks.contains(SuccBB); 918e8d8bef9SDimitry Andric if (IsUnlikelyEdge && 919e8d8bef9SDimitry Andric // Avoid adjustment of ZERO weight since it should remain unchanged. 920e8d8bef9SDimitry Andric Weight != static_cast<uint32_t>(BlockExecWeight::ZERO)) { 921e8d8bef9SDimitry Andric // 'Unlikely' blocks have twice lower weight. 922e8d8bef9SDimitry Andric Weight = std::max( 923e8d8bef9SDimitry Andric static_cast<uint32_t>(BlockExecWeight::LOWEST_NON_ZERO), 924*81ad6265SDimitry Andric Weight.value_or(static_cast<uint32_t>(BlockExecWeight::DEFAULT)) / 2); 9250b57cec5SDimitry Andric } 9260b57cec5SDimitry Andric 927e8d8bef9SDimitry Andric if (Weight) 928e8d8bef9SDimitry Andric FoundEstimatedWeight = true; 929e8d8bef9SDimitry Andric 930e8d8bef9SDimitry Andric auto WeightVal = 931*81ad6265SDimitry Andric Weight.value_or(static_cast<uint32_t>(BlockExecWeight::DEFAULT)); 932e8d8bef9SDimitry Andric TotalWeight += WeightVal; 933e8d8bef9SDimitry Andric SuccWeights.push_back(WeightVal); 934e8d8bef9SDimitry Andric } 935e8d8bef9SDimitry Andric 936e8d8bef9SDimitry Andric // If non of blocks have estimated weight bail out. 937e8d8bef9SDimitry Andric // If TotalWeight is 0 that means weight of each successor is 0 as well and 938e8d8bef9SDimitry Andric // equally likely. Bail out early to not deal with devision by zero. 939e8d8bef9SDimitry Andric if (!FoundEstimatedWeight || TotalWeight == 0) 9400b57cec5SDimitry Andric return false; 9410b57cec5SDimitry Andric 942e8d8bef9SDimitry Andric assert(SuccWeights.size() == succ_size(BB) && "Missed successor?"); 943e8d8bef9SDimitry Andric const unsigned SuccCount = SuccWeights.size(); 9440b57cec5SDimitry Andric 945e8d8bef9SDimitry Andric // If the sum of weights does not fit in 32 bits, scale every weight down 946e8d8bef9SDimitry Andric // accordingly. 947e8d8bef9SDimitry Andric if (TotalWeight > UINT32_MAX) { 948e8d8bef9SDimitry Andric uint64_t ScalingFactor = TotalWeight / UINT32_MAX + 1; 949e8d8bef9SDimitry Andric TotalWeight = 0; 950e8d8bef9SDimitry Andric for (unsigned Idx = 0; Idx < SuccCount; ++Idx) { 951e8d8bef9SDimitry Andric SuccWeights[Idx] /= ScalingFactor; 952e8d8bef9SDimitry Andric if (SuccWeights[Idx] == static_cast<uint32_t>(BlockExecWeight::ZERO)) 953e8d8bef9SDimitry Andric SuccWeights[Idx] = 954e8d8bef9SDimitry Andric static_cast<uint32_t>(BlockExecWeight::LOWEST_NON_ZERO); 955e8d8bef9SDimitry Andric TotalWeight += SuccWeights[Idx]; 956e8d8bef9SDimitry Andric } 957e8d8bef9SDimitry Andric assert(TotalWeight <= UINT32_MAX && "Total weight overflows"); 958e8d8bef9SDimitry Andric } 959e8d8bef9SDimitry Andric 960e8d8bef9SDimitry Andric // Finally set probabilities to edges according to estimated block weights. 9615ffd83dbSDimitry Andric SmallVector<BranchProbability, 4> EdgeProbabilities( 962e8d8bef9SDimitry Andric SuccCount, BranchProbability::getUnknown()); 9630b57cec5SDimitry Andric 964e8d8bef9SDimitry Andric for (unsigned Idx = 0; Idx < SuccCount; ++Idx) { 965e8d8bef9SDimitry Andric EdgeProbabilities[Idx] = 966e8d8bef9SDimitry Andric BranchProbability(SuccWeights[Idx], (uint32_t)TotalWeight); 9670b57cec5SDimitry Andric } 9685ffd83dbSDimitry Andric setEdgeProbability(BB, EdgeProbabilities); 9690b57cec5SDimitry Andric return true; 9700b57cec5SDimitry Andric } 9710b57cec5SDimitry Andric 9720b57cec5SDimitry Andric bool BranchProbabilityInfo::calcZeroHeuristics(const BasicBlock *BB, 9730b57cec5SDimitry Andric const TargetLibraryInfo *TLI) { 9740b57cec5SDimitry Andric const BranchInst *BI = dyn_cast<BranchInst>(BB->getTerminator()); 9750b57cec5SDimitry Andric if (!BI || !BI->isConditional()) 9760b57cec5SDimitry Andric return false; 9770b57cec5SDimitry Andric 9780b57cec5SDimitry Andric Value *Cond = BI->getCondition(); 9790b57cec5SDimitry Andric ICmpInst *CI = dyn_cast<ICmpInst>(Cond); 9800b57cec5SDimitry Andric if (!CI) 9810b57cec5SDimitry Andric return false; 9820b57cec5SDimitry Andric 9830b57cec5SDimitry Andric auto GetConstantInt = [](Value *V) { 9840b57cec5SDimitry Andric if (auto *I = dyn_cast<BitCastInst>(V)) 9850b57cec5SDimitry Andric return dyn_cast<ConstantInt>(I->getOperand(0)); 9860b57cec5SDimitry Andric return dyn_cast<ConstantInt>(V); 9870b57cec5SDimitry Andric }; 9880b57cec5SDimitry Andric 9890b57cec5SDimitry Andric Value *RHS = CI->getOperand(1); 9900b57cec5SDimitry Andric ConstantInt *CV = GetConstantInt(RHS); 9910b57cec5SDimitry Andric if (!CV) 9920b57cec5SDimitry Andric return false; 9930b57cec5SDimitry Andric 9940b57cec5SDimitry Andric // If the LHS is the result of AND'ing a value with a single bit bitmask, 9950b57cec5SDimitry Andric // we don't have information about probabilities. 9960b57cec5SDimitry Andric if (Instruction *LHS = dyn_cast<Instruction>(CI->getOperand(0))) 9970b57cec5SDimitry Andric if (LHS->getOpcode() == Instruction::And) 998e8d8bef9SDimitry Andric if (ConstantInt *AndRHS = GetConstantInt(LHS->getOperand(1))) 9990b57cec5SDimitry Andric if (AndRHS->getValue().isPowerOf2()) 10000b57cec5SDimitry Andric return false; 10010b57cec5SDimitry Andric 10020b57cec5SDimitry Andric // Check if the LHS is the return value of a library function 10030b57cec5SDimitry Andric LibFunc Func = NumLibFuncs; 10040b57cec5SDimitry Andric if (TLI) 10050b57cec5SDimitry Andric if (CallInst *Call = dyn_cast<CallInst>(CI->getOperand(0))) 10060b57cec5SDimitry Andric if (Function *CalledFn = Call->getCalledFunction()) 10070b57cec5SDimitry Andric TLI->getLibFunc(*CalledFn, Func); 10080b57cec5SDimitry Andric 10094824e7fdSDimitry Andric ProbabilityTable::const_iterator Search; 10100b57cec5SDimitry Andric if (Func == LibFunc_strcasecmp || 10110b57cec5SDimitry Andric Func == LibFunc_strcmp || 10120b57cec5SDimitry Andric Func == LibFunc_strncasecmp || 10130b57cec5SDimitry Andric Func == LibFunc_strncmp || 1014e8d8bef9SDimitry Andric Func == LibFunc_memcmp || 1015e8d8bef9SDimitry Andric Func == LibFunc_bcmp) { 10164824e7fdSDimitry Andric Search = ICmpWithLibCallTable.find(CI->getPredicate()); 10174824e7fdSDimitry Andric if (Search == ICmpWithLibCallTable.end()) 10180b57cec5SDimitry Andric return false; 10190b57cec5SDimitry Andric } else if (CV->isZero()) { 10204824e7fdSDimitry Andric Search = ICmpWithZeroTable.find(CI->getPredicate()); 10214824e7fdSDimitry Andric if (Search == ICmpWithZeroTable.end()) 10220b57cec5SDimitry Andric return false; 10234824e7fdSDimitry Andric } else if (CV->isOne()) { 10244824e7fdSDimitry Andric Search = ICmpWithOneTable.find(CI->getPredicate()); 10254824e7fdSDimitry Andric if (Search == ICmpWithOneTable.end()) 10264824e7fdSDimitry Andric return false; 10270b57cec5SDimitry Andric } else if (CV->isMinusOne()) { 10284824e7fdSDimitry Andric Search = ICmpWithMinusOneTable.find(CI->getPredicate()); 10294824e7fdSDimitry Andric if (Search == ICmpWithMinusOneTable.end()) 10300b57cec5SDimitry Andric return false; 10310b57cec5SDimitry Andric } else { 10320b57cec5SDimitry Andric return false; 10330b57cec5SDimitry Andric } 10340b57cec5SDimitry Andric 10354824e7fdSDimitry Andric setEdgeProbability(BB, Search->second); 10360b57cec5SDimitry Andric return true; 10370b57cec5SDimitry Andric } 10380b57cec5SDimitry Andric 10390b57cec5SDimitry Andric bool BranchProbabilityInfo::calcFloatingPointHeuristics(const BasicBlock *BB) { 10400b57cec5SDimitry Andric const BranchInst *BI = dyn_cast<BranchInst>(BB->getTerminator()); 10410b57cec5SDimitry Andric if (!BI || !BI->isConditional()) 10420b57cec5SDimitry Andric return false; 10430b57cec5SDimitry Andric 10440b57cec5SDimitry Andric Value *Cond = BI->getCondition(); 10450b57cec5SDimitry Andric FCmpInst *FCmp = dyn_cast<FCmpInst>(Cond); 10460b57cec5SDimitry Andric if (!FCmp) 10470b57cec5SDimitry Andric return false; 10480b57cec5SDimitry Andric 10494824e7fdSDimitry Andric ProbabilityList ProbList; 10500b57cec5SDimitry Andric if (FCmp->isEquality()) { 10514824e7fdSDimitry Andric ProbList = !FCmp->isTrueWhenEqual() ? 10520b57cec5SDimitry Andric // f1 == f2 -> Unlikely 10534824e7fdSDimitry Andric ProbabilityList({FPTakenProb, FPUntakenProb}) : 10540b57cec5SDimitry Andric // f1 != f2 -> Likely 10554824e7fdSDimitry Andric ProbabilityList({FPUntakenProb, FPTakenProb}); 10560b57cec5SDimitry Andric } else { 10574824e7fdSDimitry Andric auto Search = FCmpTable.find(FCmp->getPredicate()); 10584824e7fdSDimitry Andric if (Search == FCmpTable.end()) 10590b57cec5SDimitry Andric return false; 10604824e7fdSDimitry Andric ProbList = Search->second; 10610b57cec5SDimitry Andric } 10620b57cec5SDimitry Andric 10634824e7fdSDimitry Andric setEdgeProbability(BB, ProbList); 10640b57cec5SDimitry Andric return true; 10650b57cec5SDimitry Andric } 10660b57cec5SDimitry Andric 10670b57cec5SDimitry Andric void BranchProbabilityInfo::releaseMemory() { 10680b57cec5SDimitry Andric Probs.clear(); 10695ffd83dbSDimitry Andric Handles.clear(); 10705ffd83dbSDimitry Andric } 10715ffd83dbSDimitry Andric 10725ffd83dbSDimitry Andric bool BranchProbabilityInfo::invalidate(Function &, const PreservedAnalyses &PA, 10735ffd83dbSDimitry Andric FunctionAnalysisManager::Invalidator &) { 10745ffd83dbSDimitry Andric // Check whether the analysis, all analyses on functions, or the function's 10755ffd83dbSDimitry Andric // CFG have been preserved. 10765ffd83dbSDimitry Andric auto PAC = PA.getChecker<BranchProbabilityAnalysis>(); 10775ffd83dbSDimitry Andric return !(PAC.preserved() || PAC.preservedSet<AllAnalysesOn<Function>>() || 10785ffd83dbSDimitry Andric PAC.preservedSet<CFGAnalyses>()); 10790b57cec5SDimitry Andric } 10800b57cec5SDimitry Andric 10810b57cec5SDimitry Andric void BranchProbabilityInfo::print(raw_ostream &OS) const { 10820b57cec5SDimitry Andric OS << "---- Branch Probabilities ----\n"; 10830b57cec5SDimitry Andric // We print the probabilities from the last function the analysis ran over, 10840b57cec5SDimitry Andric // or the function it is currently running over. 10850b57cec5SDimitry Andric assert(LastF && "Cannot print prior to running over a function"); 10860b57cec5SDimitry Andric for (const auto &BI : *LastF) { 1087fe6060f1SDimitry Andric for (const BasicBlock *Succ : successors(&BI)) 1088fe6060f1SDimitry Andric printEdgeProbability(OS << " ", &BI, Succ); 10890b57cec5SDimitry Andric } 10900b57cec5SDimitry Andric } 10910b57cec5SDimitry Andric 10920b57cec5SDimitry Andric bool BranchProbabilityInfo:: 10930b57cec5SDimitry Andric isEdgeHot(const BasicBlock *Src, const BasicBlock *Dst) const { 10940b57cec5SDimitry Andric // Hot probability is at least 4/5 = 80% 10950b57cec5SDimitry Andric // FIXME: Compare against a static "hot" BranchProbability. 10960b57cec5SDimitry Andric return getEdgeProbability(Src, Dst) > BranchProbability(4, 5); 10970b57cec5SDimitry Andric } 10980b57cec5SDimitry Andric 10990b57cec5SDimitry Andric /// Get the raw edge probability for the edge. If can't find it, return a 11000b57cec5SDimitry Andric /// default probability 1/N where N is the number of successors. Here an edge is 11010b57cec5SDimitry Andric /// specified using PredBlock and an 11020b57cec5SDimitry Andric /// index to the successors. 11030b57cec5SDimitry Andric BranchProbability 11040b57cec5SDimitry Andric BranchProbabilityInfo::getEdgeProbability(const BasicBlock *Src, 11050b57cec5SDimitry Andric unsigned IndexInSuccessors) const { 11060b57cec5SDimitry Andric auto I = Probs.find(std::make_pair(Src, IndexInSuccessors)); 1107e8d8bef9SDimitry Andric assert((Probs.end() == Probs.find(std::make_pair(Src, 0))) == 1108e8d8bef9SDimitry Andric (Probs.end() == I) && 1109e8d8bef9SDimitry Andric "Probability for I-th successor must always be defined along with the " 1110e8d8bef9SDimitry Andric "probability for the first successor"); 11110b57cec5SDimitry Andric 11120b57cec5SDimitry Andric if (I != Probs.end()) 11130b57cec5SDimitry Andric return I->second; 11140b57cec5SDimitry Andric 11150b57cec5SDimitry Andric return {1, static_cast<uint32_t>(succ_size(Src))}; 11160b57cec5SDimitry Andric } 11170b57cec5SDimitry Andric 11180b57cec5SDimitry Andric BranchProbability 11190b57cec5SDimitry Andric BranchProbabilityInfo::getEdgeProbability(const BasicBlock *Src, 11205ffd83dbSDimitry Andric const_succ_iterator Dst) const { 11210b57cec5SDimitry Andric return getEdgeProbability(Src, Dst.getSuccessorIndex()); 11220b57cec5SDimitry Andric } 11230b57cec5SDimitry Andric 11240b57cec5SDimitry Andric /// Get the raw edge probability calculated for the block pair. This returns the 11250b57cec5SDimitry Andric /// sum of all raw edge probabilities from Src to Dst. 11260b57cec5SDimitry Andric BranchProbability 11270b57cec5SDimitry Andric BranchProbabilityInfo::getEdgeProbability(const BasicBlock *Src, 11280b57cec5SDimitry Andric const BasicBlock *Dst) const { 1129e8d8bef9SDimitry Andric if (!Probs.count(std::make_pair(Src, 0))) 1130e8d8bef9SDimitry Andric return BranchProbability(llvm::count(successors(Src), Dst), succ_size(Src)); 11310b57cec5SDimitry Andric 1132e8d8bef9SDimitry Andric auto Prob = BranchProbability::getZero(); 1133e8d8bef9SDimitry Andric for (const_succ_iterator I = succ_begin(Src), E = succ_end(Src); I != E; ++I) 1134e8d8bef9SDimitry Andric if (*I == Dst) 1135e8d8bef9SDimitry Andric Prob += Probs.find(std::make_pair(Src, I.getSuccessorIndex()))->second; 1136e8d8bef9SDimitry Andric 1137e8d8bef9SDimitry Andric return Prob; 11380b57cec5SDimitry Andric } 11390b57cec5SDimitry Andric 11405ffd83dbSDimitry Andric /// Set the edge probability for all edges at once. 11415ffd83dbSDimitry Andric void BranchProbabilityInfo::setEdgeProbability( 11425ffd83dbSDimitry Andric const BasicBlock *Src, const SmallVectorImpl<BranchProbability> &Probs) { 11435ffd83dbSDimitry Andric assert(Src->getTerminator()->getNumSuccessors() == Probs.size()); 1144e8d8bef9SDimitry Andric eraseBlock(Src); // Erase stale data if any. 11455ffd83dbSDimitry Andric if (Probs.size() == 0) 11465ffd83dbSDimitry Andric return; // Nothing to set. 11475ffd83dbSDimitry Andric 1148e8d8bef9SDimitry Andric Handles.insert(BasicBlockCallbackVH(Src, this)); 11495ffd83dbSDimitry Andric uint64_t TotalNumerator = 0; 11505ffd83dbSDimitry Andric for (unsigned SuccIdx = 0; SuccIdx < Probs.size(); ++SuccIdx) { 1151e8d8bef9SDimitry Andric this->Probs[std::make_pair(Src, SuccIdx)] = Probs[SuccIdx]; 1152e8d8bef9SDimitry Andric LLVM_DEBUG(dbgs() << "set edge " << Src->getName() << " -> " << SuccIdx 1153e8d8bef9SDimitry Andric << " successor probability to " << Probs[SuccIdx] 1154e8d8bef9SDimitry Andric << "\n"); 11555ffd83dbSDimitry Andric TotalNumerator += Probs[SuccIdx].getNumerator(); 11565ffd83dbSDimitry Andric } 11575ffd83dbSDimitry Andric 11585ffd83dbSDimitry Andric // Because of rounding errors the total probability cannot be checked to be 11595ffd83dbSDimitry Andric // 1.0 exactly. That is TotalNumerator == BranchProbability::getDenominator. 11605ffd83dbSDimitry Andric // Instead, every single probability in Probs must be as accurate as possible. 11615ffd83dbSDimitry Andric // This results in error 1/denominator at most, thus the total absolute error 11625ffd83dbSDimitry Andric // should be within Probs.size / BranchProbability::getDenominator. 11635ffd83dbSDimitry Andric assert(TotalNumerator <= BranchProbability::getDenominator() + Probs.size()); 11645ffd83dbSDimitry Andric assert(TotalNumerator >= BranchProbability::getDenominator() - Probs.size()); 1165fe6060f1SDimitry Andric (void)TotalNumerator; 11665ffd83dbSDimitry Andric } 11675ffd83dbSDimitry Andric 1168e8d8bef9SDimitry Andric void BranchProbabilityInfo::copyEdgeProbabilities(BasicBlock *Src, 1169e8d8bef9SDimitry Andric BasicBlock *Dst) { 1170e8d8bef9SDimitry Andric eraseBlock(Dst); // Erase stale data if any. 1171e8d8bef9SDimitry Andric unsigned NumSuccessors = Src->getTerminator()->getNumSuccessors(); 1172e8d8bef9SDimitry Andric assert(NumSuccessors == Dst->getTerminator()->getNumSuccessors()); 1173e8d8bef9SDimitry Andric if (NumSuccessors == 0) 1174e8d8bef9SDimitry Andric return; // Nothing to set. 1175e8d8bef9SDimitry Andric if (this->Probs.find(std::make_pair(Src, 0)) == this->Probs.end()) 1176e8d8bef9SDimitry Andric return; // No probability is set for edges from Src. Keep the same for Dst. 1177e8d8bef9SDimitry Andric 1178e8d8bef9SDimitry Andric Handles.insert(BasicBlockCallbackVH(Dst, this)); 1179e8d8bef9SDimitry Andric for (unsigned SuccIdx = 0; SuccIdx < NumSuccessors; ++SuccIdx) { 1180e8d8bef9SDimitry Andric auto Prob = this->Probs[std::make_pair(Src, SuccIdx)]; 1181e8d8bef9SDimitry Andric this->Probs[std::make_pair(Dst, SuccIdx)] = Prob; 1182e8d8bef9SDimitry Andric LLVM_DEBUG(dbgs() << "set edge " << Dst->getName() << " -> " << SuccIdx 1183e8d8bef9SDimitry Andric << " successor probability to " << Prob << "\n"); 1184e8d8bef9SDimitry Andric } 1185e8d8bef9SDimitry Andric } 1186e8d8bef9SDimitry Andric 11870b57cec5SDimitry Andric raw_ostream & 11880b57cec5SDimitry Andric BranchProbabilityInfo::printEdgeProbability(raw_ostream &OS, 11890b57cec5SDimitry Andric const BasicBlock *Src, 11900b57cec5SDimitry Andric const BasicBlock *Dst) const { 11910b57cec5SDimitry Andric const BranchProbability Prob = getEdgeProbability(Src, Dst); 11920b57cec5SDimitry Andric OS << "edge " << Src->getName() << " -> " << Dst->getName() 11930b57cec5SDimitry Andric << " probability is " << Prob 11940b57cec5SDimitry Andric << (isEdgeHot(Src, Dst) ? " [HOT edge]\n" : "\n"); 11950b57cec5SDimitry Andric 11960b57cec5SDimitry Andric return OS; 11970b57cec5SDimitry Andric } 11980b57cec5SDimitry Andric 11990b57cec5SDimitry Andric void BranchProbabilityInfo::eraseBlock(const BasicBlock *BB) { 1200e8d8bef9SDimitry Andric LLVM_DEBUG(dbgs() << "eraseBlock " << BB->getName() << "\n"); 1201e8d8bef9SDimitry Andric 1202e8d8bef9SDimitry Andric // Note that we cannot use successors of BB because the terminator of BB may 1203e8d8bef9SDimitry Andric // have changed when eraseBlock is called as a BasicBlockCallbackVH callback. 1204e8d8bef9SDimitry Andric // Instead we remove prob data for the block by iterating successors by their 1205e8d8bef9SDimitry Andric // indices from 0 till the last which exists. There could not be prob data for 1206e8d8bef9SDimitry Andric // a pair (BB, N) if there is no data for (BB, N-1) because the data is always 1207e8d8bef9SDimitry Andric // set for all successors from 0 to M at once by the method 1208e8d8bef9SDimitry Andric // setEdgeProbability(). 1209e8d8bef9SDimitry Andric Handles.erase(BasicBlockCallbackVH(BB, this)); 1210e8d8bef9SDimitry Andric for (unsigned I = 0;; ++I) { 1211e8d8bef9SDimitry Andric auto MapI = Probs.find(std::make_pair(BB, I)); 1212e8d8bef9SDimitry Andric if (MapI == Probs.end()) { 1213e8d8bef9SDimitry Andric assert(Probs.count(std::make_pair(BB, I + 1)) == 0 && 1214e8d8bef9SDimitry Andric "Must be no more successors"); 1215e8d8bef9SDimitry Andric return; 1216e8d8bef9SDimitry Andric } 12175ffd83dbSDimitry Andric Probs.erase(MapI); 12180b57cec5SDimitry Andric } 12190b57cec5SDimitry Andric } 12200b57cec5SDimitry Andric 1221e8d8bef9SDimitry Andric void BranchProbabilityInfo::calculate(const Function &F, const LoopInfo &LoopI, 12225ffd83dbSDimitry Andric const TargetLibraryInfo *TLI, 1223e8d8bef9SDimitry Andric DominatorTree *DT, 12245ffd83dbSDimitry Andric PostDominatorTree *PDT) { 12250b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "---- Branch Probability Info : " << F.getName() 12260b57cec5SDimitry Andric << " ----\n\n"); 12270b57cec5SDimitry Andric LastF = &F; // Store the last function we ran on for printing. 1228e8d8bef9SDimitry Andric LI = &LoopI; 12290b57cec5SDimitry Andric 1230e8d8bef9SDimitry Andric SccI = std::make_unique<SccInfo>(F); 12310b57cec5SDimitry Andric 1232e8d8bef9SDimitry Andric assert(EstimatedBlockWeight.empty()); 1233e8d8bef9SDimitry Andric assert(EstimatedLoopWeight.empty()); 12340b57cec5SDimitry Andric 1235e8d8bef9SDimitry Andric std::unique_ptr<DominatorTree> DTPtr; 12365ffd83dbSDimitry Andric std::unique_ptr<PostDominatorTree> PDTPtr; 12375ffd83dbSDimitry Andric 1238e8d8bef9SDimitry Andric if (!DT) { 1239e8d8bef9SDimitry Andric DTPtr = std::make_unique<DominatorTree>(const_cast<Function &>(F)); 1240e8d8bef9SDimitry Andric DT = DTPtr.get(); 1241e8d8bef9SDimitry Andric } 1242e8d8bef9SDimitry Andric 12435ffd83dbSDimitry Andric if (!PDT) { 12445ffd83dbSDimitry Andric PDTPtr = std::make_unique<PostDominatorTree>(const_cast<Function &>(F)); 12455ffd83dbSDimitry Andric PDT = PDTPtr.get(); 12465ffd83dbSDimitry Andric } 12475ffd83dbSDimitry Andric 1248e8d8bef9SDimitry Andric computeEestimateBlockWeight(F, DT, PDT); 1249480093f4SDimitry Andric 12500b57cec5SDimitry Andric // Walk the basic blocks in post-order so that we can build up state about 12510b57cec5SDimitry Andric // the successors of a block iteratively. 12520b57cec5SDimitry Andric for (auto BB : post_order(&F.getEntryBlock())) { 12530b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "Computing probabilities for " << BB->getName() 12540b57cec5SDimitry Andric << "\n"); 12550b57cec5SDimitry Andric // If there is no at least two successors, no sense to set probability. 12560b57cec5SDimitry Andric if (BB->getTerminator()->getNumSuccessors() < 2) 12570b57cec5SDimitry Andric continue; 12580b57cec5SDimitry Andric if (calcMetadataWeights(BB)) 12590b57cec5SDimitry Andric continue; 1260e8d8bef9SDimitry Andric if (calcEstimatedHeuristics(BB)) 12610b57cec5SDimitry Andric continue; 12620b57cec5SDimitry Andric if (calcPointerHeuristics(BB)) 12630b57cec5SDimitry Andric continue; 12640b57cec5SDimitry Andric if (calcZeroHeuristics(BB, TLI)) 12650b57cec5SDimitry Andric continue; 12660b57cec5SDimitry Andric if (calcFloatingPointHeuristics(BB)) 12670b57cec5SDimitry Andric continue; 12680b57cec5SDimitry Andric } 12690b57cec5SDimitry Andric 1270e8d8bef9SDimitry Andric EstimatedLoopWeight.clear(); 1271e8d8bef9SDimitry Andric EstimatedBlockWeight.clear(); 1272e8d8bef9SDimitry Andric SccI.reset(); 12730b57cec5SDimitry Andric 12740b57cec5SDimitry Andric if (PrintBranchProb && 12750b57cec5SDimitry Andric (PrintBranchProbFuncName.empty() || 12760b57cec5SDimitry Andric F.getName().equals(PrintBranchProbFuncName))) { 12770b57cec5SDimitry Andric print(dbgs()); 12780b57cec5SDimitry Andric } 12790b57cec5SDimitry Andric } 12800b57cec5SDimitry Andric 12810b57cec5SDimitry Andric void BranchProbabilityInfoWrapperPass::getAnalysisUsage( 12820b57cec5SDimitry Andric AnalysisUsage &AU) const { 12830b57cec5SDimitry Andric // We require DT so it's available when LI is available. The LI updating code 12840b57cec5SDimitry Andric // asserts that DT is also present so if we don't make sure that we have DT 12850b57cec5SDimitry Andric // here, that assert will trigger. 12860b57cec5SDimitry Andric AU.addRequired<DominatorTreeWrapperPass>(); 12870b57cec5SDimitry Andric AU.addRequired<LoopInfoWrapperPass>(); 12880b57cec5SDimitry Andric AU.addRequired<TargetLibraryInfoWrapperPass>(); 1289e8d8bef9SDimitry Andric AU.addRequired<DominatorTreeWrapperPass>(); 12905ffd83dbSDimitry Andric AU.addRequired<PostDominatorTreeWrapperPass>(); 12910b57cec5SDimitry Andric AU.setPreservesAll(); 12920b57cec5SDimitry Andric } 12930b57cec5SDimitry Andric 12940b57cec5SDimitry Andric bool BranchProbabilityInfoWrapperPass::runOnFunction(Function &F) { 12950b57cec5SDimitry Andric const LoopInfo &LI = getAnalysis<LoopInfoWrapperPass>().getLoopInfo(); 12968bcb0991SDimitry Andric const TargetLibraryInfo &TLI = 12978bcb0991SDimitry Andric getAnalysis<TargetLibraryInfoWrapperPass>().getTLI(F); 1298e8d8bef9SDimitry Andric DominatorTree &DT = getAnalysis<DominatorTreeWrapperPass>().getDomTree(); 12995ffd83dbSDimitry Andric PostDominatorTree &PDT = 13005ffd83dbSDimitry Andric getAnalysis<PostDominatorTreeWrapperPass>().getPostDomTree(); 1301e8d8bef9SDimitry Andric BPI.calculate(F, LI, &TLI, &DT, &PDT); 13020b57cec5SDimitry Andric return false; 13030b57cec5SDimitry Andric } 13040b57cec5SDimitry Andric 13050b57cec5SDimitry Andric void BranchProbabilityInfoWrapperPass::releaseMemory() { BPI.releaseMemory(); } 13060b57cec5SDimitry Andric 13070b57cec5SDimitry Andric void BranchProbabilityInfoWrapperPass::print(raw_ostream &OS, 13080b57cec5SDimitry Andric const Module *) const { 13090b57cec5SDimitry Andric BPI.print(OS); 13100b57cec5SDimitry Andric } 13110b57cec5SDimitry Andric 13120b57cec5SDimitry Andric AnalysisKey BranchProbabilityAnalysis::Key; 13130b57cec5SDimitry Andric BranchProbabilityInfo 13140b57cec5SDimitry Andric BranchProbabilityAnalysis::run(Function &F, FunctionAnalysisManager &AM) { 13150b57cec5SDimitry Andric BranchProbabilityInfo BPI; 13165ffd83dbSDimitry Andric BPI.calculate(F, AM.getResult<LoopAnalysis>(F), 13175ffd83dbSDimitry Andric &AM.getResult<TargetLibraryAnalysis>(F), 1318e8d8bef9SDimitry Andric &AM.getResult<DominatorTreeAnalysis>(F), 13195ffd83dbSDimitry Andric &AM.getResult<PostDominatorTreeAnalysis>(F)); 13200b57cec5SDimitry Andric return BPI; 13210b57cec5SDimitry Andric } 13220b57cec5SDimitry Andric 13230b57cec5SDimitry Andric PreservedAnalyses 13240b57cec5SDimitry Andric BranchProbabilityPrinterPass::run(Function &F, FunctionAnalysisManager &AM) { 13250b57cec5SDimitry Andric OS << "Printing analysis results of BPI for function " 13260b57cec5SDimitry Andric << "'" << F.getName() << "':" 13270b57cec5SDimitry Andric << "\n"; 13280b57cec5SDimitry Andric AM.getResult<BranchProbabilityAnalysis>(F).print(OS); 13290b57cec5SDimitry Andric return PreservedAnalyses::all(); 13300b57cec5SDimitry Andric } 1331