//===- IndirectBrExpandPass.cpp - Expand indirectbr to switch -------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// /// \file /// /// Implements an expansion pass to turn `indirectbr` instructions in the IR /// into `switch` instructions. This works by enumerating the basic blocks in /// a dense range of integers, replacing each `blockaddr` constant with the /// corresponding integer constant, and then building a switch that maps from /// the integers to the actual blocks. All of the indirectbr instructions in the /// function are redirected to this common switch. /// /// While this is generically useful if a target is unable to codegen /// `indirectbr` natively, it is primarily useful when there is some desire to /// get the builtin non-jump-table lowering of a switch even when the input /// source contained an explicit indirect branch construct. /// /// Note that it doesn't make any sense to enable this pass unless a target also /// disables jump-table lowering of switches. Doing that is likely to pessimize /// the code. /// //===----------------------------------------------------------------------===// #include "llvm/ADT/STLExtras.h" #include "llvm/ADT/Sequence.h" #include "llvm/ADT/SmallVector.h" #include "llvm/Analysis/DomTreeUpdater.h" #include "llvm/CodeGen/TargetPassConfig.h" #include "llvm/CodeGen/TargetSubtargetInfo.h" #include "llvm/IR/BasicBlock.h" #include "llvm/IR/Constants.h" #include "llvm/IR/Dominators.h" #include "llvm/IR/Function.h" #include "llvm/IR/Instructions.h" #include "llvm/InitializePasses.h" #include "llvm/Pass.h" #include "llvm/Support/ErrorHandling.h" #include "llvm/Target/TargetMachine.h" #include using namespace llvm; #define DEBUG_TYPE "indirectbr-expand" namespace { class IndirectBrExpandPass : public FunctionPass { const TargetLowering *TLI = nullptr; public: static char ID; // Pass identification, replacement for typeid IndirectBrExpandPass() : FunctionPass(ID) { initializeIndirectBrExpandPassPass(*PassRegistry::getPassRegistry()); } void getAnalysisUsage(AnalysisUsage &AU) const override { AU.addPreserved(); } bool runOnFunction(Function &F) override; }; } // end anonymous namespace char IndirectBrExpandPass::ID = 0; INITIALIZE_PASS_BEGIN(IndirectBrExpandPass, DEBUG_TYPE, "Expand indirectbr instructions", false, false) INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass) INITIALIZE_PASS_END(IndirectBrExpandPass, DEBUG_TYPE, "Expand indirectbr instructions", false, false) FunctionPass *llvm::createIndirectBrExpandPass() { return new IndirectBrExpandPass(); } bool IndirectBrExpandPass::runOnFunction(Function &F) { auto &DL = F.getParent()->getDataLayout(); auto *TPC = getAnalysisIfAvailable(); if (!TPC) return false; auto &TM = TPC->getTM(); auto &STI = *TM.getSubtargetImpl(F); if (!STI.enableIndirectBrExpand()) return false; TLI = STI.getTargetLowering(); std::optional DTU; if (auto *DTWP = getAnalysisIfAvailable()) DTU.emplace(DTWP->getDomTree(), DomTreeUpdater::UpdateStrategy::Lazy); SmallVector IndirectBrs; // Set of all potential successors for indirectbr instructions. SmallPtrSet IndirectBrSuccs; // Build a list of indirectbrs that we want to rewrite. for (BasicBlock &BB : F) if (auto *IBr = dyn_cast(BB.getTerminator())) { // Handle the degenerate case of no successors by replacing the indirectbr // with unreachable as there is no successor available. if (IBr->getNumSuccessors() == 0) { (void)new UnreachableInst(F.getContext(), IBr); IBr->eraseFromParent(); continue; } IndirectBrs.push_back(IBr); for (BasicBlock *SuccBB : IBr->successors()) IndirectBrSuccs.insert(SuccBB); } if (IndirectBrs.empty()) return false; // If we need to replace any indirectbrs we need to establish integer // constants that will correspond to each of the basic blocks in the function // whose address escapes. We do that here and rewrite all the blockaddress // constants to just be those integer constants cast to a pointer type. SmallVector BBs; for (BasicBlock &BB : F) { // Skip blocks that aren't successors to an indirectbr we're going to // rewrite. if (!IndirectBrSuccs.count(&BB)) continue; auto IsBlockAddressUse = [&](const Use &U) { return isa(U.getUser()); }; auto BlockAddressUseIt = llvm::find_if(BB.uses(), IsBlockAddressUse); if (BlockAddressUseIt == BB.use_end()) continue; assert(std::find_if(std::next(BlockAddressUseIt), BB.use_end(), IsBlockAddressUse) == BB.use_end() && "There should only ever be a single blockaddress use because it is " "a constant and should be uniqued."); auto *BA = cast(BlockAddressUseIt->getUser()); // Skip if the constant was formed but ended up not being used (due to DCE // or whatever). if (!BA->isConstantUsed()) continue; // Compute the index we want to use for this basic block. We can't use zero // because null can be compared with block addresses. int BBIndex = BBs.size() + 1; BBs.push_back(&BB); auto *ITy = cast(DL.getIntPtrType(BA->getType())); ConstantInt *BBIndexC = ConstantInt::get(ITy, BBIndex); // Now rewrite the blockaddress to an integer constant based on the index. // FIXME: This part doesn't properly recognize other uses of blockaddress // expressions, for instance, where they are used to pass labels to // asm-goto. This part of the pass needs a rework. BA->replaceAllUsesWith(ConstantExpr::getIntToPtr(BBIndexC, BA->getType())); } if (BBs.empty()) { // There are no blocks whose address is taken, so any indirectbr instruction // cannot get a valid input and we can replace all of them with unreachable. SmallVector Updates; if (DTU) Updates.reserve(IndirectBrSuccs.size()); for (auto *IBr : IndirectBrs) { if (DTU) { for (BasicBlock *SuccBB : IBr->successors()) Updates.push_back({DominatorTree::Delete, IBr->getParent(), SuccBB}); } (void)new UnreachableInst(F.getContext(), IBr); IBr->eraseFromParent(); } if (DTU) { assert(Updates.size() == IndirectBrSuccs.size() && "Got unexpected update count."); DTU->applyUpdates(Updates); } return true; } BasicBlock *SwitchBB; Value *SwitchValue; // Compute a common integer type across all the indirectbr instructions. IntegerType *CommonITy = nullptr; for (auto *IBr : IndirectBrs) { auto *ITy = cast(DL.getIntPtrType(IBr->getAddress()->getType())); if (!CommonITy || ITy->getBitWidth() > CommonITy->getBitWidth()) CommonITy = ITy; } auto GetSwitchValue = [CommonITy](IndirectBrInst *IBr) { return CastInst::CreatePointerCast( IBr->getAddress(), CommonITy, Twine(IBr->getAddress()->getName()) + ".switch_cast", IBr); }; SmallVector Updates; if (IndirectBrs.size() == 1) { // If we only have one indirectbr, we can just directly replace it within // its block. IndirectBrInst *IBr = IndirectBrs[0]; SwitchBB = IBr->getParent(); SwitchValue = GetSwitchValue(IBr); if (DTU) { Updates.reserve(IndirectBrSuccs.size()); for (BasicBlock *SuccBB : IBr->successors()) Updates.push_back({DominatorTree::Delete, IBr->getParent(), SuccBB}); assert(Updates.size() == IndirectBrSuccs.size() && "Got unexpected update count."); } IBr->eraseFromParent(); } else { // Otherwise we need to create a new block to hold the switch across BBs, // jump to that block instead of each indirectbr, and phi together the // values for the switch. SwitchBB = BasicBlock::Create(F.getContext(), "switch_bb", &F); auto *SwitchPN = PHINode::Create(CommonITy, IndirectBrs.size(), "switch_value_phi", SwitchBB); SwitchValue = SwitchPN; // Now replace the indirectbr instructions with direct branches to the // switch block and fill out the PHI operands. if (DTU) Updates.reserve(IndirectBrs.size() + 2 * IndirectBrSuccs.size()); for (auto *IBr : IndirectBrs) { SwitchPN->addIncoming(GetSwitchValue(IBr), IBr->getParent()); BranchInst::Create(SwitchBB, IBr); if (DTU) { Updates.push_back({DominatorTree::Insert, IBr->getParent(), SwitchBB}); for (BasicBlock *SuccBB : IBr->successors()) Updates.push_back({DominatorTree::Delete, IBr->getParent(), SuccBB}); } IBr->eraseFromParent(); } } // Now build the switch in the block. The block will have no terminator // already. auto *SI = SwitchInst::Create(SwitchValue, BBs[0], BBs.size(), SwitchBB); // Add a case for each block. for (int i : llvm::seq(1, BBs.size())) SI->addCase(ConstantInt::get(CommonITy, i + 1), BBs[i]); if (DTU) { // If there were multiple indirectbr's, they may have common successors, // but in the dominator tree, we only track unique edges. SmallPtrSet UniqueSuccessors; Updates.reserve(Updates.size() + BBs.size()); for (BasicBlock *BB : BBs) { if (UniqueSuccessors.insert(BB).second) Updates.push_back({DominatorTree::Insert, SwitchBB, BB}); } DTU->applyUpdates(Updates); } return true; }