//===- HexagonOptAddrMode.cpp ---------------------------------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // This implements a Hexagon-specific pass to optimize addressing mode for // load/store instructions. //===----------------------------------------------------------------------===// #include "HexagonInstrInfo.h" #include "HexagonSubtarget.h" #include "MCTargetDesc/HexagonBaseInfo.h" #include "llvm/ADT/DenseMap.h" #include "llvm/ADT/DenseSet.h" #include "llvm/ADT/StringRef.h" #include "llvm/CodeGen/MachineBasicBlock.h" #include "llvm/CodeGen/MachineDominanceFrontier.h" #include "llvm/CodeGen/MachineDominators.h" #include "llvm/CodeGen/MachineFunction.h" #include "llvm/CodeGen/MachineFunctionPass.h" #include "llvm/CodeGen/MachineInstr.h" #include "llvm/CodeGen/MachineInstrBuilder.h" #include "llvm/CodeGen/MachineOperand.h" #include "llvm/CodeGen/MachineRegisterInfo.h" #include "llvm/CodeGen/RDFGraph.h" #include "llvm/CodeGen/RDFLiveness.h" #include "llvm/CodeGen/RDFRegisters.h" #include "llvm/CodeGen/TargetSubtargetInfo.h" #include "llvm/InitializePasses.h" #include "llvm/MC/MCInstrDesc.h" #include "llvm/Pass.h" #include "llvm/Support/CommandLine.h" #include "llvm/Support/Debug.h" #include "llvm/Support/ErrorHandling.h" #include "llvm/Support/raw_ostream.h" #include #include #define DEBUG_TYPE "opt-addr-mode" using namespace llvm; using namespace rdf; static cl::opt CodeGrowthLimit("hexagon-amode-growth-limit", cl::Hidden, cl::init(0), cl::desc("Code growth limit for address mode " "optimization")); namespace llvm { FunctionPass *createHexagonOptAddrMode(); void initializeHexagonOptAddrModePass(PassRegistry&); } // end namespace llvm namespace { class HexagonOptAddrMode : public MachineFunctionPass { public: static char ID; HexagonOptAddrMode() : MachineFunctionPass(ID) {} StringRef getPassName() const override { return "Optimize addressing mode of load/store"; } void getAnalysisUsage(AnalysisUsage &AU) const override { MachineFunctionPass::getAnalysisUsage(AU); AU.addRequired(); AU.addRequired(); AU.setPreservesAll(); } bool runOnMachineFunction(MachineFunction &MF) override; private: using MISetType = DenseSet; using InstrEvalMap = DenseMap; MachineRegisterInfo *MRI = nullptr; const HexagonInstrInfo *HII = nullptr; const HexagonRegisterInfo *HRI = nullptr; MachineDominatorTree *MDT = nullptr; DataFlowGraph *DFG = nullptr; DataFlowGraph::DefStackMap DefM; Liveness *LV = nullptr; MISetType Deleted; bool processBlock(NodeAddr BA); bool xformUseMI(MachineInstr *TfrMI, MachineInstr *UseMI, NodeAddr UseN, unsigned UseMOnum); bool processAddUses(NodeAddr AddSN, MachineInstr *AddMI, const NodeList &UNodeList); bool updateAddUses(MachineInstr *AddMI, MachineInstr *UseMI); bool analyzeUses(unsigned DefR, const NodeList &UNodeList, InstrEvalMap &InstrEvalResult, short &SizeInc); bool hasRepForm(MachineInstr &MI, unsigned TfrDefR); bool canRemoveAddasl(NodeAddr AddAslSN, MachineInstr &MI, const NodeList &UNodeList); bool isSafeToExtLR(NodeAddr SN, MachineInstr *MI, unsigned LRExtReg, const NodeList &UNodeList); void getAllRealUses(NodeAddr SN, NodeList &UNodeList); bool allValidCandidates(NodeAddr SA, NodeList &UNodeList); short getBaseWithLongOffset(const MachineInstr &MI) const; bool changeStore(MachineInstr *OldMI, MachineOperand ImmOp, unsigned ImmOpNum); bool changeLoad(MachineInstr *OldMI, MachineOperand ImmOp, unsigned ImmOpNum); bool changeAddAsl(NodeAddr AddAslUN, MachineInstr *AddAslMI, const MachineOperand &ImmOp, unsigned ImmOpNum); bool isValidOffset(MachineInstr *MI, int Offset); unsigned getBaseOpPosition(MachineInstr *MI); unsigned getOffsetOpPosition(MachineInstr *MI); }; } // end anonymous namespace char HexagonOptAddrMode::ID = 0; INITIALIZE_PASS_BEGIN(HexagonOptAddrMode, "amode-opt", "Optimize addressing mode", false, false) INITIALIZE_PASS_DEPENDENCY(MachineDominatorTree) INITIALIZE_PASS_DEPENDENCY(MachineDominanceFrontier) INITIALIZE_PASS_END(HexagonOptAddrMode, "amode-opt", "Optimize addressing mode", false, false) bool HexagonOptAddrMode::hasRepForm(MachineInstr &MI, unsigned TfrDefR) { const MCInstrDesc &MID = MI.getDesc(); if ((!MID.mayStore() && !MID.mayLoad()) || HII->isPredicated(MI)) return false; if (MID.mayStore()) { MachineOperand StOp = MI.getOperand(MI.getNumOperands() - 1); if (StOp.isReg() && StOp.getReg() == TfrDefR) return false; } if (HII->getAddrMode(MI) == HexagonII::BaseRegOffset) // Tranform to Absolute plus register offset. return (HII->changeAddrMode_rr_ur(MI) >= 0); else if (HII->getAddrMode(MI) == HexagonII::BaseImmOffset) // Tranform to absolute addressing mode. return (HII->changeAddrMode_io_abs(MI) >= 0); return false; } // Check if addasl instruction can be removed. This is possible only // if it's feeding to only load/store instructions with base + register // offset as these instruction can be tranformed to use 'absolute plus // shifted register offset'. // ex: // Rs = ##foo // Rx = addasl(Rs, Rt, #2) // Rd = memw(Rx + #28) // Above three instructions can be replaced with Rd = memw(Rt<<#2 + ##foo+28) bool HexagonOptAddrMode::canRemoveAddasl(NodeAddr AddAslSN, MachineInstr &MI, const NodeList &UNodeList) { // check offset size in addasl. if 'offset > 3' return false const MachineOperand &OffsetOp = MI.getOperand(3); if (!OffsetOp.isImm() || OffsetOp.getImm() > 3) return false; Register OffsetReg = MI.getOperand(2).getReg(); RegisterRef OffsetRR; NodeId OffsetRegRD = 0; for (NodeAddr UA : AddAslSN.Addr->members_if(DFG->IsUse, *DFG)) { RegisterRef RR = UA.Addr->getRegRef(*DFG); if (OffsetReg == RR.Reg) { OffsetRR = RR; OffsetRegRD = UA.Addr->getReachingDef(); } } for (auto I = UNodeList.rbegin(), E = UNodeList.rend(); I != E; ++I) { NodeAddr UA = *I; NodeAddr IA = UA.Addr->getOwner(*DFG); if (UA.Addr->getFlags() & NodeAttrs::PhiRef) return false; NodeAddr AA = LV->getNearestAliasedRef(OffsetRR, IA); if ((DFG->IsDef(AA) && AA.Id != OffsetRegRD) || AA.Addr->getReachingDef() != OffsetRegRD) return false; MachineInstr &UseMI = *NodeAddr(IA).Addr->getCode(); NodeAddr OffsetRegDN = DFG->addr(OffsetRegRD); // Reaching Def to an offset register can't be a phi. if ((OffsetRegDN.Addr->getFlags() & NodeAttrs::PhiRef) && MI.getParent() != UseMI.getParent()) return false; const MCInstrDesc &UseMID = UseMI.getDesc(); if ((!UseMID.mayLoad() && !UseMID.mayStore()) || HII->getAddrMode(UseMI) != HexagonII::BaseImmOffset || getBaseWithLongOffset(UseMI) < 0) return false; // Addasl output can't be a store value. if (UseMID.mayStore() && UseMI.getOperand(2).isReg() && UseMI.getOperand(2).getReg() == MI.getOperand(0).getReg()) return false; for (auto &Mo : UseMI.operands()) if (Mo.isFI()) return false; } return true; } bool HexagonOptAddrMode::allValidCandidates(NodeAddr SA, NodeList &UNodeList) { for (auto I = UNodeList.rbegin(), E = UNodeList.rend(); I != E; ++I) { NodeAddr UN = *I; RegisterRef UR = UN.Addr->getRegRef(*DFG); NodeSet Visited, Defs; const auto &P = LV->getAllReachingDefsRec(UR, UN, Visited, Defs); if (!P.second) { LLVM_DEBUG({ dbgs() << "*** Unable to collect all reaching defs for use ***\n" << PrintNode(UN, *DFG) << '\n' << "The program's complexity may exceed the limits.\n"; }); return false; } const auto &ReachingDefs = P.first; if (ReachingDefs.size() > 1) { LLVM_DEBUG({ dbgs() << "*** Multiple Reaching Defs found!!! ***\n"; for (auto DI : ReachingDefs) { NodeAddr DA = DFG->addr(DI); NodeAddr TempIA = DA.Addr->getOwner(*DFG); dbgs() << "\t\t[Reaching Def]: " << Print>(TempIA, *DFG) << "\n"; } }); return false; } } return true; } void HexagonOptAddrMode::getAllRealUses(NodeAddr SA, NodeList &UNodeList) { for (NodeAddr DA : SA.Addr->members_if(DFG->IsDef, *DFG)) { LLVM_DEBUG(dbgs() << "\t\t[DefNode]: " << Print>(DA, *DFG) << "\n"); RegisterRef DR = DA.Addr->getRegRef(*DFG); auto UseSet = LV->getAllReachedUses(DR, DA); for (auto UI : UseSet) { NodeAddr UA = DFG->addr(UI); LLVM_DEBUG({ NodeAddr TempIA = UA.Addr->getOwner(*DFG); dbgs() << "\t\t\t[Reached Use]: " << Print>(TempIA, *DFG) << "\n"; }); if (UA.Addr->getFlags() & NodeAttrs::PhiRef) { NodeAddr PA = UA.Addr->getOwner(*DFG); NodeId id = PA.Id; const Liveness::RefMap &phiUse = LV->getRealUses(id); LLVM_DEBUG(dbgs() << "\t\t\t\tphi real Uses" << Print(phiUse, *DFG) << "\n"); if (!phiUse.empty()) { for (auto I : phiUse) { if (!DFG->getPRI().alias(RegisterRef(I.first), DR)) continue; auto phiUseSet = I.second; for (auto phiUI : phiUseSet) { NodeAddr phiUA = DFG->addr(phiUI.first); UNodeList.push_back(phiUA); } } } } else UNodeList.push_back(UA); } } } bool HexagonOptAddrMode::isSafeToExtLR(NodeAddr SN, MachineInstr *MI, unsigned LRExtReg, const NodeList &UNodeList) { RegisterRef LRExtRR; NodeId LRExtRegRD = 0; // Iterate through all the UseNodes in SN and find the reaching def // for the LRExtReg. for (NodeAddr UA : SN.Addr->members_if(DFG->IsUse, *DFG)) { RegisterRef RR = UA.Addr->getRegRef(*DFG); if (LRExtReg == RR.Reg) { LRExtRR = RR; LRExtRegRD = UA.Addr->getReachingDef(); } } for (auto I = UNodeList.rbegin(), E = UNodeList.rend(); I != E; ++I) { NodeAddr UA = *I; NodeAddr IA = UA.Addr->getOwner(*DFG); // The reaching def of LRExtRR at load/store node should be same as the // one reaching at the SN. if (UA.Addr->getFlags() & NodeAttrs::PhiRef) return false; NodeAddr AA = LV->getNearestAliasedRef(LRExtRR, IA); if ((DFG->IsDef(AA) && AA.Id != LRExtRegRD) || AA.Addr->getReachingDef() != LRExtRegRD) { LLVM_DEBUG( dbgs() << "isSafeToExtLR: Returning false; another reaching def\n"); return false; } // If the register is undefined (for example if it's a reserved register), // it may still be possible to extend the range, but it's safer to be // conservative and just punt. if (LRExtRegRD == 0) return false; MachineInstr *UseMI = NodeAddr(IA).Addr->getCode(); NodeAddr LRExtRegDN = DFG->addr(LRExtRegRD); // Reaching Def to LRExtReg can't be a phi. if ((LRExtRegDN.Addr->getFlags() & NodeAttrs::PhiRef) && MI->getParent() != UseMI->getParent()) return false; } return true; } bool HexagonOptAddrMode::isValidOffset(MachineInstr *MI, int Offset) { if (HII->isHVXVec(*MI)) { // only HVX vgather instructions handled // TODO: extend the pass to other vector load/store operations switch (MI->getOpcode()) { case Hexagon::V6_vgathermh_pseudo: case Hexagon::V6_vgathermw_pseudo: case Hexagon::V6_vgathermhw_pseudo: case Hexagon::V6_vgathermhq_pseudo: case Hexagon::V6_vgathermwq_pseudo: case Hexagon::V6_vgathermhwq_pseudo: return HII->isValidOffset(MI->getOpcode(), Offset, HRI, false); default: return false; } } if (HII->getAddrMode(*MI) != HexagonII::BaseImmOffset) return false; unsigned AlignMask = 0; switch (HII->getMemAccessSize(*MI)) { case HexagonII::MemAccessSize::DoubleWordAccess: AlignMask = 0x7; break; case HexagonII::MemAccessSize::WordAccess: AlignMask = 0x3; break; case HexagonII::MemAccessSize::HalfWordAccess: AlignMask = 0x1; break; case HexagonII::MemAccessSize::ByteAccess: AlignMask = 0x0; break; default: return false; } if ((AlignMask & Offset) != 0) return false; return HII->isValidOffset(MI->getOpcode(), Offset, HRI, false); } unsigned HexagonOptAddrMode::getBaseOpPosition(MachineInstr *MI) { const MCInstrDesc &MID = MI->getDesc(); switch (MI->getOpcode()) { // vgather pseudos are mayLoad and mayStore // hence need to explicitly specify Base and // Offset operand positions case Hexagon::V6_vgathermh_pseudo: case Hexagon::V6_vgathermw_pseudo: case Hexagon::V6_vgathermhw_pseudo: case Hexagon::V6_vgathermhq_pseudo: case Hexagon::V6_vgathermwq_pseudo: case Hexagon::V6_vgathermhwq_pseudo: return 0; default: return MID.mayLoad() ? 1 : 0; } } unsigned HexagonOptAddrMode::getOffsetOpPosition(MachineInstr *MI) { assert( (HII->getAddrMode(*MI) == HexagonII::BaseImmOffset) && "Looking for an offset in non-BaseImmOffset addressing mode instruction"); const MCInstrDesc &MID = MI->getDesc(); switch (MI->getOpcode()) { // vgather pseudos are mayLoad and mayStore // hence need to explicitly specify Base and // Offset operand positions case Hexagon::V6_vgathermh_pseudo: case Hexagon::V6_vgathermw_pseudo: case Hexagon::V6_vgathermhw_pseudo: case Hexagon::V6_vgathermhq_pseudo: case Hexagon::V6_vgathermwq_pseudo: case Hexagon::V6_vgathermhwq_pseudo: return 1; default: return MID.mayLoad() ? 2 : 1; } } bool HexagonOptAddrMode::processAddUses(NodeAddr AddSN, MachineInstr *AddMI, const NodeList &UNodeList) { Register AddDefR = AddMI->getOperand(0).getReg(); Register BaseReg = AddMI->getOperand(1).getReg(); for (auto I = UNodeList.rbegin(), E = UNodeList.rend(); I != E; ++I) { NodeAddr UN = *I; NodeAddr SN = UN.Addr->getOwner(*DFG); MachineInstr *MI = SN.Addr->getCode(); const MCInstrDesc &MID = MI->getDesc(); if ((!MID.mayLoad() && !MID.mayStore()) || HII->getAddrMode(*MI) != HexagonII::BaseImmOffset) return false; MachineOperand BaseOp = MI->getOperand(getBaseOpPosition(MI)); if (!BaseOp.isReg() || BaseOp.getReg() != AddDefR) return false; MachineOperand OffsetOp = MI->getOperand(getOffsetOpPosition(MI)); if (!OffsetOp.isImm()) return false; int64_t newOffset = OffsetOp.getImm() + AddMI->getOperand(2).getImm(); if (!isValidOffset(MI, newOffset)) return false; // Since we'll be extending the live range of Rt in the following example, // make sure that is safe. another definition of Rt doesn't exist between 'add' // and load/store instruction. // // Ex: Rx= add(Rt,#10) // memw(Rx+#0) = Rs // will be replaced with => memw(Rt+#10) = Rs if (!isSafeToExtLR(AddSN, AddMI, BaseReg, UNodeList)) return false; } NodeId LRExtRegRD = 0; // Iterate through all the UseNodes in SN and find the reaching def // for the LRExtReg. for (NodeAddr UA : AddSN.Addr->members_if(DFG->IsUse, *DFG)) { RegisterRef RR = UA.Addr->getRegRef(*DFG); if (BaseReg == RR.Reg) LRExtRegRD = UA.Addr->getReachingDef(); } // Update all the uses of 'add' with the appropriate base and offset // values. bool Changed = false; for (auto I = UNodeList.rbegin(), E = UNodeList.rend(); I != E; ++I) { NodeAddr UseN = *I; assert(!(UseN.Addr->getFlags() & NodeAttrs::PhiRef) && "Found a PhiRef node as a real reached use!!"); NodeAddr OwnerN = UseN.Addr->getOwner(*DFG); MachineInstr *UseMI = OwnerN.Addr->getCode(); LLVM_DEBUG(dbgs() << "\t\t[MI getParent()->getNumber() << ">]: " << *UseMI << "\n"); Changed |= updateAddUses(AddMI, UseMI); // Set the reachingDef for UseNode under consideration // after updating the Add use. This local change is // to avoid rebuilding of the RDF graph after update. NodeAddr LRExtRegDN = DFG->addr(LRExtRegRD); UseN.Addr->linkToDef(UseN.Id, LRExtRegDN); } if (Changed) Deleted.insert(AddMI); return Changed; } bool HexagonOptAddrMode::updateAddUses(MachineInstr *AddMI, MachineInstr *UseMI) { const MachineOperand ImmOp = AddMI->getOperand(2); const MachineOperand AddRegOp = AddMI->getOperand(1); Register NewReg = AddRegOp.getReg(); MachineOperand &BaseOp = UseMI->getOperand(getBaseOpPosition(UseMI)); MachineOperand &OffsetOp = UseMI->getOperand(getOffsetOpPosition(UseMI)); BaseOp.setReg(NewReg); BaseOp.setIsUndef(AddRegOp.isUndef()); BaseOp.setImplicit(AddRegOp.isImplicit()); OffsetOp.setImm(ImmOp.getImm() + OffsetOp.getImm()); MRI->clearKillFlags(NewReg); return true; } bool HexagonOptAddrMode::analyzeUses(unsigned tfrDefR, const NodeList &UNodeList, InstrEvalMap &InstrEvalResult, short &SizeInc) { bool KeepTfr = false; bool HasRepInstr = false; InstrEvalResult.clear(); for (auto I = UNodeList.rbegin(), E = UNodeList.rend(); I != E; ++I) { bool CanBeReplaced = false; NodeAddr UN = *I; NodeAddr SN = UN.Addr->getOwner(*DFG); MachineInstr &MI = *SN.Addr->getCode(); const MCInstrDesc &MID = MI.getDesc(); if ((MID.mayLoad() || MID.mayStore())) { if (!hasRepForm(MI, tfrDefR)) { KeepTfr = true; continue; } SizeInc++; CanBeReplaced = true; } else if (MI.getOpcode() == Hexagon::S2_addasl_rrri) { NodeList AddaslUseList; LLVM_DEBUG(dbgs() << "\nGetting ReachedUses for === " << MI << "\n"); getAllRealUses(SN, AddaslUseList); // Process phi nodes. if (allValidCandidates(SN, AddaslUseList) && canRemoveAddasl(SN, MI, AddaslUseList)) { SizeInc += AddaslUseList.size(); SizeInc -= 1; // Reduce size by 1 as addasl itself can be removed. CanBeReplaced = true; } else SizeInc++; } else // Currently, only load/store and addasl are handled. // Some other instructions to consider - // A2_add -> A2_addi // M4_mpyrr_addr -> M4_mpyrr_addi KeepTfr = true; InstrEvalResult[&MI] = CanBeReplaced; HasRepInstr |= CanBeReplaced; } // Reduce total size by 2 if original tfr can be deleted. if (!KeepTfr) SizeInc -= 2; return HasRepInstr; } bool HexagonOptAddrMode::changeLoad(MachineInstr *OldMI, MachineOperand ImmOp, unsigned ImmOpNum) { bool Changed = false; MachineBasicBlock *BB = OldMI->getParent(); auto UsePos = MachineBasicBlock::iterator(OldMI); MachineBasicBlock::instr_iterator InsertPt = UsePos.getInstrIterator(); ++InsertPt; unsigned OpStart; unsigned OpEnd = OldMI->getNumOperands(); MachineInstrBuilder MIB; if (ImmOpNum == 1) { if (HII->getAddrMode(*OldMI) == HexagonII::BaseRegOffset) { short NewOpCode = HII->changeAddrMode_rr_ur(*OldMI); assert(NewOpCode >= 0 && "Invalid New opcode\n"); MIB = BuildMI(*BB, InsertPt, OldMI->getDebugLoc(), HII->get(NewOpCode)); MIB.add(OldMI->getOperand(0)); MIB.add(OldMI->getOperand(2)); MIB.add(OldMI->getOperand(3)); MIB.add(ImmOp); OpStart = 4; Changed = true; } else if (HII->getAddrMode(*OldMI) == HexagonII::BaseImmOffset && OldMI->getOperand(2).isImm()) { short NewOpCode = HII->changeAddrMode_io_abs(*OldMI); assert(NewOpCode >= 0 && "Invalid New opcode\n"); MIB = BuildMI(*BB, InsertPt, OldMI->getDebugLoc(), HII->get(NewOpCode)) .add(OldMI->getOperand(0)); const GlobalValue *GV = ImmOp.getGlobal(); int64_t Offset = ImmOp.getOffset() + OldMI->getOperand(2).getImm(); MIB.addGlobalAddress(GV, Offset, ImmOp.getTargetFlags()); OpStart = 3; Changed = true; } else Changed = false; LLVM_DEBUG(dbgs() << "[Changing]: " << *OldMI << "\n"); LLVM_DEBUG(dbgs() << "[TO]: " << *MIB << "\n"); } else if (ImmOpNum == 2) { if (OldMI->getOperand(3).isImm() && OldMI->getOperand(3).getImm() == 0) { short NewOpCode = HII->changeAddrMode_rr_io(*OldMI); assert(NewOpCode >= 0 && "Invalid New opcode\n"); MIB = BuildMI(*BB, InsertPt, OldMI->getDebugLoc(), HII->get(NewOpCode)); MIB.add(OldMI->getOperand(0)); MIB.add(OldMI->getOperand(1)); MIB.add(ImmOp); OpStart = 4; Changed = true; LLVM_DEBUG(dbgs() << "[Changing]: " << *OldMI << "\n"); LLVM_DEBUG(dbgs() << "[TO]: " << *MIB << "\n"); } } if (Changed) for (unsigned i = OpStart; i < OpEnd; ++i) MIB.add(OldMI->getOperand(i)); return Changed; } bool HexagonOptAddrMode::changeStore(MachineInstr *OldMI, MachineOperand ImmOp, unsigned ImmOpNum) { bool Changed = false; unsigned OpStart = 0; unsigned OpEnd = OldMI->getNumOperands(); MachineBasicBlock *BB = OldMI->getParent(); auto UsePos = MachineBasicBlock::iterator(OldMI); MachineBasicBlock::instr_iterator InsertPt = UsePos.getInstrIterator(); ++InsertPt; MachineInstrBuilder MIB; if (ImmOpNum == 0) { if (HII->getAddrMode(*OldMI) == HexagonII::BaseRegOffset) { short NewOpCode = HII->changeAddrMode_rr_ur(*OldMI); assert(NewOpCode >= 0 && "Invalid New opcode\n"); MIB = BuildMI(*BB, InsertPt, OldMI->getDebugLoc(), HII->get(NewOpCode)); MIB.add(OldMI->getOperand(1)); MIB.add(OldMI->getOperand(2)); MIB.add(ImmOp); MIB.add(OldMI->getOperand(3)); OpStart = 4; Changed = true; } else if (HII->getAddrMode(*OldMI) == HexagonII::BaseImmOffset) { short NewOpCode = HII->changeAddrMode_io_abs(*OldMI); assert(NewOpCode >= 0 && "Invalid New opcode\n"); MIB = BuildMI(*BB, InsertPt, OldMI->getDebugLoc(), HII->get(NewOpCode)); const GlobalValue *GV = ImmOp.getGlobal(); int64_t Offset = ImmOp.getOffset() + OldMI->getOperand(1).getImm(); MIB.addGlobalAddress(GV, Offset, ImmOp.getTargetFlags()); MIB.add(OldMI->getOperand(2)); OpStart = 3; Changed = true; } } else if (ImmOpNum == 1 && OldMI->getOperand(2).getImm() == 0) { short NewOpCode = HII->changeAddrMode_rr_io(*OldMI); assert(NewOpCode >= 0 && "Invalid New opcode\n"); MIB = BuildMI(*BB, InsertPt, OldMI->getDebugLoc(), HII->get(NewOpCode)); MIB.add(OldMI->getOperand(0)); MIB.add(ImmOp); OpStart = 3; Changed = true; } if (Changed) { LLVM_DEBUG(dbgs() << "[Changing]: " << *OldMI << "\n"); LLVM_DEBUG(dbgs() << "[TO]: " << *MIB << "\n"); for (unsigned i = OpStart; i < OpEnd; ++i) MIB.add(OldMI->getOperand(i)); } return Changed; } short HexagonOptAddrMode::getBaseWithLongOffset(const MachineInstr &MI) const { if (HII->getAddrMode(MI) == HexagonII::BaseImmOffset) { short TempOpCode = HII->changeAddrMode_io_rr(MI); return HII->changeAddrMode_rr_ur(TempOpCode); } return HII->changeAddrMode_rr_ur(MI); } bool HexagonOptAddrMode::changeAddAsl(NodeAddr AddAslUN, MachineInstr *AddAslMI, const MachineOperand &ImmOp, unsigned ImmOpNum) { NodeAddr SA = AddAslUN.Addr->getOwner(*DFG); LLVM_DEBUG(dbgs() << "Processing addasl :" << *AddAslMI << "\n"); NodeList UNodeList; getAllRealUses(SA, UNodeList); for (auto I = UNodeList.rbegin(), E = UNodeList.rend(); I != E; ++I) { NodeAddr UseUN = *I; assert(!(UseUN.Addr->getFlags() & NodeAttrs::PhiRef) && "Can't transform this 'AddAsl' instruction!"); NodeAddr UseIA = UseUN.Addr->getOwner(*DFG); LLVM_DEBUG(dbgs() << "[InstrNode]: " << Print>(UseIA, *DFG) << "\n"); MachineInstr *UseMI = UseIA.Addr->getCode(); LLVM_DEBUG(dbgs() << "[MI <" << printMBBReference(*UseMI->getParent()) << ">]: " << *UseMI << "\n"); const MCInstrDesc &UseMID = UseMI->getDesc(); assert(HII->getAddrMode(*UseMI) == HexagonII::BaseImmOffset); auto UsePos = MachineBasicBlock::iterator(UseMI); MachineBasicBlock::instr_iterator InsertPt = UsePos.getInstrIterator(); short NewOpCode = getBaseWithLongOffset(*UseMI); assert(NewOpCode >= 0 && "Invalid New opcode\n"); unsigned OpStart; unsigned OpEnd = UseMI->getNumOperands(); MachineBasicBlock *BB = UseMI->getParent(); MachineInstrBuilder MIB = BuildMI(*BB, InsertPt, UseMI->getDebugLoc(), HII->get(NewOpCode)); // change mem(Rs + # ) -> mem(Rt << # + ##) if (UseMID.mayLoad()) { MIB.add(UseMI->getOperand(0)); MIB.add(AddAslMI->getOperand(2)); MIB.add(AddAslMI->getOperand(3)); const GlobalValue *GV = ImmOp.getGlobal(); MIB.addGlobalAddress(GV, UseMI->getOperand(2).getImm()+ImmOp.getOffset(), ImmOp.getTargetFlags()); OpStart = 3; } else if (UseMID.mayStore()) { MIB.add(AddAslMI->getOperand(2)); MIB.add(AddAslMI->getOperand(3)); const GlobalValue *GV = ImmOp.getGlobal(); MIB.addGlobalAddress(GV, UseMI->getOperand(1).getImm()+ImmOp.getOffset(), ImmOp.getTargetFlags()); MIB.add(UseMI->getOperand(2)); OpStart = 3; } else llvm_unreachable("Unhandled instruction"); for (unsigned i = OpStart; i < OpEnd; ++i) MIB.add(UseMI->getOperand(i)); Deleted.insert(UseMI); } return true; } bool HexagonOptAddrMode::xformUseMI(MachineInstr *TfrMI, MachineInstr *UseMI, NodeAddr UseN, unsigned UseMOnum) { const MachineOperand ImmOp = TfrMI->getOperand(1); const MCInstrDesc &MID = UseMI->getDesc(); unsigned Changed = false; if (MID.mayLoad()) Changed = changeLoad(UseMI, ImmOp, UseMOnum); else if (MID.mayStore()) Changed = changeStore(UseMI, ImmOp, UseMOnum); else if (UseMI->getOpcode() == Hexagon::S2_addasl_rrri) Changed = changeAddAsl(UseN, UseMI, ImmOp, UseMOnum); if (Changed) Deleted.insert(UseMI); return Changed; } bool HexagonOptAddrMode::processBlock(NodeAddr BA) { bool Changed = false; for (auto IA : BA.Addr->members(*DFG)) { if (!DFG->IsCode(IA)) continue; NodeAddr SA = IA; MachineInstr *MI = SA.Addr->getCode(); if ((MI->getOpcode() != Hexagon::A2_tfrsi || !MI->getOperand(1).isGlobal()) && (MI->getOpcode() != Hexagon::A2_addi || !MI->getOperand(2).isImm() || HII->isConstExtended(*MI))) continue; LLVM_DEBUG(dbgs() << "[Analyzing " << HII->getName(MI->getOpcode()) << "]: " << *MI << "\n\t[InstrNode]: " << Print>(IA, *DFG) << '\n'); NodeList UNodeList; getAllRealUses(SA, UNodeList); if (!allValidCandidates(SA, UNodeList)) continue; // Analyze all uses of 'add'. If the output of 'add' is used as an address // in the base+immediate addressing mode load/store instructions, see if // they can be updated to use the immediate value as an offet. Thus, // providing us the opportunity to eliminate 'add'. // Ex: Rx= add(Rt,#12) // memw(Rx+#0) = Rs // This can be replaced with memw(Rt+#12) = Rs // // This transformation is only performed if all uses can be updated and // the offset isn't required to be constant extended. if (MI->getOpcode() == Hexagon::A2_addi) { Changed |= processAddUses(SA, MI, UNodeList); continue; } short SizeInc = 0; Register DefR = MI->getOperand(0).getReg(); InstrEvalMap InstrEvalResult; // Analyze all uses and calculate increase in size. Perform the optimization // only if there is no increase in size. if (!analyzeUses(DefR, UNodeList, InstrEvalResult, SizeInc)) continue; if (SizeInc > CodeGrowthLimit) continue; bool KeepTfr = false; LLVM_DEBUG(dbgs() << "\t[Total reached uses] : " << UNodeList.size() << "\n"); LLVM_DEBUG(dbgs() << "\t[Processing Reached Uses] ===\n"); for (auto I = UNodeList.rbegin(), E = UNodeList.rend(); I != E; ++I) { NodeAddr UseN = *I; assert(!(UseN.Addr->getFlags() & NodeAttrs::PhiRef) && "Found a PhiRef node as a real reached use!!"); NodeAddr OwnerN = UseN.Addr->getOwner(*DFG); MachineInstr *UseMI = OwnerN.Addr->getCode(); LLVM_DEBUG(dbgs() << "\t\t[MI <" << printMBBReference(*UseMI->getParent()) << ">]: " << *UseMI << "\n"); int UseMOnum = -1; unsigned NumOperands = UseMI->getNumOperands(); for (unsigned j = 0; j < NumOperands - 1; ++j) { const MachineOperand &op = UseMI->getOperand(j); if (op.isReg() && op.isUse() && DefR == op.getReg()) UseMOnum = j; } // It is possible that the register will not be found in any operand. // This could happen, for example, when DefR = R4, but the used // register is D2. // Change UseMI if replacement is possible. If any replacement failed, // or wasn't attempted, make sure to keep the TFR. bool Xformed = false; if (UseMOnum >= 0 && InstrEvalResult[UseMI]) Xformed = xformUseMI(MI, UseMI, UseN, UseMOnum); Changed |= Xformed; KeepTfr |= !Xformed; } if (!KeepTfr) Deleted.insert(MI); } return Changed; } bool HexagonOptAddrMode::runOnMachineFunction(MachineFunction &MF) { if (skipFunction(MF.getFunction())) return false; bool Changed = false; auto &HST = MF.getSubtarget(); MRI = &MF.getRegInfo(); HII = HST.getInstrInfo(); HRI = HST.getRegisterInfo(); const auto &MDF = getAnalysis(); MDT = &getAnalysis(); const TargetOperandInfo TOI(*HII); DataFlowGraph G(MF, *HII, *HRI, *MDT, MDF, TOI); // Need to keep dead phis because we can propagate uses of registers into // nodes dominated by those would-be phis. G.build(BuildOptions::KeepDeadPhis); DFG = &G; Liveness L(*MRI, *DFG); L.computePhiInfo(); LV = &L; Deleted.clear(); NodeAddr FA = DFG->getFunc(); LLVM_DEBUG(dbgs() << "==== [RefMap#]=====:\n " << Print>(FA, *DFG) << "\n"); for (NodeAddr BA : FA.Addr->members(*DFG)) Changed |= processBlock(BA); for (auto MI : Deleted) MI->eraseFromParent(); if (Changed) { G.build(); L.computeLiveIns(); L.resetLiveIns(); L.resetKills(); } return Changed; } //===----------------------------------------------------------------------===// // Public Constructor Functions //===----------------------------------------------------------------------===// FunctionPass *llvm::createHexagonOptAddrMode() { return new HexagonOptAddrMode(); }