10b57cec5SDimitry Andric //===-- LanaiMemAluCombiner.cpp - Pass to combine memory & ALU operations -===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric // Simple pass to combine memory and ALU operations 90b57cec5SDimitry Andric // 100b57cec5SDimitry Andric // The Lanai ISA supports instructions where a load/store modifies the base 110b57cec5SDimitry Andric // register used in the load/store operation. This pass finds suitable 120b57cec5SDimitry Andric // load/store and ALU instructions and combines them into one instruction. 130b57cec5SDimitry Andric // 140b57cec5SDimitry Andric // For example, 150b57cec5SDimitry Andric // ld [ %r6 -- ], %r12 160b57cec5SDimitry Andric // is a supported instruction that is not currently generated by the instruction 170b57cec5SDimitry Andric // selection pass of this backend. This pass generates these instructions by 180b57cec5SDimitry Andric // merging 190b57cec5SDimitry Andric // add %r6, -4, %r6 200b57cec5SDimitry Andric // followed by 210b57cec5SDimitry Andric // ld [ %r6 ], %r12 220b57cec5SDimitry Andric // in the same machine basic block into one machine instruction. 230b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 240b57cec5SDimitry Andric 250b57cec5SDimitry Andric #include "LanaiAluCode.h" 260b57cec5SDimitry Andric #include "LanaiTargetMachine.h" 270b57cec5SDimitry Andric #include "llvm/ADT/Statistic.h" 280b57cec5SDimitry Andric #include "llvm/CodeGen/MachineFunctionPass.h" 290b57cec5SDimitry Andric #include "llvm/CodeGen/MachineInstrBuilder.h" 300b57cec5SDimitry Andric #include "llvm/CodeGen/RegisterScavenging.h" 310b57cec5SDimitry Andric #include "llvm/CodeGen/TargetInstrInfo.h" 320b57cec5SDimitry Andric #include "llvm/Support/CommandLine.h" 330b57cec5SDimitry Andric using namespace llvm; 340b57cec5SDimitry Andric 350b57cec5SDimitry Andric #define GET_INSTRMAP_INFO 360b57cec5SDimitry Andric #include "LanaiGenInstrInfo.inc" 370b57cec5SDimitry Andric 380b57cec5SDimitry Andric #define DEBUG_TYPE "lanai-mem-alu-combiner" 390b57cec5SDimitry Andric 400b57cec5SDimitry Andric STATISTIC(NumLdStAluCombined, "Number of memory and ALU instructions combined"); 410b57cec5SDimitry Andric 420b57cec5SDimitry Andric static llvm::cl::opt<bool> DisableMemAluCombiner( 430b57cec5SDimitry Andric "disable-lanai-mem-alu-combiner", llvm::cl::init(false), 440b57cec5SDimitry Andric llvm::cl::desc("Do not combine ALU and memory operators"), 450b57cec5SDimitry Andric llvm::cl::Hidden); 460b57cec5SDimitry Andric 470b57cec5SDimitry Andric namespace llvm { 480b57cec5SDimitry Andric void initializeLanaiMemAluCombinerPass(PassRegistry &); 490b57cec5SDimitry Andric } // namespace llvm 500b57cec5SDimitry Andric 510b57cec5SDimitry Andric namespace { 520b57cec5SDimitry Andric typedef MachineBasicBlock::iterator MbbIterator; 530b57cec5SDimitry Andric typedef MachineFunction::iterator MfIterator; 540b57cec5SDimitry Andric 550b57cec5SDimitry Andric class LanaiMemAluCombiner : public MachineFunctionPass { 560b57cec5SDimitry Andric public: 570b57cec5SDimitry Andric static char ID; 580b57cec5SDimitry Andric explicit LanaiMemAluCombiner() : MachineFunctionPass(ID) { 590b57cec5SDimitry Andric initializeLanaiMemAluCombinerPass(*PassRegistry::getPassRegistry()); 600b57cec5SDimitry Andric } 610b57cec5SDimitry Andric 620b57cec5SDimitry Andric StringRef getPassName() const override { 630b57cec5SDimitry Andric return "Lanai load / store optimization pass"; 640b57cec5SDimitry Andric } 650b57cec5SDimitry Andric 660b57cec5SDimitry Andric bool runOnMachineFunction(MachineFunction &F) override; 670b57cec5SDimitry Andric 680b57cec5SDimitry Andric MachineFunctionProperties getRequiredProperties() const override { 690b57cec5SDimitry Andric return MachineFunctionProperties().set( 700b57cec5SDimitry Andric MachineFunctionProperties::Property::NoVRegs); 710b57cec5SDimitry Andric } 720b57cec5SDimitry Andric 730b57cec5SDimitry Andric private: 740b57cec5SDimitry Andric MbbIterator findClosestSuitableAluInstr(MachineBasicBlock *BB, 750b57cec5SDimitry Andric const MbbIterator &MemInstr, 760b57cec5SDimitry Andric bool Decrement); 770b57cec5SDimitry Andric void insertMergedInstruction(MachineBasicBlock *BB, 780b57cec5SDimitry Andric const MbbIterator &MemInstr, 790b57cec5SDimitry Andric const MbbIterator &AluInstr, bool Before); 800b57cec5SDimitry Andric bool combineMemAluInBasicBlock(MachineBasicBlock *BB); 810b57cec5SDimitry Andric 820b57cec5SDimitry Andric // Target machine description which we query for register names, data 830b57cec5SDimitry Andric // layout, etc. 840b57cec5SDimitry Andric const TargetInstrInfo *TII; 850b57cec5SDimitry Andric }; 860b57cec5SDimitry Andric } // namespace 870b57cec5SDimitry Andric 880b57cec5SDimitry Andric char LanaiMemAluCombiner::ID = 0; 890b57cec5SDimitry Andric 900b57cec5SDimitry Andric INITIALIZE_PASS(LanaiMemAluCombiner, DEBUG_TYPE, 910b57cec5SDimitry Andric "Lanai memory ALU combiner pass", false, false) 920b57cec5SDimitry Andric 930b57cec5SDimitry Andric namespace { 940b57cec5SDimitry Andric bool isSpls(uint16_t Opcode) { return Lanai::splsIdempotent(Opcode) == Opcode; } 950b57cec5SDimitry Andric 960b57cec5SDimitry Andric // Determine the opcode for the merged instruction created by considering the 970b57cec5SDimitry Andric // old memory operation's opcode and whether the merged opcode will have an 980b57cec5SDimitry Andric // immediate offset. 990b57cec5SDimitry Andric unsigned mergedOpcode(unsigned OldOpcode, bool ImmediateOffset) { 1000b57cec5SDimitry Andric switch (OldOpcode) { 1010b57cec5SDimitry Andric case Lanai::LDW_RI: 1020b57cec5SDimitry Andric case Lanai::LDW_RR: 1030b57cec5SDimitry Andric if (ImmediateOffset) 1040b57cec5SDimitry Andric return Lanai::LDW_RI; 1050b57cec5SDimitry Andric return Lanai::LDW_RR; 1060b57cec5SDimitry Andric case Lanai::LDHs_RI: 1070b57cec5SDimitry Andric case Lanai::LDHs_RR: 1080b57cec5SDimitry Andric if (ImmediateOffset) 1090b57cec5SDimitry Andric return Lanai::LDHs_RI; 1100b57cec5SDimitry Andric return Lanai::LDHs_RR; 1110b57cec5SDimitry Andric case Lanai::LDHz_RI: 1120b57cec5SDimitry Andric case Lanai::LDHz_RR: 1130b57cec5SDimitry Andric if (ImmediateOffset) 1140b57cec5SDimitry Andric return Lanai::LDHz_RI; 1150b57cec5SDimitry Andric return Lanai::LDHz_RR; 1160b57cec5SDimitry Andric case Lanai::LDBs_RI: 1170b57cec5SDimitry Andric case Lanai::LDBs_RR: 1180b57cec5SDimitry Andric if (ImmediateOffset) 1190b57cec5SDimitry Andric return Lanai::LDBs_RI; 1200b57cec5SDimitry Andric return Lanai::LDBs_RR; 1210b57cec5SDimitry Andric case Lanai::LDBz_RI: 1220b57cec5SDimitry Andric case Lanai::LDBz_RR: 1230b57cec5SDimitry Andric if (ImmediateOffset) 1240b57cec5SDimitry Andric return Lanai::LDBz_RI; 1250b57cec5SDimitry Andric return Lanai::LDBz_RR; 1260b57cec5SDimitry Andric case Lanai::SW_RI: 1270b57cec5SDimitry Andric case Lanai::SW_RR: 1280b57cec5SDimitry Andric if (ImmediateOffset) 1290b57cec5SDimitry Andric return Lanai::SW_RI; 1300b57cec5SDimitry Andric return Lanai::SW_RR; 1310b57cec5SDimitry Andric case Lanai::STB_RI: 1320b57cec5SDimitry Andric case Lanai::STB_RR: 1330b57cec5SDimitry Andric if (ImmediateOffset) 1340b57cec5SDimitry Andric return Lanai::STB_RI; 1350b57cec5SDimitry Andric return Lanai::STB_RR; 1360b57cec5SDimitry Andric case Lanai::STH_RI: 1370b57cec5SDimitry Andric case Lanai::STH_RR: 1380b57cec5SDimitry Andric if (ImmediateOffset) 1390b57cec5SDimitry Andric return Lanai::STH_RI; 1400b57cec5SDimitry Andric return Lanai::STH_RR; 1410b57cec5SDimitry Andric default: 1420b57cec5SDimitry Andric return 0; 1430b57cec5SDimitry Andric } 1440b57cec5SDimitry Andric } 1450b57cec5SDimitry Andric 1460b57cec5SDimitry Andric // Check if the machine instruction has non-volatile memory operands of the type 1470b57cec5SDimitry Andric // supported for combining with ALU instructions. 1480b57cec5SDimitry Andric bool isNonVolatileMemoryOp(const MachineInstr &MI) { 1490b57cec5SDimitry Andric if (!MI.hasOneMemOperand()) 1500b57cec5SDimitry Andric return false; 1510b57cec5SDimitry Andric 1520b57cec5SDimitry Andric // Determine if the machine instruction is a supported memory operation by 1530b57cec5SDimitry Andric // testing if the computed merge opcode is a valid memory operation opcode. 1540b57cec5SDimitry Andric if (mergedOpcode(MI.getOpcode(), false) == 0) 1550b57cec5SDimitry Andric return false; 1560b57cec5SDimitry Andric 1570b57cec5SDimitry Andric const MachineMemOperand *MemOperand = *MI.memoperands_begin(); 1580b57cec5SDimitry Andric 1590b57cec5SDimitry Andric // Don't move volatile memory accesses 1600b57cec5SDimitry Andric // TODO: unclear if we need to be as conservative about atomics 1610b57cec5SDimitry Andric if (MemOperand->isVolatile() || MemOperand->isAtomic()) 1620b57cec5SDimitry Andric return false; 1630b57cec5SDimitry Andric 1640b57cec5SDimitry Andric return true; 1650b57cec5SDimitry Andric } 1660b57cec5SDimitry Andric 1670b57cec5SDimitry Andric // Test to see if two machine operands are of the same type. This test is less 1680b57cec5SDimitry Andric // strict than the MachineOperand::isIdenticalTo function. 1690b57cec5SDimitry Andric bool isSameOperand(const MachineOperand &Op1, const MachineOperand &Op2) { 1700b57cec5SDimitry Andric if (Op1.getType() != Op2.getType()) 1710b57cec5SDimitry Andric return false; 1720b57cec5SDimitry Andric 1730b57cec5SDimitry Andric switch (Op1.getType()) { 1740b57cec5SDimitry Andric case MachineOperand::MO_Register: 1750b57cec5SDimitry Andric return Op1.getReg() == Op2.getReg(); 1760b57cec5SDimitry Andric case MachineOperand::MO_Immediate: 1770b57cec5SDimitry Andric return Op1.getImm() == Op2.getImm(); 1780b57cec5SDimitry Andric default: 1790b57cec5SDimitry Andric return false; 1800b57cec5SDimitry Andric } 1810b57cec5SDimitry Andric } 1820b57cec5SDimitry Andric 1830b57cec5SDimitry Andric bool isZeroOperand(const MachineOperand &Op) { 1840b57cec5SDimitry Andric return ((Op.isReg() && Op.getReg() == Lanai::R0) || 1850b57cec5SDimitry Andric (Op.isImm() && Op.getImm() == 0)); 1860b57cec5SDimitry Andric } 1870b57cec5SDimitry Andric 1880b57cec5SDimitry Andric // Determines whether a register is used by an instruction. 1890b57cec5SDimitry Andric bool InstrUsesReg(const MbbIterator &Instr, const MachineOperand *Reg) { 1900b57cec5SDimitry Andric for (MachineInstr::const_mop_iterator Mop = Instr->operands_begin(); 1910b57cec5SDimitry Andric Mop != Instr->operands_end(); ++Mop) { 1920b57cec5SDimitry Andric if (isSameOperand(*Mop, *Reg)) 1930b57cec5SDimitry Andric return true; 1940b57cec5SDimitry Andric } 1950b57cec5SDimitry Andric return false; 1960b57cec5SDimitry Andric } 1970b57cec5SDimitry Andric 1980b57cec5SDimitry Andric // Converts between machine opcode and AluCode. 1990b57cec5SDimitry Andric // Flag using/modifying ALU operations should not be considered for merging and 2000b57cec5SDimitry Andric // are omitted from this list. 2010b57cec5SDimitry Andric LPAC::AluCode mergedAluCode(unsigned AluOpcode) { 2020b57cec5SDimitry Andric switch (AluOpcode) { 2030b57cec5SDimitry Andric case Lanai::ADD_I_LO: 2040b57cec5SDimitry Andric case Lanai::ADD_R: 2050b57cec5SDimitry Andric return LPAC::ADD; 2060b57cec5SDimitry Andric case Lanai::SUB_I_LO: 2070b57cec5SDimitry Andric case Lanai::SUB_R: 2080b57cec5SDimitry Andric return LPAC::SUB; 2090b57cec5SDimitry Andric case Lanai::AND_I_LO: 2100b57cec5SDimitry Andric case Lanai::AND_R: 2110b57cec5SDimitry Andric return LPAC::AND; 2120b57cec5SDimitry Andric case Lanai::OR_I_LO: 2130b57cec5SDimitry Andric case Lanai::OR_R: 2140b57cec5SDimitry Andric return LPAC::OR; 2150b57cec5SDimitry Andric case Lanai::XOR_I_LO: 2160b57cec5SDimitry Andric case Lanai::XOR_R: 2170b57cec5SDimitry Andric return LPAC::XOR; 2180b57cec5SDimitry Andric case Lanai::SHL_R: 2190b57cec5SDimitry Andric return LPAC::SHL; 2200b57cec5SDimitry Andric case Lanai::SRL_R: 2210b57cec5SDimitry Andric return LPAC::SRL; 2220b57cec5SDimitry Andric case Lanai::SRA_R: 2230b57cec5SDimitry Andric return LPAC::SRA; 2240b57cec5SDimitry Andric case Lanai::SA_I: 2250b57cec5SDimitry Andric case Lanai::SL_I: 2260b57cec5SDimitry Andric default: 2270b57cec5SDimitry Andric return LPAC::UNKNOWN; 2280b57cec5SDimitry Andric } 2290b57cec5SDimitry Andric } 2300b57cec5SDimitry Andric 2310b57cec5SDimitry Andric // Insert a new combined memory and ALU operation instruction. 2320b57cec5SDimitry Andric // 2330b57cec5SDimitry Andric // This function builds a new machine instruction using the MachineInstrBuilder 2340b57cec5SDimitry Andric // class and inserts it before the memory instruction. 2350b57cec5SDimitry Andric void LanaiMemAluCombiner::insertMergedInstruction(MachineBasicBlock *BB, 2360b57cec5SDimitry Andric const MbbIterator &MemInstr, 2370b57cec5SDimitry Andric const MbbIterator &AluInstr, 2380b57cec5SDimitry Andric bool Before) { 2390b57cec5SDimitry Andric // Insert new combined load/store + alu operation 2400b57cec5SDimitry Andric MachineOperand Dest = MemInstr->getOperand(0); 2410b57cec5SDimitry Andric MachineOperand Base = MemInstr->getOperand(1); 2420b57cec5SDimitry Andric MachineOperand MemOffset = MemInstr->getOperand(2); 2430b57cec5SDimitry Andric MachineOperand AluOffset = AluInstr->getOperand(2); 2440b57cec5SDimitry Andric 2450b57cec5SDimitry Andric // Abort if ALU offset is not a register or immediate 2460b57cec5SDimitry Andric assert((AluOffset.isReg() || AluOffset.isImm()) && 2470b57cec5SDimitry Andric "Unsupported operand type in merge"); 2480b57cec5SDimitry Andric 2490b57cec5SDimitry Andric // Determined merged instructions opcode and ALU code 2500b57cec5SDimitry Andric LPAC::AluCode AluOpcode = mergedAluCode(AluInstr->getOpcode()); 2510b57cec5SDimitry Andric unsigned NewOpc = mergedOpcode(MemInstr->getOpcode(), AluOffset.isImm()); 2520b57cec5SDimitry Andric 2530b57cec5SDimitry Andric assert(AluOpcode != LPAC::UNKNOWN && "Unknown ALU code in merging"); 2540b57cec5SDimitry Andric assert(NewOpc != 0 && "Unknown merged node opcode"); 2550b57cec5SDimitry Andric 2560b57cec5SDimitry Andric // Build and insert new machine instruction 2570b57cec5SDimitry Andric MachineInstrBuilder InstrBuilder = 2580b57cec5SDimitry Andric BuildMI(*BB, MemInstr, MemInstr->getDebugLoc(), TII->get(NewOpc)); 2590b57cec5SDimitry Andric InstrBuilder.addReg(Dest.getReg(), getDefRegState(true)); 2600b57cec5SDimitry Andric InstrBuilder.addReg(Base.getReg(), getKillRegState(true)); 2610b57cec5SDimitry Andric 2620b57cec5SDimitry Andric // Add offset to machine instruction 2630b57cec5SDimitry Andric if (AluOffset.isReg()) 2640b57cec5SDimitry Andric InstrBuilder.addReg(AluOffset.getReg()); 2650b57cec5SDimitry Andric else if (AluOffset.isImm()) 2660b57cec5SDimitry Andric InstrBuilder.addImm(AluOffset.getImm()); 2670b57cec5SDimitry Andric else 2680b57cec5SDimitry Andric llvm_unreachable("Unsupported ld/st ALU merge."); 2690b57cec5SDimitry Andric 2700b57cec5SDimitry Andric // Create a pre-op if the ALU operation preceded the memory operation or the 2710b57cec5SDimitry Andric // MemOffset is non-zero (i.e. the memory value should be adjusted before 2720b57cec5SDimitry Andric // accessing it), else create a post-op. 2730b57cec5SDimitry Andric if (Before || !isZeroOperand(MemOffset)) 2740b57cec5SDimitry Andric InstrBuilder.addImm(LPAC::makePreOp(AluOpcode)); 2750b57cec5SDimitry Andric else 2760b57cec5SDimitry Andric InstrBuilder.addImm(LPAC::makePostOp(AluOpcode)); 2770b57cec5SDimitry Andric 2780b57cec5SDimitry Andric // Transfer memory operands. 2790b57cec5SDimitry Andric InstrBuilder.setMemRefs(MemInstr->memoperands()); 2800b57cec5SDimitry Andric } 2810b57cec5SDimitry Andric 2820b57cec5SDimitry Andric // Function determines if ALU operation (in alu_iter) can be combined with 2830b57cec5SDimitry Andric // a load/store with base and offset. 2840b57cec5SDimitry Andric bool isSuitableAluInstr(bool IsSpls, const MbbIterator &AluIter, 2850b57cec5SDimitry Andric const MachineOperand &Base, 2860b57cec5SDimitry Andric const MachineOperand &Offset) { 2870b57cec5SDimitry Andric // ALU operations have 3 operands 2880b57cec5SDimitry Andric if (AluIter->getNumOperands() != 3) 2890b57cec5SDimitry Andric return false; 2900b57cec5SDimitry Andric 2910b57cec5SDimitry Andric MachineOperand &Dest = AluIter->getOperand(0); 2920b57cec5SDimitry Andric MachineOperand &Op1 = AluIter->getOperand(1); 2930b57cec5SDimitry Andric MachineOperand &Op2 = AluIter->getOperand(2); 2940b57cec5SDimitry Andric 2950b57cec5SDimitry Andric // Only match instructions using the base register as destination and with the 2960b57cec5SDimitry Andric // base and first operand equal 2970b57cec5SDimitry Andric if (!isSameOperand(Dest, Base) || !isSameOperand(Dest, Op1)) 2980b57cec5SDimitry Andric return false; 2990b57cec5SDimitry Andric 3000b57cec5SDimitry Andric if (Op2.isImm()) { 3010b57cec5SDimitry Andric // It is not a match if the 2nd operand in the ALU operation is an 3020b57cec5SDimitry Andric // immediate but the ALU operation is not an addition. 3030b57cec5SDimitry Andric if (AluIter->getOpcode() != Lanai::ADD_I_LO) 3040b57cec5SDimitry Andric return false; 3050b57cec5SDimitry Andric 3060b57cec5SDimitry Andric if (Offset.isReg() && Offset.getReg() == Lanai::R0) 3070b57cec5SDimitry Andric return true; 3080b57cec5SDimitry Andric 3090b57cec5SDimitry Andric if (Offset.isImm() && 3100b57cec5SDimitry Andric ((Offset.getImm() == 0 && 3110b57cec5SDimitry Andric // Check that the Op2 would fit in the immediate field of the 3120b57cec5SDimitry Andric // memory operation. 3130b57cec5SDimitry Andric ((IsSpls && isInt<10>(Op2.getImm())) || 3140b57cec5SDimitry Andric (!IsSpls && isInt<16>(Op2.getImm())))) || 3150b57cec5SDimitry Andric Offset.getImm() == Op2.getImm())) 3160b57cec5SDimitry Andric return true; 3170b57cec5SDimitry Andric } else if (Op2.isReg()) { 3180b57cec5SDimitry Andric // The Offset and 2nd operand are both registers and equal 3190b57cec5SDimitry Andric if (Offset.isReg() && Op2.getReg() == Offset.getReg()) 3200b57cec5SDimitry Andric return true; 3210b57cec5SDimitry Andric } else 3220b57cec5SDimitry Andric // Only consider operations with register or immediate values 3230b57cec5SDimitry Andric return false; 3240b57cec5SDimitry Andric 3250b57cec5SDimitry Andric return false; 3260b57cec5SDimitry Andric } 3270b57cec5SDimitry Andric 3280b57cec5SDimitry Andric MbbIterator LanaiMemAluCombiner::findClosestSuitableAluInstr( 3290b57cec5SDimitry Andric MachineBasicBlock *BB, const MbbIterator &MemInstr, const bool Decrement) { 3300b57cec5SDimitry Andric MachineOperand *Base = &MemInstr->getOperand(1); 3310b57cec5SDimitry Andric MachineOperand *Offset = &MemInstr->getOperand(2); 3320b57cec5SDimitry Andric bool IsSpls = isSpls(MemInstr->getOpcode()); 3330b57cec5SDimitry Andric 3340b57cec5SDimitry Andric MbbIterator First = MemInstr; 3350b57cec5SDimitry Andric MbbIterator Last = Decrement ? BB->begin() : BB->end(); 3360b57cec5SDimitry Andric 3370b57cec5SDimitry Andric while (First != Last) { 3380b57cec5SDimitry Andric Decrement ? --First : ++First; 3390b57cec5SDimitry Andric 3400b57cec5SDimitry Andric if (First == Last) 3410b57cec5SDimitry Andric break; 3420b57cec5SDimitry Andric 3430b57cec5SDimitry Andric // Skip over debug instructions 3440b57cec5SDimitry Andric if (First->isDebugInstr()) 3450b57cec5SDimitry Andric continue; 3460b57cec5SDimitry Andric 3470b57cec5SDimitry Andric if (isSuitableAluInstr(IsSpls, First, *Base, *Offset)) { 3480b57cec5SDimitry Andric return First; 3490b57cec5SDimitry Andric } 3500b57cec5SDimitry Andric 3510b57cec5SDimitry Andric // Usage of the base or offset register is not a form suitable for merging. 3520b57cec5SDimitry Andric if (First != Last) { 3530b57cec5SDimitry Andric if (InstrUsesReg(First, Base)) 3540b57cec5SDimitry Andric break; 3550b57cec5SDimitry Andric if (Offset->isReg() && InstrUsesReg(First, Offset)) 3560b57cec5SDimitry Andric break; 3570b57cec5SDimitry Andric } 3580b57cec5SDimitry Andric } 3590b57cec5SDimitry Andric 3600b57cec5SDimitry Andric return MemInstr; 3610b57cec5SDimitry Andric } 3620b57cec5SDimitry Andric 3630b57cec5SDimitry Andric bool LanaiMemAluCombiner::combineMemAluInBasicBlock(MachineBasicBlock *BB) { 3640b57cec5SDimitry Andric bool Modified = false; 3650b57cec5SDimitry Andric 3660b57cec5SDimitry Andric MbbIterator MBBIter = BB->begin(), End = BB->end(); 3670b57cec5SDimitry Andric while (MBBIter != End) { 3680b57cec5SDimitry Andric bool IsMemOp = isNonVolatileMemoryOp(*MBBIter); 3690b57cec5SDimitry Andric 3700b57cec5SDimitry Andric if (IsMemOp) { 3710b57cec5SDimitry Andric MachineOperand AluOperand = MBBIter->getOperand(3); 3720b57cec5SDimitry Andric unsigned int DestReg = MBBIter->getOperand(0).getReg(), 3730b57cec5SDimitry Andric BaseReg = MBBIter->getOperand(1).getReg(); 3740b57cec5SDimitry Andric assert(AluOperand.isImm() && "Unexpected memory operator type"); 3750b57cec5SDimitry Andric LPAC::AluCode AluOpcode = static_cast<LPAC::AluCode>(AluOperand.getImm()); 3760b57cec5SDimitry Andric 3770b57cec5SDimitry Andric // Skip memory operations that already modify the base register or if 3780b57cec5SDimitry Andric // the destination and base register are the same 3790b57cec5SDimitry Andric if (!LPAC::modifiesOp(AluOpcode) && DestReg != BaseReg) { 3800b57cec5SDimitry Andric for (int Inc = 0; Inc <= 1; ++Inc) { 3810b57cec5SDimitry Andric MbbIterator AluIter = 3820b57cec5SDimitry Andric findClosestSuitableAluInstr(BB, MBBIter, Inc == 0); 3830b57cec5SDimitry Andric if (AluIter != MBBIter) { 3840b57cec5SDimitry Andric insertMergedInstruction(BB, MBBIter, AluIter, Inc == 0); 3850b57cec5SDimitry Andric 3860b57cec5SDimitry Andric ++NumLdStAluCombined; 3870b57cec5SDimitry Andric Modified = true; 3880b57cec5SDimitry Andric 3890b57cec5SDimitry Andric // Erase the matching ALU instruction 3900b57cec5SDimitry Andric BB->erase(AluIter); 3910b57cec5SDimitry Andric // Erase old load/store instruction 3920b57cec5SDimitry Andric BB->erase(MBBIter++); 3930b57cec5SDimitry Andric break; 3940b57cec5SDimitry Andric } 3950b57cec5SDimitry Andric } 3960b57cec5SDimitry Andric } 3970b57cec5SDimitry Andric } 3980b57cec5SDimitry Andric if (MBBIter == End) 3990b57cec5SDimitry Andric break; 4000b57cec5SDimitry Andric ++MBBIter; 4010b57cec5SDimitry Andric } 4020b57cec5SDimitry Andric 4030b57cec5SDimitry Andric return Modified; 4040b57cec5SDimitry Andric } 4050b57cec5SDimitry Andric 4060b57cec5SDimitry Andric // Driver function that iterates over the machine basic building blocks of a 4070b57cec5SDimitry Andric // machine function 4080b57cec5SDimitry Andric bool LanaiMemAluCombiner::runOnMachineFunction(MachineFunction &MF) { 4090b57cec5SDimitry Andric if (DisableMemAluCombiner) 4100b57cec5SDimitry Andric return false; 4110b57cec5SDimitry Andric 4120b57cec5SDimitry Andric TII = MF.getSubtarget<LanaiSubtarget>().getInstrInfo(); 4130b57cec5SDimitry Andric bool Modified = false; 414*04eeddc0SDimitry Andric for (MachineBasicBlock &MBB : MF) 415*04eeddc0SDimitry Andric Modified |= combineMemAluInBasicBlock(&MBB); 4160b57cec5SDimitry Andric return Modified; 4170b57cec5SDimitry Andric } 4180b57cec5SDimitry Andric } // namespace 4190b57cec5SDimitry Andric 4200b57cec5SDimitry Andric FunctionPass *llvm::createLanaiMemAluCombinerPass() { 4210b57cec5SDimitry Andric return new LanaiMemAluCombiner(); 4220b57cec5SDimitry Andric } 423