xref: /freebsd/contrib/llvm-project/llvm/lib/Target/Lanai/LanaiMemAluCombiner.cpp (revision 5f757f3ff9144b609b3c433dfd370cc6bdc191ad)
10b57cec5SDimitry Andric //===-- LanaiMemAluCombiner.cpp - Pass to combine memory & ALU operations -===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric // Simple pass to combine memory and ALU operations
90b57cec5SDimitry Andric //
100b57cec5SDimitry Andric // The Lanai ISA supports instructions where a load/store modifies the base
110b57cec5SDimitry Andric // register used in the load/store operation. This pass finds suitable
120b57cec5SDimitry Andric // load/store and ALU instructions and combines them into one instruction.
130b57cec5SDimitry Andric //
140b57cec5SDimitry Andric // For example,
150b57cec5SDimitry Andric //   ld [ %r6 -- ], %r12
160b57cec5SDimitry Andric // is a supported instruction that is not currently generated by the instruction
170b57cec5SDimitry Andric // selection pass of this backend. This pass generates these instructions by
180b57cec5SDimitry Andric // merging
190b57cec5SDimitry Andric //   add %r6, -4, %r6
200b57cec5SDimitry Andric // followed by
210b57cec5SDimitry Andric //   ld [ %r6 ], %r12
220b57cec5SDimitry Andric // in the same machine basic block into one machine instruction.
230b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
240b57cec5SDimitry Andric 
250b57cec5SDimitry Andric #include "LanaiAluCode.h"
260b57cec5SDimitry Andric #include "LanaiTargetMachine.h"
270b57cec5SDimitry Andric #include "llvm/ADT/Statistic.h"
280b57cec5SDimitry Andric #include "llvm/CodeGen/MachineFunctionPass.h"
290b57cec5SDimitry Andric #include "llvm/CodeGen/MachineInstrBuilder.h"
300b57cec5SDimitry Andric #include "llvm/CodeGen/RegisterScavenging.h"
310b57cec5SDimitry Andric #include "llvm/CodeGen/TargetInstrInfo.h"
320b57cec5SDimitry Andric #include "llvm/Support/CommandLine.h"
330b57cec5SDimitry Andric using namespace llvm;
340b57cec5SDimitry Andric 
350b57cec5SDimitry Andric #define GET_INSTRMAP_INFO
360b57cec5SDimitry Andric #include "LanaiGenInstrInfo.inc"
370b57cec5SDimitry Andric 
380b57cec5SDimitry Andric #define DEBUG_TYPE "lanai-mem-alu-combiner"
390b57cec5SDimitry Andric 
400b57cec5SDimitry Andric STATISTIC(NumLdStAluCombined, "Number of memory and ALU instructions combined");
410b57cec5SDimitry Andric 
420b57cec5SDimitry Andric static llvm::cl::opt<bool> DisableMemAluCombiner(
430b57cec5SDimitry Andric     "disable-lanai-mem-alu-combiner", llvm::cl::init(false),
440b57cec5SDimitry Andric     llvm::cl::desc("Do not combine ALU and memory operators"),
450b57cec5SDimitry Andric     llvm::cl::Hidden);
460b57cec5SDimitry Andric 
470b57cec5SDimitry Andric namespace llvm {
480b57cec5SDimitry Andric void initializeLanaiMemAluCombinerPass(PassRegistry &);
490b57cec5SDimitry Andric } // namespace llvm
500b57cec5SDimitry Andric 
510b57cec5SDimitry Andric namespace {
520b57cec5SDimitry Andric typedef MachineBasicBlock::iterator MbbIterator;
530b57cec5SDimitry Andric typedef MachineFunction::iterator MfIterator;
540b57cec5SDimitry Andric 
550b57cec5SDimitry Andric class LanaiMemAluCombiner : public MachineFunctionPass {
560b57cec5SDimitry Andric public:
570b57cec5SDimitry Andric   static char ID;
580b57cec5SDimitry Andric   explicit LanaiMemAluCombiner() : MachineFunctionPass(ID) {
590b57cec5SDimitry Andric     initializeLanaiMemAluCombinerPass(*PassRegistry::getPassRegistry());
600b57cec5SDimitry Andric   }
610b57cec5SDimitry Andric 
620b57cec5SDimitry Andric   StringRef getPassName() const override {
630b57cec5SDimitry Andric     return "Lanai load / store optimization pass";
640b57cec5SDimitry Andric   }
650b57cec5SDimitry Andric 
660b57cec5SDimitry Andric   bool runOnMachineFunction(MachineFunction &F) override;
670b57cec5SDimitry Andric 
680b57cec5SDimitry Andric   MachineFunctionProperties getRequiredProperties() const override {
690b57cec5SDimitry Andric     return MachineFunctionProperties().set(
700b57cec5SDimitry Andric         MachineFunctionProperties::Property::NoVRegs);
710b57cec5SDimitry Andric   }
720b57cec5SDimitry Andric 
730b57cec5SDimitry Andric private:
740b57cec5SDimitry Andric   MbbIterator findClosestSuitableAluInstr(MachineBasicBlock *BB,
750b57cec5SDimitry Andric                                           const MbbIterator &MemInstr,
760b57cec5SDimitry Andric                                           bool Decrement);
770b57cec5SDimitry Andric   void insertMergedInstruction(MachineBasicBlock *BB,
780b57cec5SDimitry Andric                                const MbbIterator &MemInstr,
790b57cec5SDimitry Andric                                const MbbIterator &AluInstr, bool Before);
800b57cec5SDimitry Andric   bool combineMemAluInBasicBlock(MachineBasicBlock *BB);
810b57cec5SDimitry Andric 
820b57cec5SDimitry Andric   // Target machine description which we query for register names, data
830b57cec5SDimitry Andric   // layout, etc.
840b57cec5SDimitry Andric   const TargetInstrInfo *TII;
850b57cec5SDimitry Andric };
860b57cec5SDimitry Andric } // namespace
870b57cec5SDimitry Andric 
880b57cec5SDimitry Andric char LanaiMemAluCombiner::ID = 0;
890b57cec5SDimitry Andric 
900b57cec5SDimitry Andric INITIALIZE_PASS(LanaiMemAluCombiner, DEBUG_TYPE,
910b57cec5SDimitry Andric                 "Lanai memory ALU combiner pass", false, false)
920b57cec5SDimitry Andric 
930b57cec5SDimitry Andric namespace {
940b57cec5SDimitry Andric bool isSpls(uint16_t Opcode) { return Lanai::splsIdempotent(Opcode) == Opcode; }
950b57cec5SDimitry Andric 
960b57cec5SDimitry Andric // Determine the opcode for the merged instruction created by considering the
970b57cec5SDimitry Andric // old memory operation's opcode and whether the merged opcode will have an
980b57cec5SDimitry Andric // immediate offset.
990b57cec5SDimitry Andric unsigned mergedOpcode(unsigned OldOpcode, bool ImmediateOffset) {
1000b57cec5SDimitry Andric   switch (OldOpcode) {
1010b57cec5SDimitry Andric   case Lanai::LDW_RI:
1020b57cec5SDimitry Andric   case Lanai::LDW_RR:
1030b57cec5SDimitry Andric     if (ImmediateOffset)
1040b57cec5SDimitry Andric       return Lanai::LDW_RI;
1050b57cec5SDimitry Andric     return Lanai::LDW_RR;
1060b57cec5SDimitry Andric   case Lanai::LDHs_RI:
1070b57cec5SDimitry Andric   case Lanai::LDHs_RR:
1080b57cec5SDimitry Andric     if (ImmediateOffset)
1090b57cec5SDimitry Andric       return Lanai::LDHs_RI;
1100b57cec5SDimitry Andric     return Lanai::LDHs_RR;
1110b57cec5SDimitry Andric   case Lanai::LDHz_RI:
1120b57cec5SDimitry Andric   case Lanai::LDHz_RR:
1130b57cec5SDimitry Andric     if (ImmediateOffset)
1140b57cec5SDimitry Andric       return Lanai::LDHz_RI;
1150b57cec5SDimitry Andric     return Lanai::LDHz_RR;
1160b57cec5SDimitry Andric   case Lanai::LDBs_RI:
1170b57cec5SDimitry Andric   case Lanai::LDBs_RR:
1180b57cec5SDimitry Andric     if (ImmediateOffset)
1190b57cec5SDimitry Andric       return Lanai::LDBs_RI;
1200b57cec5SDimitry Andric     return Lanai::LDBs_RR;
1210b57cec5SDimitry Andric   case Lanai::LDBz_RI:
1220b57cec5SDimitry Andric   case Lanai::LDBz_RR:
1230b57cec5SDimitry Andric     if (ImmediateOffset)
1240b57cec5SDimitry Andric       return Lanai::LDBz_RI;
1250b57cec5SDimitry Andric     return Lanai::LDBz_RR;
1260b57cec5SDimitry Andric   case Lanai::SW_RI:
1270b57cec5SDimitry Andric   case Lanai::SW_RR:
1280b57cec5SDimitry Andric     if (ImmediateOffset)
1290b57cec5SDimitry Andric       return Lanai::SW_RI;
1300b57cec5SDimitry Andric     return Lanai::SW_RR;
1310b57cec5SDimitry Andric   case Lanai::STB_RI:
1320b57cec5SDimitry Andric   case Lanai::STB_RR:
1330b57cec5SDimitry Andric     if (ImmediateOffset)
1340b57cec5SDimitry Andric       return Lanai::STB_RI;
1350b57cec5SDimitry Andric     return Lanai::STB_RR;
1360b57cec5SDimitry Andric   case Lanai::STH_RI:
1370b57cec5SDimitry Andric   case Lanai::STH_RR:
1380b57cec5SDimitry Andric     if (ImmediateOffset)
1390b57cec5SDimitry Andric       return Lanai::STH_RI;
1400b57cec5SDimitry Andric     return Lanai::STH_RR;
1410b57cec5SDimitry Andric   default:
1420b57cec5SDimitry Andric     return 0;
1430b57cec5SDimitry Andric   }
1440b57cec5SDimitry Andric }
1450b57cec5SDimitry Andric 
1460b57cec5SDimitry Andric // Check if the machine instruction has non-volatile memory operands of the type
1470b57cec5SDimitry Andric // supported for combining with ALU instructions.
1480b57cec5SDimitry Andric bool isNonVolatileMemoryOp(const MachineInstr &MI) {
1490b57cec5SDimitry Andric   if (!MI.hasOneMemOperand())
1500b57cec5SDimitry Andric     return false;
1510b57cec5SDimitry Andric 
1520b57cec5SDimitry Andric   // Determine if the machine instruction is a supported memory operation by
1530b57cec5SDimitry Andric   // testing if the computed merge opcode is a valid memory operation opcode.
1540b57cec5SDimitry Andric   if (mergedOpcode(MI.getOpcode(), false) == 0)
1550b57cec5SDimitry Andric     return false;
1560b57cec5SDimitry Andric 
1570b57cec5SDimitry Andric   const MachineMemOperand *MemOperand = *MI.memoperands_begin();
1580b57cec5SDimitry Andric 
1590b57cec5SDimitry Andric   // Don't move volatile memory accesses
1600b57cec5SDimitry Andric   // TODO: unclear if we need to be as conservative about atomics
1610b57cec5SDimitry Andric   if (MemOperand->isVolatile() || MemOperand->isAtomic())
1620b57cec5SDimitry Andric     return false;
1630b57cec5SDimitry Andric 
1640b57cec5SDimitry Andric   return true;
1650b57cec5SDimitry Andric }
1660b57cec5SDimitry Andric 
1670b57cec5SDimitry Andric // Test to see if two machine operands are of the same type. This test is less
1680b57cec5SDimitry Andric // strict than the MachineOperand::isIdenticalTo function.
1690b57cec5SDimitry Andric bool isSameOperand(const MachineOperand &Op1, const MachineOperand &Op2) {
1700b57cec5SDimitry Andric   if (Op1.getType() != Op2.getType())
1710b57cec5SDimitry Andric     return false;
1720b57cec5SDimitry Andric 
1730b57cec5SDimitry Andric   switch (Op1.getType()) {
1740b57cec5SDimitry Andric   case MachineOperand::MO_Register:
1750b57cec5SDimitry Andric     return Op1.getReg() == Op2.getReg();
1760b57cec5SDimitry Andric   case MachineOperand::MO_Immediate:
1770b57cec5SDimitry Andric     return Op1.getImm() == Op2.getImm();
1780b57cec5SDimitry Andric   default:
1790b57cec5SDimitry Andric     return false;
1800b57cec5SDimitry Andric   }
1810b57cec5SDimitry Andric }
1820b57cec5SDimitry Andric 
1830b57cec5SDimitry Andric bool isZeroOperand(const MachineOperand &Op) {
1840b57cec5SDimitry Andric   return ((Op.isReg() && Op.getReg() == Lanai::R0) ||
1850b57cec5SDimitry Andric           (Op.isImm() && Op.getImm() == 0));
1860b57cec5SDimitry Andric }
1870b57cec5SDimitry Andric 
1880b57cec5SDimitry Andric // Determines whether a register is used by an instruction.
1890b57cec5SDimitry Andric bool InstrUsesReg(const MbbIterator &Instr, const MachineOperand *Reg) {
1900b57cec5SDimitry Andric   for (MachineInstr::const_mop_iterator Mop = Instr->operands_begin();
1910b57cec5SDimitry Andric        Mop != Instr->operands_end(); ++Mop) {
1920b57cec5SDimitry Andric     if (isSameOperand(*Mop, *Reg))
1930b57cec5SDimitry Andric       return true;
1940b57cec5SDimitry Andric   }
1950b57cec5SDimitry Andric   return false;
1960b57cec5SDimitry Andric }
1970b57cec5SDimitry Andric 
1980b57cec5SDimitry Andric // Converts between machine opcode and AluCode.
1990b57cec5SDimitry Andric // Flag using/modifying ALU operations should not be considered for merging and
2000b57cec5SDimitry Andric // are omitted from this list.
2010b57cec5SDimitry Andric LPAC::AluCode mergedAluCode(unsigned AluOpcode) {
2020b57cec5SDimitry Andric   switch (AluOpcode) {
2030b57cec5SDimitry Andric   case Lanai::ADD_I_LO:
2040b57cec5SDimitry Andric   case Lanai::ADD_R:
2050b57cec5SDimitry Andric     return LPAC::ADD;
2060b57cec5SDimitry Andric   case Lanai::SUB_I_LO:
2070b57cec5SDimitry Andric   case Lanai::SUB_R:
2080b57cec5SDimitry Andric     return LPAC::SUB;
2090b57cec5SDimitry Andric   case Lanai::AND_I_LO:
2100b57cec5SDimitry Andric   case Lanai::AND_R:
2110b57cec5SDimitry Andric     return LPAC::AND;
2120b57cec5SDimitry Andric   case Lanai::OR_I_LO:
2130b57cec5SDimitry Andric   case Lanai::OR_R:
2140b57cec5SDimitry Andric     return LPAC::OR;
2150b57cec5SDimitry Andric   case Lanai::XOR_I_LO:
2160b57cec5SDimitry Andric   case Lanai::XOR_R:
2170b57cec5SDimitry Andric     return LPAC::XOR;
2180b57cec5SDimitry Andric   case Lanai::SHL_R:
2190b57cec5SDimitry Andric     return LPAC::SHL;
2200b57cec5SDimitry Andric   case Lanai::SRL_R:
2210b57cec5SDimitry Andric     return LPAC::SRL;
2220b57cec5SDimitry Andric   case Lanai::SRA_R:
2230b57cec5SDimitry Andric     return LPAC::SRA;
2240b57cec5SDimitry Andric   case Lanai::SA_I:
2250b57cec5SDimitry Andric   case Lanai::SL_I:
2260b57cec5SDimitry Andric   default:
2270b57cec5SDimitry Andric     return LPAC::UNKNOWN;
2280b57cec5SDimitry Andric   }
2290b57cec5SDimitry Andric }
2300b57cec5SDimitry Andric 
2310b57cec5SDimitry Andric // Insert a new combined memory and ALU operation instruction.
2320b57cec5SDimitry Andric //
2330b57cec5SDimitry Andric // This function builds a new machine instruction using the MachineInstrBuilder
2340b57cec5SDimitry Andric // class and inserts it before the memory instruction.
2350b57cec5SDimitry Andric void LanaiMemAluCombiner::insertMergedInstruction(MachineBasicBlock *BB,
2360b57cec5SDimitry Andric                                                   const MbbIterator &MemInstr,
2370b57cec5SDimitry Andric                                                   const MbbIterator &AluInstr,
2380b57cec5SDimitry Andric                                                   bool Before) {
2390b57cec5SDimitry Andric   // Insert new combined load/store + alu operation
2400b57cec5SDimitry Andric   MachineOperand Dest = MemInstr->getOperand(0);
2410b57cec5SDimitry Andric   MachineOperand Base = MemInstr->getOperand(1);
2420b57cec5SDimitry Andric   MachineOperand MemOffset = MemInstr->getOperand(2);
2430b57cec5SDimitry Andric   MachineOperand AluOffset = AluInstr->getOperand(2);
2440b57cec5SDimitry Andric 
2450b57cec5SDimitry Andric   // Abort if ALU offset is not a register or immediate
2460b57cec5SDimitry Andric   assert((AluOffset.isReg() || AluOffset.isImm()) &&
2470b57cec5SDimitry Andric          "Unsupported operand type in merge");
2480b57cec5SDimitry Andric 
2490b57cec5SDimitry Andric   // Determined merged instructions opcode and ALU code
2500b57cec5SDimitry Andric   LPAC::AluCode AluOpcode = mergedAluCode(AluInstr->getOpcode());
2510b57cec5SDimitry Andric   unsigned NewOpc = mergedOpcode(MemInstr->getOpcode(), AluOffset.isImm());
2520b57cec5SDimitry Andric 
2530b57cec5SDimitry Andric   assert(AluOpcode != LPAC::UNKNOWN && "Unknown ALU code in merging");
2540b57cec5SDimitry Andric   assert(NewOpc != 0 && "Unknown merged node opcode");
2550b57cec5SDimitry Andric 
2560b57cec5SDimitry Andric   // Build and insert new machine instruction
2570b57cec5SDimitry Andric   MachineInstrBuilder InstrBuilder =
2580b57cec5SDimitry Andric       BuildMI(*BB, MemInstr, MemInstr->getDebugLoc(), TII->get(NewOpc));
2590b57cec5SDimitry Andric   InstrBuilder.addReg(Dest.getReg(), getDefRegState(true));
2600b57cec5SDimitry Andric   InstrBuilder.addReg(Base.getReg(), getKillRegState(true));
2610b57cec5SDimitry Andric 
2620b57cec5SDimitry Andric   // Add offset to machine instruction
2630b57cec5SDimitry Andric   if (AluOffset.isReg())
2640b57cec5SDimitry Andric     InstrBuilder.addReg(AluOffset.getReg());
2650b57cec5SDimitry Andric   else if (AluOffset.isImm())
2660b57cec5SDimitry Andric     InstrBuilder.addImm(AluOffset.getImm());
2670b57cec5SDimitry Andric   else
2680b57cec5SDimitry Andric     llvm_unreachable("Unsupported ld/st ALU merge.");
2690b57cec5SDimitry Andric 
2700b57cec5SDimitry Andric   // Create a pre-op if the ALU operation preceded the memory operation or the
2710b57cec5SDimitry Andric   // MemOffset is non-zero (i.e. the memory value should be adjusted before
2720b57cec5SDimitry Andric   // accessing it), else create a post-op.
2730b57cec5SDimitry Andric   if (Before || !isZeroOperand(MemOffset))
2740b57cec5SDimitry Andric     InstrBuilder.addImm(LPAC::makePreOp(AluOpcode));
2750b57cec5SDimitry Andric   else
2760b57cec5SDimitry Andric     InstrBuilder.addImm(LPAC::makePostOp(AluOpcode));
2770b57cec5SDimitry Andric 
2780b57cec5SDimitry Andric   // Transfer memory operands.
2790b57cec5SDimitry Andric   InstrBuilder.setMemRefs(MemInstr->memoperands());
2800b57cec5SDimitry Andric }
2810b57cec5SDimitry Andric 
2820b57cec5SDimitry Andric // Function determines if ALU operation (in alu_iter) can be combined with
2830b57cec5SDimitry Andric // a load/store with base and offset.
2840b57cec5SDimitry Andric bool isSuitableAluInstr(bool IsSpls, const MbbIterator &AluIter,
2850b57cec5SDimitry Andric                         const MachineOperand &Base,
2860b57cec5SDimitry Andric                         const MachineOperand &Offset) {
2870b57cec5SDimitry Andric   // ALU operations have 3 operands
2880b57cec5SDimitry Andric   if (AluIter->getNumOperands() != 3)
2890b57cec5SDimitry Andric     return false;
2900b57cec5SDimitry Andric 
2910b57cec5SDimitry Andric   MachineOperand &Dest = AluIter->getOperand(0);
2920b57cec5SDimitry Andric   MachineOperand &Op1 = AluIter->getOperand(1);
2930b57cec5SDimitry Andric   MachineOperand &Op2 = AluIter->getOperand(2);
2940b57cec5SDimitry Andric 
2950b57cec5SDimitry Andric   // Only match instructions using the base register as destination and with the
2960b57cec5SDimitry Andric   // base and first operand equal
2970b57cec5SDimitry Andric   if (!isSameOperand(Dest, Base) || !isSameOperand(Dest, Op1))
2980b57cec5SDimitry Andric     return false;
2990b57cec5SDimitry Andric 
3000b57cec5SDimitry Andric   if (Op2.isImm()) {
3010b57cec5SDimitry Andric     // It is not a match if the 2nd operand in the ALU operation is an
3020b57cec5SDimitry Andric     // immediate but the ALU operation is not an addition.
3030b57cec5SDimitry Andric     if (AluIter->getOpcode() != Lanai::ADD_I_LO)
3040b57cec5SDimitry Andric       return false;
3050b57cec5SDimitry Andric 
3060b57cec5SDimitry Andric     if (Offset.isReg() && Offset.getReg() == Lanai::R0)
3070b57cec5SDimitry Andric       return true;
3080b57cec5SDimitry Andric 
3090b57cec5SDimitry Andric     if (Offset.isImm() &&
3100b57cec5SDimitry Andric         ((Offset.getImm() == 0 &&
3110b57cec5SDimitry Andric           // Check that the Op2 would fit in the immediate field of the
3120b57cec5SDimitry Andric           // memory operation.
3130b57cec5SDimitry Andric           ((IsSpls && isInt<10>(Op2.getImm())) ||
3140b57cec5SDimitry Andric            (!IsSpls && isInt<16>(Op2.getImm())))) ||
3150b57cec5SDimitry Andric          Offset.getImm() == Op2.getImm()))
3160b57cec5SDimitry Andric       return true;
3170b57cec5SDimitry Andric   } else if (Op2.isReg()) {
3180b57cec5SDimitry Andric     // The Offset and 2nd operand are both registers and equal
3190b57cec5SDimitry Andric     if (Offset.isReg() && Op2.getReg() == Offset.getReg())
3200b57cec5SDimitry Andric       return true;
3210b57cec5SDimitry Andric   } else
3220b57cec5SDimitry Andric     // Only consider operations with register or immediate values
3230b57cec5SDimitry Andric     return false;
3240b57cec5SDimitry Andric 
3250b57cec5SDimitry Andric   return false;
3260b57cec5SDimitry Andric }
3270b57cec5SDimitry Andric 
3280b57cec5SDimitry Andric MbbIterator LanaiMemAluCombiner::findClosestSuitableAluInstr(
3290b57cec5SDimitry Andric     MachineBasicBlock *BB, const MbbIterator &MemInstr, const bool Decrement) {
3300b57cec5SDimitry Andric   MachineOperand *Base = &MemInstr->getOperand(1);
3310b57cec5SDimitry Andric   MachineOperand *Offset = &MemInstr->getOperand(2);
3320b57cec5SDimitry Andric   bool IsSpls = isSpls(MemInstr->getOpcode());
3330b57cec5SDimitry Andric 
3340b57cec5SDimitry Andric   MbbIterator First = MemInstr;
3350b57cec5SDimitry Andric   MbbIterator Last = Decrement ? BB->begin() : BB->end();
3360b57cec5SDimitry Andric 
3370b57cec5SDimitry Andric   while (First != Last) {
3380b57cec5SDimitry Andric     Decrement ? --First : ++First;
3390b57cec5SDimitry Andric 
3400b57cec5SDimitry Andric     if (First == Last)
3410b57cec5SDimitry Andric       break;
3420b57cec5SDimitry Andric 
3430b57cec5SDimitry Andric     // Skip over debug instructions
3440b57cec5SDimitry Andric     if (First->isDebugInstr())
3450b57cec5SDimitry Andric       continue;
3460b57cec5SDimitry Andric 
3470b57cec5SDimitry Andric     if (isSuitableAluInstr(IsSpls, First, *Base, *Offset)) {
3480b57cec5SDimitry Andric       return First;
3490b57cec5SDimitry Andric     }
3500b57cec5SDimitry Andric 
3510b57cec5SDimitry Andric     // Usage of the base or offset register is not a form suitable for merging.
3520b57cec5SDimitry Andric     if (First != Last) {
3530b57cec5SDimitry Andric       if (InstrUsesReg(First, Base))
3540b57cec5SDimitry Andric         break;
3550b57cec5SDimitry Andric       if (Offset->isReg() && InstrUsesReg(First, Offset))
3560b57cec5SDimitry Andric         break;
3570b57cec5SDimitry Andric     }
3580b57cec5SDimitry Andric   }
3590b57cec5SDimitry Andric 
3600b57cec5SDimitry Andric   return MemInstr;
3610b57cec5SDimitry Andric }
3620b57cec5SDimitry Andric 
3630b57cec5SDimitry Andric bool LanaiMemAluCombiner::combineMemAluInBasicBlock(MachineBasicBlock *BB) {
3640b57cec5SDimitry Andric   bool Modified = false;
3650b57cec5SDimitry Andric 
3660b57cec5SDimitry Andric   MbbIterator MBBIter = BB->begin(), End = BB->end();
3670b57cec5SDimitry Andric   while (MBBIter != End) {
3680b57cec5SDimitry Andric     bool IsMemOp = isNonVolatileMemoryOp(*MBBIter);
3690b57cec5SDimitry Andric 
3700b57cec5SDimitry Andric     if (IsMemOp) {
3710b57cec5SDimitry Andric       MachineOperand AluOperand = MBBIter->getOperand(3);
3720b57cec5SDimitry Andric       unsigned int DestReg = MBBIter->getOperand(0).getReg(),
3730b57cec5SDimitry Andric                    BaseReg = MBBIter->getOperand(1).getReg();
3740b57cec5SDimitry Andric       assert(AluOperand.isImm() && "Unexpected memory operator type");
3750b57cec5SDimitry Andric       LPAC::AluCode AluOpcode = static_cast<LPAC::AluCode>(AluOperand.getImm());
3760b57cec5SDimitry Andric 
3770b57cec5SDimitry Andric       // Skip memory operations that already modify the base register or if
3780b57cec5SDimitry Andric       // the destination and base register are the same
3790b57cec5SDimitry Andric       if (!LPAC::modifiesOp(AluOpcode) && DestReg != BaseReg) {
3800b57cec5SDimitry Andric         for (int Inc = 0; Inc <= 1; ++Inc) {
3810b57cec5SDimitry Andric           MbbIterator AluIter =
3820b57cec5SDimitry Andric               findClosestSuitableAluInstr(BB, MBBIter, Inc == 0);
3830b57cec5SDimitry Andric           if (AluIter != MBBIter) {
3840b57cec5SDimitry Andric             insertMergedInstruction(BB, MBBIter, AluIter, Inc == 0);
3850b57cec5SDimitry Andric 
3860b57cec5SDimitry Andric             ++NumLdStAluCombined;
3870b57cec5SDimitry Andric             Modified = true;
3880b57cec5SDimitry Andric 
3890b57cec5SDimitry Andric             // Erase the matching ALU instruction
3900b57cec5SDimitry Andric             BB->erase(AluIter);
3910b57cec5SDimitry Andric             // Erase old load/store instruction
3920b57cec5SDimitry Andric             BB->erase(MBBIter++);
3930b57cec5SDimitry Andric             break;
3940b57cec5SDimitry Andric           }
3950b57cec5SDimitry Andric         }
3960b57cec5SDimitry Andric       }
3970b57cec5SDimitry Andric     }
3980b57cec5SDimitry Andric     if (MBBIter == End)
3990b57cec5SDimitry Andric       break;
4000b57cec5SDimitry Andric     ++MBBIter;
4010b57cec5SDimitry Andric   }
4020b57cec5SDimitry Andric 
4030b57cec5SDimitry Andric   return Modified;
4040b57cec5SDimitry Andric }
4050b57cec5SDimitry Andric 
4060b57cec5SDimitry Andric // Driver function that iterates over the machine basic building blocks of a
4070b57cec5SDimitry Andric // machine function
4080b57cec5SDimitry Andric bool LanaiMemAluCombiner::runOnMachineFunction(MachineFunction &MF) {
4090b57cec5SDimitry Andric   if (DisableMemAluCombiner)
4100b57cec5SDimitry Andric     return false;
4110b57cec5SDimitry Andric 
4120b57cec5SDimitry Andric   TII = MF.getSubtarget<LanaiSubtarget>().getInstrInfo();
4130b57cec5SDimitry Andric   bool Modified = false;
414*04eeddc0SDimitry Andric   for (MachineBasicBlock &MBB : MF)
415*04eeddc0SDimitry Andric     Modified |= combineMemAluInBasicBlock(&MBB);
4160b57cec5SDimitry Andric   return Modified;
4170b57cec5SDimitry Andric }
4180b57cec5SDimitry Andric } // namespace
4190b57cec5SDimitry Andric 
4200b57cec5SDimitry Andric FunctionPass *llvm::createLanaiMemAluCombinerPass() {
4210b57cec5SDimitry Andric   return new LanaiMemAluCombiner();
4220b57cec5SDimitry Andric }
423