xref: /freebsd/contrib/llvm-project/llvm/lib/Target/Mips/MipsSEISelDAGToDAG.cpp (revision 71ac745d76c3ba442e753daff1870893f272b29d)
1 //===-- MipsSEISelDAGToDAG.cpp - A Dag to Dag Inst Selector for MipsSE ----===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // Subclass of MipsDAGToDAGISel specialized for mips32/64.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "MipsSEISelDAGToDAG.h"
14 #include "MCTargetDesc/MipsBaseInfo.h"
15 #include "Mips.h"
16 #include "MipsAnalyzeImmediate.h"
17 #include "MipsMachineFunction.h"
18 #include "MipsRegisterInfo.h"
19 #include "llvm/CodeGen/MachineConstantPool.h"
20 #include "llvm/CodeGen/MachineFrameInfo.h"
21 #include "llvm/CodeGen/MachineFunction.h"
22 #include "llvm/CodeGen/MachineInstrBuilder.h"
23 #include "llvm/CodeGen/MachineRegisterInfo.h"
24 #include "llvm/CodeGen/SelectionDAGNodes.h"
25 #include "llvm/IR/CFG.h"
26 #include "llvm/IR/Dominators.h"
27 #include "llvm/IR/GlobalValue.h"
28 #include "llvm/IR/Instructions.h"
29 #include "llvm/IR/Intrinsics.h"
30 #include "llvm/IR/IntrinsicsMips.h"
31 #include "llvm/IR/Type.h"
32 #include "llvm/Support/Debug.h"
33 #include "llvm/Support/ErrorHandling.h"
34 #include "llvm/Support/raw_ostream.h"
35 #include "llvm/Target/TargetMachine.h"
36 using namespace llvm;
37 
38 #define DEBUG_TYPE "mips-isel"
39 
runOnMachineFunction(MachineFunction & MF)40 bool MipsSEDAGToDAGISel::runOnMachineFunction(MachineFunction &MF) {
41   Subtarget = &MF.getSubtarget<MipsSubtarget>();
42   if (Subtarget->inMips16Mode())
43     return false;
44   return MipsDAGToDAGISel::runOnMachineFunction(MF);
45 }
46 
getAnalysisUsage(AnalysisUsage & AU) const47 void MipsSEDAGToDAGISelLegacy::getAnalysisUsage(AnalysisUsage &AU) const {
48   AU.addRequired<DominatorTreeWrapperPass>();
49   SelectionDAGISelLegacy::getAnalysisUsage(AU);
50 }
51 
addDSPCtrlRegOperands(bool IsDef,MachineInstr & MI,MachineFunction & MF)52 void MipsSEDAGToDAGISel::addDSPCtrlRegOperands(bool IsDef, MachineInstr &MI,
53                                                MachineFunction &MF) {
54   MachineInstrBuilder MIB(MF, &MI);
55   unsigned Mask = MI.getOperand(1).getImm();
56   unsigned Flag =
57       IsDef ? RegState::ImplicitDefine : RegState::Implicit | RegState::Undef;
58 
59   if (Mask & 1)
60     MIB.addReg(Mips::DSPPos, Flag);
61 
62   if (Mask & 2)
63     MIB.addReg(Mips::DSPSCount, Flag);
64 
65   if (Mask & 4)
66     MIB.addReg(Mips::DSPCarry, Flag);
67 
68   if (Mask & 8)
69     MIB.addReg(Mips::DSPOutFlag, Flag);
70 
71   if (Mask & 16)
72     MIB.addReg(Mips::DSPCCond, Flag);
73 
74   if (Mask & 32)
75     MIB.addReg(Mips::DSPEFI, Flag);
76 }
77 
getMSACtrlReg(const SDValue RegIdx) const78 unsigned MipsSEDAGToDAGISel::getMSACtrlReg(const SDValue RegIdx) const {
79   uint64_t RegNum = RegIdx->getAsZExtVal();
80   return Mips::MSACtrlRegClass.getRegister(RegNum);
81 }
82 
replaceUsesWithZeroReg(MachineRegisterInfo * MRI,const MachineInstr & MI)83 bool MipsSEDAGToDAGISel::replaceUsesWithZeroReg(MachineRegisterInfo *MRI,
84                                                 const MachineInstr& MI) {
85   unsigned DstReg = 0, ZeroReg = 0;
86 
87   // Check if MI is "addiu $dst, $zero, 0" or "daddiu $dst, $zero, 0".
88   if ((MI.getOpcode() == Mips::ADDiu) &&
89       (MI.getOperand(1).getReg() == Mips::ZERO) &&
90       (MI.getOperand(2).isImm()) &&
91       (MI.getOperand(2).getImm() == 0)) {
92     DstReg = MI.getOperand(0).getReg();
93     ZeroReg = Mips::ZERO;
94   } else if ((MI.getOpcode() == Mips::DADDiu) &&
95              (MI.getOperand(1).getReg() == Mips::ZERO_64) &&
96              (MI.getOperand(2).isImm()) &&
97              (MI.getOperand(2).getImm() == 0)) {
98     DstReg = MI.getOperand(0).getReg();
99     ZeroReg = Mips::ZERO_64;
100   }
101 
102   if (!DstReg)
103     return false;
104 
105   // Replace uses with ZeroReg.
106   for (MachineRegisterInfo::use_iterator U = MRI->use_begin(DstReg),
107        E = MRI->use_end(); U != E;) {
108     MachineOperand &MO = *U;
109     unsigned OpNo = U.getOperandNo();
110     MachineInstr *MI = MO.getParent();
111     ++U;
112 
113     // Do not replace if it is a phi's operand or is tied to def operand.
114     if (MI->isPHI() || MI->isRegTiedToDefOperand(OpNo) || MI->isPseudo())
115       continue;
116 
117     // Also, we have to check that the register class of the operand
118     // contains the zero register.
119     if (!MRI->getRegClass(MO.getReg())->contains(ZeroReg))
120       continue;
121 
122     MO.setReg(ZeroReg);
123   }
124 
125   return true;
126 }
127 
emitMCountABI(MachineInstr & MI,MachineBasicBlock & MBB,MachineFunction & MF)128 void MipsSEDAGToDAGISel::emitMCountABI(MachineInstr &MI, MachineBasicBlock &MBB,
129                                        MachineFunction &MF) {
130   MachineInstrBuilder MIB(MF, &MI);
131   if (!Subtarget->isABI_O32()) { // N32, N64
132     // Save current return address.
133     BuildMI(MBB, &MI, MI.getDebugLoc(), TII->get(Mips::OR64))
134         .addDef(Mips::AT_64)
135         .addUse(Mips::RA_64, RegState::Undef)
136         .addUse(Mips::ZERO_64);
137     // Stops instruction above from being removed later on.
138     MIB.addUse(Mips::AT_64, RegState::Implicit);
139   } else {  // O32
140     // Save current return address.
141     BuildMI(MBB, &MI, MI.getDebugLoc(), TII->get(Mips::OR))
142         .addDef(Mips::AT)
143         .addUse(Mips::RA, RegState::Undef)
144         .addUse(Mips::ZERO);
145     // _mcount pops 2 words from stack.
146     BuildMI(MBB, &MI, MI.getDebugLoc(), TII->get(Mips::ADDiu))
147         .addDef(Mips::SP)
148         .addUse(Mips::SP)
149         .addImm(-8);
150     // Stops first instruction above from being removed later on.
151     MIB.addUse(Mips::AT, RegState::Implicit);
152   }
153 }
154 
processFunctionAfterISel(MachineFunction & MF)155 void MipsSEDAGToDAGISel::processFunctionAfterISel(MachineFunction &MF) {
156   MF.getInfo<MipsFunctionInfo>()->initGlobalBaseReg(MF);
157 
158   MachineRegisterInfo *MRI = &MF.getRegInfo();
159 
160   for (auto &MBB: MF) {
161     for (auto &MI: MBB) {
162       switch (MI.getOpcode()) {
163       case Mips::RDDSP:
164         addDSPCtrlRegOperands(false, MI, MF);
165         break;
166       case Mips::WRDSP:
167         addDSPCtrlRegOperands(true, MI, MF);
168         break;
169       case Mips::BuildPairF64_64:
170       case Mips::ExtractElementF64_64:
171         if (!Subtarget->useOddSPReg()) {
172           MI.addOperand(MachineOperand::CreateReg(Mips::SP, false, true));
173           break;
174         }
175         [[fallthrough]];
176       case Mips::BuildPairF64:
177       case Mips::ExtractElementF64:
178         if (Subtarget->isABI_FPXX() && !Subtarget->hasMTHC1())
179           MI.addOperand(MachineOperand::CreateReg(Mips::SP, false, true));
180         break;
181       case Mips::JAL:
182       case Mips::JAL_MM:
183         if (MI.getOperand(0).isGlobal() &&
184             MI.getOperand(0).getGlobal()->getGlobalIdentifier() == "_mcount")
185           emitMCountABI(MI, MBB, MF);
186         break;
187       case Mips::JALRPseudo:
188       case Mips::JALR64Pseudo:
189       case Mips::JALR16_MM:
190         if (MI.getOperand(2).isMCSymbol() &&
191             MI.getOperand(2).getMCSymbol()->getName() == "_mcount")
192           emitMCountABI(MI, MBB, MF);
193         break;
194       case Mips::JALR:
195         if (MI.getOperand(3).isMCSymbol() &&
196             MI.getOperand(3).getMCSymbol()->getName() == "_mcount")
197           emitMCountABI(MI, MBB, MF);
198         break;
199       default:
200         replaceUsesWithZeroReg(MRI, MI);
201       }
202     }
203   }
204 }
205 
selectAddE(SDNode * Node,const SDLoc & DL) const206 void MipsSEDAGToDAGISel::selectAddE(SDNode *Node, const SDLoc &DL) const {
207   SDValue InGlue = Node->getOperand(2);
208   unsigned Opc = InGlue.getOpcode();
209   SDValue LHS = Node->getOperand(0), RHS = Node->getOperand(1);
210   EVT VT = LHS.getValueType();
211 
212   // In the base case, we can rely on the carry bit from the addsc
213   // instruction.
214   if (Opc == ISD::ADDC) {
215     SDValue Ops[3] = {LHS, RHS, InGlue};
216     CurDAG->SelectNodeTo(Node, Mips::ADDWC, VT, MVT::Glue, Ops);
217     return;
218   }
219 
220   assert(Opc == ISD::ADDE && "ISD::ADDE not in a chain of ADDE nodes!");
221 
222   // The more complex case is when there is a chain of ISD::ADDE nodes like:
223   // (adde (adde (adde (addc a b) c) d) e).
224   //
225   // The addwc instruction does not write to the carry bit, instead it writes
226   // to bit 20 of the dsp control register. To match this series of nodes, each
227   // intermediate adde node must be expanded to write the carry bit before the
228   // addition.
229 
230   // Start by reading the overflow field for addsc and moving the value to the
231   // carry field. The usage of 1 here with MipsISD::RDDSP / Mips::WRDSP
232   // corresponds to reading/writing the entire control register to/from a GPR.
233 
234   SDValue CstOne = CurDAG->getTargetConstant(1, DL, MVT::i32);
235 
236   SDValue OuFlag = CurDAG->getTargetConstant(20, DL, MVT::i32);
237 
238   SDNode *DSPCtrlField = CurDAG->getMachineNode(Mips::RDDSP, DL, MVT::i32,
239                                                 MVT::Glue, CstOne, InGlue);
240 
241   SDNode *Carry = CurDAG->getMachineNode(
242       Mips::EXT, DL, MVT::i32, SDValue(DSPCtrlField, 0), OuFlag, CstOne);
243 
244   SDValue Ops[4] = {SDValue(DSPCtrlField, 0),
245                     CurDAG->getTargetConstant(6, DL, MVT::i32), CstOne,
246                     SDValue(Carry, 0)};
247   SDNode *DSPCFWithCarry = CurDAG->getMachineNode(Mips::INS, DL, MVT::i32, Ops);
248 
249   // My reading of the MIPS DSP 3.01 specification isn't as clear as I
250   // would like about whether bit 20 always gets overwritten by addwc.
251   // Hence take an extremely conservative view and presume it's sticky. We
252   // therefore need to clear it.
253 
254   SDValue Zero = CurDAG->getRegister(Mips::ZERO, MVT::i32);
255 
256   SDValue InsOps[4] = {Zero, OuFlag, CstOne, SDValue(DSPCFWithCarry, 0)};
257   SDNode *DSPCtrlFinal =
258       CurDAG->getMachineNode(Mips::INS, DL, MVT::i32, InsOps);
259 
260   SDNode *WrDSP = CurDAG->getMachineNode(Mips::WRDSP, DL, MVT::Glue,
261                                          SDValue(DSPCtrlFinal, 0), CstOne);
262 
263   SDValue Operands[3] = {LHS, RHS, SDValue(WrDSP, 0)};
264   CurDAG->SelectNodeTo(Node, Mips::ADDWC, VT, MVT::Glue, Operands);
265 }
266 
267 /// Match frameindex
selectAddrFrameIndex(SDValue Addr,SDValue & Base,SDValue & Offset) const268 bool MipsSEDAGToDAGISel::selectAddrFrameIndex(SDValue Addr, SDValue &Base,
269                                               SDValue &Offset) const {
270   if (FrameIndexSDNode *FIN = dyn_cast<FrameIndexSDNode>(Addr)) {
271     EVT ValTy = Addr.getValueType();
272 
273     Base   = CurDAG->getTargetFrameIndex(FIN->getIndex(), ValTy);
274     Offset = CurDAG->getTargetConstant(0, SDLoc(Addr), ValTy);
275     return true;
276   }
277   return false;
278 }
279 
280 /// Match frameindex+offset and frameindex|offset
selectAddrFrameIndexOffset(SDValue Addr,SDValue & Base,SDValue & Offset,unsigned OffsetBits,unsigned ShiftAmount=0) const281 bool MipsSEDAGToDAGISel::selectAddrFrameIndexOffset(
282     SDValue Addr, SDValue &Base, SDValue &Offset, unsigned OffsetBits,
283     unsigned ShiftAmount = 0) const {
284   if (CurDAG->isBaseWithConstantOffset(Addr)) {
285     auto *CN = cast<ConstantSDNode>(Addr.getOperand(1));
286     if (isIntN(OffsetBits + ShiftAmount, CN->getSExtValue())) {
287       EVT ValTy = Addr.getValueType();
288 
289       // If the first operand is a FI, get the TargetFI Node
290       if (FrameIndexSDNode *FIN =
291               dyn_cast<FrameIndexSDNode>(Addr.getOperand(0)))
292         Base = CurDAG->getTargetFrameIndex(FIN->getIndex(), ValTy);
293       else {
294         Base = Addr.getOperand(0);
295         // If base is a FI, additional offset calculation is done in
296         // eliminateFrameIndex, otherwise we need to check the alignment
297         const Align Alignment(1ULL << ShiftAmount);
298         if (!isAligned(Alignment, CN->getZExtValue()))
299           return false;
300       }
301 
302       Offset = CurDAG->getTargetConstant(CN->getZExtValue(), SDLoc(Addr),
303                                          ValTy);
304       return true;
305     }
306   }
307   return false;
308 }
309 
310 /// ComplexPattern used on MipsInstrInfo
311 /// Used on Mips Load/Store instructions
selectAddrRegImm(SDValue Addr,SDValue & Base,SDValue & Offset) const312 bool MipsSEDAGToDAGISel::selectAddrRegImm(SDValue Addr, SDValue &Base,
313                                           SDValue &Offset) const {
314   // if Address is FI, get the TargetFrameIndex.
315   if (selectAddrFrameIndex(Addr, Base, Offset))
316     return true;
317 
318   // on PIC code Load GA
319   if (Addr.getOpcode() == MipsISD::Wrapper) {
320     Base   = Addr.getOperand(0);
321     Offset = Addr.getOperand(1);
322     return true;
323   }
324 
325   if (!TM.isPositionIndependent()) {
326     if ((Addr.getOpcode() == ISD::TargetExternalSymbol ||
327         Addr.getOpcode() == ISD::TargetGlobalAddress))
328       return false;
329   }
330 
331   // Addresses of the form FI+const or FI|const
332   if (selectAddrFrameIndexOffset(Addr, Base, Offset, 16))
333     return true;
334 
335   // Operand is a result from an ADD.
336   if (Addr.getOpcode() == ISD::ADD) {
337     // When loading from constant pools, load the lower address part in
338     // the instruction itself. Example, instead of:
339     //  lui $2, %hi($CPI1_0)
340     //  addiu $2, $2, %lo($CPI1_0)
341     //  lwc1 $f0, 0($2)
342     // Generate:
343     //  lui $2, %hi($CPI1_0)
344     //  lwc1 $f0, %lo($CPI1_0)($2)
345     if (Addr.getOperand(1).getOpcode() == MipsISD::Lo ||
346         Addr.getOperand(1).getOpcode() == MipsISD::GPRel) {
347       SDValue Opnd0 = Addr.getOperand(1).getOperand(0);
348       if (isa<ConstantPoolSDNode>(Opnd0) || isa<GlobalAddressSDNode>(Opnd0) ||
349           isa<JumpTableSDNode>(Opnd0)) {
350         Base = Addr.getOperand(0);
351         Offset = Opnd0;
352         return true;
353       }
354     }
355   }
356 
357   return false;
358 }
359 
360 /// ComplexPattern used on MipsInstrInfo
361 /// Used on Mips Load/Store instructions
selectAddrDefault(SDValue Addr,SDValue & Base,SDValue & Offset) const362 bool MipsSEDAGToDAGISel::selectAddrDefault(SDValue Addr, SDValue &Base,
363                                            SDValue &Offset) const {
364   Base = Addr;
365   Offset = CurDAG->getTargetConstant(0, SDLoc(Addr), Addr.getValueType());
366   return true;
367 }
368 
selectIntAddr(SDValue Addr,SDValue & Base,SDValue & Offset) const369 bool MipsSEDAGToDAGISel::selectIntAddr(SDValue Addr, SDValue &Base,
370                                        SDValue &Offset) const {
371   return selectAddrRegImm(Addr, Base, Offset) ||
372     selectAddrDefault(Addr, Base, Offset);
373 }
374 
selectAddrRegImm9(SDValue Addr,SDValue & Base,SDValue & Offset) const375 bool MipsSEDAGToDAGISel::selectAddrRegImm9(SDValue Addr, SDValue &Base,
376                                            SDValue &Offset) const {
377   if (selectAddrFrameIndex(Addr, Base, Offset))
378     return true;
379 
380   if (selectAddrFrameIndexOffset(Addr, Base, Offset, 9))
381     return true;
382 
383   return false;
384 }
385 
386 /// Used on microMIPS LWC2, LDC2, SWC2 and SDC2 instructions (11-bit offset)
selectAddrRegImm11(SDValue Addr,SDValue & Base,SDValue & Offset) const387 bool MipsSEDAGToDAGISel::selectAddrRegImm11(SDValue Addr, SDValue &Base,
388                                             SDValue &Offset) const {
389   if (selectAddrFrameIndex(Addr, Base, Offset))
390     return true;
391 
392   if (selectAddrFrameIndexOffset(Addr, Base, Offset, 11))
393     return true;
394 
395   return false;
396 }
397 
398 /// Used on microMIPS Load/Store unaligned instructions (12-bit offset)
selectAddrRegImm12(SDValue Addr,SDValue & Base,SDValue & Offset) const399 bool MipsSEDAGToDAGISel::selectAddrRegImm12(SDValue Addr, SDValue &Base,
400                                             SDValue &Offset) const {
401   if (selectAddrFrameIndex(Addr, Base, Offset))
402     return true;
403 
404   if (selectAddrFrameIndexOffset(Addr, Base, Offset, 12))
405     return true;
406 
407   return false;
408 }
409 
selectAddrRegImm16(SDValue Addr,SDValue & Base,SDValue & Offset) const410 bool MipsSEDAGToDAGISel::selectAddrRegImm16(SDValue Addr, SDValue &Base,
411                                             SDValue &Offset) const {
412   if (selectAddrFrameIndex(Addr, Base, Offset))
413     return true;
414 
415   if (selectAddrFrameIndexOffset(Addr, Base, Offset, 16))
416     return true;
417 
418   return false;
419 }
420 
selectIntAddr11MM(SDValue Addr,SDValue & Base,SDValue & Offset) const421 bool MipsSEDAGToDAGISel::selectIntAddr11MM(SDValue Addr, SDValue &Base,
422                                          SDValue &Offset) const {
423   return selectAddrRegImm11(Addr, Base, Offset) ||
424     selectAddrDefault(Addr, Base, Offset);
425 }
426 
selectIntAddr12MM(SDValue Addr,SDValue & Base,SDValue & Offset) const427 bool MipsSEDAGToDAGISel::selectIntAddr12MM(SDValue Addr, SDValue &Base,
428                                          SDValue &Offset) const {
429   return selectAddrRegImm12(Addr, Base, Offset) ||
430     selectAddrDefault(Addr, Base, Offset);
431 }
432 
selectIntAddr16MM(SDValue Addr,SDValue & Base,SDValue & Offset) const433 bool MipsSEDAGToDAGISel::selectIntAddr16MM(SDValue Addr, SDValue &Base,
434                                          SDValue &Offset) const {
435   return selectAddrRegImm16(Addr, Base, Offset) ||
436     selectAddrDefault(Addr, Base, Offset);
437 }
438 
selectIntAddrLSL2MM(SDValue Addr,SDValue & Base,SDValue & Offset) const439 bool MipsSEDAGToDAGISel::selectIntAddrLSL2MM(SDValue Addr, SDValue &Base,
440                                              SDValue &Offset) const {
441   if (selectAddrFrameIndexOffset(Addr, Base, Offset, 7)) {
442     if (isa<FrameIndexSDNode>(Base))
443       return false;
444 
445     if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(Offset)) {
446       unsigned CnstOff = CN->getZExtValue();
447       return (CnstOff == (CnstOff & 0x3c));
448     }
449 
450     return false;
451   }
452 
453   // For all other cases where "lw" would be selected, don't select "lw16"
454   // because it would result in additional instructions to prepare operands.
455   if (selectAddrRegImm(Addr, Base, Offset))
456     return false;
457 
458   return selectAddrDefault(Addr, Base, Offset);
459 }
460 
selectIntAddrSImm10(SDValue Addr,SDValue & Base,SDValue & Offset) const461 bool MipsSEDAGToDAGISel::selectIntAddrSImm10(SDValue Addr, SDValue &Base,
462                                              SDValue &Offset) const {
463 
464   if (selectAddrFrameIndex(Addr, Base, Offset))
465     return true;
466 
467   if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10))
468     return true;
469 
470   return selectAddrDefault(Addr, Base, Offset);
471 }
472 
selectIntAddrSImm10Lsl1(SDValue Addr,SDValue & Base,SDValue & Offset) const473 bool MipsSEDAGToDAGISel::selectIntAddrSImm10Lsl1(SDValue Addr, SDValue &Base,
474                                                  SDValue &Offset) const {
475   if (selectAddrFrameIndex(Addr, Base, Offset))
476     return true;
477 
478   if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10, 1))
479     return true;
480 
481   return selectAddrDefault(Addr, Base, Offset);
482 }
483 
selectIntAddrSImm10Lsl2(SDValue Addr,SDValue & Base,SDValue & Offset) const484 bool MipsSEDAGToDAGISel::selectIntAddrSImm10Lsl2(SDValue Addr, SDValue &Base,
485                                                  SDValue &Offset) const {
486   if (selectAddrFrameIndex(Addr, Base, Offset))
487     return true;
488 
489   if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10, 2))
490     return true;
491 
492   return selectAddrDefault(Addr, Base, Offset);
493 }
494 
selectIntAddrSImm10Lsl3(SDValue Addr,SDValue & Base,SDValue & Offset) const495 bool MipsSEDAGToDAGISel::selectIntAddrSImm10Lsl3(SDValue Addr, SDValue &Base,
496                                                  SDValue &Offset) const {
497   if (selectAddrFrameIndex(Addr, Base, Offset))
498     return true;
499 
500   if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10, 3))
501     return true;
502 
503   return selectAddrDefault(Addr, Base, Offset);
504 }
505 
506 // Select constant vector splats.
507 //
508 // Returns true and sets Imm if:
509 // * MSA is enabled
510 // * N is a ISD::BUILD_VECTOR representing a constant splat
selectVSplat(SDNode * N,APInt & Imm,unsigned MinSizeInBits) const511 bool MipsSEDAGToDAGISel::selectVSplat(SDNode *N, APInt &Imm,
512                                       unsigned MinSizeInBits) const {
513   if (!Subtarget->hasMSA())
514     return false;
515 
516   BuildVectorSDNode *Node = dyn_cast<BuildVectorSDNode>(N);
517 
518   if (!Node)
519     return false;
520 
521   APInt SplatValue, SplatUndef;
522   unsigned SplatBitSize;
523   bool HasAnyUndefs;
524 
525   if (!Node->isConstantSplat(SplatValue, SplatUndef, SplatBitSize, HasAnyUndefs,
526                              MinSizeInBits, !Subtarget->isLittle()))
527     return false;
528 
529   Imm = SplatValue;
530 
531   return true;
532 }
533 
534 // Select constant vector splats.
535 //
536 // In addition to the requirements of selectVSplat(), this function returns
537 // true and sets Imm if:
538 // * The splat value is the same width as the elements of the vector
539 // * The splat value fits in an integer with the specified signed-ness and
540 //   width.
541 //
542 // This function looks through ISD::BITCAST nodes.
543 // TODO: This might not be appropriate for big-endian MSA since BITCAST is
544 //       sometimes a shuffle in big-endian mode.
545 //
546 // It's worth noting that this function is not used as part of the selection
547 // of ldi.[bhwd] since it does not permit using the wrong-typed ldi.[bhwd]
548 // instruction to achieve the desired bit pattern. ldi.[bhwd] is selected in
549 // MipsSEDAGToDAGISel::selectNode.
550 bool MipsSEDAGToDAGISel::
selectVSplatCommon(SDValue N,SDValue & Imm,bool Signed,unsigned ImmBitSize) const551 selectVSplatCommon(SDValue N, SDValue &Imm, bool Signed,
552                    unsigned ImmBitSize) const {
553   APInt ImmValue;
554   EVT EltTy = N->getValueType(0).getVectorElementType();
555 
556   if (N->getOpcode() == ISD::BITCAST)
557     N = N->getOperand(0);
558 
559   if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
560       ImmValue.getBitWidth() == EltTy.getSizeInBits()) {
561 
562     if (( Signed && ImmValue.isSignedIntN(ImmBitSize)) ||
563         (!Signed && ImmValue.isIntN(ImmBitSize))) {
564       Imm = CurDAG->getTargetConstant(ImmValue, SDLoc(N), EltTy);
565       return true;
566     }
567   }
568 
569   return false;
570 }
571 
572 // Select constant vector splats.
573 bool MipsSEDAGToDAGISel::
selectVSplatUimm1(SDValue N,SDValue & Imm) const574 selectVSplatUimm1(SDValue N, SDValue &Imm) const {
575   return selectVSplatCommon(N, Imm, false, 1);
576 }
577 
578 bool MipsSEDAGToDAGISel::
selectVSplatUimm2(SDValue N,SDValue & Imm) const579 selectVSplatUimm2(SDValue N, SDValue &Imm) const {
580   return selectVSplatCommon(N, Imm, false, 2);
581 }
582 
583 bool MipsSEDAGToDAGISel::
selectVSplatUimm3(SDValue N,SDValue & Imm) const584 selectVSplatUimm3(SDValue N, SDValue &Imm) const {
585   return selectVSplatCommon(N, Imm, false, 3);
586 }
587 
588 // Select constant vector splats.
589 bool MipsSEDAGToDAGISel::
selectVSplatUimm4(SDValue N,SDValue & Imm) const590 selectVSplatUimm4(SDValue N, SDValue &Imm) const {
591   return selectVSplatCommon(N, Imm, false, 4);
592 }
593 
594 // Select constant vector splats.
595 bool MipsSEDAGToDAGISel::
selectVSplatUimm5(SDValue N,SDValue & Imm) const596 selectVSplatUimm5(SDValue N, SDValue &Imm) const {
597   return selectVSplatCommon(N, Imm, false, 5);
598 }
599 
600 // Select constant vector splats.
601 bool MipsSEDAGToDAGISel::
selectVSplatUimm6(SDValue N,SDValue & Imm) const602 selectVSplatUimm6(SDValue N, SDValue &Imm) const {
603   return selectVSplatCommon(N, Imm, false, 6);
604 }
605 
606 // Select constant vector splats.
607 bool MipsSEDAGToDAGISel::
selectVSplatUimm8(SDValue N,SDValue & Imm) const608 selectVSplatUimm8(SDValue N, SDValue &Imm) const {
609   return selectVSplatCommon(N, Imm, false, 8);
610 }
611 
612 // Select constant vector splats.
613 bool MipsSEDAGToDAGISel::
selectVSplatSimm5(SDValue N,SDValue & Imm) const614 selectVSplatSimm5(SDValue N, SDValue &Imm) const {
615   return selectVSplatCommon(N, Imm, true, 5);
616 }
617 
618 // Select constant vector splats whose value is a power of 2.
619 //
620 // In addition to the requirements of selectVSplat(), this function returns
621 // true and sets Imm if:
622 // * The splat value is the same width as the elements of the vector
623 // * The splat value is a power of two.
624 //
625 // This function looks through ISD::BITCAST nodes.
626 // TODO: This might not be appropriate for big-endian MSA since BITCAST is
627 //       sometimes a shuffle in big-endian mode.
selectVSplatUimmPow2(SDValue N,SDValue & Imm) const628 bool MipsSEDAGToDAGISel::selectVSplatUimmPow2(SDValue N, SDValue &Imm) const {
629   APInt ImmValue;
630   EVT EltTy = N->getValueType(0).getVectorElementType();
631 
632   if (N->getOpcode() == ISD::BITCAST)
633     N = N->getOperand(0);
634 
635   if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
636       ImmValue.getBitWidth() == EltTy.getSizeInBits()) {
637     int32_t Log2 = ImmValue.exactLogBase2();
638 
639     if (Log2 != -1) {
640       Imm = CurDAG->getTargetConstant(Log2, SDLoc(N), EltTy);
641       return true;
642     }
643   }
644 
645   return false;
646 }
647 
648 // Select constant vector splats whose value only has a consecutive sequence
649 // of left-most bits set (e.g. 0b11...1100...00).
650 //
651 // In addition to the requirements of selectVSplat(), this function returns
652 // true and sets Imm if:
653 // * The splat value is the same width as the elements of the vector
654 // * The splat value is a consecutive sequence of left-most bits.
655 //
656 // This function looks through ISD::BITCAST nodes.
657 // TODO: This might not be appropriate for big-endian MSA since BITCAST is
658 //       sometimes a shuffle in big-endian mode.
selectVSplatMaskL(SDValue N,SDValue & Imm) const659 bool MipsSEDAGToDAGISel::selectVSplatMaskL(SDValue N, SDValue &Imm) const {
660   APInt ImmValue;
661   EVT EltTy = N->getValueType(0).getVectorElementType();
662 
663   if (N->getOpcode() == ISD::BITCAST)
664     N = N->getOperand(0);
665 
666   if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
667       ImmValue.getBitWidth() == EltTy.getSizeInBits()) {
668     // Extract the run of set bits starting with bit zero from the bitwise
669     // inverse of ImmValue, and test that the inverse of this is the same
670     // as the original value.
671     if (ImmValue == ~(~ImmValue & ~(~ImmValue + 1))) {
672 
673       Imm = CurDAG->getTargetConstant(ImmValue.popcount() - 1, SDLoc(N), EltTy);
674       return true;
675     }
676   }
677 
678   return false;
679 }
680 
681 // Select constant vector splats whose value only has a consecutive sequence
682 // of right-most bits set (e.g. 0b00...0011...11).
683 //
684 // In addition to the requirements of selectVSplat(), this function returns
685 // true and sets Imm if:
686 // * The splat value is the same width as the elements of the vector
687 // * The splat value is a consecutive sequence of right-most bits.
688 //
689 // This function looks through ISD::BITCAST nodes.
690 // TODO: This might not be appropriate for big-endian MSA since BITCAST is
691 //       sometimes a shuffle in big-endian mode.
selectVSplatMaskR(SDValue N,SDValue & Imm) const692 bool MipsSEDAGToDAGISel::selectVSplatMaskR(SDValue N, SDValue &Imm) const {
693   APInt ImmValue;
694   EVT EltTy = N->getValueType(0).getVectorElementType();
695 
696   if (N->getOpcode() == ISD::BITCAST)
697     N = N->getOperand(0);
698 
699   if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
700       ImmValue.getBitWidth() == EltTy.getSizeInBits()) {
701     // Extract the run of set bits starting with bit zero, and test that the
702     // result is the same as the original value
703     if (ImmValue == (ImmValue & ~(ImmValue + 1))) {
704       Imm = CurDAG->getTargetConstant(ImmValue.popcount() - 1, SDLoc(N), EltTy);
705       return true;
706     }
707   }
708 
709   return false;
710 }
711 
selectVSplatUimmInvPow2(SDValue N,SDValue & Imm) const712 bool MipsSEDAGToDAGISel::selectVSplatUimmInvPow2(SDValue N,
713                                                  SDValue &Imm) const {
714   APInt ImmValue;
715   EVT EltTy = N->getValueType(0).getVectorElementType();
716 
717   if (N->getOpcode() == ISD::BITCAST)
718     N = N->getOperand(0);
719 
720   if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
721       ImmValue.getBitWidth() == EltTy.getSizeInBits()) {
722     int32_t Log2 = (~ImmValue).exactLogBase2();
723 
724     if (Log2 != -1) {
725       Imm = CurDAG->getTargetConstant(Log2, SDLoc(N), EltTy);
726       return true;
727     }
728   }
729 
730   return false;
731 }
732 
733 // Select const vector splat of 1.
selectVSplatImmEq1(SDValue N) const734 bool MipsSEDAGToDAGISel::selectVSplatImmEq1(SDValue N) const {
735   APInt ImmValue;
736   EVT EltTy = N->getValueType(0).getVectorElementType();
737 
738   if (N->getOpcode() == ISD::BITCAST)
739     N = N->getOperand(0);
740 
741   return selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
742          ImmValue.getBitWidth() == EltTy.getSizeInBits() && ImmValue == 1;
743 }
744 
trySelect(SDNode * Node)745 bool MipsSEDAGToDAGISel::trySelect(SDNode *Node) {
746   unsigned Opcode = Node->getOpcode();
747   SDLoc DL(Node);
748 
749   ///
750   // Instruction Selection not handled by the auto-generated
751   // tablegen selection should be handled here.
752   ///
753   switch(Opcode) {
754   default: break;
755 
756   case MipsISD::DOUBLE_SELECT_I:
757   case MipsISD::DOUBLE_SELECT_I64: {
758     MVT VT = Subtarget->isGP64bit() ? MVT::i64 : MVT::i32;
759     SDValue cond = Node->getOperand(0);
760     SDValue Hi1 = Node->getOperand(1);
761     SDValue Lo1 = Node->getOperand(2);
762     SDValue Hi2 = Node->getOperand(3);
763     SDValue Lo2 = Node->getOperand(4);
764 
765     SDValue ops[] = {cond, Hi1, Lo1, Hi2, Lo2};
766     EVT NodeTys[] = {VT, VT};
767     ReplaceNode(Node, CurDAG->getMachineNode(Subtarget->isGP64bit()
768                                                  ? Mips::PseudoD_SELECT_I64
769                                                  : Mips::PseudoD_SELECT_I,
770                                              DL, NodeTys, ops));
771     return true;
772   }
773 
774   case ISD::ADDE: {
775     selectAddE(Node, DL);
776     return true;
777   }
778 
779   case ISD::ConstantFP: {
780     auto *CN = cast<ConstantFPSDNode>(Node);
781     if (Node->getValueType(0) == MVT::f64 && CN->isExactlyValue(+0.0)) {
782       if (Subtarget->isGP64bit()) {
783         SDValue Zero = CurDAG->getCopyFromReg(CurDAG->getEntryNode(), DL,
784                                               Mips::ZERO_64, MVT::i64);
785         ReplaceNode(Node,
786                     CurDAG->getMachineNode(Mips::DMTC1, DL, MVT::f64, Zero));
787       } else if (Subtarget->isFP64bit()) {
788         SDValue Zero = CurDAG->getCopyFromReg(CurDAG->getEntryNode(), DL,
789                                               Mips::ZERO, MVT::i32);
790         ReplaceNode(Node, CurDAG->getMachineNode(Mips::BuildPairF64_64, DL,
791                                                  MVT::f64, Zero, Zero));
792       } else {
793         SDValue Zero = CurDAG->getCopyFromReg(CurDAG->getEntryNode(), DL,
794                                               Mips::ZERO, MVT::i32);
795         ReplaceNode(Node, CurDAG->getMachineNode(Mips::BuildPairF64, DL,
796                                                  MVT::f64, Zero, Zero));
797       }
798       return true;
799     }
800     break;
801   }
802 
803   case ISD::Constant: {
804     auto *CN = cast<ConstantSDNode>(Node);
805     int64_t Imm = CN->getSExtValue();
806     unsigned Size = CN->getValueSizeInBits(0);
807 
808     if (isInt<32>(Imm))
809       break;
810 
811     MipsAnalyzeImmediate AnalyzeImm;
812 
813     const MipsAnalyzeImmediate::InstSeq &Seq =
814       AnalyzeImm.Analyze(Imm, Size, false);
815 
816     MipsAnalyzeImmediate::InstSeq::const_iterator Inst = Seq.begin();
817     SDLoc DL(CN);
818     SDNode *RegOpnd;
819     SDValue ImmOpnd = CurDAG->getTargetConstant(SignExtend64<16>(Inst->ImmOpnd),
820                                                 DL, MVT::i64);
821 
822     // The first instruction can be a LUi which is different from other
823     // instructions (ADDiu, ORI and SLL) in that it does not have a register
824     // operand.
825     if (Inst->Opc == Mips::LUi64)
826       RegOpnd = CurDAG->getMachineNode(Inst->Opc, DL, MVT::i64, ImmOpnd);
827     else
828       RegOpnd =
829         CurDAG->getMachineNode(Inst->Opc, DL, MVT::i64,
830                                CurDAG->getRegister(Mips::ZERO_64, MVT::i64),
831                                ImmOpnd);
832 
833     // The remaining instructions in the sequence are handled here.
834     for (++Inst; Inst != Seq.end(); ++Inst) {
835       ImmOpnd = CurDAG->getTargetConstant(SignExtend64<16>(Inst->ImmOpnd), DL,
836                                           MVT::i64);
837       RegOpnd = CurDAG->getMachineNode(Inst->Opc, DL, MVT::i64,
838                                        SDValue(RegOpnd, 0), ImmOpnd);
839     }
840 
841     ReplaceNode(Node, RegOpnd);
842     return true;
843   }
844 
845   case ISD::INTRINSIC_W_CHAIN: {
846     const unsigned IntrinsicOpcode = Node->getConstantOperandVal(1);
847     switch (IntrinsicOpcode) {
848     default:
849       break;
850 
851     case Intrinsic::mips_cfcmsa: {
852       SDValue ChainIn = Node->getOperand(0);
853       SDValue RegIdx = Node->getOperand(2);
854       SDValue Reg = CurDAG->getCopyFromReg(ChainIn, DL,
855                                            getMSACtrlReg(RegIdx), MVT::i32);
856       ReplaceNode(Node, Reg.getNode());
857       return true;
858     }
859     case Intrinsic::mips_ldr_d:
860     case Intrinsic::mips_ldr_w: {
861       unsigned Op = (IntrinsicOpcode == Intrinsic::mips_ldr_d) ? Mips::LDR_D
862                                                                : Mips::LDR_W;
863 
864       SDLoc DL(Node);
865       assert(Node->getNumOperands() == 4 && "Unexpected number of operands.");
866       const SDValue &Chain = Node->getOperand(0);
867       const SDValue &Intrinsic = Node->getOperand(1);
868       const SDValue &Pointer = Node->getOperand(2);
869       const SDValue &Constant = Node->getOperand(3);
870 
871       assert(Chain.getValueType() == MVT::Other);
872       (void)Intrinsic;
873       assert(Intrinsic.getOpcode() == ISD::TargetConstant &&
874              Constant.getOpcode() == ISD::Constant &&
875              "Invalid instruction operand.");
876 
877       // Convert Constant to TargetConstant.
878       const ConstantInt *Val =
879           cast<ConstantSDNode>(Constant)->getConstantIntValue();
880       SDValue Imm =
881           CurDAG->getTargetConstant(*Val, DL, Constant.getValueType());
882 
883       SmallVector<SDValue, 3> Ops{Pointer, Imm, Chain};
884 
885       assert(Node->getNumValues() == 2);
886       assert(Node->getValueType(0).is128BitVector());
887       assert(Node->getValueType(1) == MVT::Other);
888       SmallVector<EVT, 2> ResTys{Node->getValueType(0), Node->getValueType(1)};
889 
890       ReplaceNode(Node, CurDAG->getMachineNode(Op, DL, ResTys, Ops));
891 
892       return true;
893     }
894     }
895     break;
896   }
897 
898   case ISD::INTRINSIC_WO_CHAIN: {
899     switch (Node->getConstantOperandVal(0)) {
900     default:
901       break;
902 
903     case Intrinsic::mips_move_v:
904       // Like an assignment but will always produce a move.v even if
905       // unnecessary.
906       ReplaceNode(Node, CurDAG->getMachineNode(Mips::MOVE_V, DL,
907                                                Node->getValueType(0),
908                                                Node->getOperand(1)));
909       return true;
910     }
911     break;
912   }
913 
914   case ISD::INTRINSIC_VOID: {
915     const unsigned IntrinsicOpcode = Node->getConstantOperandVal(1);
916     switch (IntrinsicOpcode) {
917     default:
918       break;
919 
920     case Intrinsic::mips_ctcmsa: {
921       SDValue ChainIn = Node->getOperand(0);
922       SDValue RegIdx  = Node->getOperand(2);
923       SDValue Value   = Node->getOperand(3);
924       SDValue ChainOut = CurDAG->getCopyToReg(ChainIn, DL,
925                                               getMSACtrlReg(RegIdx), Value);
926       ReplaceNode(Node, ChainOut.getNode());
927       return true;
928     }
929     case Intrinsic::mips_str_d:
930     case Intrinsic::mips_str_w: {
931       unsigned Op = (IntrinsicOpcode == Intrinsic::mips_str_d) ? Mips::STR_D
932                                                                : Mips::STR_W;
933 
934       SDLoc DL(Node);
935       assert(Node->getNumOperands() == 5 && "Unexpected number of operands.");
936       const SDValue &Chain = Node->getOperand(0);
937       const SDValue &Intrinsic = Node->getOperand(1);
938       const SDValue &Vec = Node->getOperand(2);
939       const SDValue &Pointer = Node->getOperand(3);
940       const SDValue &Constant = Node->getOperand(4);
941 
942       assert(Chain.getValueType() == MVT::Other);
943       (void)Intrinsic;
944       assert(Intrinsic.getOpcode() == ISD::TargetConstant &&
945              Constant.getOpcode() == ISD::Constant &&
946              "Invalid instruction operand.");
947 
948       // Convert Constant to TargetConstant.
949       const ConstantInt *Val =
950           cast<ConstantSDNode>(Constant)->getConstantIntValue();
951       SDValue Imm =
952           CurDAG->getTargetConstant(*Val, DL, Constant.getValueType());
953 
954       SmallVector<SDValue, 4> Ops{Vec, Pointer, Imm, Chain};
955 
956       assert(Node->getNumValues() == 1);
957       assert(Node->getValueType(0) == MVT::Other);
958       SmallVector<EVT, 1> ResTys{Node->getValueType(0)};
959 
960       ReplaceNode(Node, CurDAG->getMachineNode(Op, DL, ResTys, Ops));
961       return true;
962     }
963     }
964     break;
965   }
966 
967   case MipsISD::FAbs: {
968     MVT ResTy = Node->getSimpleValueType(0);
969     assert((ResTy == MVT::f64 || ResTy == MVT::f32) &&
970            "Unsupported float type!");
971     unsigned Opc = 0;
972     if (ResTy == MVT::f64)
973       Opc = (Subtarget->isFP64bit() ? Mips::FABS_D64 : Mips::FABS_D32);
974     else
975       Opc = Mips::FABS_S;
976 
977     if (Subtarget->inMicroMipsMode()) {
978       switch (Opc) {
979       case Mips::FABS_D64:
980         Opc = Mips::FABS_D64_MM;
981         break;
982       case Mips::FABS_D32:
983         Opc = Mips::FABS_D32_MM;
984         break;
985       case Mips::FABS_S:
986         Opc = Mips::FABS_S_MM;
987         break;
988       default:
989         llvm_unreachable("Unknown opcode for MIPS floating point abs!");
990       }
991     }
992 
993     ReplaceNode(Node,
994                 CurDAG->getMachineNode(Opc, DL, ResTy, Node->getOperand(0)));
995 
996     return true;
997   }
998 
999   // Manually match MipsISD::Ins nodes to get the correct instruction. It has
1000   // to be done in this fashion so that we respect the differences between
1001   // dins and dinsm, as the difference is that the size operand has the range
1002   // 0 < size <= 32 for dins while dinsm has the range 2 <= size <= 64 which
1003   // means SelectionDAGISel would have to test all the operands at once to
1004   // match the instruction.
1005   case MipsISD::Ins: {
1006 
1007     // Validating the node operands.
1008     if (Node->getValueType(0) != MVT::i32 && Node->getValueType(0) != MVT::i64)
1009       return false;
1010 
1011     if (Node->getNumOperands() != 4)
1012       return false;
1013 
1014     if (Node->getOperand(1)->getOpcode() != ISD::Constant ||
1015         Node->getOperand(2)->getOpcode() != ISD::Constant)
1016       return false;
1017 
1018     MVT ResTy = Node->getSimpleValueType(0);
1019     uint64_t Pos = Node->getConstantOperandVal(1);
1020     uint64_t Size = Node->getConstantOperandVal(2);
1021 
1022     // Size has to be >0 for 'ins', 'dins' and 'dinsu'.
1023     if (!Size)
1024       return false;
1025 
1026     if (Pos + Size > 64)
1027       return false;
1028 
1029     if (ResTy != MVT::i32 && ResTy != MVT::i64)
1030       return false;
1031 
1032     unsigned Opcode = 0;
1033     if (ResTy == MVT::i32) {
1034       if (Pos + Size <= 32)
1035         Opcode = Mips::INS;
1036     } else {
1037       if (Pos + Size <= 32)
1038         Opcode = Mips::DINS;
1039       else if (Pos < 32 && 1 < Size)
1040         Opcode = Mips::DINSM;
1041       else
1042         Opcode = Mips::DINSU;
1043     }
1044 
1045     if (Opcode) {
1046       SDValue Ops[4] = {
1047           Node->getOperand(0), CurDAG->getTargetConstant(Pos, DL, MVT::i32),
1048           CurDAG->getTargetConstant(Size, DL, MVT::i32), Node->getOperand(3)};
1049 
1050       ReplaceNode(Node, CurDAG->getMachineNode(Opcode, DL, ResTy, Ops));
1051       return true;
1052     }
1053 
1054     return false;
1055   }
1056 
1057   case MipsISD::ThreadPointer: {
1058     EVT PtrVT = getTargetLowering()->getPointerTy(CurDAG->getDataLayout());
1059     unsigned RdhwrOpc, DestReg;
1060 
1061     if (PtrVT == MVT::i32) {
1062       RdhwrOpc = Mips::RDHWR;
1063       DestReg = Mips::V1;
1064     } else {
1065       RdhwrOpc = Mips::RDHWR64;
1066       DestReg = Mips::V1_64;
1067     }
1068 
1069     SDNode *Rdhwr =
1070         CurDAG->getMachineNode(RdhwrOpc, DL, Node->getValueType(0), MVT::Glue,
1071                                CurDAG->getRegister(Mips::HWR29, MVT::i32),
1072                                CurDAG->getTargetConstant(0, DL, MVT::i32));
1073     SDValue Chain = CurDAG->getCopyToReg(CurDAG->getEntryNode(), DL, DestReg,
1074                                          SDValue(Rdhwr, 0), SDValue(Rdhwr, 1));
1075     SDValue ResNode = CurDAG->getCopyFromReg(Chain, DL, DestReg, PtrVT,
1076                                              Chain.getValue(1));
1077     ReplaceNode(Node, ResNode.getNode());
1078     return true;
1079   }
1080 
1081   case ISD::BUILD_VECTOR: {
1082     // Select appropriate ldi.[bhwd] instructions for constant splats of
1083     // 128-bit when MSA is enabled. Fixup any register class mismatches that
1084     // occur as a result.
1085     //
1086     // This allows the compiler to use a wider range of immediates than would
1087     // otherwise be allowed. If, for example, v4i32 could only use ldi.h then
1088     // it would not be possible to load { 0x01010101, 0x01010101, 0x01010101,
1089     // 0x01010101 } without using a constant pool. This would be sub-optimal
1090     // when // 'ldi.b wd, 1' is capable of producing that bit-pattern in the
1091     // same set/ of registers. Similarly, ldi.h isn't capable of producing {
1092     // 0x00000000, 0x00000001, 0x00000000, 0x00000001 } but 'ldi.d wd, 1' can.
1093 
1094     const MipsABIInfo &ABI =
1095         static_cast<const MipsTargetMachine &>(TM).getABI();
1096 
1097     BuildVectorSDNode *BVN = cast<BuildVectorSDNode>(Node);
1098     APInt SplatValue, SplatUndef;
1099     unsigned SplatBitSize;
1100     bool HasAnyUndefs;
1101     unsigned LdiOp;
1102     EVT ResVecTy = BVN->getValueType(0);
1103     EVT ViaVecTy;
1104 
1105     if (!Subtarget->hasMSA() || !BVN->getValueType(0).is128BitVector())
1106       return false;
1107 
1108     if (!BVN->isConstantSplat(SplatValue, SplatUndef, SplatBitSize,
1109                               HasAnyUndefs, 8,
1110                               !Subtarget->isLittle()))
1111       return false;
1112 
1113     switch (SplatBitSize) {
1114     default:
1115       return false;
1116     case 8:
1117       LdiOp = Mips::LDI_B;
1118       ViaVecTy = MVT::v16i8;
1119       break;
1120     case 16:
1121       LdiOp = Mips::LDI_H;
1122       ViaVecTy = MVT::v8i16;
1123       break;
1124     case 32:
1125       LdiOp = Mips::LDI_W;
1126       ViaVecTy = MVT::v4i32;
1127       break;
1128     case 64:
1129       LdiOp = Mips::LDI_D;
1130       ViaVecTy = MVT::v2i64;
1131       break;
1132     }
1133 
1134     SDNode *Res = nullptr;
1135 
1136     // If we have a signed 10 bit integer, we can splat it directly.
1137     //
1138     // If we have something bigger we can synthesize the value into a GPR and
1139     // splat from there.
1140     if (SplatValue.isSignedIntN(10)) {
1141       SDValue Imm = CurDAG->getTargetConstant(SplatValue, DL,
1142                                               ViaVecTy.getVectorElementType());
1143 
1144       Res = CurDAG->getMachineNode(LdiOp, DL, ViaVecTy, Imm);
1145     } else if (SplatValue.isSignedIntN(16) &&
1146                ((ABI.IsO32() && SplatBitSize < 64) ||
1147                 (ABI.IsN32() || ABI.IsN64()))) {
1148       // Only handle signed 16 bit values when the element size is GPR width.
1149       // MIPS64 can handle all the cases but MIPS32 would need to handle
1150       // negative cases specifically here. Instead, handle those cases as
1151       // 64bit values.
1152 
1153       bool Is32BitSplat = ABI.IsO32() || SplatBitSize < 64;
1154       const unsigned ADDiuOp = Is32BitSplat ? Mips::ADDiu : Mips::DADDiu;
1155       const MVT SplatMVT = Is32BitSplat ? MVT::i32 : MVT::i64;
1156       SDValue ZeroVal = CurDAG->getRegister(
1157           Is32BitSplat ? Mips::ZERO : Mips::ZERO_64, SplatMVT);
1158 
1159       const unsigned FILLOp =
1160           SplatBitSize == 16
1161               ? Mips::FILL_H
1162               : (SplatBitSize == 32 ? Mips::FILL_W
1163                                     : (SplatBitSize == 64 ? Mips::FILL_D : 0));
1164 
1165       assert(FILLOp != 0 && "Unknown FILL Op for splat synthesis!");
1166       assert((!ABI.IsO32() || (FILLOp != Mips::FILL_D)) &&
1167              "Attempting to use fill.d on MIPS32!");
1168 
1169       const unsigned Lo = SplatValue.getLoBits(16).getZExtValue();
1170       SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, SplatMVT);
1171 
1172       Res = CurDAG->getMachineNode(ADDiuOp, DL, SplatMVT, ZeroVal, LoVal);
1173       Res = CurDAG->getMachineNode(FILLOp, DL, ViaVecTy, SDValue(Res, 0));
1174 
1175     } else if (SplatValue.isSignedIntN(32) && SplatBitSize == 32) {
1176       // Only handle the cases where the splat size agrees with the size
1177       // of the SplatValue here.
1178       const unsigned Lo = SplatValue.getLoBits(16).getZExtValue();
1179       const unsigned Hi = SplatValue.lshr(16).getLoBits(16).getZExtValue();
1180       SDValue ZeroVal = CurDAG->getRegister(Mips::ZERO, MVT::i32);
1181 
1182       SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, MVT::i32);
1183       SDValue HiVal = CurDAG->getTargetConstant(Hi, DL, MVT::i32);
1184 
1185       if (Hi)
1186         Res = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HiVal);
1187 
1188       if (Lo)
1189         Res = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32,
1190                                      Hi ? SDValue(Res, 0) : ZeroVal, LoVal);
1191 
1192       assert((Hi || Lo) && "Zero case reached 32 bit case splat synthesis!");
1193       Res =
1194           CurDAG->getMachineNode(Mips::FILL_W, DL, MVT::v4i32, SDValue(Res, 0));
1195 
1196     } else if (SplatValue.isSignedIntN(32) && SplatBitSize == 64 &&
1197                (ABI.IsN32() || ABI.IsN64())) {
1198       // N32 and N64 can perform some tricks that O32 can't for signed 32 bit
1199       // integers due to having 64bit registers. lui will cause the necessary
1200       // zero/sign extension.
1201       const unsigned Lo = SplatValue.getLoBits(16).getZExtValue();
1202       const unsigned Hi = SplatValue.lshr(16).getLoBits(16).getZExtValue();
1203       SDValue ZeroVal = CurDAG->getRegister(Mips::ZERO, MVT::i32);
1204 
1205       SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, MVT::i32);
1206       SDValue HiVal = CurDAG->getTargetConstant(Hi, DL, MVT::i32);
1207 
1208       if (Hi)
1209         Res = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HiVal);
1210 
1211       if (Lo)
1212         Res = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32,
1213                                      Hi ? SDValue(Res, 0) : ZeroVal, LoVal);
1214 
1215       Res = CurDAG->getMachineNode(
1216               Mips::SUBREG_TO_REG, DL, MVT::i64,
1217               CurDAG->getTargetConstant(((Hi >> 15) & 0x1), DL, MVT::i64),
1218               SDValue(Res, 0),
1219               CurDAG->getTargetConstant(Mips::sub_32, DL, MVT::i64));
1220 
1221       Res =
1222           CurDAG->getMachineNode(Mips::FILL_D, DL, MVT::v2i64, SDValue(Res, 0));
1223 
1224     } else if (SplatValue.isSignedIntN(64)) {
1225       // If we have a 64 bit Splat value, we perform a similar sequence to the
1226       // above:
1227       //
1228       // MIPS32:                            MIPS64:
1229       //   lui $res, %highest(val)            lui $res, %highest(val)
1230       //   ori $res, $res, %higher(val)       ori $res, $res, %higher(val)
1231       //   lui $res2, %hi(val)                lui $res2, %hi(val)
1232       //   ori $res2, %res2, %lo(val)         ori $res2, %res2, %lo(val)
1233       //   $res3 = fill $res2                 dinsu $res, $res2, 0, 32
1234       //   $res4 = insert.w $res3[1], $res    fill.d $res
1235       //   splat.d $res4, 0
1236       //
1237       // The ability to use dinsu is guaranteed as MSA requires MIPSR5.
1238       // This saves having to materialize the value by shifts and ors.
1239       //
1240       // FIXME: Implement the preferred sequence for MIPS64R6:
1241       //
1242       // MIPS64R6:
1243       //   ori $res, $zero, %lo(val)
1244       //   daui $res, $res, %hi(val)
1245       //   dahi $res, $res, %higher(val)
1246       //   dati $res, $res, %highest(cal)
1247       //   fill.d $res
1248       //
1249 
1250       const unsigned Lo = SplatValue.getLoBits(16).getZExtValue();
1251       const unsigned Hi = SplatValue.lshr(16).getLoBits(16).getZExtValue();
1252       const unsigned Higher = SplatValue.lshr(32).getLoBits(16).getZExtValue();
1253       const unsigned Highest = SplatValue.lshr(48).getLoBits(16).getZExtValue();
1254 
1255       SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, MVT::i32);
1256       SDValue HiVal = CurDAG->getTargetConstant(Hi, DL, MVT::i32);
1257       SDValue HigherVal = CurDAG->getTargetConstant(Higher, DL, MVT::i32);
1258       SDValue HighestVal = CurDAG->getTargetConstant(Highest, DL, MVT::i32);
1259       SDValue ZeroVal = CurDAG->getRegister(Mips::ZERO, MVT::i32);
1260 
1261       // Independent of whether we're targeting MIPS64 or not, the basic
1262       // operations are the same. Also, directly use the $zero register if
1263       // the 16 bit chunk is zero.
1264       //
1265       // For optimization purposes we always synthesize the splat value as
1266       // an i32 value, then if we're targetting MIPS64, use SUBREG_TO_REG
1267       // just before combining the values with dinsu to produce an i64. This
1268       // enables SelectionDAG to aggressively share components of splat values
1269       // where possible.
1270       //
1271       // FIXME: This is the general constant synthesis problem. This code
1272       //        should be factored out into a class shared between all the
1273       //        classes that need it. Specifically, for a splat size of 64
1274       //        bits that's a negative number we can do better than LUi/ORi
1275       //        for the upper 32bits.
1276 
1277       if (Hi)
1278         Res = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HiVal);
1279 
1280       if (Lo)
1281         Res = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32,
1282                                      Hi ? SDValue(Res, 0) : ZeroVal, LoVal);
1283 
1284       SDNode *HiRes;
1285       if (Highest)
1286         HiRes = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HighestVal);
1287 
1288       if (Higher)
1289         HiRes = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32,
1290                                        Highest ? SDValue(HiRes, 0) : ZeroVal,
1291                                        HigherVal);
1292 
1293 
1294       if (ABI.IsO32()) {
1295         Res = CurDAG->getMachineNode(Mips::FILL_W, DL, MVT::v4i32,
1296                                      (Hi || Lo) ? SDValue(Res, 0) : ZeroVal);
1297 
1298         Res = CurDAG->getMachineNode(
1299             Mips::INSERT_W, DL, MVT::v4i32, SDValue(Res, 0),
1300             (Highest || Higher) ? SDValue(HiRes, 0) : ZeroVal,
1301             CurDAG->getTargetConstant(1, DL, MVT::i32));
1302 
1303         const TargetLowering *TLI = getTargetLowering();
1304         const TargetRegisterClass *RC =
1305             TLI->getRegClassFor(ViaVecTy.getSimpleVT());
1306 
1307         Res = CurDAG->getMachineNode(
1308             Mips::COPY_TO_REGCLASS, DL, ViaVecTy, SDValue(Res, 0),
1309             CurDAG->getTargetConstant(RC->getID(), DL, MVT::i32));
1310 
1311         Res = CurDAG->getMachineNode(
1312             Mips::SPLATI_D, DL, MVT::v2i64, SDValue(Res, 0),
1313             CurDAG->getTargetConstant(0, DL, MVT::i32));
1314       } else if (ABI.IsN64() || ABI.IsN32()) {
1315 
1316         SDValue Zero64Val = CurDAG->getRegister(Mips::ZERO_64, MVT::i64);
1317         const bool HiResNonZero = Highest || Higher;
1318         const bool ResNonZero = Hi || Lo;
1319 
1320         if (HiResNonZero)
1321           HiRes = CurDAG->getMachineNode(
1322               Mips::SUBREG_TO_REG, DL, MVT::i64,
1323               CurDAG->getTargetConstant(((Highest >> 15) & 0x1), DL, MVT::i64),
1324               SDValue(HiRes, 0),
1325               CurDAG->getTargetConstant(Mips::sub_32, DL, MVT::i64));
1326 
1327         if (ResNonZero)
1328           Res = CurDAG->getMachineNode(
1329               Mips::SUBREG_TO_REG, DL, MVT::i64,
1330               CurDAG->getTargetConstant(((Hi >> 15) & 0x1), DL, MVT::i64),
1331               SDValue(Res, 0),
1332               CurDAG->getTargetConstant(Mips::sub_32, DL, MVT::i64));
1333 
1334         // We have 3 cases:
1335         //   The HiRes is nonzero but Res is $zero  => dsll32 HiRes, 0
1336         //   The Res is nonzero but HiRes is $zero  => dinsu Res, $zero, 32, 32
1337         //   Both are non zero                      => dinsu Res, HiRes, 32, 32
1338         //
1339         // The obvious "missing" case is when both are zero, but that case is
1340         // handled by the ldi case.
1341         if (ResNonZero) {
1342           IntegerType *Int32Ty =
1343               IntegerType::get(MF->getFunction().getContext(), 32);
1344           const ConstantInt *Const32 = ConstantInt::get(Int32Ty, 32);
1345           SDValue Ops[4] = {HiResNonZero ? SDValue(HiRes, 0) : Zero64Val,
1346                             CurDAG->getConstant(*Const32, DL, MVT::i32),
1347                             CurDAG->getConstant(*Const32, DL, MVT::i32),
1348                             SDValue(Res, 0)};
1349 
1350           Res = CurDAG->getMachineNode(Mips::DINSU, DL, MVT::i64, Ops);
1351         } else if (HiResNonZero) {
1352           Res = CurDAG->getMachineNode(
1353               Mips::DSLL32, DL, MVT::i64, SDValue(HiRes, 0),
1354               CurDAG->getTargetConstant(0, DL, MVT::i32));
1355         } else
1356           llvm_unreachable(
1357               "Zero splat value handled by non-zero 64bit splat synthesis!");
1358 
1359         Res = CurDAG->getMachineNode(Mips::FILL_D, DL, MVT::v2i64,
1360                                      SDValue(Res, 0));
1361       } else
1362         llvm_unreachable("Unknown ABI in MipsISelDAGToDAG!");
1363 
1364     } else
1365       return false;
1366 
1367     if (ResVecTy != ViaVecTy) {
1368       // If LdiOp is writing to a different register class to ResVecTy, then
1369       // fix it up here. This COPY_TO_REGCLASS should never cause a move.v
1370       // since the source and destination register sets contain the same
1371       // registers.
1372       const TargetLowering *TLI = getTargetLowering();
1373       MVT ResVecTySimple = ResVecTy.getSimpleVT();
1374       const TargetRegisterClass *RC = TLI->getRegClassFor(ResVecTySimple);
1375       Res = CurDAG->getMachineNode(Mips::COPY_TO_REGCLASS, DL,
1376                                    ResVecTy, SDValue(Res, 0),
1377                                    CurDAG->getTargetConstant(RC->getID(), DL,
1378                                                              MVT::i32));
1379     }
1380 
1381     ReplaceNode(Node, Res);
1382     return true;
1383   }
1384 
1385   }
1386 
1387   return false;
1388 }
1389 
SelectInlineAsmMemoryOperand(const SDValue & Op,InlineAsm::ConstraintCode ConstraintID,std::vector<SDValue> & OutOps)1390 bool MipsSEDAGToDAGISel::SelectInlineAsmMemoryOperand(
1391     const SDValue &Op, InlineAsm::ConstraintCode ConstraintID,
1392     std::vector<SDValue> &OutOps) {
1393   SDValue Base, Offset;
1394 
1395   switch(ConstraintID) {
1396   default:
1397     llvm_unreachable("Unexpected asm memory constraint");
1398   // All memory constraints can at least accept raw pointers.
1399   case InlineAsm::ConstraintCode::m:
1400   case InlineAsm::ConstraintCode::o:
1401     if (selectAddrRegImm16(Op, Base, Offset)) {
1402       OutOps.push_back(Base);
1403       OutOps.push_back(Offset);
1404       return false;
1405     }
1406     OutOps.push_back(Op);
1407     OutOps.push_back(CurDAG->getTargetConstant(0, SDLoc(Op), MVT::i32));
1408     return false;
1409   case InlineAsm::ConstraintCode::R:
1410     // The 'R' constraint is supposed to be much more complicated than this.
1411     // However, it's becoming less useful due to architectural changes and
1412     // ought to be replaced by other constraints such as 'ZC'.
1413     // For now, support 9-bit signed offsets which is supportable by all
1414     // subtargets for all instructions.
1415     if (selectAddrRegImm9(Op, Base, Offset)) {
1416       OutOps.push_back(Base);
1417       OutOps.push_back(Offset);
1418       return false;
1419     }
1420     OutOps.push_back(Op);
1421     OutOps.push_back(CurDAG->getTargetConstant(0, SDLoc(Op), MVT::i32));
1422     return false;
1423   case InlineAsm::ConstraintCode::ZC:
1424     // ZC matches whatever the pref, ll, and sc instructions can handle for the
1425     // given subtarget.
1426     if (Subtarget->inMicroMipsMode()) {
1427       // On microMIPS, they can handle 12-bit offsets.
1428       if (selectAddrRegImm12(Op, Base, Offset)) {
1429         OutOps.push_back(Base);
1430         OutOps.push_back(Offset);
1431         return false;
1432       }
1433     } else if (Subtarget->hasMips32r6()) {
1434       // On MIPS32r6/MIPS64r6, they can only handle 9-bit offsets.
1435       if (selectAddrRegImm9(Op, Base, Offset)) {
1436         OutOps.push_back(Base);
1437         OutOps.push_back(Offset);
1438         return false;
1439       }
1440     } else if (selectAddrRegImm16(Op, Base, Offset)) {
1441       // Prior to MIPS32r6/MIPS64r6, they can handle 16-bit offsets.
1442       OutOps.push_back(Base);
1443       OutOps.push_back(Offset);
1444       return false;
1445     }
1446     // In all cases, 0-bit offsets are acceptable.
1447     OutOps.push_back(Op);
1448     OutOps.push_back(CurDAG->getTargetConstant(0, SDLoc(Op), MVT::i32));
1449     return false;
1450   }
1451   return true;
1452 }
1453 
MipsSEDAGToDAGISelLegacy(MipsTargetMachine & TM,CodeGenOptLevel OL)1454 MipsSEDAGToDAGISelLegacy::MipsSEDAGToDAGISelLegacy(MipsTargetMachine &TM,
1455                                                    CodeGenOptLevel OL)
1456     : MipsDAGToDAGISelLegacy(std::make_unique<MipsSEDAGToDAGISel>(TM, OL)) {}
1457 
createMipsSEISelDag(MipsTargetMachine & TM,CodeGenOptLevel OptLevel)1458 FunctionPass *llvm::createMipsSEISelDag(MipsTargetMachine &TM,
1459                                         CodeGenOptLevel OptLevel) {
1460   return new MipsSEDAGToDAGISelLegacy(TM, OptLevel);
1461 }
1462