1 //===-- MipsSEISelDAGToDAG.cpp - A Dag to Dag Inst Selector for MipsSE ----===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // Subclass of MipsDAGToDAGISel specialized for mips32/64.
10 //
11 //===----------------------------------------------------------------------===//
12
13 #include "MipsSEISelDAGToDAG.h"
14 #include "MCTargetDesc/MipsBaseInfo.h"
15 #include "Mips.h"
16 #include "MipsAnalyzeImmediate.h"
17 #include "MipsMachineFunction.h"
18 #include "MipsRegisterInfo.h"
19 #include "llvm/CodeGen/MachineConstantPool.h"
20 #include "llvm/CodeGen/MachineFrameInfo.h"
21 #include "llvm/CodeGen/MachineFunction.h"
22 #include "llvm/CodeGen/MachineInstrBuilder.h"
23 #include "llvm/CodeGen/MachineRegisterInfo.h"
24 #include "llvm/CodeGen/SelectionDAGNodes.h"
25 #include "llvm/IR/CFG.h"
26 #include "llvm/IR/Dominators.h"
27 #include "llvm/IR/GlobalValue.h"
28 #include "llvm/IR/Instructions.h"
29 #include "llvm/IR/Intrinsics.h"
30 #include "llvm/IR/IntrinsicsMips.h"
31 #include "llvm/IR/Type.h"
32 #include "llvm/Support/Debug.h"
33 #include "llvm/Support/ErrorHandling.h"
34 #include "llvm/Support/raw_ostream.h"
35 #include "llvm/Target/TargetMachine.h"
36 using namespace llvm;
37
38 #define DEBUG_TYPE "mips-isel"
39
runOnMachineFunction(MachineFunction & MF)40 bool MipsSEDAGToDAGISel::runOnMachineFunction(MachineFunction &MF) {
41 Subtarget = &MF.getSubtarget<MipsSubtarget>();
42 if (Subtarget->inMips16Mode())
43 return false;
44 return MipsDAGToDAGISel::runOnMachineFunction(MF);
45 }
46
getAnalysisUsage(AnalysisUsage & AU) const47 void MipsSEDAGToDAGISelLegacy::getAnalysisUsage(AnalysisUsage &AU) const {
48 AU.addRequired<DominatorTreeWrapperPass>();
49 SelectionDAGISelLegacy::getAnalysisUsage(AU);
50 }
51
addDSPCtrlRegOperands(bool IsDef,MachineInstr & MI,MachineFunction & MF)52 void MipsSEDAGToDAGISel::addDSPCtrlRegOperands(bool IsDef, MachineInstr &MI,
53 MachineFunction &MF) {
54 MachineInstrBuilder MIB(MF, &MI);
55 unsigned Mask = MI.getOperand(1).getImm();
56 unsigned Flag =
57 IsDef ? RegState::ImplicitDefine : RegState::Implicit | RegState::Undef;
58
59 if (Mask & 1)
60 MIB.addReg(Mips::DSPPos, Flag);
61
62 if (Mask & 2)
63 MIB.addReg(Mips::DSPSCount, Flag);
64
65 if (Mask & 4)
66 MIB.addReg(Mips::DSPCarry, Flag);
67
68 if (Mask & 8)
69 MIB.addReg(Mips::DSPOutFlag, Flag);
70
71 if (Mask & 16)
72 MIB.addReg(Mips::DSPCCond, Flag);
73
74 if (Mask & 32)
75 MIB.addReg(Mips::DSPEFI, Flag);
76 }
77
getMSACtrlReg(const SDValue RegIdx) const78 unsigned MipsSEDAGToDAGISel::getMSACtrlReg(const SDValue RegIdx) const {
79 uint64_t RegNum = RegIdx->getAsZExtVal();
80 return Mips::MSACtrlRegClass.getRegister(RegNum);
81 }
82
replaceUsesWithZeroReg(MachineRegisterInfo * MRI,const MachineInstr & MI)83 bool MipsSEDAGToDAGISel::replaceUsesWithZeroReg(MachineRegisterInfo *MRI,
84 const MachineInstr& MI) {
85 unsigned DstReg = 0, ZeroReg = 0;
86
87 // Check if MI is "addiu $dst, $zero, 0" or "daddiu $dst, $zero, 0".
88 if ((MI.getOpcode() == Mips::ADDiu) &&
89 (MI.getOperand(1).getReg() == Mips::ZERO) &&
90 (MI.getOperand(2).isImm()) &&
91 (MI.getOperand(2).getImm() == 0)) {
92 DstReg = MI.getOperand(0).getReg();
93 ZeroReg = Mips::ZERO;
94 } else if ((MI.getOpcode() == Mips::DADDiu) &&
95 (MI.getOperand(1).getReg() == Mips::ZERO_64) &&
96 (MI.getOperand(2).isImm()) &&
97 (MI.getOperand(2).getImm() == 0)) {
98 DstReg = MI.getOperand(0).getReg();
99 ZeroReg = Mips::ZERO_64;
100 }
101
102 if (!DstReg)
103 return false;
104
105 // Replace uses with ZeroReg.
106 for (MachineRegisterInfo::use_iterator U = MRI->use_begin(DstReg),
107 E = MRI->use_end(); U != E;) {
108 MachineOperand &MO = *U;
109 unsigned OpNo = U.getOperandNo();
110 MachineInstr *MI = MO.getParent();
111 ++U;
112
113 // Do not replace if it is a phi's operand or is tied to def operand.
114 if (MI->isPHI() || MI->isRegTiedToDefOperand(OpNo) || MI->isPseudo())
115 continue;
116
117 // Also, we have to check that the register class of the operand
118 // contains the zero register.
119 if (!MRI->getRegClass(MO.getReg())->contains(ZeroReg))
120 continue;
121
122 MO.setReg(ZeroReg);
123 }
124
125 return true;
126 }
127
emitMCountABI(MachineInstr & MI,MachineBasicBlock & MBB,MachineFunction & MF)128 void MipsSEDAGToDAGISel::emitMCountABI(MachineInstr &MI, MachineBasicBlock &MBB,
129 MachineFunction &MF) {
130 MachineInstrBuilder MIB(MF, &MI);
131 if (!Subtarget->isABI_O32()) { // N32, N64
132 // Save current return address.
133 BuildMI(MBB, &MI, MI.getDebugLoc(), TII->get(Mips::OR64))
134 .addDef(Mips::AT_64)
135 .addUse(Mips::RA_64, RegState::Undef)
136 .addUse(Mips::ZERO_64);
137 // Stops instruction above from being removed later on.
138 MIB.addUse(Mips::AT_64, RegState::Implicit);
139 } else { // O32
140 // Save current return address.
141 BuildMI(MBB, &MI, MI.getDebugLoc(), TII->get(Mips::OR))
142 .addDef(Mips::AT)
143 .addUse(Mips::RA, RegState::Undef)
144 .addUse(Mips::ZERO);
145 // _mcount pops 2 words from stack.
146 BuildMI(MBB, &MI, MI.getDebugLoc(), TII->get(Mips::ADDiu))
147 .addDef(Mips::SP)
148 .addUse(Mips::SP)
149 .addImm(-8);
150 // Stops first instruction above from being removed later on.
151 MIB.addUse(Mips::AT, RegState::Implicit);
152 }
153 }
154
processFunctionAfterISel(MachineFunction & MF)155 void MipsSEDAGToDAGISel::processFunctionAfterISel(MachineFunction &MF) {
156 MF.getInfo<MipsFunctionInfo>()->initGlobalBaseReg(MF);
157
158 MachineRegisterInfo *MRI = &MF.getRegInfo();
159
160 for (auto &MBB: MF) {
161 for (auto &MI: MBB) {
162 switch (MI.getOpcode()) {
163 case Mips::RDDSP:
164 addDSPCtrlRegOperands(false, MI, MF);
165 break;
166 case Mips::WRDSP:
167 addDSPCtrlRegOperands(true, MI, MF);
168 break;
169 case Mips::BuildPairF64_64:
170 case Mips::ExtractElementF64_64:
171 if (!Subtarget->useOddSPReg()) {
172 MI.addOperand(MachineOperand::CreateReg(Mips::SP, false, true));
173 break;
174 }
175 [[fallthrough]];
176 case Mips::BuildPairF64:
177 case Mips::ExtractElementF64:
178 if (Subtarget->isABI_FPXX() && !Subtarget->hasMTHC1())
179 MI.addOperand(MachineOperand::CreateReg(Mips::SP, false, true));
180 break;
181 case Mips::JAL:
182 case Mips::JAL_MM:
183 if (MI.getOperand(0).isGlobal() &&
184 MI.getOperand(0).getGlobal()->getGlobalIdentifier() == "_mcount")
185 emitMCountABI(MI, MBB, MF);
186 break;
187 case Mips::JALRPseudo:
188 case Mips::JALR64Pseudo:
189 case Mips::JALR16_MM:
190 if (MI.getOperand(2).isMCSymbol() &&
191 MI.getOperand(2).getMCSymbol()->getName() == "_mcount")
192 emitMCountABI(MI, MBB, MF);
193 break;
194 case Mips::JALR:
195 if (MI.getOperand(3).isMCSymbol() &&
196 MI.getOperand(3).getMCSymbol()->getName() == "_mcount")
197 emitMCountABI(MI, MBB, MF);
198 break;
199 default:
200 replaceUsesWithZeroReg(MRI, MI);
201 }
202 }
203 }
204 }
205
selectAddE(SDNode * Node,const SDLoc & DL) const206 void MipsSEDAGToDAGISel::selectAddE(SDNode *Node, const SDLoc &DL) const {
207 SDValue InGlue = Node->getOperand(2);
208 unsigned Opc = InGlue.getOpcode();
209 SDValue LHS = Node->getOperand(0), RHS = Node->getOperand(1);
210 EVT VT = LHS.getValueType();
211
212 // In the base case, we can rely on the carry bit from the addsc
213 // instruction.
214 if (Opc == ISD::ADDC) {
215 SDValue Ops[3] = {LHS, RHS, InGlue};
216 CurDAG->SelectNodeTo(Node, Mips::ADDWC, VT, MVT::Glue, Ops);
217 return;
218 }
219
220 assert(Opc == ISD::ADDE && "ISD::ADDE not in a chain of ADDE nodes!");
221
222 // The more complex case is when there is a chain of ISD::ADDE nodes like:
223 // (adde (adde (adde (addc a b) c) d) e).
224 //
225 // The addwc instruction does not write to the carry bit, instead it writes
226 // to bit 20 of the dsp control register. To match this series of nodes, each
227 // intermediate adde node must be expanded to write the carry bit before the
228 // addition.
229
230 // Start by reading the overflow field for addsc and moving the value to the
231 // carry field. The usage of 1 here with MipsISD::RDDSP / Mips::WRDSP
232 // corresponds to reading/writing the entire control register to/from a GPR.
233
234 SDValue CstOne = CurDAG->getTargetConstant(1, DL, MVT::i32);
235
236 SDValue OuFlag = CurDAG->getTargetConstant(20, DL, MVT::i32);
237
238 SDNode *DSPCtrlField = CurDAG->getMachineNode(Mips::RDDSP, DL, MVT::i32,
239 MVT::Glue, CstOne, InGlue);
240
241 SDNode *Carry = CurDAG->getMachineNode(
242 Mips::EXT, DL, MVT::i32, SDValue(DSPCtrlField, 0), OuFlag, CstOne);
243
244 SDValue Ops[4] = {SDValue(DSPCtrlField, 0),
245 CurDAG->getTargetConstant(6, DL, MVT::i32), CstOne,
246 SDValue(Carry, 0)};
247 SDNode *DSPCFWithCarry = CurDAG->getMachineNode(Mips::INS, DL, MVT::i32, Ops);
248
249 // My reading of the MIPS DSP 3.01 specification isn't as clear as I
250 // would like about whether bit 20 always gets overwritten by addwc.
251 // Hence take an extremely conservative view and presume it's sticky. We
252 // therefore need to clear it.
253
254 SDValue Zero = CurDAG->getRegister(Mips::ZERO, MVT::i32);
255
256 SDValue InsOps[4] = {Zero, OuFlag, CstOne, SDValue(DSPCFWithCarry, 0)};
257 SDNode *DSPCtrlFinal =
258 CurDAG->getMachineNode(Mips::INS, DL, MVT::i32, InsOps);
259
260 SDNode *WrDSP = CurDAG->getMachineNode(Mips::WRDSP, DL, MVT::Glue,
261 SDValue(DSPCtrlFinal, 0), CstOne);
262
263 SDValue Operands[3] = {LHS, RHS, SDValue(WrDSP, 0)};
264 CurDAG->SelectNodeTo(Node, Mips::ADDWC, VT, MVT::Glue, Operands);
265 }
266
267 /// Match frameindex
selectAddrFrameIndex(SDValue Addr,SDValue & Base,SDValue & Offset) const268 bool MipsSEDAGToDAGISel::selectAddrFrameIndex(SDValue Addr, SDValue &Base,
269 SDValue &Offset) const {
270 if (FrameIndexSDNode *FIN = dyn_cast<FrameIndexSDNode>(Addr)) {
271 EVT ValTy = Addr.getValueType();
272
273 Base = CurDAG->getTargetFrameIndex(FIN->getIndex(), ValTy);
274 Offset = CurDAG->getTargetConstant(0, SDLoc(Addr), ValTy);
275 return true;
276 }
277 return false;
278 }
279
280 /// Match frameindex+offset and frameindex|offset
selectAddrFrameIndexOffset(SDValue Addr,SDValue & Base,SDValue & Offset,unsigned OffsetBits,unsigned ShiftAmount=0) const281 bool MipsSEDAGToDAGISel::selectAddrFrameIndexOffset(
282 SDValue Addr, SDValue &Base, SDValue &Offset, unsigned OffsetBits,
283 unsigned ShiftAmount = 0) const {
284 if (CurDAG->isBaseWithConstantOffset(Addr)) {
285 auto *CN = cast<ConstantSDNode>(Addr.getOperand(1));
286 if (isIntN(OffsetBits + ShiftAmount, CN->getSExtValue())) {
287 EVT ValTy = Addr.getValueType();
288
289 // If the first operand is a FI, get the TargetFI Node
290 if (FrameIndexSDNode *FIN =
291 dyn_cast<FrameIndexSDNode>(Addr.getOperand(0)))
292 Base = CurDAG->getTargetFrameIndex(FIN->getIndex(), ValTy);
293 else {
294 Base = Addr.getOperand(0);
295 // If base is a FI, additional offset calculation is done in
296 // eliminateFrameIndex, otherwise we need to check the alignment
297 const Align Alignment(1ULL << ShiftAmount);
298 if (!isAligned(Alignment, CN->getZExtValue()))
299 return false;
300 }
301
302 Offset = CurDAG->getTargetConstant(CN->getZExtValue(), SDLoc(Addr),
303 ValTy);
304 return true;
305 }
306 }
307 return false;
308 }
309
310 /// ComplexPattern used on MipsInstrInfo
311 /// Used on Mips Load/Store instructions
selectAddrRegImm(SDValue Addr,SDValue & Base,SDValue & Offset) const312 bool MipsSEDAGToDAGISel::selectAddrRegImm(SDValue Addr, SDValue &Base,
313 SDValue &Offset) const {
314 // if Address is FI, get the TargetFrameIndex.
315 if (selectAddrFrameIndex(Addr, Base, Offset))
316 return true;
317
318 // on PIC code Load GA
319 if (Addr.getOpcode() == MipsISD::Wrapper) {
320 Base = Addr.getOperand(0);
321 Offset = Addr.getOperand(1);
322 return true;
323 }
324
325 if (!TM.isPositionIndependent()) {
326 if ((Addr.getOpcode() == ISD::TargetExternalSymbol ||
327 Addr.getOpcode() == ISD::TargetGlobalAddress))
328 return false;
329 }
330
331 // Addresses of the form FI+const or FI|const
332 if (selectAddrFrameIndexOffset(Addr, Base, Offset, 16))
333 return true;
334
335 // Operand is a result from an ADD.
336 if (Addr.getOpcode() == ISD::ADD) {
337 // When loading from constant pools, load the lower address part in
338 // the instruction itself. Example, instead of:
339 // lui $2, %hi($CPI1_0)
340 // addiu $2, $2, %lo($CPI1_0)
341 // lwc1 $f0, 0($2)
342 // Generate:
343 // lui $2, %hi($CPI1_0)
344 // lwc1 $f0, %lo($CPI1_0)($2)
345 if (Addr.getOperand(1).getOpcode() == MipsISD::Lo ||
346 Addr.getOperand(1).getOpcode() == MipsISD::GPRel) {
347 SDValue Opnd0 = Addr.getOperand(1).getOperand(0);
348 if (isa<ConstantPoolSDNode>(Opnd0) || isa<GlobalAddressSDNode>(Opnd0) ||
349 isa<JumpTableSDNode>(Opnd0)) {
350 Base = Addr.getOperand(0);
351 Offset = Opnd0;
352 return true;
353 }
354 }
355 }
356
357 return false;
358 }
359
360 /// ComplexPattern used on MipsInstrInfo
361 /// Used on Mips Load/Store instructions
selectAddrDefault(SDValue Addr,SDValue & Base,SDValue & Offset) const362 bool MipsSEDAGToDAGISel::selectAddrDefault(SDValue Addr, SDValue &Base,
363 SDValue &Offset) const {
364 Base = Addr;
365 Offset = CurDAG->getTargetConstant(0, SDLoc(Addr), Addr.getValueType());
366 return true;
367 }
368
selectIntAddr(SDValue Addr,SDValue & Base,SDValue & Offset) const369 bool MipsSEDAGToDAGISel::selectIntAddr(SDValue Addr, SDValue &Base,
370 SDValue &Offset) const {
371 return selectAddrRegImm(Addr, Base, Offset) ||
372 selectAddrDefault(Addr, Base, Offset);
373 }
374
selectAddrRegImm9(SDValue Addr,SDValue & Base,SDValue & Offset) const375 bool MipsSEDAGToDAGISel::selectAddrRegImm9(SDValue Addr, SDValue &Base,
376 SDValue &Offset) const {
377 if (selectAddrFrameIndex(Addr, Base, Offset))
378 return true;
379
380 if (selectAddrFrameIndexOffset(Addr, Base, Offset, 9))
381 return true;
382
383 return false;
384 }
385
386 /// Used on microMIPS LWC2, LDC2, SWC2 and SDC2 instructions (11-bit offset)
selectAddrRegImm11(SDValue Addr,SDValue & Base,SDValue & Offset) const387 bool MipsSEDAGToDAGISel::selectAddrRegImm11(SDValue Addr, SDValue &Base,
388 SDValue &Offset) const {
389 if (selectAddrFrameIndex(Addr, Base, Offset))
390 return true;
391
392 if (selectAddrFrameIndexOffset(Addr, Base, Offset, 11))
393 return true;
394
395 return false;
396 }
397
398 /// Used on microMIPS Load/Store unaligned instructions (12-bit offset)
selectAddrRegImm12(SDValue Addr,SDValue & Base,SDValue & Offset) const399 bool MipsSEDAGToDAGISel::selectAddrRegImm12(SDValue Addr, SDValue &Base,
400 SDValue &Offset) const {
401 if (selectAddrFrameIndex(Addr, Base, Offset))
402 return true;
403
404 if (selectAddrFrameIndexOffset(Addr, Base, Offset, 12))
405 return true;
406
407 return false;
408 }
409
selectAddrRegImm16(SDValue Addr,SDValue & Base,SDValue & Offset) const410 bool MipsSEDAGToDAGISel::selectAddrRegImm16(SDValue Addr, SDValue &Base,
411 SDValue &Offset) const {
412 if (selectAddrFrameIndex(Addr, Base, Offset))
413 return true;
414
415 if (selectAddrFrameIndexOffset(Addr, Base, Offset, 16))
416 return true;
417
418 return false;
419 }
420
selectIntAddr11MM(SDValue Addr,SDValue & Base,SDValue & Offset) const421 bool MipsSEDAGToDAGISel::selectIntAddr11MM(SDValue Addr, SDValue &Base,
422 SDValue &Offset) const {
423 return selectAddrRegImm11(Addr, Base, Offset) ||
424 selectAddrDefault(Addr, Base, Offset);
425 }
426
selectIntAddr12MM(SDValue Addr,SDValue & Base,SDValue & Offset) const427 bool MipsSEDAGToDAGISel::selectIntAddr12MM(SDValue Addr, SDValue &Base,
428 SDValue &Offset) const {
429 return selectAddrRegImm12(Addr, Base, Offset) ||
430 selectAddrDefault(Addr, Base, Offset);
431 }
432
selectIntAddr16MM(SDValue Addr,SDValue & Base,SDValue & Offset) const433 bool MipsSEDAGToDAGISel::selectIntAddr16MM(SDValue Addr, SDValue &Base,
434 SDValue &Offset) const {
435 return selectAddrRegImm16(Addr, Base, Offset) ||
436 selectAddrDefault(Addr, Base, Offset);
437 }
438
selectIntAddrLSL2MM(SDValue Addr,SDValue & Base,SDValue & Offset) const439 bool MipsSEDAGToDAGISel::selectIntAddrLSL2MM(SDValue Addr, SDValue &Base,
440 SDValue &Offset) const {
441 if (selectAddrFrameIndexOffset(Addr, Base, Offset, 7)) {
442 if (isa<FrameIndexSDNode>(Base))
443 return false;
444
445 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(Offset)) {
446 unsigned CnstOff = CN->getZExtValue();
447 return (CnstOff == (CnstOff & 0x3c));
448 }
449
450 return false;
451 }
452
453 // For all other cases where "lw" would be selected, don't select "lw16"
454 // because it would result in additional instructions to prepare operands.
455 if (selectAddrRegImm(Addr, Base, Offset))
456 return false;
457
458 return selectAddrDefault(Addr, Base, Offset);
459 }
460
selectIntAddrSImm10(SDValue Addr,SDValue & Base,SDValue & Offset) const461 bool MipsSEDAGToDAGISel::selectIntAddrSImm10(SDValue Addr, SDValue &Base,
462 SDValue &Offset) const {
463
464 if (selectAddrFrameIndex(Addr, Base, Offset))
465 return true;
466
467 if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10))
468 return true;
469
470 return selectAddrDefault(Addr, Base, Offset);
471 }
472
selectIntAddrSImm10Lsl1(SDValue Addr,SDValue & Base,SDValue & Offset) const473 bool MipsSEDAGToDAGISel::selectIntAddrSImm10Lsl1(SDValue Addr, SDValue &Base,
474 SDValue &Offset) const {
475 if (selectAddrFrameIndex(Addr, Base, Offset))
476 return true;
477
478 if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10, 1))
479 return true;
480
481 return selectAddrDefault(Addr, Base, Offset);
482 }
483
selectIntAddrSImm10Lsl2(SDValue Addr,SDValue & Base,SDValue & Offset) const484 bool MipsSEDAGToDAGISel::selectIntAddrSImm10Lsl2(SDValue Addr, SDValue &Base,
485 SDValue &Offset) const {
486 if (selectAddrFrameIndex(Addr, Base, Offset))
487 return true;
488
489 if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10, 2))
490 return true;
491
492 return selectAddrDefault(Addr, Base, Offset);
493 }
494
selectIntAddrSImm10Lsl3(SDValue Addr,SDValue & Base,SDValue & Offset) const495 bool MipsSEDAGToDAGISel::selectIntAddrSImm10Lsl3(SDValue Addr, SDValue &Base,
496 SDValue &Offset) const {
497 if (selectAddrFrameIndex(Addr, Base, Offset))
498 return true;
499
500 if (selectAddrFrameIndexOffset(Addr, Base, Offset, 10, 3))
501 return true;
502
503 return selectAddrDefault(Addr, Base, Offset);
504 }
505
506 // Select constant vector splats.
507 //
508 // Returns true and sets Imm if:
509 // * MSA is enabled
510 // * N is a ISD::BUILD_VECTOR representing a constant splat
selectVSplat(SDNode * N,APInt & Imm,unsigned MinSizeInBits) const511 bool MipsSEDAGToDAGISel::selectVSplat(SDNode *N, APInt &Imm,
512 unsigned MinSizeInBits) const {
513 if (!Subtarget->hasMSA())
514 return false;
515
516 BuildVectorSDNode *Node = dyn_cast<BuildVectorSDNode>(N);
517
518 if (!Node)
519 return false;
520
521 APInt SplatValue, SplatUndef;
522 unsigned SplatBitSize;
523 bool HasAnyUndefs;
524
525 if (!Node->isConstantSplat(SplatValue, SplatUndef, SplatBitSize, HasAnyUndefs,
526 MinSizeInBits, !Subtarget->isLittle()))
527 return false;
528
529 Imm = SplatValue;
530
531 return true;
532 }
533
534 // Select constant vector splats.
535 //
536 // In addition to the requirements of selectVSplat(), this function returns
537 // true and sets Imm if:
538 // * The splat value is the same width as the elements of the vector
539 // * The splat value fits in an integer with the specified signed-ness and
540 // width.
541 //
542 // This function looks through ISD::BITCAST nodes.
543 // TODO: This might not be appropriate for big-endian MSA since BITCAST is
544 // sometimes a shuffle in big-endian mode.
545 //
546 // It's worth noting that this function is not used as part of the selection
547 // of ldi.[bhwd] since it does not permit using the wrong-typed ldi.[bhwd]
548 // instruction to achieve the desired bit pattern. ldi.[bhwd] is selected in
549 // MipsSEDAGToDAGISel::selectNode.
550 bool MipsSEDAGToDAGISel::
selectVSplatCommon(SDValue N,SDValue & Imm,bool Signed,unsigned ImmBitSize) const551 selectVSplatCommon(SDValue N, SDValue &Imm, bool Signed,
552 unsigned ImmBitSize) const {
553 APInt ImmValue;
554 EVT EltTy = N->getValueType(0).getVectorElementType();
555
556 if (N->getOpcode() == ISD::BITCAST)
557 N = N->getOperand(0);
558
559 if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
560 ImmValue.getBitWidth() == EltTy.getSizeInBits()) {
561
562 if (( Signed && ImmValue.isSignedIntN(ImmBitSize)) ||
563 (!Signed && ImmValue.isIntN(ImmBitSize))) {
564 Imm = CurDAG->getTargetConstant(ImmValue, SDLoc(N), EltTy);
565 return true;
566 }
567 }
568
569 return false;
570 }
571
572 // Select constant vector splats.
573 bool MipsSEDAGToDAGISel::
selectVSplatUimm1(SDValue N,SDValue & Imm) const574 selectVSplatUimm1(SDValue N, SDValue &Imm) const {
575 return selectVSplatCommon(N, Imm, false, 1);
576 }
577
578 bool MipsSEDAGToDAGISel::
selectVSplatUimm2(SDValue N,SDValue & Imm) const579 selectVSplatUimm2(SDValue N, SDValue &Imm) const {
580 return selectVSplatCommon(N, Imm, false, 2);
581 }
582
583 bool MipsSEDAGToDAGISel::
selectVSplatUimm3(SDValue N,SDValue & Imm) const584 selectVSplatUimm3(SDValue N, SDValue &Imm) const {
585 return selectVSplatCommon(N, Imm, false, 3);
586 }
587
588 // Select constant vector splats.
589 bool MipsSEDAGToDAGISel::
selectVSplatUimm4(SDValue N,SDValue & Imm) const590 selectVSplatUimm4(SDValue N, SDValue &Imm) const {
591 return selectVSplatCommon(N, Imm, false, 4);
592 }
593
594 // Select constant vector splats.
595 bool MipsSEDAGToDAGISel::
selectVSplatUimm5(SDValue N,SDValue & Imm) const596 selectVSplatUimm5(SDValue N, SDValue &Imm) const {
597 return selectVSplatCommon(N, Imm, false, 5);
598 }
599
600 // Select constant vector splats.
601 bool MipsSEDAGToDAGISel::
selectVSplatUimm6(SDValue N,SDValue & Imm) const602 selectVSplatUimm6(SDValue N, SDValue &Imm) const {
603 return selectVSplatCommon(N, Imm, false, 6);
604 }
605
606 // Select constant vector splats.
607 bool MipsSEDAGToDAGISel::
selectVSplatUimm8(SDValue N,SDValue & Imm) const608 selectVSplatUimm8(SDValue N, SDValue &Imm) const {
609 return selectVSplatCommon(N, Imm, false, 8);
610 }
611
612 // Select constant vector splats.
613 bool MipsSEDAGToDAGISel::
selectVSplatSimm5(SDValue N,SDValue & Imm) const614 selectVSplatSimm5(SDValue N, SDValue &Imm) const {
615 return selectVSplatCommon(N, Imm, true, 5);
616 }
617
618 // Select constant vector splats whose value is a power of 2.
619 //
620 // In addition to the requirements of selectVSplat(), this function returns
621 // true and sets Imm if:
622 // * The splat value is the same width as the elements of the vector
623 // * The splat value is a power of two.
624 //
625 // This function looks through ISD::BITCAST nodes.
626 // TODO: This might not be appropriate for big-endian MSA since BITCAST is
627 // sometimes a shuffle in big-endian mode.
selectVSplatUimmPow2(SDValue N,SDValue & Imm) const628 bool MipsSEDAGToDAGISel::selectVSplatUimmPow2(SDValue N, SDValue &Imm) const {
629 APInt ImmValue;
630 EVT EltTy = N->getValueType(0).getVectorElementType();
631
632 if (N->getOpcode() == ISD::BITCAST)
633 N = N->getOperand(0);
634
635 if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
636 ImmValue.getBitWidth() == EltTy.getSizeInBits()) {
637 int32_t Log2 = ImmValue.exactLogBase2();
638
639 if (Log2 != -1) {
640 Imm = CurDAG->getTargetConstant(Log2, SDLoc(N), EltTy);
641 return true;
642 }
643 }
644
645 return false;
646 }
647
648 // Select constant vector splats whose value only has a consecutive sequence
649 // of left-most bits set (e.g. 0b11...1100...00).
650 //
651 // In addition to the requirements of selectVSplat(), this function returns
652 // true and sets Imm if:
653 // * The splat value is the same width as the elements of the vector
654 // * The splat value is a consecutive sequence of left-most bits.
655 //
656 // This function looks through ISD::BITCAST nodes.
657 // TODO: This might not be appropriate for big-endian MSA since BITCAST is
658 // sometimes a shuffle in big-endian mode.
selectVSplatMaskL(SDValue N,SDValue & Imm) const659 bool MipsSEDAGToDAGISel::selectVSplatMaskL(SDValue N, SDValue &Imm) const {
660 APInt ImmValue;
661 EVT EltTy = N->getValueType(0).getVectorElementType();
662
663 if (N->getOpcode() == ISD::BITCAST)
664 N = N->getOperand(0);
665
666 if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
667 ImmValue.getBitWidth() == EltTy.getSizeInBits()) {
668 // Extract the run of set bits starting with bit zero from the bitwise
669 // inverse of ImmValue, and test that the inverse of this is the same
670 // as the original value.
671 if (ImmValue == ~(~ImmValue & ~(~ImmValue + 1))) {
672
673 Imm = CurDAG->getTargetConstant(ImmValue.popcount() - 1, SDLoc(N), EltTy);
674 return true;
675 }
676 }
677
678 return false;
679 }
680
681 // Select constant vector splats whose value only has a consecutive sequence
682 // of right-most bits set (e.g. 0b00...0011...11).
683 //
684 // In addition to the requirements of selectVSplat(), this function returns
685 // true and sets Imm if:
686 // * The splat value is the same width as the elements of the vector
687 // * The splat value is a consecutive sequence of right-most bits.
688 //
689 // This function looks through ISD::BITCAST nodes.
690 // TODO: This might not be appropriate for big-endian MSA since BITCAST is
691 // sometimes a shuffle in big-endian mode.
selectVSplatMaskR(SDValue N,SDValue & Imm) const692 bool MipsSEDAGToDAGISel::selectVSplatMaskR(SDValue N, SDValue &Imm) const {
693 APInt ImmValue;
694 EVT EltTy = N->getValueType(0).getVectorElementType();
695
696 if (N->getOpcode() == ISD::BITCAST)
697 N = N->getOperand(0);
698
699 if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
700 ImmValue.getBitWidth() == EltTy.getSizeInBits()) {
701 // Extract the run of set bits starting with bit zero, and test that the
702 // result is the same as the original value
703 if (ImmValue == (ImmValue & ~(ImmValue + 1))) {
704 Imm = CurDAG->getTargetConstant(ImmValue.popcount() - 1, SDLoc(N), EltTy);
705 return true;
706 }
707 }
708
709 return false;
710 }
711
selectVSplatUimmInvPow2(SDValue N,SDValue & Imm) const712 bool MipsSEDAGToDAGISel::selectVSplatUimmInvPow2(SDValue N,
713 SDValue &Imm) const {
714 APInt ImmValue;
715 EVT EltTy = N->getValueType(0).getVectorElementType();
716
717 if (N->getOpcode() == ISD::BITCAST)
718 N = N->getOperand(0);
719
720 if (selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
721 ImmValue.getBitWidth() == EltTy.getSizeInBits()) {
722 int32_t Log2 = (~ImmValue).exactLogBase2();
723
724 if (Log2 != -1) {
725 Imm = CurDAG->getTargetConstant(Log2, SDLoc(N), EltTy);
726 return true;
727 }
728 }
729
730 return false;
731 }
732
733 // Select const vector splat of 1.
selectVSplatImmEq1(SDValue N) const734 bool MipsSEDAGToDAGISel::selectVSplatImmEq1(SDValue N) const {
735 APInt ImmValue;
736 EVT EltTy = N->getValueType(0).getVectorElementType();
737
738 if (N->getOpcode() == ISD::BITCAST)
739 N = N->getOperand(0);
740
741 return selectVSplat(N.getNode(), ImmValue, EltTy.getSizeInBits()) &&
742 ImmValue.getBitWidth() == EltTy.getSizeInBits() && ImmValue == 1;
743 }
744
trySelect(SDNode * Node)745 bool MipsSEDAGToDAGISel::trySelect(SDNode *Node) {
746 unsigned Opcode = Node->getOpcode();
747 SDLoc DL(Node);
748
749 ///
750 // Instruction Selection not handled by the auto-generated
751 // tablegen selection should be handled here.
752 ///
753 switch(Opcode) {
754 default: break;
755
756 case MipsISD::DOUBLE_SELECT_I:
757 case MipsISD::DOUBLE_SELECT_I64: {
758 MVT VT = Subtarget->isGP64bit() ? MVT::i64 : MVT::i32;
759 SDValue cond = Node->getOperand(0);
760 SDValue Hi1 = Node->getOperand(1);
761 SDValue Lo1 = Node->getOperand(2);
762 SDValue Hi2 = Node->getOperand(3);
763 SDValue Lo2 = Node->getOperand(4);
764
765 SDValue ops[] = {cond, Hi1, Lo1, Hi2, Lo2};
766 EVT NodeTys[] = {VT, VT};
767 ReplaceNode(Node, CurDAG->getMachineNode(Subtarget->isGP64bit()
768 ? Mips::PseudoD_SELECT_I64
769 : Mips::PseudoD_SELECT_I,
770 DL, NodeTys, ops));
771 return true;
772 }
773
774 case ISD::ADDE: {
775 selectAddE(Node, DL);
776 return true;
777 }
778
779 case ISD::ConstantFP: {
780 auto *CN = cast<ConstantFPSDNode>(Node);
781 if (Node->getValueType(0) == MVT::f64 && CN->isExactlyValue(+0.0)) {
782 if (Subtarget->isGP64bit()) {
783 SDValue Zero = CurDAG->getCopyFromReg(CurDAG->getEntryNode(), DL,
784 Mips::ZERO_64, MVT::i64);
785 ReplaceNode(Node,
786 CurDAG->getMachineNode(Mips::DMTC1, DL, MVT::f64, Zero));
787 } else if (Subtarget->isFP64bit()) {
788 SDValue Zero = CurDAG->getCopyFromReg(CurDAG->getEntryNode(), DL,
789 Mips::ZERO, MVT::i32);
790 ReplaceNode(Node, CurDAG->getMachineNode(Mips::BuildPairF64_64, DL,
791 MVT::f64, Zero, Zero));
792 } else {
793 SDValue Zero = CurDAG->getCopyFromReg(CurDAG->getEntryNode(), DL,
794 Mips::ZERO, MVT::i32);
795 ReplaceNode(Node, CurDAG->getMachineNode(Mips::BuildPairF64, DL,
796 MVT::f64, Zero, Zero));
797 }
798 return true;
799 }
800 break;
801 }
802
803 case ISD::Constant: {
804 auto *CN = cast<ConstantSDNode>(Node);
805 int64_t Imm = CN->getSExtValue();
806 unsigned Size = CN->getValueSizeInBits(0);
807
808 if (isInt<32>(Imm))
809 break;
810
811 MipsAnalyzeImmediate AnalyzeImm;
812
813 const MipsAnalyzeImmediate::InstSeq &Seq =
814 AnalyzeImm.Analyze(Imm, Size, false);
815
816 MipsAnalyzeImmediate::InstSeq::const_iterator Inst = Seq.begin();
817 SDLoc DL(CN);
818 SDNode *RegOpnd;
819 SDValue ImmOpnd = CurDAG->getTargetConstant(SignExtend64<16>(Inst->ImmOpnd),
820 DL, MVT::i64);
821
822 // The first instruction can be a LUi which is different from other
823 // instructions (ADDiu, ORI and SLL) in that it does not have a register
824 // operand.
825 if (Inst->Opc == Mips::LUi64)
826 RegOpnd = CurDAG->getMachineNode(Inst->Opc, DL, MVT::i64, ImmOpnd);
827 else
828 RegOpnd =
829 CurDAG->getMachineNode(Inst->Opc, DL, MVT::i64,
830 CurDAG->getRegister(Mips::ZERO_64, MVT::i64),
831 ImmOpnd);
832
833 // The remaining instructions in the sequence are handled here.
834 for (++Inst; Inst != Seq.end(); ++Inst) {
835 ImmOpnd = CurDAG->getTargetConstant(SignExtend64<16>(Inst->ImmOpnd), DL,
836 MVT::i64);
837 RegOpnd = CurDAG->getMachineNode(Inst->Opc, DL, MVT::i64,
838 SDValue(RegOpnd, 0), ImmOpnd);
839 }
840
841 ReplaceNode(Node, RegOpnd);
842 return true;
843 }
844
845 case ISD::INTRINSIC_W_CHAIN: {
846 const unsigned IntrinsicOpcode = Node->getConstantOperandVal(1);
847 switch (IntrinsicOpcode) {
848 default:
849 break;
850
851 case Intrinsic::mips_cfcmsa: {
852 SDValue ChainIn = Node->getOperand(0);
853 SDValue RegIdx = Node->getOperand(2);
854 SDValue Reg = CurDAG->getCopyFromReg(ChainIn, DL,
855 getMSACtrlReg(RegIdx), MVT::i32);
856 ReplaceNode(Node, Reg.getNode());
857 return true;
858 }
859 case Intrinsic::mips_ldr_d:
860 case Intrinsic::mips_ldr_w: {
861 unsigned Op = (IntrinsicOpcode == Intrinsic::mips_ldr_d) ? Mips::LDR_D
862 : Mips::LDR_W;
863
864 SDLoc DL(Node);
865 assert(Node->getNumOperands() == 4 && "Unexpected number of operands.");
866 const SDValue &Chain = Node->getOperand(0);
867 const SDValue &Intrinsic = Node->getOperand(1);
868 const SDValue &Pointer = Node->getOperand(2);
869 const SDValue &Constant = Node->getOperand(3);
870
871 assert(Chain.getValueType() == MVT::Other);
872 (void)Intrinsic;
873 assert(Intrinsic.getOpcode() == ISD::TargetConstant &&
874 Constant.getOpcode() == ISD::Constant &&
875 "Invalid instruction operand.");
876
877 // Convert Constant to TargetConstant.
878 const ConstantInt *Val =
879 cast<ConstantSDNode>(Constant)->getConstantIntValue();
880 SDValue Imm =
881 CurDAG->getTargetConstant(*Val, DL, Constant.getValueType());
882
883 SmallVector<SDValue, 3> Ops{Pointer, Imm, Chain};
884
885 assert(Node->getNumValues() == 2);
886 assert(Node->getValueType(0).is128BitVector());
887 assert(Node->getValueType(1) == MVT::Other);
888 SmallVector<EVT, 2> ResTys{Node->getValueType(0), Node->getValueType(1)};
889
890 ReplaceNode(Node, CurDAG->getMachineNode(Op, DL, ResTys, Ops));
891
892 return true;
893 }
894 }
895 break;
896 }
897
898 case ISD::INTRINSIC_WO_CHAIN: {
899 switch (Node->getConstantOperandVal(0)) {
900 default:
901 break;
902
903 case Intrinsic::mips_move_v:
904 // Like an assignment but will always produce a move.v even if
905 // unnecessary.
906 ReplaceNode(Node, CurDAG->getMachineNode(Mips::MOVE_V, DL,
907 Node->getValueType(0),
908 Node->getOperand(1)));
909 return true;
910 }
911 break;
912 }
913
914 case ISD::INTRINSIC_VOID: {
915 const unsigned IntrinsicOpcode = Node->getConstantOperandVal(1);
916 switch (IntrinsicOpcode) {
917 default:
918 break;
919
920 case Intrinsic::mips_ctcmsa: {
921 SDValue ChainIn = Node->getOperand(0);
922 SDValue RegIdx = Node->getOperand(2);
923 SDValue Value = Node->getOperand(3);
924 SDValue ChainOut = CurDAG->getCopyToReg(ChainIn, DL,
925 getMSACtrlReg(RegIdx), Value);
926 ReplaceNode(Node, ChainOut.getNode());
927 return true;
928 }
929 case Intrinsic::mips_str_d:
930 case Intrinsic::mips_str_w: {
931 unsigned Op = (IntrinsicOpcode == Intrinsic::mips_str_d) ? Mips::STR_D
932 : Mips::STR_W;
933
934 SDLoc DL(Node);
935 assert(Node->getNumOperands() == 5 && "Unexpected number of operands.");
936 const SDValue &Chain = Node->getOperand(0);
937 const SDValue &Intrinsic = Node->getOperand(1);
938 const SDValue &Vec = Node->getOperand(2);
939 const SDValue &Pointer = Node->getOperand(3);
940 const SDValue &Constant = Node->getOperand(4);
941
942 assert(Chain.getValueType() == MVT::Other);
943 (void)Intrinsic;
944 assert(Intrinsic.getOpcode() == ISD::TargetConstant &&
945 Constant.getOpcode() == ISD::Constant &&
946 "Invalid instruction operand.");
947
948 // Convert Constant to TargetConstant.
949 const ConstantInt *Val =
950 cast<ConstantSDNode>(Constant)->getConstantIntValue();
951 SDValue Imm =
952 CurDAG->getTargetConstant(*Val, DL, Constant.getValueType());
953
954 SmallVector<SDValue, 4> Ops{Vec, Pointer, Imm, Chain};
955
956 assert(Node->getNumValues() == 1);
957 assert(Node->getValueType(0) == MVT::Other);
958 SmallVector<EVT, 1> ResTys{Node->getValueType(0)};
959
960 ReplaceNode(Node, CurDAG->getMachineNode(Op, DL, ResTys, Ops));
961 return true;
962 }
963 }
964 break;
965 }
966
967 case MipsISD::FAbs: {
968 MVT ResTy = Node->getSimpleValueType(0);
969 assert((ResTy == MVT::f64 || ResTy == MVT::f32) &&
970 "Unsupported float type!");
971 unsigned Opc = 0;
972 if (ResTy == MVT::f64)
973 Opc = (Subtarget->isFP64bit() ? Mips::FABS_D64 : Mips::FABS_D32);
974 else
975 Opc = Mips::FABS_S;
976
977 if (Subtarget->inMicroMipsMode()) {
978 switch (Opc) {
979 case Mips::FABS_D64:
980 Opc = Mips::FABS_D64_MM;
981 break;
982 case Mips::FABS_D32:
983 Opc = Mips::FABS_D32_MM;
984 break;
985 case Mips::FABS_S:
986 Opc = Mips::FABS_S_MM;
987 break;
988 default:
989 llvm_unreachable("Unknown opcode for MIPS floating point abs!");
990 }
991 }
992
993 ReplaceNode(Node,
994 CurDAG->getMachineNode(Opc, DL, ResTy, Node->getOperand(0)));
995
996 return true;
997 }
998
999 // Manually match MipsISD::Ins nodes to get the correct instruction. It has
1000 // to be done in this fashion so that we respect the differences between
1001 // dins and dinsm, as the difference is that the size operand has the range
1002 // 0 < size <= 32 for dins while dinsm has the range 2 <= size <= 64 which
1003 // means SelectionDAGISel would have to test all the operands at once to
1004 // match the instruction.
1005 case MipsISD::Ins: {
1006
1007 // Validating the node operands.
1008 if (Node->getValueType(0) != MVT::i32 && Node->getValueType(0) != MVT::i64)
1009 return false;
1010
1011 if (Node->getNumOperands() != 4)
1012 return false;
1013
1014 if (Node->getOperand(1)->getOpcode() != ISD::Constant ||
1015 Node->getOperand(2)->getOpcode() != ISD::Constant)
1016 return false;
1017
1018 MVT ResTy = Node->getSimpleValueType(0);
1019 uint64_t Pos = Node->getConstantOperandVal(1);
1020 uint64_t Size = Node->getConstantOperandVal(2);
1021
1022 // Size has to be >0 for 'ins', 'dins' and 'dinsu'.
1023 if (!Size)
1024 return false;
1025
1026 if (Pos + Size > 64)
1027 return false;
1028
1029 if (ResTy != MVT::i32 && ResTy != MVT::i64)
1030 return false;
1031
1032 unsigned Opcode = 0;
1033 if (ResTy == MVT::i32) {
1034 if (Pos + Size <= 32)
1035 Opcode = Mips::INS;
1036 } else {
1037 if (Pos + Size <= 32)
1038 Opcode = Mips::DINS;
1039 else if (Pos < 32 && 1 < Size)
1040 Opcode = Mips::DINSM;
1041 else
1042 Opcode = Mips::DINSU;
1043 }
1044
1045 if (Opcode) {
1046 SDValue Ops[4] = {
1047 Node->getOperand(0), CurDAG->getTargetConstant(Pos, DL, MVT::i32),
1048 CurDAG->getTargetConstant(Size, DL, MVT::i32), Node->getOperand(3)};
1049
1050 ReplaceNode(Node, CurDAG->getMachineNode(Opcode, DL, ResTy, Ops));
1051 return true;
1052 }
1053
1054 return false;
1055 }
1056
1057 case MipsISD::ThreadPointer: {
1058 EVT PtrVT = getTargetLowering()->getPointerTy(CurDAG->getDataLayout());
1059 unsigned RdhwrOpc, DestReg;
1060
1061 if (PtrVT == MVT::i32) {
1062 RdhwrOpc = Mips::RDHWR;
1063 DestReg = Mips::V1;
1064 } else {
1065 RdhwrOpc = Mips::RDHWR64;
1066 DestReg = Mips::V1_64;
1067 }
1068
1069 SDNode *Rdhwr =
1070 CurDAG->getMachineNode(RdhwrOpc, DL, Node->getValueType(0), MVT::Glue,
1071 CurDAG->getRegister(Mips::HWR29, MVT::i32),
1072 CurDAG->getTargetConstant(0, DL, MVT::i32));
1073 SDValue Chain = CurDAG->getCopyToReg(CurDAG->getEntryNode(), DL, DestReg,
1074 SDValue(Rdhwr, 0), SDValue(Rdhwr, 1));
1075 SDValue ResNode = CurDAG->getCopyFromReg(Chain, DL, DestReg, PtrVT,
1076 Chain.getValue(1));
1077 ReplaceNode(Node, ResNode.getNode());
1078 return true;
1079 }
1080
1081 case ISD::BUILD_VECTOR: {
1082 // Select appropriate ldi.[bhwd] instructions for constant splats of
1083 // 128-bit when MSA is enabled. Fixup any register class mismatches that
1084 // occur as a result.
1085 //
1086 // This allows the compiler to use a wider range of immediates than would
1087 // otherwise be allowed. If, for example, v4i32 could only use ldi.h then
1088 // it would not be possible to load { 0x01010101, 0x01010101, 0x01010101,
1089 // 0x01010101 } without using a constant pool. This would be sub-optimal
1090 // when // 'ldi.b wd, 1' is capable of producing that bit-pattern in the
1091 // same set/ of registers. Similarly, ldi.h isn't capable of producing {
1092 // 0x00000000, 0x00000001, 0x00000000, 0x00000001 } but 'ldi.d wd, 1' can.
1093
1094 const MipsABIInfo &ABI =
1095 static_cast<const MipsTargetMachine &>(TM).getABI();
1096
1097 BuildVectorSDNode *BVN = cast<BuildVectorSDNode>(Node);
1098 APInt SplatValue, SplatUndef;
1099 unsigned SplatBitSize;
1100 bool HasAnyUndefs;
1101 unsigned LdiOp;
1102 EVT ResVecTy = BVN->getValueType(0);
1103 EVT ViaVecTy;
1104
1105 if (!Subtarget->hasMSA() || !BVN->getValueType(0).is128BitVector())
1106 return false;
1107
1108 if (!BVN->isConstantSplat(SplatValue, SplatUndef, SplatBitSize,
1109 HasAnyUndefs, 8,
1110 !Subtarget->isLittle()))
1111 return false;
1112
1113 switch (SplatBitSize) {
1114 default:
1115 return false;
1116 case 8:
1117 LdiOp = Mips::LDI_B;
1118 ViaVecTy = MVT::v16i8;
1119 break;
1120 case 16:
1121 LdiOp = Mips::LDI_H;
1122 ViaVecTy = MVT::v8i16;
1123 break;
1124 case 32:
1125 LdiOp = Mips::LDI_W;
1126 ViaVecTy = MVT::v4i32;
1127 break;
1128 case 64:
1129 LdiOp = Mips::LDI_D;
1130 ViaVecTy = MVT::v2i64;
1131 break;
1132 }
1133
1134 SDNode *Res = nullptr;
1135
1136 // If we have a signed 10 bit integer, we can splat it directly.
1137 //
1138 // If we have something bigger we can synthesize the value into a GPR and
1139 // splat from there.
1140 if (SplatValue.isSignedIntN(10)) {
1141 SDValue Imm = CurDAG->getTargetConstant(SplatValue, DL,
1142 ViaVecTy.getVectorElementType());
1143
1144 Res = CurDAG->getMachineNode(LdiOp, DL, ViaVecTy, Imm);
1145 } else if (SplatValue.isSignedIntN(16) &&
1146 ((ABI.IsO32() && SplatBitSize < 64) ||
1147 (ABI.IsN32() || ABI.IsN64()))) {
1148 // Only handle signed 16 bit values when the element size is GPR width.
1149 // MIPS64 can handle all the cases but MIPS32 would need to handle
1150 // negative cases specifically here. Instead, handle those cases as
1151 // 64bit values.
1152
1153 bool Is32BitSplat = ABI.IsO32() || SplatBitSize < 64;
1154 const unsigned ADDiuOp = Is32BitSplat ? Mips::ADDiu : Mips::DADDiu;
1155 const MVT SplatMVT = Is32BitSplat ? MVT::i32 : MVT::i64;
1156 SDValue ZeroVal = CurDAG->getRegister(
1157 Is32BitSplat ? Mips::ZERO : Mips::ZERO_64, SplatMVT);
1158
1159 const unsigned FILLOp =
1160 SplatBitSize == 16
1161 ? Mips::FILL_H
1162 : (SplatBitSize == 32 ? Mips::FILL_W
1163 : (SplatBitSize == 64 ? Mips::FILL_D : 0));
1164
1165 assert(FILLOp != 0 && "Unknown FILL Op for splat synthesis!");
1166 assert((!ABI.IsO32() || (FILLOp != Mips::FILL_D)) &&
1167 "Attempting to use fill.d on MIPS32!");
1168
1169 const unsigned Lo = SplatValue.getLoBits(16).getZExtValue();
1170 SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, SplatMVT);
1171
1172 Res = CurDAG->getMachineNode(ADDiuOp, DL, SplatMVT, ZeroVal, LoVal);
1173 Res = CurDAG->getMachineNode(FILLOp, DL, ViaVecTy, SDValue(Res, 0));
1174
1175 } else if (SplatValue.isSignedIntN(32) && SplatBitSize == 32) {
1176 // Only handle the cases where the splat size agrees with the size
1177 // of the SplatValue here.
1178 const unsigned Lo = SplatValue.getLoBits(16).getZExtValue();
1179 const unsigned Hi = SplatValue.lshr(16).getLoBits(16).getZExtValue();
1180 SDValue ZeroVal = CurDAG->getRegister(Mips::ZERO, MVT::i32);
1181
1182 SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, MVT::i32);
1183 SDValue HiVal = CurDAG->getTargetConstant(Hi, DL, MVT::i32);
1184
1185 if (Hi)
1186 Res = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HiVal);
1187
1188 if (Lo)
1189 Res = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32,
1190 Hi ? SDValue(Res, 0) : ZeroVal, LoVal);
1191
1192 assert((Hi || Lo) && "Zero case reached 32 bit case splat synthesis!");
1193 Res =
1194 CurDAG->getMachineNode(Mips::FILL_W, DL, MVT::v4i32, SDValue(Res, 0));
1195
1196 } else if (SplatValue.isSignedIntN(32) && SplatBitSize == 64 &&
1197 (ABI.IsN32() || ABI.IsN64())) {
1198 // N32 and N64 can perform some tricks that O32 can't for signed 32 bit
1199 // integers due to having 64bit registers. lui will cause the necessary
1200 // zero/sign extension.
1201 const unsigned Lo = SplatValue.getLoBits(16).getZExtValue();
1202 const unsigned Hi = SplatValue.lshr(16).getLoBits(16).getZExtValue();
1203 SDValue ZeroVal = CurDAG->getRegister(Mips::ZERO, MVT::i32);
1204
1205 SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, MVT::i32);
1206 SDValue HiVal = CurDAG->getTargetConstant(Hi, DL, MVT::i32);
1207
1208 if (Hi)
1209 Res = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HiVal);
1210
1211 if (Lo)
1212 Res = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32,
1213 Hi ? SDValue(Res, 0) : ZeroVal, LoVal);
1214
1215 Res = CurDAG->getMachineNode(
1216 Mips::SUBREG_TO_REG, DL, MVT::i64,
1217 CurDAG->getTargetConstant(((Hi >> 15) & 0x1), DL, MVT::i64),
1218 SDValue(Res, 0),
1219 CurDAG->getTargetConstant(Mips::sub_32, DL, MVT::i64));
1220
1221 Res =
1222 CurDAG->getMachineNode(Mips::FILL_D, DL, MVT::v2i64, SDValue(Res, 0));
1223
1224 } else if (SplatValue.isSignedIntN(64)) {
1225 // If we have a 64 bit Splat value, we perform a similar sequence to the
1226 // above:
1227 //
1228 // MIPS32: MIPS64:
1229 // lui $res, %highest(val) lui $res, %highest(val)
1230 // ori $res, $res, %higher(val) ori $res, $res, %higher(val)
1231 // lui $res2, %hi(val) lui $res2, %hi(val)
1232 // ori $res2, %res2, %lo(val) ori $res2, %res2, %lo(val)
1233 // $res3 = fill $res2 dinsu $res, $res2, 0, 32
1234 // $res4 = insert.w $res3[1], $res fill.d $res
1235 // splat.d $res4, 0
1236 //
1237 // The ability to use dinsu is guaranteed as MSA requires MIPSR5.
1238 // This saves having to materialize the value by shifts and ors.
1239 //
1240 // FIXME: Implement the preferred sequence for MIPS64R6:
1241 //
1242 // MIPS64R6:
1243 // ori $res, $zero, %lo(val)
1244 // daui $res, $res, %hi(val)
1245 // dahi $res, $res, %higher(val)
1246 // dati $res, $res, %highest(cal)
1247 // fill.d $res
1248 //
1249
1250 const unsigned Lo = SplatValue.getLoBits(16).getZExtValue();
1251 const unsigned Hi = SplatValue.lshr(16).getLoBits(16).getZExtValue();
1252 const unsigned Higher = SplatValue.lshr(32).getLoBits(16).getZExtValue();
1253 const unsigned Highest = SplatValue.lshr(48).getLoBits(16).getZExtValue();
1254
1255 SDValue LoVal = CurDAG->getTargetConstant(Lo, DL, MVT::i32);
1256 SDValue HiVal = CurDAG->getTargetConstant(Hi, DL, MVT::i32);
1257 SDValue HigherVal = CurDAG->getTargetConstant(Higher, DL, MVT::i32);
1258 SDValue HighestVal = CurDAG->getTargetConstant(Highest, DL, MVT::i32);
1259 SDValue ZeroVal = CurDAG->getRegister(Mips::ZERO, MVT::i32);
1260
1261 // Independent of whether we're targeting MIPS64 or not, the basic
1262 // operations are the same. Also, directly use the $zero register if
1263 // the 16 bit chunk is zero.
1264 //
1265 // For optimization purposes we always synthesize the splat value as
1266 // an i32 value, then if we're targetting MIPS64, use SUBREG_TO_REG
1267 // just before combining the values with dinsu to produce an i64. This
1268 // enables SelectionDAG to aggressively share components of splat values
1269 // where possible.
1270 //
1271 // FIXME: This is the general constant synthesis problem. This code
1272 // should be factored out into a class shared between all the
1273 // classes that need it. Specifically, for a splat size of 64
1274 // bits that's a negative number we can do better than LUi/ORi
1275 // for the upper 32bits.
1276
1277 if (Hi)
1278 Res = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HiVal);
1279
1280 if (Lo)
1281 Res = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32,
1282 Hi ? SDValue(Res, 0) : ZeroVal, LoVal);
1283
1284 SDNode *HiRes;
1285 if (Highest)
1286 HiRes = CurDAG->getMachineNode(Mips::LUi, DL, MVT::i32, HighestVal);
1287
1288 if (Higher)
1289 HiRes = CurDAG->getMachineNode(Mips::ORi, DL, MVT::i32,
1290 Highest ? SDValue(HiRes, 0) : ZeroVal,
1291 HigherVal);
1292
1293
1294 if (ABI.IsO32()) {
1295 Res = CurDAG->getMachineNode(Mips::FILL_W, DL, MVT::v4i32,
1296 (Hi || Lo) ? SDValue(Res, 0) : ZeroVal);
1297
1298 Res = CurDAG->getMachineNode(
1299 Mips::INSERT_W, DL, MVT::v4i32, SDValue(Res, 0),
1300 (Highest || Higher) ? SDValue(HiRes, 0) : ZeroVal,
1301 CurDAG->getTargetConstant(1, DL, MVT::i32));
1302
1303 const TargetLowering *TLI = getTargetLowering();
1304 const TargetRegisterClass *RC =
1305 TLI->getRegClassFor(ViaVecTy.getSimpleVT());
1306
1307 Res = CurDAG->getMachineNode(
1308 Mips::COPY_TO_REGCLASS, DL, ViaVecTy, SDValue(Res, 0),
1309 CurDAG->getTargetConstant(RC->getID(), DL, MVT::i32));
1310
1311 Res = CurDAG->getMachineNode(
1312 Mips::SPLATI_D, DL, MVT::v2i64, SDValue(Res, 0),
1313 CurDAG->getTargetConstant(0, DL, MVT::i32));
1314 } else if (ABI.IsN64() || ABI.IsN32()) {
1315
1316 SDValue Zero64Val = CurDAG->getRegister(Mips::ZERO_64, MVT::i64);
1317 const bool HiResNonZero = Highest || Higher;
1318 const bool ResNonZero = Hi || Lo;
1319
1320 if (HiResNonZero)
1321 HiRes = CurDAG->getMachineNode(
1322 Mips::SUBREG_TO_REG, DL, MVT::i64,
1323 CurDAG->getTargetConstant(((Highest >> 15) & 0x1), DL, MVT::i64),
1324 SDValue(HiRes, 0),
1325 CurDAG->getTargetConstant(Mips::sub_32, DL, MVT::i64));
1326
1327 if (ResNonZero)
1328 Res = CurDAG->getMachineNode(
1329 Mips::SUBREG_TO_REG, DL, MVT::i64,
1330 CurDAG->getTargetConstant(((Hi >> 15) & 0x1), DL, MVT::i64),
1331 SDValue(Res, 0),
1332 CurDAG->getTargetConstant(Mips::sub_32, DL, MVT::i64));
1333
1334 // We have 3 cases:
1335 // The HiRes is nonzero but Res is $zero => dsll32 HiRes, 0
1336 // The Res is nonzero but HiRes is $zero => dinsu Res, $zero, 32, 32
1337 // Both are non zero => dinsu Res, HiRes, 32, 32
1338 //
1339 // The obvious "missing" case is when both are zero, but that case is
1340 // handled by the ldi case.
1341 if (ResNonZero) {
1342 IntegerType *Int32Ty =
1343 IntegerType::get(MF->getFunction().getContext(), 32);
1344 const ConstantInt *Const32 = ConstantInt::get(Int32Ty, 32);
1345 SDValue Ops[4] = {HiResNonZero ? SDValue(HiRes, 0) : Zero64Val,
1346 CurDAG->getConstant(*Const32, DL, MVT::i32),
1347 CurDAG->getConstant(*Const32, DL, MVT::i32),
1348 SDValue(Res, 0)};
1349
1350 Res = CurDAG->getMachineNode(Mips::DINSU, DL, MVT::i64, Ops);
1351 } else if (HiResNonZero) {
1352 Res = CurDAG->getMachineNode(
1353 Mips::DSLL32, DL, MVT::i64, SDValue(HiRes, 0),
1354 CurDAG->getTargetConstant(0, DL, MVT::i32));
1355 } else
1356 llvm_unreachable(
1357 "Zero splat value handled by non-zero 64bit splat synthesis!");
1358
1359 Res = CurDAG->getMachineNode(Mips::FILL_D, DL, MVT::v2i64,
1360 SDValue(Res, 0));
1361 } else
1362 llvm_unreachable("Unknown ABI in MipsISelDAGToDAG!");
1363
1364 } else
1365 return false;
1366
1367 if (ResVecTy != ViaVecTy) {
1368 // If LdiOp is writing to a different register class to ResVecTy, then
1369 // fix it up here. This COPY_TO_REGCLASS should never cause a move.v
1370 // since the source and destination register sets contain the same
1371 // registers.
1372 const TargetLowering *TLI = getTargetLowering();
1373 MVT ResVecTySimple = ResVecTy.getSimpleVT();
1374 const TargetRegisterClass *RC = TLI->getRegClassFor(ResVecTySimple);
1375 Res = CurDAG->getMachineNode(Mips::COPY_TO_REGCLASS, DL,
1376 ResVecTy, SDValue(Res, 0),
1377 CurDAG->getTargetConstant(RC->getID(), DL,
1378 MVT::i32));
1379 }
1380
1381 ReplaceNode(Node, Res);
1382 return true;
1383 }
1384
1385 }
1386
1387 return false;
1388 }
1389
SelectInlineAsmMemoryOperand(const SDValue & Op,InlineAsm::ConstraintCode ConstraintID,std::vector<SDValue> & OutOps)1390 bool MipsSEDAGToDAGISel::SelectInlineAsmMemoryOperand(
1391 const SDValue &Op, InlineAsm::ConstraintCode ConstraintID,
1392 std::vector<SDValue> &OutOps) {
1393 SDValue Base, Offset;
1394
1395 switch(ConstraintID) {
1396 default:
1397 llvm_unreachable("Unexpected asm memory constraint");
1398 // All memory constraints can at least accept raw pointers.
1399 case InlineAsm::ConstraintCode::m:
1400 case InlineAsm::ConstraintCode::o:
1401 if (selectAddrRegImm16(Op, Base, Offset)) {
1402 OutOps.push_back(Base);
1403 OutOps.push_back(Offset);
1404 return false;
1405 }
1406 OutOps.push_back(Op);
1407 OutOps.push_back(CurDAG->getTargetConstant(0, SDLoc(Op), MVT::i32));
1408 return false;
1409 case InlineAsm::ConstraintCode::R:
1410 // The 'R' constraint is supposed to be much more complicated than this.
1411 // However, it's becoming less useful due to architectural changes and
1412 // ought to be replaced by other constraints such as 'ZC'.
1413 // For now, support 9-bit signed offsets which is supportable by all
1414 // subtargets for all instructions.
1415 if (selectAddrRegImm9(Op, Base, Offset)) {
1416 OutOps.push_back(Base);
1417 OutOps.push_back(Offset);
1418 return false;
1419 }
1420 OutOps.push_back(Op);
1421 OutOps.push_back(CurDAG->getTargetConstant(0, SDLoc(Op), MVT::i32));
1422 return false;
1423 case InlineAsm::ConstraintCode::ZC:
1424 // ZC matches whatever the pref, ll, and sc instructions can handle for the
1425 // given subtarget.
1426 if (Subtarget->inMicroMipsMode()) {
1427 // On microMIPS, they can handle 12-bit offsets.
1428 if (selectAddrRegImm12(Op, Base, Offset)) {
1429 OutOps.push_back(Base);
1430 OutOps.push_back(Offset);
1431 return false;
1432 }
1433 } else if (Subtarget->hasMips32r6()) {
1434 // On MIPS32r6/MIPS64r6, they can only handle 9-bit offsets.
1435 if (selectAddrRegImm9(Op, Base, Offset)) {
1436 OutOps.push_back(Base);
1437 OutOps.push_back(Offset);
1438 return false;
1439 }
1440 } else if (selectAddrRegImm16(Op, Base, Offset)) {
1441 // Prior to MIPS32r6/MIPS64r6, they can handle 16-bit offsets.
1442 OutOps.push_back(Base);
1443 OutOps.push_back(Offset);
1444 return false;
1445 }
1446 // In all cases, 0-bit offsets are acceptable.
1447 OutOps.push_back(Op);
1448 OutOps.push_back(CurDAG->getTargetConstant(0, SDLoc(Op), MVT::i32));
1449 return false;
1450 }
1451 return true;
1452 }
1453
MipsSEDAGToDAGISelLegacy(MipsTargetMachine & TM,CodeGenOptLevel OL)1454 MipsSEDAGToDAGISelLegacy::MipsSEDAGToDAGISelLegacy(MipsTargetMachine &TM,
1455 CodeGenOptLevel OL)
1456 : MipsDAGToDAGISelLegacy(std::make_unique<MipsSEDAGToDAGISel>(TM, OL)) {}
1457
createMipsSEISelDag(MipsTargetMachine & TM,CodeGenOptLevel OptLevel)1458 FunctionPass *llvm::createMipsSEISelDag(MipsTargetMachine &TM,
1459 CodeGenOptLevel OptLevel) {
1460 return new MipsSEDAGToDAGISelLegacy(TM, OptLevel);
1461 }
1462