xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/AMDGPUInstructions.td (revision 0fca6ea1d4eea4c934cfff25ac9ee8ad6fe95583)
10b57cec5SDimitry Andric//===-- AMDGPUInstructions.td - Common instruction defs ---*- tablegen -*-===//
20b57cec5SDimitry Andric//
30b57cec5SDimitry Andric// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric// See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric//
70b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric//
90b57cec5SDimitry Andric// This file contains instruction defs that are common to all hw codegen
100b57cec5SDimitry Andric// targets.
110b57cec5SDimitry Andric//
120b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
130b57cec5SDimitry Andric
140b57cec5SDimitry Andricclass AddressSpacesImpl {
150b57cec5SDimitry Andric  int Flat = 0;
160b57cec5SDimitry Andric  int Global = 1;
170b57cec5SDimitry Andric  int Region = 2;
180b57cec5SDimitry Andric  int Local = 3;
190b57cec5SDimitry Andric  int Constant = 4;
200b57cec5SDimitry Andric  int Private = 5;
2104eeddc0SDimitry Andric  int Constant32Bit = 6;
220b57cec5SDimitry Andric}
230b57cec5SDimitry Andric
240b57cec5SDimitry Andricdef AddrSpaces : AddressSpacesImpl;
250b57cec5SDimitry Andric
260b57cec5SDimitry Andric
270b57cec5SDimitry Andricclass AMDGPUInst <dag outs, dag ins, string asm = "",
280b57cec5SDimitry Andric  list<dag> pattern = []> : Instruction {
290b57cec5SDimitry Andric  field bit isRegisterLoad = 0;
300b57cec5SDimitry Andric  field bit isRegisterStore = 0;
310b57cec5SDimitry Andric
320b57cec5SDimitry Andric  let Namespace = "AMDGPU";
330b57cec5SDimitry Andric  let OutOperandList = outs;
340b57cec5SDimitry Andric  let InOperandList = ins;
350b57cec5SDimitry Andric  let AsmString = asm;
360b57cec5SDimitry Andric  let Pattern = pattern;
370b57cec5SDimitry Andric  let Itinerary = NullALU;
380b57cec5SDimitry Andric
390b57cec5SDimitry Andric  // SoftFail is a field the disassembler can use to provide a way for
400b57cec5SDimitry Andric  // instructions to not match without killing the whole decode process. It is
410b57cec5SDimitry Andric  // mainly used for ARM, but Tablegen expects this field to exist or it fails
420b57cec5SDimitry Andric  // to build the decode table.
4381ad6265SDimitry Andric  field bits<96> SoftFail = 0;
440b57cec5SDimitry Andric
450b57cec5SDimitry Andric  let DecoderNamespace = Namespace;
460b57cec5SDimitry Andric
470b57cec5SDimitry Andric  let TSFlags{63} = isRegisterLoad;
480b57cec5SDimitry Andric  let TSFlags{62} = isRegisterStore;
490b57cec5SDimitry Andric}
500b57cec5SDimitry Andric
510b57cec5SDimitry Andricclass AMDGPUShaderInst <dag outs, dag ins, string asm = "",
520b57cec5SDimitry Andric  list<dag> pattern = []> : AMDGPUInst<outs, ins, asm, pattern> {
530b57cec5SDimitry Andric
540b57cec5SDimitry Andric  field bits<32> Inst = 0xffffffff;
550b57cec5SDimitry Andric}
560b57cec5SDimitry Andric
570b57cec5SDimitry Andric//===---------------------------------------------------------------------===//
580b57cec5SDimitry Andric// Return instruction
590b57cec5SDimitry Andric//===---------------------------------------------------------------------===//
600b57cec5SDimitry Andric
610b57cec5SDimitry Andricclass ILFormat<dag outs, dag ins, string asmstr, list<dag> pattern>
620b57cec5SDimitry Andric: Instruction {
630b57cec5SDimitry Andric
640b57cec5SDimitry Andric     let Namespace = "AMDGPU";
650b57cec5SDimitry Andric     dag OutOperandList = outs;
660b57cec5SDimitry Andric     dag InOperandList = ins;
670b57cec5SDimitry Andric     let Pattern = pattern;
680b57cec5SDimitry Andric     let AsmString = !strconcat(asmstr, "\n");
690b57cec5SDimitry Andric     let isPseudo = 1;
700b57cec5SDimitry Andric     let Itinerary = NullALU;
710b57cec5SDimitry Andric     bit hasIEEEFlag = 0;
720b57cec5SDimitry Andric     bit hasZeroOpFlag = 0;
730b57cec5SDimitry Andric     let mayLoad = 0;
740b57cec5SDimitry Andric     let mayStore = 0;
750b57cec5SDimitry Andric     let hasSideEffects = 0;
760b57cec5SDimitry Andric     let isCodeGenOnly = 1;
770b57cec5SDimitry Andric}
780b57cec5SDimitry Andric
7981ad6265SDimitry Andric// Get the union of two Register lists
8081ad6265SDimitry Andricclass RegListUnion<list<Register> lstA, list<Register> lstB> {
81bdd1243dSDimitry Andric  list<Register> ret = !listconcat(lstA, !listremove(lstB, lstA));
8281ad6265SDimitry Andric}
8381ad6265SDimitry Andric
840b57cec5SDimitry Andricclass AMDGPUPat<dag pattern, dag result> : Pat<pattern, result>,
8506c3fb27SDimitry Andric      PredicateControl, GISelFlags;
8606c3fb27SDimitry Andric
8706c3fb27SDimitry Andriclet GIIgnoreCopies = 1 in
8806c3fb27SDimitry Andricclass AMDGPUPatIgnoreCopies<dag pattern, dag result> : AMDGPUPat<pattern, result>;
890b57cec5SDimitry Andric
90480093f4SDimitry Andriclet RecomputePerFunction = 1 in {
9106c3fb27SDimitry Andricdef FP16Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP64FP16Denormals != DenormalMode::getPreserveSign()">;
9206c3fb27SDimitry Andricdef FP32Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP32Denormals != DenormalMode::getPreserveSign()">;
9306c3fb27SDimitry Andricdef FP64Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP64FP16Denormals != DenormalMode::getPreserveSign()">;
9406c3fb27SDimitry Andricdef NoFP16Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP64FP16Denormals == DenormalMode::getPreserveSign()">;
9506c3fb27SDimitry Andricdef NoFP32Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP32Denormals == DenormalMode::getPreserveSign()">;
9606c3fb27SDimitry Andricdef NoFP64Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP64FP16Denormals == DenormalMode::getPreserveSign()">;
970b57cec5SDimitry Andricdef UnsafeFPMath : Predicate<"TM.Options.UnsafeFPMath">;
98480093f4SDimitry Andric}
99480093f4SDimitry Andric
1000b57cec5SDimitry Andricdef FMA : Predicate<"Subtarget->hasFMA()">;
1010b57cec5SDimitry Andric
1020b57cec5SDimitry Andricdef InstFlag : OperandWithDefaultOps <i32, (ops (i32 0))>;
1030b57cec5SDimitry Andric
10406c3fb27SDimitry Andricdef i1imm_0 : OperandWithDefaultOps<i1, (ops (i1 0))>;
10506c3fb27SDimitry Andric
1065f757f3fSDimitry Andricclass CustomOperandClass<string name, bit optional, string predicateMethod,
1075f757f3fSDimitry Andric                         string parserMethod, string defaultMethod>
10806c3fb27SDimitry Andric    : AsmOperandClass {
10906c3fb27SDimitry Andric  let Name = name;
1105f757f3fSDimitry Andric  let PredicateMethod = predicateMethod;
11106c3fb27SDimitry Andric  let ParserMethod = parserMethod;
1120b57cec5SDimitry Andric  let RenderMethod = "addImmOperands";
11306c3fb27SDimitry Andric  let IsOptional = optional;
11406c3fb27SDimitry Andric  let DefaultMethod = defaultMethod;
1150b57cec5SDimitry Andric}
1160b57cec5SDimitry Andric
11706c3fb27SDimitry Andricclass CustomOperandProps<bit optional = 0, string name = NAME> {
11806c3fb27SDimitry Andric  string ImmTy = "ImmTy"#name;
1195f757f3fSDimitry Andric  string PredicateMethod = "is"#name;
12006c3fb27SDimitry Andric  string ParserMethod = "parse"#name;
12106c3fb27SDimitry Andric  string DefaultValue = "0";
12206c3fb27SDimitry Andric  string DefaultMethod = "[this]() { return "#
12306c3fb27SDimitry Andric    "AMDGPUOperand::CreateImm(this, "#DefaultValue#", SMLoc(), "#
12406c3fb27SDimitry Andric    "AMDGPUOperand::"#ImmTy#"); }";
12506c3fb27SDimitry Andric  string PrintMethod = "print"#name;
12606c3fb27SDimitry Andric  AsmOperandClass ParserMatchClass =
1275f757f3fSDimitry Andric    CustomOperandClass<name, optional, PredicateMethod, ParserMethod,
1285f757f3fSDimitry Andric                       DefaultMethod>;
12906c3fb27SDimitry Andric  string OperandType = "OPERAND_IMMEDIATE";
1300b57cec5SDimitry Andric}
1310b57cec5SDimitry Andric
13206c3fb27SDimitry Andricclass CustomOperand<ValueType type, bit optional = 0, string name = NAME>
13306c3fb27SDimitry Andric  : Operand<type>, CustomOperandProps<optional, name>;
1340b57cec5SDimitry Andric
13506c3fb27SDimitry Andricclass ImmOperand<ValueType type, string name = NAME, bit optional = 0,
13606c3fb27SDimitry Andric                 string printer = "print"#name>
13706c3fb27SDimitry Andric    : CustomOperand<type, optional, name> {
13806c3fb27SDimitry Andric  let ImmTy = "ImmTyNone";
13906c3fb27SDimitry Andric  let ParserMethod = "";
14006c3fb27SDimitry Andric  let PrintMethod = printer;
1410b57cec5SDimitry Andric}
1420b57cec5SDimitry Andric
143*0fca6ea1SDimitry Andricclass S16ImmOperand : ImmOperand<i16, "S16Imm", 0, "printU16ImmOperand">;
144*0fca6ea1SDimitry Andric
145*0fca6ea1SDimitry Andricdef s16imm : S16ImmOperand;
14606c3fb27SDimitry Andricdef u16imm : ImmOperand<i16, "U16Imm", 0, "printU16ImmOperand">;
1470b57cec5SDimitry Andric
1485f757f3fSDimitry Andricclass ValuePredicatedOperand<CustomOperand op, string valuePredicate,
1495f757f3fSDimitry Andric                             bit optional = 0>
1505f757f3fSDimitry Andric    : CustomOperand<op.Type, optional> {
1515f757f3fSDimitry Andric  let ImmTy = op.ImmTy;
1525f757f3fSDimitry Andric  defvar OpPredicate = op.ParserMatchClass.PredicateMethod;
1535f757f3fSDimitry Andric  let PredicateMethod =
1545f757f3fSDimitry Andric    "getPredicate([](const AMDGPUOperand &Op) -> bool { "#
1555f757f3fSDimitry Andric    "return Op."#OpPredicate#"() && "#valuePredicate#"; })";
1565f757f3fSDimitry Andric  let ParserMethod = op.ParserMatchClass.ParserMethod;
1575f757f3fSDimitry Andric  let DefaultValue = op.DefaultValue;
1585f757f3fSDimitry Andric  let DefaultMethod = op.DefaultMethod;
1595f757f3fSDimitry Andric  let PrintMethod = op.PrintMethod;
1605f757f3fSDimitry Andric}
1615f757f3fSDimitry Andric
1620b57cec5SDimitry Andric//===--------------------------------------------------------------------===//
1630b57cec5SDimitry Andric// Custom Operands
1640b57cec5SDimitry Andric//===--------------------------------------------------------------------===//
1650b57cec5SDimitry Andricdef brtarget   : Operand<OtherVT>;
1660b57cec5SDimitry Andric
1670b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
1680b57cec5SDimitry Andric// Misc. PatFrags
1690b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
1700b57cec5SDimitry Andric
1710b57cec5SDimitry Andricclass HasOneUseUnaryOp<SDPatternOperator op> : PatFrag<
1720b57cec5SDimitry Andric  (ops node:$src0),
173*0fca6ea1SDimitry Andric  (op $src0)> {
174*0fca6ea1SDimitry Andric  let HasOneUse = 1;
175480093f4SDimitry Andric}
1760b57cec5SDimitry Andric
1770b57cec5SDimitry Andricclass HasOneUseBinOp<SDPatternOperator op> : PatFrag<
1780b57cec5SDimitry Andric  (ops node:$src0, node:$src1),
179*0fca6ea1SDimitry Andric  (op $src0, $src1)> {
180*0fca6ea1SDimitry Andric  let HasOneUse = 1;
181480093f4SDimitry Andric}
1820b57cec5SDimitry Andric
1830b57cec5SDimitry Andricclass HasOneUseTernaryOp<SDPatternOperator op> : PatFrag<
1840b57cec5SDimitry Andric  (ops node:$src0, node:$src1, node:$src2),
185*0fca6ea1SDimitry Andric  (op $src0, $src1, $src2)> {
186*0fca6ea1SDimitry Andric  let HasOneUse = 1;
187*0fca6ea1SDimitry Andric}
188*0fca6ea1SDimitry Andric
189*0fca6ea1SDimitry Andricclass is_canonicalized_1<SDPatternOperator op> : PatFrag<
190*0fca6ea1SDimitry Andric  (ops node:$src0),
191*0fca6ea1SDimitry Andric  (op $src0),
192*0fca6ea1SDimitry Andric  [{
193*0fca6ea1SDimitry Andric    const SITargetLowering &Lowering =
194*0fca6ea1SDimitry Andric              *static_cast<const SITargetLowering *>(getTargetLowering());
195*0fca6ea1SDimitry Andric
196*0fca6ea1SDimitry Andric    return Lowering.isCanonicalized(*CurDAG, N->getOperand(0));
197*0fca6ea1SDimitry Andric   }]> {
198*0fca6ea1SDimitry Andric
199480093f4SDimitry Andric  let GISelPredicateCode = [{
200*0fca6ea1SDimitry Andric    const SITargetLowering *TLI = static_cast<const SITargetLowering *>(
201*0fca6ea1SDimitry Andric      MF.getSubtarget().getTargetLowering());
202*0fca6ea1SDimitry Andric
203*0fca6ea1SDimitry Andric    return TLI->isCanonicalized(MI.getOperand(1).getReg(), MF);
204480093f4SDimitry Andric  }];
205480093f4SDimitry Andric}
2060b57cec5SDimitry Andric
207*0fca6ea1SDimitry Andricclass is_canonicalized_2<SDPatternOperator op> : PatFrag<
208fe6060f1SDimitry Andric  (ops node:$src0, node:$src1),
209fe6060f1SDimitry Andric  (op $src0, $src1),
210fe6060f1SDimitry Andric  [{
211fe6060f1SDimitry Andric    const SITargetLowering &Lowering =
212fe6060f1SDimitry Andric              *static_cast<const SITargetLowering *>(getTargetLowering());
213fe6060f1SDimitry Andric
214fe6060f1SDimitry Andric    return Lowering.isCanonicalized(*CurDAG, N->getOperand(0)) &&
215fe6060f1SDimitry Andric      Lowering.isCanonicalized(*CurDAG, N->getOperand(1));
216fe6060f1SDimitry Andric   }]> {
217fe6060f1SDimitry Andric
218fe6060f1SDimitry Andric  // TODO: Improve the Legalizer for g_build_vector in Global Isel to match this class
219fe6060f1SDimitry Andric  let GISelPredicateCode = [{
220fe6060f1SDimitry Andric    const SITargetLowering *TLI = static_cast<const SITargetLowering *>(
221fe6060f1SDimitry Andric      MF.getSubtarget().getTargetLowering());
222fe6060f1SDimitry Andric
223*0fca6ea1SDimitry Andric    return TLI->isCanonicalized(MI.getOperand(1).getReg(), MF) &&
224*0fca6ea1SDimitry Andric      TLI->isCanonicalized(MI.getOperand(2).getReg(), MF);
225fe6060f1SDimitry Andric  }];
226fe6060f1SDimitry Andric}
227fe6060f1SDimitry Andric
22806c3fb27SDimitry Andricclass FoldTernaryOpPat<SDPatternOperator op1, SDPatternOperator op2> : PatFrag<
22906c3fb27SDimitry Andric  (ops node:$src0, node:$src1, node:$src2),
23006c3fb27SDimitry Andric  (op2 (op1 node:$src0, node:$src1), node:$src2)
23106c3fb27SDimitry Andric>;
23206c3fb27SDimitry Andric
23306c3fb27SDimitry Andricdef imad : FoldTernaryOpPat<mul, add>;
234fe6060f1SDimitry Andric
2350b57cec5SDimitry Andriclet Properties = [SDNPCommutative, SDNPAssociative] in {
2360b57cec5SDimitry Andricdef smax_oneuse : HasOneUseBinOp<smax>;
2370b57cec5SDimitry Andricdef smin_oneuse : HasOneUseBinOp<smin>;
2380b57cec5SDimitry Andricdef umax_oneuse : HasOneUseBinOp<umax>;
2390b57cec5SDimitry Andricdef umin_oneuse : HasOneUseBinOp<umin>;
2400b57cec5SDimitry Andric
2410b57cec5SDimitry Andricdef fminnum_oneuse : HasOneUseBinOp<fminnum>;
2420b57cec5SDimitry Andricdef fmaxnum_oneuse : HasOneUseBinOp<fmaxnum>;
2435f757f3fSDimitry Andricdef fminimum_oneuse : HasOneUseBinOp<fminimum>;
2445f757f3fSDimitry Andricdef fmaximum_oneuse : HasOneUseBinOp<fmaximum>;
2450b57cec5SDimitry Andric
2460b57cec5SDimitry Andricdef fminnum_ieee_oneuse : HasOneUseBinOp<fminnum_ieee>;
2470b57cec5SDimitry Andricdef fmaxnum_ieee_oneuse : HasOneUseBinOp<fmaxnum_ieee>;
2480b57cec5SDimitry Andric
2490b57cec5SDimitry Andric
2500b57cec5SDimitry Andricdef and_oneuse : HasOneUseBinOp<and>;
2510b57cec5SDimitry Andricdef or_oneuse : HasOneUseBinOp<or>;
2520b57cec5SDimitry Andricdef xor_oneuse : HasOneUseBinOp<xor>;
2530b57cec5SDimitry Andric} // Properties = [SDNPCommutative, SDNPAssociative]
2540b57cec5SDimitry Andric
2550b57cec5SDimitry Andricdef not_oneuse : HasOneUseUnaryOp<not>;
2560b57cec5SDimitry Andric
2570b57cec5SDimitry Andricdef add_oneuse : HasOneUseBinOp<add>;
2580b57cec5SDimitry Andricdef sub_oneuse : HasOneUseBinOp<sub>;
2590b57cec5SDimitry Andric
2600b57cec5SDimitry Andricdef srl_oneuse : HasOneUseBinOp<srl>;
2610b57cec5SDimitry Andricdef shl_oneuse : HasOneUseBinOp<shl>;
2620b57cec5SDimitry Andric
2630b57cec5SDimitry Andricdef select_oneuse : HasOneUseTernaryOp<select>;
2640b57cec5SDimitry Andric
2650b57cec5SDimitry Andricdef AMDGPUmul_u24_oneuse : HasOneUseBinOp<AMDGPUmul_u24>;
2660b57cec5SDimitry Andricdef AMDGPUmul_i24_oneuse : HasOneUseBinOp<AMDGPUmul_i24>;
2670b57cec5SDimitry Andric
268349cc55cSDimitry Andric//===----------------------------------------------------------------------===//
269349cc55cSDimitry Andric// PatFrags for shifts
270349cc55cSDimitry Andric//===----------------------------------------------------------------------===//
271349cc55cSDimitry Andric
272349cc55cSDimitry Andric// Constrained shift PatFrags.
2734824e7fdSDimitry Andric
2744824e7fdSDimitry Andricdef csh_mask_16 : PatFrag<(ops node:$src0), (and node:$src0, imm),
2754824e7fdSDimitry Andric  [{ return isUnneededShiftMask(N, 4); }]> {
2764824e7fdSDimitry Andric    let GISelPredicateCode = [{ return isUnneededShiftMask(MI, 4); }];
2774824e7fdSDimitry Andric  }
2784824e7fdSDimitry Andric
2794824e7fdSDimitry Andricdef csh_mask_32 : PatFrag<(ops node:$src0), (and node:$src0, imm),
2804824e7fdSDimitry Andric  [{ return isUnneededShiftMask(N, 5); }]> {
2814824e7fdSDimitry Andric    let GISelPredicateCode = [{ return isUnneededShiftMask(MI, 5); }];
2824824e7fdSDimitry Andric  }
2834824e7fdSDimitry Andric
2844824e7fdSDimitry Andricdef csh_mask_64 : PatFrag<(ops node:$src0), (and node:$src0, imm),
2854824e7fdSDimitry Andric  [{ return isUnneededShiftMask(N, 6); }]> {
2864824e7fdSDimitry Andric    let GISelPredicateCode = [{ return isUnneededShiftMask(MI, 6); }];
2874824e7fdSDimitry Andric  }
2884824e7fdSDimitry Andric
289349cc55cSDimitry Andricforeach width = [16, 32, 64] in {
2904824e7fdSDimitry Andricdefvar csh_mask = !cast<SDPatternOperator>("csh_mask_"#width);
291349cc55cSDimitry Andric
292349cc55cSDimitry Andricdef cshl_#width : PatFrags<(ops node:$src0, node:$src1),
2934824e7fdSDimitry Andric  [(shl node:$src0, node:$src1), (shl node:$src0, (csh_mask node:$src1))]>;
294349cc55cSDimitry Andricdefvar cshl = !cast<SDPatternOperator>("cshl_"#width);
295349cc55cSDimitry Andricdef cshl_#width#_oneuse : HasOneUseBinOp<cshl>;
296349cc55cSDimitry Andricdef clshl_rev_#width : PatFrag <(ops node:$src0, node:$src1),
297349cc55cSDimitry Andric  (cshl $src1, $src0)>;
298349cc55cSDimitry Andric
299349cc55cSDimitry Andricdef csrl_#width : PatFrags<(ops node:$src0, node:$src1),
3004824e7fdSDimitry Andric  [(srl node:$src0, node:$src1), (srl node:$src0, (csh_mask node:$src1))]>;
301349cc55cSDimitry Andricdefvar csrl = !cast<SDPatternOperator>("csrl_"#width);
302349cc55cSDimitry Andricdef csrl_#width#_oneuse : HasOneUseBinOp<csrl>;
303349cc55cSDimitry Andricdef clshr_rev_#width : PatFrag <(ops node:$src0, node:$src1),
304349cc55cSDimitry Andric  (csrl $src1, $src0)>;
305349cc55cSDimitry Andric
306349cc55cSDimitry Andricdef csra_#width : PatFrags<(ops node:$src0, node:$src1),
3074824e7fdSDimitry Andric  [(sra node:$src0, node:$src1), (sra node:$src0, (csh_mask node:$src1))]>;
308349cc55cSDimitry Andricdefvar csra = !cast<SDPatternOperator>("csra_"#width);
309349cc55cSDimitry Andricdef csra_#width#_oneuse : HasOneUseBinOp<csra>;
310349cc55cSDimitry Andricdef cashr_rev_#width : PatFrag <(ops node:$src0, node:$src1),
311349cc55cSDimitry Andric  (csra $src1, $src0)>;
312349cc55cSDimitry Andric} // end foreach width
313349cc55cSDimitry Andric
3140b57cec5SDimitry Andricdef srl_16 : PatFrag<
3150b57cec5SDimitry Andric  (ops node:$src0), (srl_oneuse node:$src0, (i32 16))
3160b57cec5SDimitry Andric>;
3170b57cec5SDimitry Andric
3180b57cec5SDimitry Andric
3190b57cec5SDimitry Andricdef hi_i16_elt : PatFrag<
3200b57cec5SDimitry Andric  (ops node:$src0), (i16 (trunc (i32 (srl_16 node:$src0))))
3210b57cec5SDimitry Andric>;
3220b57cec5SDimitry Andric
3230b57cec5SDimitry Andric
3240b57cec5SDimitry Andricdef hi_f16_elt : PatLeaf<
3250b57cec5SDimitry Andric  (vt), [{
3260b57cec5SDimitry Andric  if (N->getOpcode() != ISD::BITCAST)
3270b57cec5SDimitry Andric    return false;
3280b57cec5SDimitry Andric  SDValue Tmp = N->getOperand(0);
3290b57cec5SDimitry Andric
3300b57cec5SDimitry Andric  if (Tmp.getOpcode() != ISD::SRL)
3310b57cec5SDimitry Andric    return false;
3320b57cec5SDimitry Andric    if (const auto *RHS = dyn_cast<ConstantSDNode>(Tmp.getOperand(1))
3330b57cec5SDimitry Andric      return RHS->getZExtValue() == 16;
3340b57cec5SDimitry Andric    return false;
3350b57cec5SDimitry Andric}]>;
3360b57cec5SDimitry Andric
3370b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
338bdd1243dSDimitry Andric// PatLeafs for zero immediate
339bdd1243dSDimitry Andric//===----------------------------------------------------------------------===//
340bdd1243dSDimitry Andric
341bdd1243dSDimitry Andricdef immzero : PatLeaf<(imm), [{ return N->isZero(); }]>;
342bdd1243dSDimitry Andricdef fpimmzero : PatLeaf<(fpimm), [{ return N->isZero(); }]>;
343bdd1243dSDimitry Andric
344bdd1243dSDimitry Andric//===----------------------------------------------------------------------===//
3450b57cec5SDimitry Andric// PatLeafs for floating-point comparisons
3460b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
3470b57cec5SDimitry Andric
3488bcb0991SDimitry Andricdef COND_OEQ : PatFrags<(ops), [(OtherVT SETOEQ), (OtherVT SETEQ)]>;
3498bcb0991SDimitry Andricdef COND_ONE : PatFrags<(ops), [(OtherVT SETONE), (OtherVT SETNE)]>;
3508bcb0991SDimitry Andricdef COND_OGT : PatFrags<(ops), [(OtherVT SETOGT), (OtherVT SETGT)]>;
3518bcb0991SDimitry Andricdef COND_OGE : PatFrags<(ops), [(OtherVT SETOGE), (OtherVT SETGE)]>;
3528bcb0991SDimitry Andricdef COND_OLT : PatFrags<(ops), [(OtherVT SETOLT), (OtherVT SETLT)]>;
3538bcb0991SDimitry Andricdef COND_OLE : PatFrags<(ops), [(OtherVT SETOLE), (OtherVT SETLE)]>;
3548bcb0991SDimitry Andricdef COND_O   : PatFrags<(ops), [(OtherVT SETO)]>;
3558bcb0991SDimitry Andricdef COND_UO  : PatFrags<(ops), [(OtherVT SETUO)]>;
3560b57cec5SDimitry Andric
3570b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
3580b57cec5SDimitry Andric// PatLeafs for unsigned / unordered comparisons
3590b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
3600b57cec5SDimitry Andric
3618bcb0991SDimitry Andricdef COND_UEQ : PatFrag<(ops), (OtherVT SETUEQ)>;
3628bcb0991SDimitry Andricdef COND_UNE : PatFrag<(ops), (OtherVT SETUNE)>;
3638bcb0991SDimitry Andricdef COND_UGT : PatFrag<(ops), (OtherVT SETUGT)>;
3648bcb0991SDimitry Andricdef COND_UGE : PatFrag<(ops), (OtherVT SETUGE)>;
3658bcb0991SDimitry Andricdef COND_ULT : PatFrag<(ops), (OtherVT SETULT)>;
3668bcb0991SDimitry Andricdef COND_ULE : PatFrag<(ops), (OtherVT SETULE)>;
3670b57cec5SDimitry Andric
3680b57cec5SDimitry Andric// XXX - For some reason R600 version is preferring to use unordered
3690b57cec5SDimitry Andric// for setne?
3708bcb0991SDimitry Andricdef COND_UNE_NE  : PatFrags<(ops), [(OtherVT SETUNE), (OtherVT SETNE)]>;
3710b57cec5SDimitry Andric
3720b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
3730b57cec5SDimitry Andric// PatLeafs for signed comparisons
3740b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
3750b57cec5SDimitry Andric
3768bcb0991SDimitry Andricdef COND_SGT : PatFrag<(ops), (OtherVT SETGT)>;
3778bcb0991SDimitry Andricdef COND_SGE : PatFrag<(ops), (OtherVT SETGE)>;
3788bcb0991SDimitry Andricdef COND_SLT : PatFrag<(ops), (OtherVT SETLT)>;
3798bcb0991SDimitry Andricdef COND_SLE : PatFrag<(ops), (OtherVT SETLE)>;
3800b57cec5SDimitry Andric
3810b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
3820b57cec5SDimitry Andric// PatLeafs for integer equality
3830b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
3840b57cec5SDimitry Andric
3858bcb0991SDimitry Andricdef COND_EQ : PatFrags<(ops), [(OtherVT SETEQ), (OtherVT SETUEQ)]>;
3868bcb0991SDimitry Andricdef COND_NE : PatFrags<(ops), [(OtherVT SETNE), (OtherVT SETUNE)]>;
3870b57cec5SDimitry Andric
3888bcb0991SDimitry Andric// FIXME: Should not need code predicate
3898bcb0991SDimitry Andric//def COND_NULL : PatLeaf<(OtherVT null_frag)>;
3900b57cec5SDimitry Andricdef COND_NULL : PatLeaf <
3910b57cec5SDimitry Andric  (cond),
3920b57cec5SDimitry Andric  [{(void)N; return false;}]
3930b57cec5SDimitry Andric>;
3940b57cec5SDimitry Andric
3950b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
3960b57cec5SDimitry Andric// PatLeafs for Texture Constants
3970b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
3980b57cec5SDimitry Andric
3990b57cec5SDimitry Andricdef TEX_ARRAY : PatLeaf<
4000b57cec5SDimitry Andric  (imm),
4010b57cec5SDimitry Andric  [{uint32_t TType = (uint32_t)N->getZExtValue();
4020b57cec5SDimitry Andric    return TType == 9 || TType == 10 || TType == 16;
4030b57cec5SDimitry Andric  }]
4040b57cec5SDimitry Andric>;
4050b57cec5SDimitry Andric
4060b57cec5SDimitry Andricdef TEX_RECT : PatLeaf<
4070b57cec5SDimitry Andric  (imm),
4080b57cec5SDimitry Andric  [{uint32_t TType = (uint32_t)N->getZExtValue();
4090b57cec5SDimitry Andric    return TType == 5;
4100b57cec5SDimitry Andric  }]
4110b57cec5SDimitry Andric>;
4120b57cec5SDimitry Andric
4130b57cec5SDimitry Andricdef TEX_SHADOW : PatLeaf<
4140b57cec5SDimitry Andric  (imm),
4150b57cec5SDimitry Andric  [{uint32_t TType = (uint32_t)N->getZExtValue();
4160b57cec5SDimitry Andric    return (TType >= 6 && TType <= 8) || TType == 13;
4170b57cec5SDimitry Andric  }]
4180b57cec5SDimitry Andric>;
4190b57cec5SDimitry Andric
4200b57cec5SDimitry Andricdef TEX_SHADOW_ARRAY : PatLeaf<
4210b57cec5SDimitry Andric  (imm),
4220b57cec5SDimitry Andric  [{uint32_t TType = (uint32_t)N->getZExtValue();
4230b57cec5SDimitry Andric    return TType == 11 || TType == 12 || TType == 17;
4240b57cec5SDimitry Andric  }]
4250b57cec5SDimitry Andric>;
4260b57cec5SDimitry Andric
4270b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
4280b57cec5SDimitry Andric// Load/Store Pattern Fragments
4290b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
4300b57cec5SDimitry Andric
4318bcb0991SDimitry Andricdef atomic_cmp_swap_glue : SDNode <"ISD::ATOMIC_CMP_SWAP", SDTAtomic3,
4328bcb0991SDimitry Andric  [SDNPHasChain, SDNPMayStore, SDNPMayLoad, SDNPMemOperand, SDNPInGlue]
4338bcb0991SDimitry Andric>;
4348bcb0991SDimitry Andric
4350b57cec5SDimitry Andricclass AddressSpaceList<list<int> AS> {
4360b57cec5SDimitry Andric  list<int> AddrSpaces = AS;
4370b57cec5SDimitry Andric}
4380b57cec5SDimitry Andric
4398bcb0991SDimitry Andricclass Aligned<int Bytes> {
4408bcb0991SDimitry Andric  int MinAlignment = Bytes;
4418bcb0991SDimitry Andric}
4420b57cec5SDimitry Andric
44304eeddc0SDimitry Andricclass StoreHi16<SDPatternOperator op, ValueType vt> : PatFrag <
444480093f4SDimitry Andric  (ops node:$value, node:$ptr), (op (srl node:$value, (i32 16)), node:$ptr)> {
445480093f4SDimitry Andric  let IsStore = 1;
44604eeddc0SDimitry Andric  let MemoryVT = vt;
447480093f4SDimitry Andric}
4480b57cec5SDimitry Andric
44904eeddc0SDimitry Andricdef LoadAddress_constant : AddressSpaceList<[ AddrSpaces.Constant,
45004eeddc0SDimitry Andric                                              AddrSpaces.Constant32Bit ]>;
45104eeddc0SDimitry Andricdef LoadAddress_global : AddressSpaceList<[ AddrSpaces.Global,
45204eeddc0SDimitry Andric                                            AddrSpaces.Constant,
45304eeddc0SDimitry Andric                                            AddrSpaces.Constant32Bit ]>;
4540b57cec5SDimitry Andricdef StoreAddress_global : AddressSpaceList<[ AddrSpaces.Global ]>;
4550b57cec5SDimitry Andric
4560b57cec5SDimitry Andricdef LoadAddress_flat : AddressSpaceList<[ AddrSpaces.Flat,
4570b57cec5SDimitry Andric                                          AddrSpaces.Global,
45804eeddc0SDimitry Andric                                          AddrSpaces.Constant,
45904eeddc0SDimitry Andric                                          AddrSpaces.Constant32Bit ]>;
4600b57cec5SDimitry Andricdef StoreAddress_flat : AddressSpaceList<[ AddrSpaces.Flat, AddrSpaces.Global ]>;
4610b57cec5SDimitry Andric
4620b57cec5SDimitry Andricdef LoadAddress_private : AddressSpaceList<[ AddrSpaces.Private ]>;
4630b57cec5SDimitry Andricdef StoreAddress_private : AddressSpaceList<[ AddrSpaces.Private ]>;
4640b57cec5SDimitry Andric
4650b57cec5SDimitry Andricdef LoadAddress_local : AddressSpaceList<[ AddrSpaces.Local ]>;
4660b57cec5SDimitry Andricdef StoreAddress_local : AddressSpaceList<[ AddrSpaces.Local ]>;
4670b57cec5SDimitry Andric
4680b57cec5SDimitry Andricdef LoadAddress_region : AddressSpaceList<[ AddrSpaces.Region ]>;
4690b57cec5SDimitry Andricdef StoreAddress_region : AddressSpaceList<[ AddrSpaces.Region ]>;
4700b57cec5SDimitry Andric
4710b57cec5SDimitry Andric
4720b57cec5SDimitry Andric
4730b57cec5SDimitry Andricforeach as = [ "global", "flat", "constant", "local", "private", "region" ] in {
4740b57cec5SDimitry Andriclet AddressSpaces = !cast<AddressSpaceList>("LoadAddress_"#as).AddrSpaces in {
4750b57cec5SDimitry Andric
4760b57cec5SDimitry Andricdef load_#as : PatFrag<(ops node:$ptr), (unindexedload node:$ptr)> {
4770b57cec5SDimitry Andric  let IsLoad = 1;
4780b57cec5SDimitry Andric  let IsNonExtLoad = 1;
4790b57cec5SDimitry Andric}
4800b57cec5SDimitry Andric
48181ad6265SDimitry Andricdef extloadi8_#as  : PatFrag<(ops node:$ptr), (extloadi8 node:$ptr)> {
4820b57cec5SDimitry Andric  let IsLoad = 1;
4830b57cec5SDimitry Andric}
4840b57cec5SDimitry Andric
48581ad6265SDimitry Andricdef extloadi16_#as : PatFrag<(ops node:$ptr), (extloadi16 node:$ptr)> {
4860b57cec5SDimitry Andric  let IsLoad = 1;
4870b57cec5SDimitry Andric}
4880b57cec5SDimitry Andric
48981ad6265SDimitry Andricdef sextloadi8_#as  : PatFrag<(ops node:$ptr), (sextloadi8 node:$ptr)> {
4900b57cec5SDimitry Andric  let IsLoad = 1;
4910b57cec5SDimitry Andric}
4920b57cec5SDimitry Andric
49381ad6265SDimitry Andricdef sextloadi16_#as : PatFrag<(ops node:$ptr), (sextloadi16 node:$ptr)> {
4940b57cec5SDimitry Andric  let IsLoad = 1;
4950b57cec5SDimitry Andric}
4960b57cec5SDimitry Andric
49781ad6265SDimitry Andricdef zextloadi8_#as  : PatFrag<(ops node:$ptr), (zextloadi8 node:$ptr)> {
4980b57cec5SDimitry Andric  let IsLoad = 1;
4990b57cec5SDimitry Andric}
5000b57cec5SDimitry Andric
50181ad6265SDimitry Andricdef zextloadi16_#as : PatFrag<(ops node:$ptr), (zextloadi16 node:$ptr)> {
5020b57cec5SDimitry Andric  let IsLoad = 1;
5030b57cec5SDimitry Andric}
5040b57cec5SDimitry Andric
505349cc55cSDimitry Andricdef atomic_load_8_#as : PatFrag<(ops node:$ptr), (atomic_load_8 node:$ptr)> {
506349cc55cSDimitry Andric  let IsAtomic = 1;
507349cc55cSDimitry Andric  let MemoryVT = i8;
508349cc55cSDimitry Andric}
509349cc55cSDimitry Andric
510349cc55cSDimitry Andricdef atomic_load_16_#as : PatFrag<(ops node:$ptr), (atomic_load_16 node:$ptr)> {
511349cc55cSDimitry Andric  let IsAtomic = 1;
512349cc55cSDimitry Andric  let MemoryVT = i16;
513349cc55cSDimitry Andric}
514349cc55cSDimitry Andric
5150b57cec5SDimitry Andricdef atomic_load_32_#as : PatFrag<(ops node:$ptr), (atomic_load_32 node:$ptr)> {
5160b57cec5SDimitry Andric  let IsAtomic = 1;
5170b57cec5SDimitry Andric  let MemoryVT = i32;
5180b57cec5SDimitry Andric}
5190b57cec5SDimitry Andric
5200b57cec5SDimitry Andricdef atomic_load_64_#as : PatFrag<(ops node:$ptr), (atomic_load_64 node:$ptr)> {
5210b57cec5SDimitry Andric  let IsAtomic = 1;
5220b57cec5SDimitry Andric  let MemoryVT = i64;
5230b57cec5SDimitry Andric}
5245ffd83dbSDimitry Andric} // End let AddressSpaces
5255ffd83dbSDimitry Andric} // End foreach as
5260b57cec5SDimitry Andric
5275ffd83dbSDimitry Andric
5285ffd83dbSDimitry Andricforeach as = [ "global", "flat", "local", "private", "region" ] in {
52981ad6265SDimitry Andriclet IsStore = 1, AddressSpaces = !cast<AddressSpaceList>("StoreAddress_"#as).AddrSpaces in {
5300b57cec5SDimitry Andricdef store_#as : PatFrag<(ops node:$val, node:$ptr),
5310b57cec5SDimitry Andric                    (unindexedstore node:$val, node:$ptr)> {
5320b57cec5SDimitry Andric  let IsTruncStore = 0;
5330b57cec5SDimitry Andric}
5340b57cec5SDimitry Andric
5350b57cec5SDimitry Andric// truncstore fragments.
5360b57cec5SDimitry Andricdef truncstore_#as : PatFrag<(ops node:$val, node:$ptr),
5370b57cec5SDimitry Andric                             (unindexedstore node:$val, node:$ptr)> {
5380b57cec5SDimitry Andric  let IsTruncStore = 1;
5390b57cec5SDimitry Andric}
5400b57cec5SDimitry Andric
5410b57cec5SDimitry Andric// TODO: We don't really need the truncstore here. We can use
5420b57cec5SDimitry Andric// unindexedstore with MemoryVT directly, which will save an
5430b57cec5SDimitry Andric// unnecessary check that the memory size is less than the value type
5440b57cec5SDimitry Andric// in the generated matcher table.
5450b57cec5SDimitry Andricdef truncstorei8_#as : PatFrag<(ops node:$val, node:$ptr),
54681ad6265SDimitry Andric                               (truncstorei8 node:$val, node:$ptr)>;
5470b57cec5SDimitry Andricdef truncstorei16_#as : PatFrag<(ops node:$val, node:$ptr),
54881ad6265SDimitry Andric                                (truncstorei16 node:$val, node:$ptr)>;
5490b57cec5SDimitry Andric
55004eeddc0SDimitry Andricdef store_hi16_#as : StoreHi16 <truncstorei16, i16>;
55104eeddc0SDimitry Andricdef truncstorei8_hi16_#as : StoreHi16<truncstorei8, i8>;
55204eeddc0SDimitry Andricdef truncstorei16_hi16_#as : StoreHi16<truncstorei16, i16>;
55381ad6265SDimitry Andric} // End let IsStore = 1, AddressSpaces = ...
5540b57cec5SDimitry Andric
55581ad6265SDimitry Andriclet IsAtomic = 1, AddressSpaces = !cast<AddressSpaceList>("StoreAddress_"#as).AddrSpaces in {
5565f757f3fSDimitry Andricdef atomic_store_8_#as : PatFrag<(ops node:$val, node:$ptr),
5575f757f3fSDimitry Andric                                 (atomic_store_8 node:$val, node:$ptr)>;
5585f757f3fSDimitry Andricdef atomic_store_16_#as : PatFrag<(ops node:$val, node:$ptr),
5595f757f3fSDimitry Andric                                  (atomic_store_16 node:$val, node:$ptr)>;
5605f757f3fSDimitry Andricdef atomic_store_32_#as : PatFrag<(ops node:$val, node:$ptr),
5615f757f3fSDimitry Andric                                  (atomic_store_32 node:$val, node:$ptr)>;
5625f757f3fSDimitry Andricdef atomic_store_64_#as : PatFrag<(ops node:$val, node:$ptr),
5635f757f3fSDimitry Andric                                  (atomic_store_64 node:$val, node:$ptr)>;
5645f757f3fSDimitry Andric} // End let IsAtomic = 1, AddressSpaces = ...
5655ffd83dbSDimitry Andric} // End foreach as
5660b57cec5SDimitry Andric
567753f127fSDimitry Andricmulticlass noret_op {
568753f127fSDimitry Andric  let HasNoUse = true in
56981ad6265SDimitry Andric  def "_noret" : PatFrag<(ops node:$ptr, node:$data),
57081ad6265SDimitry Andric    (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>;
57181ad6265SDimitry Andric}
57281ad6265SDimitry Andric
573bdd1243dSDimitry Andricmulticlass global_addr_space_atomic_op {
574bdd1243dSDimitry Andric  def "_noret_global_addrspace" :
575bdd1243dSDimitry Andric    PatFrag<(ops node:$ptr, node:$data),
576bdd1243dSDimitry Andric            (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{
577bdd1243dSDimitry Andric      let HasNoUse = true;
578bdd1243dSDimitry Andric      let AddressSpaces = LoadAddress_global.AddrSpaces;
579bdd1243dSDimitry Andric      let IsAtomic = 1;
580bdd1243dSDimitry Andric    }
581bdd1243dSDimitry Andric    def "_global_addrspace" :
582bdd1243dSDimitry Andric    PatFrag<(ops node:$ptr, node:$data),
583bdd1243dSDimitry Andric            (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{
584bdd1243dSDimitry Andric      let AddressSpaces = LoadAddress_global.AddrSpaces;
585bdd1243dSDimitry Andric      let IsAtomic = 1;
586bdd1243dSDimitry Andric    }
587bdd1243dSDimitry Andric}
588bdd1243dSDimitry Andric
589bdd1243dSDimitry Andricmulticlass flat_addr_space_atomic_op {
590bdd1243dSDimitry Andric  def "_noret_flat_addrspace" :
591bdd1243dSDimitry Andric    PatFrag<(ops node:$ptr, node:$data),
592bdd1243dSDimitry Andric            (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{
593bdd1243dSDimitry Andric      let HasNoUse = true;
594bdd1243dSDimitry Andric      let AddressSpaces = LoadAddress_flat.AddrSpaces;
595bdd1243dSDimitry Andric      let IsAtomic = 1;
596bdd1243dSDimitry Andric    }
597bdd1243dSDimitry Andric    def "_flat_addrspace" :
598bdd1243dSDimitry Andric    PatFrag<(ops node:$ptr, node:$data),
599bdd1243dSDimitry Andric            (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{
600bdd1243dSDimitry Andric      let AddressSpaces = LoadAddress_flat.AddrSpaces;
601bdd1243dSDimitry Andric      let IsAtomic = 1;
602bdd1243dSDimitry Andric    }
603bdd1243dSDimitry Andric}
604bdd1243dSDimitry Andric
605bdd1243dSDimitry Andricmulticlass local_addr_space_atomic_op {
606bdd1243dSDimitry Andric  def "_noret_local_addrspace" :
607bdd1243dSDimitry Andric    PatFrag<(ops node:$ptr, node:$data),
608bdd1243dSDimitry Andric            (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{
609bdd1243dSDimitry Andric      let HasNoUse = true;
610bdd1243dSDimitry Andric      let AddressSpaces = LoadAddress_local.AddrSpaces;
611bdd1243dSDimitry Andric      let IsAtomic = 1;
612bdd1243dSDimitry Andric    }
613bdd1243dSDimitry Andric    def "_local_addrspace" :
614bdd1243dSDimitry Andric    PatFrag<(ops node:$ptr, node:$data),
615bdd1243dSDimitry Andric            (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{
616bdd1243dSDimitry Andric      let AddressSpaces = LoadAddress_local.AddrSpaces;
617bdd1243dSDimitry Andric      let IsAtomic = 1;
618bdd1243dSDimitry Andric    }
619bdd1243dSDimitry Andric}
620bdd1243dSDimitry Andric
621*0fca6ea1SDimitry Andricdefm int_amdgcn_flat_atomic_fadd : noret_op;
622bdd1243dSDimitry Andricdefm int_amdgcn_flat_atomic_fadd : flat_addr_space_atomic_op;
623753f127fSDimitry Andricdefm int_amdgcn_flat_atomic_fadd_v2bf16 : noret_op;
624753f127fSDimitry Andricdefm int_amdgcn_flat_atomic_fmin : noret_op;
625753f127fSDimitry Andricdefm int_amdgcn_flat_atomic_fmax : noret_op;
626bdd1243dSDimitry Andricdefm int_amdgcn_global_atomic_fadd : global_addr_space_atomic_op;
627bdd1243dSDimitry Andricdefm int_amdgcn_flat_atomic_fadd : global_addr_space_atomic_op;
628753f127fSDimitry Andricdefm int_amdgcn_global_atomic_fadd_v2bf16 : noret_op;
629753f127fSDimitry Andricdefm int_amdgcn_global_atomic_fmin : noret_op;
630753f127fSDimitry Andricdefm int_amdgcn_global_atomic_fmax : noret_op;
6315f757f3fSDimitry Andricdefm int_amdgcn_global_atomic_csub : noret_op;
632bdd1243dSDimitry Andricdefm int_amdgcn_flat_atomic_fadd : local_addr_space_atomic_op;
633647cbc5dSDimitry Andricdefm int_amdgcn_global_atomic_ordered_add_b64 : noret_op;
6345f757f3fSDimitry Andricdefm int_amdgcn_flat_atomic_fmin_num : noret_op;
6355f757f3fSDimitry Andricdefm int_amdgcn_flat_atomic_fmax_num : noret_op;
6365f757f3fSDimitry Andricdefm int_amdgcn_global_atomic_fmin_num : noret_op;
6375f757f3fSDimitry Andricdefm int_amdgcn_global_atomic_fmax_num : noret_op;
6387a6dacacSDimitry Andricdefm int_amdgcn_atomic_cond_sub_u32 : local_addr_space_atomic_op;
6397a6dacacSDimitry Andricdefm int_amdgcn_atomic_cond_sub_u32 : flat_addr_space_atomic_op;
6407a6dacacSDimitry Andricdefm int_amdgcn_atomic_cond_sub_u32 : global_addr_space_atomic_op;
6410b57cec5SDimitry Andric
642*0fca6ea1SDimitry Andricmulticlass noret_binary_atomic_op<SDNode atomic_op> {
643753f127fSDimitry Andric  let HasNoUse = true in
644*0fca6ea1SDimitry Andric  defm "_noret" : binary_atomic_op<atomic_op>;
645*0fca6ea1SDimitry Andric}
646*0fca6ea1SDimitry Andric
647*0fca6ea1SDimitry Andricmulticlass noret_binary_atomic_op_fp<SDNode atomic_op> {
648*0fca6ea1SDimitry Andric  let HasNoUse = true in
649*0fca6ea1SDimitry Andric  defm "_noret" : binary_atomic_op_fp<atomic_op>;
65081ad6265SDimitry Andric}
65181ad6265SDimitry Andric
652753f127fSDimitry Andricmulticlass noret_ternary_atomic_op<SDNode atomic_op> {
653753f127fSDimitry Andric  let HasNoUse = true in
65481ad6265SDimitry Andric  defm "_noret" : ternary_atomic_op<atomic_op>;
65581ad6265SDimitry Andric}
65681ad6265SDimitry Andric
657*0fca6ea1SDimitry Andricdefvar atomic_addrspace_names = [ "global", "flat", "constant", "local", "private", "region" ];
658*0fca6ea1SDimitry Andric
659*0fca6ea1SDimitry Andricmulticlass binary_atomic_op_all_as<SDNode atomic_op> {
660*0fca6ea1SDimitry Andric  foreach as = atomic_addrspace_names in {
6618bcb0991SDimitry Andric    let AddressSpaces = !cast<AddressSpaceList>("LoadAddress_"#as).AddrSpaces in {
662*0fca6ea1SDimitry Andric      defm "_"#as : binary_atomic_op<atomic_op>;
663*0fca6ea1SDimitry Andric      defm "_"#as : noret_binary_atomic_op<atomic_op>;
664*0fca6ea1SDimitry Andric    }
665*0fca6ea1SDimitry Andric  }
666*0fca6ea1SDimitry Andric}
667*0fca6ea1SDimitry Andricmulticlass binary_atomic_op_fp_all_as<SDNode atomic_op> {
668*0fca6ea1SDimitry Andric  foreach as = atomic_addrspace_names in {
669*0fca6ea1SDimitry Andric    let AddressSpaces = !cast<AddressSpaceList>("LoadAddress_"#as).AddrSpaces in {
670*0fca6ea1SDimitry Andric      defm "_"#as : binary_atomic_op_fp<atomic_op>;
671*0fca6ea1SDimitry Andric      defm "_"#as : noret_binary_atomic_op_fp<atomic_op>;
6728bcb0991SDimitry Andric    }
6738bcb0991SDimitry Andric  }
6748bcb0991SDimitry Andric}
6758bcb0991SDimitry Andric
67681ad6265SDimitry Andricdefm atomic_swap : binary_atomic_op_all_as<atomic_swap>;
67781ad6265SDimitry Andricdefm atomic_load_add : binary_atomic_op_all_as<atomic_load_add>;
67881ad6265SDimitry Andricdefm atomic_load_and : binary_atomic_op_all_as<atomic_load_and>;
67981ad6265SDimitry Andricdefm atomic_load_max : binary_atomic_op_all_as<atomic_load_max>;
68081ad6265SDimitry Andricdefm atomic_load_min : binary_atomic_op_all_as<atomic_load_min>;
68181ad6265SDimitry Andricdefm atomic_load_or : binary_atomic_op_all_as<atomic_load_or>;
68281ad6265SDimitry Andricdefm atomic_load_sub : binary_atomic_op_all_as<atomic_load_sub>;
68381ad6265SDimitry Andricdefm atomic_load_umax : binary_atomic_op_all_as<atomic_load_umax>;
68481ad6265SDimitry Andricdefm atomic_load_umin : binary_atomic_op_all_as<atomic_load_umin>;
68581ad6265SDimitry Andricdefm atomic_load_xor : binary_atomic_op_all_as<atomic_load_xor>;
686*0fca6ea1SDimitry Andricdefm atomic_load_fadd : binary_atomic_op_fp_all_as<atomic_load_fadd>;
687*0fca6ea1SDimitry Andricdefm atomic_load_fmin : binary_atomic_op_fp_all_as<atomic_load_fmin>;
688*0fca6ea1SDimitry Andricdefm atomic_load_fmax : binary_atomic_op_fp_all_as<atomic_load_fmax>;
68906c3fb27SDimitry Andricdefm atomic_load_uinc_wrap : binary_atomic_op_all_as<atomic_load_uinc_wrap>;
69006c3fb27SDimitry Andricdefm atomic_load_udec_wrap : binary_atomic_op_all_as<atomic_load_udec_wrap>;
69181ad6265SDimitry Andricdefm AMDGPUatomic_cmp_swap : binary_atomic_op_all_as<AMDGPUatomic_cmp_swap>;
6920b57cec5SDimitry Andric
693e8d8bef9SDimitry Andricdef load_align8_local : PatFrag<(ops node:$ptr), (load_local node:$ptr)>,
694e8d8bef9SDimitry Andric                       Aligned<8> {
6958bcb0991SDimitry Andric  let IsLoad = 1;
6968bcb0991SDimitry Andric}
6970b57cec5SDimitry Andric
698e8d8bef9SDimitry Andricdef load_align16_local : PatFrag<(ops node:$ptr), (load_local node:$ptr)>,
699e8d8bef9SDimitry Andric                        Aligned<16> {
7008bcb0991SDimitry Andric  let IsLoad = 1;
7018bcb0991SDimitry Andric}
7020b57cec5SDimitry Andric
7038bcb0991SDimitry Andricdef store_align8_local: PatFrag<(ops node:$val, node:$ptr),
7048bcb0991SDimitry Andric                                (store_local node:$val, node:$ptr)>, Aligned<8> {
7058bcb0991SDimitry Andric  let IsStore = 1;
7068bcb0991SDimitry Andric}
7078bcb0991SDimitry Andric
7088bcb0991SDimitry Andricdef store_align16_local: PatFrag<(ops node:$val, node:$ptr),
7098bcb0991SDimitry Andric                                (store_local node:$val, node:$ptr)>, Aligned<16> {
7108bcb0991SDimitry Andric  let IsStore = 1;
7118bcb0991SDimitry Andric}
7128bcb0991SDimitry Andric
7138bcb0991SDimitry Andriclet AddressSpaces = StoreAddress_local.AddrSpaces in {
7148bcb0991SDimitry Andricdefm atomic_cmp_swap_local : ternary_atomic_op<atomic_cmp_swap>;
715753f127fSDimitry Andricdefm atomic_cmp_swap_local : noret_ternary_atomic_op<atomic_cmp_swap>;
716753f127fSDimitry Andricdefm atomic_cmp_swap_local_m0 : noret_ternary_atomic_op<atomic_cmp_swap_glue>;
717753f127fSDimitry Andricdefm atomic_cmp_swap_local_m0 : ternary_atomic_op<atomic_cmp_swap_glue>;
7188bcb0991SDimitry Andric}
7190b57cec5SDimitry Andric
7208bcb0991SDimitry Andriclet AddressSpaces = StoreAddress_region.AddrSpaces in {
721753f127fSDimitry Andricdefm atomic_cmp_swap_region : noret_ternary_atomic_op<atomic_cmp_swap>;
722753f127fSDimitry Andricdefm atomic_cmp_swap_region_m0 : noret_ternary_atomic_op<atomic_cmp_swap_glue>;
723753f127fSDimitry Andricdefm atomic_cmp_swap_region_m0 : ternary_atomic_op<atomic_cmp_swap_glue>;
7248bcb0991SDimitry Andric}
7250b57cec5SDimitry Andric
7260b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
7270b57cec5SDimitry Andric// Misc Pattern Fragments
7280b57cec5SDimitry Andric//===----------------------------------------------------------------------===//
7290b57cec5SDimitry Andric
7300b57cec5SDimitry Andricclass Constants {
7310b57cec5SDimitry Andricint TWO_PI = 0x40c90fdb;
7320b57cec5SDimitry Andricint PI = 0x40490fdb;
7330b57cec5SDimitry Andricint TWO_PI_INV = 0x3e22f983;
7345ffd83dbSDimitry Andricint FP_4294966784 = 0x4f7ffffe; // 4294966784 = 4294967296 - 512 = 2^32 - 2^9
7350b57cec5SDimitry Andricint FP16_ONE = 0x3C00;
7360b57cec5SDimitry Andricint FP16_NEG_ONE = 0xBC00;
7370b57cec5SDimitry Andricint FP32_ONE = 0x3f800000;
7380b57cec5SDimitry Andricint FP32_NEG_ONE = 0xbf800000;
7390b57cec5SDimitry Andricint FP64_ONE = 0x3ff0000000000000;
7400b57cec5SDimitry Andricint FP64_NEG_ONE = 0xbff0000000000000;
7410b57cec5SDimitry Andric}
7420b57cec5SDimitry Andricdef CONST : Constants;
7430b57cec5SDimitry Andric
7440b57cec5SDimitry Andricdef FP_ZERO : PatLeaf <
7450b57cec5SDimitry Andric  (fpimm),
7460b57cec5SDimitry Andric  [{return N->getValueAPF().isZero();}]
7470b57cec5SDimitry Andric>;
7480b57cec5SDimitry Andric
7490b57cec5SDimitry Andricdef FP_ONE : PatLeaf <
7500b57cec5SDimitry Andric  (fpimm),
7510b57cec5SDimitry Andric  [{return N->isExactlyValue(1.0);}]
7520b57cec5SDimitry Andric>;
7530b57cec5SDimitry Andric
7540b57cec5SDimitry Andricdef FP_HALF : PatLeaf <
7550b57cec5SDimitry Andric  (fpimm),
7560b57cec5SDimitry Andric  [{return N->isExactlyValue(0.5);}]
7570b57cec5SDimitry Andric>;
7580b57cec5SDimitry Andric
7590b57cec5SDimitry Andric/* Generic helper patterns for intrinsics */
7600b57cec5SDimitry Andric/* -------------------------------------- */
7610b57cec5SDimitry Andric
7620b57cec5SDimitry Andricclass POW_Common <AMDGPUInst log_ieee, AMDGPUInst exp_ieee, AMDGPUInst mul>
7630b57cec5SDimitry Andric  : AMDGPUPat <
7640b57cec5SDimitry Andric  (fpow f32:$src0, f32:$src1),
7650b57cec5SDimitry Andric  (exp_ieee (mul f32:$src1, (log_ieee f32:$src0)))
7660b57cec5SDimitry Andric>;
7670b57cec5SDimitry Andric
7680b57cec5SDimitry Andric/* Other helper patterns */
7690b57cec5SDimitry Andric/* --------------------- */
7700b57cec5SDimitry Andric
7710b57cec5SDimitry Andric/* Extract element pattern */
7720b57cec5SDimitry Andricclass Extract_Element <ValueType sub_type, ValueType vec_type, int sub_idx,
7730b57cec5SDimitry Andric                       SubRegIndex sub_reg>
7740b57cec5SDimitry Andric  : AMDGPUPat<
7750b57cec5SDimitry Andric  (sub_type (extractelt vec_type:$src, sub_idx)),
7760b57cec5SDimitry Andric  (EXTRACT_SUBREG $src, sub_reg)
7770b57cec5SDimitry Andric>;
7780b57cec5SDimitry Andric
7790b57cec5SDimitry Andric/* Insert element pattern */
7800b57cec5SDimitry Andricclass Insert_Element <ValueType elem_type, ValueType vec_type,
7810b57cec5SDimitry Andric                      int sub_idx, SubRegIndex sub_reg>
7820b57cec5SDimitry Andric  : AMDGPUPat <
7830b57cec5SDimitry Andric  (insertelt vec_type:$vec, elem_type:$elem, sub_idx),
7840b57cec5SDimitry Andric  (INSERT_SUBREG $vec, $elem, sub_reg)
7850b57cec5SDimitry Andric>;
7860b57cec5SDimitry Andric
7870b57cec5SDimitry Andric// XXX: Convert to new syntax and use COPY_TO_REG, once the DFAPacketizer
7880b57cec5SDimitry Andric// can handle COPY instructions.
7890b57cec5SDimitry Andric// bitconvert pattern
7900b57cec5SDimitry Andricclass BitConvert <ValueType dt, ValueType st, RegisterClass rc> : AMDGPUPat <
7910b57cec5SDimitry Andric  (dt (bitconvert (st rc:$src0))),
7920b57cec5SDimitry Andric  (dt rc:$src0)
7930b57cec5SDimitry Andric>;
7940b57cec5SDimitry Andric
7950b57cec5SDimitry Andric// XXX: Convert to new syntax and use COPY_TO_REG, once the DFAPacketizer
7960b57cec5SDimitry Andric// can handle COPY instructions.
7970b57cec5SDimitry Andricclass DwordAddrPat<ValueType vt, RegisterClass rc> : AMDGPUPat <
7980b57cec5SDimitry Andric  (vt (AMDGPUdwordaddr (vt rc:$addr))),
7990b57cec5SDimitry Andric  (vt rc:$addr)
8000b57cec5SDimitry Andric>;
8010b57cec5SDimitry Andric
8020b57cec5SDimitry Andric// rotr pattern
8030b57cec5SDimitry Andricclass ROTRPattern <Instruction BIT_ALIGN> : AMDGPUPat <
8040b57cec5SDimitry Andric  (rotr i32:$src0, i32:$src1),
8050b57cec5SDimitry Andric  (BIT_ALIGN $src0, $src0, $src1)
8060b57cec5SDimitry Andric>;
8070b57cec5SDimitry Andric
8080b57cec5SDimitry Andric// Special conversion patterns
8090b57cec5SDimitry Andric
8100b57cec5SDimitry Andricdef cvt_rpi_i32_f32 : PatFrag <
8110b57cec5SDimitry Andric  (ops node:$src),
8120b57cec5SDimitry Andric  (fp_to_sint (ffloor (fadd $src, FP_HALF))),
8130b57cec5SDimitry Andric  [{ (void) N; return TM.Options.NoNaNsFPMath; }]
8140b57cec5SDimitry Andric>;
8150b57cec5SDimitry Andric
8160b57cec5SDimitry Andricdef cvt_flr_i32_f32 : PatFrag <
8170b57cec5SDimitry Andric  (ops node:$src),
8180b57cec5SDimitry Andric  (fp_to_sint (ffloor $src)),
8190b57cec5SDimitry Andric  [{ (void)N; return TM.Options.NoNaNsFPMath; }]
8200b57cec5SDimitry Andric>;
8210b57cec5SDimitry Andric
8220b57cec5SDimitry Andriclet AddedComplexity = 2 in {
8230b57cec5SDimitry Andricclass IMad24Pat<Instruction Inst, bit HasClamp = 0> : AMDGPUPat <
8240b57cec5SDimitry Andric  (add (AMDGPUmul_i24 i32:$src0, i32:$src1), i32:$src2),
8250b57cec5SDimitry Andric  !if(HasClamp, (Inst $src0, $src1, $src2, (i1 0)),
8260b57cec5SDimitry Andric                (Inst $src0, $src1, $src2))
8270b57cec5SDimitry Andric>;
8280b57cec5SDimitry Andric
8290b57cec5SDimitry Andricclass UMad24Pat<Instruction Inst, bit HasClamp = 0> : AMDGPUPat <
8300b57cec5SDimitry Andric  (add (AMDGPUmul_u24 i32:$src0, i32:$src1), i32:$src2),
8310b57cec5SDimitry Andric  !if(HasClamp, (Inst $src0, $src1, $src2, (i1 0)),
8320b57cec5SDimitry Andric                (Inst $src0, $src1, $src2))
8330b57cec5SDimitry Andric>;
8340b57cec5SDimitry Andric} // AddedComplexity.
8350b57cec5SDimitry Andric
8360b57cec5SDimitry Andricclass RcpPat<Instruction RcpInst, ValueType vt> : AMDGPUPat <
8370b57cec5SDimitry Andric  (fdiv FP_ONE, vt:$src),
8380b57cec5SDimitry Andric  (RcpInst $src)
8390b57cec5SDimitry Andric>;
8400b57cec5SDimitry Andric
8410b57cec5SDimitry Andric// Instructions which select to the same v_min_f*
8420b57cec5SDimitry Andricdef fminnum_like : PatFrags<(ops node:$src0, node:$src1),
8430b57cec5SDimitry Andric  [(fminnum_ieee node:$src0, node:$src1),
8440b57cec5SDimitry Andric   (fminnum node:$src0, node:$src1)]
8450b57cec5SDimitry Andric>;
8460b57cec5SDimitry Andric
8470b57cec5SDimitry Andric// Instructions which select to the same v_max_f*
8480b57cec5SDimitry Andricdef fmaxnum_like : PatFrags<(ops node:$src0, node:$src1),
8490b57cec5SDimitry Andric  [(fmaxnum_ieee node:$src0, node:$src1),
8500b57cec5SDimitry Andric   (fmaxnum node:$src0, node:$src1)]
8510b57cec5SDimitry Andric>;
8520b57cec5SDimitry Andric
853bdd1243dSDimitry Andricclass NeverNaNPats<dag ops, list<dag> frags> : PatFrags<ops, frags> {
854bdd1243dSDimitry Andric  let PredicateCode = [{
855bdd1243dSDimitry Andric    return CurDAG->isKnownNeverNaN(SDValue(N,0));
856bdd1243dSDimitry Andric  }];
857bdd1243dSDimitry Andric  let GISelPredicateCode = [{
858bdd1243dSDimitry Andric    return isKnownNeverNaN(MI.getOperand(0).getReg(), MRI);
859bdd1243dSDimitry Andric  }];
860bdd1243dSDimitry Andric}
861bdd1243dSDimitry Andric
862bdd1243dSDimitry Andricdef fminnum_like_nnan : NeverNaNPats<(ops node:$src0, node:$src1),
863bdd1243dSDimitry Andric  [(fminnum_ieee node:$src0, node:$src1),
864bdd1243dSDimitry Andric   (fminnum node:$src0, node:$src1)]
865bdd1243dSDimitry Andric>;
866bdd1243dSDimitry Andric
867bdd1243dSDimitry Andricdef fmaxnum_like_nnan : NeverNaNPats<(ops node:$src0, node:$src1),
868bdd1243dSDimitry Andric  [(fmaxnum_ieee node:$src0, node:$src1),
869bdd1243dSDimitry Andric   (fmaxnum node:$src0, node:$src1)]
870bdd1243dSDimitry Andric>;
871bdd1243dSDimitry Andric
8720b57cec5SDimitry Andricdef fminnum_like_oneuse : PatFrags<(ops node:$src0, node:$src1),
8730b57cec5SDimitry Andric  [(fminnum_ieee_oneuse node:$src0, node:$src1),
8740b57cec5SDimitry Andric   (fminnum_oneuse node:$src0, node:$src1)]
8750b57cec5SDimitry Andric>;
8760b57cec5SDimitry Andric
8770b57cec5SDimitry Andricdef fmaxnum_like_oneuse : PatFrags<(ops node:$src0, node:$src1),
8780b57cec5SDimitry Andric  [(fmaxnum_ieee_oneuse node:$src0, node:$src1),
8790b57cec5SDimitry Andric   (fmaxnum_oneuse node:$src0, node:$src1)]
8800b57cec5SDimitry Andric>;
8815ffd83dbSDimitry Andric
8825ffd83dbSDimitry Andricdef any_fmad : PatFrags<(ops node:$src0, node:$src1, node:$src2),
8835ffd83dbSDimitry Andric  [(fmad node:$src0, node:$src1, node:$src2),
8845ffd83dbSDimitry Andric   (AMDGPUfmad_ftz node:$src0, node:$src1, node:$src2)]
8855ffd83dbSDimitry Andric>;
8865ffd83dbSDimitry Andric
8875ffd83dbSDimitry Andric// FIXME: fsqrt should not select directly
8885ffd83dbSDimitry Andricdef any_amdgcn_sqrt : PatFrags<(ops node:$src0),
8895ffd83dbSDimitry Andric  [(fsqrt node:$src0), (int_amdgcn_sqrt node:$src0)]
8905ffd83dbSDimitry Andric>;
891