10b57cec5SDimitry Andric//===-- AMDGPUInstructions.td - Common instruction defs ---*- tablegen -*-===// 20b57cec5SDimitry Andric// 30b57cec5SDimitry Andric// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric// See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric// 70b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric// 90b57cec5SDimitry Andric// This file contains instruction defs that are common to all hw codegen 100b57cec5SDimitry Andric// targets. 110b57cec5SDimitry Andric// 120b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 130b57cec5SDimitry Andric 140b57cec5SDimitry Andricclass AddressSpacesImpl { 150b57cec5SDimitry Andric int Flat = 0; 160b57cec5SDimitry Andric int Global = 1; 170b57cec5SDimitry Andric int Region = 2; 180b57cec5SDimitry Andric int Local = 3; 190b57cec5SDimitry Andric int Constant = 4; 200b57cec5SDimitry Andric int Private = 5; 2104eeddc0SDimitry Andric int Constant32Bit = 6; 220b57cec5SDimitry Andric} 230b57cec5SDimitry Andric 240b57cec5SDimitry Andricdef AddrSpaces : AddressSpacesImpl; 250b57cec5SDimitry Andric 260b57cec5SDimitry Andric 270b57cec5SDimitry Andricclass AMDGPUInst <dag outs, dag ins, string asm = "", 280b57cec5SDimitry Andric list<dag> pattern = []> : Instruction { 290b57cec5SDimitry Andric field bit isRegisterLoad = 0; 300b57cec5SDimitry Andric field bit isRegisterStore = 0; 310b57cec5SDimitry Andric 320b57cec5SDimitry Andric let Namespace = "AMDGPU"; 330b57cec5SDimitry Andric let OutOperandList = outs; 340b57cec5SDimitry Andric let InOperandList = ins; 350b57cec5SDimitry Andric let AsmString = asm; 360b57cec5SDimitry Andric let Pattern = pattern; 370b57cec5SDimitry Andric let Itinerary = NullALU; 380b57cec5SDimitry Andric 390b57cec5SDimitry Andric // SoftFail is a field the disassembler can use to provide a way for 400b57cec5SDimitry Andric // instructions to not match without killing the whole decode process. It is 410b57cec5SDimitry Andric // mainly used for ARM, but Tablegen expects this field to exist or it fails 420b57cec5SDimitry Andric // to build the decode table. 4381ad6265SDimitry Andric field bits<96> SoftFail = 0; 440b57cec5SDimitry Andric 450b57cec5SDimitry Andric let DecoderNamespace = Namespace; 460b57cec5SDimitry Andric 470b57cec5SDimitry Andric let TSFlags{63} = isRegisterLoad; 480b57cec5SDimitry Andric let TSFlags{62} = isRegisterStore; 490b57cec5SDimitry Andric} 500b57cec5SDimitry Andric 510b57cec5SDimitry Andricclass AMDGPUShaderInst <dag outs, dag ins, string asm = "", 520b57cec5SDimitry Andric list<dag> pattern = []> : AMDGPUInst<outs, ins, asm, pattern> { 530b57cec5SDimitry Andric 540b57cec5SDimitry Andric field bits<32> Inst = 0xffffffff; 550b57cec5SDimitry Andric} 560b57cec5SDimitry Andric 570b57cec5SDimitry Andric//===---------------------------------------------------------------------===// 580b57cec5SDimitry Andric// Return instruction 590b57cec5SDimitry Andric//===---------------------------------------------------------------------===// 600b57cec5SDimitry Andric 610b57cec5SDimitry Andricclass ILFormat<dag outs, dag ins, string asmstr, list<dag> pattern> 620b57cec5SDimitry Andric: Instruction { 630b57cec5SDimitry Andric 640b57cec5SDimitry Andric let Namespace = "AMDGPU"; 650b57cec5SDimitry Andric dag OutOperandList = outs; 660b57cec5SDimitry Andric dag InOperandList = ins; 670b57cec5SDimitry Andric let Pattern = pattern; 680b57cec5SDimitry Andric let AsmString = !strconcat(asmstr, "\n"); 690b57cec5SDimitry Andric let isPseudo = 1; 700b57cec5SDimitry Andric let Itinerary = NullALU; 710b57cec5SDimitry Andric bit hasIEEEFlag = 0; 720b57cec5SDimitry Andric bit hasZeroOpFlag = 0; 730b57cec5SDimitry Andric let mayLoad = 0; 740b57cec5SDimitry Andric let mayStore = 0; 750b57cec5SDimitry Andric let hasSideEffects = 0; 760b57cec5SDimitry Andric let isCodeGenOnly = 1; 770b57cec5SDimitry Andric} 780b57cec5SDimitry Andric 7981ad6265SDimitry Andric// Get the union of two Register lists 8081ad6265SDimitry Andricclass RegListUnion<list<Register> lstA, list<Register> lstB> { 81bdd1243dSDimitry Andric list<Register> ret = !listconcat(lstA, !listremove(lstB, lstA)); 8281ad6265SDimitry Andric} 8381ad6265SDimitry Andric 840b57cec5SDimitry Andricclass AMDGPUPat<dag pattern, dag result> : Pat<pattern, result>, 8506c3fb27SDimitry Andric PredicateControl, GISelFlags; 8606c3fb27SDimitry Andric 8706c3fb27SDimitry Andriclet GIIgnoreCopies = 1 in 8806c3fb27SDimitry Andricclass AMDGPUPatIgnoreCopies<dag pattern, dag result> : AMDGPUPat<pattern, result>; 890b57cec5SDimitry Andric 90480093f4SDimitry Andriclet RecomputePerFunction = 1 in { 9106c3fb27SDimitry Andricdef FP16Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP64FP16Denormals != DenormalMode::getPreserveSign()">; 9206c3fb27SDimitry Andricdef FP32Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP32Denormals != DenormalMode::getPreserveSign()">; 9306c3fb27SDimitry Andricdef FP64Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP64FP16Denormals != DenormalMode::getPreserveSign()">; 9406c3fb27SDimitry Andricdef NoFP16Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP64FP16Denormals == DenormalMode::getPreserveSign()">; 9506c3fb27SDimitry Andricdef NoFP32Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP32Denormals == DenormalMode::getPreserveSign()">; 9606c3fb27SDimitry Andricdef NoFP64Denormals : Predicate<"MF->getInfo<SIMachineFunctionInfo>()->getMode().FP64FP16Denormals == DenormalMode::getPreserveSign()">; 970b57cec5SDimitry Andricdef UnsafeFPMath : Predicate<"TM.Options.UnsafeFPMath">; 98480093f4SDimitry Andric} 99480093f4SDimitry Andric 1000b57cec5SDimitry Andricdef FMA : Predicate<"Subtarget->hasFMA()">; 1010b57cec5SDimitry Andric 1020b57cec5SDimitry Andricdef InstFlag : OperandWithDefaultOps <i32, (ops (i32 0))>; 1030b57cec5SDimitry Andric 10406c3fb27SDimitry Andricdef i1imm_0 : OperandWithDefaultOps<i1, (ops (i1 0))>; 10506c3fb27SDimitry Andric 1065f757f3fSDimitry Andricclass CustomOperandClass<string name, bit optional, string predicateMethod, 1075f757f3fSDimitry Andric string parserMethod, string defaultMethod> 10806c3fb27SDimitry Andric : AsmOperandClass { 10906c3fb27SDimitry Andric let Name = name; 1105f757f3fSDimitry Andric let PredicateMethod = predicateMethod; 11106c3fb27SDimitry Andric let ParserMethod = parserMethod; 1120b57cec5SDimitry Andric let RenderMethod = "addImmOperands"; 11306c3fb27SDimitry Andric let IsOptional = optional; 11406c3fb27SDimitry Andric let DefaultMethod = defaultMethod; 1150b57cec5SDimitry Andric} 1160b57cec5SDimitry Andric 11706c3fb27SDimitry Andricclass CustomOperandProps<bit optional = 0, string name = NAME> { 11806c3fb27SDimitry Andric string ImmTy = "ImmTy"#name; 1195f757f3fSDimitry Andric string PredicateMethod = "is"#name; 12006c3fb27SDimitry Andric string ParserMethod = "parse"#name; 12106c3fb27SDimitry Andric string DefaultValue = "0"; 12206c3fb27SDimitry Andric string DefaultMethod = "[this]() { return "# 12306c3fb27SDimitry Andric "AMDGPUOperand::CreateImm(this, "#DefaultValue#", SMLoc(), "# 12406c3fb27SDimitry Andric "AMDGPUOperand::"#ImmTy#"); }"; 12506c3fb27SDimitry Andric string PrintMethod = "print"#name; 12606c3fb27SDimitry Andric AsmOperandClass ParserMatchClass = 1275f757f3fSDimitry Andric CustomOperandClass<name, optional, PredicateMethod, ParserMethod, 1285f757f3fSDimitry Andric DefaultMethod>; 12906c3fb27SDimitry Andric string OperandType = "OPERAND_IMMEDIATE"; 1300b57cec5SDimitry Andric} 1310b57cec5SDimitry Andric 13206c3fb27SDimitry Andricclass CustomOperand<ValueType type, bit optional = 0, string name = NAME> 13306c3fb27SDimitry Andric : Operand<type>, CustomOperandProps<optional, name>; 1340b57cec5SDimitry Andric 13506c3fb27SDimitry Andricclass ImmOperand<ValueType type, string name = NAME, bit optional = 0, 13606c3fb27SDimitry Andric string printer = "print"#name> 13706c3fb27SDimitry Andric : CustomOperand<type, optional, name> { 13806c3fb27SDimitry Andric let ImmTy = "ImmTyNone"; 13906c3fb27SDimitry Andric let ParserMethod = ""; 14006c3fb27SDimitry Andric let PrintMethod = printer; 1410b57cec5SDimitry Andric} 1420b57cec5SDimitry Andric 143*0fca6ea1SDimitry Andricclass S16ImmOperand : ImmOperand<i16, "S16Imm", 0, "printU16ImmOperand">; 144*0fca6ea1SDimitry Andric 145*0fca6ea1SDimitry Andricdef s16imm : S16ImmOperand; 14606c3fb27SDimitry Andricdef u16imm : ImmOperand<i16, "U16Imm", 0, "printU16ImmOperand">; 1470b57cec5SDimitry Andric 1485f757f3fSDimitry Andricclass ValuePredicatedOperand<CustomOperand op, string valuePredicate, 1495f757f3fSDimitry Andric bit optional = 0> 1505f757f3fSDimitry Andric : CustomOperand<op.Type, optional> { 1515f757f3fSDimitry Andric let ImmTy = op.ImmTy; 1525f757f3fSDimitry Andric defvar OpPredicate = op.ParserMatchClass.PredicateMethod; 1535f757f3fSDimitry Andric let PredicateMethod = 1545f757f3fSDimitry Andric "getPredicate([](const AMDGPUOperand &Op) -> bool { "# 1555f757f3fSDimitry Andric "return Op."#OpPredicate#"() && "#valuePredicate#"; })"; 1565f757f3fSDimitry Andric let ParserMethod = op.ParserMatchClass.ParserMethod; 1575f757f3fSDimitry Andric let DefaultValue = op.DefaultValue; 1585f757f3fSDimitry Andric let DefaultMethod = op.DefaultMethod; 1595f757f3fSDimitry Andric let PrintMethod = op.PrintMethod; 1605f757f3fSDimitry Andric} 1615f757f3fSDimitry Andric 1620b57cec5SDimitry Andric//===--------------------------------------------------------------------===// 1630b57cec5SDimitry Andric// Custom Operands 1640b57cec5SDimitry Andric//===--------------------------------------------------------------------===// 1650b57cec5SDimitry Andricdef brtarget : Operand<OtherVT>; 1660b57cec5SDimitry Andric 1670b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 1680b57cec5SDimitry Andric// Misc. PatFrags 1690b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 1700b57cec5SDimitry Andric 1710b57cec5SDimitry Andricclass HasOneUseUnaryOp<SDPatternOperator op> : PatFrag< 1720b57cec5SDimitry Andric (ops node:$src0), 173*0fca6ea1SDimitry Andric (op $src0)> { 174*0fca6ea1SDimitry Andric let HasOneUse = 1; 175480093f4SDimitry Andric} 1760b57cec5SDimitry Andric 1770b57cec5SDimitry Andricclass HasOneUseBinOp<SDPatternOperator op> : PatFrag< 1780b57cec5SDimitry Andric (ops node:$src0, node:$src1), 179*0fca6ea1SDimitry Andric (op $src0, $src1)> { 180*0fca6ea1SDimitry Andric let HasOneUse = 1; 181480093f4SDimitry Andric} 1820b57cec5SDimitry Andric 1830b57cec5SDimitry Andricclass HasOneUseTernaryOp<SDPatternOperator op> : PatFrag< 1840b57cec5SDimitry Andric (ops node:$src0, node:$src1, node:$src2), 185*0fca6ea1SDimitry Andric (op $src0, $src1, $src2)> { 186*0fca6ea1SDimitry Andric let HasOneUse = 1; 187*0fca6ea1SDimitry Andric} 188*0fca6ea1SDimitry Andric 189*0fca6ea1SDimitry Andricclass is_canonicalized_1<SDPatternOperator op> : PatFrag< 190*0fca6ea1SDimitry Andric (ops node:$src0), 191*0fca6ea1SDimitry Andric (op $src0), 192*0fca6ea1SDimitry Andric [{ 193*0fca6ea1SDimitry Andric const SITargetLowering &Lowering = 194*0fca6ea1SDimitry Andric *static_cast<const SITargetLowering *>(getTargetLowering()); 195*0fca6ea1SDimitry Andric 196*0fca6ea1SDimitry Andric return Lowering.isCanonicalized(*CurDAG, N->getOperand(0)); 197*0fca6ea1SDimitry Andric }]> { 198*0fca6ea1SDimitry Andric 199480093f4SDimitry Andric let GISelPredicateCode = [{ 200*0fca6ea1SDimitry Andric const SITargetLowering *TLI = static_cast<const SITargetLowering *>( 201*0fca6ea1SDimitry Andric MF.getSubtarget().getTargetLowering()); 202*0fca6ea1SDimitry Andric 203*0fca6ea1SDimitry Andric return TLI->isCanonicalized(MI.getOperand(1).getReg(), MF); 204480093f4SDimitry Andric }]; 205480093f4SDimitry Andric} 2060b57cec5SDimitry Andric 207*0fca6ea1SDimitry Andricclass is_canonicalized_2<SDPatternOperator op> : PatFrag< 208fe6060f1SDimitry Andric (ops node:$src0, node:$src1), 209fe6060f1SDimitry Andric (op $src0, $src1), 210fe6060f1SDimitry Andric [{ 211fe6060f1SDimitry Andric const SITargetLowering &Lowering = 212fe6060f1SDimitry Andric *static_cast<const SITargetLowering *>(getTargetLowering()); 213fe6060f1SDimitry Andric 214fe6060f1SDimitry Andric return Lowering.isCanonicalized(*CurDAG, N->getOperand(0)) && 215fe6060f1SDimitry Andric Lowering.isCanonicalized(*CurDAG, N->getOperand(1)); 216fe6060f1SDimitry Andric }]> { 217fe6060f1SDimitry Andric 218fe6060f1SDimitry Andric // TODO: Improve the Legalizer for g_build_vector in Global Isel to match this class 219fe6060f1SDimitry Andric let GISelPredicateCode = [{ 220fe6060f1SDimitry Andric const SITargetLowering *TLI = static_cast<const SITargetLowering *>( 221fe6060f1SDimitry Andric MF.getSubtarget().getTargetLowering()); 222fe6060f1SDimitry Andric 223*0fca6ea1SDimitry Andric return TLI->isCanonicalized(MI.getOperand(1).getReg(), MF) && 224*0fca6ea1SDimitry Andric TLI->isCanonicalized(MI.getOperand(2).getReg(), MF); 225fe6060f1SDimitry Andric }]; 226fe6060f1SDimitry Andric} 227fe6060f1SDimitry Andric 22806c3fb27SDimitry Andricclass FoldTernaryOpPat<SDPatternOperator op1, SDPatternOperator op2> : PatFrag< 22906c3fb27SDimitry Andric (ops node:$src0, node:$src1, node:$src2), 23006c3fb27SDimitry Andric (op2 (op1 node:$src0, node:$src1), node:$src2) 23106c3fb27SDimitry Andric>; 23206c3fb27SDimitry Andric 23306c3fb27SDimitry Andricdef imad : FoldTernaryOpPat<mul, add>; 234fe6060f1SDimitry Andric 2350b57cec5SDimitry Andriclet Properties = [SDNPCommutative, SDNPAssociative] in { 2360b57cec5SDimitry Andricdef smax_oneuse : HasOneUseBinOp<smax>; 2370b57cec5SDimitry Andricdef smin_oneuse : HasOneUseBinOp<smin>; 2380b57cec5SDimitry Andricdef umax_oneuse : HasOneUseBinOp<umax>; 2390b57cec5SDimitry Andricdef umin_oneuse : HasOneUseBinOp<umin>; 2400b57cec5SDimitry Andric 2410b57cec5SDimitry Andricdef fminnum_oneuse : HasOneUseBinOp<fminnum>; 2420b57cec5SDimitry Andricdef fmaxnum_oneuse : HasOneUseBinOp<fmaxnum>; 2435f757f3fSDimitry Andricdef fminimum_oneuse : HasOneUseBinOp<fminimum>; 2445f757f3fSDimitry Andricdef fmaximum_oneuse : HasOneUseBinOp<fmaximum>; 2450b57cec5SDimitry Andric 2460b57cec5SDimitry Andricdef fminnum_ieee_oneuse : HasOneUseBinOp<fminnum_ieee>; 2470b57cec5SDimitry Andricdef fmaxnum_ieee_oneuse : HasOneUseBinOp<fmaxnum_ieee>; 2480b57cec5SDimitry Andric 2490b57cec5SDimitry Andric 2500b57cec5SDimitry Andricdef and_oneuse : HasOneUseBinOp<and>; 2510b57cec5SDimitry Andricdef or_oneuse : HasOneUseBinOp<or>; 2520b57cec5SDimitry Andricdef xor_oneuse : HasOneUseBinOp<xor>; 2530b57cec5SDimitry Andric} // Properties = [SDNPCommutative, SDNPAssociative] 2540b57cec5SDimitry Andric 2550b57cec5SDimitry Andricdef not_oneuse : HasOneUseUnaryOp<not>; 2560b57cec5SDimitry Andric 2570b57cec5SDimitry Andricdef add_oneuse : HasOneUseBinOp<add>; 2580b57cec5SDimitry Andricdef sub_oneuse : HasOneUseBinOp<sub>; 2590b57cec5SDimitry Andric 2600b57cec5SDimitry Andricdef srl_oneuse : HasOneUseBinOp<srl>; 2610b57cec5SDimitry Andricdef shl_oneuse : HasOneUseBinOp<shl>; 2620b57cec5SDimitry Andric 2630b57cec5SDimitry Andricdef select_oneuse : HasOneUseTernaryOp<select>; 2640b57cec5SDimitry Andric 2650b57cec5SDimitry Andricdef AMDGPUmul_u24_oneuse : HasOneUseBinOp<AMDGPUmul_u24>; 2660b57cec5SDimitry Andricdef AMDGPUmul_i24_oneuse : HasOneUseBinOp<AMDGPUmul_i24>; 2670b57cec5SDimitry Andric 268349cc55cSDimitry Andric//===----------------------------------------------------------------------===// 269349cc55cSDimitry Andric// PatFrags for shifts 270349cc55cSDimitry Andric//===----------------------------------------------------------------------===// 271349cc55cSDimitry Andric 272349cc55cSDimitry Andric// Constrained shift PatFrags. 2734824e7fdSDimitry Andric 2744824e7fdSDimitry Andricdef csh_mask_16 : PatFrag<(ops node:$src0), (and node:$src0, imm), 2754824e7fdSDimitry Andric [{ return isUnneededShiftMask(N, 4); }]> { 2764824e7fdSDimitry Andric let GISelPredicateCode = [{ return isUnneededShiftMask(MI, 4); }]; 2774824e7fdSDimitry Andric } 2784824e7fdSDimitry Andric 2794824e7fdSDimitry Andricdef csh_mask_32 : PatFrag<(ops node:$src0), (and node:$src0, imm), 2804824e7fdSDimitry Andric [{ return isUnneededShiftMask(N, 5); }]> { 2814824e7fdSDimitry Andric let GISelPredicateCode = [{ return isUnneededShiftMask(MI, 5); }]; 2824824e7fdSDimitry Andric } 2834824e7fdSDimitry Andric 2844824e7fdSDimitry Andricdef csh_mask_64 : PatFrag<(ops node:$src0), (and node:$src0, imm), 2854824e7fdSDimitry Andric [{ return isUnneededShiftMask(N, 6); }]> { 2864824e7fdSDimitry Andric let GISelPredicateCode = [{ return isUnneededShiftMask(MI, 6); }]; 2874824e7fdSDimitry Andric } 2884824e7fdSDimitry Andric 289349cc55cSDimitry Andricforeach width = [16, 32, 64] in { 2904824e7fdSDimitry Andricdefvar csh_mask = !cast<SDPatternOperator>("csh_mask_"#width); 291349cc55cSDimitry Andric 292349cc55cSDimitry Andricdef cshl_#width : PatFrags<(ops node:$src0, node:$src1), 2934824e7fdSDimitry Andric [(shl node:$src0, node:$src1), (shl node:$src0, (csh_mask node:$src1))]>; 294349cc55cSDimitry Andricdefvar cshl = !cast<SDPatternOperator>("cshl_"#width); 295349cc55cSDimitry Andricdef cshl_#width#_oneuse : HasOneUseBinOp<cshl>; 296349cc55cSDimitry Andricdef clshl_rev_#width : PatFrag <(ops node:$src0, node:$src1), 297349cc55cSDimitry Andric (cshl $src1, $src0)>; 298349cc55cSDimitry Andric 299349cc55cSDimitry Andricdef csrl_#width : PatFrags<(ops node:$src0, node:$src1), 3004824e7fdSDimitry Andric [(srl node:$src0, node:$src1), (srl node:$src0, (csh_mask node:$src1))]>; 301349cc55cSDimitry Andricdefvar csrl = !cast<SDPatternOperator>("csrl_"#width); 302349cc55cSDimitry Andricdef csrl_#width#_oneuse : HasOneUseBinOp<csrl>; 303349cc55cSDimitry Andricdef clshr_rev_#width : PatFrag <(ops node:$src0, node:$src1), 304349cc55cSDimitry Andric (csrl $src1, $src0)>; 305349cc55cSDimitry Andric 306349cc55cSDimitry Andricdef csra_#width : PatFrags<(ops node:$src0, node:$src1), 3074824e7fdSDimitry Andric [(sra node:$src0, node:$src1), (sra node:$src0, (csh_mask node:$src1))]>; 308349cc55cSDimitry Andricdefvar csra = !cast<SDPatternOperator>("csra_"#width); 309349cc55cSDimitry Andricdef csra_#width#_oneuse : HasOneUseBinOp<csra>; 310349cc55cSDimitry Andricdef cashr_rev_#width : PatFrag <(ops node:$src0, node:$src1), 311349cc55cSDimitry Andric (csra $src1, $src0)>; 312349cc55cSDimitry Andric} // end foreach width 313349cc55cSDimitry Andric 3140b57cec5SDimitry Andricdef srl_16 : PatFrag< 3150b57cec5SDimitry Andric (ops node:$src0), (srl_oneuse node:$src0, (i32 16)) 3160b57cec5SDimitry Andric>; 3170b57cec5SDimitry Andric 3180b57cec5SDimitry Andric 3190b57cec5SDimitry Andricdef hi_i16_elt : PatFrag< 3200b57cec5SDimitry Andric (ops node:$src0), (i16 (trunc (i32 (srl_16 node:$src0)))) 3210b57cec5SDimitry Andric>; 3220b57cec5SDimitry Andric 3230b57cec5SDimitry Andric 3240b57cec5SDimitry Andricdef hi_f16_elt : PatLeaf< 3250b57cec5SDimitry Andric (vt), [{ 3260b57cec5SDimitry Andric if (N->getOpcode() != ISD::BITCAST) 3270b57cec5SDimitry Andric return false; 3280b57cec5SDimitry Andric SDValue Tmp = N->getOperand(0); 3290b57cec5SDimitry Andric 3300b57cec5SDimitry Andric if (Tmp.getOpcode() != ISD::SRL) 3310b57cec5SDimitry Andric return false; 3320b57cec5SDimitry Andric if (const auto *RHS = dyn_cast<ConstantSDNode>(Tmp.getOperand(1)) 3330b57cec5SDimitry Andric return RHS->getZExtValue() == 16; 3340b57cec5SDimitry Andric return false; 3350b57cec5SDimitry Andric}]>; 3360b57cec5SDimitry Andric 3370b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 338bdd1243dSDimitry Andric// PatLeafs for zero immediate 339bdd1243dSDimitry Andric//===----------------------------------------------------------------------===// 340bdd1243dSDimitry Andric 341bdd1243dSDimitry Andricdef immzero : PatLeaf<(imm), [{ return N->isZero(); }]>; 342bdd1243dSDimitry Andricdef fpimmzero : PatLeaf<(fpimm), [{ return N->isZero(); }]>; 343bdd1243dSDimitry Andric 344bdd1243dSDimitry Andric//===----------------------------------------------------------------------===// 3450b57cec5SDimitry Andric// PatLeafs for floating-point comparisons 3460b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 3470b57cec5SDimitry Andric 3488bcb0991SDimitry Andricdef COND_OEQ : PatFrags<(ops), [(OtherVT SETOEQ), (OtherVT SETEQ)]>; 3498bcb0991SDimitry Andricdef COND_ONE : PatFrags<(ops), [(OtherVT SETONE), (OtherVT SETNE)]>; 3508bcb0991SDimitry Andricdef COND_OGT : PatFrags<(ops), [(OtherVT SETOGT), (OtherVT SETGT)]>; 3518bcb0991SDimitry Andricdef COND_OGE : PatFrags<(ops), [(OtherVT SETOGE), (OtherVT SETGE)]>; 3528bcb0991SDimitry Andricdef COND_OLT : PatFrags<(ops), [(OtherVT SETOLT), (OtherVT SETLT)]>; 3538bcb0991SDimitry Andricdef COND_OLE : PatFrags<(ops), [(OtherVT SETOLE), (OtherVT SETLE)]>; 3548bcb0991SDimitry Andricdef COND_O : PatFrags<(ops), [(OtherVT SETO)]>; 3558bcb0991SDimitry Andricdef COND_UO : PatFrags<(ops), [(OtherVT SETUO)]>; 3560b57cec5SDimitry Andric 3570b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 3580b57cec5SDimitry Andric// PatLeafs for unsigned / unordered comparisons 3590b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 3600b57cec5SDimitry Andric 3618bcb0991SDimitry Andricdef COND_UEQ : PatFrag<(ops), (OtherVT SETUEQ)>; 3628bcb0991SDimitry Andricdef COND_UNE : PatFrag<(ops), (OtherVT SETUNE)>; 3638bcb0991SDimitry Andricdef COND_UGT : PatFrag<(ops), (OtherVT SETUGT)>; 3648bcb0991SDimitry Andricdef COND_UGE : PatFrag<(ops), (OtherVT SETUGE)>; 3658bcb0991SDimitry Andricdef COND_ULT : PatFrag<(ops), (OtherVT SETULT)>; 3668bcb0991SDimitry Andricdef COND_ULE : PatFrag<(ops), (OtherVT SETULE)>; 3670b57cec5SDimitry Andric 3680b57cec5SDimitry Andric// XXX - For some reason R600 version is preferring to use unordered 3690b57cec5SDimitry Andric// for setne? 3708bcb0991SDimitry Andricdef COND_UNE_NE : PatFrags<(ops), [(OtherVT SETUNE), (OtherVT SETNE)]>; 3710b57cec5SDimitry Andric 3720b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 3730b57cec5SDimitry Andric// PatLeafs for signed comparisons 3740b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 3750b57cec5SDimitry Andric 3768bcb0991SDimitry Andricdef COND_SGT : PatFrag<(ops), (OtherVT SETGT)>; 3778bcb0991SDimitry Andricdef COND_SGE : PatFrag<(ops), (OtherVT SETGE)>; 3788bcb0991SDimitry Andricdef COND_SLT : PatFrag<(ops), (OtherVT SETLT)>; 3798bcb0991SDimitry Andricdef COND_SLE : PatFrag<(ops), (OtherVT SETLE)>; 3800b57cec5SDimitry Andric 3810b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 3820b57cec5SDimitry Andric// PatLeafs for integer equality 3830b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 3840b57cec5SDimitry Andric 3858bcb0991SDimitry Andricdef COND_EQ : PatFrags<(ops), [(OtherVT SETEQ), (OtherVT SETUEQ)]>; 3868bcb0991SDimitry Andricdef COND_NE : PatFrags<(ops), [(OtherVT SETNE), (OtherVT SETUNE)]>; 3870b57cec5SDimitry Andric 3888bcb0991SDimitry Andric// FIXME: Should not need code predicate 3898bcb0991SDimitry Andric//def COND_NULL : PatLeaf<(OtherVT null_frag)>; 3900b57cec5SDimitry Andricdef COND_NULL : PatLeaf < 3910b57cec5SDimitry Andric (cond), 3920b57cec5SDimitry Andric [{(void)N; return false;}] 3930b57cec5SDimitry Andric>; 3940b57cec5SDimitry Andric 3950b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 3960b57cec5SDimitry Andric// PatLeafs for Texture Constants 3970b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 3980b57cec5SDimitry Andric 3990b57cec5SDimitry Andricdef TEX_ARRAY : PatLeaf< 4000b57cec5SDimitry Andric (imm), 4010b57cec5SDimitry Andric [{uint32_t TType = (uint32_t)N->getZExtValue(); 4020b57cec5SDimitry Andric return TType == 9 || TType == 10 || TType == 16; 4030b57cec5SDimitry Andric }] 4040b57cec5SDimitry Andric>; 4050b57cec5SDimitry Andric 4060b57cec5SDimitry Andricdef TEX_RECT : PatLeaf< 4070b57cec5SDimitry Andric (imm), 4080b57cec5SDimitry Andric [{uint32_t TType = (uint32_t)N->getZExtValue(); 4090b57cec5SDimitry Andric return TType == 5; 4100b57cec5SDimitry Andric }] 4110b57cec5SDimitry Andric>; 4120b57cec5SDimitry Andric 4130b57cec5SDimitry Andricdef TEX_SHADOW : PatLeaf< 4140b57cec5SDimitry Andric (imm), 4150b57cec5SDimitry Andric [{uint32_t TType = (uint32_t)N->getZExtValue(); 4160b57cec5SDimitry Andric return (TType >= 6 && TType <= 8) || TType == 13; 4170b57cec5SDimitry Andric }] 4180b57cec5SDimitry Andric>; 4190b57cec5SDimitry Andric 4200b57cec5SDimitry Andricdef TEX_SHADOW_ARRAY : PatLeaf< 4210b57cec5SDimitry Andric (imm), 4220b57cec5SDimitry Andric [{uint32_t TType = (uint32_t)N->getZExtValue(); 4230b57cec5SDimitry Andric return TType == 11 || TType == 12 || TType == 17; 4240b57cec5SDimitry Andric }] 4250b57cec5SDimitry Andric>; 4260b57cec5SDimitry Andric 4270b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 4280b57cec5SDimitry Andric// Load/Store Pattern Fragments 4290b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 4300b57cec5SDimitry Andric 4318bcb0991SDimitry Andricdef atomic_cmp_swap_glue : SDNode <"ISD::ATOMIC_CMP_SWAP", SDTAtomic3, 4328bcb0991SDimitry Andric [SDNPHasChain, SDNPMayStore, SDNPMayLoad, SDNPMemOperand, SDNPInGlue] 4338bcb0991SDimitry Andric>; 4348bcb0991SDimitry Andric 4350b57cec5SDimitry Andricclass AddressSpaceList<list<int> AS> { 4360b57cec5SDimitry Andric list<int> AddrSpaces = AS; 4370b57cec5SDimitry Andric} 4380b57cec5SDimitry Andric 4398bcb0991SDimitry Andricclass Aligned<int Bytes> { 4408bcb0991SDimitry Andric int MinAlignment = Bytes; 4418bcb0991SDimitry Andric} 4420b57cec5SDimitry Andric 44304eeddc0SDimitry Andricclass StoreHi16<SDPatternOperator op, ValueType vt> : PatFrag < 444480093f4SDimitry Andric (ops node:$value, node:$ptr), (op (srl node:$value, (i32 16)), node:$ptr)> { 445480093f4SDimitry Andric let IsStore = 1; 44604eeddc0SDimitry Andric let MemoryVT = vt; 447480093f4SDimitry Andric} 4480b57cec5SDimitry Andric 44904eeddc0SDimitry Andricdef LoadAddress_constant : AddressSpaceList<[ AddrSpaces.Constant, 45004eeddc0SDimitry Andric AddrSpaces.Constant32Bit ]>; 45104eeddc0SDimitry Andricdef LoadAddress_global : AddressSpaceList<[ AddrSpaces.Global, 45204eeddc0SDimitry Andric AddrSpaces.Constant, 45304eeddc0SDimitry Andric AddrSpaces.Constant32Bit ]>; 4540b57cec5SDimitry Andricdef StoreAddress_global : AddressSpaceList<[ AddrSpaces.Global ]>; 4550b57cec5SDimitry Andric 4560b57cec5SDimitry Andricdef LoadAddress_flat : AddressSpaceList<[ AddrSpaces.Flat, 4570b57cec5SDimitry Andric AddrSpaces.Global, 45804eeddc0SDimitry Andric AddrSpaces.Constant, 45904eeddc0SDimitry Andric AddrSpaces.Constant32Bit ]>; 4600b57cec5SDimitry Andricdef StoreAddress_flat : AddressSpaceList<[ AddrSpaces.Flat, AddrSpaces.Global ]>; 4610b57cec5SDimitry Andric 4620b57cec5SDimitry Andricdef LoadAddress_private : AddressSpaceList<[ AddrSpaces.Private ]>; 4630b57cec5SDimitry Andricdef StoreAddress_private : AddressSpaceList<[ AddrSpaces.Private ]>; 4640b57cec5SDimitry Andric 4650b57cec5SDimitry Andricdef LoadAddress_local : AddressSpaceList<[ AddrSpaces.Local ]>; 4660b57cec5SDimitry Andricdef StoreAddress_local : AddressSpaceList<[ AddrSpaces.Local ]>; 4670b57cec5SDimitry Andric 4680b57cec5SDimitry Andricdef LoadAddress_region : AddressSpaceList<[ AddrSpaces.Region ]>; 4690b57cec5SDimitry Andricdef StoreAddress_region : AddressSpaceList<[ AddrSpaces.Region ]>; 4700b57cec5SDimitry Andric 4710b57cec5SDimitry Andric 4720b57cec5SDimitry Andric 4730b57cec5SDimitry Andricforeach as = [ "global", "flat", "constant", "local", "private", "region" ] in { 4740b57cec5SDimitry Andriclet AddressSpaces = !cast<AddressSpaceList>("LoadAddress_"#as).AddrSpaces in { 4750b57cec5SDimitry Andric 4760b57cec5SDimitry Andricdef load_#as : PatFrag<(ops node:$ptr), (unindexedload node:$ptr)> { 4770b57cec5SDimitry Andric let IsLoad = 1; 4780b57cec5SDimitry Andric let IsNonExtLoad = 1; 4790b57cec5SDimitry Andric} 4800b57cec5SDimitry Andric 48181ad6265SDimitry Andricdef extloadi8_#as : PatFrag<(ops node:$ptr), (extloadi8 node:$ptr)> { 4820b57cec5SDimitry Andric let IsLoad = 1; 4830b57cec5SDimitry Andric} 4840b57cec5SDimitry Andric 48581ad6265SDimitry Andricdef extloadi16_#as : PatFrag<(ops node:$ptr), (extloadi16 node:$ptr)> { 4860b57cec5SDimitry Andric let IsLoad = 1; 4870b57cec5SDimitry Andric} 4880b57cec5SDimitry Andric 48981ad6265SDimitry Andricdef sextloadi8_#as : PatFrag<(ops node:$ptr), (sextloadi8 node:$ptr)> { 4900b57cec5SDimitry Andric let IsLoad = 1; 4910b57cec5SDimitry Andric} 4920b57cec5SDimitry Andric 49381ad6265SDimitry Andricdef sextloadi16_#as : PatFrag<(ops node:$ptr), (sextloadi16 node:$ptr)> { 4940b57cec5SDimitry Andric let IsLoad = 1; 4950b57cec5SDimitry Andric} 4960b57cec5SDimitry Andric 49781ad6265SDimitry Andricdef zextloadi8_#as : PatFrag<(ops node:$ptr), (zextloadi8 node:$ptr)> { 4980b57cec5SDimitry Andric let IsLoad = 1; 4990b57cec5SDimitry Andric} 5000b57cec5SDimitry Andric 50181ad6265SDimitry Andricdef zextloadi16_#as : PatFrag<(ops node:$ptr), (zextloadi16 node:$ptr)> { 5020b57cec5SDimitry Andric let IsLoad = 1; 5030b57cec5SDimitry Andric} 5040b57cec5SDimitry Andric 505349cc55cSDimitry Andricdef atomic_load_8_#as : PatFrag<(ops node:$ptr), (atomic_load_8 node:$ptr)> { 506349cc55cSDimitry Andric let IsAtomic = 1; 507349cc55cSDimitry Andric let MemoryVT = i8; 508349cc55cSDimitry Andric} 509349cc55cSDimitry Andric 510349cc55cSDimitry Andricdef atomic_load_16_#as : PatFrag<(ops node:$ptr), (atomic_load_16 node:$ptr)> { 511349cc55cSDimitry Andric let IsAtomic = 1; 512349cc55cSDimitry Andric let MemoryVT = i16; 513349cc55cSDimitry Andric} 514349cc55cSDimitry Andric 5150b57cec5SDimitry Andricdef atomic_load_32_#as : PatFrag<(ops node:$ptr), (atomic_load_32 node:$ptr)> { 5160b57cec5SDimitry Andric let IsAtomic = 1; 5170b57cec5SDimitry Andric let MemoryVT = i32; 5180b57cec5SDimitry Andric} 5190b57cec5SDimitry Andric 5200b57cec5SDimitry Andricdef atomic_load_64_#as : PatFrag<(ops node:$ptr), (atomic_load_64 node:$ptr)> { 5210b57cec5SDimitry Andric let IsAtomic = 1; 5220b57cec5SDimitry Andric let MemoryVT = i64; 5230b57cec5SDimitry Andric} 5245ffd83dbSDimitry Andric} // End let AddressSpaces 5255ffd83dbSDimitry Andric} // End foreach as 5260b57cec5SDimitry Andric 5275ffd83dbSDimitry Andric 5285ffd83dbSDimitry Andricforeach as = [ "global", "flat", "local", "private", "region" ] in { 52981ad6265SDimitry Andriclet IsStore = 1, AddressSpaces = !cast<AddressSpaceList>("StoreAddress_"#as).AddrSpaces in { 5300b57cec5SDimitry Andricdef store_#as : PatFrag<(ops node:$val, node:$ptr), 5310b57cec5SDimitry Andric (unindexedstore node:$val, node:$ptr)> { 5320b57cec5SDimitry Andric let IsTruncStore = 0; 5330b57cec5SDimitry Andric} 5340b57cec5SDimitry Andric 5350b57cec5SDimitry Andric// truncstore fragments. 5360b57cec5SDimitry Andricdef truncstore_#as : PatFrag<(ops node:$val, node:$ptr), 5370b57cec5SDimitry Andric (unindexedstore node:$val, node:$ptr)> { 5380b57cec5SDimitry Andric let IsTruncStore = 1; 5390b57cec5SDimitry Andric} 5400b57cec5SDimitry Andric 5410b57cec5SDimitry Andric// TODO: We don't really need the truncstore here. We can use 5420b57cec5SDimitry Andric// unindexedstore with MemoryVT directly, which will save an 5430b57cec5SDimitry Andric// unnecessary check that the memory size is less than the value type 5440b57cec5SDimitry Andric// in the generated matcher table. 5450b57cec5SDimitry Andricdef truncstorei8_#as : PatFrag<(ops node:$val, node:$ptr), 54681ad6265SDimitry Andric (truncstorei8 node:$val, node:$ptr)>; 5470b57cec5SDimitry Andricdef truncstorei16_#as : PatFrag<(ops node:$val, node:$ptr), 54881ad6265SDimitry Andric (truncstorei16 node:$val, node:$ptr)>; 5490b57cec5SDimitry Andric 55004eeddc0SDimitry Andricdef store_hi16_#as : StoreHi16 <truncstorei16, i16>; 55104eeddc0SDimitry Andricdef truncstorei8_hi16_#as : StoreHi16<truncstorei8, i8>; 55204eeddc0SDimitry Andricdef truncstorei16_hi16_#as : StoreHi16<truncstorei16, i16>; 55381ad6265SDimitry Andric} // End let IsStore = 1, AddressSpaces = ... 5540b57cec5SDimitry Andric 55581ad6265SDimitry Andriclet IsAtomic = 1, AddressSpaces = !cast<AddressSpaceList>("StoreAddress_"#as).AddrSpaces in { 5565f757f3fSDimitry Andricdef atomic_store_8_#as : PatFrag<(ops node:$val, node:$ptr), 5575f757f3fSDimitry Andric (atomic_store_8 node:$val, node:$ptr)>; 5585f757f3fSDimitry Andricdef atomic_store_16_#as : PatFrag<(ops node:$val, node:$ptr), 5595f757f3fSDimitry Andric (atomic_store_16 node:$val, node:$ptr)>; 5605f757f3fSDimitry Andricdef atomic_store_32_#as : PatFrag<(ops node:$val, node:$ptr), 5615f757f3fSDimitry Andric (atomic_store_32 node:$val, node:$ptr)>; 5625f757f3fSDimitry Andricdef atomic_store_64_#as : PatFrag<(ops node:$val, node:$ptr), 5635f757f3fSDimitry Andric (atomic_store_64 node:$val, node:$ptr)>; 5645f757f3fSDimitry Andric} // End let IsAtomic = 1, AddressSpaces = ... 5655ffd83dbSDimitry Andric} // End foreach as 5660b57cec5SDimitry Andric 567753f127fSDimitry Andricmulticlass noret_op { 568753f127fSDimitry Andric let HasNoUse = true in 56981ad6265SDimitry Andric def "_noret" : PatFrag<(ops node:$ptr, node:$data), 57081ad6265SDimitry Andric (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>; 57181ad6265SDimitry Andric} 57281ad6265SDimitry Andric 573bdd1243dSDimitry Andricmulticlass global_addr_space_atomic_op { 574bdd1243dSDimitry Andric def "_noret_global_addrspace" : 575bdd1243dSDimitry Andric PatFrag<(ops node:$ptr, node:$data), 576bdd1243dSDimitry Andric (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{ 577bdd1243dSDimitry Andric let HasNoUse = true; 578bdd1243dSDimitry Andric let AddressSpaces = LoadAddress_global.AddrSpaces; 579bdd1243dSDimitry Andric let IsAtomic = 1; 580bdd1243dSDimitry Andric } 581bdd1243dSDimitry Andric def "_global_addrspace" : 582bdd1243dSDimitry Andric PatFrag<(ops node:$ptr, node:$data), 583bdd1243dSDimitry Andric (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{ 584bdd1243dSDimitry Andric let AddressSpaces = LoadAddress_global.AddrSpaces; 585bdd1243dSDimitry Andric let IsAtomic = 1; 586bdd1243dSDimitry Andric } 587bdd1243dSDimitry Andric} 588bdd1243dSDimitry Andric 589bdd1243dSDimitry Andricmulticlass flat_addr_space_atomic_op { 590bdd1243dSDimitry Andric def "_noret_flat_addrspace" : 591bdd1243dSDimitry Andric PatFrag<(ops node:$ptr, node:$data), 592bdd1243dSDimitry Andric (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{ 593bdd1243dSDimitry Andric let HasNoUse = true; 594bdd1243dSDimitry Andric let AddressSpaces = LoadAddress_flat.AddrSpaces; 595bdd1243dSDimitry Andric let IsAtomic = 1; 596bdd1243dSDimitry Andric } 597bdd1243dSDimitry Andric def "_flat_addrspace" : 598bdd1243dSDimitry Andric PatFrag<(ops node:$ptr, node:$data), 599bdd1243dSDimitry Andric (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{ 600bdd1243dSDimitry Andric let AddressSpaces = LoadAddress_flat.AddrSpaces; 601bdd1243dSDimitry Andric let IsAtomic = 1; 602bdd1243dSDimitry Andric } 603bdd1243dSDimitry Andric} 604bdd1243dSDimitry Andric 605bdd1243dSDimitry Andricmulticlass local_addr_space_atomic_op { 606bdd1243dSDimitry Andric def "_noret_local_addrspace" : 607bdd1243dSDimitry Andric PatFrag<(ops node:$ptr, node:$data), 608bdd1243dSDimitry Andric (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{ 609bdd1243dSDimitry Andric let HasNoUse = true; 610bdd1243dSDimitry Andric let AddressSpaces = LoadAddress_local.AddrSpaces; 611bdd1243dSDimitry Andric let IsAtomic = 1; 612bdd1243dSDimitry Andric } 613bdd1243dSDimitry Andric def "_local_addrspace" : 614bdd1243dSDimitry Andric PatFrag<(ops node:$ptr, node:$data), 615bdd1243dSDimitry Andric (!cast<SDPatternOperator>(NAME) node:$ptr, node:$data)>{ 616bdd1243dSDimitry Andric let AddressSpaces = LoadAddress_local.AddrSpaces; 617bdd1243dSDimitry Andric let IsAtomic = 1; 618bdd1243dSDimitry Andric } 619bdd1243dSDimitry Andric} 620bdd1243dSDimitry Andric 621*0fca6ea1SDimitry Andricdefm int_amdgcn_flat_atomic_fadd : noret_op; 622bdd1243dSDimitry Andricdefm int_amdgcn_flat_atomic_fadd : flat_addr_space_atomic_op; 623753f127fSDimitry Andricdefm int_amdgcn_flat_atomic_fadd_v2bf16 : noret_op; 624753f127fSDimitry Andricdefm int_amdgcn_flat_atomic_fmin : noret_op; 625753f127fSDimitry Andricdefm int_amdgcn_flat_atomic_fmax : noret_op; 626bdd1243dSDimitry Andricdefm int_amdgcn_global_atomic_fadd : global_addr_space_atomic_op; 627bdd1243dSDimitry Andricdefm int_amdgcn_flat_atomic_fadd : global_addr_space_atomic_op; 628753f127fSDimitry Andricdefm int_amdgcn_global_atomic_fadd_v2bf16 : noret_op; 629753f127fSDimitry Andricdefm int_amdgcn_global_atomic_fmin : noret_op; 630753f127fSDimitry Andricdefm int_amdgcn_global_atomic_fmax : noret_op; 6315f757f3fSDimitry Andricdefm int_amdgcn_global_atomic_csub : noret_op; 632bdd1243dSDimitry Andricdefm int_amdgcn_flat_atomic_fadd : local_addr_space_atomic_op; 633647cbc5dSDimitry Andricdefm int_amdgcn_global_atomic_ordered_add_b64 : noret_op; 6345f757f3fSDimitry Andricdefm int_amdgcn_flat_atomic_fmin_num : noret_op; 6355f757f3fSDimitry Andricdefm int_amdgcn_flat_atomic_fmax_num : noret_op; 6365f757f3fSDimitry Andricdefm int_amdgcn_global_atomic_fmin_num : noret_op; 6375f757f3fSDimitry Andricdefm int_amdgcn_global_atomic_fmax_num : noret_op; 6387a6dacacSDimitry Andricdefm int_amdgcn_atomic_cond_sub_u32 : local_addr_space_atomic_op; 6397a6dacacSDimitry Andricdefm int_amdgcn_atomic_cond_sub_u32 : flat_addr_space_atomic_op; 6407a6dacacSDimitry Andricdefm int_amdgcn_atomic_cond_sub_u32 : global_addr_space_atomic_op; 6410b57cec5SDimitry Andric 642*0fca6ea1SDimitry Andricmulticlass noret_binary_atomic_op<SDNode atomic_op> { 643753f127fSDimitry Andric let HasNoUse = true in 644*0fca6ea1SDimitry Andric defm "_noret" : binary_atomic_op<atomic_op>; 645*0fca6ea1SDimitry Andric} 646*0fca6ea1SDimitry Andric 647*0fca6ea1SDimitry Andricmulticlass noret_binary_atomic_op_fp<SDNode atomic_op> { 648*0fca6ea1SDimitry Andric let HasNoUse = true in 649*0fca6ea1SDimitry Andric defm "_noret" : binary_atomic_op_fp<atomic_op>; 65081ad6265SDimitry Andric} 65181ad6265SDimitry Andric 652753f127fSDimitry Andricmulticlass noret_ternary_atomic_op<SDNode atomic_op> { 653753f127fSDimitry Andric let HasNoUse = true in 65481ad6265SDimitry Andric defm "_noret" : ternary_atomic_op<atomic_op>; 65581ad6265SDimitry Andric} 65681ad6265SDimitry Andric 657*0fca6ea1SDimitry Andricdefvar atomic_addrspace_names = [ "global", "flat", "constant", "local", "private", "region" ]; 658*0fca6ea1SDimitry Andric 659*0fca6ea1SDimitry Andricmulticlass binary_atomic_op_all_as<SDNode atomic_op> { 660*0fca6ea1SDimitry Andric foreach as = atomic_addrspace_names in { 6618bcb0991SDimitry Andric let AddressSpaces = !cast<AddressSpaceList>("LoadAddress_"#as).AddrSpaces in { 662*0fca6ea1SDimitry Andric defm "_"#as : binary_atomic_op<atomic_op>; 663*0fca6ea1SDimitry Andric defm "_"#as : noret_binary_atomic_op<atomic_op>; 664*0fca6ea1SDimitry Andric } 665*0fca6ea1SDimitry Andric } 666*0fca6ea1SDimitry Andric} 667*0fca6ea1SDimitry Andricmulticlass binary_atomic_op_fp_all_as<SDNode atomic_op> { 668*0fca6ea1SDimitry Andric foreach as = atomic_addrspace_names in { 669*0fca6ea1SDimitry Andric let AddressSpaces = !cast<AddressSpaceList>("LoadAddress_"#as).AddrSpaces in { 670*0fca6ea1SDimitry Andric defm "_"#as : binary_atomic_op_fp<atomic_op>; 671*0fca6ea1SDimitry Andric defm "_"#as : noret_binary_atomic_op_fp<atomic_op>; 6728bcb0991SDimitry Andric } 6738bcb0991SDimitry Andric } 6748bcb0991SDimitry Andric} 6758bcb0991SDimitry Andric 67681ad6265SDimitry Andricdefm atomic_swap : binary_atomic_op_all_as<atomic_swap>; 67781ad6265SDimitry Andricdefm atomic_load_add : binary_atomic_op_all_as<atomic_load_add>; 67881ad6265SDimitry Andricdefm atomic_load_and : binary_atomic_op_all_as<atomic_load_and>; 67981ad6265SDimitry Andricdefm atomic_load_max : binary_atomic_op_all_as<atomic_load_max>; 68081ad6265SDimitry Andricdefm atomic_load_min : binary_atomic_op_all_as<atomic_load_min>; 68181ad6265SDimitry Andricdefm atomic_load_or : binary_atomic_op_all_as<atomic_load_or>; 68281ad6265SDimitry Andricdefm atomic_load_sub : binary_atomic_op_all_as<atomic_load_sub>; 68381ad6265SDimitry Andricdefm atomic_load_umax : binary_atomic_op_all_as<atomic_load_umax>; 68481ad6265SDimitry Andricdefm atomic_load_umin : binary_atomic_op_all_as<atomic_load_umin>; 68581ad6265SDimitry Andricdefm atomic_load_xor : binary_atomic_op_all_as<atomic_load_xor>; 686*0fca6ea1SDimitry Andricdefm atomic_load_fadd : binary_atomic_op_fp_all_as<atomic_load_fadd>; 687*0fca6ea1SDimitry Andricdefm atomic_load_fmin : binary_atomic_op_fp_all_as<atomic_load_fmin>; 688*0fca6ea1SDimitry Andricdefm atomic_load_fmax : binary_atomic_op_fp_all_as<atomic_load_fmax>; 68906c3fb27SDimitry Andricdefm atomic_load_uinc_wrap : binary_atomic_op_all_as<atomic_load_uinc_wrap>; 69006c3fb27SDimitry Andricdefm atomic_load_udec_wrap : binary_atomic_op_all_as<atomic_load_udec_wrap>; 69181ad6265SDimitry Andricdefm AMDGPUatomic_cmp_swap : binary_atomic_op_all_as<AMDGPUatomic_cmp_swap>; 6920b57cec5SDimitry Andric 693e8d8bef9SDimitry Andricdef load_align8_local : PatFrag<(ops node:$ptr), (load_local node:$ptr)>, 694e8d8bef9SDimitry Andric Aligned<8> { 6958bcb0991SDimitry Andric let IsLoad = 1; 6968bcb0991SDimitry Andric} 6970b57cec5SDimitry Andric 698e8d8bef9SDimitry Andricdef load_align16_local : PatFrag<(ops node:$ptr), (load_local node:$ptr)>, 699e8d8bef9SDimitry Andric Aligned<16> { 7008bcb0991SDimitry Andric let IsLoad = 1; 7018bcb0991SDimitry Andric} 7020b57cec5SDimitry Andric 7038bcb0991SDimitry Andricdef store_align8_local: PatFrag<(ops node:$val, node:$ptr), 7048bcb0991SDimitry Andric (store_local node:$val, node:$ptr)>, Aligned<8> { 7058bcb0991SDimitry Andric let IsStore = 1; 7068bcb0991SDimitry Andric} 7078bcb0991SDimitry Andric 7088bcb0991SDimitry Andricdef store_align16_local: PatFrag<(ops node:$val, node:$ptr), 7098bcb0991SDimitry Andric (store_local node:$val, node:$ptr)>, Aligned<16> { 7108bcb0991SDimitry Andric let IsStore = 1; 7118bcb0991SDimitry Andric} 7128bcb0991SDimitry Andric 7138bcb0991SDimitry Andriclet AddressSpaces = StoreAddress_local.AddrSpaces in { 7148bcb0991SDimitry Andricdefm atomic_cmp_swap_local : ternary_atomic_op<atomic_cmp_swap>; 715753f127fSDimitry Andricdefm atomic_cmp_swap_local : noret_ternary_atomic_op<atomic_cmp_swap>; 716753f127fSDimitry Andricdefm atomic_cmp_swap_local_m0 : noret_ternary_atomic_op<atomic_cmp_swap_glue>; 717753f127fSDimitry Andricdefm atomic_cmp_swap_local_m0 : ternary_atomic_op<atomic_cmp_swap_glue>; 7188bcb0991SDimitry Andric} 7190b57cec5SDimitry Andric 7208bcb0991SDimitry Andriclet AddressSpaces = StoreAddress_region.AddrSpaces in { 721753f127fSDimitry Andricdefm atomic_cmp_swap_region : noret_ternary_atomic_op<atomic_cmp_swap>; 722753f127fSDimitry Andricdefm atomic_cmp_swap_region_m0 : noret_ternary_atomic_op<atomic_cmp_swap_glue>; 723753f127fSDimitry Andricdefm atomic_cmp_swap_region_m0 : ternary_atomic_op<atomic_cmp_swap_glue>; 7248bcb0991SDimitry Andric} 7250b57cec5SDimitry Andric 7260b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 7270b57cec5SDimitry Andric// Misc Pattern Fragments 7280b57cec5SDimitry Andric//===----------------------------------------------------------------------===// 7290b57cec5SDimitry Andric 7300b57cec5SDimitry Andricclass Constants { 7310b57cec5SDimitry Andricint TWO_PI = 0x40c90fdb; 7320b57cec5SDimitry Andricint PI = 0x40490fdb; 7330b57cec5SDimitry Andricint TWO_PI_INV = 0x3e22f983; 7345ffd83dbSDimitry Andricint FP_4294966784 = 0x4f7ffffe; // 4294966784 = 4294967296 - 512 = 2^32 - 2^9 7350b57cec5SDimitry Andricint FP16_ONE = 0x3C00; 7360b57cec5SDimitry Andricint FP16_NEG_ONE = 0xBC00; 7370b57cec5SDimitry Andricint FP32_ONE = 0x3f800000; 7380b57cec5SDimitry Andricint FP32_NEG_ONE = 0xbf800000; 7390b57cec5SDimitry Andricint FP64_ONE = 0x3ff0000000000000; 7400b57cec5SDimitry Andricint FP64_NEG_ONE = 0xbff0000000000000; 7410b57cec5SDimitry Andric} 7420b57cec5SDimitry Andricdef CONST : Constants; 7430b57cec5SDimitry Andric 7440b57cec5SDimitry Andricdef FP_ZERO : PatLeaf < 7450b57cec5SDimitry Andric (fpimm), 7460b57cec5SDimitry Andric [{return N->getValueAPF().isZero();}] 7470b57cec5SDimitry Andric>; 7480b57cec5SDimitry Andric 7490b57cec5SDimitry Andricdef FP_ONE : PatLeaf < 7500b57cec5SDimitry Andric (fpimm), 7510b57cec5SDimitry Andric [{return N->isExactlyValue(1.0);}] 7520b57cec5SDimitry Andric>; 7530b57cec5SDimitry Andric 7540b57cec5SDimitry Andricdef FP_HALF : PatLeaf < 7550b57cec5SDimitry Andric (fpimm), 7560b57cec5SDimitry Andric [{return N->isExactlyValue(0.5);}] 7570b57cec5SDimitry Andric>; 7580b57cec5SDimitry Andric 7590b57cec5SDimitry Andric/* Generic helper patterns for intrinsics */ 7600b57cec5SDimitry Andric/* -------------------------------------- */ 7610b57cec5SDimitry Andric 7620b57cec5SDimitry Andricclass POW_Common <AMDGPUInst log_ieee, AMDGPUInst exp_ieee, AMDGPUInst mul> 7630b57cec5SDimitry Andric : AMDGPUPat < 7640b57cec5SDimitry Andric (fpow f32:$src0, f32:$src1), 7650b57cec5SDimitry Andric (exp_ieee (mul f32:$src1, (log_ieee f32:$src0))) 7660b57cec5SDimitry Andric>; 7670b57cec5SDimitry Andric 7680b57cec5SDimitry Andric/* Other helper patterns */ 7690b57cec5SDimitry Andric/* --------------------- */ 7700b57cec5SDimitry Andric 7710b57cec5SDimitry Andric/* Extract element pattern */ 7720b57cec5SDimitry Andricclass Extract_Element <ValueType sub_type, ValueType vec_type, int sub_idx, 7730b57cec5SDimitry Andric SubRegIndex sub_reg> 7740b57cec5SDimitry Andric : AMDGPUPat< 7750b57cec5SDimitry Andric (sub_type (extractelt vec_type:$src, sub_idx)), 7760b57cec5SDimitry Andric (EXTRACT_SUBREG $src, sub_reg) 7770b57cec5SDimitry Andric>; 7780b57cec5SDimitry Andric 7790b57cec5SDimitry Andric/* Insert element pattern */ 7800b57cec5SDimitry Andricclass Insert_Element <ValueType elem_type, ValueType vec_type, 7810b57cec5SDimitry Andric int sub_idx, SubRegIndex sub_reg> 7820b57cec5SDimitry Andric : AMDGPUPat < 7830b57cec5SDimitry Andric (insertelt vec_type:$vec, elem_type:$elem, sub_idx), 7840b57cec5SDimitry Andric (INSERT_SUBREG $vec, $elem, sub_reg) 7850b57cec5SDimitry Andric>; 7860b57cec5SDimitry Andric 7870b57cec5SDimitry Andric// XXX: Convert to new syntax and use COPY_TO_REG, once the DFAPacketizer 7880b57cec5SDimitry Andric// can handle COPY instructions. 7890b57cec5SDimitry Andric// bitconvert pattern 7900b57cec5SDimitry Andricclass BitConvert <ValueType dt, ValueType st, RegisterClass rc> : AMDGPUPat < 7910b57cec5SDimitry Andric (dt (bitconvert (st rc:$src0))), 7920b57cec5SDimitry Andric (dt rc:$src0) 7930b57cec5SDimitry Andric>; 7940b57cec5SDimitry Andric 7950b57cec5SDimitry Andric// XXX: Convert to new syntax and use COPY_TO_REG, once the DFAPacketizer 7960b57cec5SDimitry Andric// can handle COPY instructions. 7970b57cec5SDimitry Andricclass DwordAddrPat<ValueType vt, RegisterClass rc> : AMDGPUPat < 7980b57cec5SDimitry Andric (vt (AMDGPUdwordaddr (vt rc:$addr))), 7990b57cec5SDimitry Andric (vt rc:$addr) 8000b57cec5SDimitry Andric>; 8010b57cec5SDimitry Andric 8020b57cec5SDimitry Andric// rotr pattern 8030b57cec5SDimitry Andricclass ROTRPattern <Instruction BIT_ALIGN> : AMDGPUPat < 8040b57cec5SDimitry Andric (rotr i32:$src0, i32:$src1), 8050b57cec5SDimitry Andric (BIT_ALIGN $src0, $src0, $src1) 8060b57cec5SDimitry Andric>; 8070b57cec5SDimitry Andric 8080b57cec5SDimitry Andric// Special conversion patterns 8090b57cec5SDimitry Andric 8100b57cec5SDimitry Andricdef cvt_rpi_i32_f32 : PatFrag < 8110b57cec5SDimitry Andric (ops node:$src), 8120b57cec5SDimitry Andric (fp_to_sint (ffloor (fadd $src, FP_HALF))), 8130b57cec5SDimitry Andric [{ (void) N; return TM.Options.NoNaNsFPMath; }] 8140b57cec5SDimitry Andric>; 8150b57cec5SDimitry Andric 8160b57cec5SDimitry Andricdef cvt_flr_i32_f32 : PatFrag < 8170b57cec5SDimitry Andric (ops node:$src), 8180b57cec5SDimitry Andric (fp_to_sint (ffloor $src)), 8190b57cec5SDimitry Andric [{ (void)N; return TM.Options.NoNaNsFPMath; }] 8200b57cec5SDimitry Andric>; 8210b57cec5SDimitry Andric 8220b57cec5SDimitry Andriclet AddedComplexity = 2 in { 8230b57cec5SDimitry Andricclass IMad24Pat<Instruction Inst, bit HasClamp = 0> : AMDGPUPat < 8240b57cec5SDimitry Andric (add (AMDGPUmul_i24 i32:$src0, i32:$src1), i32:$src2), 8250b57cec5SDimitry Andric !if(HasClamp, (Inst $src0, $src1, $src2, (i1 0)), 8260b57cec5SDimitry Andric (Inst $src0, $src1, $src2)) 8270b57cec5SDimitry Andric>; 8280b57cec5SDimitry Andric 8290b57cec5SDimitry Andricclass UMad24Pat<Instruction Inst, bit HasClamp = 0> : AMDGPUPat < 8300b57cec5SDimitry Andric (add (AMDGPUmul_u24 i32:$src0, i32:$src1), i32:$src2), 8310b57cec5SDimitry Andric !if(HasClamp, (Inst $src0, $src1, $src2, (i1 0)), 8320b57cec5SDimitry Andric (Inst $src0, $src1, $src2)) 8330b57cec5SDimitry Andric>; 8340b57cec5SDimitry Andric} // AddedComplexity. 8350b57cec5SDimitry Andric 8360b57cec5SDimitry Andricclass RcpPat<Instruction RcpInst, ValueType vt> : AMDGPUPat < 8370b57cec5SDimitry Andric (fdiv FP_ONE, vt:$src), 8380b57cec5SDimitry Andric (RcpInst $src) 8390b57cec5SDimitry Andric>; 8400b57cec5SDimitry Andric 8410b57cec5SDimitry Andric// Instructions which select to the same v_min_f* 8420b57cec5SDimitry Andricdef fminnum_like : PatFrags<(ops node:$src0, node:$src1), 8430b57cec5SDimitry Andric [(fminnum_ieee node:$src0, node:$src1), 8440b57cec5SDimitry Andric (fminnum node:$src0, node:$src1)] 8450b57cec5SDimitry Andric>; 8460b57cec5SDimitry Andric 8470b57cec5SDimitry Andric// Instructions which select to the same v_max_f* 8480b57cec5SDimitry Andricdef fmaxnum_like : PatFrags<(ops node:$src0, node:$src1), 8490b57cec5SDimitry Andric [(fmaxnum_ieee node:$src0, node:$src1), 8500b57cec5SDimitry Andric (fmaxnum node:$src0, node:$src1)] 8510b57cec5SDimitry Andric>; 8520b57cec5SDimitry Andric 853bdd1243dSDimitry Andricclass NeverNaNPats<dag ops, list<dag> frags> : PatFrags<ops, frags> { 854bdd1243dSDimitry Andric let PredicateCode = [{ 855bdd1243dSDimitry Andric return CurDAG->isKnownNeverNaN(SDValue(N,0)); 856bdd1243dSDimitry Andric }]; 857bdd1243dSDimitry Andric let GISelPredicateCode = [{ 858bdd1243dSDimitry Andric return isKnownNeverNaN(MI.getOperand(0).getReg(), MRI); 859bdd1243dSDimitry Andric }]; 860bdd1243dSDimitry Andric} 861bdd1243dSDimitry Andric 862bdd1243dSDimitry Andricdef fminnum_like_nnan : NeverNaNPats<(ops node:$src0, node:$src1), 863bdd1243dSDimitry Andric [(fminnum_ieee node:$src0, node:$src1), 864bdd1243dSDimitry Andric (fminnum node:$src0, node:$src1)] 865bdd1243dSDimitry Andric>; 866bdd1243dSDimitry Andric 867bdd1243dSDimitry Andricdef fmaxnum_like_nnan : NeverNaNPats<(ops node:$src0, node:$src1), 868bdd1243dSDimitry Andric [(fmaxnum_ieee node:$src0, node:$src1), 869bdd1243dSDimitry Andric (fmaxnum node:$src0, node:$src1)] 870bdd1243dSDimitry Andric>; 871bdd1243dSDimitry Andric 8720b57cec5SDimitry Andricdef fminnum_like_oneuse : PatFrags<(ops node:$src0, node:$src1), 8730b57cec5SDimitry Andric [(fminnum_ieee_oneuse node:$src0, node:$src1), 8740b57cec5SDimitry Andric (fminnum_oneuse node:$src0, node:$src1)] 8750b57cec5SDimitry Andric>; 8760b57cec5SDimitry Andric 8770b57cec5SDimitry Andricdef fmaxnum_like_oneuse : PatFrags<(ops node:$src0, node:$src1), 8780b57cec5SDimitry Andric [(fmaxnum_ieee_oneuse node:$src0, node:$src1), 8790b57cec5SDimitry Andric (fmaxnum_oneuse node:$src0, node:$src1)] 8800b57cec5SDimitry Andric>; 8815ffd83dbSDimitry Andric 8825ffd83dbSDimitry Andricdef any_fmad : PatFrags<(ops node:$src0, node:$src1, node:$src2), 8835ffd83dbSDimitry Andric [(fmad node:$src0, node:$src1, node:$src2), 8845ffd83dbSDimitry Andric (AMDGPUfmad_ftz node:$src0, node:$src1, node:$src2)] 8855ffd83dbSDimitry Andric>; 8865ffd83dbSDimitry Andric 8875ffd83dbSDimitry Andric// FIXME: fsqrt should not select directly 8885ffd83dbSDimitry Andricdef any_amdgcn_sqrt : PatFrags<(ops node:$src0), 8895ffd83dbSDimitry Andric [(fsqrt node:$src0), (int_amdgcn_sqrt node:$src0)] 8905ffd83dbSDimitry Andric>; 891