// NOTE(review): everything in this section is collapsed onto one physical line,
// so as written the leading `//` of the license banner comments out all of it.
// Template parameter / argument lists also appear to be missing (for example
// `class GFXGen {` assigns from pred, dn, suffix and sub, none of which is
// declared here, and `list SchedRW` has no element type) -- TODO restore from
// the pristine file before building.
// Contents, in order: LetDummies (field declarations only; its own comment
// calls them dummies for an outer `let`), GFXGen (AssemblerPredicate,
// DecoderNamespace, Suffix, Subtarget), the GFX12Gen and GFX11Gen defs, and
// class VOP (OpName).
//===-- VOPInstructions.td - Vector Instruction Definitions ---------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // dummies for outer let class LetDummies { bit TRANS; bit ReadsModeReg; bit mayRaiseFPException; bit isCommutable; bit isConvertibleToThreeAddress; bit isMoveImm; bit isReMaterializable; bit isAsCheapAsAMove; bit VOPAsmPrefer32Bit; bit FPDPRounding; Predicate SubtargetPredicate; string Constraints; string DisableEncoding; list SchedRW; list Uses; list Defs; list OtherPredicates; Predicate AssemblerPredicate; string DecoderNamespace; } //===----------------------------------------------------------------------===// // VOP Subtarget info //===----------------------------------------------------------------------===// class GFXGen { Predicate AssemblerPredicate = pred; string DecoderNamespace = dn; string Suffix = suffix; int Subtarget = sub; } def GFX12Gen : GFXGen; def GFX11Gen : GFXGen; //===----------------------------------------------------------------------===// class VOP { string OpName = opName; } // First 13 insts from VOPDY are also VOPDX. 
// NOTE(review): this span is whitespace-collapsed and its template parameter /
// argument lists appear to have been stripped (for example
// `class VOPD_Component OpIn, string vOPDName>` and `!cast(NAME)` with no
// type) -- TODO restore from the pristine file. The words that open the next
// line are the tail of the comment sentence that ends the preceding line.
// Contents, in order: defvar VOPDX_Max_Index (12); VOPD_Component, which builds
// VOPDName as "v_dual_" followed by vOPDName from index 2 onward and sets
// CanBeVOPDX when VOPDOp <= VOPDX_Max_Index; VOPAnyCommon; VOP_Pseudo;
// VOP3Common; VOP3_Pseudo; VOP3P_Pseudo; VOP_Real; VOP3_Real; VOP3_Real_Gen.
// VOP3_Pseudo derives ReadsModeReg from P.DstVT.isFP or P.Src0VT.isFP and puts
// MODE in Uses only in that case.
// VOP3_Real assigns UseNamedOperandTable twice (1, then the pseudo's value);
// the first assignment looks redundant -- confirm before removing.
// VOP3_Real_Gen appends "_FAKE16" to the decoder namespace when
// ps.Pfl.IsRealTrue16 is false.
DOT2ACC_F32_BF16 is omitted defvar VOPDX_Max_Index = 12; class VOPD_Component OpIn, string vOPDName> { Instruction BaseVOP = !cast(NAME); string VOPDName = "v_dual_" # !substr(vOPDName, 2); bits<5> VOPDOp = OpIn; bit CanBeVOPDX = !le(VOPDOp, VOPDX_Max_Index); } class VOPAnyCommon pattern> : InstSI { let mayLoad = 0; let mayStore = 0; let hasSideEffects = 0; let UseNamedOperandTable = 1; let VALU = 1; let Uses = !if(ReadsModeReg, [MODE, EXEC], [EXEC]); } class VOP_Pseudo pattern> : InstSI , VOP , SIMCInstr { let isPseudo = 1; let isCodeGenOnly = 1; let UseNamedOperandTable = 1; string Mnemonic = opName; Instruction Opcode = !cast(NAME); bit IsTrue16 = P.IsTrue16; VOPProfile Pfl = P; string AsmOperands; } class VOP3Common pattern = [], bit HasMods = 0> : VOPAnyCommon { // Using complex patterns gives VOP3 patterns a very high complexity rating, // but standalone patterns are almost always preferred, so we need to adjust the // priority lower. The goal is to use a high number to reduce complexity to // zero (or less than zero). let AddedComplexity = -1000; let VOP3 = 1; let AsmVariantName = AMDGPUAsmVariants.VOP3; let AsmMatchConverter = !if(HasMods, "cvtVOP3", ""); let isCodeGenOnly = 0; int Size = 8; // Because SGPRs may be allowed if there are multiple operands, we // need a post-isel hook to insert copies in order to avoid // violating constant bus requirements. let hasPostISelHook = 1; } class VOP3_Pseudo pattern = [], bit isVOP3P = 0, bit isVop3OpSel = 0> : VOP_Pseudo { let VOP3_OPSEL = isVop3OpSel; let IsPacked = P.IsPacked; let IsMAI = P.IsMAI; let IsWMMA = P.IsWMMA; let IsSWMMAC = P.IsSWMMAC; let AsmOperands = !if(isVop3OpSel, P.AsmVOP3OpSel, !if(!and(isVOP3P, P.IsPacked), P.AsmVOP3P, P.Asm64)); let Size = 8; let mayLoad = 0; let mayStore = 0; let hasSideEffects = 0; // Because SGPRs may be allowed if there are multiple operands, we // need a post-isel hook to insert copies in order to avoid // violating constant bus requirements. 
let hasPostISelHook = 1; // Using complex patterns gives VOP3 patterns a very high complexity rating, // but standalone patterns are almost always preferred, so we need to adjust the // priority lower. The goal is to use a high number to reduce complexity to // zero (or less than zero). let AddedComplexity = -1000; let VOP3 = 1; let VALU = 1; let FPClamp = P.HasFPClamp; let IntClamp = P.HasIntClamp; let ClampLo = P.HasClampLo; let ClampHi = P.HasClampHi; let ReadsModeReg = !or(P.DstVT.isFP, P.Src0VT.isFP); let mayRaiseFPException = ReadsModeReg; let Uses = !if(ReadsModeReg, [MODE, EXEC], [EXEC]); let AsmVariantName = AMDGPUAsmVariants.VOP3; let AsmMatchConverter = !if(isVOP3P, "cvtVOP3P", !if(!or(P.HasModifiers, P.HasOMod, P.HasIntClamp), "cvtVOP3", "")); } class VOP3P_Pseudo pattern = []> : VOP3_Pseudo { let VOP3P = 1; let IsDOT = P.IsDOT; } class VOP_Real { Instruction Opcode = !cast(NAME); bit IsSingle = ps.Pfl.IsSingle; } class VOP3_Real : VOP_Real , InstSI , SIMCInstr { let VALU = 1; let VOP3 = 1; let isPseudo = 0; let isCodeGenOnly = 0; let UseNamedOperandTable = 1; // copy relevant pseudo op flags let SubtargetPredicate = ps.SubtargetPredicate; let OtherPredicates = ps.OtherPredicates; let AsmMatchConverter = ps.AsmMatchConverter; let AsmVariantName = ps.AsmVariantName; let Constraints = ps.Constraints; let DisableEncoding = ps.DisableEncoding; let TSFlags = ps.TSFlags; let UseNamedOperandTable = ps.UseNamedOperandTable; let Uses = ps.Uses; let Defs = ps.Defs; let SchedRW = ps.SchedRW; let mayLoad = ps.mayLoad; let mayStore = ps.mayStore; let TRANS = ps.TRANS; VOPProfile Pfl = ps.Pfl; } class VOP3_Real_Gen : VOP3_Real { let AssemblerPredicate = Gen.AssemblerPredicate; let OtherPredicates = !if(ps.Pfl.IsRealTrue16, [UseRealTrue16Insts], []); let DecoderNamespace = Gen.DecoderNamespace# !if(ps.Pfl.IsRealTrue16, "", "_FAKE16"); } // XXX - Is there any reason to distinguish this from regular VOP3 // here? 
// NOTE(review): whitespace-collapsed span with template parameter / argument
// lists apparently stripped; the blank lines between a parent class name and
// the following `{` look like a lost argument list -- TODO restore from the
// pristine file.
// Contents, in order: VOP3P_Real (uses empty Constraints when the first six
// characters of ps.Mnemonic are "v_wmma"), VOP3P_Real_Gen, the VOP3a / VOP3e /
// VOP3OpSel / VOP3Interp encodings, VOP3be, VOP3Pe, VOP3Pe_MAI, VOP3Pe_SMFMAC,
// the per-generation VOP3Pe / VOP3be variants, the SDWA constant table, and
// VOP_SDWAe.
// Encoding differences visible here: VOP3a and VOP3be set Inst{31-26} = 0x34 and
// their gfx10 variants override it with 0x35; the gfx6_gfx7 variants place op in
// Inst{25-17} (VOP3a_gfx6_gfx7 puts clamp in bit 11) while the gfx10 and vi
// variants use Inst{25-16} with clamp in bit 15; VOP3Pe uses 0x1a7 in
// Inst{31-23} and VOP3Pe_gfx10 overrides it with 0x198.
class VOP3P_Real : VOP3_Real { // The v_wmma pseudos have extra constraints that we do not want to impose on the real instruction. let Constraints = !if(!eq(!substr(ps.Mnemonic,0,6), "v_wmma"), "", ps.Constraints); } class VOP3P_Real_Gen : VOP3P_Real { let AssemblerPredicate = Gen.AssemblerPredicate; let DecoderNamespace = Gen.DecoderNamespace; } class VOP3a : Enc64 { bits<4> src0_modifiers; bits<9> src0; bits<3> src1_modifiers; bits<9> src1; bits<3> src2_modifiers; bits<9> src2; bits<1> clamp; bits<2> omod; let Inst{8} = !if(P.HasSrc0Mods, src0_modifiers{1}, 0); let Inst{9} = !if(P.HasSrc1Mods, src1_modifiers{1}, 0); let Inst{10} = !if(P.HasSrc2Mods, src2_modifiers{1}, 0); let Inst{31-26} = 0x34; //encoding let Inst{40-32} = !if(P.HasSrc0, src0, 0); let Inst{49-41} = !if(P.HasSrc1, src1, 0); let Inst{58-50} = !if(P.HasSrc2, src2, 0); let Inst{60-59} = !if(P.HasOMod, omod, 0); let Inst{61} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); let Inst{62} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0); let Inst{63} = !if(P.HasSrc2Mods, src2_modifiers{0}, 0); } class VOP3a_gfx6_gfx7 op, VOPProfile p> : VOP3a

{ let Inst{11} = !if(p.HasClamp, clamp{0}, 0); let Inst{25-17} = op; } class VOP3a_gfx10 op, VOPProfile p> : VOP3a

{ let Inst{15} = !if(p.HasClamp, clamp{0}, 0); let Inst{25-16} = op; let Inst{31-26} = 0x35; } class VOP3a_gfx11_gfx12 op, VOPProfile p> : VOP3a_gfx10; class VOP3a_vi op, VOPProfile P> : VOP3a

{ let Inst{25-16} = op; let Inst{15} = !if(P.HasClamp, clamp{0}, 0); } class VOP3e_gfx6_gfx7 op, VOPProfile p> : VOP3a_gfx6_gfx7 { bits<8> vdst; let Inst{7-0} = !if(p.EmitDst, vdst{7-0}, 0); } class VOP3e_gfx10 op, VOPProfile p> : VOP3a_gfx10 { bits<8> vdst; let Inst{7-0} = !if(p.EmitDst, vdst{7-0}, 0); } class VOP3e_gfx11_gfx12 op, VOPProfile p> : VOP3e_gfx10; class VOP3e_vi op, VOPProfile P> : VOP3a_vi { bits<8> vdst; let Inst{7-0} = !if(P.EmitDst, vdst{7-0}, 0); } class VOP3OpSel_gfx9 op, VOPProfile P> : VOP3e_vi { let Inst{11} = !if(P.HasSrc0, src0_modifiers{2}, 0); let Inst{12} = !if(P.HasSrc1, src1_modifiers{2}, 0); let Inst{13} = !if(P.HasSrc2, src2_modifiers{2}, 0); let Inst{14} = !if(P.HasDst, src0_modifiers{3}, 0); } class VOP3OpSel_gfx10 op, VOPProfile p> : VOP3e_gfx10 { let Inst{11} = !if(p.HasSrc0, src0_modifiers{2}, 0); let Inst{12} = !if(p.HasSrc1, src1_modifiers{2}, 0); let Inst{13} = !if(p.HasSrc2, src2_modifiers{2}, 0); let Inst{14} = !if(p.HasDst, src0_modifiers{3}, 0); } class VOP3OpSel_gfx11_gfx12 op, VOPProfile p> : VOP3OpSel_gfx10; class VOP3FP8OpSel_gfx11_gfx12 op, VOPProfile p> : VOP3e_gfx10 { let Inst{11} = !if(p.HasSrc0, src0_modifiers{2}, 0); let Inst{12} = !if(p.HasSrc0, src0_modifiers{3}, 0); } class VOP3DotOpSel_gfx11_gfx12 op, VOPProfile p> : VOP3OpSel_gfx11_gfx12{ let Inst{11} = ?; let Inst{12} = ?; } // NB: For V_INTERP* opcodes, src0 is encoded as src1 and vice versa class VOP3Interp_vi op, VOPProfile P> : VOP3e_vi { bits<2> attrchan; bits<6> attr; bits<1> high; let Inst{8} = 0; // No modifiers for src0 let Inst{61} = 0; let Inst{9} = !if(P.HasSrc0Mods, src0_modifiers{1}, 0); let Inst{62} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); let Inst{37-32} = attr; let Inst{39-38} = attrchan; let Inst{40} = !if(P.HasHigh, high, 0); let Inst{49-41} = src0; } class VOP3Interp_gfx10 op, VOPProfile p> : VOP3e_gfx10 { bits<6> attr; bits<2> attrchan; bits<1> high; let Inst{8} = 0; let Inst{9} = !if(p.HasSrc0Mods, src0_modifiers{1}, 0); let 
Inst{37-32} = attr; let Inst{39-38} = attrchan; let Inst{40} = !if(p.HasHigh, high, 0); let Inst{49-41} = src0; let Inst{61} = 0; let Inst{62} = !if(p.HasSrc0Mods, src0_modifiers{0}, 0); } class VOP3Interp_gfx11 op, VOPProfile p> : VOP3Interp_gfx10; class VOP3be : Enc64 { bits<8> vdst; bits<2> src0_modifiers; bits<9> src0; bits<2> src1_modifiers; bits<9> src1; bits<2> src2_modifiers; bits<9> src2; bits<7> sdst; bits<2> omod; let Inst{7-0} = vdst; let Inst{14-8} = sdst; let Inst{31-26} = 0x34; //encoding let Inst{40-32} = !if(P.HasSrc0, src0, 0); let Inst{49-41} = !if(P.HasSrc1, src1, 0); let Inst{58-50} = !if(P.HasSrc2, src2, 0); let Inst{60-59} = !if(P.HasOMod, omod, 0); let Inst{61} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); let Inst{62} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0); let Inst{63} = !if(P.HasSrc2Mods, src2_modifiers{0}, 0); } class VOP3Pe op, VOPProfile P> : Enc64 { bits<8> vdst; bits<4> src0_modifiers; bits<9> src0; bits<4> src1_modifiers; bits<9> src1; bits<4> src2_modifiers; bits<9> src2; bits<1> clamp; bits<2> index_key_8bit; bits<1> index_key_16bit; let Inst{7-0} = vdst; let Inst{8} = !if(P.HasSrc0Mods, src0_modifiers{1}, 0); // neg_hi src0 let Inst{9} = !if(P.HasSrc1Mods, src1_modifiers{1}, 0); // neg_hi src1 let Inst{10} = !if(P.HasSrc2Mods, src2_modifiers{1}, 0); // neg_hi src2 let Inst{11} = !if(!and(P.HasSrc0, P.HasOpSel), src0_modifiers{2}, 0); // op_sel(0) let Inst{12} = !if(!and(P.HasSrc1, P.HasOpSel), src1_modifiers{2}, 0); // op_sel(1) let Inst{13} = !if(!and(P.HasSrc2, P.HasOpSel), src2_modifiers{2}, 0); // op_sel(2) let Inst{14} = !if(!and(P.HasSrc2, P.HasOpSel), src2_modifiers{3}, !if(P.IsDOT, 1, ?)); // op_sel_hi(2) let Inst{15} = !if(P.HasClamp, clamp{0}, 0); let Inst{22-16} = op; let Inst{31-23} = 0x1a7; //encoding let Inst{40-32} = !if(P.HasSrc0, src0, 0); let Inst{49-41} = !if(P.HasSrc1, src1, 0); let Inst{58-50} = !if(P.HasSrc2, src2, 0); let Inst{59} = !if(!and(P.HasSrc0, P.HasOpSel), src0_modifiers{3}, !if(P.IsDOT, 1, ?)); 
// op_sel_hi(0) let Inst{60} = !if(!and(P.HasSrc1, P.HasOpSel), src1_modifiers{3}, !if(P.IsDOT, 1, ?)); // op_sel_hi(1) let Inst{61} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); // neg (lo) let Inst{62} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0); // neg (lo) let Inst{63} = !if(P.HasSrc2Mods, src2_modifiers{0}, 0); // neg (lo) } class VOP3Pe_MAI op, VOPProfile P, bit acc_cd = 0> : Enc64 { bits<8> vdst; bits<10> src0; bits<10> src1; bits<9> src2; bits<3> blgp; bits<3> cbsz; bits<4> abid; let Inst{7-0} = vdst; let Inst{10-8} = !if(P.HasSrc1, cbsz, 0); let Inst{14-11} = !if(P.HasSrc1, abid, 0); let Inst{15} = acc_cd; let Inst{22-16} = op; let Inst{31-23} = 0x1a7; //encoding let Inst{40-32} = !if(P.HasSrc0, src0{8-0}, 0); let Inst{49-41} = !if(P.HasSrc1, src1{8-0}, 0); let Inst{58-50} = !if(P.HasSrc2, src2, 0); let Inst{59} = !if(P.HasSrc0, src0{9}, 0); // acc(0) let Inst{60} = !if(P.HasSrc1, src1{9}, 0); // acc(1) let Inst{63-61} = !if(P.HasSrc1, blgp, 0); } class VOP3Pe_SMFMAC op> : Enc64 { bits<10> vdst; // VGPR or AGPR, but not SGPR. vdst{8} is not encoded in the instruction. bits<10> src0; bits<10> src1; bits<9> idx; bits<3> blgp; bits<3> cbsz; bits<4> abid; let blgp = 0; let Inst{7-0} = vdst{7-0}; let Inst{10-8} = cbsz; let Inst{14-11} = abid; let Inst{15} = vdst{9}; // acc(vdst) let Inst{22-16} = op; let Inst{31-23} = 0x1a7; // encoding let Inst{40-32} = src0{8-0}; let Inst{49-41} = src1{8-0}; let Inst{58-50} = idx; let Inst{59} = src0{9}; // acc(0) let Inst{60} = src1{9}; // acc(1) let Inst{63-61} = blgp; } class VOP3Pe_gfx10 op, VOPProfile P> : VOP3Pe { let Inst{31-23} = 0x198; //encoding } class VOP3Pe_gfx11_gfx12 op, VOPProfile P> : VOP3Pe_gfx10; class VOP3be_gfx6_gfx7 op, VOPProfile p> : VOP3be

{ let Inst{25-17} = op; } class VOP3be_gfx10 op, VOPProfile p> : VOP3be

{ bits<1> clamp; let Inst{15} = !if(p.HasClamp, clamp{0}, 0); let Inst{25-16} = op; let Inst{31-26} = 0x35; } class VOP3be_gfx11_gfx12 op, VOPProfile p> : VOP3be_gfx10; class VOP3be_vi op, VOPProfile P> : VOP3be

{ bits<1> clamp; let Inst{25-16} = op; let Inst{15} = !if(P.HasClamp, clamp{0}, 0); } def SDWA { // sdwa_sel int BYTE_0 = 0; int BYTE_1 = 1; int BYTE_2 = 2; int BYTE_3 = 3; int WORD_0 = 4; int WORD_1 = 5; int DWORD = 6; // dst_unused int UNUSED_PAD = 0; int UNUSED_SEXT = 1; int UNUSED_PRESERVE = 2; } class VOP_SDWAe : Enc64 { bits<8> src0; bits<3> src0_sel; bits<2> src0_modifiers; // float: {abs,neg}, int {sext} bits<3> src1_sel; bits<2> src1_modifiers; bits<3> dst_sel; bits<2> dst_unused; bits<1> clamp; let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0); let Inst{42-40} = !if(P.EmitDstSel, dst_sel{2-0}, ?); let Inst{44-43} = !if(P.EmitDstSel, dst_unused{1-0}, ?); let Inst{45} = !if(P.HasSDWAClamp, clamp{0}, 0); let Inst{50-48} = !if(P.HasSrc0, src0_sel{2-0}, 0); let Inst{51} = !if(P.HasSrc0IntMods, src0_modifiers{0}, 0); let Inst{53-52} = !if(P.HasSrc0FloatMods, src0_modifiers{1-0}, 0); let Inst{58-56} = !if(P.HasSrc1, src1_sel{2-0}, 0); let Inst{59} = !if(P.HasSrc1IntMods, src1_modifiers{0}, 0); let Inst{61-60} = !if(P.HasSrc1FloatMods, src1_modifiers{1-0}, 0); } // GFX9 adds two features to SDWA: // 1. Add 3 fields to the SDWA microcode word: S0, S1 and OMOD. // a. S0 and S1 indicate that source 0 and 1 respectively are SGPRs rather // than VGPRs (at most 1 can be an SGPR); // b. OMOD is the standard output modifier (result *2, *4, /2) // 2. Add a new version of the SDWA microcode word for VOPC: SDWAB. This // replaces OMOD and the dest fields with SD and SDST (SGPR destination) // field. // a. When SD=1, the SDST is used as the destination for the compare result; // b. When SD=0, VCC is used. 
// // In GFX9, V_MAC_F16, V_MAC_F32 opcodes cannot be used with SDWA // gfx9 SDWA basic encoding class VOP_SDWA9e : Enc64 { bits<9> src0; // {src0_sgpr{0}, src0{7-0}} bits<3> src0_sel; bits<2> src0_modifiers; // float: {abs,neg}, int {sext} bits<3> src1_sel; bits<2> src1_modifiers; bits<1> src1_sgpr; let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0); let Inst{50-48} = !if(P.HasSrc0, src0_sel{2-0}, 0); let Inst{51} = !if(P.HasSrc0IntMods, src0_modifiers{0}, 0); let Inst{53-52} = !if(P.HasSrc0FloatMods, src0_modifiers{1-0}, 0); let Inst{55} = !if(P.HasSrc0, src0{8}, 0); let Inst{58-56} = !if(P.HasSrc1, src1_sel{2-0}, 0); let Inst{59} = !if(P.HasSrc1IntMods, src1_modifiers{0}, 0); let Inst{61-60} = !if(P.HasSrc1FloatMods, src1_modifiers{1-0}, 0); let Inst{63} = 0; // src1_sgpr - should be specified in subclass } // gfx9 SDWA-A class VOP_SDWA9Ae : VOP_SDWA9e

{ bits<3> dst_sel; bits<2> dst_unused; bits<1> clamp; bits<2> omod; let Inst{42-40} = !if(P.EmitDstSel, dst_sel{2-0}, ?); let Inst{44-43} = !if(P.EmitDstSel, dst_unused{1-0}, ?); let Inst{45} = !if(P.HasSDWAClamp, clamp{0}, 0); let Inst{47-46} = !if(P.HasSDWAOMod, omod{1-0}, 0); } // gfx9 SDWA-B class VOP_SDWA9Be : VOP_SDWA9e

{ bits<8> sdst; // {vcc_sdst{0}, sdst{6-0}} let Inst{46-40} = !if(P.EmitDst, sdst{6-0}, ?); let Inst{47} = !if(P.EmitDst, sdst{7}, 0); } class VOP_SDWA_Pseudo pattern=[]> : InstSI , VOP , SIMCInstr { let isPseudo = 1; let isCodeGenOnly = 1; let UseNamedOperandTable = 1; string Mnemonic = opName; string AsmOperands = P.AsmSDWA; string AsmOperands9 = P.AsmSDWA9; let Size = 8; let mayLoad = 0; let mayStore = 0; let hasSideEffects = 0; let VALU = 1; let SDWA = 1; let ReadsModeReg = !or(P.DstVT.isFP, P.Src0VT.isFP); let mayRaiseFPException = ReadsModeReg; let Uses = !if(ReadsModeReg, [MODE, EXEC], [EXEC]); let SubtargetPredicate = HasSDWA; let AssemblerPredicate = HasSDWA; let AsmVariantName = !if(P.HasExtSDWA, AMDGPUAsmVariants.SDWA, AMDGPUAsmVariants.Disable); let DecoderNamespace = "SDWA"; VOPProfile Pfl = P; } class VOP_SDWA_Real : InstSI , SIMCInstr { let VALU = 1; let SDWA = 1; let isPseudo = 0; let isCodeGenOnly = 0; let Defs = ps.Defs; let Uses = ps.Uses; let hasSideEffects = ps.hasSideEffects; let Constraints = ps.Constraints; let DisableEncoding = ps.DisableEncoding; // Copy relevant pseudo op flags let SubtargetPredicate = ps.SubtargetPredicate; let AssemblerPredicate = ps.AssemblerPredicate; let AsmMatchConverter = ps.AsmMatchConverter; let AsmVariantName = ps.AsmVariantName; let UseNamedOperandTable = ps.UseNamedOperandTable; let DecoderNamespace = ps.DecoderNamespace; let Constraints = ps.Constraints; let DisableEncoding = ps.DisableEncoding; let TSFlags = ps.TSFlags; let SchedRW = ps.SchedRW; let mayLoad = ps.mayLoad; let mayStore = ps.mayStore; let TRANS = ps.TRANS; } class Base_VOP_SDWA9_Real : InstSI { let VALU = 1; let SDWA = 1; let isPseudo = 0; let isCodeGenOnly = 0; let Defs = ps.Defs; let Uses = ps.Uses; let hasSideEffects = ps.hasSideEffects; let Constraints = ps.Constraints; let DisableEncoding = ps.DisableEncoding; let SubtargetPredicate = HasSDWA9; let AssemblerPredicate = HasSDWA9; let AsmVariantName = !if(ps.Pfl.HasExtSDWA9, 
AMDGPUAsmVariants.SDWA9, AMDGPUAsmVariants.Disable); let DecoderNamespace = "SDWA9"; // Copy relevant pseudo op flags let AsmMatchConverter = ps.AsmMatchConverter; let UseNamedOperandTable = ps.UseNamedOperandTable; let Constraints = ps.Constraints; let DisableEncoding = ps.DisableEncoding; let TSFlags = ps.TSFlags; let SchedRW = ps.SchedRW; let mayLoad = ps.mayLoad; let mayStore = ps.mayStore; let TRANS = ps.TRANS; } class VOP_SDWA9_Real : Base_VOP_SDWA9_Real , SIMCInstr ; class Base_VOP_SDWA10_Real : Base_VOP_SDWA9_Real { let SubtargetPredicate = HasSDWA10; let AssemblerPredicate = HasSDWA10; let DecoderNamespace = "SDWA10"; } class VOP_SDWA10_Real : Base_VOP_SDWA10_Real, SIMCInstr; class VOP_DPPe : Enc64 { bits<2> src0_modifiers; bits<8> src0; bits<2> src1_modifiers; bits<9> dpp_ctrl; bits<1> bound_ctrl; bits<4> bank_mask; bits<4> row_mask; bit fi; let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0); let Inst{48-40} = dpp_ctrl; let Inst{50} = !if(IsDPP16, fi, ?); let Inst{51} = bound_ctrl; let Inst{52} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); // src0_neg let Inst{53} = !if(P.HasSrc0Mods, src0_modifiers{1}, 0); // src0_abs let Inst{54} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0); // src1_neg let Inst{55} = !if(P.HasSrc1Mods, src1_modifiers{1}, 0); // src1_abs let Inst{59-56} = bank_mask; let Inst{63-60} = row_mask; } class VOP3_DPPe_Fields_Base { bits<9> dpp_ctrl; bits<1> bound_ctrl; bits<4> bank_mask; bits<4> row_mask; bit fi; } class VOP3_DPPe_Fields : VOP3_DPPe_Fields_Base { bits<8> src0; } // Common refers to common between DPP and DPP8 class VOP3_DPPe_Common_Base op, VOPProfile P> : Enc96 { bits<4> src0_modifiers; bits<3> src1_modifiers; bits<3> src2_modifiers; bits<1> clamp; bits<2> omod; let Inst{8} = !if(P.HasSrc0Mods, src0_modifiers{1}, 0); let Inst{9} = !if(P.HasSrc1Mods, src1_modifiers{1}, 0); let Inst{10} = !if(P.HasSrc2Mods, src2_modifiers{1}, 0); // OPSEL must be set such that the low result only uses low inputs, and the high result only uses high 
inputs. let Inst{11} = !if(P.HasOpSel,!if(P.HasSrc0Mods, src0_modifiers{2}, 0),?); let Inst{12} = !if(P.HasOpSel,!if(P.HasSrc1Mods, src1_modifiers{2}, !if((P.IsFP8), src0_modifiers{3}, 0)), ?); let Inst{13} = !if(P.HasOpSel,!if(P.HasSrc2Mods, src2_modifiers{2}, 0),?); let Inst{14} = !if(P.HasOpSel,!if(P.HasSrc0Mods, src0_modifiers{3}, 0),?); let Inst{15} = !if(P.HasClamp, clamp, 0); let Inst{25-16} = op; let Inst{31-26} = 0x35; let Inst{60-59} = !if(P.HasOMod, omod, 0); let Inst{61} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); let Inst{62} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0); let Inst{63} = !if(P.HasSrc2Mods, src2_modifiers{0}, 0); } class VOP3_DPPe_Common op, VOPProfile P> : VOP3_DPPe_Common_Base { bits<8> vdst; bits<9> src1; bits<9> src2; let Inst{7-0} = !if(P.EmitDst, vdst{7-0}, 0); let Inst{49-41} = !if(P.HasSrc1, src1, 0); let Inst{58-50} = !if(P.HasSrc2, src2, 0); } class VOP3P_DPPe_Common_Base op, VOPProfile P> : Enc96 { bits<4> src0_modifiers; bits<4> src1_modifiers; bits<4> src2_modifiers; bits<1> clamp; let Inst{8} = !if(P.HasSrc0Mods, src0_modifiers{1}, 0); // neg_hi src0 let Inst{9} = !if(P.HasSrc1Mods, src1_modifiers{1}, 0); // neg_hi src1 let Inst{10} = !if(P.HasSrc2Mods, src2_modifiers{1}, 0); // neg_hi src2 let Inst{11} = !if(!and(P.HasSrc0, P.HasOpSel), src0_modifiers{2}, 0); // op_sel(0) let Inst{12} = !if(!and(P.HasSrc1, P.HasOpSel), src1_modifiers{2}, 0); // op_sel(1) let Inst{13} = !if(!and(P.HasSrc2, P.HasOpSel), src2_modifiers{2}, 0); // op_sel(2) let Inst{14} = !if(!and(P.HasSrc2, P.HasOpSel), src2_modifiers{3}, !if(P.IsDOT, 1, ?)); // op_sel_hi(2) let Inst{15} = !if(P.HasClamp, clamp{0}, 0); let Inst{22-16} = op; let Inst{31-23} = 0x198; // encoding let Inst{59} = !if(!and(P.HasSrc0, P.HasOpSel), src0_modifiers{3}, !if(P.IsDOT, 1, ?)); // op_sel_hi(0) let Inst{60} = !if(!and(P.HasSrc1, P.HasOpSel), src1_modifiers{3}, !if(P.IsDOT, 1, ?)); // op_sel_hi(1) let Inst{61} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); // neg (lo) let Inst{62} 
= !if(P.HasSrc1Mods, src1_modifiers{0}, 0); // neg (lo) let Inst{63} = !if(P.HasSrc2Mods, src2_modifiers{0}, 0); // neg (lo) } class VOP3P_DPPe_Common op, VOPProfile P> : VOP3P_DPPe_Common_Base { bits<8> vdst; bits<9> src1; bits<9> src2; let Inst{7-0} = vdst; let Inst{49-41} = !if(P.HasSrc1, src1, 0); let Inst{58-50} = !if(P.HasSrc2, src2, 0); } class VOP_DPP_Pseudo pattern=[], dag Ins = P.InsDPP, string asmOps = P.AsmDPP> : InstSI , VOP , SIMCInstr { let isPseudo = 1; let isCodeGenOnly = 1; let mayLoad = 0; let mayStore = 0; let hasSideEffects = 0; let UseNamedOperandTable = 1; let VALU = 1; let DPP = 1; let Size = 8; let ReadsModeReg = !or(P.DstVT.isFP, P.Src0VT.isFP); let mayRaiseFPException = ReadsModeReg; let Uses = !if(ReadsModeReg, [MODE, EXEC], [EXEC]); let isConvergent = 1; string Mnemonic = OpName; string AsmOperands = asmOps; let AsmMatchConverter = !if(P.HasModifiers, "cvtDPP", ""); let SubtargetPredicate = !if(P.HasExt64BitDPP, HasDPALU_DPP, HasDPP); let AssemblerPredicate = !if(P.HasExt64BitDPP, HasDPALU_DPP, HasDPP); let AsmVariantName = !if(P.HasExtDPP, AMDGPUAsmVariants.DPP, AMDGPUAsmVariants.Disable); let Constraints = !if(P.NumSrcArgs, P.TieRegDPP # " = $vdst", ""); let DisableEncoding = !if(P.NumSrcArgs, P.TieRegDPP, ""); let DecoderNamespace = "DPP"; VOPProfile Pfl = P; } class VOP3_DPP_Pseudo : VOP_DPP_Pseudo { let PseudoInstr = OpName#"_e64"#"_dpp"; let OutOperandList = P.OutsVOP3DPP; let Size = 12; let VOP3 = 1; let AsmMatchConverter = "cvtVOP3DPP"; let AsmVariantName = !if(P.HasExtVOP3DPP, AMDGPUAsmVariants.VOP3_DPP, AMDGPUAsmVariants.Disable); } class VOP_DPP_Real : InstSI , SIMCInstr { let VALU = 1; let DPP = 1; let isPseudo = 0; let isCodeGenOnly = 0; let Defs = ps.Defs; let Uses = ps.Uses; let hasSideEffects = ps.hasSideEffects; let Constraints = ps.Constraints; let DisableEncoding = ps.DisableEncoding; // Copy relevant pseudo op flags let isConvergent = ps.isConvergent; let SubtargetPredicate = ps.SubtargetPredicate; let 
AssemblerPredicate = ps.AssemblerPredicate; let OtherPredicates = ps.OtherPredicates; let AsmMatchConverter = ps.AsmMatchConverter; let AsmVariantName = ps.AsmVariantName; let UseNamedOperandTable = ps.UseNamedOperandTable; let DecoderNamespace = ps.DecoderNamespace; let Constraints = ps.Constraints; let DisableEncoding = ps.DisableEncoding; let TSFlags = ps.TSFlags; let SchedRW = ps.SchedRW; let mayLoad = ps.mayLoad; let mayStore = ps.mayStore; let TRANS = ps.TRANS; } class VOP_DPP_Base : InstSI { let mayLoad = 0; let mayStore = 0; let hasSideEffects = 0; let UseNamedOperandTable = 1; let VALU = 1; let DPP = 1; let Size = 8; let AsmMatchConverter = !if(P.HasModifiers, "cvtDPP", ""); let SubtargetPredicate = !if(P.HasExt64BitDPP, HasDPALU_DPP, HasDPP); let AssemblerPredicate = !if(P.HasExt64BitDPP, HasDPALU_DPP, HasDPP); let AsmVariantName = !if(P.HasExtDPP, AMDGPUAsmVariants.DPP, AMDGPUAsmVariants.Disable); let Constraints = !if(P.NumSrcArgs, P.TieRegDPP # " = $vdst", ""); let DisableEncoding = !if(P.NumSrcArgs, P.TieRegDPP, ""); let DecoderNamespace = "DPP"; } class VOP_DPP : VOP_DPP_Base, VOP_DPPe; class VOP3_DPP_Base : VOP_DPP_Base { let OutOperandList = P.OutsVOP3DPP; let AsmMatchConverter = "cvtVOP3DPP"; let VOP3 = 1; let AsmVariantName = !if(P.HasExtVOP3DPP, AMDGPUAsmVariants.VOP3_DPP, AMDGPUAsmVariants.Disable); let Size = 12; } class VOP3_DPP op, string OpName, VOPProfile P, bit IsDPP16, dag InsDPP = !if(IsDPP16, P.InsVOP3DPP16, P.InsVOP3DPP), string AsmDPP = !if(IsDPP16, P.AsmVOP3DPP16, P.AsmVOP3DPP)> : VOP3_DPP_Base, VOP3_DPPe_Common, VOP3_DPPe_Fields { let Inst{40-32} = 0xfa; let Inst{71-64} = !if(P.HasSrc0, src0{7-0}, 0); let Inst{80-72} = dpp_ctrl; let Inst{82} = !if(IsDPP16, fi, ?); let Inst{83} = bound_ctrl; // Inst{87-84} ignored by hw let Inst{91-88} = bank_mask; let Inst{95-92} = row_mask; } class VOP3P_DPP op, string OpName, VOPProfile P, bit IsDPP16, dag InsDPP = !if(IsDPP16, P.InsVOP3DPP16, P.InsVOP3DPP), string AsmDPP = !if(IsDPP16, 
P.AsmVOP3DPP16, P.AsmVOP3DPP)> : VOP3_DPP_Base, VOP3P_DPPe_Common, VOP3_DPPe_Fields { let VOP3P = 1; let Inst{40-32} = 0xfa; let Inst{71-64} = !if(P.HasSrc0, src0{7-0}, 0); let Inst{80-72} = dpp_ctrl; let Inst{82} = !if(IsDPP16, fi, ?); let Inst{83} = bound_ctrl; // Inst{87-84} ignored by hw let Inst{91-88} = bank_mask; let Inst{95-92} = row_mask; } class VOP_DPP8e : Enc64 { bits<8> src0; bits<24> dpp8; bits<9> fi; let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0); let Inst{63-40} = dpp8{23-0}; } class VOP3_DPP8e_Fields { bits<8> src0; bits<24> dpp8; bits<9> fi; } class VOP_DPP8_Base : InstSI { let mayLoad = 0; let mayStore = 0; let hasSideEffects = 0; let UseNamedOperandTable = 1; let VALU = 1; let DPP = 1; let Size = 8; let AsmMatchConverter = "cvtDPP8"; let SubtargetPredicate = HasDPP8; let AssemblerPredicate = HasDPP8; let AsmVariantName = AMDGPUAsmVariants.DPP; let Constraints = !if(P.NumSrcArgs, P.TieRegDPP # " = $vdst", ""); let DisableEncoding = !if(P.NumSrcArgs, P.TieRegDPP, ""); } class VOP_DPP8 : VOP_DPP8_Base, VOP_DPP8e

; class VOP3_DPP8_Base : VOP_DPP8_Base { let OutOperandList = P.OutsVOP3DPP8; let AsmMatchConverter = "cvtVOP3DPP8"; let AsmVariantName = !if(P.HasExtVOP3DPP, AMDGPUAsmVariants.VOP3_DPP, AMDGPUAsmVariants.Disable); let VOP3 = 1; let Size = 12; } class VOP3_DPP8 op, string OpName, VOPProfile P> : VOP3_DPP8_Base, VOP3_DPPe_Common, VOP3_DPP8e_Fields { let Inst{40-32} = fi; let Inst{71-64} = !if(P.HasSrc0, src0{7-0}, 0); let Inst{95-72} = dpp8{23-0}; } class VOP3P_DPP8 op, string OpName, VOPProfile P> : VOP3_DPP8_Base, VOP3P_DPPe_Common, VOP3_DPP8e_Fields { let VOP3P = 1; let Inst{40-32} = fi; let Inst{71-64} = !if(P.HasSrc0, src0{7-0}, 0); let Inst{95-72} = dpp8{23-0}; } def DPP8Mode { int FI_0 = 0xE9; int FI_1 = 0xEA; } class getNumNodeArgs { SDNode N = !cast(Op); SDTypeProfile TP = N.TypeProfile; int ret = TP.NumOperands; } class getDivergentFrag { assert !or(!isa(Op), !isa(Op)), "Expected SDNode or PatFrags"; int NumSrcArgs = !if(!isa(Op), getNumNodeArgs.ret, !size(!cast(Op).Operands)); PatFrag ret = PatFrag < !if(!eq(NumSrcArgs, 1), (ops node:$src0), !if(!eq(NumSrcArgs, 2), (ops node:$src0, node:$src1), (ops node:$src0, node:$src1, node:$src2))), !if(!eq(NumSrcArgs, 1), (Op $src0), !if(!eq(NumSrcArgs, 2), (Op $src0, $src1), (Op $src0, $src1, $src2))), [{ return N->isDivergent(); }] >; } class VOPPatGen { PatFrag Operator = getDivergentFrag < Op >.ret; dag Ins = !foreach(tmp, P.Ins32, !subst(ins, Operator, !subst(P.Src0RC32, P.Src0VT, !subst(P.Src1RC32, P.Src1VT, tmp)))); dag Outs = !foreach(tmp, P.Outs32, !subst(outs, set, !subst(P.DstRC, P.DstVT, tmp))); list ret = [!con(Outs, (set Ins))]; } class DivergentUnaryFrag : PatFrag < (ops node:$src0), (Op $src0), [{ return N->isDivergent(); }]> { // This check is unnecessary as it's captured by the result register // bank constraint. // // FIXME: Should add a way for the emitter to recognize this is a // trivially true predicate to eliminate the check. 
// Tail of a class body opened on the previous source line: the GlobalISel
// predicate code is a constant 'true'.
  let GISelPredicateCode = [{return true;}];
}

// Yields the VOPPatGen pattern list unless the profile's NeedPatGen equals
// PatGenMode.NoPattern, in which case the list is empty.
class VOPPatOrNull {
  list ret = !if(!ne(P.NeedPatGen,PatGenMode.NoPattern), VOPPatGen.ret, []);
}

// Selects the operator to match on: when NeedPatGen is PatGenMode.Pattern and
// the !isa test on Op succeeds, the divergent fragment from getDivergentFrag
// is used; in every other case Op is passed through unchanged.
class DivergentFragOrOp {
  SDPatternOperator ret = !if(!eq(P.NeedPatGen,PatGenMode.Pattern),
    !if(!isa(Op), getDivergentFrag.ret, Op), Op);
}

// Picks VSrc_b32 when vt.Size is 32 and VSrc_b16 for any other size.
class getVSrcOp {
  RegisterOperand ret = !if(!eq(vt.Size, 32), VSrc_b32, VSrc_b16);
}

// Class for binary integer operations with the clamp bit set for saturation
// TODO: Add sub with negated inline constant pattern.
class VOPBinOpClampPat :
  GCNPat<(node vt:$src0, vt:$src1),
         (inst getVSrcOp.ret:$src0, getVSrcOp.ret:$src1,
          DSTCLAMP.ENABLE)
>;

//===----------------------------------------------------------------------===//
// VOP3 Classes
//===----------------------------------------------------------------------===//

// Pattern lists for VOP3 with source modifiers. src0 is matched through
// VOP3Mods0 (with $omod only when the profile has OMod); src1/src2 go through
// VOP3Mods. 'ret' picks ret3/ret2/ret1 by P.NumSrcArgs, defaulting to ret1
// for any count other than 3 or 2.
class getVOP3ModPat {
  dag src0 = !if(P.HasOMod,
    (VOP3Mods0 P.Src0VT:$src0, i32:$src0_modifiers, i1:$clamp, i32:$omod),
    (VOP3Mods0 P.Src0VT:$src0, i32:$src0_modifiers, i1:$clamp));

  list ret3 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret (P.Src0VT src0),
      (P.Src1VT (VOP3Mods P.Src1VT:$src1, i32:$src1_modifiers)),
      (P.Src2VT (VOP3Mods P.Src2VT:$src2, i32:$src2_modifiers))))];

  list ret2 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret (P.Src0VT src0),
      (P.Src1VT (VOP3Mods P.Src1VT:$src1, i32:$src1_modifiers))))];

  list ret1 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret (P.Src0VT src0)))];

  list ret = !if(!eq(P.NumSrcArgs, 3), ret3,
             !if(!eq(P.NumSrcArgs, 2), ret2,
             ret1));
}

// Pattern lists where every source is matched through SrcPat, with an
// optional trailing immediate clamp operand appended when HasExplicitClamp is
// set. The class body continues on the next source line.
class getVOP3PModPat {
  dag src0_dag = (P.Src0VT (SrcPat P.Src0VT:$src0, i32:$src0_modifiers));
  dag src1_dag = (P.Src1VT (SrcPat P.Src1VT:$src1, i32:$src1_modifiers));
  dag src2_dag = (P.Src2VT (SrcPat P.Src2VT:$src2, i32:$src2_modifiers));
  dag clamp_dag = (i1 timm:$clamp);

  list ret3 = [(set P.DstVT:$vdst,
    !if(HasExplicitClamp,
      (DivergentFragOrOp.ret src0_dag, src1_dag, src2_dag, clamp_dag),
      (DivergentFragOrOp.ret src0_dag, src1_dag, src2_dag)))];

  list ret2 = [(set P.DstVT:$vdst,
    !if(HasExplicitClamp,
// Continuation of the two-source pattern expression begun on the previous
// source line.
      (DivergentFragOrOp.ret src0_dag, src1_dag, clamp_dag),
      (DivergentFragOrOp.ret src0_dag, src1_dag)))];

  list ret1 = [(set P.DstVT:$vdst,
    !if(HasExplicitClamp,
      (DivergentFragOrOp.ret src0_dag, clamp_dag),
      (DivergentFragOrOp.ret src0_dag)))];

  // Choose by source count; anything other than 3 or 2 falls back to ret1.
  list ret = !if(!eq(P.NumSrcArgs, 3), ret3,
             !if(!eq(P.NumSrcArgs, 2), ret2,
             ret1));
}

// Pattern lists where every source is matched through VOP3OpSel. 'ret' picks
// ret3/ret2/ret1 by P.NumSrcArgs.
class getVOP3OpSelPat {
  list ret3 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret
      (P.Src0VT (VOP3OpSel P.Src0VT:$src0, i32:$src0_modifiers)),
      (P.Src1VT (VOP3OpSel P.Src1VT:$src1, i32:$src1_modifiers)),
      (P.Src2VT (VOP3OpSel P.Src2VT:$src2, i32:$src2_modifiers))))];

  list ret2 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret
      (P.Src0VT (VOP3OpSel P.Src0VT:$src0, i32:$src0_modifiers)),
      (P.Src1VT (VOP3OpSel P.Src1VT:$src1, i32:$src1_modifiers))))];

  list ret1 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret
      (P.Src0VT (VOP3OpSel P.Src0VT:$src0, i32:$src0_modifiers))))];

  list ret = !if(!eq(P.NumSrcArgs, 3), ret3,
             !if(!eq(P.NumSrcArgs, 2), ret2,
             ret1));
}

// Pattern lists where every source is matched through VOP3OpSelMods.
// NOTE(review): in ret3 and ret2 both arms of the !if(P.HasClamp, ...) on
// src0 are textually identical, so the condition has no effect on the result
// as written.
class getVOP3OpSelModPat {
  list ret3 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret
      (P.Src0VT !if(P.HasClamp,
        (VOP3OpSelMods P.Src0VT:$src0, i32:$src0_modifiers),
        (VOP3OpSelMods P.Src0VT:$src0, i32:$src0_modifiers))),
      (P.Src1VT (VOP3OpSelMods P.Src1VT:$src1, i32:$src1_modifiers)),
      (P.Src2VT (VOP3OpSelMods P.Src2VT:$src2, i32:$src2_modifiers))))];

  list ret2 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret
      !if(P.HasClamp,
        (P.Src0VT (VOP3OpSelMods P.Src0VT:$src0, i32:$src0_modifiers)),
        (P.Src0VT (VOP3OpSelMods P.Src0VT:$src0, i32:$src0_modifiers))),
      (P.Src1VT (VOP3OpSelMods P.Src1VT:$src1, i32:$src1_modifiers))))];

  list ret1 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret
      (P.Src0VT (VOP3OpSelMods P.Src0VT:$src0, i32:$src0_modifiers))))];

  list ret = !if(!eq(P.NumSrcArgs, 3), ret3,
             !if(!eq(P.NumSrcArgs, 2), ret2,
             ret1));
}

// Single two-source pattern applying 'node' directly to $src0 and $src1,
// with no modifier matching.
class getVOP3FromVOP2Pat {
  list ret = [(set P.DstVT:$vdst, (node P.Src0VT:$src0, P.Src1VT:$src1))];
}

// In VOP1, we can have clamp and omod even if !HasModifiers
// The src0 expression of this class continues on the next source line.
class getVOP3Pat {
  dag src0 =
// Continuation of the src0 expression begun on the previous source line:
// VOP3Mods0 receives $clamp and/or $omod depending on the profile's HasClamp
// and HasOMod flags.
    !if(P.HasOMod,
      !if(P.HasClamp,
          (VOP3Mods0 P.Src0VT:$src0, i1:$clamp, i32:$omod),
          (VOP3Mods0 P.Src0VT:$src0, i32:$omod)), // impossible?
      !if(P.HasClamp,
          (VOP3Mods0 P.Src0VT:$src0, i1:$clamp),
          (VOP3Mods0 P.Src0VT:$src0))
    );

  list ret3 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret (P.Src0VT src0), P.Src1VT:$src1, P.Src2VT:$src2))];

  list ret2 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret (P.Src0VT src0), P.Src1VT:$src1))];

  list ret1 = [(set P.DstVT:$vdst,
    (DivergentFragOrOp.ret (P.Src0VT src0)))];

  // Choose by source count; anything other than 3 or 2 falls back to ret1.
  list ret = !if(!eq(P.NumSrcArgs, 3), ret3,
             !if(!eq(P.NumSrcArgs, 2), ret2,
             ret1));
}

// Pattern lists that apply 'node' to the plain sources followed by an
// i1 $clamp operand. 'ret' picks ret3/ret2/ret1 by P.NumSrcArgs.
class getVOP3ClampPat {
  list ret3 = [(set P.DstVT:$vdst,
    (node P.Src0VT:$src0, P.Src1VT:$src1, P.Src2VT:$src2, i1:$clamp))];
  list ret2 = [(set P.DstVT:$vdst,
    (node P.Src0VT:$src0, P.Src1VT:$src1, i1:$clamp))];
  list ret1 = [(set P.DstVT:$vdst,
    (node P.Src0VT:$src0, i1:$clamp))];
  list ret = !if(!eq(P.NumSrcArgs, 3), ret3,
             !if(!eq(P.NumSrcArgs, 2), ret2,
             ret1));
}

// Two alternative three-source patterns, selected by whether Src0VT equals
// Src1VT. The first carries $cbsz/$abid/$blgp immediates; the second carries
// an i32 $idx followed by $cbsz/$abid.
class getVOP3MAIPat {
  list ret = !if(!eq(P.Src0VT, P.Src1VT),
    // mfma
    [(set P.DstVT:$vdst,
      (node P.Src0VT:$src0, P.Src1VT:$src1, P.Src2VT:$src2,
            timm:$cbsz, timm:$abid, timm:$blgp))],
    // smfmac
    [(set P.DstVT:$vdst,
      (node P.Src0VT:$src0, P.Src1VT:$src1, P.Src2VT:$src2, i32:$idx,
            timm:$cbsz, timm:$abid))]);
}

// Bundle of four feature bits copied from the names Clamp, OpSel, Packed and
// MAI.
// NOTE(review): those names are not declared on the header in the text as
// given -- confirm the template parameter list.
class VOP3Features {
  bit HasClamp = Clamp;
  bit HasOpSel = OpSel;
  bit IsPacked = Packed;
  bit IsMAI = MAI;
}

// Predefined feature combinations, in the order (Clamp, OpSel, Packed, MAI).
def VOP3_REGULAR : VOP3Features<0, 0, 0, 0>;
def VOP3_CLAMP : VOP3Features<1, 0, 0, 0>;
def VOP3_OPSEL : VOP3Features<1, 1, 0, 0>;
def VOP3_PACKED : VOP3Features<1, 1, 1, 0>;
def VOP3_MAI : VOP3Features<0, 0, 0, 1>;

// Profile that overlays Features on top of P: each flag is forced to 1 when
// the corresponding Features bit is set and otherwise taken from P.
// HasModifiers is 0 whenever Features.IsMAI is set; otherwise it is the OR of
// Features.IsPacked, Features.HasOpSel and P.HasModifiers.
class VOP3_Profile_Base : VOPProfile {

  let HasClamp = !if(Features.HasClamp, 1, P.HasClamp);
  let HasOpSel = !if(Features.HasOpSel, 1, P.HasOpSel);
  let IsMAI = !if(Features.IsMAI, 1, P.IsMAI);
  let IsPacked = !if(Features.IsPacked, 1, P.IsPacked);

  let HasModifiers =
    !if (Features.IsMAI, 0,
         !or(Features.IsPacked, Features.HasOpSel, P.HasModifiers));
}

// VOP3_Profile_Base with IsSingle set.
class VOP3_Profile : VOP3_Profile_Base {
  let IsSingle = 1;
}

// consistently gives instructions a _e64 suffix
multiclass VOP3Inst_Pseudo_Wrapper pattern = [], bit VOP3Only = 0> {
  def _e64 : VOP3_Pseudo;
}

// VOP3 pseudo whose pattern list is chosen by a chain of profile tests. In
// the visible part of the chain the order is: HasModifiers, IsVOP2,
// HasIntClamp, IsMAI, and finally the plain getVOP3Pat fallback.
// NOTE(review): the start of this header (template parameters and the first
// arm of the selection) is incomplete in the text as given -- confirm.
class VOP3InstBase : VOP3_Pseudo.ret, getVOP3OpSelPat.ret),
    !if(P.HasModifiers,
      getVOP3ModPat.ret,
      !if(IsVOP2,
        getVOP3FromVOP2Pat.ret,
        !if(P.HasIntClamp,
          getVOP3ClampPat.ret,
          !if (P.IsMAI,
            getVOP3MAIPat.ret,
            getVOP3Pat.ret))))),
  0, P.HasOpSel> {

  let IntClamp = P.HasIntClamp;
  // Converter: "cvtVOP3OpSel" with op_sel; "cvtVOP3" when any of modifiers,
  // omod or integer clamp is present; empty otherwise.
  let AsmMatchConverter =
    !if(P.HasOpSel,
        "cvtVOP3OpSel",
        !if(!or(P.HasModifiers, P.HasOMod, P.HasIntClamp),
            "cvtVOP3",
            ""));
}

// Defines the _e64 pseudo and, under the isGFX11Plus subtarget predicate and
// only when the profile has HasExtVOP3DPP, an _e64_dpp pseudo.
multiclass VOP3Inst {
  def _e64 : VOP3InstBase;
  let SubtargetPredicate = isGFX11Plus in {
    if P.HasExtVOP3DPP then
      def _e64_dpp : VOP3_DPP_Pseudo ;
  } // end SubtargetPredicate = isGFX11Plus
}

// Returns UniformUnaryFrag when either !isa test on Op succeeds, and Op
// itself otherwise.
class UniformUnaryFragOrOp {
  SDPatternOperator ret = !if(!or(!isa(Op), !isa(Op)), UniformUnaryFrag, Op);
}

// Defines an _e64 pseudo with a single-source pattern whose src0 is matched
// through VOP3Mods0 with modifiers, clamp and omod.
multiclass VOP3PseudoScalarInst {
  def _e64 : VOP3_Pseudo.ret
      (P.Src0VT
        (VOP3Mods0 P.Src0VT:$src0, i32:$src0_modifiers, i1:$clamp, i32:$omod))))]>;
}

//===----------------------------------------------------------------------===//
// VOP3 DPP
//===----------------------------------------------------------------------===//

// VOP3 DPP16 record that copies scheduling, register use/def, side-effect and
// predicate information from the pseudo 'ps', and sets both the assembler and
// subtarget predicates to HasDPP16.
class Base_VOP3_DPP16 op, VOP_DPP_Pseudo ps, string opName = ps.OpName>
  : VOP3_DPP {
  let VOP3_OPSEL = ps.Pfl.HasOpSel;
  let IsDOT = ps.IsDOT;
  let hasSideEffects = ps.hasSideEffects;
  let Defs = ps.Defs;
  let SchedRW = ps.SchedRW;
  let Uses = ps.Uses;
  let AssemblerPredicate = HasDPP16;
  let SubtargetPredicate = HasDPP16;
  let OtherPredicates = ps.OtherPredicates;
}

// Base_VOP3_DPP16 combined with SIMCInstr.
class VOP3_DPP16 op, VOP_DPP_Pseudo ps, int subtarget,
                 string opName = ps.OpName>
  : Base_VOP3_DPP16, SIMCInstr;

// Generation-specific VOP3_DPP16: takes the assembler predicate from Gen,
// requires UseRealTrue16Insts only for real-true16 profiles, and appends
// "_FAKE16" to the "DPP"-prefixed decoder namespace for all other profiles.
class VOP3_DPP16_Gen op, VOP_DPP_Pseudo ps, GFXGen Gen,
                     string opName = ps.OpName> :
  VOP3_DPP16 {
  let AssemblerPredicate = Gen.AssemblerPredicate;
  let OtherPredicates = !if(ps.Pfl.IsRealTrue16, [UseRealTrue16Insts], []);
  let DecoderNamespace = "DPP"#Gen.DecoderNamespace#
                         !if(ps.Pfl.IsRealTrue16, "", "_FAKE16");
}

// The header of this class continues on the next source line.
class Base_VOP3_DPP8 op, VOP_Pseudo ps, string
// Remainder of a class header begun on the previous source line. The body
// copies op_sel, IsDOT, side-effect, Defs/Uses, scheduling and OtherPredicates
// information from the pseudo 'ps'.
opName = ps.OpName>
  : VOP3_DPP8 {
  let VOP3_OPSEL = ps.Pfl.HasOpSel;
  let IsDOT = ps.IsDOT;
  let hasSideEffects = ps.hasSideEffects;
  let Defs = ps.Defs;
  let SchedRW = ps.SchedRW;
  let Uses = ps.Uses;

  let OtherPredicates = ps.OtherPredicates;
}

// Base_VOP3_DPP16 plus a 7-bit sdst field encoded in bits 14-8.
class Base_VOP3b_DPP16 op, VOP_DPP_Pseudo ps,
                       string opName = ps.OpName>
  : Base_VOP3_DPP16 {
  bits<7> sdst;
  let Inst{14 - 8} = sdst;
}

// Base_VOP3_DPP8 plus a 7-bit sdst field encoded in bits 14-8.
class VOP3b_DPP8_Base op, VOP_Pseudo ps, string opName = ps.OpName>
  : Base_VOP3_DPP8 {
  bits<7> sdst;
  let Inst{14 - 8} = sdst;
}

//===----------------------------------------------------------------------===//
// VOP3 GFX11, GFX12
//===----------------------------------------------------------------------===//

// Defines one _e64<suffix> real instruction for the pseudo named
// opName#"_e64". The encoding mix-in is the OpSel form when the profile has
// op_sel and the plain VOP3e form otherwise; the two 'if's are mutually
// exclusive. IsSingle is set if requested here or by the profile.
multiclass VOP3_Real_Base op, string opName = NAME,
                          bit isSingle = 0> {
  defvar ps = !cast(opName#"_e64");
  let IsSingle = !or(isSingle, ps.Pfl.IsSingle) in {
    if ps.Pfl.HasOpSel then
      def _e64#Gen.Suffix :
        VOP3_Real_Gen,
        VOP3OpSel_gfx11_gfx12;
    if !not(ps.Pfl.HasOpSel) then
      def _e64#Gen.Suffix :
        VOP3_Real_Gen,
        VOP3e_gfx11_gfx12;
  }
}

// As VOP3_Real_Base, but always uses the VOP3DotOpSel encoding mix-in.
multiclass VOP3Dot_Real_Base op, string opName = NAME,
                             bit isSingle = 0> {
  defvar ps = !cast(opName#"_e64");
  let IsSingle = !or(isSingle, ps.Pfl.IsSingle) in {
    def _e64#Gen.Suffix :
      VOP3_Real_Gen,
      VOP3DotOpSel_gfx11_gfx12;
  }
}

// As VOP3_Real_Base, but with the asm string rebuilt from asmName plus the
// pseudo's operand string, an extra FP8 op_sel encoding arm selected by
// ps.Pfl.IsFP8, and a mnemonic alias record gated on the generation's
// assembler predicate.
multiclass VOP3_Real_with_name op, string opName,
                               string asmName, bit isSingle = 0> {
  defvar ps = !cast(opName#"_e64");
  let AsmString = asmName # ps.AsmOperands,
      IsSingle = !or(isSingle, ps.Pfl.IsSingle) in {
    if ps.Pfl.IsFP8 then {
      def _e64#Gen.Suffix :
        VOP3_Real_Gen,
        VOP3FP8OpSel_gfx11_gfx12;
    } else {
      if ps.Pfl.HasOpSel then
        def _e64#Gen.Suffix :
          VOP3_Real_Gen,
          VOP3OpSel_gfx11_gfx12;
      if !not(ps.Pfl.HasOpSel) then
        def _e64#Gen.Suffix :
          VOP3_Real_Gen,
          VOP3e_gfx11_gfx12;
    }
  }
  def Gen.Suffix#"_VOP3_alias" : MnemonicAlias, Requires<[Gen.AssemblerPredicate]>, LetDummies;
}

// for READLANE/WRITELANE
// Looks the pseudo up by opName itself, without appending "_e64".
multiclass VOP3_Real_No_Suffix op, string opName = NAME> {
  defvar ps = !cast(opName);
  def _e64#Gen.Suffix :
    VOP3_Real_Gen,
    VOP3e_gfx11_gfx12;
}

// The name of the next multiclass is on the following source line.
multiclass
// Name and body of a multiclass whose 'multiclass' keyword is on the previous
// source line. Defines the _e64_dpp<suffix> real instruction from the pseudo
// named opName#"_e64"#"_dpp".
VOP3_Real_dpp_Base op, string opName = NAME> {
  def _e64_dpp#Gen.Suffix :
    VOP3_DPP16_Gen(opName#"_e64"#"_dpp"), Gen>;
}

// As VOP3_Real_dpp_Base, but leaves encoding bits 11 and 12 unset ('?').
multiclass VOP3Dot_Real_dpp_Base op, string opName = NAME> {
  def _e64_dpp#Gen.Suffix :
    VOP3_DPP16_Gen(opName#"_e64"#"_dpp"), Gen> {
      let Inst{11} = ?;
      let Inst{12} = ?;
    }
}

// Wraps VOP3_Real_dpp_Base with the asm string overridden to asmName followed
// by the profile's VOP3 DPP16 operand string.
multiclass VOP3_Real_dpp_with_name op, string opName,
                                   string asmName> {
  defvar ps = !cast(opName#"_e64");
  let AsmString = asmName # ps.Pfl.AsmVOP3DPP16 in {
    defm NAME : VOP3_Real_dpp_Base;
  }
}

// Defines the _e64_dpp8<suffix> real instruction, with the decoder namespace
// prefixed by "DPP8" and the assembler predicate taken from Gen.
multiclass VOP3_Real_dpp8_Base op, string opName = NAME> {
  defvar ps = !cast(opName#"_e64");
  def _e64_dpp8#Gen.Suffix : Base_VOP3_DPP8 {
    let DecoderNamespace = "DPP8"#Gen.DecoderNamespace;
    let AssemblerPredicate = Gen.AssemblerPredicate;
  }
}

// As VOP3_Real_dpp8_Base, but leaves encoding bits 11 and 12 unset ('?').
multiclass VOP3Dot_Real_dpp8_Base op, string opName = NAME> {
  defvar ps = !cast(opName#"_e64");
  def _e64_dpp8#Gen.Suffix : Base_VOP3_DPP8 {
    let Inst{11} = ?;
    let Inst{12} = ?;
    let DecoderNamespace = "DPP8"#Gen.DecoderNamespace;
    let AssemblerPredicate = Gen.AssemblerPredicate;
  }
}

// Wraps VOP3_Real_dpp8_Base with three outer overrides: the asm string
// (asmName plus the profile's VOP3 DPP8 operand string), a decoder namespace
// that gains "_FAKE16" for profiles that are not real-true16, and
// OtherPredicates of [UseRealTrue16Insts] or [TruePredicate] on the same test.
multiclass VOP3_Real_dpp8_with_name op, string opName,
                                    string asmName> {
  defvar ps = !cast(opName#"_e64");
  let AsmString = asmName # ps.Pfl.AsmVOP3DPP8,
      DecoderNamespace = "DPP8"#Gen.DecoderNamespace#
                         !if(ps.Pfl.IsRealTrue16, "", "_FAKE16"),
      OtherPredicates = !if(ps.Pfl.IsRealTrue16, [UseRealTrue16Insts],
                            [TruePredicate]) in {

    defm NAME : VOP3_Real_dpp8_Base;
  }
}

// Defines the _e64<suffix> real instruction using the VOP3be encoding mix-in.
// IsSingle is set if requested here or by the profile.
multiclass VOP3be_Real op, string opName, string asmName,
                       bit isSingle = 0> {
  defvar ps = !cast(opName#"_e64");
  let IsSingle = !or(isSingle, ps.Pfl.IsSingle) in
    def _e64#Gen.Suffix :
      VOP3_Real_Gen,
      VOP3be_gfx11_gfx12 ;
}

// Defines the _e64_dpp<suffix> real instruction on Base_VOP3b_DPP16, with the
// decoder namespace prefixed by "DPP" and the assembler predicate from Gen.
multiclass VOP3be_Real_dpp op, string opName,
                           string asmName> {
  defvar ps = !cast(opName #"_e64");
  defvar dpp_ps = !cast(opName #"_e64" #"_dpp");
  def _e64_dpp#Gen.Suffix : Base_VOP3b_DPP16,
    SIMCInstr {
    let DecoderNamespace = "DPP"#Gen.DecoderNamespace;
    let AssemblerPredicate = Gen.AssemblerPredicate;
  }
}

// The body of this multiclass continues on the next source line.
multiclass VOP3be_Real_dpp8 op, string opName,
                            string asmName> {
  defvar ps = !cast(opName #"_e64");
// Tail of a multiclass body begun on the previous source line: defines the
// _e64_dpp8<suffix> real instruction on VOP3b_DPP8_Base, with the decoder
// namespace prefixed by "DPP8" and the assembler predicate from Gen.
  def _e64_dpp8#Gen.Suffix : VOP3b_DPP8_Base {
    let DecoderNamespace = "DPP8"#Gen.DecoderNamespace;
    let AssemblerPredicate = Gen.AssemblerPredicate;
  }
}

// VOP1 and VOP2 depend on these triple defs
// Each "triple" combines three multiclasses: the base real, its dpp form and
// its dpp8 form.
multiclass VOP3_Realtriple op, bit isSingle = 0,
                           string opName = NAME> :
  VOP3_Real_Base,
  VOP3_Real_dpp_Base,
  VOP3_Real_dpp8_Base;

// Triple built from the VOP3Dot_* variants.
multiclass VOP3Dot_Realtriple op, bit isSingle = 0,
                              string opName = NAME> :
  VOP3Dot_Real_Base,
  VOP3Dot_Real_dpp_Base,
  VOP3Dot_Real_dpp8_Base;

// Forwards to VOP3_Realtriple.
multiclass VOP3Only_Realtriple op> :
  VOP3_Realtriple;

// Triple built from the *_with_name variants, which take an explicit asmName.
multiclass VOP3_Realtriple_with_name op, string opName,
                                     string asmName, bit isSingle = 0> :
  VOP3_Real_with_name,
  VOP3_Real_dpp_with_name,
  VOP3_Real_dpp8_with_name;

// Forwards to VOP3_Realtriple_with_name.
multiclass VOP3Only_Realtriple_with_name op, string opName,
                                         string asmName> :
  VOP3_Realtriple_with_name;

// Forwards to VOP3Only_Realtriple_with_name; note the parameter order here is
// (op, asmName, opName) with opName defaulting to NAME.
multiclass VOP3Only_Realtriple_t16 op, string asmName,
                                   string opName = NAME>
    : VOP3Only_Realtriple_with_name;

// Triple built from the VOP3be_* variants. asmName defaults to the Mnemonic
// of the pseudo named opName#"_e64".
multiclass VOP3be_Realtriple<
    GFXGen Gen, bits<10> op, bit isSingle = 0, string opName = NAME,
    string asmName = !cast(opName#"_e64").Mnemonic> :
  VOP3be_Real,
  VOP3be_Real_dpp,
  VOP3be_Real_dpp8;

// Forwards to VOP3be_Realtriple.
multiclass VOP3beOnly_Realtriple op> :
  VOP3be_Realtriple;

//===----------------------------------------------------------------------===//
// VOP3 GFX11
//===----------------------------------------------------------------------===//

// Convenience wrappers that forward to the generic multiclasses above.
multiclass VOP3be_Real_gfx11 op, string opName, string asmName,
                             bit isSingle = 0> :
  VOP3be_Real;

multiclass VOP3_Real_Base_gfx11 op, string opName = NAME,
                                bit isSingle = 0> :
  VOP3_Real_Base;

multiclass VOP3_Realtriple_gfx11 op, bit isSingle = 0,
                                 string opName = NAME> :
  VOP3_Realtriple;

multiclass VOP3Only_Realtriple_t16_gfx11 op, string asmName,
                                         string opName = NAME>
    : VOP3Only_Realtriple_with_name;

//===----------------------------------------------------------------------===//
// VOP3 GFX12
//===----------------------------------------------------------------------===//

multiclass VOP3Only_Realtriple_gfx12 op, bit isSingle = 0> :
  VOP3_Realtriple;

// IsSingle is captured from the vopprofile for these instructions, but the
// following alternative is more explicit
multiclass VOP3Only_Real_Base_gfx12 op> :
  VOP3_Real_Base;

multiclass VOP3Only_Realtriple_t16_gfx12 op> :
  VOP3Only_Realtriple;

// Defines _e64_gfx12 with the VOP3be encoding mix-in, an asm string rebuilt
// from asmName plus the pseudo's operand string, and a mnemonic alias
// restricted by Requires<[isGFX12Only]>.
multiclass VOP3be_Real_with_name_gfx12 op, string opName,
                                       string asmName, bit isSingle = 0> {
  defvar ps = !cast(opName#"_e64");
  let AsmString = asmName # ps.AsmOperands,
      IsSingle = !or(isSingle, ps.Pfl.IsSingle) in
    def _e64_gfx12 :
      VOP3_Real_Gen,
      VOP3be_gfx11_gfx12,
      MnemonicAlias, Requires<[isGFX12Only]>;
}

multiclass VOP3_Realtriple_with_name_gfx12 op, string opName,
                                           string asmName, bit isSingle = 0> :
  VOP3_Realtriple_with_name;

// Lists VOP3Only_Realtriple_with_name twice as a parent.
// NOTE(review): the arguments that would distinguish the two parents are not
// visible in the text as given -- confirm.
multiclass VOP3Only_Realtriple_with_name_gfx11_gfx12 op, string opName,
                                                     string asmName> :
  VOP3Only_Realtriple_with_name,
  VOP3Only_Realtriple_with_name;

multiclass VOP3Only_Realtriple_with_name_t16_gfx12 op, string asmName,
                                                   string opName = NAME>
    : VOP3Only_Realtriple_with_name;

//===----------------------------------------------------------------------===//

// Per-format instruction definition files.
include "VOPCInstructions.td"
include "VOP1Instructions.td"
include "VOP2Instructions.td"
include "VOP3Instructions.td"
include "VOP3PInstructions.td"
include "VOPDInstructions.td"

// Selection pattern for is_fpclass: the source is matched through
// VOP3ModsNonCanonicalizing, and the immediate mask is passed to 'inst' via a
// V_MOV_B32_e32.
class ClassPat : GCNPat <
  (is_fpclass (vt (VOP3ModsNonCanonicalizing vt:$src0, i32:$src0_mods)), (i32 timm:$mask)),
  (inst i32:$src0_mods, vt:$src0, (V_MOV_B32_e32 timm:$mask))
>;

// Instantiations of ClassPat; the first two are gated on 16-bit instruction
// predicates.
// NOTE(review): the template arguments of each instantiation are not visible
// in the text as given -- confirm.
def : ClassPat {
  let OtherPredicates = [NotHasTrue16BitInsts, Has16BitInsts];
}

def : ClassPat {
  let OtherPredicates = [HasTrue16BitInsts];
}

def : ClassPat;
def : ClassPat;

// Generic table over records of class Format#"_Real", keyed by Opcode, with
// an IsSingle field and a lookup function named "get"#Format#"OpcodeHelper".
class VOPInfoTable : GenericTable {
  let FilterClass = Format # "_Real";
  let CppTypeName = "VOPInfo";
  let Fields = ["Opcode", "IsSingle"];

  let PrimaryKey = ["Opcode"];
  let PrimaryKeyName = "get" # Format # "OpcodeHelper";
}

def VOP1InfoTable : VOPInfoTable<"VOP1">;
def VOP2InfoTable : VOPInfoTable<"VOP2">;
def VOP3InfoTable : VOPInfoTable<"VOP3">;

// Generic table over records of class "VOPC64_"#Format#"_Base". The rest of
// the body continues on the next source line.
class VOPC64Table : GenericTable {
  let FilterClass = "VOPC64_" # Format # "_Base";
  let
// Remainder of a table class body begun on the previous source line (the
// 'let' keyword for this first assignment is on that line). The table has a
// single Opcode field, which is also its primary key, and its lookup function
// is named "isVOPC64"#Format#"OpcodeHelper".
CppTypeName = "VOPC64DPPInfo";
  let Fields = ["Opcode"];

  let PrimaryKey = ["Opcode"];
  let PrimaryKeyName = "isVOPC64" # Format # "OpcodeHelper";
}

// Instantiations for the "DPP" and "DPP8" formats.
def VOPC64DPPTable : VOPC64Table<"DPP">;
def VOPC64DPP8Table : VOPC64Table<"DPP8">;

// Generic table over all VOP_Pseudo records, keyed by Opcode and carrying the
// IsTrue16 field; the lookup function is named "getTrue16OpcodeHelper".
def VOPTrue16Table : GenericTable {
  let FilterClass = "VOP_Pseudo";
  let CppTypeName = "VOPTrue16Info";
  let Fields = ["Opcode", "IsTrue16"];

  let PrimaryKey = ["Opcode"];
  let PrimaryKeyName = "getTrue16OpcodeHelper";
}