xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/SIInstrFormats.td (revision e2eeea75eb8b6dd50c1298067a0655880d186734)
1//===-- SIInstrFormats.td - SI Instruction Encodings ----------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// SI Instruction format definitions.
10//
11//===----------------------------------------------------------------------===//
12
13class InstSI <dag outs, dag ins, string asm = "",
14              list<dag> pattern = []> :
15  AMDGPUInst<outs, ins, asm, pattern>, GCNPredicateControl {
16  // Low bits - basic encoding information.
17  field bit SALU = 0;
18  field bit VALU = 0;
19
20  // SALU instruction formats.
21  field bit SOP1 = 0;
22  field bit SOP2 = 0;
23  field bit SOPC = 0;
24  field bit SOPK = 0;
25  field bit SOPP = 0;
26
27  // VALU instruction formats.
28  field bit VOP1 = 0;
29  field bit VOP2 = 0;
30  field bit VOPC = 0;
31  field bit VOP3 = 0;
32  field bit VOP3P = 0;
33  field bit VINTRP = 0;
34  field bit SDWA = 0;
35  field bit DPP = 0;
36
37  // Memory instruction formats.
38  field bit MUBUF = 0;
39  field bit MTBUF = 0;
40  field bit SMRD = 0;
41  field bit MIMG = 0;
42  field bit EXP = 0;
43  field bit FLAT = 0;
44  field bit DS = 0;
45
46  // Pseudo instruction formats.
47  field bit VGPRSpill = 0;
48  field bit SGPRSpill = 0;
49
50  // High bits - other information.
51  field bit VM_CNT = 0;
52  field bit EXP_CNT = 0;
53  field bit LGKM_CNT = 0;
54
55  // Whether WQM _must_ be enabled for this instruction.
56  field bit WQM = 0;
57
58  // Whether WQM _must_ be disabled for this instruction.
59  field bit DisableWQM = 0;
60
61  field bit Gather4 = 0;
62
63  // Most sopk treat the immediate as a signed 16-bit, however some
64  // use it as unsigned.
65  field bit SOPKZext = 0;
66
67  // This is an s_store_dword* instruction that requires a cache flush
68  // on wave termination. It is necessary to distinguish from mayStore
69  // SMEM instructions like the cache flush ones.
70  field bit ScalarStore = 0;
71
72  // Whether the operands can be ignored when computing the
73  // instruction size.
74  field bit FixedSize = 0;
75
76  // This bit tells the assembler to use the 32-bit encoding in case it
77  // is unable to infer the encoding from the operands.
78  field bit VOPAsmPrefer32Bit = 0;
79
80  // This bit indicates that this is a VOP3 opcode which supports op_sel
81  // modifier (gfx9 only).
82  field bit VOP3_OPSEL = 0;
83
84  // Is it possible for this instruction to be atomic?
85  field bit maybeAtomic = 0;
86
87  // This bit indicates that this is a VI instruction which is renamed
88  // in GFX9. Required for correct mapping from pseudo to MC.
89  field bit renamedInGFX9 = 0;
90
91  // This bit indicates that this has a floating point result type, so
92  // the clamp modifier has floating point semantics.
93  field bit FPClamp = 0;
94
95  // This bit indicates that instruction may support integer clamping
96  // which depends on GPU features.
97  field bit IntClamp = 0;
98
99  // This field indicates that the clamp applies to the low component
100  // of a packed output register.
101  field bit ClampLo = 0;
102
103  // This field indicates that the clamp applies to the high component
104  // of a packed output register.
105  field bit ClampHi = 0;
106
107  // This bit indicates that this is a packed VOP3P instruction
108  field bit IsPacked = 0;
109
110  // This bit indicates that this is a D16 buffer instruction.
111  field bit D16Buf = 0;
112
113  // This field indicates that FLAT instruction accesses FLAT_GLBL or
114  // FLAT_SCRATCH segment. Must be 0 for non-FLAT instructions.
115  field bit IsNonFlatSeg = 0;
116
117  // Reads the mode register, usually for FP environment.
118  field bit ReadsModeReg = 0;
119
120  // This bit indicates that this uses the floating point double precision
121  // rounding mode flags
122  field bit FPDPRounding = 0;
123
124  // Instruction is FP atomic.
125  field bit FPAtomic = 0;
126
127  // This bit indicates that this is one of MFMA instructions.
128  field bit IsMAI = 0;
129
130  // This bit indicates that this is one of DOT instructions.
131  field bit IsDOT = 0;
132
133  // These need to be kept in sync with the enum in SIInstrFlags.
134  let TSFlags{0} = SALU;
135  let TSFlags{1} = VALU;
136
137  let TSFlags{2} = SOP1;
138  let TSFlags{3} = SOP2;
139  let TSFlags{4} = SOPC;
140  let TSFlags{5} = SOPK;
141  let TSFlags{6} = SOPP;
142
143  let TSFlags{7} = VOP1;
144  let TSFlags{8} = VOP2;
145  let TSFlags{9} = VOPC;
146  let TSFlags{10} = VOP3;
147  let TSFlags{12} = VOP3P;
148
149  let TSFlags{13} = VINTRP;
150  let TSFlags{14} = SDWA;
151  let TSFlags{15} = DPP;
152
153  let TSFlags{16} = MUBUF;
154  let TSFlags{17} = MTBUF;
155  let TSFlags{18} = SMRD;
156  let TSFlags{19} = MIMG;
157  let TSFlags{20} = EXP;
158  let TSFlags{21} = FLAT;
159  let TSFlags{22} = DS;
160
161  let TSFlags{23} = VGPRSpill;
162  let TSFlags{24} = SGPRSpill;
163
164  let TSFlags{32} = VM_CNT;
165  let TSFlags{33} = EXP_CNT;
166  let TSFlags{34} = LGKM_CNT;
167
168  let TSFlags{35} = WQM;
169  let TSFlags{36} = DisableWQM;
170  let TSFlags{37} = Gather4;
171
172  let TSFlags{38} = SOPKZext;
173  let TSFlags{39} = ScalarStore;
174  let TSFlags{40} = FixedSize;
175  let TSFlags{41} = VOPAsmPrefer32Bit;
176  let TSFlags{42} = VOP3_OPSEL;
177
178  let TSFlags{43} = maybeAtomic;
179  let TSFlags{44} = renamedInGFX9;
180
181  let TSFlags{45} = FPClamp;
182  let TSFlags{46} = IntClamp;
183  let TSFlags{47} = ClampLo;
184  let TSFlags{48} = ClampHi;
185
186  let TSFlags{49} = IsPacked;
187
188  let TSFlags{50} = D16Buf;
189
190  let TSFlags{51} = IsNonFlatSeg;
191
192  let TSFlags{52} = FPDPRounding;
193
194  let TSFlags{53} = FPAtomic;
195
196  let TSFlags{54} = IsMAI;
197
198  let TSFlags{55} = IsDOT;
199
200  let SchedRW = [Write32Bit];
201
202  field bits<1> DisableSIDecoder = 0;
203  field bits<1> DisableVIDecoder = 0;
204  field bits<1> DisableDecoder = 0;
205
206  let isAsmParserOnly = !if(!eq(DisableDecoder{0}, {0}), 0, 1);
207  let AsmVariantName = AMDGPUAsmVariants.Default;
208
209  // Avoid changing source registers in a way that violates constant bus read limitations.
210  let hasExtraSrcRegAllocReq = !if(VOP1,1,!if(VOP2,1,!if(VOP3,1,!if(VOPC,1,!if(SDWA,1, !if(VALU,1,0))))));
211}
212
213class PseudoInstSI<dag outs, dag ins, list<dag> pattern = [], string asm = "">
214  : InstSI<outs, ins, asm, pattern> {
215  let isPseudo = 1;
216  let isCodeGenOnly = 1;
217}
218
219class SPseudoInstSI<dag outs, dag ins, list<dag> pattern = [], string asm = "">
220  : PseudoInstSI<outs, ins, pattern, asm> {
221  let SALU = 1;
222}
223
224class VPseudoInstSI<dag outs, dag ins, list<dag> pattern = [], string asm = "">
225  : PseudoInstSI<outs, ins, pattern, asm> {
226  let VALU = 1;
227  let Uses = [EXEC];
228}
229
230class CFPseudoInstSI<dag outs, dag ins, list<dag> pattern = [],
231  bit UseExec = 0, bit DefExec = 0> :
232  SPseudoInstSI<outs, ins, pattern> {
233
234  let Uses = !if(UseExec, [EXEC], []);
235  let Defs = !if(DefExec, [EXEC, SCC], [SCC]);
236  let mayLoad = 0;
237  let mayStore = 0;
238  let hasSideEffects = 0;
239}
240
241class Enc32 {
242  field bits<32> Inst;
243  int Size = 4;
244}
245
246class Enc64 {
247  field bits<64> Inst;
248  int Size = 8;
249}
250
251class VOPDstOperand <RegisterClass rc> : RegisterOperand <rc, "printVOPDst">;
252
253class VINTRPe <bits<2> op> : Enc32 {
254  bits<8> vdst;
255  bits<8> vsrc;
256  bits<2> attrchan;
257  bits<6> attr;
258
259  let Inst{7-0} = vsrc;
260  let Inst{9-8} = attrchan;
261  let Inst{15-10} = attr;
262  let Inst{17-16} = op;
263  let Inst{25-18} = vdst;
264  let Inst{31-26} = 0x32; // encoding
265}
266
267class MIMGe : Enc64 {
268  bits<8> vdata;
269  bits<4> dmask;
270  bits<1> unorm;
271  bits<1> glc;
272  bits<1> r128;
273  bits<1> tfe;
274  bits<1> lwe;
275  bits<1> slc;
276  bit d16;
277  bits<7> srsrc;
278  bits<7> ssamp;
279
280  let Inst{11-8} = dmask;
281  let Inst{12} = unorm;
282  let Inst{13} = glc;
283  let Inst{15} = r128;
284  let Inst{16} = tfe;
285  let Inst{17} = lwe;
286  let Inst{25} = slc;
287  let Inst{31-26} = 0x3c;
288  let Inst{47-40} = vdata;
289  let Inst{52-48} = srsrc{6-2};
290  let Inst{57-53} = ssamp{6-2};
291  let Inst{63} = d16;
292}
293
294class MIMGe_gfx6789 <bits<8> op> : MIMGe {
295  bits<8> vaddr;
296  bits<1> da;
297
298  let Inst{0} = op{7};
299  let Inst{14} = da;
300  let Inst{24-18} = op{6-0};
301  let Inst{39-32} = vaddr;
302}
303
304class MIMGe_gfx10 <bits<8> op> : MIMGe {
305  bits<8> vaddr0;
306  bits<3> dim;
307  bits<2> nsa;
308  bits<1> dlc;
309  bits<1> a16;
310
311  let Inst{0} = op{7};
312  let Inst{2-1} = nsa;
313  let Inst{5-3} = dim;
314  let Inst{7} = dlc;
315  let Inst{24-18} = op{6-0};
316  let Inst{39-32} = vaddr0;
317  let Inst{62} = a16;
318}
319
320class EXPe : Enc64 {
321  bits<4> en;
322  bits<6> tgt;
323  bits<1> compr;
324  bits<1> done;
325  bits<1> vm;
326  bits<8> src0;
327  bits<8> src1;
328  bits<8> src2;
329  bits<8> src3;
330
331  let Inst{3-0} = en;
332  let Inst{9-4} = tgt;
333  let Inst{10} = compr;
334  let Inst{11} = done;
335  let Inst{12} = vm;
336  let Inst{31-26} = 0x3e;
337  let Inst{39-32} = src0;
338  let Inst{47-40} = src1;
339  let Inst{55-48} = src2;
340  let Inst{63-56} = src3;
341}
342
343let Uses = [EXEC] in {
344
345class VINTRPCommon <dag outs, dag ins, string asm, list<dag> pattern> :
346    InstSI <outs, ins, asm, pattern> {
347  let VINTRP = 1;
348  // VINTRP instructions read parameter values from LDS, but these parameter
349  // values are stored outside of the LDS memory that is allocated to the
350  // shader for general purpose use.
351  //
352  // While it may be possible for ds_read/ds_write instructions to access
353  // the parameter values in LDS, this would essentially be an out-of-bounds
354  // memory access which we consider to be undefined behavior.
355  //
356  // So even though these instructions read memory, this memory is outside the
357  // addressable memory space for the shader, and we consider these instructions
358  // to be readnone.
359  let mayLoad = 0;
360  let mayStore = 0;
361  let hasSideEffects = 0;
362  let VALU = 1;
363}
364
365class EXPCommon<dag outs, dag ins, string asm, list<dag> pattern> :
366  InstSI<outs, ins, asm, pattern> {
367  let EXP = 1;
368  let EXP_CNT = 1;
369  let mayLoad = 0; // Set to 1 if done bit is set.
370  let mayStore = 1;
371  let UseNamedOperandTable = 1;
372  let Uses = [EXEC];
373  let SchedRW = [WriteExport];
374}
375
376} // End Uses = [EXEC]
377