xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/SMInstructions.td (revision e9e8876a4d6afc1ad5315faaa191b25121a813d7)
1//===---- SMInstructions.td - Scalar Memory Instruction Definitions -------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9def smrd_offset_8 : NamedOperandU32<"SMRDOffset8",
10                                  NamedMatchClass<"SMRDOffset8">> {
11  let OperandType = "OPERAND_IMMEDIATE";
12}
13
14def smem_offset : NamedOperandU32<"SMEMOffset",
15                                  NamedMatchClass<"SMEMOffset">> {
16  let OperandType = "OPERAND_IMMEDIATE";
17  let EncoderMethod = "getSMEMOffsetEncoding";
18  let DecoderMethod = "decodeSMEMOffset";
19}
20
21//===----------------------------------------------------------------------===//
22// Scalar Memory classes
23//===----------------------------------------------------------------------===//
24
25class SM_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]> :
26  InstSI <outs, ins, "", pattern>,
27  SIMCInstr<opName, SIEncodingFamily.NONE> {
28  let isPseudo = 1;
29  let isCodeGenOnly = 1;
30
31  let LGKM_CNT = 1;
32  let SMRD = 1;
33  let mayStore = 0;
34  let mayLoad = 1;
35  let hasSideEffects = 0;
36  let UseNamedOperandTable = 1;
37  let SchedRW = [WriteSMEM];
38
39  string Mnemonic = opName;
40  string AsmOperands = asmOps;
41
42  bits<1> has_sbase = 1;
43  bits<1> has_sdst = 1;
44  bit has_glc = 0;
45  bit has_dlc = 0;
46  bits<1> has_offset = 1;
47  bits<1> offset_is_imm = 0;
48  bit is_buffer = 0;
49}
50
51class SM_Real <SM_Pseudo ps>
52  : InstSI<ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []> {
53
54  let isPseudo = 0;
55  let isCodeGenOnly = 0;
56
57  Instruction Opcode = !cast<Instruction>(NAME);
58
59  // copy relevant pseudo op flags
60  let LGKM_CNT             = ps.LGKM_CNT;
61  let SMRD                 = ps.SMRD;
62  let mayStore             = ps.mayStore;
63  let mayLoad              = ps.mayLoad;
64  let hasSideEffects       = ps.hasSideEffects;
65  let UseNamedOperandTable = ps.UseNamedOperandTable;
66  let SchedRW              = ps.SchedRW;
67  let SubtargetPredicate   = ps.SubtargetPredicate;
68  let AsmMatchConverter    = ps.AsmMatchConverter;
69  let IsAtomicRet          = ps.IsAtomicRet;
70  let IsAtomicNoRet        = ps.IsAtomicNoRet;
71
72  let TSFlags = ps.TSFlags;
73
74  bit is_buffer = ps.is_buffer;
75
76  // encoding
77  bits<7>  sbase;
78  bits<7>  sdst;
79  bits<32> offset;
80  bits<1> imm = !if(ps.has_offset, ps.offset_is_imm, 0);
81  bits<5> cpol;
82}
83
84class SM_Probe_Pseudo <string opName, dag ins, bit isImm>
85  : SM_Pseudo<opName, (outs), ins, " $sdata, $sbase, $offset"> {
86  let mayLoad = 0;
87  let mayStore = 0;
88  let has_glc = 0;
89  let LGKM_CNT = 0;
90  let ScalarStore = 0;
91  let hasSideEffects = 1;
92  let offset_is_imm = isImm;
93  let PseudoInstr = opName # !if(isImm, "_IMM", "_SGPR");
94}
95
96class SM_Load_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]>
97  : SM_Pseudo<opName, outs, ins, asmOps, pattern> {
98  RegisterClass BaseClass;
99  let mayLoad = 1;
100  let mayStore = 0;
101  let has_glc = 1;
102  let has_dlc = 1;
103}
104
105class SM_Store_Pseudo <string opName, dag ins, string asmOps, list<dag> pattern = []>
106  : SM_Pseudo<opName, (outs), ins, asmOps, pattern> {
107  RegisterClass BaseClass;
108  RegisterClass SrcClass;
109  let mayLoad = 0;
110  let mayStore = 1;
111  let has_glc = 1;
112  let has_dlc = 1;
113  let ScalarStore = 1;
114}
115
116class SM_Discard_Pseudo <string opName, dag ins, bit isImm>
117  : SM_Pseudo<opName, (outs), ins, " $sbase, $offset"> {
118  let mayLoad = 0;
119  let mayStore = 0;
120  let has_glc = 0;
121  let has_sdst = 0;
122  let ScalarStore = 0;
123  let hasSideEffects = 1;
124  let offset_is_imm = isImm;
125  let PseudoInstr = opName # !if(isImm, "_IMM", "_SGPR");
126}
127
128multiclass SM_Pseudo_Loads<string opName,
129                           RegisterClass baseClass,
130                           RegisterClass dstClass> {
131  def _IMM  : SM_Load_Pseudo <opName,
132                              (outs dstClass:$sdst),
133                              (ins baseClass:$sbase, i32imm:$offset, CPol:$cpol),
134                              " $sdst, $sbase, $offset$cpol", []> {
135    let offset_is_imm = 1;
136    let BaseClass = baseClass;
137    let PseudoInstr = opName # "_IMM";
138    let has_glc = 1;
139    let has_dlc = 1;
140  }
141
142  def _SGPR  : SM_Load_Pseudo <opName,
143                              (outs dstClass:$sdst),
144                              (ins baseClass:$sbase, SReg_32:$soff, CPol:$cpol),
145                              " $sdst, $sbase, $offset$cpol", []> {
146    let BaseClass = baseClass;
147    let PseudoInstr = opName # "_SGPR";
148    let has_glc = 1;
149    let has_dlc = 1;
150  }
151}
152
153multiclass SM_Pseudo_Stores<string opName,
154                           RegisterClass baseClass,
155                           RegisterClass srcClass> {
156  def _IMM  : SM_Store_Pseudo <opName,
157    (ins srcClass:$sdata, baseClass:$sbase, i32imm:$offset, CPol:$cpol),
158    " $sdata, $sbase, $offset$cpol", []> {
159    let offset_is_imm = 1;
160    let BaseClass = baseClass;
161    let SrcClass = srcClass;
162    let PseudoInstr = opName # "_IMM";
163  }
164
165  def _SGPR  : SM_Store_Pseudo <opName,
166    (ins srcClass:$sdata, baseClass:$sbase, SReg_32:$soff, CPol:$cpol),
167    " $sdata, $sbase, $offset$cpol", []> {
168    let BaseClass = baseClass;
169    let SrcClass = srcClass;
170    let PseudoInstr = opName # "_SGPR";
171  }
172}
173
174multiclass SM_Pseudo_Discards<string opName> {
175  def _IMM  : SM_Discard_Pseudo <opName, (ins SReg_64:$sbase, smem_offset:$offset), 1>;
176  def _SGPR : SM_Discard_Pseudo <opName, (ins SReg_64:$sbase, SReg_32:$offset), 0>;
177}
178
179class SM_Time_Pseudo<string opName, SDPatternOperator node = null_frag> : SM_Pseudo<
180  opName, (outs SReg_64_XEXEC:$sdst), (ins),
181  " $sdst", [(set i64:$sdst, (node))]> {
182  let hasSideEffects = 1;
183
184  // FIXME: This should be definitively mayStore = 0. TableGen
185  // brokenly tries to infer these based on the intrinsic properties
186  // corresponding to the IR attributes. The target intrinsics are
187  // considered as writing to memory for IR dependency purposes, but
188  // those can be modeled with hasSideEffects here. These also end up
189  // inferring differently for llvm.readcyclecounter and the amdgcn
190  // intrinsics.
191  let mayStore = ?;
192  let mayLoad = 1;
193  let has_sbase = 0;
194  let has_offset = 0;
195}
196
197class SM_Inval_Pseudo <string opName, SDPatternOperator node = null_frag> : SM_Pseudo<
198  opName, (outs), (ins), "", [(node)]> {
199  let hasSideEffects = 1;
200  let mayStore = 0;
201  let has_sdst = 0;
202  let has_sbase = 0;
203  let has_offset = 0;
204}
205
206multiclass SM_Pseudo_Probe<string opName, RegisterClass baseClass> {
207  def _IMM  : SM_Probe_Pseudo <opName, (ins i8imm:$sdata, baseClass:$sbase, smem_offset:$offset), 1>;
208  def _SGPR : SM_Probe_Pseudo <opName, (ins i8imm:$sdata, baseClass:$sbase, SReg_32:$offset), 0>;
209}
210
211class SM_WaveId_Pseudo<string opName, SDPatternOperator node> : SM_Pseudo<
212  opName, (outs SReg_32_XM0_XEXEC:$sdst), (ins),
213  " $sdst", [(set i32:$sdst, (node))]> {
214  let hasSideEffects = 1;
215  let mayStore = 0;
216  let mayLoad = 1;
217  let has_sbase = 0;
218  let has_offset = 0;
219}
220
221//===----------------------------------------------------------------------===//
222// Scalar Atomic Memory Classes
223//===----------------------------------------------------------------------===//
224
225class SM_Atomic_Pseudo <string opName,
226                        dag outs, dag ins, string asmOps, bit isRet>
227  : SM_Pseudo<opName, outs, ins, asmOps, []> {
228
229  bit glc = isRet;
230
231  let mayLoad = 1;
232  let mayStore = 1;
233  let has_glc = 1;
234  let has_dlc = 1;
235
236  // Should these be set?
237  let ScalarStore = 1;
238  let hasSideEffects = 1;
239  let maybeAtomic = 1;
240
241  let IsAtomicNoRet = !not(isRet);
242  let IsAtomicRet = isRet;
243
244  let AsmMatchConverter = "cvtSMEMAtomic";
245}
246
247class SM_Pseudo_Atomic<string opName,
248                       RegisterClass baseClass,
249                       RegisterClass dataClass,
250                       bit isImm,
251                       bit isRet,
252                       string opNameWithSuffix = opName # !if(isImm,
253                                 !if(isRet, "_IMM_RTN", "_IMM"),
254                                 !if(isRet, "_SGPR_RTN", "_SGPR")),
255                       Operand CPolTy = !if(isRet, CPol_GLC1, CPol)> :
256  SM_Atomic_Pseudo<opName,
257                   !if(isRet, (outs dataClass:$sdst), (outs)),
258                   !if(isImm,
259                       (ins dataClass:$sdata, baseClass:$sbase, smem_offset:$offset, CPolTy:$cpol),
260                       (ins dataClass:$sdata, baseClass:$sbase, SReg_32:$offset, CPolTy:$cpol)),
261                   !if(isRet, " $sdst", " $sdata") # ", $sbase, $offset$cpol",
262                   isRet>,
263  AtomicNoRet <opNameWithSuffix, isRet> {
264  let offset_is_imm = isImm;
265  let PseudoInstr = opNameWithSuffix;
266
267  let Constraints = !if(isRet, "$sdst = $sdata", "");
268  let DisableEncoding = !if(isRet, "$sdata", "");
269}
270
271multiclass SM_Pseudo_Atomics<string opName,
272                             RegisterClass baseClass,
273                             RegisterClass dataClass> {
274  def _IMM      : SM_Pseudo_Atomic <opName, baseClass, dataClass, 1, 0>;
275  def _SGPR     : SM_Pseudo_Atomic <opName, baseClass, dataClass, 0, 0>;
276  def _IMM_RTN  : SM_Pseudo_Atomic <opName, baseClass, dataClass, 1, 1>;
277  def _SGPR_RTN : SM_Pseudo_Atomic <opName, baseClass, dataClass, 0, 1>;
278}
279
280//===----------------------------------------------------------------------===//
281// Scalar Memory Instructions
282//===----------------------------------------------------------------------===//
283
284// We are using the SReg_32_XM0 and not the SReg_32 register class for 32-bit
285// SMRD instructions, because the SReg_32_XM0 register class does not include M0
286// and writing to M0 from an SMRD instruction will hang the GPU.
287
288// XXX - SMEM instructions do not allow exec for data operand, but
289// does sdst for SMRD on SI/CI?
290defm S_LOAD_DWORD    : SM_Pseudo_Loads <"s_load_dword", SReg_64, SReg_32_XM0_XEXEC>;
291defm S_LOAD_DWORDX2  : SM_Pseudo_Loads <"s_load_dwordx2", SReg_64, SReg_64_XEXEC>;
292defm S_LOAD_DWORDX4  : SM_Pseudo_Loads <"s_load_dwordx4", SReg_64, SReg_128>;
293defm S_LOAD_DWORDX8  : SM_Pseudo_Loads <"s_load_dwordx8", SReg_64, SReg_256>;
294defm S_LOAD_DWORDX16 : SM_Pseudo_Loads <"s_load_dwordx16", SReg_64, SReg_512>;
295
296let is_buffer = 1 in {
297defm S_BUFFER_LOAD_DWORD : SM_Pseudo_Loads <
298  "s_buffer_load_dword", SReg_128, SReg_32_XM0_XEXEC
299>;
300
301// FIXME: exec_lo/exec_hi appear to be allowed for SMRD loads on
302// SI/CI, bit disallowed for SMEM on VI.
303defm S_BUFFER_LOAD_DWORDX2 : SM_Pseudo_Loads <
304  "s_buffer_load_dwordx2", SReg_128, SReg_64_XEXEC
305>;
306
307defm S_BUFFER_LOAD_DWORDX4 : SM_Pseudo_Loads <
308  "s_buffer_load_dwordx4", SReg_128, SReg_128
309>;
310
311defm S_BUFFER_LOAD_DWORDX8 : SM_Pseudo_Loads <
312  "s_buffer_load_dwordx8", SReg_128, SReg_256
313>;
314
315defm S_BUFFER_LOAD_DWORDX16 : SM_Pseudo_Loads <
316  "s_buffer_load_dwordx16", SReg_128, SReg_512
317>;
318}
319
320let SubtargetPredicate = HasScalarStores in {
321defm S_STORE_DWORD : SM_Pseudo_Stores <"s_store_dword", SReg_64, SReg_32_XM0_XEXEC>;
322defm S_STORE_DWORDX2 : SM_Pseudo_Stores <"s_store_dwordx2", SReg_64, SReg_64_XEXEC>;
323defm S_STORE_DWORDX4 : SM_Pseudo_Stores <"s_store_dwordx4", SReg_64, SReg_128>;
324
325let is_buffer = 1 in {
326defm S_BUFFER_STORE_DWORD : SM_Pseudo_Stores <
327  "s_buffer_store_dword", SReg_128, SReg_32_XM0_XEXEC
328>;
329
330defm S_BUFFER_STORE_DWORDX2 : SM_Pseudo_Stores <
331  "s_buffer_store_dwordx2", SReg_128, SReg_64_XEXEC
332>;
333
334defm S_BUFFER_STORE_DWORDX4 : SM_Pseudo_Stores <
335  "s_buffer_store_dwordx4", SReg_128, SReg_128
336>;
337}
338} // End SubtargetPredicate = HasScalarStores
339
340let SubtargetPredicate = HasSMemTimeInst in
341def S_MEMTIME : SM_Time_Pseudo <"s_memtime", int_amdgcn_s_memtime>;
342def S_DCACHE_INV : SM_Inval_Pseudo <"s_dcache_inv", int_amdgcn_s_dcache_inv>;
343
344let SubtargetPredicate = isGFX7GFX8GFX9 in {
345def S_DCACHE_INV_VOL : SM_Inval_Pseudo <"s_dcache_inv_vol", int_amdgcn_s_dcache_inv_vol>;
346} // let SubtargetPredicate = isGFX7GFX8GFX9
347
348let SubtargetPredicate = isGFX8Plus in {
349let OtherPredicates = [HasScalarStores] in {
350def S_DCACHE_WB     : SM_Inval_Pseudo <"s_dcache_wb", int_amdgcn_s_dcache_wb>;
351def S_DCACHE_WB_VOL : SM_Inval_Pseudo <"s_dcache_wb_vol", int_amdgcn_s_dcache_wb_vol>;
352} // End OtherPredicates = [HasScalarStores]
353
354defm S_ATC_PROBE        : SM_Pseudo_Probe <"s_atc_probe", SReg_64>;
355let is_buffer = 1 in {
356defm S_ATC_PROBE_BUFFER : SM_Pseudo_Probe <"s_atc_probe_buffer", SReg_128>;
357}
358} // SubtargetPredicate = isGFX8Plus
359
360let SubtargetPredicate = HasSMemRealTime in
361def S_MEMREALTIME   : SM_Time_Pseudo <"s_memrealtime", int_amdgcn_s_memrealtime>;
362
363let SubtargetPredicate = isGFX10Plus in
364def S_GL1_INV : SM_Inval_Pseudo<"s_gl1_inv">;
365let SubtargetPredicate = HasGetWaveIdInst in
366def S_GET_WAVEID_IN_WORKGROUP : SM_WaveId_Pseudo <"s_get_waveid_in_workgroup", int_amdgcn_s_get_waveid_in_workgroup>;
367
368
369let SubtargetPredicate = HasScalarFlatScratchInsts, Uses = [FLAT_SCR] in {
370defm S_SCRATCH_LOAD_DWORD    : SM_Pseudo_Loads <"s_scratch_load_dword",   SReg_64, SReg_32_XM0_XEXEC>;
371defm S_SCRATCH_LOAD_DWORDX2  : SM_Pseudo_Loads <"s_scratch_load_dwordx2", SReg_64, SReg_64_XEXEC>;
372defm S_SCRATCH_LOAD_DWORDX4  : SM_Pseudo_Loads <"s_scratch_load_dwordx4", SReg_64, SReg_128>;
373
374defm S_SCRATCH_STORE_DWORD   : SM_Pseudo_Stores <"s_scratch_store_dword",   SReg_64, SReg_32_XM0_XEXEC>;
375defm S_SCRATCH_STORE_DWORDX2 : SM_Pseudo_Stores <"s_scratch_store_dwordx2", SReg_64, SReg_64_XEXEC>;
376defm S_SCRATCH_STORE_DWORDX4 : SM_Pseudo_Stores <"s_scratch_store_dwordx4", SReg_64, SReg_128>;
377} // SubtargetPredicate = HasScalarFlatScratchInsts
378
379let SubtargetPredicate = HasScalarAtomics in {
380
381let is_buffer = 1 in {
382defm S_BUFFER_ATOMIC_SWAP         : SM_Pseudo_Atomics <"s_buffer_atomic_swap", SReg_128, SReg_32_XM0_XEXEC>;
383defm S_BUFFER_ATOMIC_CMPSWAP      : SM_Pseudo_Atomics <"s_buffer_atomic_cmpswap", SReg_128, SReg_64_XEXEC>;
384defm S_BUFFER_ATOMIC_ADD          : SM_Pseudo_Atomics <"s_buffer_atomic_add", SReg_128, SReg_32_XM0_XEXEC>;
385defm S_BUFFER_ATOMIC_SUB          : SM_Pseudo_Atomics <"s_buffer_atomic_sub", SReg_128, SReg_32_XM0_XEXEC>;
386defm S_BUFFER_ATOMIC_SMIN         : SM_Pseudo_Atomics <"s_buffer_atomic_smin", SReg_128, SReg_32_XM0_XEXEC>;
387defm S_BUFFER_ATOMIC_UMIN         : SM_Pseudo_Atomics <"s_buffer_atomic_umin", SReg_128, SReg_32_XM0_XEXEC>;
388defm S_BUFFER_ATOMIC_SMAX         : SM_Pseudo_Atomics <"s_buffer_atomic_smax", SReg_128, SReg_32_XM0_XEXEC>;
389defm S_BUFFER_ATOMIC_UMAX         : SM_Pseudo_Atomics <"s_buffer_atomic_umax", SReg_128, SReg_32_XM0_XEXEC>;
390defm S_BUFFER_ATOMIC_AND          : SM_Pseudo_Atomics <"s_buffer_atomic_and", SReg_128, SReg_32_XM0_XEXEC>;
391defm S_BUFFER_ATOMIC_OR           : SM_Pseudo_Atomics <"s_buffer_atomic_or", SReg_128, SReg_32_XM0_XEXEC>;
392defm S_BUFFER_ATOMIC_XOR          : SM_Pseudo_Atomics <"s_buffer_atomic_xor", SReg_128, SReg_32_XM0_XEXEC>;
393defm S_BUFFER_ATOMIC_INC          : SM_Pseudo_Atomics <"s_buffer_atomic_inc", SReg_128, SReg_32_XM0_XEXEC>;
394defm S_BUFFER_ATOMIC_DEC          : SM_Pseudo_Atomics <"s_buffer_atomic_dec", SReg_128, SReg_32_XM0_XEXEC>;
395
396defm S_BUFFER_ATOMIC_SWAP_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_swap_x2", SReg_128, SReg_64_XEXEC>;
397defm S_BUFFER_ATOMIC_CMPSWAP_X2   : SM_Pseudo_Atomics <"s_buffer_atomic_cmpswap_x2", SReg_128, SReg_128>;
398defm S_BUFFER_ATOMIC_ADD_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_add_x2", SReg_128, SReg_64_XEXEC>;
399defm S_BUFFER_ATOMIC_SUB_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_sub_x2", SReg_128, SReg_64_XEXEC>;
400defm S_BUFFER_ATOMIC_SMIN_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_smin_x2", SReg_128, SReg_64_XEXEC>;
401defm S_BUFFER_ATOMIC_UMIN_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_umin_x2", SReg_128, SReg_64_XEXEC>;
402defm S_BUFFER_ATOMIC_SMAX_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_smax_x2", SReg_128, SReg_64_XEXEC>;
403defm S_BUFFER_ATOMIC_UMAX_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_umax_x2", SReg_128, SReg_64_XEXEC>;
404defm S_BUFFER_ATOMIC_AND_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_and_x2", SReg_128, SReg_64_XEXEC>;
405defm S_BUFFER_ATOMIC_OR_X2        : SM_Pseudo_Atomics <"s_buffer_atomic_or_x2", SReg_128, SReg_64_XEXEC>;
406defm S_BUFFER_ATOMIC_XOR_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_xor_x2", SReg_128, SReg_64_XEXEC>;
407defm S_BUFFER_ATOMIC_INC_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_inc_x2", SReg_128, SReg_64_XEXEC>;
408defm S_BUFFER_ATOMIC_DEC_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_dec_x2", SReg_128, SReg_64_XEXEC>;
409}
410
411defm S_ATOMIC_SWAP                : SM_Pseudo_Atomics <"s_atomic_swap", SReg_64, SReg_32_XM0_XEXEC>;
412defm S_ATOMIC_CMPSWAP             : SM_Pseudo_Atomics <"s_atomic_cmpswap", SReg_64, SReg_64_XEXEC>;
413defm S_ATOMIC_ADD                 : SM_Pseudo_Atomics <"s_atomic_add", SReg_64, SReg_32_XM0_XEXEC>;
414defm S_ATOMIC_SUB                 : SM_Pseudo_Atomics <"s_atomic_sub", SReg_64, SReg_32_XM0_XEXEC>;
415defm S_ATOMIC_SMIN                : SM_Pseudo_Atomics <"s_atomic_smin", SReg_64, SReg_32_XM0_XEXEC>;
416defm S_ATOMIC_UMIN                : SM_Pseudo_Atomics <"s_atomic_umin", SReg_64, SReg_32_XM0_XEXEC>;
417defm S_ATOMIC_SMAX                : SM_Pseudo_Atomics <"s_atomic_smax", SReg_64, SReg_32_XM0_XEXEC>;
418defm S_ATOMIC_UMAX                : SM_Pseudo_Atomics <"s_atomic_umax", SReg_64, SReg_32_XM0_XEXEC>;
419defm S_ATOMIC_AND                 : SM_Pseudo_Atomics <"s_atomic_and", SReg_64, SReg_32_XM0_XEXEC>;
420defm S_ATOMIC_OR                  : SM_Pseudo_Atomics <"s_atomic_or", SReg_64, SReg_32_XM0_XEXEC>;
421defm S_ATOMIC_XOR                 : SM_Pseudo_Atomics <"s_atomic_xor", SReg_64, SReg_32_XM0_XEXEC>;
422defm S_ATOMIC_INC                 : SM_Pseudo_Atomics <"s_atomic_inc", SReg_64, SReg_32_XM0_XEXEC>;
423defm S_ATOMIC_DEC                 : SM_Pseudo_Atomics <"s_atomic_dec", SReg_64, SReg_32_XM0_XEXEC>;
424
425defm S_ATOMIC_SWAP_X2             : SM_Pseudo_Atomics <"s_atomic_swap_x2", SReg_64, SReg_64_XEXEC>;
426defm S_ATOMIC_CMPSWAP_X2          : SM_Pseudo_Atomics <"s_atomic_cmpswap_x2", SReg_64, SReg_128>;
427defm S_ATOMIC_ADD_X2              : SM_Pseudo_Atomics <"s_atomic_add_x2", SReg_64, SReg_64_XEXEC>;
428defm S_ATOMIC_SUB_X2              : SM_Pseudo_Atomics <"s_atomic_sub_x2", SReg_64, SReg_64_XEXEC>;
429defm S_ATOMIC_SMIN_X2             : SM_Pseudo_Atomics <"s_atomic_smin_x2", SReg_64, SReg_64_XEXEC>;
430defm S_ATOMIC_UMIN_X2             : SM_Pseudo_Atomics <"s_atomic_umin_x2", SReg_64, SReg_64_XEXEC>;
431defm S_ATOMIC_SMAX_X2             : SM_Pseudo_Atomics <"s_atomic_smax_x2", SReg_64, SReg_64_XEXEC>;
432defm S_ATOMIC_UMAX_X2             : SM_Pseudo_Atomics <"s_atomic_umax_x2", SReg_64, SReg_64_XEXEC>;
433defm S_ATOMIC_AND_X2              : SM_Pseudo_Atomics <"s_atomic_and_x2", SReg_64, SReg_64_XEXEC>;
434defm S_ATOMIC_OR_X2               : SM_Pseudo_Atomics <"s_atomic_or_x2", SReg_64, SReg_64_XEXEC>;
435defm S_ATOMIC_XOR_X2              : SM_Pseudo_Atomics <"s_atomic_xor_x2", SReg_64, SReg_64_XEXEC>;
436defm S_ATOMIC_INC_X2              : SM_Pseudo_Atomics <"s_atomic_inc_x2", SReg_64, SReg_64_XEXEC>;
437defm S_ATOMIC_DEC_X2              : SM_Pseudo_Atomics <"s_atomic_dec_x2", SReg_64, SReg_64_XEXEC>;
438
439} // let SubtargetPredicate = HasScalarAtomics
440
441let SubtargetPredicate = HasScalarAtomics in {
442defm S_DCACHE_DISCARD    : SM_Pseudo_Discards <"s_dcache_discard">;
443defm S_DCACHE_DISCARD_X2 : SM_Pseudo_Discards <"s_dcache_discard_x2">;
444}
445
446//===----------------------------------------------------------------------===//
447// Targets
448//===----------------------------------------------------------------------===//
449
450//===----------------------------------------------------------------------===//
451// SI
452//===----------------------------------------------------------------------===//
453
454class SMRD_Real_si <bits<5> op, SM_Pseudo ps>
455  : SM_Real<ps>
456  , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
457  , Enc32 {
458
459  let AssemblerPredicate = isGFX6GFX7;
460  let DecoderNamespace = "GFX6GFX7";
461
462  let Inst{7-0}   = !if(ps.has_offset, offset{7-0}, ?);
463  let Inst{8}     = imm;
464  let Inst{14-9}  = !if(ps.has_sbase, sbase{6-1}, ?);
465  let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
466  let Inst{26-22} = op;
467  let Inst{31-27} = 0x18; //encoding
468}
469
470// FIXME: Assembler should reject trying to use glc on SMRD
471// instructions on SI.
472multiclass SM_Real_Loads_si<bits<5> op, string ps,
473                            SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
474                            SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
475
476  def _IMM_si : SMRD_Real_si <op, immPs> {
477    let InOperandList = (ins immPs.BaseClass:$sbase, smrd_offset_8:$offset, CPol:$cpol);
478  }
479
480  // FIXME: The operand name $offset is inconsistent with $soff used
481  // in the pseudo
482  def _SGPR_si : SMRD_Real_si <op, sgprPs> {
483    let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, CPol:$cpol);
484  }
485
486}
487
488defm S_LOAD_DWORD           : SM_Real_Loads_si <0x00, "S_LOAD_DWORD">;
489defm S_LOAD_DWORDX2         : SM_Real_Loads_si <0x01, "S_LOAD_DWORDX2">;
490defm S_LOAD_DWORDX4         : SM_Real_Loads_si <0x02, "S_LOAD_DWORDX4">;
491defm S_LOAD_DWORDX8         : SM_Real_Loads_si <0x03, "S_LOAD_DWORDX8">;
492defm S_LOAD_DWORDX16        : SM_Real_Loads_si <0x04, "S_LOAD_DWORDX16">;
493defm S_BUFFER_LOAD_DWORD    : SM_Real_Loads_si <0x08, "S_BUFFER_LOAD_DWORD">;
494defm S_BUFFER_LOAD_DWORDX2  : SM_Real_Loads_si <0x09, "S_BUFFER_LOAD_DWORDX2">;
495defm S_BUFFER_LOAD_DWORDX4  : SM_Real_Loads_si <0x0a, "S_BUFFER_LOAD_DWORDX4">;
496defm S_BUFFER_LOAD_DWORDX8  : SM_Real_Loads_si <0x0b, "S_BUFFER_LOAD_DWORDX8">;
497defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_si <0x0c, "S_BUFFER_LOAD_DWORDX16">;
498
499def S_MEMTIME_si    : SMRD_Real_si <0x1e, S_MEMTIME>;
500def S_DCACHE_INV_si : SMRD_Real_si <0x1f, S_DCACHE_INV>;
501
502
503//===----------------------------------------------------------------------===//
504// VI
505//===----------------------------------------------------------------------===//
506
507class SMEM_Real_vi <bits<8> op, SM_Pseudo ps>
508  : SM_Real<ps>
509  , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.VI>
510  , Enc64 {
511  let AssemblerPredicate = isGFX8GFX9;
512  let DecoderNamespace = "GFX8";
513
514  let Inst{5-0}   = !if(ps.has_sbase, sbase{6-1}, ?);
515  let Inst{12-6}  = !if(ps.has_sdst, sdst{6-0}, ?);
516
517  let Inst{16} = !if(ps.has_glc, cpol{CPolBit.GLC}, ?);
518  let Inst{17} = imm;
519  let Inst{25-18} = op;
520  let Inst{31-26} = 0x30; //encoding
521
522  // VI supports 20-bit unsigned offsets while GFX9+ supports 21-bit signed.
523  // Offset value is corrected accordingly when offset is encoded/decoded.
524  let Inst{38-32} = !if(ps.has_offset, offset{6-0}, ?);
525  let Inst{52-39} = !if(ps.has_offset, !if(imm, offset{20-7}, ?), ?);
526}
527
528multiclass SM_Real_Loads_vi<bits<8> op, string ps,
529                            SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
530                            SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
531  def _IMM_vi : SMEM_Real_vi <op, immPs> {
532    let InOperandList = (ins immPs.BaseClass:$sbase, smem_offset:$offset, CPol:$cpol);
533  }
534  def _SGPR_vi : SMEM_Real_vi <op, sgprPs> {
535    let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, CPol:$cpol);
536  }
537}
538
539class SMEM_Real_Store_vi <bits<8> op, SM_Pseudo ps> : SMEM_Real_vi <op, ps> {
540  // encoding
541  bits<7> sdata;
542
543  let sdst = ?;
544  let Inst{12-6}  = !if(ps.has_sdst, sdata{6-0}, ?);
545}
546
547multiclass SM_Real_Stores_vi<bits<8> op, string ps,
548                            SM_Store_Pseudo immPs = !cast<SM_Store_Pseudo>(ps#_IMM),
549                            SM_Store_Pseudo sgprPs = !cast<SM_Store_Pseudo>(ps#_SGPR)> {
550  // FIXME: The operand name $offset is inconsistent with $soff used
551  // in the pseudo
552  def _IMM_vi : SMEM_Real_Store_vi <op, immPs> {
553    let InOperandList = (ins immPs.SrcClass:$sdata, immPs.BaseClass:$sbase, smem_offset:$offset, CPol:$cpol);
554  }
555
556  def _SGPR_vi : SMEM_Real_Store_vi <op, sgprPs> {
557    let InOperandList = (ins sgprPs.SrcClass:$sdata, sgprPs.BaseClass:$sbase, SReg_32:$offset, CPol:$cpol);
558  }
559}
560
561multiclass SM_Real_Probe_vi<bits<8> op, string ps> {
562  def _IMM_vi  : SMEM_Real_Store_vi <op, !cast<SM_Probe_Pseudo>(ps#_IMM)>;
563  def _SGPR_vi : SMEM_Real_Store_vi <op, !cast<SM_Probe_Pseudo>(ps#_SGPR)>;
564}
565
566defm S_LOAD_DWORD           : SM_Real_Loads_vi <0x00, "S_LOAD_DWORD">;
567defm S_LOAD_DWORDX2         : SM_Real_Loads_vi <0x01, "S_LOAD_DWORDX2">;
568defm S_LOAD_DWORDX4         : SM_Real_Loads_vi <0x02, "S_LOAD_DWORDX4">;
569defm S_LOAD_DWORDX8         : SM_Real_Loads_vi <0x03, "S_LOAD_DWORDX8">;
570defm S_LOAD_DWORDX16        : SM_Real_Loads_vi <0x04, "S_LOAD_DWORDX16">;
571defm S_BUFFER_LOAD_DWORD    : SM_Real_Loads_vi <0x08, "S_BUFFER_LOAD_DWORD">;
572defm S_BUFFER_LOAD_DWORDX2  : SM_Real_Loads_vi <0x09, "S_BUFFER_LOAD_DWORDX2">;
573defm S_BUFFER_LOAD_DWORDX4  : SM_Real_Loads_vi <0x0a, "S_BUFFER_LOAD_DWORDX4">;
574defm S_BUFFER_LOAD_DWORDX8  : SM_Real_Loads_vi <0x0b, "S_BUFFER_LOAD_DWORDX8">;
575defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_vi <0x0c, "S_BUFFER_LOAD_DWORDX16">;
576
577defm S_STORE_DWORD : SM_Real_Stores_vi <0x10, "S_STORE_DWORD">;
578defm S_STORE_DWORDX2 : SM_Real_Stores_vi <0x11, "S_STORE_DWORDX2">;
579defm S_STORE_DWORDX4 : SM_Real_Stores_vi <0x12, "S_STORE_DWORDX4">;
580
581defm S_BUFFER_STORE_DWORD    : SM_Real_Stores_vi <0x18, "S_BUFFER_STORE_DWORD">;
582defm S_BUFFER_STORE_DWORDX2  : SM_Real_Stores_vi <0x19, "S_BUFFER_STORE_DWORDX2">;
583defm S_BUFFER_STORE_DWORDX4  : SM_Real_Stores_vi <0x1a, "S_BUFFER_STORE_DWORDX4">;
584
585// These instructions use same encoding
586def S_DCACHE_INV_vi         : SMEM_Real_vi <0x20, S_DCACHE_INV>;
587def S_DCACHE_WB_vi          : SMEM_Real_vi <0x21, S_DCACHE_WB>;
588def S_DCACHE_INV_VOL_vi     : SMEM_Real_vi <0x22, S_DCACHE_INV_VOL>;
589def S_DCACHE_WB_VOL_vi      : SMEM_Real_vi <0x23, S_DCACHE_WB_VOL>;
590def S_MEMTIME_vi            : SMEM_Real_vi <0x24, S_MEMTIME>;
591def S_MEMREALTIME_vi        : SMEM_Real_vi <0x25, S_MEMREALTIME>;
592
593defm S_SCRATCH_LOAD_DWORD    : SM_Real_Loads_vi <0x05, "S_SCRATCH_LOAD_DWORD">;
594defm S_SCRATCH_LOAD_DWORDX2  : SM_Real_Loads_vi <0x06, "S_SCRATCH_LOAD_DWORDX2">;
595defm S_SCRATCH_LOAD_DWORDX4  : SM_Real_Loads_vi <0x07, "S_SCRATCH_LOAD_DWORDX4">;
596
597defm S_SCRATCH_STORE_DWORD   : SM_Real_Stores_vi <0x15, "S_SCRATCH_STORE_DWORD">;
598defm S_SCRATCH_STORE_DWORDX2 : SM_Real_Stores_vi <0x16, "S_SCRATCH_STORE_DWORDX2">;
599defm S_SCRATCH_STORE_DWORDX4 : SM_Real_Stores_vi <0x17, "S_SCRATCH_STORE_DWORDX4">;
600
601defm S_ATC_PROBE        : SM_Real_Probe_vi <0x26, "S_ATC_PROBE">;
602defm S_ATC_PROBE_BUFFER : SM_Real_Probe_vi <0x27, "S_ATC_PROBE_BUFFER">;
603
604//===----------------------------------------------------------------------===//
605// GFX9
606//===----------------------------------------------------------------------===//
607
608class SMEM_Atomic_Real_vi <bits<8> op, SM_Atomic_Pseudo ps>
609  : SMEM_Real_vi <op, ps>,
610    AtomicNoRet <!subst("_RTN","",NAME), ps.glc> {
611
612  bits<7> sdata;
613
614  let Constraints = ps.Constraints;
615  let DisableEncoding = ps.DisableEncoding;
616
617  let cpol{CPolBit.GLC} = ps.glc;
618  let Inst{12-6} = !if(ps.glc, sdst{6-0}, sdata{6-0});
619}
620
621multiclass SM_Real_Atomics_vi<bits<8> op, string ps> {
622  def _IMM_vi       : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_IMM)>;
623  def _SGPR_vi      : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR)>;
624  def _IMM_RTN_vi   : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_IMM_RTN)>;
625  def _SGPR_RTN_vi  : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR_RTN)>;
626}
627
628defm S_BUFFER_ATOMIC_SWAP         : SM_Real_Atomics_vi <0x40, "S_BUFFER_ATOMIC_SWAP">;
629defm S_BUFFER_ATOMIC_CMPSWAP      : SM_Real_Atomics_vi <0x41, "S_BUFFER_ATOMIC_CMPSWAP">;
630defm S_BUFFER_ATOMIC_ADD          : SM_Real_Atomics_vi <0x42, "S_BUFFER_ATOMIC_ADD">;
631defm S_BUFFER_ATOMIC_SUB          : SM_Real_Atomics_vi <0x43, "S_BUFFER_ATOMIC_SUB">;
632defm S_BUFFER_ATOMIC_SMIN         : SM_Real_Atomics_vi <0x44, "S_BUFFER_ATOMIC_SMIN">;
633defm S_BUFFER_ATOMIC_UMIN         : SM_Real_Atomics_vi <0x45, "S_BUFFER_ATOMIC_UMIN">;
634defm S_BUFFER_ATOMIC_SMAX         : SM_Real_Atomics_vi <0x46, "S_BUFFER_ATOMIC_SMAX">;
635defm S_BUFFER_ATOMIC_UMAX         : SM_Real_Atomics_vi <0x47, "S_BUFFER_ATOMIC_UMAX">;
636defm S_BUFFER_ATOMIC_AND          : SM_Real_Atomics_vi <0x48, "S_BUFFER_ATOMIC_AND">;
637defm S_BUFFER_ATOMIC_OR           : SM_Real_Atomics_vi <0x49, "S_BUFFER_ATOMIC_OR">;
638defm S_BUFFER_ATOMIC_XOR          : SM_Real_Atomics_vi <0x4a, "S_BUFFER_ATOMIC_XOR">;
639defm S_BUFFER_ATOMIC_INC          : SM_Real_Atomics_vi <0x4b, "S_BUFFER_ATOMIC_INC">;
640defm S_BUFFER_ATOMIC_DEC          : SM_Real_Atomics_vi <0x4c, "S_BUFFER_ATOMIC_DEC">;
641
642defm S_BUFFER_ATOMIC_SWAP_X2      : SM_Real_Atomics_vi <0x60, "S_BUFFER_ATOMIC_SWAP_X2">;
643defm S_BUFFER_ATOMIC_CMPSWAP_X2   : SM_Real_Atomics_vi <0x61, "S_BUFFER_ATOMIC_CMPSWAP_X2">;
644defm S_BUFFER_ATOMIC_ADD_X2       : SM_Real_Atomics_vi <0x62, "S_BUFFER_ATOMIC_ADD_X2">;
645defm S_BUFFER_ATOMIC_SUB_X2       : SM_Real_Atomics_vi <0x63, "S_BUFFER_ATOMIC_SUB_X2">;
646defm S_BUFFER_ATOMIC_SMIN_X2      : SM_Real_Atomics_vi <0x64, "S_BUFFER_ATOMIC_SMIN_X2">;
647defm S_BUFFER_ATOMIC_UMIN_X2      : SM_Real_Atomics_vi <0x65, "S_BUFFER_ATOMIC_UMIN_X2">;
648defm S_BUFFER_ATOMIC_SMAX_X2      : SM_Real_Atomics_vi <0x66, "S_BUFFER_ATOMIC_SMAX_X2">;
649defm S_BUFFER_ATOMIC_UMAX_X2      : SM_Real_Atomics_vi <0x67, "S_BUFFER_ATOMIC_UMAX_X2">;
650defm S_BUFFER_ATOMIC_AND_X2       : SM_Real_Atomics_vi <0x68, "S_BUFFER_ATOMIC_AND_X2">;
651defm S_BUFFER_ATOMIC_OR_X2        : SM_Real_Atomics_vi <0x69, "S_BUFFER_ATOMIC_OR_X2">;
652defm S_BUFFER_ATOMIC_XOR_X2       : SM_Real_Atomics_vi <0x6a, "S_BUFFER_ATOMIC_XOR_X2">;
653defm S_BUFFER_ATOMIC_INC_X2       : SM_Real_Atomics_vi <0x6b, "S_BUFFER_ATOMIC_INC_X2">;
654defm S_BUFFER_ATOMIC_DEC_X2       : SM_Real_Atomics_vi <0x6c, "S_BUFFER_ATOMIC_DEC_X2">;
655
656defm S_ATOMIC_SWAP                : SM_Real_Atomics_vi <0x80, "S_ATOMIC_SWAP">;
657defm S_ATOMIC_CMPSWAP             : SM_Real_Atomics_vi <0x81, "S_ATOMIC_CMPSWAP">;
658defm S_ATOMIC_ADD                 : SM_Real_Atomics_vi <0x82, "S_ATOMIC_ADD">;
659defm S_ATOMIC_SUB                 : SM_Real_Atomics_vi <0x83, "S_ATOMIC_SUB">;
660defm S_ATOMIC_SMIN                : SM_Real_Atomics_vi <0x84, "S_ATOMIC_SMIN">;
661defm S_ATOMIC_UMIN                : SM_Real_Atomics_vi <0x85, "S_ATOMIC_UMIN">;
662defm S_ATOMIC_SMAX                : SM_Real_Atomics_vi <0x86, "S_ATOMIC_SMAX">;
663defm S_ATOMIC_UMAX                : SM_Real_Atomics_vi <0x87, "S_ATOMIC_UMAX">;
664defm S_ATOMIC_AND                 : SM_Real_Atomics_vi <0x88, "S_ATOMIC_AND">;
665defm S_ATOMIC_OR                  : SM_Real_Atomics_vi <0x89, "S_ATOMIC_OR">;
666defm S_ATOMIC_XOR                 : SM_Real_Atomics_vi <0x8a, "S_ATOMIC_XOR">;
667defm S_ATOMIC_INC                 : SM_Real_Atomics_vi <0x8b, "S_ATOMIC_INC">;
668defm S_ATOMIC_DEC                 : SM_Real_Atomics_vi <0x8c, "S_ATOMIC_DEC">;
669
670defm S_ATOMIC_SWAP_X2             : SM_Real_Atomics_vi <0xa0, "S_ATOMIC_SWAP_X2">;
671defm S_ATOMIC_CMPSWAP_X2          : SM_Real_Atomics_vi <0xa1, "S_ATOMIC_CMPSWAP_X2">;
672defm S_ATOMIC_ADD_X2              : SM_Real_Atomics_vi <0xa2, "S_ATOMIC_ADD_X2">;
673defm S_ATOMIC_SUB_X2              : SM_Real_Atomics_vi <0xa3, "S_ATOMIC_SUB_X2">;
674defm S_ATOMIC_SMIN_X2             : SM_Real_Atomics_vi <0xa4, "S_ATOMIC_SMIN_X2">;
675defm S_ATOMIC_UMIN_X2             : SM_Real_Atomics_vi <0xa5, "S_ATOMIC_UMIN_X2">;
676defm S_ATOMIC_SMAX_X2             : SM_Real_Atomics_vi <0xa6, "S_ATOMIC_SMAX_X2">;
677defm S_ATOMIC_UMAX_X2             : SM_Real_Atomics_vi <0xa7, "S_ATOMIC_UMAX_X2">;
678defm S_ATOMIC_AND_X2              : SM_Real_Atomics_vi <0xa8, "S_ATOMIC_AND_X2">;
679defm S_ATOMIC_OR_X2               : SM_Real_Atomics_vi <0xa9, "S_ATOMIC_OR_X2">;
680defm S_ATOMIC_XOR_X2              : SM_Real_Atomics_vi <0xaa, "S_ATOMIC_XOR_X2">;
681defm S_ATOMIC_INC_X2              : SM_Real_Atomics_vi <0xab, "S_ATOMIC_INC_X2">;
682defm S_ATOMIC_DEC_X2              : SM_Real_Atomics_vi <0xac, "S_ATOMIC_DEC_X2">;
683
684multiclass SM_Real_Discard_vi<bits<8> op, string ps> {
685  def _IMM_vi  : SMEM_Real_vi <op, !cast<SM_Discard_Pseudo>(ps#_IMM)>;
686  def _SGPR_vi : SMEM_Real_vi <op, !cast<SM_Discard_Pseudo>(ps#_SGPR)>;
687}
688
689defm S_DCACHE_DISCARD    : SM_Real_Discard_vi <0x28, "S_DCACHE_DISCARD">;
690defm S_DCACHE_DISCARD_X2 : SM_Real_Discard_vi <0x29, "S_DCACHE_DISCARD_X2">;
691
692//===----------------------------------------------------------------------===//
693// CI
694//===----------------------------------------------------------------------===//
695
696def smrd_literal_offset : NamedOperandU32<"SMRDLiteralOffset",
697                                          NamedMatchClass<"SMRDLiteralOffset">> {
698  let OperandType = "OPERAND_IMMEDIATE";
699}
700
701class SMRD_Real_Load_IMM_ci <bits<5> op, SM_Load_Pseudo ps> :
702  SM_Real<ps>,
703  Enc64 {
704
705  let AssemblerPredicate = isGFX7Only;
706  let DecoderNamespace = "GFX7";
707  let InOperandList = (ins ps.BaseClass:$sbase, smrd_literal_offset:$offset, CPol:$cpol);
708
709  let Inst{7-0}   = 0xff;
710  let Inst{8}     = 0;
711  let Inst{14-9}  = sbase{6-1};
712  let Inst{21-15} = sdst{6-0};
713  let Inst{26-22} = op;
714  let Inst{31-27} = 0x18; //encoding
715  let Inst{63-32} = offset{31-0};
716}
717
718def S_LOAD_DWORD_IMM_ci           : SMRD_Real_Load_IMM_ci <0x00, S_LOAD_DWORD_IMM>;
719def S_LOAD_DWORDX2_IMM_ci         : SMRD_Real_Load_IMM_ci <0x01, S_LOAD_DWORDX2_IMM>;
720def S_LOAD_DWORDX4_IMM_ci         : SMRD_Real_Load_IMM_ci <0x02, S_LOAD_DWORDX4_IMM>;
721def S_LOAD_DWORDX8_IMM_ci         : SMRD_Real_Load_IMM_ci <0x03, S_LOAD_DWORDX8_IMM>;
722def S_LOAD_DWORDX16_IMM_ci        : SMRD_Real_Load_IMM_ci <0x04, S_LOAD_DWORDX16_IMM>;
723def S_BUFFER_LOAD_DWORD_IMM_ci    : SMRD_Real_Load_IMM_ci <0x08, S_BUFFER_LOAD_DWORD_IMM>;
724def S_BUFFER_LOAD_DWORDX2_IMM_ci  : SMRD_Real_Load_IMM_ci <0x09, S_BUFFER_LOAD_DWORDX2_IMM>;
725def S_BUFFER_LOAD_DWORDX4_IMM_ci  : SMRD_Real_Load_IMM_ci <0x0a, S_BUFFER_LOAD_DWORDX4_IMM>;
726def S_BUFFER_LOAD_DWORDX8_IMM_ci  : SMRD_Real_Load_IMM_ci <0x0b, S_BUFFER_LOAD_DWORDX8_IMM>;
727def S_BUFFER_LOAD_DWORDX16_IMM_ci : SMRD_Real_Load_IMM_ci <0x0c, S_BUFFER_LOAD_DWORDX16_IMM>;
728
729class SMRD_Real_ci <bits<5> op, SM_Pseudo ps>
730  : SM_Real<ps>
731  , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
732  , Enc32 {
733
734  let AssemblerPredicate = isGFX7Only;
735  let DecoderNamespace = "GFX7";
736
737  let Inst{7-0}   = !if(ps.has_offset, offset{7-0}, ?);
738  let Inst{8}     = imm;
739  let Inst{14-9}  = !if(ps.has_sbase, sbase{6-1}, ?);
740  let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
741  let Inst{26-22} = op;
742  let Inst{31-27} = 0x18; //encoding
743}
744
745def S_DCACHE_INV_VOL_ci : SMRD_Real_ci <0x1d, S_DCACHE_INV_VOL>;
746
747//===----------------------------------------------------------------------===//
748// Scalar Memory Patterns
749//===----------------------------------------------------------------------===//
750
751def smrd_load : PatFrag <(ops node:$ptr), (load node:$ptr), [{ return isUniformLoad(N);}]> {
752  let GISelPredicateCode = [{
753    if (!MI.hasOneMemOperand())
754      return false;
755    if (!isInstrUniform(MI))
756      return false;
757
758    // FIXME: We should probably be caching this.
759    SmallVector<GEPInfo, 4> AddrInfo;
760    getAddrModeInfo(MI, MRI, AddrInfo);
761
762    if (hasVgprParts(AddrInfo))
763      return false;
764    return true;
765  }];
766}
767
768def SMRDImm         : ComplexPattern<i64, 2, "SelectSMRDImm">;
769def SMRDImm32       : ComplexPattern<i64, 2, "SelectSMRDImm32">;
770def SMRDSgpr        : ComplexPattern<i64, 2, "SelectSMRDSgpr">;
771def SMRDBufferImm   : ComplexPattern<i32, 1, "SelectSMRDBufferImm">;
772def SMRDBufferImm32 : ComplexPattern<i32, 1, "SelectSMRDBufferImm32">;
773
774multiclass SMRD_Pattern <string Instr, ValueType vt> {
775
776  // 1. IMM offset
777  def : GCNPat <
778    (smrd_load (SMRDImm i64:$sbase, i32:$offset)),
779    (vt (!cast<SM_Pseudo>(Instr#"_IMM") $sbase, $offset, 0))
780  >;
781
782  // 2. 32-bit IMM offset on CI
783  def : GCNPat <
784    (smrd_load (SMRDImm32 i64:$sbase, i32:$offset)),
785    (vt (!cast<InstSI>(Instr#"_IMM_ci") $sbase, $offset, 0))> {
786    let OtherPredicates = [isGFX7Only];
787  }
788
789  // 3. SGPR offset
790  def : GCNPat <
791    (smrd_load (SMRDSgpr i64:$sbase, i32:$offset)),
792    (vt (!cast<SM_Pseudo>(Instr#"_SGPR") $sbase, $offset, 0))
793  >;
794
795  // 4. No offset
796  def : GCNPat <
797    (vt (smrd_load (i64 SReg_64:$sbase))),
798    (vt (!cast<SM_Pseudo>(Instr#"_IMM") i64:$sbase, 0, 0))
799  >;
800}
801
802multiclass SMLoad_Pattern <string Instr, ValueType vt> {
803  // 1. Offset as an immediate
804  def : GCNPat <
805    (SIsbuffer_load v4i32:$sbase, (SMRDBufferImm i32:$offset), timm:$cachepolicy),
806    (vt (!cast<SM_Pseudo>(Instr#"_IMM") SReg_128:$sbase, i32imm:$offset, (extract_cpol $cachepolicy)))> {
807    let AddedComplexity = 2;
808  }
809
810  // 2. 32-bit IMM offset on CI
811  def : GCNPat <
812    (vt (SIsbuffer_load v4i32:$sbase, (SMRDBufferImm32 i32:$offset), timm:$cachepolicy)),
813    (!cast<InstSI>(Instr#"_IMM_ci") SReg_128:$sbase, smrd_literal_offset:$offset,
814                                    (extract_cpol $cachepolicy))> {
815    let OtherPredicates = [isGFX7Only];
816    let AddedComplexity = 1;
817  }
818
819  // 3. Offset loaded in an 32bit SGPR
820  def : GCNPat <
821    (SIsbuffer_load v4i32:$sbase, i32:$offset, timm:$cachepolicy),
822    (vt (!cast<SM_Pseudo>(Instr#"_SGPR") SReg_128:$sbase, SReg_32:$offset, (extract_cpol $cachepolicy)))
823  >;
824}
825
826// Global and constant loads can be selected to either MUBUF or SMRD
827// instructions, but SMRD instructions are faster so we want the instruction
828// selector to prefer those.
829let AddedComplexity = 100 in {
830
831foreach vt = Reg32Types.types in {
832defm : SMRD_Pattern <"S_LOAD_DWORD", vt>;
833}
834
835foreach vt = SReg_64.RegTypes in {
836defm : SMRD_Pattern <"S_LOAD_DWORDX2", vt>;
837}
838
839foreach vt = SReg_128.RegTypes in {
840defm : SMRD_Pattern <"S_LOAD_DWORDX4", vt>;
841}
842
843foreach vt = SReg_256.RegTypes in {
844defm : SMRD_Pattern <"S_LOAD_DWORDX8", vt>;
845}
846
847foreach vt = SReg_512.RegTypes in {
848defm : SMRD_Pattern <"S_LOAD_DWORDX16", vt>;
849}
850
851defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORD",     i32>;
852defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX2",   v2i32>;
853defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX4",   v4i32>;
854defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX8",   v8i32>;
855defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX16",  v16i32>;
856
857defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORD",     f32>;
858defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX2",   v2f32>;
859defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX4",   v4f32>;
860defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX8",   v8f32>;
861defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX16",  v16f32>;
862} // End let AddedComplexity = 100
863
864let OtherPredicates = [HasSMemTimeInst] in {
865def : GCNPat <
866  (i64 (readcyclecounter)),
867  (S_MEMTIME)
868>;
869} // let OtherPredicates = [HasSMemTimeInst]
870
871let OtherPredicates = [HasShaderCyclesRegister] in {
872def : GCNPat <
873  (i64 (readcyclecounter)),
874  (REG_SEQUENCE SReg_64,
875    (S_GETREG_B32 getHwRegImm<HWREG.SHADER_CYCLES, 0, -12>.ret), sub0,
876    (S_MOV_B32 (i32 0)), sub1)> {
877  // Prefer this to s_memtime because it has lower and more predictable latency.
878  let AddedComplexity = 1;
879}
880} // let OtherPredicates = [HasShaderCyclesRegister]
881
882//===----------------------------------------------------------------------===//
883// GFX10.
884//===----------------------------------------------------------------------===//
885
886class SMEM_Real_gfx10<bits<8> op, SM_Pseudo ps> :
887    SM_Real<ps>, SIMCInstr<ps.PseudoInstr, SIEncodingFamily.GFX10>, Enc64 {
888  let AssemblerPredicate = isGFX10Plus;
889  let DecoderNamespace = "GFX10";
890
891  let Inst{5-0}   = !if(ps.has_sbase, sbase{6-1}, ?);
892  let Inst{12-6}  = !if(ps.has_sdst, sdst{6-0}, ?);
893  let Inst{14}    = !if(ps.has_dlc, cpol{CPolBit.DLC}, ?);
894  let Inst{16}    = !if(ps.has_glc, cpol{CPolBit.GLC}, ?);
895  let Inst{25-18} = op;
896  let Inst{31-26} = 0x3d;
897  let Inst{52-32} = !if(ps.offset_is_imm, !if(ps.has_offset, offset{20-0}, ?), ?);
898  let Inst{63-57} = !if(ps.offset_is_imm, !cast<int>(SGPR_NULL.HWEncoding),
899                                          !if(ps.has_offset, offset{6-0}, ?));
900}
901
902multiclass SM_Real_Loads_gfx10<bits<8> op, string ps,
903                               SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
904                               SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
905  def _IMM_gfx10 : SMEM_Real_gfx10<op, immPs> {
906    let InOperandList = (ins immPs.BaseClass:$sbase, smem_offset:$offset, CPol:$cpol);
907  }
908  def _SGPR_gfx10 : SMEM_Real_gfx10<op, sgprPs> {
909    let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, CPol:$cpol);
910  }
911}
912
913class SMEM_Real_Store_gfx10<bits<8> op, SM_Pseudo ps> : SMEM_Real_gfx10<op, ps> {
914  bits<7> sdata;
915
916  let sdst = ?;
917  let Inst{12-6} = !if(ps.has_sdst, sdata{6-0}, ?);
918}
919
920multiclass SM_Real_Stores_gfx10<bits<8> op, string ps,
921                                SM_Store_Pseudo immPs = !cast<SM_Store_Pseudo>(ps#_IMM),
922                                SM_Store_Pseudo sgprPs = !cast<SM_Store_Pseudo>(ps#_SGPR)> {
923  // FIXME: The operand name $offset is inconsistent with $soff used
924  // in the pseudo
925  def _IMM_gfx10 : SMEM_Real_Store_gfx10 <op, immPs> {
926    let InOperandList = (ins immPs.SrcClass:$sdata, immPs.BaseClass:$sbase, smem_offset:$offset, CPol:$cpol);
927  }
928
929  def _SGPR_gfx10 : SMEM_Real_Store_gfx10 <op, sgprPs> {
930    let InOperandList = (ins sgprPs.SrcClass:$sdata, sgprPs.BaseClass:$sbase, SReg_32:$offset, CPol:$cpol);
931  }
932}
933
934defm S_LOAD_DWORD            : SM_Real_Loads_gfx10<0x000, "S_LOAD_DWORD">;
935defm S_LOAD_DWORDX2          : SM_Real_Loads_gfx10<0x001, "S_LOAD_DWORDX2">;
936defm S_LOAD_DWORDX4          : SM_Real_Loads_gfx10<0x002, "S_LOAD_DWORDX4">;
937defm S_LOAD_DWORDX8          : SM_Real_Loads_gfx10<0x003, "S_LOAD_DWORDX8">;
938defm S_LOAD_DWORDX16         : SM_Real_Loads_gfx10<0x004, "S_LOAD_DWORDX16">;
939
940let SubtargetPredicate = HasScalarFlatScratchInsts in {
941defm S_SCRATCH_LOAD_DWORD    : SM_Real_Loads_gfx10<0x005, "S_SCRATCH_LOAD_DWORD">;
942defm S_SCRATCH_LOAD_DWORDX2  : SM_Real_Loads_gfx10<0x006, "S_SCRATCH_LOAD_DWORDX2">;
943defm S_SCRATCH_LOAD_DWORDX4  : SM_Real_Loads_gfx10<0x007, "S_SCRATCH_LOAD_DWORDX4">;
944} // End SubtargetPredicate = HasScalarFlatScratchInsts
945
946defm S_BUFFER_LOAD_DWORD     : SM_Real_Loads_gfx10<0x008, "S_BUFFER_LOAD_DWORD">;
947defm S_BUFFER_LOAD_DWORDX2   : SM_Real_Loads_gfx10<0x009, "S_BUFFER_LOAD_DWORDX2">;
948defm S_BUFFER_LOAD_DWORDX4   : SM_Real_Loads_gfx10<0x00a, "S_BUFFER_LOAD_DWORDX4">;
949defm S_BUFFER_LOAD_DWORDX8   : SM_Real_Loads_gfx10<0x00b, "S_BUFFER_LOAD_DWORDX8">;
950defm S_BUFFER_LOAD_DWORDX16  : SM_Real_Loads_gfx10<0x00c, "S_BUFFER_LOAD_DWORDX16">;
951
952let SubtargetPredicate = HasScalarStores in {
953defm S_STORE_DWORD           : SM_Real_Stores_gfx10<0x010, "S_STORE_DWORD">;
954defm S_STORE_DWORDX2         : SM_Real_Stores_gfx10<0x011, "S_STORE_DWORDX2">;
955defm S_STORE_DWORDX4         : SM_Real_Stores_gfx10<0x012, "S_STORE_DWORDX4">;
956let OtherPredicates = [HasScalarFlatScratchInsts] in {
957defm S_SCRATCH_STORE_DWORD   : SM_Real_Stores_gfx10<0x015, "S_SCRATCH_STORE_DWORD">;
958defm S_SCRATCH_STORE_DWORDX2 : SM_Real_Stores_gfx10<0x016, "S_SCRATCH_STORE_DWORDX2">;
959defm S_SCRATCH_STORE_DWORDX4 : SM_Real_Stores_gfx10<0x017, "S_SCRATCH_STORE_DWORDX4">;
960} // End OtherPredicates = [HasScalarFlatScratchInsts]
961defm S_BUFFER_STORE_DWORD    : SM_Real_Stores_gfx10<0x018, "S_BUFFER_STORE_DWORD">;
962defm S_BUFFER_STORE_DWORDX2  : SM_Real_Stores_gfx10<0x019, "S_BUFFER_STORE_DWORDX2">;
963defm S_BUFFER_STORE_DWORDX4  : SM_Real_Stores_gfx10<0x01a, "S_BUFFER_STORE_DWORDX4">;
964} // End SubtargetPredicate = HasScalarStores
965
966def S_MEMREALTIME_gfx10              : SMEM_Real_gfx10<0x025, S_MEMREALTIME>;
967def S_MEMTIME_gfx10                  : SMEM_Real_gfx10<0x024, S_MEMTIME>;
968def S_GL1_INV_gfx10                  : SMEM_Real_gfx10<0x01f, S_GL1_INV>;
969def S_GET_WAVEID_IN_WORKGROUP_gfx10  : SMEM_Real_gfx10<0x02a, S_GET_WAVEID_IN_WORKGROUP>;
970def S_DCACHE_INV_gfx10               : SMEM_Real_gfx10<0x020, S_DCACHE_INV>;
971
972let SubtargetPredicate = HasScalarStores in {
973def S_DCACHE_WB_gfx10                : SMEM_Real_gfx10<0x021, S_DCACHE_WB>;
974} // End SubtargetPredicate = HasScalarStores
975
976multiclass SM_Real_Probe_gfx10<bits<8> op, string ps> {
977  def _IMM_gfx10  : SMEM_Real_Store_gfx10 <op, !cast<SM_Pseudo>(ps#_IMM)>;
978  def _SGPR_gfx10 : SMEM_Real_Store_gfx10 <op, !cast<SM_Pseudo>(ps#_SGPR)>;
979}
980
981defm S_ATC_PROBE        : SM_Real_Probe_gfx10 <0x26, "S_ATC_PROBE">;
982defm S_ATC_PROBE_BUFFER : SM_Real_Probe_gfx10 <0x27, "S_ATC_PROBE_BUFFER">;
983
984class SMEM_Atomic_Real_gfx10 <bits<8> op, SM_Atomic_Pseudo ps>
985  : SMEM_Real_gfx10 <op, ps>,
986    AtomicNoRet <!subst("_RTN","",NAME), ps.glc> {
987
988  bits<7> sdata;
989
990  let Constraints = ps.Constraints;
991  let DisableEncoding = ps.DisableEncoding;
992
993  let cpol{CPolBit.GLC} = ps.glc;
994
995  let Inst{14} = !if(ps.has_dlc, cpol{CPolBit.DLC}, 0);
996  let Inst{12-6} = !if(ps.glc, sdst{6-0}, sdata{6-0});
997}
998
999multiclass SM_Real_Atomics_gfx10<bits<8> op, string ps> {
1000  def _IMM_gfx10       : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_IMM)>;
1001  def _SGPR_gfx10      : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR)>;
1002  def _IMM_RTN_gfx10   : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_IMM_RTN)>;
1003  def _SGPR_RTN_gfx10  : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR_RTN)>;
1004}
1005
1006let SubtargetPredicate = HasScalarAtomics in {
1007
1008defm S_BUFFER_ATOMIC_SWAP         : SM_Real_Atomics_gfx10 <0x40, "S_BUFFER_ATOMIC_SWAP">;
1009defm S_BUFFER_ATOMIC_CMPSWAP      : SM_Real_Atomics_gfx10 <0x41, "S_BUFFER_ATOMIC_CMPSWAP">;
1010defm S_BUFFER_ATOMIC_ADD          : SM_Real_Atomics_gfx10 <0x42, "S_BUFFER_ATOMIC_ADD">;
1011defm S_BUFFER_ATOMIC_SUB          : SM_Real_Atomics_gfx10 <0x43, "S_BUFFER_ATOMIC_SUB">;
1012defm S_BUFFER_ATOMIC_SMIN         : SM_Real_Atomics_gfx10 <0x44, "S_BUFFER_ATOMIC_SMIN">;
1013defm S_BUFFER_ATOMIC_UMIN         : SM_Real_Atomics_gfx10 <0x45, "S_BUFFER_ATOMIC_UMIN">;
1014defm S_BUFFER_ATOMIC_SMAX         : SM_Real_Atomics_gfx10 <0x46, "S_BUFFER_ATOMIC_SMAX">;
1015defm S_BUFFER_ATOMIC_UMAX         : SM_Real_Atomics_gfx10 <0x47, "S_BUFFER_ATOMIC_UMAX">;
1016defm S_BUFFER_ATOMIC_AND          : SM_Real_Atomics_gfx10 <0x48, "S_BUFFER_ATOMIC_AND">;
1017defm S_BUFFER_ATOMIC_OR           : SM_Real_Atomics_gfx10 <0x49, "S_BUFFER_ATOMIC_OR">;
1018defm S_BUFFER_ATOMIC_XOR          : SM_Real_Atomics_gfx10 <0x4a, "S_BUFFER_ATOMIC_XOR">;
1019defm S_BUFFER_ATOMIC_INC          : SM_Real_Atomics_gfx10 <0x4b, "S_BUFFER_ATOMIC_INC">;
1020defm S_BUFFER_ATOMIC_DEC          : SM_Real_Atomics_gfx10 <0x4c, "S_BUFFER_ATOMIC_DEC">;
1021
1022defm S_BUFFER_ATOMIC_SWAP_X2      : SM_Real_Atomics_gfx10 <0x60, "S_BUFFER_ATOMIC_SWAP_X2">;
1023defm S_BUFFER_ATOMIC_CMPSWAP_X2   : SM_Real_Atomics_gfx10 <0x61, "S_BUFFER_ATOMIC_CMPSWAP_X2">;
1024defm S_BUFFER_ATOMIC_ADD_X2       : SM_Real_Atomics_gfx10 <0x62, "S_BUFFER_ATOMIC_ADD_X2">;
1025defm S_BUFFER_ATOMIC_SUB_X2       : SM_Real_Atomics_gfx10 <0x63, "S_BUFFER_ATOMIC_SUB_X2">;
1026defm S_BUFFER_ATOMIC_SMIN_X2      : SM_Real_Atomics_gfx10 <0x64, "S_BUFFER_ATOMIC_SMIN_X2">;
1027defm S_BUFFER_ATOMIC_UMIN_X2      : SM_Real_Atomics_gfx10 <0x65, "S_BUFFER_ATOMIC_UMIN_X2">;
1028defm S_BUFFER_ATOMIC_SMAX_X2      : SM_Real_Atomics_gfx10 <0x66, "S_BUFFER_ATOMIC_SMAX_X2">;
1029defm S_BUFFER_ATOMIC_UMAX_X2      : SM_Real_Atomics_gfx10 <0x67, "S_BUFFER_ATOMIC_UMAX_X2">;
1030defm S_BUFFER_ATOMIC_AND_X2       : SM_Real_Atomics_gfx10 <0x68, "S_BUFFER_ATOMIC_AND_X2">;
1031defm S_BUFFER_ATOMIC_OR_X2        : SM_Real_Atomics_gfx10 <0x69, "S_BUFFER_ATOMIC_OR_X2">;
1032defm S_BUFFER_ATOMIC_XOR_X2       : SM_Real_Atomics_gfx10 <0x6a, "S_BUFFER_ATOMIC_XOR_X2">;
1033defm S_BUFFER_ATOMIC_INC_X2       : SM_Real_Atomics_gfx10 <0x6b, "S_BUFFER_ATOMIC_INC_X2">;
1034defm S_BUFFER_ATOMIC_DEC_X2       : SM_Real_Atomics_gfx10 <0x6c, "S_BUFFER_ATOMIC_DEC_X2">;
1035
1036defm S_ATOMIC_SWAP                : SM_Real_Atomics_gfx10 <0x80, "S_ATOMIC_SWAP">;
1037defm S_ATOMIC_CMPSWAP             : SM_Real_Atomics_gfx10 <0x81, "S_ATOMIC_CMPSWAP">;
1038defm S_ATOMIC_ADD                 : SM_Real_Atomics_gfx10 <0x82, "S_ATOMIC_ADD">;
1039defm S_ATOMIC_SUB                 : SM_Real_Atomics_gfx10 <0x83, "S_ATOMIC_SUB">;
1040defm S_ATOMIC_SMIN                : SM_Real_Atomics_gfx10 <0x84, "S_ATOMIC_SMIN">;
1041defm S_ATOMIC_UMIN                : SM_Real_Atomics_gfx10 <0x85, "S_ATOMIC_UMIN">;
1042defm S_ATOMIC_SMAX                : SM_Real_Atomics_gfx10 <0x86, "S_ATOMIC_SMAX">;
1043defm S_ATOMIC_UMAX                : SM_Real_Atomics_gfx10 <0x87, "S_ATOMIC_UMAX">;
1044defm S_ATOMIC_AND                 : SM_Real_Atomics_gfx10 <0x88, "S_ATOMIC_AND">;
1045defm S_ATOMIC_OR                  : SM_Real_Atomics_gfx10 <0x89, "S_ATOMIC_OR">;
1046defm S_ATOMIC_XOR                 : SM_Real_Atomics_gfx10 <0x8a, "S_ATOMIC_XOR">;
1047defm S_ATOMIC_INC                 : SM_Real_Atomics_gfx10 <0x8b, "S_ATOMIC_INC">;
1048defm S_ATOMIC_DEC                 : SM_Real_Atomics_gfx10 <0x8c, "S_ATOMIC_DEC">;
1049
1050defm S_ATOMIC_SWAP_X2             : SM_Real_Atomics_gfx10 <0xa0, "S_ATOMIC_SWAP_X2">;
1051defm S_ATOMIC_CMPSWAP_X2          : SM_Real_Atomics_gfx10 <0xa1, "S_ATOMIC_CMPSWAP_X2">;
1052defm S_ATOMIC_ADD_X2              : SM_Real_Atomics_gfx10 <0xa2, "S_ATOMIC_ADD_X2">;
1053defm S_ATOMIC_SUB_X2              : SM_Real_Atomics_gfx10 <0xa3, "S_ATOMIC_SUB_X2">;
1054defm S_ATOMIC_SMIN_X2             : SM_Real_Atomics_gfx10 <0xa4, "S_ATOMIC_SMIN_X2">;
1055defm S_ATOMIC_UMIN_X2             : SM_Real_Atomics_gfx10 <0xa5, "S_ATOMIC_UMIN_X2">;
1056defm S_ATOMIC_SMAX_X2             : SM_Real_Atomics_gfx10 <0xa6, "S_ATOMIC_SMAX_X2">;
1057defm S_ATOMIC_UMAX_X2             : SM_Real_Atomics_gfx10 <0xa7, "S_ATOMIC_UMAX_X2">;
1058defm S_ATOMIC_AND_X2              : SM_Real_Atomics_gfx10 <0xa8, "S_ATOMIC_AND_X2">;
1059defm S_ATOMIC_OR_X2               : SM_Real_Atomics_gfx10 <0xa9, "S_ATOMIC_OR_X2">;
1060defm S_ATOMIC_XOR_X2              : SM_Real_Atomics_gfx10 <0xaa, "S_ATOMIC_XOR_X2">;
1061defm S_ATOMIC_INC_X2              : SM_Real_Atomics_gfx10 <0xab, "S_ATOMIC_INC_X2">;
1062defm S_ATOMIC_DEC_X2              : SM_Real_Atomics_gfx10 <0xac, "S_ATOMIC_DEC_X2">;
1063
1064multiclass SM_Real_Discard_gfx10<bits<8> op, string ps> {
1065  def _IMM_gfx10  : SMEM_Real_gfx10 <op, !cast<SM_Pseudo>(ps#_IMM)>;
1066  def _SGPR_gfx10 : SMEM_Real_gfx10 <op, !cast<SM_Pseudo>(ps#_SGPR)>;
1067}
1068
1069defm S_DCACHE_DISCARD    : SM_Real_Discard_gfx10 <0x28, "S_DCACHE_DISCARD">;
1070defm S_DCACHE_DISCARD_X2 : SM_Real_Discard_gfx10 <0x29, "S_DCACHE_DISCARD_X2">;
1071
1072} // End SubtargetPredicate = HasScalarAtomics
1073
1074def SMInfoTable : GenericTable {
1075  let FilterClass = "SM_Real";
1076  let CppTypeName = "SMInfo";
1077  let Fields = ["Opcode", "is_buffer"];
1078
1079  let PrimaryKey = ["Opcode"];
1080  let PrimaryKeyName = "getSMEMOpcodeHelper";
1081}
1082