xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/SMInstructions.td (revision 90ec6a30353aa7caaf995ea50e2e23aa5a099600)
1//===---- SMInstructions.td - Scalar Memory Instruction Definitions -------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9def smrd_offset_8 : NamedOperandU32<"SMRDOffset8",
10                                  NamedMatchClass<"SMRDOffset8">> {
11  let OperandType = "OPERAND_IMMEDIATE";
12}
13
14def smem_offset : NamedOperandU32<"SMEMOffset",
15                                  NamedMatchClass<"SMEMOffset">> {
16  let OperandType = "OPERAND_IMMEDIATE";
17  let EncoderMethod = "getSMEMOffsetEncoding";
18  let DecoderMethod = "decodeSMEMOffset";
19}
20
21//===----------------------------------------------------------------------===//
22// Scalar Memory classes
23//===----------------------------------------------------------------------===//
24
25class SM_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]> :
26  InstSI <outs, ins, "", pattern>,
27  SIMCInstr<opName, SIEncodingFamily.NONE> {
28  let isPseudo = 1;
29  let isCodeGenOnly = 1;
30
31  let LGKM_CNT = 1;
32  let SMRD = 1;
33  let mayStore = 0;
34  let mayLoad = 1;
35  let hasSideEffects = 0;
36  let UseNamedOperandTable = 1;
37  let SchedRW = [WriteSMEM];
38
39  string Mnemonic = opName;
40  string AsmOperands = asmOps;
41
42  bits<1> has_sbase = 1;
43  bits<1> has_sdst = 1;
44  bit has_glc = 0;
45  bit has_dlc = 0;
46  bits<1> has_offset = 1;
47  bits<1> offset_is_imm = 0;
48  bit is_buffer = 0;
49}
50
51class SM_Real <SM_Pseudo ps>
52  : InstSI<ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []> {
53
54  let isPseudo = 0;
55  let isCodeGenOnly = 0;
56
57  Instruction Opcode = !cast<Instruction>(NAME);
58
59  // copy relevant pseudo op flags
60  let SubtargetPredicate = ps.SubtargetPredicate;
61  let AsmMatchConverter  = ps.AsmMatchConverter;
62  let UseNamedOperandTable = ps.UseNamedOperandTable;
63  let SMRD = ps.SMRD;
64
65  bit is_buffer = ps.is_buffer;
66
67  // encoding
68  bits<7>  sbase;
69  bits<7>  sdst;
70  bits<32> offset;
71  bits<1> imm = !if(ps.has_offset, ps.offset_is_imm, 0);
72}
73
74class SM_Probe_Pseudo <string opName, dag ins, bit isImm>
75  : SM_Pseudo<opName, (outs), ins, " $sdata, $sbase, $offset"> {
76  let mayLoad = 0;
77  let mayStore = 0;
78  let has_glc = 0;
79  let LGKM_CNT = 0;
80  let ScalarStore = 0;
81  let hasSideEffects = 1;
82  let offset_is_imm = isImm;
83  let PseudoInstr = opName # !if(isImm, "_IMM", "_SGPR");
84}
85
86class SM_Load_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]>
87  : SM_Pseudo<opName, outs, ins, asmOps, pattern> {
88  RegisterClass BaseClass;
89  let mayLoad = 1;
90  let mayStore = 0;
91  let has_glc = 1;
92  let has_dlc = 1;
93}
94
95class SM_Store_Pseudo <string opName, dag ins, string asmOps, list<dag> pattern = []>
96  : SM_Pseudo<opName, (outs), ins, asmOps, pattern> {
97  RegisterClass BaseClass;
98  RegisterClass SrcClass;
99  let mayLoad = 0;
100  let mayStore = 1;
101  let has_glc = 1;
102  let has_dlc = 1;
103  let ScalarStore = 1;
104}
105
106class SM_Discard_Pseudo <string opName, dag ins, bit isImm>
107  : SM_Pseudo<opName, (outs), ins, " $sbase, $offset"> {
108  let mayLoad = 0;
109  let mayStore = 0;
110  let has_glc = 0;
111  let has_sdst = 0;
112  let ScalarStore = 0;
113  let hasSideEffects = 1;
114  let offset_is_imm = isImm;
115  let PseudoInstr = opName # !if(isImm, "_IMM", "_SGPR");
116}
117
118multiclass SM_Pseudo_Loads<string opName,
119                           RegisterClass baseClass,
120                           RegisterClass dstClass> {
121  def _IMM  : SM_Load_Pseudo <opName,
122                              (outs dstClass:$sdst),
123                              (ins baseClass:$sbase, i32imm:$offset, i1imm:$glc, i1imm:$dlc),
124                              " $sdst, $sbase, $offset$glc$dlc", []> {
125    let offset_is_imm = 1;
126    let BaseClass = baseClass;
127    let PseudoInstr = opName # "_IMM";
128    let has_glc = 1;
129    let has_dlc = 1;
130  }
131
132  def _SGPR  : SM_Load_Pseudo <opName,
133                              (outs dstClass:$sdst),
134                              (ins baseClass:$sbase, SReg_32:$soff, i1imm:$glc, i1imm:$dlc),
135                              " $sdst, $sbase, $offset$glc$dlc", []> {
136    let BaseClass = baseClass;
137    let PseudoInstr = opName # "_SGPR";
138    let has_glc = 1;
139    let has_dlc = 1;
140  }
141}
142
143multiclass SM_Pseudo_Stores<string opName,
144                           RegisterClass baseClass,
145                           RegisterClass srcClass> {
146  def _IMM  : SM_Store_Pseudo <opName,
147    (ins srcClass:$sdata, baseClass:$sbase, i32imm:$offset, i1imm:$glc, i1imm:$dlc),
148    " $sdata, $sbase, $offset$glc$dlc", []> {
149    let offset_is_imm = 1;
150    let BaseClass = baseClass;
151    let SrcClass = srcClass;
152    let PseudoInstr = opName # "_IMM";
153  }
154
155  def _SGPR  : SM_Store_Pseudo <opName,
156    (ins srcClass:$sdata, baseClass:$sbase, SReg_32:$soff, i1imm:$glc, i1imm:$dlc),
157    " $sdata, $sbase, $offset$glc$dlc", []> {
158    let BaseClass = baseClass;
159    let SrcClass = srcClass;
160    let PseudoInstr = opName # "_SGPR";
161  }
162}
163
164multiclass SM_Pseudo_Discards<string opName> {
165  def _IMM  : SM_Discard_Pseudo <opName, (ins SReg_64:$sbase, smem_offset:$offset), 1>;
166  def _SGPR : SM_Discard_Pseudo <opName, (ins SReg_64:$sbase, SReg_32:$offset), 0>;
167}
168
169class SM_Time_Pseudo<string opName, SDPatternOperator node = null_frag> : SM_Pseudo<
170  opName, (outs SReg_64_XEXEC:$sdst), (ins),
171  " $sdst", [(set i64:$sdst, (node))]> {
172  let hasSideEffects = 1;
173
174  // FIXME: This should be definitively mayStore = 0. TableGen
175  // brokenly tries to infer these based on the intrinsic properties
176  // corresponding to the IR attributes. The target intrinsics are
177  // considered as writing to memory for IR dependency purposes, but
178  // those can be modeled with hasSideEffects here. These also end up
179  // inferring differently for llvm.readcyclecounter and the amdgcn
180  // intrinsics.
181  let mayStore = ?;
182  let mayLoad = 1;
183  let has_sbase = 0;
184  let has_offset = 0;
185}
186
187class SM_Inval_Pseudo <string opName, SDPatternOperator node = null_frag> : SM_Pseudo<
188  opName, (outs), (ins), "", [(node)]> {
189  let hasSideEffects = 1;
190  let mayStore = 0;
191  let has_sdst = 0;
192  let has_sbase = 0;
193  let has_offset = 0;
194}
195
196multiclass SM_Pseudo_Probe<string opName, RegisterClass baseClass> {
197  def _IMM  : SM_Probe_Pseudo <opName, (ins i8imm:$sdata, baseClass:$sbase, smem_offset:$offset), 1>;
198  def _SGPR : SM_Probe_Pseudo <opName, (ins i8imm:$sdata, baseClass:$sbase, SReg_32:$offset), 0>;
199}
200
201class SM_WaveId_Pseudo<string opName, SDPatternOperator node> : SM_Pseudo<
202  opName, (outs SReg_32_XM0_XEXEC:$sdst), (ins),
203  " $sdst", [(set i32:$sdst, (node))]> {
204  let hasSideEffects = 1;
205  let mayStore = 0;
206  let mayLoad = 1;
207  let has_sbase = 0;
208  let has_offset = 0;
209}
210
211//===----------------------------------------------------------------------===//
212// Scalar Atomic Memory Classes
213//===----------------------------------------------------------------------===//
214
215class SM_Atomic_Pseudo <string opName,
216                        dag outs, dag ins, string asmOps, bit isRet>
217  : SM_Pseudo<opName, outs, ins, asmOps, []> {
218
219  bit glc = isRet;
220
221  let mayLoad = 1;
222  let mayStore = 1;
223  let has_glc = 1;
224  let has_dlc = 1;
225
226  // Should these be set?
227  let ScalarStore = 1;
228  let hasSideEffects = 1;
229  let maybeAtomic = 1;
230}
231
232class SM_Pseudo_Atomic<string opName,
233                       RegisterClass baseClass,
234                       RegisterClass dataClass,
235                       bit isImm,
236                       bit isRet> :
237  SM_Atomic_Pseudo<opName,
238                   !if(isRet, (outs dataClass:$sdst), (outs)),
239                   !if(isImm,
240                       (ins dataClass:$sdata, baseClass:$sbase, smem_offset:$offset, DLC:$dlc),
241                       (ins dataClass:$sdata, baseClass:$sbase, SReg_32:$offset, DLC:$dlc)),
242                   !if(isRet, " $sdst", " $sdata") # ", $sbase, $offset" # !if(isRet, " glc", "") # "$dlc",
243                   isRet> {
244  let offset_is_imm = isImm;
245  let PseudoInstr = opName # !if(isImm,
246                                 !if(isRet, "_IMM_RTN", "_IMM"),
247                                 !if(isRet, "_SGPR_RTN", "_SGPR"));
248
249  let Constraints = !if(isRet, "$sdst = $sdata", "");
250  let DisableEncoding = !if(isRet, "$sdata", "");
251}
252
253multiclass SM_Pseudo_Atomics<string opName,
254                             RegisterClass baseClass,
255                             RegisterClass dataClass> {
256  def _IMM      : SM_Pseudo_Atomic <opName, baseClass, dataClass, 1, 0>;
257  def _SGPR     : SM_Pseudo_Atomic <opName, baseClass, dataClass, 0, 0>;
258  def _IMM_RTN  : SM_Pseudo_Atomic <opName, baseClass, dataClass, 1, 1>;
259  def _SGPR_RTN : SM_Pseudo_Atomic <opName, baseClass, dataClass, 0, 1>;
260}
261
262//===----------------------------------------------------------------------===//
263// Scalar Memory Instructions
264//===----------------------------------------------------------------------===//
265
266// We are using the SReg_32_XM0 and not the SReg_32 register class for 32-bit
267// SMRD instructions, because the SReg_32_XM0 register class does not include M0
268// and writing to M0 from an SMRD instruction will hang the GPU.
269
270// XXX - SMEM instructions do not allow exec for data operand, but
271// does sdst for SMRD on SI/CI?
272defm S_LOAD_DWORD    : SM_Pseudo_Loads <"s_load_dword", SReg_64, SReg_32_XM0_XEXEC>;
273defm S_LOAD_DWORDX2  : SM_Pseudo_Loads <"s_load_dwordx2", SReg_64, SReg_64_XEXEC>;
274defm S_LOAD_DWORDX4  : SM_Pseudo_Loads <"s_load_dwordx4", SReg_64, SReg_128>;
275defm S_LOAD_DWORDX8  : SM_Pseudo_Loads <"s_load_dwordx8", SReg_64, SReg_256>;
276defm S_LOAD_DWORDX16 : SM_Pseudo_Loads <"s_load_dwordx16", SReg_64, SReg_512>;
277
278let is_buffer = 1 in {
279defm S_BUFFER_LOAD_DWORD : SM_Pseudo_Loads <
280  "s_buffer_load_dword", SReg_128, SReg_32_XM0_XEXEC
281>;
282
283// FIXME: exec_lo/exec_hi appear to be allowed for SMRD loads on
284// SI/CI, bit disallowed for SMEM on VI.
285defm S_BUFFER_LOAD_DWORDX2 : SM_Pseudo_Loads <
286  "s_buffer_load_dwordx2", SReg_128, SReg_64_XEXEC
287>;
288
289defm S_BUFFER_LOAD_DWORDX4 : SM_Pseudo_Loads <
290  "s_buffer_load_dwordx4", SReg_128, SReg_128
291>;
292
293defm S_BUFFER_LOAD_DWORDX8 : SM_Pseudo_Loads <
294  "s_buffer_load_dwordx8", SReg_128, SReg_256
295>;
296
297defm S_BUFFER_LOAD_DWORDX16 : SM_Pseudo_Loads <
298  "s_buffer_load_dwordx16", SReg_128, SReg_512
299>;
300}
301
302let SubtargetPredicate = HasScalarStores in {
303defm S_STORE_DWORD : SM_Pseudo_Stores <"s_store_dword", SReg_64, SReg_32_XM0_XEXEC>;
304defm S_STORE_DWORDX2 : SM_Pseudo_Stores <"s_store_dwordx2", SReg_64, SReg_64_XEXEC>;
305defm S_STORE_DWORDX4 : SM_Pseudo_Stores <"s_store_dwordx4", SReg_64, SReg_128>;
306
307let is_buffer = 1 in {
308defm S_BUFFER_STORE_DWORD : SM_Pseudo_Stores <
309  "s_buffer_store_dword", SReg_128, SReg_32_XM0_XEXEC
310>;
311
312defm S_BUFFER_STORE_DWORDX2 : SM_Pseudo_Stores <
313  "s_buffer_store_dwordx2", SReg_128, SReg_64_XEXEC
314>;
315
316defm S_BUFFER_STORE_DWORDX4 : SM_Pseudo_Stores <
317  "s_buffer_store_dwordx4", SReg_128, SReg_128
318>;
319}
320} // End SubtargetPredicate = HasScalarStores
321
322let SubtargetPredicate = HasSMemTimeInst in
323def S_MEMTIME : SM_Time_Pseudo <"s_memtime", int_amdgcn_s_memtime>;
324def S_DCACHE_INV : SM_Inval_Pseudo <"s_dcache_inv", int_amdgcn_s_dcache_inv>;
325
326let SubtargetPredicate = isGFX7GFX8GFX9 in {
327def S_DCACHE_INV_VOL : SM_Inval_Pseudo <"s_dcache_inv_vol", int_amdgcn_s_dcache_inv_vol>;
328} // let SubtargetPredicate = isGFX7GFX8GFX9
329
330let SubtargetPredicate = isGFX8Plus in {
331let OtherPredicates = [HasScalarStores] in {
332def S_DCACHE_WB     : SM_Inval_Pseudo <"s_dcache_wb", int_amdgcn_s_dcache_wb>;
333def S_DCACHE_WB_VOL : SM_Inval_Pseudo <"s_dcache_wb_vol", int_amdgcn_s_dcache_wb_vol>;
334} // End OtherPredicates = [HasScalarStores]
335def S_MEMREALTIME   : SM_Time_Pseudo <"s_memrealtime", int_amdgcn_s_memrealtime>;
336
337defm S_ATC_PROBE        : SM_Pseudo_Probe <"s_atc_probe", SReg_64>;
338let is_buffer = 1 in {
339defm S_ATC_PROBE_BUFFER : SM_Pseudo_Probe <"s_atc_probe_buffer", SReg_128>;
340}
341} // SubtargetPredicate = isGFX8Plus
342
343let SubtargetPredicate = isGFX10Plus in
344def S_GL1_INV : SM_Inval_Pseudo<"s_gl1_inv">;
345let SubtargetPredicate = HasGetWaveIdInst in
346def S_GET_WAVEID_IN_WORKGROUP : SM_WaveId_Pseudo <"s_get_waveid_in_workgroup", int_amdgcn_s_get_waveid_in_workgroup>;
347
348
349let SubtargetPredicate = HasScalarFlatScratchInsts, Uses = [FLAT_SCR] in {
350defm S_SCRATCH_LOAD_DWORD    : SM_Pseudo_Loads <"s_scratch_load_dword",   SReg_64, SReg_32_XM0_XEXEC>;
351defm S_SCRATCH_LOAD_DWORDX2  : SM_Pseudo_Loads <"s_scratch_load_dwordx2", SReg_64, SReg_64_XEXEC>;
352defm S_SCRATCH_LOAD_DWORDX4  : SM_Pseudo_Loads <"s_scratch_load_dwordx4", SReg_64, SReg_128>;
353
354defm S_SCRATCH_STORE_DWORD   : SM_Pseudo_Stores <"s_scratch_store_dword",   SReg_64, SReg_32_XM0_XEXEC>;
355defm S_SCRATCH_STORE_DWORDX2 : SM_Pseudo_Stores <"s_scratch_store_dwordx2", SReg_64, SReg_64_XEXEC>;
356defm S_SCRATCH_STORE_DWORDX4 : SM_Pseudo_Stores <"s_scratch_store_dwordx4", SReg_64, SReg_128>;
357} // SubtargetPredicate = HasScalarFlatScratchInsts
358
359let SubtargetPredicate = HasScalarAtomics in {
360
361let is_buffer = 1 in {
362defm S_BUFFER_ATOMIC_SWAP         : SM_Pseudo_Atomics <"s_buffer_atomic_swap", SReg_128, SReg_32_XM0_XEXEC>;
363defm S_BUFFER_ATOMIC_CMPSWAP      : SM_Pseudo_Atomics <"s_buffer_atomic_cmpswap", SReg_128, SReg_64_XEXEC>;
364defm S_BUFFER_ATOMIC_ADD          : SM_Pseudo_Atomics <"s_buffer_atomic_add", SReg_128, SReg_32_XM0_XEXEC>;
365defm S_BUFFER_ATOMIC_SUB          : SM_Pseudo_Atomics <"s_buffer_atomic_sub", SReg_128, SReg_32_XM0_XEXEC>;
366defm S_BUFFER_ATOMIC_SMIN         : SM_Pseudo_Atomics <"s_buffer_atomic_smin", SReg_128, SReg_32_XM0_XEXEC>;
367defm S_BUFFER_ATOMIC_UMIN         : SM_Pseudo_Atomics <"s_buffer_atomic_umin", SReg_128, SReg_32_XM0_XEXEC>;
368defm S_BUFFER_ATOMIC_SMAX         : SM_Pseudo_Atomics <"s_buffer_atomic_smax", SReg_128, SReg_32_XM0_XEXEC>;
369defm S_BUFFER_ATOMIC_UMAX         : SM_Pseudo_Atomics <"s_buffer_atomic_umax", SReg_128, SReg_32_XM0_XEXEC>;
370defm S_BUFFER_ATOMIC_AND          : SM_Pseudo_Atomics <"s_buffer_atomic_and", SReg_128, SReg_32_XM0_XEXEC>;
371defm S_BUFFER_ATOMIC_OR           : SM_Pseudo_Atomics <"s_buffer_atomic_or", SReg_128, SReg_32_XM0_XEXEC>;
372defm S_BUFFER_ATOMIC_XOR          : SM_Pseudo_Atomics <"s_buffer_atomic_xor", SReg_128, SReg_32_XM0_XEXEC>;
373defm S_BUFFER_ATOMIC_INC          : SM_Pseudo_Atomics <"s_buffer_atomic_inc", SReg_128, SReg_32_XM0_XEXEC>;
374defm S_BUFFER_ATOMIC_DEC          : SM_Pseudo_Atomics <"s_buffer_atomic_dec", SReg_128, SReg_32_XM0_XEXEC>;
375
376defm S_BUFFER_ATOMIC_SWAP_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_swap_x2", SReg_128, SReg_64_XEXEC>;
377defm S_BUFFER_ATOMIC_CMPSWAP_X2   : SM_Pseudo_Atomics <"s_buffer_atomic_cmpswap_x2", SReg_128, SReg_128>;
378defm S_BUFFER_ATOMIC_ADD_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_add_x2", SReg_128, SReg_64_XEXEC>;
379defm S_BUFFER_ATOMIC_SUB_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_sub_x2", SReg_128, SReg_64_XEXEC>;
380defm S_BUFFER_ATOMIC_SMIN_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_smin_x2", SReg_128, SReg_64_XEXEC>;
381defm S_BUFFER_ATOMIC_UMIN_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_umin_x2", SReg_128, SReg_64_XEXEC>;
382defm S_BUFFER_ATOMIC_SMAX_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_smax_x2", SReg_128, SReg_64_XEXEC>;
383defm S_BUFFER_ATOMIC_UMAX_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_umax_x2", SReg_128, SReg_64_XEXEC>;
384defm S_BUFFER_ATOMIC_AND_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_and_x2", SReg_128, SReg_64_XEXEC>;
385defm S_BUFFER_ATOMIC_OR_X2        : SM_Pseudo_Atomics <"s_buffer_atomic_or_x2", SReg_128, SReg_64_XEXEC>;
386defm S_BUFFER_ATOMIC_XOR_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_xor_x2", SReg_128, SReg_64_XEXEC>;
387defm S_BUFFER_ATOMIC_INC_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_inc_x2", SReg_128, SReg_64_XEXEC>;
388defm S_BUFFER_ATOMIC_DEC_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_dec_x2", SReg_128, SReg_64_XEXEC>;
389}
390
391defm S_ATOMIC_SWAP                : SM_Pseudo_Atomics <"s_atomic_swap", SReg_64, SReg_32_XM0_XEXEC>;
392defm S_ATOMIC_CMPSWAP             : SM_Pseudo_Atomics <"s_atomic_cmpswap", SReg_64, SReg_64_XEXEC>;
393defm S_ATOMIC_ADD                 : SM_Pseudo_Atomics <"s_atomic_add", SReg_64, SReg_32_XM0_XEXEC>;
394defm S_ATOMIC_SUB                 : SM_Pseudo_Atomics <"s_atomic_sub", SReg_64, SReg_32_XM0_XEXEC>;
395defm S_ATOMIC_SMIN                : SM_Pseudo_Atomics <"s_atomic_smin", SReg_64, SReg_32_XM0_XEXEC>;
396defm S_ATOMIC_UMIN                : SM_Pseudo_Atomics <"s_atomic_umin", SReg_64, SReg_32_XM0_XEXEC>;
397defm S_ATOMIC_SMAX                : SM_Pseudo_Atomics <"s_atomic_smax", SReg_64, SReg_32_XM0_XEXEC>;
398defm S_ATOMIC_UMAX                : SM_Pseudo_Atomics <"s_atomic_umax", SReg_64, SReg_32_XM0_XEXEC>;
399defm S_ATOMIC_AND                 : SM_Pseudo_Atomics <"s_atomic_and", SReg_64, SReg_32_XM0_XEXEC>;
400defm S_ATOMIC_OR                  : SM_Pseudo_Atomics <"s_atomic_or", SReg_64, SReg_32_XM0_XEXEC>;
401defm S_ATOMIC_XOR                 : SM_Pseudo_Atomics <"s_atomic_xor", SReg_64, SReg_32_XM0_XEXEC>;
402defm S_ATOMIC_INC                 : SM_Pseudo_Atomics <"s_atomic_inc", SReg_64, SReg_32_XM0_XEXEC>;
403defm S_ATOMIC_DEC                 : SM_Pseudo_Atomics <"s_atomic_dec", SReg_64, SReg_32_XM0_XEXEC>;
404
405defm S_ATOMIC_SWAP_X2             : SM_Pseudo_Atomics <"s_atomic_swap_x2", SReg_64, SReg_64_XEXEC>;
406defm S_ATOMIC_CMPSWAP_X2          : SM_Pseudo_Atomics <"s_atomic_cmpswap_x2", SReg_64, SReg_128>;
407defm S_ATOMIC_ADD_X2              : SM_Pseudo_Atomics <"s_atomic_add_x2", SReg_64, SReg_64_XEXEC>;
408defm S_ATOMIC_SUB_X2              : SM_Pseudo_Atomics <"s_atomic_sub_x2", SReg_64, SReg_64_XEXEC>;
409defm S_ATOMIC_SMIN_X2             : SM_Pseudo_Atomics <"s_atomic_smin_x2", SReg_64, SReg_64_XEXEC>;
410defm S_ATOMIC_UMIN_X2             : SM_Pseudo_Atomics <"s_atomic_umin_x2", SReg_64, SReg_64_XEXEC>;
411defm S_ATOMIC_SMAX_X2             : SM_Pseudo_Atomics <"s_atomic_smax_x2", SReg_64, SReg_64_XEXEC>;
412defm S_ATOMIC_UMAX_X2             : SM_Pseudo_Atomics <"s_atomic_umax_x2", SReg_64, SReg_64_XEXEC>;
413defm S_ATOMIC_AND_X2              : SM_Pseudo_Atomics <"s_atomic_and_x2", SReg_64, SReg_64_XEXEC>;
414defm S_ATOMIC_OR_X2               : SM_Pseudo_Atomics <"s_atomic_or_x2", SReg_64, SReg_64_XEXEC>;
415defm S_ATOMIC_XOR_X2              : SM_Pseudo_Atomics <"s_atomic_xor_x2", SReg_64, SReg_64_XEXEC>;
416defm S_ATOMIC_INC_X2              : SM_Pseudo_Atomics <"s_atomic_inc_x2", SReg_64, SReg_64_XEXEC>;
417defm S_ATOMIC_DEC_X2              : SM_Pseudo_Atomics <"s_atomic_dec_x2", SReg_64, SReg_64_XEXEC>;
418
419} // let SubtargetPredicate = HasScalarAtomics
420
421let SubtargetPredicate = HasScalarAtomics in {
422defm S_DCACHE_DISCARD    : SM_Pseudo_Discards <"s_dcache_discard">;
423defm S_DCACHE_DISCARD_X2 : SM_Pseudo_Discards <"s_dcache_discard_x2">;
424}
425
426//===----------------------------------------------------------------------===//
427// Targets
428//===----------------------------------------------------------------------===//
429
430//===----------------------------------------------------------------------===//
431// SI
432//===----------------------------------------------------------------------===//
433
434class SMRD_Real_si <bits<5> op, SM_Pseudo ps>
435  : SM_Real<ps>
436  , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
437  , Enc32 {
438
439  let AssemblerPredicate = isGFX6GFX7;
440  let DecoderNamespace = "GFX6GFX7";
441
442  let Inst{7-0}   = !if(ps.has_offset, offset{7-0}, ?);
443  let Inst{8}     = imm;
444  let Inst{14-9}  = !if(ps.has_sbase, sbase{6-1}, ?);
445  let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
446  let Inst{26-22} = op;
447  let Inst{31-27} = 0x18; //encoding
448}
449
450// FIXME: Assembler should reject trying to use glc on SMRD
451// instructions on SI.
452multiclass SM_Real_Loads_si<bits<5> op, string ps,
453                            SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
454                            SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
455
456  def _IMM_si : SMRD_Real_si <op, immPs> {
457    let InOperandList = (ins immPs.BaseClass:$sbase, smrd_offset_8:$offset, GLC:$glc, DLC:$dlc);
458  }
459
460  // FIXME: The operand name $offset is inconsistent with $soff used
461  // in the pseudo
462  def _SGPR_si : SMRD_Real_si <op, sgprPs> {
463    let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc, DLC:$dlc);
464  }
465
466}
467
468defm S_LOAD_DWORD           : SM_Real_Loads_si <0x00, "S_LOAD_DWORD">;
469defm S_LOAD_DWORDX2         : SM_Real_Loads_si <0x01, "S_LOAD_DWORDX2">;
470defm S_LOAD_DWORDX4         : SM_Real_Loads_si <0x02, "S_LOAD_DWORDX4">;
471defm S_LOAD_DWORDX8         : SM_Real_Loads_si <0x03, "S_LOAD_DWORDX8">;
472defm S_LOAD_DWORDX16        : SM_Real_Loads_si <0x04, "S_LOAD_DWORDX16">;
473defm S_BUFFER_LOAD_DWORD    : SM_Real_Loads_si <0x08, "S_BUFFER_LOAD_DWORD">;
474defm S_BUFFER_LOAD_DWORDX2  : SM_Real_Loads_si <0x09, "S_BUFFER_LOAD_DWORDX2">;
475defm S_BUFFER_LOAD_DWORDX4  : SM_Real_Loads_si <0x0a, "S_BUFFER_LOAD_DWORDX4">;
476defm S_BUFFER_LOAD_DWORDX8  : SM_Real_Loads_si <0x0b, "S_BUFFER_LOAD_DWORDX8">;
477defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_si <0x0c, "S_BUFFER_LOAD_DWORDX16">;
478
479def S_MEMTIME_si    : SMRD_Real_si <0x1e, S_MEMTIME>;
480def S_DCACHE_INV_si : SMRD_Real_si <0x1f, S_DCACHE_INV>;
481
482
483//===----------------------------------------------------------------------===//
484// VI
485//===----------------------------------------------------------------------===//
486
487class SMEM_Real_vi <bits<8> op, SM_Pseudo ps>
488  : SM_Real<ps>
489  , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.VI>
490  , Enc64 {
491  bit glc;
492
493  let AssemblerPredicate = isGFX8GFX9;
494  let DecoderNamespace = "GFX8";
495
496  let Inst{5-0}   = !if(ps.has_sbase, sbase{6-1}, ?);
497  let Inst{12-6}  = !if(ps.has_sdst, sdst{6-0}, ?);
498
499  let Inst{16} = !if(ps.has_glc, glc, ?);
500  let Inst{17} = imm;
501  let Inst{25-18} = op;
502  let Inst{31-26} = 0x30; //encoding
503
504  // VI supports 20-bit unsigned offsets while GFX9+ supports 21-bit signed.
505  // Offset value is corrected accordingly when offset is encoded/decoded.
506  let Inst{52-32} = !if(ps.has_offset, offset{20-0}, ?);
507}
508
509multiclass SM_Real_Loads_vi<bits<8> op, string ps,
510                            SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
511                            SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
512  def _IMM_vi : SMEM_Real_vi <op, immPs> {
513    let InOperandList = (ins immPs.BaseClass:$sbase, smem_offset:$offset, GLC:$glc, DLC:$dlc);
514  }
515  def _SGPR_vi : SMEM_Real_vi <op, sgprPs> {
516    let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc, DLC:$dlc);
517  }
518}
519
520class SMEM_Real_Store_vi <bits<8> op, SM_Pseudo ps> : SMEM_Real_vi <op, ps> {
521  // encoding
522  bits<7> sdata;
523
524  let sdst = ?;
525  let Inst{12-6}  = !if(ps.has_sdst, sdata{6-0}, ?);
526}
527
528multiclass SM_Real_Stores_vi<bits<8> op, string ps,
529                            SM_Store_Pseudo immPs = !cast<SM_Store_Pseudo>(ps#_IMM),
530                            SM_Store_Pseudo sgprPs = !cast<SM_Store_Pseudo>(ps#_SGPR)> {
531  // FIXME: The operand name $offset is inconsistent with $soff used
532  // in the pseudo
533  def _IMM_vi : SMEM_Real_Store_vi <op, immPs> {
534    let InOperandList = (ins immPs.SrcClass:$sdata, immPs.BaseClass:$sbase, smem_offset:$offset, GLC:$glc, DLC:$dlc);
535  }
536
537  def _SGPR_vi : SMEM_Real_Store_vi <op, sgprPs> {
538    let InOperandList = (ins sgprPs.SrcClass:$sdata, sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc, DLC:$dlc);
539  }
540}
541
542multiclass SM_Real_Probe_vi<bits<8> op, string ps> {
543  def _IMM_vi  : SMEM_Real_Store_vi <op, !cast<SM_Probe_Pseudo>(ps#_IMM)>;
544  def _SGPR_vi : SMEM_Real_Store_vi <op, !cast<SM_Probe_Pseudo>(ps#_SGPR)>;
545}
546
547defm S_LOAD_DWORD           : SM_Real_Loads_vi <0x00, "S_LOAD_DWORD">;
548defm S_LOAD_DWORDX2         : SM_Real_Loads_vi <0x01, "S_LOAD_DWORDX2">;
549defm S_LOAD_DWORDX4         : SM_Real_Loads_vi <0x02, "S_LOAD_DWORDX4">;
550defm S_LOAD_DWORDX8         : SM_Real_Loads_vi <0x03, "S_LOAD_DWORDX8">;
551defm S_LOAD_DWORDX16        : SM_Real_Loads_vi <0x04, "S_LOAD_DWORDX16">;
552defm S_BUFFER_LOAD_DWORD    : SM_Real_Loads_vi <0x08, "S_BUFFER_LOAD_DWORD">;
553defm S_BUFFER_LOAD_DWORDX2  : SM_Real_Loads_vi <0x09, "S_BUFFER_LOAD_DWORDX2">;
554defm S_BUFFER_LOAD_DWORDX4  : SM_Real_Loads_vi <0x0a, "S_BUFFER_LOAD_DWORDX4">;
555defm S_BUFFER_LOAD_DWORDX8  : SM_Real_Loads_vi <0x0b, "S_BUFFER_LOAD_DWORDX8">;
556defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_vi <0x0c, "S_BUFFER_LOAD_DWORDX16">;
557
558defm S_STORE_DWORD : SM_Real_Stores_vi <0x10, "S_STORE_DWORD">;
559defm S_STORE_DWORDX2 : SM_Real_Stores_vi <0x11, "S_STORE_DWORDX2">;
560defm S_STORE_DWORDX4 : SM_Real_Stores_vi <0x12, "S_STORE_DWORDX4">;
561
562defm S_BUFFER_STORE_DWORD    : SM_Real_Stores_vi <0x18, "S_BUFFER_STORE_DWORD">;
563defm S_BUFFER_STORE_DWORDX2  : SM_Real_Stores_vi <0x19, "S_BUFFER_STORE_DWORDX2">;
564defm S_BUFFER_STORE_DWORDX4  : SM_Real_Stores_vi <0x1a, "S_BUFFER_STORE_DWORDX4">;
565
566// These instructions use same encoding
567def S_DCACHE_INV_vi         : SMEM_Real_vi <0x20, S_DCACHE_INV>;
568def S_DCACHE_WB_vi          : SMEM_Real_vi <0x21, S_DCACHE_WB>;
569def S_DCACHE_INV_VOL_vi     : SMEM_Real_vi <0x22, S_DCACHE_INV_VOL>;
570def S_DCACHE_WB_VOL_vi      : SMEM_Real_vi <0x23, S_DCACHE_WB_VOL>;
571def S_MEMTIME_vi            : SMEM_Real_vi <0x24, S_MEMTIME>;
572def S_MEMREALTIME_vi        : SMEM_Real_vi <0x25, S_MEMREALTIME>;
573
574defm S_SCRATCH_LOAD_DWORD    : SM_Real_Loads_vi <0x05, "S_SCRATCH_LOAD_DWORD">;
575defm S_SCRATCH_LOAD_DWORDX2  : SM_Real_Loads_vi <0x06, "S_SCRATCH_LOAD_DWORDX2">;
576defm S_SCRATCH_LOAD_DWORDX4  : SM_Real_Loads_vi <0x07, "S_SCRATCH_LOAD_DWORDX4">;
577
578defm S_SCRATCH_STORE_DWORD   : SM_Real_Stores_vi <0x15, "S_SCRATCH_STORE_DWORD">;
579defm S_SCRATCH_STORE_DWORDX2 : SM_Real_Stores_vi <0x16, "S_SCRATCH_STORE_DWORDX2">;
580defm S_SCRATCH_STORE_DWORDX4 : SM_Real_Stores_vi <0x17, "S_SCRATCH_STORE_DWORDX4">;
581
582defm S_ATC_PROBE        : SM_Real_Probe_vi <0x26, "S_ATC_PROBE">;
583defm S_ATC_PROBE_BUFFER : SM_Real_Probe_vi <0x27, "S_ATC_PROBE_BUFFER">;
584
585//===----------------------------------------------------------------------===//
586// GFX9
587//===----------------------------------------------------------------------===//
588
589class SMEM_Atomic_Real_vi <bits<8> op, SM_Atomic_Pseudo ps>
590  : SMEM_Real_vi <op, ps> {
591
592  bits<7> sdata;
593
594  let Constraints = ps.Constraints;
595  let DisableEncoding = ps.DisableEncoding;
596
597  let glc = ps.glc;
598  let Inst{12-6} = !if(glc, sdst{6-0}, sdata{6-0});
599}
600
601multiclass SM_Real_Atomics_vi<bits<8> op, string ps> {
602  def _IMM_vi       : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_IMM)>;
603  def _SGPR_vi      : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR)>;
604  def _IMM_RTN_vi   : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_IMM_RTN)>;
605  def _SGPR_RTN_vi  : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR_RTN)>;
606}
607
608defm S_BUFFER_ATOMIC_SWAP         : SM_Real_Atomics_vi <0x40, "S_BUFFER_ATOMIC_SWAP">;
609defm S_BUFFER_ATOMIC_CMPSWAP      : SM_Real_Atomics_vi <0x41, "S_BUFFER_ATOMIC_CMPSWAP">;
610defm S_BUFFER_ATOMIC_ADD          : SM_Real_Atomics_vi <0x42, "S_BUFFER_ATOMIC_ADD">;
611defm S_BUFFER_ATOMIC_SUB          : SM_Real_Atomics_vi <0x43, "S_BUFFER_ATOMIC_SUB">;
612defm S_BUFFER_ATOMIC_SMIN         : SM_Real_Atomics_vi <0x44, "S_BUFFER_ATOMIC_SMIN">;
613defm S_BUFFER_ATOMIC_UMIN         : SM_Real_Atomics_vi <0x45, "S_BUFFER_ATOMIC_UMIN">;
614defm S_BUFFER_ATOMIC_SMAX         : SM_Real_Atomics_vi <0x46, "S_BUFFER_ATOMIC_SMAX">;
615defm S_BUFFER_ATOMIC_UMAX         : SM_Real_Atomics_vi <0x47, "S_BUFFER_ATOMIC_UMAX">;
616defm S_BUFFER_ATOMIC_AND          : SM_Real_Atomics_vi <0x48, "S_BUFFER_ATOMIC_AND">;
617defm S_BUFFER_ATOMIC_OR           : SM_Real_Atomics_vi <0x49, "S_BUFFER_ATOMIC_OR">;
618defm S_BUFFER_ATOMIC_XOR          : SM_Real_Atomics_vi <0x4a, "S_BUFFER_ATOMIC_XOR">;
619defm S_BUFFER_ATOMIC_INC          : SM_Real_Atomics_vi <0x4b, "S_BUFFER_ATOMIC_INC">;
620defm S_BUFFER_ATOMIC_DEC          : SM_Real_Atomics_vi <0x4c, "S_BUFFER_ATOMIC_DEC">;
621
622defm S_BUFFER_ATOMIC_SWAP_X2      : SM_Real_Atomics_vi <0x60, "S_BUFFER_ATOMIC_SWAP_X2">;
623defm S_BUFFER_ATOMIC_CMPSWAP_X2   : SM_Real_Atomics_vi <0x61, "S_BUFFER_ATOMIC_CMPSWAP_X2">;
624defm S_BUFFER_ATOMIC_ADD_X2       : SM_Real_Atomics_vi <0x62, "S_BUFFER_ATOMIC_ADD_X2">;
625defm S_BUFFER_ATOMIC_SUB_X2       : SM_Real_Atomics_vi <0x63, "S_BUFFER_ATOMIC_SUB_X2">;
626defm S_BUFFER_ATOMIC_SMIN_X2      : SM_Real_Atomics_vi <0x64, "S_BUFFER_ATOMIC_SMIN_X2">;
627defm S_BUFFER_ATOMIC_UMIN_X2      : SM_Real_Atomics_vi <0x65, "S_BUFFER_ATOMIC_UMIN_X2">;
628defm S_BUFFER_ATOMIC_SMAX_X2      : SM_Real_Atomics_vi <0x66, "S_BUFFER_ATOMIC_SMAX_X2">;
629defm S_BUFFER_ATOMIC_UMAX_X2      : SM_Real_Atomics_vi <0x67, "S_BUFFER_ATOMIC_UMAX_X2">;
630defm S_BUFFER_ATOMIC_AND_X2       : SM_Real_Atomics_vi <0x68, "S_BUFFER_ATOMIC_AND_X2">;
631defm S_BUFFER_ATOMIC_OR_X2        : SM_Real_Atomics_vi <0x69, "S_BUFFER_ATOMIC_OR_X2">;
632defm S_BUFFER_ATOMIC_XOR_X2       : SM_Real_Atomics_vi <0x6a, "S_BUFFER_ATOMIC_XOR_X2">;
633defm S_BUFFER_ATOMIC_INC_X2       : SM_Real_Atomics_vi <0x6b, "S_BUFFER_ATOMIC_INC_X2">;
634defm S_BUFFER_ATOMIC_DEC_X2       : SM_Real_Atomics_vi <0x6c, "S_BUFFER_ATOMIC_DEC_X2">;
635
636defm S_ATOMIC_SWAP                : SM_Real_Atomics_vi <0x80, "S_ATOMIC_SWAP">;
637defm S_ATOMIC_CMPSWAP             : SM_Real_Atomics_vi <0x81, "S_ATOMIC_CMPSWAP">;
638defm S_ATOMIC_ADD                 : SM_Real_Atomics_vi <0x82, "S_ATOMIC_ADD">;
639defm S_ATOMIC_SUB                 : SM_Real_Atomics_vi <0x83, "S_ATOMIC_SUB">;
640defm S_ATOMIC_SMIN                : SM_Real_Atomics_vi <0x84, "S_ATOMIC_SMIN">;
641defm S_ATOMIC_UMIN                : SM_Real_Atomics_vi <0x85, "S_ATOMIC_UMIN">;
642defm S_ATOMIC_SMAX                : SM_Real_Atomics_vi <0x86, "S_ATOMIC_SMAX">;
643defm S_ATOMIC_UMAX                : SM_Real_Atomics_vi <0x87, "S_ATOMIC_UMAX">;
644defm S_ATOMIC_AND                 : SM_Real_Atomics_vi <0x88, "S_ATOMIC_AND">;
645defm S_ATOMIC_OR                  : SM_Real_Atomics_vi <0x89, "S_ATOMIC_OR">;
646defm S_ATOMIC_XOR                 : SM_Real_Atomics_vi <0x8a, "S_ATOMIC_XOR">;
647defm S_ATOMIC_INC                 : SM_Real_Atomics_vi <0x8b, "S_ATOMIC_INC">;
648defm S_ATOMIC_DEC                 : SM_Real_Atomics_vi <0x8c, "S_ATOMIC_DEC">;
649
650defm S_ATOMIC_SWAP_X2             : SM_Real_Atomics_vi <0xa0, "S_ATOMIC_SWAP_X2">;
651defm S_ATOMIC_CMPSWAP_X2          : SM_Real_Atomics_vi <0xa1, "S_ATOMIC_CMPSWAP_X2">;
652defm S_ATOMIC_ADD_X2              : SM_Real_Atomics_vi <0xa2, "S_ATOMIC_ADD_X2">;
653defm S_ATOMIC_SUB_X2              : SM_Real_Atomics_vi <0xa3, "S_ATOMIC_SUB_X2">;
654defm S_ATOMIC_SMIN_X2             : SM_Real_Atomics_vi <0xa4, "S_ATOMIC_SMIN_X2">;
655defm S_ATOMIC_UMIN_X2             : SM_Real_Atomics_vi <0xa5, "S_ATOMIC_UMIN_X2">;
656defm S_ATOMIC_SMAX_X2             : SM_Real_Atomics_vi <0xa6, "S_ATOMIC_SMAX_X2">;
657defm S_ATOMIC_UMAX_X2             : SM_Real_Atomics_vi <0xa7, "S_ATOMIC_UMAX_X2">;
658defm S_ATOMIC_AND_X2              : SM_Real_Atomics_vi <0xa8, "S_ATOMIC_AND_X2">;
659defm S_ATOMIC_OR_X2               : SM_Real_Atomics_vi <0xa9, "S_ATOMIC_OR_X2">;
660defm S_ATOMIC_XOR_X2              : SM_Real_Atomics_vi <0xaa, "S_ATOMIC_XOR_X2">;
661defm S_ATOMIC_INC_X2              : SM_Real_Atomics_vi <0xab, "S_ATOMIC_INC_X2">;
662defm S_ATOMIC_DEC_X2              : SM_Real_Atomics_vi <0xac, "S_ATOMIC_DEC_X2">;
663
664multiclass SM_Real_Discard_vi<bits<8> op, string ps> {
665  def _IMM_vi  : SMEM_Real_vi <op, !cast<SM_Discard_Pseudo>(ps#_IMM)>;
666  def _SGPR_vi : SMEM_Real_vi <op, !cast<SM_Discard_Pseudo>(ps#_SGPR)>;
667}
668
669defm S_DCACHE_DISCARD    : SM_Real_Discard_vi <0x28, "S_DCACHE_DISCARD">;
670defm S_DCACHE_DISCARD_X2 : SM_Real_Discard_vi <0x29, "S_DCACHE_DISCARD_X2">;
671
672//===----------------------------------------------------------------------===//
673// CI
674//===----------------------------------------------------------------------===//
675
676def smrd_literal_offset : NamedOperandU32<"SMRDLiteralOffset",
677                                          NamedMatchClass<"SMRDLiteralOffset">> {
678  let OperandType = "OPERAND_IMMEDIATE";
679}
680
681class SMRD_Real_Load_IMM_ci <bits<5> op, SM_Load_Pseudo ps> :
682  SM_Real<ps>,
683  Enc64 {
684
685  let AssemblerPredicate = isGFX7Only;
686  let DecoderNamespace = "GFX7";
687  let InOperandList = (ins ps.BaseClass:$sbase, smrd_literal_offset:$offset, GLC:$glc, DLC:$dlc);
688
689  let LGKM_CNT = ps.LGKM_CNT;
690  let mayLoad = ps.mayLoad;
691  let mayStore = ps.mayStore;
692  let hasSideEffects = ps.hasSideEffects;
693  let SchedRW = ps.SchedRW;
694
695  let Inst{7-0}   = 0xff;
696  let Inst{8}     = 0;
697  let Inst{14-9}  = sbase{6-1};
698  let Inst{21-15} = sdst{6-0};
699  let Inst{26-22} = op;
700  let Inst{31-27} = 0x18; //encoding
701  let Inst{63-32} = offset{31-0};
702}
703
704def S_LOAD_DWORD_IMM_ci           : SMRD_Real_Load_IMM_ci <0x00, S_LOAD_DWORD_IMM>;
705def S_LOAD_DWORDX2_IMM_ci         : SMRD_Real_Load_IMM_ci <0x01, S_LOAD_DWORDX2_IMM>;
706def S_LOAD_DWORDX4_IMM_ci         : SMRD_Real_Load_IMM_ci <0x02, S_LOAD_DWORDX4_IMM>;
707def S_LOAD_DWORDX8_IMM_ci         : SMRD_Real_Load_IMM_ci <0x03, S_LOAD_DWORDX8_IMM>;
708def S_LOAD_DWORDX16_IMM_ci        : SMRD_Real_Load_IMM_ci <0x04, S_LOAD_DWORDX16_IMM>;
709def S_BUFFER_LOAD_DWORD_IMM_ci    : SMRD_Real_Load_IMM_ci <0x08, S_BUFFER_LOAD_DWORD_IMM>;
710def S_BUFFER_LOAD_DWORDX2_IMM_ci  : SMRD_Real_Load_IMM_ci <0x09, S_BUFFER_LOAD_DWORDX2_IMM>;
711def S_BUFFER_LOAD_DWORDX4_IMM_ci  : SMRD_Real_Load_IMM_ci <0x0a, S_BUFFER_LOAD_DWORDX4_IMM>;
712def S_BUFFER_LOAD_DWORDX8_IMM_ci  : SMRD_Real_Load_IMM_ci <0x0b, S_BUFFER_LOAD_DWORDX8_IMM>;
713def S_BUFFER_LOAD_DWORDX16_IMM_ci : SMRD_Real_Load_IMM_ci <0x0c, S_BUFFER_LOAD_DWORDX16_IMM>;
714
715class SMRD_Real_ci <bits<5> op, SM_Pseudo ps>
716  : SM_Real<ps>
717  , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
718  , Enc32 {
719
720  let AssemblerPredicate = isGFX7Only;
721  let DecoderNamespace = "GFX7";
722
723  let Inst{7-0}   = !if(ps.has_offset, offset{7-0}, ?);
724  let Inst{8}     = imm;
725  let Inst{14-9}  = !if(ps.has_sbase, sbase{6-1}, ?);
726  let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
727  let Inst{26-22} = op;
728  let Inst{31-27} = 0x18; //encoding
729}
730
731def S_DCACHE_INV_VOL_ci : SMRD_Real_ci <0x1d, S_DCACHE_INV_VOL>;
732
733//===----------------------------------------------------------------------===//
734// Scalar Memory Patterns
735//===----------------------------------------------------------------------===//
736
737def smrd_load : PatFrag <(ops node:$ptr), (load node:$ptr), [{ return isUniformLoad(N);}]> {
738  let GISelPredicateCode = [{
739    if (!MI.hasOneMemOperand())
740      return false;
741    if (!isInstrUniform(MI))
742      return false;
743
744    // FIXME: We should probably be caching this.
745    SmallVector<GEPInfo, 4> AddrInfo;
746    getAddrModeInfo(MI, MRI, AddrInfo);
747
748    if (hasVgprParts(AddrInfo))
749      return false;
750    return true;
751  }];
752}
753
754def SMRDImm         : ComplexPattern<i64, 2, "SelectSMRDImm">;
755def SMRDImm32       : ComplexPattern<i64, 2, "SelectSMRDImm32">;
756def SMRDSgpr        : ComplexPattern<i64, 2, "SelectSMRDSgpr">;
757def SMRDBufferImm   : ComplexPattern<i32, 1, "SelectSMRDBufferImm">;
758def SMRDBufferImm32 : ComplexPattern<i32, 1, "SelectSMRDBufferImm32">;
759
760multiclass SMRD_Pattern <string Instr, ValueType vt> {
761
762  // 1. IMM offset
763  def : GCNPat <
764    (smrd_load (SMRDImm i64:$sbase, i32:$offset)),
765    (vt (!cast<SM_Pseudo>(Instr#"_IMM") $sbase, $offset, 0, 0))
766  >;
767
768  // 2. 32-bit IMM offset on CI
769  def : GCNPat <
770    (smrd_load (SMRDImm32 i64:$sbase, i32:$offset)),
771    (vt (!cast<InstSI>(Instr#"_IMM_ci") $sbase, $offset, 0, 0))> {
772    let OtherPredicates = [isGFX7Only];
773  }
774
775  // 3. SGPR offset
776  def : GCNPat <
777    (smrd_load (SMRDSgpr i64:$sbase, i32:$offset)),
778    (vt (!cast<SM_Pseudo>(Instr#"_SGPR") $sbase, $offset, 0, 0))
779  >;
780
781  // 4. No offset
782  def : GCNPat <
783    (vt (smrd_load (i64 SReg_64:$sbase))),
784    (vt (!cast<SM_Pseudo>(Instr#"_IMM") i64:$sbase, 0, 0, 0))
785  >;
786}
787
788multiclass SMLoad_Pattern <string Instr, ValueType vt> {
789  // 1. Offset as an immediate
790  def : GCNPat <
791    (SIsbuffer_load v4i32:$sbase, (SMRDBufferImm i32:$offset), timm:$cachepolicy),
792    (vt (!cast<SM_Pseudo>(Instr#"_IMM") SReg_128:$sbase, i32imm:$offset, (extract_glc $cachepolicy),
793                                        (extract_dlc $cachepolicy)))> {
794    let AddedComplexity = 2;
795  }
796
797  // 2. 32-bit IMM offset on CI
798  def : GCNPat <
799    (vt (SIsbuffer_load v4i32:$sbase, (SMRDBufferImm32 i32:$offset), timm:$cachepolicy)),
800    (!cast<InstSI>(Instr#"_IMM_ci") SReg_128:$sbase, smrd_literal_offset:$offset,
801                                    (extract_glc $cachepolicy), (extract_dlc $cachepolicy))> {
802    let OtherPredicates = [isGFX7Only];
803    let AddedComplexity = 1;
804  }
805
806  // 3. Offset loaded in an 32bit SGPR
807  def : GCNPat <
808    (SIsbuffer_load v4i32:$sbase, i32:$offset, timm:$cachepolicy),
809    (vt (!cast<SM_Pseudo>(Instr#"_SGPR") SReg_128:$sbase, SReg_32:$offset, (extract_glc $cachepolicy),
810                                         (extract_dlc $cachepolicy)))
811  >;
812}
813
814// Global and constant loads can be selected to either MUBUF or SMRD
815// instructions, but SMRD instructions are faster so we want the instruction
816// selector to prefer those.
817let AddedComplexity = 100 in {
818
819foreach vt = Reg32Types.types in {
820defm : SMRD_Pattern <"S_LOAD_DWORD", vt>;
821}
822
823foreach vt = SReg_64.RegTypes in {
824defm : SMRD_Pattern <"S_LOAD_DWORDX2", vt>;
825}
826
827foreach vt = SReg_128.RegTypes in {
828defm : SMRD_Pattern <"S_LOAD_DWORDX4", vt>;
829}
830
831foreach vt = SReg_256.RegTypes in {
832defm : SMRD_Pattern <"S_LOAD_DWORDX8", vt>;
833}
834
835foreach vt = SReg_512.RegTypes in {
836defm : SMRD_Pattern <"S_LOAD_DWORDX16", vt>;
837}
838
839defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORD",     i32>;
840defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX2",   v2i32>;
841defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX4",   v4i32>;
842defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX8",   v8i32>;
843defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX16",  v16i32>;
844
845defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORD",     f32>;
846defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX2",   v2f32>;
847defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX4",   v4f32>;
848defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX8",   v8f32>;
849defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX16",  v16f32>;
850} // End let AddedComplexity = 100
851
852let OtherPredicates = [HasSMemTimeInst] in {
853def : GCNPat <
854  (i64 (readcyclecounter)),
855  (S_MEMTIME)
856>;
857} // let OtherPredicates = [HasSMemTimeInst]
858
859let OtherPredicates = [HasNoSMemTimeInst] in {
860def : GCNPat <
861  (i64 (readcyclecounter)),
862  (REG_SEQUENCE SReg_64,
863    (S_GETREG_B32 getHwRegImm<HWREG.SHADER_CYCLES, 0, -12>.ret), sub0,
864    (S_MOV_B32 (i32 0)), sub1)
865>;
866} // let OtherPredicates = [HasNoSMemTimeInst]
867
868//===----------------------------------------------------------------------===//
869// GFX10.
870//===----------------------------------------------------------------------===//
871
872class SMEM_Real_gfx10<bits<8> op, SM_Pseudo ps> :
873    SM_Real<ps>, SIMCInstr<ps.PseudoInstr, SIEncodingFamily.GFX10>, Enc64 {
874  bit glc;
875  bit dlc;
876
877  let AssemblerPredicate = isGFX10Plus;
878  let DecoderNamespace = "GFX10";
879
880  let Inst{5-0}   = !if(ps.has_sbase, sbase{6-1}, ?);
881  let Inst{12-6}  = !if(ps.has_sdst, sdst{6-0}, ?);
882  let Inst{14}    = !if(ps.has_dlc, dlc, ?);
883  let Inst{16}    = !if(ps.has_glc, glc, ?);
884  let Inst{25-18} = op;
885  let Inst{31-26} = 0x3d;
886  let Inst{52-32} = !if(ps.offset_is_imm, !if(ps.has_offset, offset{20-0}, ?), ?);
887  let Inst{63-57} = !if(ps.offset_is_imm, !cast<int>(SGPR_NULL.HWEncoding),
888                                          !if(ps.has_offset, offset{6-0}, ?));
889}
890
891multiclass SM_Real_Loads_gfx10<bits<8> op, string ps,
892                               SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
893                               SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
894  def _IMM_gfx10 : SMEM_Real_gfx10<op, immPs> {
895    let InOperandList = (ins immPs.BaseClass:$sbase, smem_offset:$offset, GLC:$glc, DLC:$dlc);
896  }
897  def _SGPR_gfx10 : SMEM_Real_gfx10<op, sgprPs> {
898    let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc, DLC:$dlc);
899  }
900}
901
902class SMEM_Real_Store_gfx10<bits<8> op, SM_Pseudo ps> : SMEM_Real_gfx10<op, ps> {
903  bits<7> sdata;
904
905  let sdst = ?;
906  let Inst{12-6} = !if(ps.has_sdst, sdata{6-0}, ?);
907}
908
909multiclass SM_Real_Stores_gfx10<bits<8> op, string ps,
910                                SM_Store_Pseudo immPs = !cast<SM_Store_Pseudo>(ps#_IMM),
911                                SM_Store_Pseudo sgprPs = !cast<SM_Store_Pseudo>(ps#_SGPR)> {
912  // FIXME: The operand name $offset is inconsistent with $soff used
913  // in the pseudo
914  def _IMM_gfx10 : SMEM_Real_Store_gfx10 <op, immPs> {
915    let InOperandList = (ins immPs.SrcClass:$sdata, immPs.BaseClass:$sbase, smem_offset:$offset, GLC:$glc, DLC:$dlc);
916  }
917
918  def _SGPR_gfx10 : SMEM_Real_Store_gfx10 <op, sgprPs> {
919    let InOperandList = (ins sgprPs.SrcClass:$sdata, sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc, DLC:$dlc);
920  }
921}
922
923defm S_LOAD_DWORD            : SM_Real_Loads_gfx10<0x000, "S_LOAD_DWORD">;
924defm S_LOAD_DWORDX2          : SM_Real_Loads_gfx10<0x001, "S_LOAD_DWORDX2">;
925defm S_LOAD_DWORDX4          : SM_Real_Loads_gfx10<0x002, "S_LOAD_DWORDX4">;
926defm S_LOAD_DWORDX8          : SM_Real_Loads_gfx10<0x003, "S_LOAD_DWORDX8">;
927defm S_LOAD_DWORDX16         : SM_Real_Loads_gfx10<0x004, "S_LOAD_DWORDX16">;
928
929let SubtargetPredicate = HasScalarFlatScratchInsts in {
930defm S_SCRATCH_LOAD_DWORD    : SM_Real_Loads_gfx10<0x005, "S_SCRATCH_LOAD_DWORD">;
931defm S_SCRATCH_LOAD_DWORDX2  : SM_Real_Loads_gfx10<0x006, "S_SCRATCH_LOAD_DWORDX2">;
932defm S_SCRATCH_LOAD_DWORDX4  : SM_Real_Loads_gfx10<0x007, "S_SCRATCH_LOAD_DWORDX4">;
933} // End SubtargetPredicate = HasScalarFlatScratchInsts
934
935defm S_BUFFER_LOAD_DWORD     : SM_Real_Loads_gfx10<0x008, "S_BUFFER_LOAD_DWORD">;
936defm S_BUFFER_LOAD_DWORDX2   : SM_Real_Loads_gfx10<0x009, "S_BUFFER_LOAD_DWORDX2">;
937defm S_BUFFER_LOAD_DWORDX4   : SM_Real_Loads_gfx10<0x00a, "S_BUFFER_LOAD_DWORDX4">;
938defm S_BUFFER_LOAD_DWORDX8   : SM_Real_Loads_gfx10<0x00b, "S_BUFFER_LOAD_DWORDX8">;
939defm S_BUFFER_LOAD_DWORDX16  : SM_Real_Loads_gfx10<0x00c, "S_BUFFER_LOAD_DWORDX16">;
940
941let SubtargetPredicate = HasScalarStores in {
942defm S_STORE_DWORD           : SM_Real_Stores_gfx10<0x010, "S_STORE_DWORD">;
943defm S_STORE_DWORDX2         : SM_Real_Stores_gfx10<0x011, "S_STORE_DWORDX2">;
944defm S_STORE_DWORDX4         : SM_Real_Stores_gfx10<0x012, "S_STORE_DWORDX4">;
945let OtherPredicates = [HasScalarFlatScratchInsts] in {
946defm S_SCRATCH_STORE_DWORD   : SM_Real_Stores_gfx10<0x015, "S_SCRATCH_STORE_DWORD">;
947defm S_SCRATCH_STORE_DWORDX2 : SM_Real_Stores_gfx10<0x016, "S_SCRATCH_STORE_DWORDX2">;
948defm S_SCRATCH_STORE_DWORDX4 : SM_Real_Stores_gfx10<0x017, "S_SCRATCH_STORE_DWORDX4">;
949} // End OtherPredicates = [HasScalarFlatScratchInsts]
950defm S_BUFFER_STORE_DWORD    : SM_Real_Stores_gfx10<0x018, "S_BUFFER_STORE_DWORD">;
951defm S_BUFFER_STORE_DWORDX2  : SM_Real_Stores_gfx10<0x019, "S_BUFFER_STORE_DWORDX2">;
952defm S_BUFFER_STORE_DWORDX4  : SM_Real_Stores_gfx10<0x01a, "S_BUFFER_STORE_DWORDX4">;
953} // End SubtargetPredicate = HasScalarStores
954
955def S_MEMREALTIME_gfx10              : SMEM_Real_gfx10<0x025, S_MEMREALTIME>;
956def S_MEMTIME_gfx10                  : SMEM_Real_gfx10<0x024, S_MEMTIME>;
957def S_GL1_INV_gfx10                  : SMEM_Real_gfx10<0x01f, S_GL1_INV>;
958def S_GET_WAVEID_IN_WORKGROUP_gfx10  : SMEM_Real_gfx10<0x02a, S_GET_WAVEID_IN_WORKGROUP>;
959def S_DCACHE_INV_gfx10               : SMEM_Real_gfx10<0x020, S_DCACHE_INV>;
960
961let SubtargetPredicate = HasScalarStores in {
962def S_DCACHE_WB_gfx10                : SMEM_Real_gfx10<0x021, S_DCACHE_WB>;
963} // End SubtargetPredicate = HasScalarStores
964
965multiclass SM_Real_Probe_gfx10<bits<8> op, string ps> {
966  def _IMM_gfx10  : SMEM_Real_Store_gfx10 <op, !cast<SM_Pseudo>(ps#_IMM)>;
967  def _SGPR_gfx10 : SMEM_Real_Store_gfx10 <op, !cast<SM_Pseudo>(ps#_SGPR)>;
968}
969
970defm S_ATC_PROBE        : SM_Real_Probe_gfx10 <0x26, "S_ATC_PROBE">;
971defm S_ATC_PROBE_BUFFER : SM_Real_Probe_gfx10 <0x27, "S_ATC_PROBE_BUFFER">;
972
973class SMEM_Atomic_Real_gfx10 <bits<8> op, SM_Atomic_Pseudo ps>
974  : SMEM_Real_gfx10 <op, ps> {
975
976  bits<7> sdata;
977  bit dlc;
978
979  let Constraints = ps.Constraints;
980  let DisableEncoding = ps.DisableEncoding;
981
982  let glc = ps.glc;
983
984  let Inst{14} = !if(ps.has_dlc, dlc, 0);
985  let Inst{12-6} = !if(glc, sdst{6-0}, sdata{6-0});
986}
987
988multiclass SM_Real_Atomics_gfx10<bits<8> op, string ps> {
989  def _IMM_gfx10       : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_IMM)>;
990  def _SGPR_gfx10      : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR)>;
991  def _IMM_RTN_gfx10   : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_IMM_RTN)>;
992  def _SGPR_RTN_gfx10  : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR_RTN)>;
993}
994
995let SubtargetPredicate = HasScalarAtomics in {
996
997defm S_BUFFER_ATOMIC_SWAP         : SM_Real_Atomics_gfx10 <0x40, "S_BUFFER_ATOMIC_SWAP">;
998defm S_BUFFER_ATOMIC_CMPSWAP      : SM_Real_Atomics_gfx10 <0x41, "S_BUFFER_ATOMIC_CMPSWAP">;
999defm S_BUFFER_ATOMIC_ADD          : SM_Real_Atomics_gfx10 <0x42, "S_BUFFER_ATOMIC_ADD">;
1000defm S_BUFFER_ATOMIC_SUB          : SM_Real_Atomics_gfx10 <0x43, "S_BUFFER_ATOMIC_SUB">;
1001defm S_BUFFER_ATOMIC_SMIN         : SM_Real_Atomics_gfx10 <0x44, "S_BUFFER_ATOMIC_SMIN">;
1002defm S_BUFFER_ATOMIC_UMIN         : SM_Real_Atomics_gfx10 <0x45, "S_BUFFER_ATOMIC_UMIN">;
1003defm S_BUFFER_ATOMIC_SMAX         : SM_Real_Atomics_gfx10 <0x46, "S_BUFFER_ATOMIC_SMAX">;
1004defm S_BUFFER_ATOMIC_UMAX         : SM_Real_Atomics_gfx10 <0x47, "S_BUFFER_ATOMIC_UMAX">;
1005defm S_BUFFER_ATOMIC_AND          : SM_Real_Atomics_gfx10 <0x48, "S_BUFFER_ATOMIC_AND">;
1006defm S_BUFFER_ATOMIC_OR           : SM_Real_Atomics_gfx10 <0x49, "S_BUFFER_ATOMIC_OR">;
1007defm S_BUFFER_ATOMIC_XOR          : SM_Real_Atomics_gfx10 <0x4a, "S_BUFFER_ATOMIC_XOR">;
1008defm S_BUFFER_ATOMIC_INC          : SM_Real_Atomics_gfx10 <0x4b, "S_BUFFER_ATOMIC_INC">;
1009defm S_BUFFER_ATOMIC_DEC          : SM_Real_Atomics_gfx10 <0x4c, "S_BUFFER_ATOMIC_DEC">;
1010
1011defm S_BUFFER_ATOMIC_SWAP_X2      : SM_Real_Atomics_gfx10 <0x60, "S_BUFFER_ATOMIC_SWAP_X2">;
1012defm S_BUFFER_ATOMIC_CMPSWAP_X2   : SM_Real_Atomics_gfx10 <0x61, "S_BUFFER_ATOMIC_CMPSWAP_X2">;
1013defm S_BUFFER_ATOMIC_ADD_X2       : SM_Real_Atomics_gfx10 <0x62, "S_BUFFER_ATOMIC_ADD_X2">;
1014defm S_BUFFER_ATOMIC_SUB_X2       : SM_Real_Atomics_gfx10 <0x63, "S_BUFFER_ATOMIC_SUB_X2">;
1015defm S_BUFFER_ATOMIC_SMIN_X2      : SM_Real_Atomics_gfx10 <0x64, "S_BUFFER_ATOMIC_SMIN_X2">;
1016defm S_BUFFER_ATOMIC_UMIN_X2      : SM_Real_Atomics_gfx10 <0x65, "S_BUFFER_ATOMIC_UMIN_X2">;
1017defm S_BUFFER_ATOMIC_SMAX_X2      : SM_Real_Atomics_gfx10 <0x66, "S_BUFFER_ATOMIC_SMAX_X2">;
1018defm S_BUFFER_ATOMIC_UMAX_X2      : SM_Real_Atomics_gfx10 <0x67, "S_BUFFER_ATOMIC_UMAX_X2">;
1019defm S_BUFFER_ATOMIC_AND_X2       : SM_Real_Atomics_gfx10 <0x68, "S_BUFFER_ATOMIC_AND_X2">;
1020defm S_BUFFER_ATOMIC_OR_X2        : SM_Real_Atomics_gfx10 <0x69, "S_BUFFER_ATOMIC_OR_X2">;
1021defm S_BUFFER_ATOMIC_XOR_X2       : SM_Real_Atomics_gfx10 <0x6a, "S_BUFFER_ATOMIC_XOR_X2">;
1022defm S_BUFFER_ATOMIC_INC_X2       : SM_Real_Atomics_gfx10 <0x6b, "S_BUFFER_ATOMIC_INC_X2">;
1023defm S_BUFFER_ATOMIC_DEC_X2       : SM_Real_Atomics_gfx10 <0x6c, "S_BUFFER_ATOMIC_DEC_X2">;
1024
1025defm S_ATOMIC_SWAP                : SM_Real_Atomics_gfx10 <0x80, "S_ATOMIC_SWAP">;
1026defm S_ATOMIC_CMPSWAP             : SM_Real_Atomics_gfx10 <0x81, "S_ATOMIC_CMPSWAP">;
1027defm S_ATOMIC_ADD                 : SM_Real_Atomics_gfx10 <0x82, "S_ATOMIC_ADD">;
1028defm S_ATOMIC_SUB                 : SM_Real_Atomics_gfx10 <0x83, "S_ATOMIC_SUB">;
1029defm S_ATOMIC_SMIN                : SM_Real_Atomics_gfx10 <0x84, "S_ATOMIC_SMIN">;
1030defm S_ATOMIC_UMIN                : SM_Real_Atomics_gfx10 <0x85, "S_ATOMIC_UMIN">;
1031defm S_ATOMIC_SMAX                : SM_Real_Atomics_gfx10 <0x86, "S_ATOMIC_SMAX">;
1032defm S_ATOMIC_UMAX                : SM_Real_Atomics_gfx10 <0x87, "S_ATOMIC_UMAX">;
1033defm S_ATOMIC_AND                 : SM_Real_Atomics_gfx10 <0x88, "S_ATOMIC_AND">;
1034defm S_ATOMIC_OR                  : SM_Real_Atomics_gfx10 <0x89, "S_ATOMIC_OR">;
1035defm S_ATOMIC_XOR                 : SM_Real_Atomics_gfx10 <0x8a, "S_ATOMIC_XOR">;
1036defm S_ATOMIC_INC                 : SM_Real_Atomics_gfx10 <0x8b, "S_ATOMIC_INC">;
1037defm S_ATOMIC_DEC                 : SM_Real_Atomics_gfx10 <0x8c, "S_ATOMIC_DEC">;
1038
1039defm S_ATOMIC_SWAP_X2             : SM_Real_Atomics_gfx10 <0xa0, "S_ATOMIC_SWAP_X2">;
1040defm S_ATOMIC_CMPSWAP_X2          : SM_Real_Atomics_gfx10 <0xa1, "S_ATOMIC_CMPSWAP_X2">;
1041defm S_ATOMIC_ADD_X2              : SM_Real_Atomics_gfx10 <0xa2, "S_ATOMIC_ADD_X2">;
1042defm S_ATOMIC_SUB_X2              : SM_Real_Atomics_gfx10 <0xa3, "S_ATOMIC_SUB_X2">;
1043defm S_ATOMIC_SMIN_X2             : SM_Real_Atomics_gfx10 <0xa4, "S_ATOMIC_SMIN_X2">;
1044defm S_ATOMIC_UMIN_X2             : SM_Real_Atomics_gfx10 <0xa5, "S_ATOMIC_UMIN_X2">;
1045defm S_ATOMIC_SMAX_X2             : SM_Real_Atomics_gfx10 <0xa6, "S_ATOMIC_SMAX_X2">;
1046defm S_ATOMIC_UMAX_X2             : SM_Real_Atomics_gfx10 <0xa7, "S_ATOMIC_UMAX_X2">;
1047defm S_ATOMIC_AND_X2              : SM_Real_Atomics_gfx10 <0xa8, "S_ATOMIC_AND_X2">;
1048defm S_ATOMIC_OR_X2               : SM_Real_Atomics_gfx10 <0xa9, "S_ATOMIC_OR_X2">;
1049defm S_ATOMIC_XOR_X2              : SM_Real_Atomics_gfx10 <0xaa, "S_ATOMIC_XOR_X2">;
1050defm S_ATOMIC_INC_X2              : SM_Real_Atomics_gfx10 <0xab, "S_ATOMIC_INC_X2">;
1051defm S_ATOMIC_DEC_X2              : SM_Real_Atomics_gfx10 <0xac, "S_ATOMIC_DEC_X2">;
1052
1053multiclass SM_Real_Discard_gfx10<bits<8> op, string ps> {
1054  def _IMM_gfx10  : SMEM_Real_gfx10 <op, !cast<SM_Pseudo>(ps#_IMM)>;
1055  def _SGPR_gfx10 : SMEM_Real_gfx10 <op, !cast<SM_Pseudo>(ps#_SGPR)>;
1056}
1057
1058defm S_DCACHE_DISCARD    : SM_Real_Discard_gfx10 <0x28, "S_DCACHE_DISCARD">;
1059defm S_DCACHE_DISCARD_X2 : SM_Real_Discard_gfx10 <0x29, "S_DCACHE_DISCARD_X2">;
1060
1061} // End SubtargetPredicate = HasScalarAtomics
1062
1063def SMInfoTable : GenericTable {
1064  let FilterClass = "SM_Real";
1065  let CppTypeName = "SMInfo";
1066  let Fields = ["Opcode", "is_buffer"];
1067
1068  let PrimaryKey = ["Opcode"];
1069  let PrimaryKeyName = "getSMEMOpcodeHelper";
1070}
1071