xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/SMInstructions.td (revision 4b50c451720d8b427757a6da1dd2bb4c52cd9e35)
1//===---- SMInstructions.td - Scalar Memory Instruction Defintions --------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9def smrd_offset_8 : NamedOperandU32<"SMRDOffset8",
10                                  NamedMatchClass<"SMRDOffset8">> {
11  let OperandType = "OPERAND_IMMEDIATE";
12}
13
14def smrd_offset_20 : NamedOperandU32<"SMRDOffset20",
15                                  NamedMatchClass<"SMRDOffset20">> {
16  let OperandType = "OPERAND_IMMEDIATE";
17}
18
19//===----------------------------------------------------------------------===//
20// Scalar Memory classes
21//===----------------------------------------------------------------------===//
22
23class SM_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]> :
24  InstSI <outs, ins, "", pattern>,
25  SIMCInstr<opName, SIEncodingFamily.NONE> {
26  let isPseudo = 1;
27  let isCodeGenOnly = 1;
28
29  let LGKM_CNT = 1;
30  let SMRD = 1;
31  let mayStore = 0;
32  let mayLoad = 1;
33  let hasSideEffects = 0;
34  let UseNamedOperandTable = 1;
35  let SchedRW = [WriteSMEM];
36
37  string Mnemonic = opName;
38  string AsmOperands = asmOps;
39
40  bits<1> has_sbase = 1;
41  bits<1> has_sdst = 1;
42  bit has_glc = 0;
43  bit has_dlc = 0;
44  bits<1> has_offset = 1;
45  bits<1> offset_is_imm = 0;
46}
47
48class SM_Real <SM_Pseudo ps>
49  : InstSI<ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []> {
50
51  let isPseudo = 0;
52  let isCodeGenOnly = 0;
53
54  // copy relevant pseudo op flags
55  let SubtargetPredicate = ps.SubtargetPredicate;
56  let AsmMatchConverter  = ps.AsmMatchConverter;
57
58  // encoding
59  bits<7>  sbase;
60  bits<7>  sdst;
61  bits<32> offset;
62  bits<1> imm = !if(ps.has_offset, ps.offset_is_imm, 0);
63}
64
65class SM_Probe_Pseudo <string opName, dag ins, bit isImm>
66  : SM_Pseudo<opName, (outs), ins, " $sdata, $sbase, $offset"> {
67  let mayLoad = 0;
68  let mayStore = 0;
69  let has_glc = 0;
70  let LGKM_CNT = 0;
71  let ScalarStore = 0;
72  let hasSideEffects = 1;
73  let offset_is_imm = isImm;
74  let PseudoInstr = opName # !if(isImm, "_IMM", "_SGPR");
75}
76
77class SM_Load_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]>
78  : SM_Pseudo<opName, outs, ins, asmOps, pattern> {
79  RegisterClass BaseClass;
80  let mayLoad = 1;
81  let mayStore = 0;
82  let has_glc = 1;
83  let has_dlc = 1;
84}
85
86class SM_Store_Pseudo <string opName, dag ins, string asmOps, list<dag> pattern = []>
87  : SM_Pseudo<opName, (outs), ins, asmOps, pattern> {
88  RegisterClass BaseClass;
89  RegisterClass SrcClass;
90  let mayLoad = 0;
91  let mayStore = 1;
92  let has_glc = 1;
93  let has_dlc = 1;
94  let ScalarStore = 1;
95}
96
97class SM_Discard_Pseudo <string opName, dag ins, bit isImm>
98  : SM_Pseudo<opName, (outs), ins, " $sbase, $offset"> {
99  let mayLoad = 0;
100  let mayStore = 0;
101  let has_glc = 0;
102  let has_sdst = 0;
103  let ScalarStore = 0;
104  let hasSideEffects = 1;
105  let offset_is_imm = isImm;
106  let PseudoInstr = opName # !if(isImm, "_IMM", "_SGPR");
107}
108
109multiclass SM_Pseudo_Loads<string opName,
110                           RegisterClass baseClass,
111                           RegisterClass dstClass> {
112  def _IMM  : SM_Load_Pseudo <opName,
113                              (outs dstClass:$sdst),
114                              (ins baseClass:$sbase, i32imm:$offset, i1imm:$glc, i1imm:$dlc),
115                              " $sdst, $sbase, $offset$glc$dlc", []> {
116    let offset_is_imm = 1;
117    let BaseClass = baseClass;
118    let PseudoInstr = opName # "_IMM";
119    let has_glc = 1;
120    let has_dlc = 1;
121  }
122
123  def _SGPR  : SM_Load_Pseudo <opName,
124                              (outs dstClass:$sdst),
125                              (ins baseClass:$sbase, SReg_32:$soff, i1imm:$glc, i1imm:$dlc),
126                              " $sdst, $sbase, $offset$glc$dlc", []> {
127    let BaseClass = baseClass;
128    let PseudoInstr = opName # "_SGPR";
129    let has_glc = 1;
130    let has_dlc = 1;
131  }
132}
133
134multiclass SM_Pseudo_Stores<string opName,
135                           RegisterClass baseClass,
136                           RegisterClass srcClass> {
137  def _IMM  : SM_Store_Pseudo <opName,
138    (ins srcClass:$sdata, baseClass:$sbase, i32imm:$offset, i1imm:$glc, i1imm:$dlc),
139    " $sdata, $sbase, $offset$glc$dlc", []> {
140    let offset_is_imm = 1;
141    let BaseClass = baseClass;
142    let SrcClass = srcClass;
143    let PseudoInstr = opName # "_IMM";
144  }
145
146  def _SGPR  : SM_Store_Pseudo <opName,
147    (ins srcClass:$sdata, baseClass:$sbase, SReg_32:$soff, i1imm:$glc, i1imm:$dlc),
148    " $sdata, $sbase, $offset$glc$dlc", []> {
149    let BaseClass = baseClass;
150    let SrcClass = srcClass;
151    let PseudoInstr = opName # "_SGPR";
152  }
153}
154
155multiclass SM_Pseudo_Discards<string opName> {
156  def _IMM  : SM_Discard_Pseudo <opName, (ins SReg_64:$sbase, smrd_offset_20:$offset), 1>;
157  def _SGPR : SM_Discard_Pseudo <opName, (ins SReg_64:$sbase, SReg_32:$offset), 0>;
158}
159
160class SM_Time_Pseudo<string opName, SDPatternOperator node = null_frag> : SM_Pseudo<
161  opName, (outs SReg_64_XEXEC:$sdst), (ins),
162  " $sdst", [(set i64:$sdst, (node))]> {
163  let hasSideEffects = 1;
164
165  // FIXME: This should be definitively mayStore = 0. TableGen
166  // brokenly tries to infer these based on the intrinsic properties
167  // corresponding to the IR attributes. The target intrinsics are
168  // considered as writing to memory for IR dependency purposes, but
169  // those can be modeled with hasSideEffects here. These also end up
170  // inferring differently for llvm.readcyclecounter and the amdgcn
171  // intrinsics.
172  let mayStore = ?;
173  let mayLoad = 1;
174  let has_sbase = 0;
175  let has_offset = 0;
176}
177
178class SM_Inval_Pseudo <string opName, SDPatternOperator node = null_frag> : SM_Pseudo<
179  opName, (outs), (ins), "", [(node)]> {
180  let hasSideEffects = 1;
181  let mayStore = 1;
182  let has_sdst = 0;
183  let has_sbase = 0;
184  let has_offset = 0;
185}
186
187multiclass SM_Pseudo_Probe<string opName, RegisterClass baseClass> {
188  def _IMM  : SM_Probe_Pseudo <opName, (ins i8imm:$sdata, baseClass:$sbase, smrd_offset_20:$offset), 1>;
189  def _SGPR : SM_Probe_Pseudo <opName, (ins i8imm:$sdata, baseClass:$sbase, SReg_32:$offset), 0>;
190}
191
192class SM_WaveId_Pseudo<string opName, SDPatternOperator node> : SM_Pseudo<
193  opName, (outs SReg_32_XM0_XEXEC:$sdst), (ins),
194  " $sdst", [(set i32:$sdst, (node))]> {
195  let hasSideEffects = 1;
196  let mayStore = 0;
197  let mayLoad = 1;
198  let has_sbase = 0;
199  let has_offset = 0;
200}
201
202//===----------------------------------------------------------------------===//
203// Scalar Atomic Memory Classes
204//===----------------------------------------------------------------------===//
205
206class SM_Atomic_Pseudo <string opName,
207                        dag outs, dag ins, string asmOps, bit isRet>
208  : SM_Pseudo<opName, outs, ins, asmOps, []> {
209
210  bit glc = isRet;
211
212  let mayLoad = 1;
213  let mayStore = 1;
214  let has_glc = 1;
215  let has_dlc = 1;
216
217  // Should these be set?
218  let ScalarStore = 1;
219  let hasSideEffects = 1;
220  let maybeAtomic = 1;
221}
222
223class SM_Pseudo_Atomic<string opName,
224                       RegisterClass baseClass,
225                       RegisterClass dataClass,
226                       bit isImm,
227                       bit isRet> :
228  SM_Atomic_Pseudo<opName,
229                   !if(isRet, (outs dataClass:$sdst), (outs)),
230                   !if(isImm,
231                       (ins dataClass:$sdata, baseClass:$sbase, smrd_offset_20:$offset, DLC:$dlc),
232                       (ins dataClass:$sdata, baseClass:$sbase, SReg_32:$offset, DLC:$dlc)),
233                   !if(isRet, " $sdst", " $sdata") # ", $sbase, $offset" # !if(isRet, " glc", "") # "$dlc",
234                   isRet> {
235  let offset_is_imm = isImm;
236  let PseudoInstr = opName # !if(isImm,
237                                 !if(isRet, "_IMM_RTN", "_IMM"),
238                                 !if(isRet, "_SGPR_RTN", "_SGPR"));
239
240  let Constraints = !if(isRet, "$sdst = $sdata", "");
241  let DisableEncoding = !if(isRet, "$sdata", "");
242}
243
244multiclass SM_Pseudo_Atomics<string opName,
245                             RegisterClass baseClass,
246                             RegisterClass dataClass> {
247  def _IMM      : SM_Pseudo_Atomic <opName, baseClass, dataClass, 1, 0>;
248  def _SGPR     : SM_Pseudo_Atomic <opName, baseClass, dataClass, 0, 0>;
249  def _IMM_RTN  : SM_Pseudo_Atomic <opName, baseClass, dataClass, 1, 1>;
250  def _SGPR_RTN : SM_Pseudo_Atomic <opName, baseClass, dataClass, 0, 1>;
251}
252
253//===----------------------------------------------------------------------===//
254// Scalar Memory Instructions
255//===----------------------------------------------------------------------===//
256
257// We are using the SReg_32_XM0 and not the SReg_32 register class for 32-bit
258// SMRD instructions, because the SReg_32_XM0 register class does not include M0
259// and writing to M0 from an SMRD instruction will hang the GPU.
260
261// XXX - SMEM instructions do not allow exec for data operand, but
262// does sdst for SMRD on SI/CI?
263defm S_LOAD_DWORD    : SM_Pseudo_Loads <"s_load_dword", SReg_64, SReg_32_XM0_XEXEC>;
264defm S_LOAD_DWORDX2  : SM_Pseudo_Loads <"s_load_dwordx2", SReg_64, SReg_64_XEXEC>;
265defm S_LOAD_DWORDX4  : SM_Pseudo_Loads <"s_load_dwordx4", SReg_64, SReg_128>;
266defm S_LOAD_DWORDX8  : SM_Pseudo_Loads <"s_load_dwordx8", SReg_64, SReg_256>;
267defm S_LOAD_DWORDX16 : SM_Pseudo_Loads <"s_load_dwordx16", SReg_64, SReg_512>;
268
269defm S_BUFFER_LOAD_DWORD : SM_Pseudo_Loads <
270  "s_buffer_load_dword", SReg_128, SReg_32_XM0_XEXEC
271>;
272
273// FIXME: exec_lo/exec_hi appear to be allowed for SMRD loads on
274// SI/CI, bit disallowed for SMEM on VI.
275defm S_BUFFER_LOAD_DWORDX2 : SM_Pseudo_Loads <
276  "s_buffer_load_dwordx2", SReg_128, SReg_64_XEXEC
277>;
278
279defm S_BUFFER_LOAD_DWORDX4 : SM_Pseudo_Loads <
280  "s_buffer_load_dwordx4", SReg_128, SReg_128
281>;
282
283defm S_BUFFER_LOAD_DWORDX8 : SM_Pseudo_Loads <
284  "s_buffer_load_dwordx8", SReg_128, SReg_256
285>;
286
287defm S_BUFFER_LOAD_DWORDX16 : SM_Pseudo_Loads <
288  "s_buffer_load_dwordx16", SReg_128, SReg_512
289>;
290
291let SubtargetPredicate = HasScalarStores in {
292defm S_STORE_DWORD : SM_Pseudo_Stores <"s_store_dword", SReg_64, SReg_32_XM0_XEXEC>;
293defm S_STORE_DWORDX2 : SM_Pseudo_Stores <"s_store_dwordx2", SReg_64, SReg_64_XEXEC>;
294defm S_STORE_DWORDX4 : SM_Pseudo_Stores <"s_store_dwordx4", SReg_64, SReg_128>;
295
296defm S_BUFFER_STORE_DWORD : SM_Pseudo_Stores <
297  "s_buffer_store_dword", SReg_128, SReg_32_XM0_XEXEC
298>;
299
300defm S_BUFFER_STORE_DWORDX2 : SM_Pseudo_Stores <
301  "s_buffer_store_dwordx2", SReg_128, SReg_64_XEXEC
302>;
303
304defm S_BUFFER_STORE_DWORDX4 : SM_Pseudo_Stores <
305  "s_buffer_store_dwordx4", SReg_128, SReg_128
306>;
307} // End SubtargetPredicate = HasScalarStores
308
309def S_MEMTIME : SM_Time_Pseudo <"s_memtime", int_amdgcn_s_memtime>;
310def S_DCACHE_INV : SM_Inval_Pseudo <"s_dcache_inv", int_amdgcn_s_dcache_inv>;
311
312let SubtargetPredicate = isGFX7GFX8GFX9 in {
313def S_DCACHE_INV_VOL : SM_Inval_Pseudo <"s_dcache_inv_vol", int_amdgcn_s_dcache_inv_vol>;
314} // let SubtargetPredicate = isGFX7GFX8GFX9
315
316let SubtargetPredicate = isGFX8Plus in {
317let OtherPredicates = [HasScalarStores] in {
318def S_DCACHE_WB     : SM_Inval_Pseudo <"s_dcache_wb", int_amdgcn_s_dcache_wb>;
319def S_DCACHE_WB_VOL : SM_Inval_Pseudo <"s_dcache_wb_vol", int_amdgcn_s_dcache_wb_vol>;
320} // End OtherPredicates = [HasScalarStores]
321def S_MEMREALTIME   : SM_Time_Pseudo <"s_memrealtime", int_amdgcn_s_memrealtime>;
322
323defm S_ATC_PROBE        : SM_Pseudo_Probe <"s_atc_probe", SReg_64>;
324defm S_ATC_PROBE_BUFFER : SM_Pseudo_Probe <"s_atc_probe_buffer", SReg_128>;
325} // SubtargetPredicate = isGFX8Plus
326
327let SubtargetPredicate = isGFX10Plus in {
328def S_GL1_INV : SM_Inval_Pseudo<"s_gl1_inv">;
329def S_GET_WAVEID_IN_WORKGROUP : SM_WaveId_Pseudo <"s_get_waveid_in_workgroup", int_amdgcn_s_get_waveid_in_workgroup>;
330} // End SubtargetPredicate = isGFX10Plus
331
332let SubtargetPredicate = HasScalarFlatScratchInsts, Uses = [FLAT_SCR] in {
333defm S_SCRATCH_LOAD_DWORD    : SM_Pseudo_Loads <"s_scratch_load_dword",   SReg_64, SReg_32_XM0_XEXEC>;
334defm S_SCRATCH_LOAD_DWORDX2  : SM_Pseudo_Loads <"s_scratch_load_dwordx2", SReg_64, SReg_64_XEXEC>;
335defm S_SCRATCH_LOAD_DWORDX4  : SM_Pseudo_Loads <"s_scratch_load_dwordx4", SReg_64, SReg_128>;
336
337defm S_SCRATCH_STORE_DWORD   : SM_Pseudo_Stores <"s_scratch_store_dword",   SReg_64, SReg_32_XM0_XEXEC>;
338defm S_SCRATCH_STORE_DWORDX2 : SM_Pseudo_Stores <"s_scratch_store_dwordx2", SReg_64, SReg_64_XEXEC>;
339defm S_SCRATCH_STORE_DWORDX4 : SM_Pseudo_Stores <"s_scratch_store_dwordx4", SReg_64, SReg_128>;
340} // SubtargetPredicate = HasScalarFlatScratchInsts
341
342let SubtargetPredicate = HasScalarAtomics in {
343
344defm S_BUFFER_ATOMIC_SWAP         : SM_Pseudo_Atomics <"s_buffer_atomic_swap", SReg_128, SReg_32_XM0_XEXEC>;
345defm S_BUFFER_ATOMIC_CMPSWAP      : SM_Pseudo_Atomics <"s_buffer_atomic_cmpswap", SReg_128, SReg_64_XEXEC>;
346defm S_BUFFER_ATOMIC_ADD          : SM_Pseudo_Atomics <"s_buffer_atomic_add", SReg_128, SReg_32_XM0_XEXEC>;
347defm S_BUFFER_ATOMIC_SUB          : SM_Pseudo_Atomics <"s_buffer_atomic_sub", SReg_128, SReg_32_XM0_XEXEC>;
348defm S_BUFFER_ATOMIC_SMIN         : SM_Pseudo_Atomics <"s_buffer_atomic_smin", SReg_128, SReg_32_XM0_XEXEC>;
349defm S_BUFFER_ATOMIC_UMIN         : SM_Pseudo_Atomics <"s_buffer_atomic_umin", SReg_128, SReg_32_XM0_XEXEC>;
350defm S_BUFFER_ATOMIC_SMAX         : SM_Pseudo_Atomics <"s_buffer_atomic_smax", SReg_128, SReg_32_XM0_XEXEC>;
351defm S_BUFFER_ATOMIC_UMAX         : SM_Pseudo_Atomics <"s_buffer_atomic_umax", SReg_128, SReg_32_XM0_XEXEC>;
352defm S_BUFFER_ATOMIC_AND          : SM_Pseudo_Atomics <"s_buffer_atomic_and", SReg_128, SReg_32_XM0_XEXEC>;
353defm S_BUFFER_ATOMIC_OR           : SM_Pseudo_Atomics <"s_buffer_atomic_or", SReg_128, SReg_32_XM0_XEXEC>;
354defm S_BUFFER_ATOMIC_XOR          : SM_Pseudo_Atomics <"s_buffer_atomic_xor", SReg_128, SReg_32_XM0_XEXEC>;
355defm S_BUFFER_ATOMIC_INC          : SM_Pseudo_Atomics <"s_buffer_atomic_inc", SReg_128, SReg_32_XM0_XEXEC>;
356defm S_BUFFER_ATOMIC_DEC          : SM_Pseudo_Atomics <"s_buffer_atomic_dec", SReg_128, SReg_32_XM0_XEXEC>;
357
358defm S_BUFFER_ATOMIC_SWAP_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_swap_x2", SReg_128, SReg_64_XEXEC>;
359defm S_BUFFER_ATOMIC_CMPSWAP_X2   : SM_Pseudo_Atomics <"s_buffer_atomic_cmpswap_x2", SReg_128, SReg_128>;
360defm S_BUFFER_ATOMIC_ADD_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_add_x2", SReg_128, SReg_64_XEXEC>;
361defm S_BUFFER_ATOMIC_SUB_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_sub_x2", SReg_128, SReg_64_XEXEC>;
362defm S_BUFFER_ATOMIC_SMIN_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_smin_x2", SReg_128, SReg_64_XEXEC>;
363defm S_BUFFER_ATOMIC_UMIN_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_umin_x2", SReg_128, SReg_64_XEXEC>;
364defm S_BUFFER_ATOMIC_SMAX_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_smax_x2", SReg_128, SReg_64_XEXEC>;
365defm S_BUFFER_ATOMIC_UMAX_X2      : SM_Pseudo_Atomics <"s_buffer_atomic_umax_x2", SReg_128, SReg_64_XEXEC>;
366defm S_BUFFER_ATOMIC_AND_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_and_x2", SReg_128, SReg_64_XEXEC>;
367defm S_BUFFER_ATOMIC_OR_X2        : SM_Pseudo_Atomics <"s_buffer_atomic_or_x2", SReg_128, SReg_64_XEXEC>;
368defm S_BUFFER_ATOMIC_XOR_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_xor_x2", SReg_128, SReg_64_XEXEC>;
369defm S_BUFFER_ATOMIC_INC_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_inc_x2", SReg_128, SReg_64_XEXEC>;
370defm S_BUFFER_ATOMIC_DEC_X2       : SM_Pseudo_Atomics <"s_buffer_atomic_dec_x2", SReg_128, SReg_64_XEXEC>;
371
372defm S_ATOMIC_SWAP                : SM_Pseudo_Atomics <"s_atomic_swap", SReg_64, SReg_32_XM0_XEXEC>;
373defm S_ATOMIC_CMPSWAP             : SM_Pseudo_Atomics <"s_atomic_cmpswap", SReg_64, SReg_64_XEXEC>;
374defm S_ATOMIC_ADD                 : SM_Pseudo_Atomics <"s_atomic_add", SReg_64, SReg_32_XM0_XEXEC>;
375defm S_ATOMIC_SUB                 : SM_Pseudo_Atomics <"s_atomic_sub", SReg_64, SReg_32_XM0_XEXEC>;
376defm S_ATOMIC_SMIN                : SM_Pseudo_Atomics <"s_atomic_smin", SReg_64, SReg_32_XM0_XEXEC>;
377defm S_ATOMIC_UMIN                : SM_Pseudo_Atomics <"s_atomic_umin", SReg_64, SReg_32_XM0_XEXEC>;
378defm S_ATOMIC_SMAX                : SM_Pseudo_Atomics <"s_atomic_smax", SReg_64, SReg_32_XM0_XEXEC>;
379defm S_ATOMIC_UMAX                : SM_Pseudo_Atomics <"s_atomic_umax", SReg_64, SReg_32_XM0_XEXEC>;
380defm S_ATOMIC_AND                 : SM_Pseudo_Atomics <"s_atomic_and", SReg_64, SReg_32_XM0_XEXEC>;
381defm S_ATOMIC_OR                  : SM_Pseudo_Atomics <"s_atomic_or", SReg_64, SReg_32_XM0_XEXEC>;
382defm S_ATOMIC_XOR                 : SM_Pseudo_Atomics <"s_atomic_xor", SReg_64, SReg_32_XM0_XEXEC>;
383defm S_ATOMIC_INC                 : SM_Pseudo_Atomics <"s_atomic_inc", SReg_64, SReg_32_XM0_XEXEC>;
384defm S_ATOMIC_DEC                 : SM_Pseudo_Atomics <"s_atomic_dec", SReg_64, SReg_32_XM0_XEXEC>;
385
386defm S_ATOMIC_SWAP_X2             : SM_Pseudo_Atomics <"s_atomic_swap_x2", SReg_64, SReg_64_XEXEC>;
387defm S_ATOMIC_CMPSWAP_X2          : SM_Pseudo_Atomics <"s_atomic_cmpswap_x2", SReg_64, SReg_128>;
388defm S_ATOMIC_ADD_X2              : SM_Pseudo_Atomics <"s_atomic_add_x2", SReg_64, SReg_64_XEXEC>;
389defm S_ATOMIC_SUB_X2              : SM_Pseudo_Atomics <"s_atomic_sub_x2", SReg_64, SReg_64_XEXEC>;
390defm S_ATOMIC_SMIN_X2             : SM_Pseudo_Atomics <"s_atomic_smin_x2", SReg_64, SReg_64_XEXEC>;
391defm S_ATOMIC_UMIN_X2             : SM_Pseudo_Atomics <"s_atomic_umin_x2", SReg_64, SReg_64_XEXEC>;
392defm S_ATOMIC_SMAX_X2             : SM_Pseudo_Atomics <"s_atomic_smax_x2", SReg_64, SReg_64_XEXEC>;
393defm S_ATOMIC_UMAX_X2             : SM_Pseudo_Atomics <"s_atomic_umax_x2", SReg_64, SReg_64_XEXEC>;
394defm S_ATOMIC_AND_X2              : SM_Pseudo_Atomics <"s_atomic_and_x2", SReg_64, SReg_64_XEXEC>;
395defm S_ATOMIC_OR_X2               : SM_Pseudo_Atomics <"s_atomic_or_x2", SReg_64, SReg_64_XEXEC>;
396defm S_ATOMIC_XOR_X2              : SM_Pseudo_Atomics <"s_atomic_xor_x2", SReg_64, SReg_64_XEXEC>;
397defm S_ATOMIC_INC_X2              : SM_Pseudo_Atomics <"s_atomic_inc_x2", SReg_64, SReg_64_XEXEC>;
398defm S_ATOMIC_DEC_X2              : SM_Pseudo_Atomics <"s_atomic_dec_x2", SReg_64, SReg_64_XEXEC>;
399
400} // let SubtargetPredicate = HasScalarAtomics
401
402let SubtargetPredicate = HasScalarAtomics in {
403defm S_DCACHE_DISCARD    : SM_Pseudo_Discards <"s_dcache_discard">;
404defm S_DCACHE_DISCARD_X2 : SM_Pseudo_Discards <"s_dcache_discard_x2">;
405}
406
407//===----------------------------------------------------------------------===//
408// Targets
409//===----------------------------------------------------------------------===//
410
411//===----------------------------------------------------------------------===//
412// SI
413//===----------------------------------------------------------------------===//
414
415class SMRD_Real_si <bits<5> op, SM_Pseudo ps>
416  : SM_Real<ps>
417  , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
418  , Enc32 {
419
420  let AssemblerPredicates = [isGFX6GFX7];
421  let DecoderNamespace = "GFX6GFX7";
422
423  let Inst{7-0}   = !if(ps.has_offset, offset{7-0}, ?);
424  let Inst{8}     = imm;
425  let Inst{14-9}  = !if(ps.has_sbase, sbase{6-1}, ?);
426  let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
427  let Inst{26-22} = op;
428  let Inst{31-27} = 0x18; //encoding
429}
430
431// FIXME: Assembler should reject trying to use glc on SMRD
432// instructions on SI.
433multiclass SM_Real_Loads_si<bits<5> op, string ps,
434                            SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
435                            SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
436
437  def _IMM_si : SMRD_Real_si <op, immPs> {
438    let InOperandList = (ins immPs.BaseClass:$sbase, smrd_offset_8:$offset, GLC:$glc, DLC:$dlc);
439  }
440
441  // FIXME: The operand name $offset is inconsistent with $soff used
442  // in the pseudo
443  def _SGPR_si : SMRD_Real_si <op, sgprPs> {
444    let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc, DLC:$dlc);
445  }
446
447}
448
449defm S_LOAD_DWORD           : SM_Real_Loads_si <0x00, "S_LOAD_DWORD">;
450defm S_LOAD_DWORDX2         : SM_Real_Loads_si <0x01, "S_LOAD_DWORDX2">;
451defm S_LOAD_DWORDX4         : SM_Real_Loads_si <0x02, "S_LOAD_DWORDX4">;
452defm S_LOAD_DWORDX8         : SM_Real_Loads_si <0x03, "S_LOAD_DWORDX8">;
453defm S_LOAD_DWORDX16        : SM_Real_Loads_si <0x04, "S_LOAD_DWORDX16">;
454defm S_BUFFER_LOAD_DWORD    : SM_Real_Loads_si <0x08, "S_BUFFER_LOAD_DWORD">;
455defm S_BUFFER_LOAD_DWORDX2  : SM_Real_Loads_si <0x09, "S_BUFFER_LOAD_DWORDX2">;
456defm S_BUFFER_LOAD_DWORDX4  : SM_Real_Loads_si <0x0a, "S_BUFFER_LOAD_DWORDX4">;
457defm S_BUFFER_LOAD_DWORDX8  : SM_Real_Loads_si <0x0b, "S_BUFFER_LOAD_DWORDX8">;
458defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_si <0x0c, "S_BUFFER_LOAD_DWORDX16">;
459
460def S_MEMTIME_si    : SMRD_Real_si <0x1e, S_MEMTIME>;
461def S_DCACHE_INV_si : SMRD_Real_si <0x1f, S_DCACHE_INV>;
462
463
464//===----------------------------------------------------------------------===//
465// VI
466//===----------------------------------------------------------------------===//
467
468class SMEM_Real_vi <bits<8> op, SM_Pseudo ps>
469  : SM_Real<ps>
470  , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.VI>
471  , Enc64 {
472  bit glc;
473
474  let AssemblerPredicates = [isGFX8GFX9];
475  let DecoderNamespace = "GFX8";
476
477  let Inst{5-0}   = !if(ps.has_sbase, sbase{6-1}, ?);
478  let Inst{12-6}  = !if(ps.has_sdst, sdst{6-0}, ?);
479
480  let Inst{16} = !if(ps.has_glc, glc, ?);
481  let Inst{17} = imm;
482  let Inst{25-18} = op;
483  let Inst{31-26} = 0x30; //encoding
484  let Inst{51-32} = !if(ps.has_offset, offset{19-0}, ?);
485}
486
487multiclass SM_Real_Loads_vi<bits<8> op, string ps,
488                            SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
489                            SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
490  def _IMM_vi : SMEM_Real_vi <op, immPs> {
491    let InOperandList = (ins immPs.BaseClass:$sbase, smrd_offset_20:$offset, GLC:$glc, DLC:$dlc);
492  }
493  def _SGPR_vi : SMEM_Real_vi <op, sgprPs> {
494    let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc, DLC:$dlc);
495  }
496}
497
498class SMEM_Real_Store_vi <bits<8> op, SM_Pseudo ps> : SMEM_Real_vi <op, ps> {
499  // encoding
500  bits<7> sdata;
501
502  let sdst = ?;
503  let Inst{12-6}  = !if(ps.has_sdst, sdata{6-0}, ?);
504}
505
506multiclass SM_Real_Stores_vi<bits<8> op, string ps,
507                            SM_Store_Pseudo immPs = !cast<SM_Store_Pseudo>(ps#_IMM),
508                            SM_Store_Pseudo sgprPs = !cast<SM_Store_Pseudo>(ps#_SGPR)> {
509  // FIXME: The operand name $offset is inconsistent with $soff used
510  // in the pseudo
511  def _IMM_vi : SMEM_Real_Store_vi <op, immPs> {
512    let InOperandList = (ins immPs.SrcClass:$sdata, immPs.BaseClass:$sbase, smrd_offset_20:$offset, GLC:$glc, DLC:$dlc);
513  }
514
515  def _SGPR_vi : SMEM_Real_Store_vi <op, sgprPs> {
516    let InOperandList = (ins sgprPs.SrcClass:$sdata, sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc, DLC:$dlc);
517  }
518}
519
520multiclass SM_Real_Probe_vi<bits<8> op, string ps> {
521  def _IMM_vi  : SMEM_Real_Store_vi <op, !cast<SM_Probe_Pseudo>(ps#_IMM)>;
522  def _SGPR_vi : SMEM_Real_Store_vi <op, !cast<SM_Probe_Pseudo>(ps#_SGPR)>;
523}
524
525defm S_LOAD_DWORD           : SM_Real_Loads_vi <0x00, "S_LOAD_DWORD">;
526defm S_LOAD_DWORDX2         : SM_Real_Loads_vi <0x01, "S_LOAD_DWORDX2">;
527defm S_LOAD_DWORDX4         : SM_Real_Loads_vi <0x02, "S_LOAD_DWORDX4">;
528defm S_LOAD_DWORDX8         : SM_Real_Loads_vi <0x03, "S_LOAD_DWORDX8">;
529defm S_LOAD_DWORDX16        : SM_Real_Loads_vi <0x04, "S_LOAD_DWORDX16">;
530defm S_BUFFER_LOAD_DWORD    : SM_Real_Loads_vi <0x08, "S_BUFFER_LOAD_DWORD">;
531defm S_BUFFER_LOAD_DWORDX2  : SM_Real_Loads_vi <0x09, "S_BUFFER_LOAD_DWORDX2">;
532defm S_BUFFER_LOAD_DWORDX4  : SM_Real_Loads_vi <0x0a, "S_BUFFER_LOAD_DWORDX4">;
533defm S_BUFFER_LOAD_DWORDX8  : SM_Real_Loads_vi <0x0b, "S_BUFFER_LOAD_DWORDX8">;
534defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_vi <0x0c, "S_BUFFER_LOAD_DWORDX16">;
535
536defm S_STORE_DWORD : SM_Real_Stores_vi <0x10, "S_STORE_DWORD">;
537defm S_STORE_DWORDX2 : SM_Real_Stores_vi <0x11, "S_STORE_DWORDX2">;
538defm S_STORE_DWORDX4 : SM_Real_Stores_vi <0x12, "S_STORE_DWORDX4">;
539
540defm S_BUFFER_STORE_DWORD    : SM_Real_Stores_vi <0x18, "S_BUFFER_STORE_DWORD">;
541defm S_BUFFER_STORE_DWORDX2  : SM_Real_Stores_vi <0x19, "S_BUFFER_STORE_DWORDX2">;
542defm S_BUFFER_STORE_DWORDX4  : SM_Real_Stores_vi <0x1a, "S_BUFFER_STORE_DWORDX4">;
543
544// These instructions use same encoding
545def S_DCACHE_INV_vi         : SMEM_Real_vi <0x20, S_DCACHE_INV>;
546def S_DCACHE_WB_vi          : SMEM_Real_vi <0x21, S_DCACHE_WB>;
547def S_DCACHE_INV_VOL_vi     : SMEM_Real_vi <0x22, S_DCACHE_INV_VOL>;
548def S_DCACHE_WB_VOL_vi      : SMEM_Real_vi <0x23, S_DCACHE_WB_VOL>;
549def S_MEMTIME_vi            : SMEM_Real_vi <0x24, S_MEMTIME>;
550def S_MEMREALTIME_vi        : SMEM_Real_vi <0x25, S_MEMREALTIME>;
551
552defm S_SCRATCH_LOAD_DWORD    : SM_Real_Loads_vi <0x05, "S_SCRATCH_LOAD_DWORD">;
553defm S_SCRATCH_LOAD_DWORDX2  : SM_Real_Loads_vi <0x06, "S_SCRATCH_LOAD_DWORDX2">;
554defm S_SCRATCH_LOAD_DWORDX4  : SM_Real_Loads_vi <0x07, "S_SCRATCH_LOAD_DWORDX4">;
555
556defm S_SCRATCH_STORE_DWORD   : SM_Real_Stores_vi <0x15, "S_SCRATCH_STORE_DWORD">;
557defm S_SCRATCH_STORE_DWORDX2 : SM_Real_Stores_vi <0x16, "S_SCRATCH_STORE_DWORDX2">;
558defm S_SCRATCH_STORE_DWORDX4 : SM_Real_Stores_vi <0x17, "S_SCRATCH_STORE_DWORDX4">;
559
560defm S_ATC_PROBE        : SM_Real_Probe_vi <0x26, "S_ATC_PROBE">;
561defm S_ATC_PROBE_BUFFER : SM_Real_Probe_vi <0x27, "S_ATC_PROBE_BUFFER">;
562
563//===----------------------------------------------------------------------===//
564// GFX9
565//===----------------------------------------------------------------------===//
566
567class SMEM_Atomic_Real_vi <bits<8> op, SM_Atomic_Pseudo ps>
568  : SMEM_Real_vi <op, ps> {
569
570  bits<7> sdata;
571
572  let Constraints = ps.Constraints;
573  let DisableEncoding = ps.DisableEncoding;
574
575  let glc = ps.glc;
576  let Inst{12-6} = !if(glc, sdst{6-0}, sdata{6-0});
577}
578
579multiclass SM_Real_Atomics_vi<bits<8> op, string ps> {
580  def _IMM_vi       : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_IMM)>;
581  def _SGPR_vi      : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR)>;
582  def _IMM_RTN_vi   : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_IMM_RTN)>;
583  def _SGPR_RTN_vi  : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR_RTN)>;
584}
585
586defm S_BUFFER_ATOMIC_SWAP         : SM_Real_Atomics_vi <0x40, "S_BUFFER_ATOMIC_SWAP">;
587defm S_BUFFER_ATOMIC_CMPSWAP      : SM_Real_Atomics_vi <0x41, "S_BUFFER_ATOMIC_CMPSWAP">;
588defm S_BUFFER_ATOMIC_ADD          : SM_Real_Atomics_vi <0x42, "S_BUFFER_ATOMIC_ADD">;
589defm S_BUFFER_ATOMIC_SUB          : SM_Real_Atomics_vi <0x43, "S_BUFFER_ATOMIC_SUB">;
590defm S_BUFFER_ATOMIC_SMIN         : SM_Real_Atomics_vi <0x44, "S_BUFFER_ATOMIC_SMIN">;
591defm S_BUFFER_ATOMIC_UMIN         : SM_Real_Atomics_vi <0x45, "S_BUFFER_ATOMIC_UMIN">;
592defm S_BUFFER_ATOMIC_SMAX         : SM_Real_Atomics_vi <0x46, "S_BUFFER_ATOMIC_SMAX">;
593defm S_BUFFER_ATOMIC_UMAX         : SM_Real_Atomics_vi <0x47, "S_BUFFER_ATOMIC_UMAX">;
594defm S_BUFFER_ATOMIC_AND          : SM_Real_Atomics_vi <0x48, "S_BUFFER_ATOMIC_AND">;
595defm S_BUFFER_ATOMIC_OR           : SM_Real_Atomics_vi <0x49, "S_BUFFER_ATOMIC_OR">;
596defm S_BUFFER_ATOMIC_XOR          : SM_Real_Atomics_vi <0x4a, "S_BUFFER_ATOMIC_XOR">;
597defm S_BUFFER_ATOMIC_INC          : SM_Real_Atomics_vi <0x4b, "S_BUFFER_ATOMIC_INC">;
598defm S_BUFFER_ATOMIC_DEC          : SM_Real_Atomics_vi <0x4c, "S_BUFFER_ATOMIC_DEC">;
599
600defm S_BUFFER_ATOMIC_SWAP_X2      : SM_Real_Atomics_vi <0x60, "S_BUFFER_ATOMIC_SWAP_X2">;
601defm S_BUFFER_ATOMIC_CMPSWAP_X2   : SM_Real_Atomics_vi <0x61, "S_BUFFER_ATOMIC_CMPSWAP_X2">;
602defm S_BUFFER_ATOMIC_ADD_X2       : SM_Real_Atomics_vi <0x62, "S_BUFFER_ATOMIC_ADD_X2">;
603defm S_BUFFER_ATOMIC_SUB_X2       : SM_Real_Atomics_vi <0x63, "S_BUFFER_ATOMIC_SUB_X2">;
604defm S_BUFFER_ATOMIC_SMIN_X2      : SM_Real_Atomics_vi <0x64, "S_BUFFER_ATOMIC_SMIN_X2">;
605defm S_BUFFER_ATOMIC_UMIN_X2      : SM_Real_Atomics_vi <0x65, "S_BUFFER_ATOMIC_UMIN_X2">;
606defm S_BUFFER_ATOMIC_SMAX_X2      : SM_Real_Atomics_vi <0x66, "S_BUFFER_ATOMIC_SMAX_X2">;
607defm S_BUFFER_ATOMIC_UMAX_X2      : SM_Real_Atomics_vi <0x67, "S_BUFFER_ATOMIC_UMAX_X2">;
608defm S_BUFFER_ATOMIC_AND_X2       : SM_Real_Atomics_vi <0x68, "S_BUFFER_ATOMIC_AND_X2">;
609defm S_BUFFER_ATOMIC_OR_X2        : SM_Real_Atomics_vi <0x69, "S_BUFFER_ATOMIC_OR_X2">;
610defm S_BUFFER_ATOMIC_XOR_X2       : SM_Real_Atomics_vi <0x6a, "S_BUFFER_ATOMIC_XOR_X2">;
611defm S_BUFFER_ATOMIC_INC_X2       : SM_Real_Atomics_vi <0x6b, "S_BUFFER_ATOMIC_INC_X2">;
612defm S_BUFFER_ATOMIC_DEC_X2       : SM_Real_Atomics_vi <0x6c, "S_BUFFER_ATOMIC_DEC_X2">;
613
614defm S_ATOMIC_SWAP                : SM_Real_Atomics_vi <0x80, "S_ATOMIC_SWAP">;
615defm S_ATOMIC_CMPSWAP             : SM_Real_Atomics_vi <0x81, "S_ATOMIC_CMPSWAP">;
616defm S_ATOMIC_ADD                 : SM_Real_Atomics_vi <0x82, "S_ATOMIC_ADD">;
617defm S_ATOMIC_SUB                 : SM_Real_Atomics_vi <0x83, "S_ATOMIC_SUB">;
618defm S_ATOMIC_SMIN                : SM_Real_Atomics_vi <0x84, "S_ATOMIC_SMIN">;
619defm S_ATOMIC_UMIN                : SM_Real_Atomics_vi <0x85, "S_ATOMIC_UMIN">;
620defm S_ATOMIC_SMAX                : SM_Real_Atomics_vi <0x86, "S_ATOMIC_SMAX">;
621defm S_ATOMIC_UMAX                : SM_Real_Atomics_vi <0x87, "S_ATOMIC_UMAX">;
622defm S_ATOMIC_AND                 : SM_Real_Atomics_vi <0x88, "S_ATOMIC_AND">;
623defm S_ATOMIC_OR                  : SM_Real_Atomics_vi <0x89, "S_ATOMIC_OR">;
624defm S_ATOMIC_XOR                 : SM_Real_Atomics_vi <0x8a, "S_ATOMIC_XOR">;
625defm S_ATOMIC_INC                 : SM_Real_Atomics_vi <0x8b, "S_ATOMIC_INC">;
626defm S_ATOMIC_DEC                 : SM_Real_Atomics_vi <0x8c, "S_ATOMIC_DEC">;
627
628defm S_ATOMIC_SWAP_X2             : SM_Real_Atomics_vi <0xa0, "S_ATOMIC_SWAP_X2">;
629defm S_ATOMIC_CMPSWAP_X2          : SM_Real_Atomics_vi <0xa1, "S_ATOMIC_CMPSWAP_X2">;
630defm S_ATOMIC_ADD_X2              : SM_Real_Atomics_vi <0xa2, "S_ATOMIC_ADD_X2">;
631defm S_ATOMIC_SUB_X2              : SM_Real_Atomics_vi <0xa3, "S_ATOMIC_SUB_X2">;
632defm S_ATOMIC_SMIN_X2             : SM_Real_Atomics_vi <0xa4, "S_ATOMIC_SMIN_X2">;
633defm S_ATOMIC_UMIN_X2             : SM_Real_Atomics_vi <0xa5, "S_ATOMIC_UMIN_X2">;
634defm S_ATOMIC_SMAX_X2             : SM_Real_Atomics_vi <0xa6, "S_ATOMIC_SMAX_X2">;
635defm S_ATOMIC_UMAX_X2             : SM_Real_Atomics_vi <0xa7, "S_ATOMIC_UMAX_X2">;
636defm S_ATOMIC_AND_X2              : SM_Real_Atomics_vi <0xa8, "S_ATOMIC_AND_X2">;
637defm S_ATOMIC_OR_X2               : SM_Real_Atomics_vi <0xa9, "S_ATOMIC_OR_X2">;
638defm S_ATOMIC_XOR_X2              : SM_Real_Atomics_vi <0xaa, "S_ATOMIC_XOR_X2">;
639defm S_ATOMIC_INC_X2              : SM_Real_Atomics_vi <0xab, "S_ATOMIC_INC_X2">;
640defm S_ATOMIC_DEC_X2              : SM_Real_Atomics_vi <0xac, "S_ATOMIC_DEC_X2">;
641
642multiclass SM_Real_Discard_vi<bits<8> op, string ps> {
643  def _IMM_vi  : SMEM_Real_vi <op, !cast<SM_Discard_Pseudo>(ps#_IMM)>;
644  def _SGPR_vi : SMEM_Real_vi <op, !cast<SM_Discard_Pseudo>(ps#_SGPR)>;
645}
646
647defm S_DCACHE_DISCARD    : SM_Real_Discard_vi <0x28, "S_DCACHE_DISCARD">;
648defm S_DCACHE_DISCARD_X2 : SM_Real_Discard_vi <0x29, "S_DCACHE_DISCARD_X2">;
649
650//===----------------------------------------------------------------------===//
651// CI
652//===----------------------------------------------------------------------===//
653
654def smrd_literal_offset : NamedOperandU32<"SMRDLiteralOffset",
655                                          NamedMatchClass<"SMRDLiteralOffset">> {
656  let OperandType = "OPERAND_IMMEDIATE";
657}
658
659class SMRD_Real_Load_IMM_ci <bits<5> op, SM_Load_Pseudo ps> :
660  SM_Real<ps>,
661  Enc64 {
662
663  let AssemblerPredicates = [isGFX7Only];
664  let DecoderNamespace = "GFX7";
665  let InOperandList = (ins ps.BaseClass:$sbase, smrd_literal_offset:$offset, GLC:$glc, DLC:$dlc);
666
667  let LGKM_CNT = ps.LGKM_CNT;
668  let SMRD = ps.SMRD;
669  let mayLoad = ps.mayLoad;
670  let mayStore = ps.mayStore;
671  let hasSideEffects = ps.hasSideEffects;
672  let SchedRW = ps.SchedRW;
673  let UseNamedOperandTable = ps.UseNamedOperandTable;
674
675  let Inst{7-0}   = 0xff;
676  let Inst{8}     = 0;
677  let Inst{14-9}  = sbase{6-1};
678  let Inst{21-15} = sdst{6-0};
679  let Inst{26-22} = op;
680  let Inst{31-27} = 0x18; //encoding
681  let Inst{63-32} = offset{31-0};
682}
683
684def S_LOAD_DWORD_IMM_ci           : SMRD_Real_Load_IMM_ci <0x00, S_LOAD_DWORD_IMM>;
685def S_LOAD_DWORDX2_IMM_ci         : SMRD_Real_Load_IMM_ci <0x01, S_LOAD_DWORDX2_IMM>;
686def S_LOAD_DWORDX4_IMM_ci         : SMRD_Real_Load_IMM_ci <0x02, S_LOAD_DWORDX4_IMM>;
687def S_LOAD_DWORDX8_IMM_ci         : SMRD_Real_Load_IMM_ci <0x03, S_LOAD_DWORDX8_IMM>;
688def S_LOAD_DWORDX16_IMM_ci        : SMRD_Real_Load_IMM_ci <0x04, S_LOAD_DWORDX16_IMM>;
689def S_BUFFER_LOAD_DWORD_IMM_ci    : SMRD_Real_Load_IMM_ci <0x08, S_BUFFER_LOAD_DWORD_IMM>;
690def S_BUFFER_LOAD_DWORDX2_IMM_ci  : SMRD_Real_Load_IMM_ci <0x09, S_BUFFER_LOAD_DWORDX2_IMM>;
691def S_BUFFER_LOAD_DWORDX4_IMM_ci  : SMRD_Real_Load_IMM_ci <0x0a, S_BUFFER_LOAD_DWORDX4_IMM>;
692def S_BUFFER_LOAD_DWORDX8_IMM_ci  : SMRD_Real_Load_IMM_ci <0x0b, S_BUFFER_LOAD_DWORDX8_IMM>;
693def S_BUFFER_LOAD_DWORDX16_IMM_ci : SMRD_Real_Load_IMM_ci <0x0c, S_BUFFER_LOAD_DWORDX16_IMM>;
694
695class SMRD_Real_ci <bits<5> op, SM_Pseudo ps>
696  : SM_Real<ps>
697  , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
698  , Enc32 {
699
700  let AssemblerPredicates = [isGFX7Only];
701  let DecoderNamespace = "GFX7";
702
703  let Inst{7-0}   = !if(ps.has_offset, offset{7-0}, ?);
704  let Inst{8}     = imm;
705  let Inst{14-9}  = !if(ps.has_sbase, sbase{6-1}, ?);
706  let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
707  let Inst{26-22} = op;
708  let Inst{31-27} = 0x18; //encoding
709}
710
711def S_DCACHE_INV_VOL_ci : SMRD_Real_ci <0x1d, S_DCACHE_INV_VOL>;
712
713//===----------------------------------------------------------------------===//
714// Scalar Memory Patterns
715//===----------------------------------------------------------------------===//
716
717def smrd_load : PatFrag <(ops node:$ptr), (load node:$ptr), [{ return isUniformLoad(N);}]> {
718  let GISelPredicateCode = [{
719    if (!MI.hasOneMemOperand())
720      return false;
721    if (!isInstrUniform(MI))
722      return false;
723
724    // FIXME: We should probably be caching this.
725    SmallVector<GEPInfo, 4> AddrInfo;
726    getAddrModeInfo(MI, MRI, AddrInfo);
727
728    if (hasVgprParts(AddrInfo))
729      return false;
730    return true;
731  }];
732}
733
734def SMRDImm         : ComplexPattern<i64, 2, "SelectSMRDImm">;
735def SMRDImm32       : ComplexPattern<i64, 2, "SelectSMRDImm32">;
736def SMRDSgpr        : ComplexPattern<i64, 2, "SelectSMRDSgpr">;
737def SMRDBufferImm   : ComplexPattern<i32, 1, "SelectSMRDBufferImm">;
738def SMRDBufferImm32 : ComplexPattern<i32, 1, "SelectSMRDBufferImm32">;
739
740multiclass SMRD_Pattern <string Instr, ValueType vt> {
741
742  // 1. IMM offset
743  def : GCNPat <
744    (smrd_load (SMRDImm i64:$sbase, i32:$offset)),
745    (vt (!cast<SM_Pseudo>(Instr#"_IMM") $sbase, $offset, 0, 0))
746  >;
747
748  // 2. 32-bit IMM offset on CI
749  def : GCNPat <
750    (smrd_load (SMRDImm32 i64:$sbase, i32:$offset)),
751    (vt (!cast<InstSI>(Instr#"_IMM_ci") $sbase, $offset, 0, 0))> {
752    let OtherPredicates = [isGFX7Only];
753  }
754
755  // 3. SGPR offset
756  def : GCNPat <
757    (smrd_load (SMRDSgpr i64:$sbase, i32:$offset)),
758    (vt (!cast<SM_Pseudo>(Instr#"_SGPR") $sbase, $offset, 0, 0))
759  >;
760
761  // 4. No offset
762  def : GCNPat <
763    (vt (smrd_load (i64 SReg_64:$sbase))),
764    (vt (!cast<SM_Pseudo>(Instr#"_IMM") i64:$sbase, 0, 0, 0))
765  >;
766}
767
768multiclass SMLoad_Pattern <string Instr, ValueType vt> {
769  // 1. Offset as an immediate
770  def : GCNPat <
771    (SIsbuffer_load v4i32:$sbase, (SMRDBufferImm i32:$offset), i1:$glc, i1:$dlc),
772    (vt (!cast<SM_Pseudo>(Instr#"_IMM") $sbase, $offset, (as_i1imm $glc),
773                                        (as_i1imm $dlc)))
774  >;
775
776  // 2. 32-bit IMM offset on CI
777  def : GCNPat <
778    (vt (SIsbuffer_load v4i32:$sbase, (SMRDBufferImm32 i32:$offset), i1:$glc, i1:$dlc)),
779    (!cast<InstSI>(Instr#"_IMM_ci") $sbase, $offset, (as_i1imm $glc), (as_i1imm $dlc))> {
780    let OtherPredicates = [isGFX7Only];
781  }
782
783  // 3. Offset loaded in an 32bit SGPR
784  def : GCNPat <
785    (SIsbuffer_load v4i32:$sbase, i32:$offset, i1:$glc, i1:$dlc),
786    (vt (!cast<SM_Pseudo>(Instr#"_SGPR") $sbase, $offset, (as_i1imm $glc),
787                                         (as_i1imm $dlc)))
788  >;
789}
790
791// Global and constant loads can be selected to either MUBUF or SMRD
792// instructions, but SMRD instructions are faster so we want the instruction
793// selector to prefer those.
794let AddedComplexity = 100 in {
795
796defm : SMRD_Pattern <"S_LOAD_DWORD",    i32>;
797defm : SMRD_Pattern <"S_LOAD_DWORDX2",  v2i32>;
798defm : SMRD_Pattern <"S_LOAD_DWORDX4",  v4i32>;
799defm : SMRD_Pattern <"S_LOAD_DWORDX8",  v8i32>;
800defm : SMRD_Pattern <"S_LOAD_DWORDX16", v16i32>;
801
802defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORD",     i32>;
803defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX2",   v2i32>;
804defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX4",   v4i32>;
805defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX8",   v8i32>;
806defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX16",  v16i32>;
807
808defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORD",     f32>;
809defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX2",   v2f32>;
810defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX4",   v4f32>;
811defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX8",   v8f32>;
812defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX16",  v16f32>;
813} // End let AddedComplexity = 100
814
815def : GCNPat <
816  (i64 (readcyclecounter)),
817  (S_MEMTIME)
818>;
819
820//===----------------------------------------------------------------------===//
821// GFX10.
822//===----------------------------------------------------------------------===//
823
824class SMEM_Real_gfx10<bits<8> op, SM_Pseudo ps> :
825    SM_Real<ps>, SIMCInstr<ps.PseudoInstr, SIEncodingFamily.GFX10>, Enc64 {
826  bit glc;
827  bit dlc;
828
829  let AssemblerPredicates = [isGFX10Plus];
830  let DecoderNamespace = "GFX10";
831
832  let Inst{5-0}   = !if(ps.has_sbase, sbase{6-1}, ?);
833  let Inst{12-6}  = !if(ps.has_sdst, sdst{6-0}, ?);
834  let Inst{14}    = !if(ps.has_dlc, dlc, ?);
835  let Inst{16}    = !if(ps.has_glc, glc, ?);
836  let Inst{25-18} = op;
837  let Inst{31-26} = 0x3d;
838  let Inst{51-32} = !if(ps.offset_is_imm, !if(ps.has_offset, offset{19-0}, ?), ?);
839  let Inst{63-57} = !if(ps.offset_is_imm, !cast<int>(SGPR_NULL.HWEncoding),
840                                          !if(ps.has_offset, offset{6-0}, ?));
841}
842
843multiclass SM_Real_Loads_gfx10<bits<8> op, string ps,
844                               SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
845                               SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
846  def _IMM_gfx10 : SMEM_Real_gfx10<op, immPs> {
847    let InOperandList = (ins immPs.BaseClass:$sbase, smrd_offset_20:$offset, GLC:$glc, DLC:$dlc);
848  }
849  def _SGPR_gfx10 : SMEM_Real_gfx10<op, sgprPs> {
850    let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc, DLC:$dlc);
851  }
852}
853
854class SMEM_Real_Store_gfx10<bits<8> op, SM_Pseudo ps> : SMEM_Real_gfx10<op, ps> {
855  bits<7> sdata;
856
857  let sdst = ?;
858  let Inst{12-6} = !if(ps.has_sdst, sdata{6-0}, ?);
859}
860
861multiclass SM_Real_Stores_gfx10<bits<8> op, string ps,
862                                SM_Store_Pseudo immPs = !cast<SM_Store_Pseudo>(ps#_IMM),
863                                SM_Store_Pseudo sgprPs = !cast<SM_Store_Pseudo>(ps#_SGPR)> {
864  // FIXME: The operand name $offset is inconsistent with $soff used
865  // in the pseudo
866  def _IMM_gfx10 : SMEM_Real_Store_gfx10 <op, immPs> {
867    let InOperandList = (ins immPs.SrcClass:$sdata, immPs.BaseClass:$sbase, smrd_offset_20:$offset, GLC:$glc, DLC:$dlc);
868  }
869
870  def _SGPR_gfx10 : SMEM_Real_Store_gfx10 <op, sgprPs> {
871    let InOperandList = (ins sgprPs.SrcClass:$sdata, sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc, DLC:$dlc);
872  }
873}
874
875defm S_LOAD_DWORD            : SM_Real_Loads_gfx10<0x000, "S_LOAD_DWORD">;
876defm S_LOAD_DWORDX2          : SM_Real_Loads_gfx10<0x001, "S_LOAD_DWORDX2">;
877defm S_LOAD_DWORDX4          : SM_Real_Loads_gfx10<0x002, "S_LOAD_DWORDX4">;
878defm S_LOAD_DWORDX8          : SM_Real_Loads_gfx10<0x003, "S_LOAD_DWORDX8">;
879defm S_LOAD_DWORDX16         : SM_Real_Loads_gfx10<0x004, "S_LOAD_DWORDX16">;
880
881let SubtargetPredicate = HasScalarFlatScratchInsts in {
882defm S_SCRATCH_LOAD_DWORD    : SM_Real_Loads_gfx10<0x005, "S_SCRATCH_LOAD_DWORD">;
883defm S_SCRATCH_LOAD_DWORDX2  : SM_Real_Loads_gfx10<0x006, "S_SCRATCH_LOAD_DWORDX2">;
884defm S_SCRATCH_LOAD_DWORDX4  : SM_Real_Loads_gfx10<0x007, "S_SCRATCH_LOAD_DWORDX4">;
885} // End SubtargetPredicate = HasScalarFlatScratchInsts
886
887defm S_BUFFER_LOAD_DWORD     : SM_Real_Loads_gfx10<0x008, "S_BUFFER_LOAD_DWORD">;
888defm S_BUFFER_LOAD_DWORDX2   : SM_Real_Loads_gfx10<0x009, "S_BUFFER_LOAD_DWORDX2">;
889defm S_BUFFER_LOAD_DWORDX4   : SM_Real_Loads_gfx10<0x00a, "S_BUFFER_LOAD_DWORDX4">;
890defm S_BUFFER_LOAD_DWORDX8   : SM_Real_Loads_gfx10<0x00b, "S_BUFFER_LOAD_DWORDX8">;
891defm S_BUFFER_LOAD_DWORDX16  : SM_Real_Loads_gfx10<0x00c, "S_BUFFER_LOAD_DWORDX16">;
892
893let SubtargetPredicate = HasScalarStores in {
894defm S_STORE_DWORD           : SM_Real_Stores_gfx10<0x010, "S_STORE_DWORD">;
895defm S_STORE_DWORDX2         : SM_Real_Stores_gfx10<0x011, "S_STORE_DWORDX2">;
896defm S_STORE_DWORDX4         : SM_Real_Stores_gfx10<0x012, "S_STORE_DWORDX4">;
897let OtherPredicates = [HasScalarFlatScratchInsts] in {
898defm S_SCRATCH_STORE_DWORD   : SM_Real_Stores_gfx10<0x015, "S_SCRATCH_STORE_DWORD">;
899defm S_SCRATCH_STORE_DWORDX2 : SM_Real_Stores_gfx10<0x016, "S_SCRATCH_STORE_DWORDX2">;
900defm S_SCRATCH_STORE_DWORDX4 : SM_Real_Stores_gfx10<0x017, "S_SCRATCH_STORE_DWORDX4">;
901} // End OtherPredicates = [HasScalarFlatScratchInsts]
902defm S_BUFFER_STORE_DWORD    : SM_Real_Stores_gfx10<0x018, "S_BUFFER_STORE_DWORD">;
903defm S_BUFFER_STORE_DWORDX2  : SM_Real_Stores_gfx10<0x019, "S_BUFFER_STORE_DWORDX2">;
904defm S_BUFFER_STORE_DWORDX4  : SM_Real_Stores_gfx10<0x01a, "S_BUFFER_STORE_DWORDX4">;
905} // End SubtargetPredicate = HasScalarStores
906
907def S_MEMREALTIME_gfx10              : SMEM_Real_gfx10<0x025, S_MEMREALTIME>;
908def S_MEMTIME_gfx10                  : SMEM_Real_gfx10<0x024, S_MEMTIME>;
909def S_GL1_INV_gfx10                  : SMEM_Real_gfx10<0x01f, S_GL1_INV>;
910def S_GET_WAVEID_IN_WORKGROUP_gfx10  : SMEM_Real_gfx10<0x02a, S_GET_WAVEID_IN_WORKGROUP>;
911def S_DCACHE_INV_gfx10               : SMEM_Real_gfx10<0x020, S_DCACHE_INV>;
912
913let SubtargetPredicate = HasScalarStores in {
914def S_DCACHE_WB_gfx10                : SMEM_Real_gfx10<0x021, S_DCACHE_WB>;
915} // End SubtargetPredicate = HasScalarStores
916
917multiclass SM_Real_Probe_gfx10<bits<8> op, string ps> {
918  def _IMM_gfx10  : SMEM_Real_Store_gfx10 <op, !cast<SM_Pseudo>(ps#_IMM)>;
919  def _SGPR_gfx10 : SMEM_Real_Store_gfx10 <op, !cast<SM_Pseudo>(ps#_SGPR)>;
920}
921
922defm S_ATC_PROBE        : SM_Real_Probe_gfx10 <0x26, "S_ATC_PROBE">;
923defm S_ATC_PROBE_BUFFER : SM_Real_Probe_gfx10 <0x27, "S_ATC_PROBE_BUFFER">;
924
925class SMEM_Atomic_Real_gfx10 <bits<8> op, SM_Atomic_Pseudo ps>
926  : SMEM_Real_gfx10 <op, ps> {
927
928  bits<7> sdata;
929  bit dlc;
930
931  let Constraints = ps.Constraints;
932  let DisableEncoding = ps.DisableEncoding;
933
934  let glc = ps.glc;
935
936  let Inst{14} = !if(ps.has_dlc, dlc, 0);
937  let Inst{12-6} = !if(glc, sdst{6-0}, sdata{6-0});
938}
939
940multiclass SM_Real_Atomics_gfx10<bits<8> op, string ps> {
941  def _IMM_gfx10       : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_IMM)>;
942  def _SGPR_gfx10      : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR)>;
943  def _IMM_RTN_gfx10   : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_IMM_RTN)>;
944  def _SGPR_RTN_gfx10  : SMEM_Atomic_Real_gfx10 <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR_RTN)>;
945}
946
947let SubtargetPredicate = HasScalarAtomics in {
948
949defm S_BUFFER_ATOMIC_SWAP         : SM_Real_Atomics_gfx10 <0x40, "S_BUFFER_ATOMIC_SWAP">;
950defm S_BUFFER_ATOMIC_CMPSWAP      : SM_Real_Atomics_gfx10 <0x41, "S_BUFFER_ATOMIC_CMPSWAP">;
951defm S_BUFFER_ATOMIC_ADD          : SM_Real_Atomics_gfx10 <0x42, "S_BUFFER_ATOMIC_ADD">;
952defm S_BUFFER_ATOMIC_SUB          : SM_Real_Atomics_gfx10 <0x43, "S_BUFFER_ATOMIC_SUB">;
953defm S_BUFFER_ATOMIC_SMIN         : SM_Real_Atomics_gfx10 <0x44, "S_BUFFER_ATOMIC_SMIN">;
954defm S_BUFFER_ATOMIC_UMIN         : SM_Real_Atomics_gfx10 <0x45, "S_BUFFER_ATOMIC_UMIN">;
955defm S_BUFFER_ATOMIC_SMAX         : SM_Real_Atomics_gfx10 <0x46, "S_BUFFER_ATOMIC_SMAX">;
956defm S_BUFFER_ATOMIC_UMAX         : SM_Real_Atomics_gfx10 <0x47, "S_BUFFER_ATOMIC_UMAX">;
957defm S_BUFFER_ATOMIC_AND          : SM_Real_Atomics_gfx10 <0x48, "S_BUFFER_ATOMIC_AND">;
958defm S_BUFFER_ATOMIC_OR           : SM_Real_Atomics_gfx10 <0x49, "S_BUFFER_ATOMIC_OR">;
959defm S_BUFFER_ATOMIC_XOR          : SM_Real_Atomics_gfx10 <0x4a, "S_BUFFER_ATOMIC_XOR">;
960defm S_BUFFER_ATOMIC_INC          : SM_Real_Atomics_gfx10 <0x4b, "S_BUFFER_ATOMIC_INC">;
961defm S_BUFFER_ATOMIC_DEC          : SM_Real_Atomics_gfx10 <0x4c, "S_BUFFER_ATOMIC_DEC">;
962
963defm S_BUFFER_ATOMIC_SWAP_X2      : SM_Real_Atomics_gfx10 <0x60, "S_BUFFER_ATOMIC_SWAP_X2">;
964defm S_BUFFER_ATOMIC_CMPSWAP_X2   : SM_Real_Atomics_gfx10 <0x61, "S_BUFFER_ATOMIC_CMPSWAP_X2">;
965defm S_BUFFER_ATOMIC_ADD_X2       : SM_Real_Atomics_gfx10 <0x62, "S_BUFFER_ATOMIC_ADD_X2">;
966defm S_BUFFER_ATOMIC_SUB_X2       : SM_Real_Atomics_gfx10 <0x63, "S_BUFFER_ATOMIC_SUB_X2">;
967defm S_BUFFER_ATOMIC_SMIN_X2      : SM_Real_Atomics_gfx10 <0x64, "S_BUFFER_ATOMIC_SMIN_X2">;
968defm S_BUFFER_ATOMIC_UMIN_X2      : SM_Real_Atomics_gfx10 <0x65, "S_BUFFER_ATOMIC_UMIN_X2">;
969defm S_BUFFER_ATOMIC_SMAX_X2      : SM_Real_Atomics_gfx10 <0x66, "S_BUFFER_ATOMIC_SMAX_X2">;
970defm S_BUFFER_ATOMIC_UMAX_X2      : SM_Real_Atomics_gfx10 <0x67, "S_BUFFER_ATOMIC_UMAX_X2">;
971defm S_BUFFER_ATOMIC_AND_X2       : SM_Real_Atomics_gfx10 <0x68, "S_BUFFER_ATOMIC_AND_X2">;
972defm S_BUFFER_ATOMIC_OR_X2        : SM_Real_Atomics_gfx10 <0x69, "S_BUFFER_ATOMIC_OR_X2">;
973defm S_BUFFER_ATOMIC_XOR_X2       : SM_Real_Atomics_gfx10 <0x6a, "S_BUFFER_ATOMIC_XOR_X2">;
974defm S_BUFFER_ATOMIC_INC_X2       : SM_Real_Atomics_gfx10 <0x6b, "S_BUFFER_ATOMIC_INC_X2">;
975defm S_BUFFER_ATOMIC_DEC_X2       : SM_Real_Atomics_gfx10 <0x6c, "S_BUFFER_ATOMIC_DEC_X2">;
976
977defm S_ATOMIC_SWAP                : SM_Real_Atomics_gfx10 <0x80, "S_ATOMIC_SWAP">;
978defm S_ATOMIC_CMPSWAP             : SM_Real_Atomics_gfx10 <0x81, "S_ATOMIC_CMPSWAP">;
979defm S_ATOMIC_ADD                 : SM_Real_Atomics_gfx10 <0x82, "S_ATOMIC_ADD">;
980defm S_ATOMIC_SUB                 : SM_Real_Atomics_gfx10 <0x83, "S_ATOMIC_SUB">;
981defm S_ATOMIC_SMIN                : SM_Real_Atomics_gfx10 <0x84, "S_ATOMIC_SMIN">;
982defm S_ATOMIC_UMIN                : SM_Real_Atomics_gfx10 <0x85, "S_ATOMIC_UMIN">;
983defm S_ATOMIC_SMAX                : SM_Real_Atomics_gfx10 <0x86, "S_ATOMIC_SMAX">;
984defm S_ATOMIC_UMAX                : SM_Real_Atomics_gfx10 <0x87, "S_ATOMIC_UMAX">;
985defm S_ATOMIC_AND                 : SM_Real_Atomics_gfx10 <0x88, "S_ATOMIC_AND">;
986defm S_ATOMIC_OR                  : SM_Real_Atomics_gfx10 <0x89, "S_ATOMIC_OR">;
987defm S_ATOMIC_XOR                 : SM_Real_Atomics_gfx10 <0x8a, "S_ATOMIC_XOR">;
988defm S_ATOMIC_INC                 : SM_Real_Atomics_gfx10 <0x8b, "S_ATOMIC_INC">;
989defm S_ATOMIC_DEC                 : SM_Real_Atomics_gfx10 <0x8c, "S_ATOMIC_DEC">;
990
991defm S_ATOMIC_SWAP_X2             : SM_Real_Atomics_gfx10 <0xa0, "S_ATOMIC_SWAP_X2">;
992defm S_ATOMIC_CMPSWAP_X2          : SM_Real_Atomics_gfx10 <0xa1, "S_ATOMIC_CMPSWAP_X2">;
993defm S_ATOMIC_ADD_X2              : SM_Real_Atomics_gfx10 <0xa2, "S_ATOMIC_ADD_X2">;
994defm S_ATOMIC_SUB_X2              : SM_Real_Atomics_gfx10 <0xa3, "S_ATOMIC_SUB_X2">;
995defm S_ATOMIC_SMIN_X2             : SM_Real_Atomics_gfx10 <0xa4, "S_ATOMIC_SMIN_X2">;
996defm S_ATOMIC_UMIN_X2             : SM_Real_Atomics_gfx10 <0xa5, "S_ATOMIC_UMIN_X2">;
997defm S_ATOMIC_SMAX_X2             : SM_Real_Atomics_gfx10 <0xa6, "S_ATOMIC_SMAX_X2">;
998defm S_ATOMIC_UMAX_X2             : SM_Real_Atomics_gfx10 <0xa7, "S_ATOMIC_UMAX_X2">;
999defm S_ATOMIC_AND_X2              : SM_Real_Atomics_gfx10 <0xa8, "S_ATOMIC_AND_X2">;
1000defm S_ATOMIC_OR_X2               : SM_Real_Atomics_gfx10 <0xa9, "S_ATOMIC_OR_X2">;
1001defm S_ATOMIC_XOR_X2              : SM_Real_Atomics_gfx10 <0xaa, "S_ATOMIC_XOR_X2">;
1002defm S_ATOMIC_INC_X2              : SM_Real_Atomics_gfx10 <0xab, "S_ATOMIC_INC_X2">;
1003defm S_ATOMIC_DEC_X2              : SM_Real_Atomics_gfx10 <0xac, "S_ATOMIC_DEC_X2">;
1004
1005multiclass SM_Real_Discard_gfx10<bits<8> op, string ps> {
1006  def _IMM_gfx10  : SMEM_Real_gfx10 <op, !cast<SM_Pseudo>(ps#_IMM)>;
1007  def _SGPR_gfx10 : SMEM_Real_gfx10 <op, !cast<SM_Pseudo>(ps#_SGPR)>;
1008}
1009
1010defm S_DCACHE_DISCARD    : SM_Real_Discard_gfx10 <0x28, "S_DCACHE_DISCARD">;
1011defm S_DCACHE_DISCARD_X2 : SM_Real_Discard_gfx10 <0x29, "S_DCACHE_DISCARD_X2">;
1012
1013} // End SubtargetPredicate = HasScalarAtomics
1014