blob: f58eb21152dd866b2cca4db0e3a9d1e71efc85d4 [file] [log] [blame]
Valery Pykhtin1b138862016-09-01 09:56:47 +00001//===---- SMInstructions.td - Scalar Memory Instruction Defintions --------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
Artem Tamazov54bfd542016-10-31 16:07:39 +000010def smrd_offset_8 : NamedOperandU32<"SMRDOffset8",
11 NamedMatchClass<"SMRDOffset8">> {
Valery Pykhtin1b138862016-09-01 09:56:47 +000012 let OperandType = "OPERAND_IMMEDIATE";
13}
14
Artem Tamazov54bfd542016-10-31 16:07:39 +000015def smrd_offset_20 : NamedOperandU32<"SMRDOffset20",
16 NamedMatchClass<"SMRDOffset20">> {
17 let OperandType = "OPERAND_IMMEDIATE";
18}
Valery Pykhtin1b138862016-09-01 09:56:47 +000019
20//===----------------------------------------------------------------------===//
21// Scalar Memory classes
22//===----------------------------------------------------------------------===//
23
24class SM_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]> :
25 InstSI <outs, ins, "", pattern>,
26 SIMCInstr<opName, SIEncodingFamily.NONE> {
27 let isPseudo = 1;
28 let isCodeGenOnly = 1;
29
30 let LGKM_CNT = 1;
31 let SMRD = 1;
32 let mayStore = 0;
33 let mayLoad = 1;
34 let hasSideEffects = 0;
35 let UseNamedOperandTable = 1;
36 let SchedRW = [WriteSMEM];
37 let SubtargetPredicate = isGCN;
38
39 string Mnemonic = opName;
40 string AsmOperands = asmOps;
41
42 bits<1> has_sbase = 1;
43 bits<1> has_sdst = 1;
Matt Arsenault7b647552016-10-28 21:55:15 +000044 bit has_glc = 0;
Valery Pykhtin1b138862016-09-01 09:56:47 +000045 bits<1> has_offset = 1;
46 bits<1> offset_is_imm = 0;
47}
48
49class SM_Real <SM_Pseudo ps>
50 : InstSI<ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []> {
51
52 let isPseudo = 0;
53 let isCodeGenOnly = 0;
54
55 // copy relevant pseudo op flags
56 let SubtargetPredicate = ps.SubtargetPredicate;
57 let AsmMatchConverter = ps.AsmMatchConverter;
58
59 // encoding
60 bits<7> sbase;
61 bits<7> sdst;
62 bits<32> offset;
Matt Arsenault7b647552016-10-28 21:55:15 +000063 bits<1> imm = !if(ps.has_offset, ps.offset_is_imm, 0);
Valery Pykhtin1b138862016-09-01 09:56:47 +000064}
65
66class SM_Load_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]>
67 : SM_Pseudo<opName, outs, ins, asmOps, pattern> {
68 RegisterClass BaseClass;
Matt Arsenault7b647552016-10-28 21:55:15 +000069 let mayLoad = 1;
70 let mayStore = 0;
71 let has_glc = 1;
72}
73
74class SM_Store_Pseudo <string opName, dag ins, string asmOps, list<dag> pattern = []>
75 : SM_Pseudo<opName, (outs), ins, asmOps, pattern> {
76 RegisterClass BaseClass;
77 RegisterClass SrcClass;
78 let mayLoad = 0;
79 let mayStore = 1;
80 let has_glc = 1;
81 let ScalarStore = 1;
Valery Pykhtin1b138862016-09-01 09:56:47 +000082}
83
Dmitry Preobrazhensky4732d872018-04-06 15:08:42 +000084class SM_Discard_Pseudo <string opName, dag ins, bit isImm>
85 : SM_Pseudo<opName, (outs), ins, " $sbase, $offset"> {
86 let mayLoad = 0;
87 let mayStore = 0;
88 let has_glc = 0;
89 let has_sdst = 0;
90 let ScalarStore = 0;
91 let hasSideEffects = 1;
92 let offset_is_imm = isImm;
93 let PseudoInstr = opName # !if(isImm, "_IMM", "_SGPR");
94}
95
Valery Pykhtin1b138862016-09-01 09:56:47 +000096multiclass SM_Pseudo_Loads<string opName,
97 RegisterClass baseClass,
98 RegisterClass dstClass> {
99 def _IMM : SM_Load_Pseudo <opName,
100 (outs dstClass:$sdst),
Matt Arsenault7b647552016-10-28 21:55:15 +0000101 (ins baseClass:$sbase, i32imm:$offset, i1imm:$glc),
102 " $sdst, $sbase, $offset$glc", []> {
Valery Pykhtin1b138862016-09-01 09:56:47 +0000103 let offset_is_imm = 1;
104 let BaseClass = baseClass;
105 let PseudoInstr = opName # "_IMM";
Matt Arsenault7b647552016-10-28 21:55:15 +0000106 let has_glc = 1;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000107 }
Matt Arsenault7b647552016-10-28 21:55:15 +0000108
Valery Pykhtin1b138862016-09-01 09:56:47 +0000109 def _SGPR : SM_Load_Pseudo <opName,
110 (outs dstClass:$sdst),
Matt Arsenault7b647552016-10-28 21:55:15 +0000111 (ins baseClass:$sbase, SReg_32:$soff, i1imm:$glc),
112 " $sdst, $sbase, $offset$glc", []> {
Valery Pykhtin1b138862016-09-01 09:56:47 +0000113 let BaseClass = baseClass;
114 let PseudoInstr = opName # "_SGPR";
Matt Arsenault7b647552016-10-28 21:55:15 +0000115 let has_glc = 1;
116 }
117}
118
119multiclass SM_Pseudo_Stores<string opName,
120 RegisterClass baseClass,
121 RegisterClass srcClass> {
122 def _IMM : SM_Store_Pseudo <opName,
123 (ins srcClass:$sdata, baseClass:$sbase, i32imm:$offset, i1imm:$glc),
124 " $sdata, $sbase, $offset$glc", []> {
125 let offset_is_imm = 1;
126 let BaseClass = baseClass;
127 let SrcClass = srcClass;
128 let PseudoInstr = opName # "_IMM";
129 }
130
131 def _SGPR : SM_Store_Pseudo <opName,
132 (ins srcClass:$sdata, baseClass:$sbase, SReg_32:$soff, i1imm:$glc),
133 " $sdata, $sbase, $offset$glc", []> {
134 let BaseClass = baseClass;
135 let SrcClass = srcClass;
136 let PseudoInstr = opName # "_SGPR";
Valery Pykhtin1b138862016-09-01 09:56:47 +0000137 }
138}
139
Dmitry Preobrazhensky4732d872018-04-06 15:08:42 +0000140multiclass SM_Pseudo_Discards<string opName> {
141 def _IMM : SM_Discard_Pseudo <opName, (ins SReg_64:$sbase, smrd_offset_20:$offset), 1>;
142 def _SGPR : SM_Discard_Pseudo <opName, (ins SReg_64:$sbase, SReg_32:$offset), 0>;
143}
144
Valery Pykhtin1b138862016-09-01 09:56:47 +0000145class SM_Time_Pseudo<string opName, SDPatternOperator node> : SM_Pseudo<
Matt Arsenault640c44b2016-11-29 19:39:53 +0000146 opName, (outs SReg_64_XEXEC:$sdst), (ins),
Valery Pykhtin1b138862016-09-01 09:56:47 +0000147 " $sdst", [(set i64:$sdst, (node))]> {
148 let hasSideEffects = 1;
Matt Arsenault73ce93b2017-12-08 20:01:02 +0000149 let mayStore = 0;
150 let mayLoad = 1;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000151 let has_sbase = 0;
152 let has_offset = 0;
153}
154
155class SM_Inval_Pseudo <string opName, SDPatternOperator node> : SM_Pseudo<
156 opName, (outs), (ins), "", [(node)]> {
157 let hasSideEffects = 1;
158 let mayStore = 1;
159 let has_sdst = 0;
160 let has_sbase = 0;
161 let has_offset = 0;
162}
163
Dmitry Preobrazhensky6bad04e2018-04-02 16:10:25 +0000164//===----------------------------------------------------------------------===//
165// Scalar Atomic Memory Classes
166//===----------------------------------------------------------------------===//
167
168class SM_Atomic_Pseudo <string opName,
169 dag outs, dag ins, string asmOps, bit isRet>
170 : SM_Pseudo<opName, outs, ins, asmOps, []> {
171
172 bit glc = isRet;
173
174 let mayLoad = 1;
175 let mayStore = 1;
176 let has_glc = 1;
177
178 // Should these be set?
179 let ScalarStore = 1;
180 let hasSideEffects = 1;
181 let maybeAtomic = 1;
182}
183
184class SM_Pseudo_Atomic<string opName,
185 RegisterClass baseClass,
186 RegisterClass dataClass,
187 bit isImm,
188 bit isRet> :
189 SM_Atomic_Pseudo<opName,
190 !if(isRet, (outs dataClass:$sdst), (outs)),
191 !if(isImm,
192 (ins dataClass:$sdata, baseClass:$sbase, smrd_offset_20:$offset),
193 (ins dataClass:$sdata, baseClass:$sbase, SReg_32:$offset)),
194 !if(isRet, " $sdst", " $sdata") # ", $sbase, $offset" # !if(isRet, " glc", ""),
195 isRet> {
196 let offset_is_imm = isImm;
197 let PseudoInstr = opName # !if(isImm,
198 !if(isRet, "_IMM_RTN", "_IMM"),
199 !if(isRet, "_SGPR_RTN", "_SGPR"));
200
201 let Constraints = !if(isRet, "$sdst = $sdata", "");
202 let DisableEncoding = !if(isRet, "$sdata", "");
203}
204
205multiclass SM_Pseudo_Atomics<string opName,
206 RegisterClass baseClass,
207 RegisterClass dataClass> {
208 def _IMM : SM_Pseudo_Atomic <opName, baseClass, dataClass, 1, 0>;
209 def _SGPR : SM_Pseudo_Atomic <opName, baseClass, dataClass, 0, 0>;
210 def _IMM_RTN : SM_Pseudo_Atomic <opName, baseClass, dataClass, 1, 1>;
211 def _SGPR_RTN : SM_Pseudo_Atomic <opName, baseClass, dataClass, 0, 1>;
212}
Valery Pykhtin1b138862016-09-01 09:56:47 +0000213
214//===----------------------------------------------------------------------===//
215// Scalar Memory Instructions
216//===----------------------------------------------------------------------===//
217
218// We are using the SReg_32_XM0 and not the SReg_32 register class for 32-bit
219// SMRD instructions, because the SReg_32_XM0 register class does not include M0
220// and writing to M0 from an SMRD instruction will hang the GPU.
Matt Arsenault640c44b2016-11-29 19:39:53 +0000221
222// XXX - SMEM instructions do not allow exec for data operand, but
223// does sdst for SMRD on SI/CI?
224defm S_LOAD_DWORD : SM_Pseudo_Loads <"s_load_dword", SReg_64, SReg_32_XM0_XEXEC>;
225defm S_LOAD_DWORDX2 : SM_Pseudo_Loads <"s_load_dwordx2", SReg_64, SReg_64_XEXEC>;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000226defm S_LOAD_DWORDX4 : SM_Pseudo_Loads <"s_load_dwordx4", SReg_64, SReg_128>;
227defm S_LOAD_DWORDX8 : SM_Pseudo_Loads <"s_load_dwordx8", SReg_64, SReg_256>;
228defm S_LOAD_DWORDX16 : SM_Pseudo_Loads <"s_load_dwordx16", SReg_64, SReg_512>;
229
230defm S_BUFFER_LOAD_DWORD : SM_Pseudo_Loads <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000231 "s_buffer_load_dword", SReg_128, SReg_32_XM0_XEXEC
Valery Pykhtin1b138862016-09-01 09:56:47 +0000232>;
233
Matt Arsenault640c44b2016-11-29 19:39:53 +0000234// FIXME: exec_lo/exec_hi appear to be allowed for SMRD loads on
235// SI/CI, bit disallowed for SMEM on VI.
Valery Pykhtin1b138862016-09-01 09:56:47 +0000236defm S_BUFFER_LOAD_DWORDX2 : SM_Pseudo_Loads <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000237 "s_buffer_load_dwordx2", SReg_128, SReg_64_XEXEC
Valery Pykhtin1b138862016-09-01 09:56:47 +0000238>;
239
240defm S_BUFFER_LOAD_DWORDX4 : SM_Pseudo_Loads <
241 "s_buffer_load_dwordx4", SReg_128, SReg_128
242>;
243
244defm S_BUFFER_LOAD_DWORDX8 : SM_Pseudo_Loads <
245 "s_buffer_load_dwordx8", SReg_128, SReg_256
246>;
247
248defm S_BUFFER_LOAD_DWORDX16 : SM_Pseudo_Loads <
249 "s_buffer_load_dwordx16", SReg_128, SReg_512
250>;
251
Matt Arsenault640c44b2016-11-29 19:39:53 +0000252defm S_STORE_DWORD : SM_Pseudo_Stores <"s_store_dword", SReg_64, SReg_32_XM0_XEXEC>;
253defm S_STORE_DWORDX2 : SM_Pseudo_Stores <"s_store_dwordx2", SReg_64, SReg_64_XEXEC>;
Matt Arsenault7b647552016-10-28 21:55:15 +0000254defm S_STORE_DWORDX4 : SM_Pseudo_Stores <"s_store_dwordx4", SReg_64, SReg_128>;
255
256defm S_BUFFER_STORE_DWORD : SM_Pseudo_Stores <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000257 "s_buffer_store_dword", SReg_128, SReg_32_XM0_XEXEC
Matt Arsenault7b647552016-10-28 21:55:15 +0000258>;
259
260defm S_BUFFER_STORE_DWORDX2 : SM_Pseudo_Stores <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000261 "s_buffer_store_dwordx2", SReg_128, SReg_64_XEXEC
Matt Arsenault7b647552016-10-28 21:55:15 +0000262>;
263
264defm S_BUFFER_STORE_DWORDX4 : SM_Pseudo_Stores <
265 "s_buffer_store_dwordx4", SReg_128, SReg_128
266>;
267
268
Valery Pykhtin1b138862016-09-01 09:56:47 +0000269def S_MEMTIME : SM_Time_Pseudo <"s_memtime", int_amdgcn_s_memtime>;
270def S_DCACHE_INV : SM_Inval_Pseudo <"s_dcache_inv", int_amdgcn_s_dcache_inv>;
271
272let SubtargetPredicate = isCIVI in {
273def S_DCACHE_INV_VOL : SM_Inval_Pseudo <"s_dcache_inv_vol", int_amdgcn_s_dcache_inv_vol>;
274} // let SubtargetPredicate = isCIVI
275
276let SubtargetPredicate = isVI in {
277def S_DCACHE_WB : SM_Inval_Pseudo <"s_dcache_wb", int_amdgcn_s_dcache_wb>;
278def S_DCACHE_WB_VOL : SM_Inval_Pseudo <"s_dcache_wb_vol", int_amdgcn_s_dcache_wb_vol>;
279def S_MEMREALTIME : SM_Time_Pseudo <"s_memrealtime", int_amdgcn_s_memrealtime>;
280} // SubtargetPredicate = isVI
281
Dmitry Preobrazhenskydd2b9292018-03-28 14:08:03 +0000282let SubtargetPredicate = HasFlatScratchInsts, Uses = [FLAT_SCR] in {
283defm S_SCRATCH_LOAD_DWORD : SM_Pseudo_Loads <"s_scratch_load_dword", SReg_64, SReg_32_XM0_XEXEC>;
284defm S_SCRATCH_LOAD_DWORDX2 : SM_Pseudo_Loads <"s_scratch_load_dwordx2", SReg_64, SReg_64_XEXEC>;
285defm S_SCRATCH_LOAD_DWORDX4 : SM_Pseudo_Loads <"s_scratch_load_dwordx4", SReg_64, SReg_128>;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000286
Dmitry Preobrazhenskydd2b9292018-03-28 14:08:03 +0000287defm S_SCRATCH_STORE_DWORD : SM_Pseudo_Stores <"s_scratch_store_dword", SReg_64, SReg_32_XM0_XEXEC>;
288defm S_SCRATCH_STORE_DWORDX2 : SM_Pseudo_Stores <"s_scratch_store_dwordx2", SReg_64, SReg_64_XEXEC>;
289defm S_SCRATCH_STORE_DWORDX4 : SM_Pseudo_Stores <"s_scratch_store_dwordx4", SReg_64, SReg_128>;
290} // SubtargetPredicate = HasFlatScratchInsts
Valery Pykhtin1b138862016-09-01 09:56:47 +0000291
Dmitry Preobrazhensky6bad04e2018-04-02 16:10:25 +0000292let SubtargetPredicate = HasScalarAtomics in {
293
294defm S_BUFFER_ATOMIC_SWAP : SM_Pseudo_Atomics <"s_buffer_atomic_swap", SReg_128, SReg_32_XM0_XEXEC>;
295defm S_BUFFER_ATOMIC_CMPSWAP : SM_Pseudo_Atomics <"s_buffer_atomic_cmpswap", SReg_128, SReg_64_XEXEC>;
296defm S_BUFFER_ATOMIC_ADD : SM_Pseudo_Atomics <"s_buffer_atomic_add", SReg_128, SReg_32_XM0_XEXEC>;
297defm S_BUFFER_ATOMIC_SUB : SM_Pseudo_Atomics <"s_buffer_atomic_sub", SReg_128, SReg_32_XM0_XEXEC>;
298defm S_BUFFER_ATOMIC_SMIN : SM_Pseudo_Atomics <"s_buffer_atomic_smin", SReg_128, SReg_32_XM0_XEXEC>;
299defm S_BUFFER_ATOMIC_UMIN : SM_Pseudo_Atomics <"s_buffer_atomic_umin", SReg_128, SReg_32_XM0_XEXEC>;
300defm S_BUFFER_ATOMIC_SMAX : SM_Pseudo_Atomics <"s_buffer_atomic_smax", SReg_128, SReg_32_XM0_XEXEC>;
301defm S_BUFFER_ATOMIC_UMAX : SM_Pseudo_Atomics <"s_buffer_atomic_umax", SReg_128, SReg_32_XM0_XEXEC>;
302defm S_BUFFER_ATOMIC_AND : SM_Pseudo_Atomics <"s_buffer_atomic_and", SReg_128, SReg_32_XM0_XEXEC>;
303defm S_BUFFER_ATOMIC_OR : SM_Pseudo_Atomics <"s_buffer_atomic_or", SReg_128, SReg_32_XM0_XEXEC>;
304defm S_BUFFER_ATOMIC_XOR : SM_Pseudo_Atomics <"s_buffer_atomic_xor", SReg_128, SReg_32_XM0_XEXEC>;
305defm S_BUFFER_ATOMIC_INC : SM_Pseudo_Atomics <"s_buffer_atomic_inc", SReg_128, SReg_32_XM0_XEXEC>;
306defm S_BUFFER_ATOMIC_DEC : SM_Pseudo_Atomics <"s_buffer_atomic_dec", SReg_128, SReg_32_XM0_XEXEC>;
307
308defm S_BUFFER_ATOMIC_SWAP_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_swap_x2", SReg_128, SReg_64_XEXEC>;
309defm S_BUFFER_ATOMIC_CMPSWAP_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_cmpswap_x2", SReg_128, SReg_128>;
310defm S_BUFFER_ATOMIC_ADD_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_add_x2", SReg_128, SReg_64_XEXEC>;
311defm S_BUFFER_ATOMIC_SUB_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_sub_x2", SReg_128, SReg_64_XEXEC>;
312defm S_BUFFER_ATOMIC_SMIN_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_smin_x2", SReg_128, SReg_64_XEXEC>;
313defm S_BUFFER_ATOMIC_UMIN_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_umin_x2", SReg_128, SReg_64_XEXEC>;
314defm S_BUFFER_ATOMIC_SMAX_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_smax_x2", SReg_128, SReg_64_XEXEC>;
315defm S_BUFFER_ATOMIC_UMAX_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_umax_x2", SReg_128, SReg_64_XEXEC>;
316defm S_BUFFER_ATOMIC_AND_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_and_x2", SReg_128, SReg_64_XEXEC>;
317defm S_BUFFER_ATOMIC_OR_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_or_x2", SReg_128, SReg_64_XEXEC>;
318defm S_BUFFER_ATOMIC_XOR_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_xor_x2", SReg_128, SReg_64_XEXEC>;
319defm S_BUFFER_ATOMIC_INC_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_inc_x2", SReg_128, SReg_64_XEXEC>;
320defm S_BUFFER_ATOMIC_DEC_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_dec_x2", SReg_128, SReg_64_XEXEC>;
321
322defm S_ATOMIC_SWAP : SM_Pseudo_Atomics <"s_atomic_swap", SReg_64, SReg_32_XM0_XEXEC>;
323defm S_ATOMIC_CMPSWAP : SM_Pseudo_Atomics <"s_atomic_cmpswap", SReg_64, SReg_64_XEXEC>;
324defm S_ATOMIC_ADD : SM_Pseudo_Atomics <"s_atomic_add", SReg_64, SReg_32_XM0_XEXEC>;
325defm S_ATOMIC_SUB : SM_Pseudo_Atomics <"s_atomic_sub", SReg_64, SReg_32_XM0_XEXEC>;
326defm S_ATOMIC_SMIN : SM_Pseudo_Atomics <"s_atomic_smin", SReg_64, SReg_32_XM0_XEXEC>;
327defm S_ATOMIC_UMIN : SM_Pseudo_Atomics <"s_atomic_umin", SReg_64, SReg_32_XM0_XEXEC>;
328defm S_ATOMIC_SMAX : SM_Pseudo_Atomics <"s_atomic_smax", SReg_64, SReg_32_XM0_XEXEC>;
329defm S_ATOMIC_UMAX : SM_Pseudo_Atomics <"s_atomic_umax", SReg_64, SReg_32_XM0_XEXEC>;
330defm S_ATOMIC_AND : SM_Pseudo_Atomics <"s_atomic_and", SReg_64, SReg_32_XM0_XEXEC>;
331defm S_ATOMIC_OR : SM_Pseudo_Atomics <"s_atomic_or", SReg_64, SReg_32_XM0_XEXEC>;
332defm S_ATOMIC_XOR : SM_Pseudo_Atomics <"s_atomic_xor", SReg_64, SReg_32_XM0_XEXEC>;
333defm S_ATOMIC_INC : SM_Pseudo_Atomics <"s_atomic_inc", SReg_64, SReg_32_XM0_XEXEC>;
334defm S_ATOMIC_DEC : SM_Pseudo_Atomics <"s_atomic_dec", SReg_64, SReg_32_XM0_XEXEC>;
335
336defm S_ATOMIC_SWAP_X2 : SM_Pseudo_Atomics <"s_atomic_swap_x2", SReg_64, SReg_64_XEXEC>;
337defm S_ATOMIC_CMPSWAP_X2 : SM_Pseudo_Atomics <"s_atomic_cmpswap_x2", SReg_64, SReg_128>;
338defm S_ATOMIC_ADD_X2 : SM_Pseudo_Atomics <"s_atomic_add_x2", SReg_64, SReg_64_XEXEC>;
339defm S_ATOMIC_SUB_X2 : SM_Pseudo_Atomics <"s_atomic_sub_x2", SReg_64, SReg_64_XEXEC>;
340defm S_ATOMIC_SMIN_X2 : SM_Pseudo_Atomics <"s_atomic_smin_x2", SReg_64, SReg_64_XEXEC>;
341defm S_ATOMIC_UMIN_X2 : SM_Pseudo_Atomics <"s_atomic_umin_x2", SReg_64, SReg_64_XEXEC>;
342defm S_ATOMIC_SMAX_X2 : SM_Pseudo_Atomics <"s_atomic_smax_x2", SReg_64, SReg_64_XEXEC>;
343defm S_ATOMIC_UMAX_X2 : SM_Pseudo_Atomics <"s_atomic_umax_x2", SReg_64, SReg_64_XEXEC>;
344defm S_ATOMIC_AND_X2 : SM_Pseudo_Atomics <"s_atomic_and_x2", SReg_64, SReg_64_XEXEC>;
345defm S_ATOMIC_OR_X2 : SM_Pseudo_Atomics <"s_atomic_or_x2", SReg_64, SReg_64_XEXEC>;
346defm S_ATOMIC_XOR_X2 : SM_Pseudo_Atomics <"s_atomic_xor_x2", SReg_64, SReg_64_XEXEC>;
347defm S_ATOMIC_INC_X2 : SM_Pseudo_Atomics <"s_atomic_inc_x2", SReg_64, SReg_64_XEXEC>;
348defm S_ATOMIC_DEC_X2 : SM_Pseudo_Atomics <"s_atomic_dec_x2", SReg_64, SReg_64_XEXEC>;
349
350} // let SubtargetPredicate = HasScalarAtomics
351
Dmitry Preobrazhensky4732d872018-04-06 15:08:42 +0000352let SubtargetPredicate = isGFX9 in {
353defm S_DCACHE_DISCARD : SM_Pseudo_Discards <"s_dcache_discard">;
354defm S_DCACHE_DISCARD_X2 : SM_Pseudo_Discards <"s_dcache_discard_x2">;
355}
356
Valery Pykhtin1b138862016-09-01 09:56:47 +0000357//===----------------------------------------------------------------------===//
358// Scalar Memory Patterns
359//===----------------------------------------------------------------------===//
360
Alexander Timofeev18009562016-12-08 17:28:47 +0000361
Valery Pykhtin1b138862016-09-01 09:56:47 +0000362def smrd_load : PatFrag <(ops node:$ptr), (load node:$ptr), [{
363 auto Ld = cast<LoadSDNode>(N);
364 return Ld->getAlignment() >= 4 &&
Alexander Timofeev2e5eece2018-03-05 15:12:21 +0000365 ((((Ld->getAddressSpace() == AMDGPUASI.CONSTANT_ADDRESS) || (Ld->getAddressSpace() == AMDGPUASI.CONSTANT_ADDRESS_32BIT)) && !N->isDivergent()) ||
Yaxun Liu1a14bfa2017-03-27 14:04:01 +0000366 (Subtarget->getScalarizeGlobalBehavior() && Ld->getAddressSpace() == AMDGPUASI.GLOBAL_ADDRESS &&
Alexander Timofeev2e5eece2018-03-05 15:12:21 +0000367 !Ld->isVolatile() && !N->isDivergent() &&
Alexander Timofeev18009562016-12-08 17:28:47 +0000368 static_cast<const SITargetLowering *>(getTargetLowering())->isMemOpHasNoClobberedMemOperand(N)));
Valery Pykhtin1b138862016-09-01 09:56:47 +0000369}]>;
370
371def SMRDImm : ComplexPattern<i64, 2, "SelectSMRDImm">;
Marek Olsak8973a0a2017-05-24 14:53:50 +0000372def SMRDImm32 : ComplexPattern<i64, 2, "SelectSMRDImm32">;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000373def SMRDSgpr : ComplexPattern<i64, 2, "SelectSMRDSgpr">;
374def SMRDBufferImm : ComplexPattern<i32, 1, "SelectSMRDBufferImm">;
Marek Olsak8973a0a2017-05-24 14:53:50 +0000375def SMRDBufferImm32 : ComplexPattern<i32, 1, "SelectSMRDBufferImm32">;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000376
Valery Pykhtin1b138862016-09-01 09:56:47 +0000377multiclass SMRD_Pattern <string Instr, ValueType vt> {
378
379 // 1. IMM offset
Matt Arsenault90c75932017-10-03 00:06:41 +0000380 def : GCNPat <
Valery Pykhtin1b138862016-09-01 09:56:47 +0000381 (smrd_load (SMRDImm i64:$sbase, i32:$offset)),
Matt Arsenault7b647552016-10-28 21:55:15 +0000382 (vt (!cast<SM_Pseudo>(Instr#"_IMM") $sbase, $offset, 0))
Valery Pykhtin1b138862016-09-01 09:56:47 +0000383 >;
384
385 // 2. SGPR offset
Matt Arsenault90c75932017-10-03 00:06:41 +0000386 def : GCNPat <
Valery Pykhtin1b138862016-09-01 09:56:47 +0000387 (smrd_load (SMRDSgpr i64:$sbase, i32:$offset)),
Matt Arsenault7b647552016-10-28 21:55:15 +0000388 (vt (!cast<SM_Pseudo>(Instr#"_SGPR") $sbase, $offset, 0))
Valery Pykhtin1b138862016-09-01 09:56:47 +0000389 >;
390}
391
Matt Arsenault90c75932017-10-03 00:06:41 +0000392let OtherPredicates = [isSICI] in {
393def : GCNPat <
Valery Pykhtin1b138862016-09-01 09:56:47 +0000394 (i64 (readcyclecounter)),
395 (S_MEMTIME)
396>;
397}
398
399// Global and constant loads can be selected to either MUBUF or SMRD
400// instructions, but SMRD instructions are faster so we want the instruction
401// selector to prefer those.
402let AddedComplexity = 100 in {
403
404defm : SMRD_Pattern <"S_LOAD_DWORD", i32>;
405defm : SMRD_Pattern <"S_LOAD_DWORDX2", v2i32>;
406defm : SMRD_Pattern <"S_LOAD_DWORDX4", v4i32>;
407defm : SMRD_Pattern <"S_LOAD_DWORDX8", v8i32>;
408defm : SMRD_Pattern <"S_LOAD_DWORDX16", v16i32>;
409
410// 1. Offset as an immediate
Matt Arsenault90c75932017-10-03 00:06:41 +0000411def SM_LOAD_PATTERN : GCNPat < // name this pattern to reuse AddedComplexity on CI
Valery Pykhtin1b138862016-09-01 09:56:47 +0000412 (SIload_constant v4i32:$sbase, (SMRDBufferImm i32:$offset)),
Matt Arsenault7b647552016-10-28 21:55:15 +0000413 (S_BUFFER_LOAD_DWORD_IMM $sbase, $offset, 0)
Valery Pykhtin1b138862016-09-01 09:56:47 +0000414>;
415
416// 2. Offset loaded in an 32bit SGPR
Matt Arsenault90c75932017-10-03 00:06:41 +0000417def : GCNPat <
Marek Olsak5914ece2017-10-31 21:06:42 +0000418 (SIload_constant v4i32:$sbase, i32:$offset),
Matt Arsenault7b647552016-10-28 21:55:15 +0000419 (S_BUFFER_LOAD_DWORD_SGPR $sbase, $offset, 0)
Valery Pykhtin1b138862016-09-01 09:56:47 +0000420>;
421
422} // End let AddedComplexity = 100
423
Matt Arsenault90c75932017-10-03 00:06:41 +0000424let OtherPredicates = [isVI] in {
Valery Pykhtin1b138862016-09-01 09:56:47 +0000425
Matt Arsenault90c75932017-10-03 00:06:41 +0000426def : GCNPat <
Valery Pykhtin1b138862016-09-01 09:56:47 +0000427 (i64 (readcyclecounter)),
428 (S_MEMREALTIME)
429>;
430
Matt Arsenault90c75932017-10-03 00:06:41 +0000431} // let OtherPredicates = [isVI]
Valery Pykhtin1b138862016-09-01 09:56:47 +0000432
433
434//===----------------------------------------------------------------------===//
435// Targets
436//===----------------------------------------------------------------------===//
437
438//===----------------------------------------------------------------------===//
439// SI
440//===----------------------------------------------------------------------===//
441
442class SMRD_Real_si <bits<5> op, SM_Pseudo ps>
443 : SM_Real<ps>
444 , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
445 , Enc32 {
446
447 let AssemblerPredicates = [isSICI];
448 let DecoderNamespace = "SICI";
449
450 let Inst{7-0} = !if(ps.has_offset, offset{7-0}, ?);
451 let Inst{8} = imm;
452 let Inst{14-9} = !if(ps.has_sbase, sbase{6-1}, ?);
453 let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
454 let Inst{26-22} = op;
455 let Inst{31-27} = 0x18; //encoding
456}
457
Matt Arsenault7b647552016-10-28 21:55:15 +0000458// FIXME: Assembler should reject trying to use glc on SMRD
459// instructions on SI.
Valery Pykhtin1b138862016-09-01 09:56:47 +0000460multiclass SM_Real_Loads_si<bits<5> op, string ps,
461 SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
462 SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000463
Valery Pykhtin1b138862016-09-01 09:56:47 +0000464 def _IMM_si : SMRD_Real_si <op, immPs> {
Artem Tamazov54bfd542016-10-31 16:07:39 +0000465 let InOperandList = (ins immPs.BaseClass:$sbase, smrd_offset_8:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000466 }
Matt Arsenault7b647552016-10-28 21:55:15 +0000467
468 // FIXME: The operand name $offset is inconsistent with $soff used
469 // in the pseudo
Valery Pykhtin1b138862016-09-01 09:56:47 +0000470 def _SGPR_si : SMRD_Real_si <op, sgprPs> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000471 let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000472 }
Matt Arsenault7b647552016-10-28 21:55:15 +0000473
Valery Pykhtin1b138862016-09-01 09:56:47 +0000474}
475
476defm S_LOAD_DWORD : SM_Real_Loads_si <0x00, "S_LOAD_DWORD">;
477defm S_LOAD_DWORDX2 : SM_Real_Loads_si <0x01, "S_LOAD_DWORDX2">;
478defm S_LOAD_DWORDX4 : SM_Real_Loads_si <0x02, "S_LOAD_DWORDX4">;
479defm S_LOAD_DWORDX8 : SM_Real_Loads_si <0x03, "S_LOAD_DWORDX8">;
480defm S_LOAD_DWORDX16 : SM_Real_Loads_si <0x04, "S_LOAD_DWORDX16">;
481defm S_BUFFER_LOAD_DWORD : SM_Real_Loads_si <0x08, "S_BUFFER_LOAD_DWORD">;
482defm S_BUFFER_LOAD_DWORDX2 : SM_Real_Loads_si <0x09, "S_BUFFER_LOAD_DWORDX2">;
483defm S_BUFFER_LOAD_DWORDX4 : SM_Real_Loads_si <0x0a, "S_BUFFER_LOAD_DWORDX4">;
484defm S_BUFFER_LOAD_DWORDX8 : SM_Real_Loads_si <0x0b, "S_BUFFER_LOAD_DWORDX8">;
485defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_si <0x0c, "S_BUFFER_LOAD_DWORDX16">;
486
487def S_MEMTIME_si : SMRD_Real_si <0x1e, S_MEMTIME>;
488def S_DCACHE_INV_si : SMRD_Real_si <0x1f, S_DCACHE_INV>;
489
490
491//===----------------------------------------------------------------------===//
492// VI
493//===----------------------------------------------------------------------===//
494
495class SMEM_Real_vi <bits<8> op, SM_Pseudo ps>
496 : SM_Real<ps>
497 , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.VI>
498 , Enc64 {
Matt Arsenault7b647552016-10-28 21:55:15 +0000499 bit glc;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000500
501 let AssemblerPredicates = [isVI];
502 let DecoderNamespace = "VI";
503
504 let Inst{5-0} = !if(ps.has_sbase, sbase{6-1}, ?);
505 let Inst{12-6} = !if(ps.has_sdst, sdst{6-0}, ?);
506
Matt Arsenault7b647552016-10-28 21:55:15 +0000507 let Inst{16} = !if(ps.has_glc, glc, ?);
508 let Inst{17} = imm;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000509 let Inst{25-18} = op;
510 let Inst{31-26} = 0x30; //encoding
511 let Inst{51-32} = !if(ps.has_offset, offset{19-0}, ?);
512}
513
514multiclass SM_Real_Loads_vi<bits<8> op, string ps,
515 SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
516 SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
517 def _IMM_vi : SMEM_Real_vi <op, immPs> {
Artem Tamazov54bfd542016-10-31 16:07:39 +0000518 let InOperandList = (ins immPs.BaseClass:$sbase, smrd_offset_20:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000519 }
520 def _SGPR_vi : SMEM_Real_vi <op, sgprPs> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000521 let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc);
522 }
523}
524
Sam Kolton83102d92016-12-05 09:58:51 +0000525class SMEM_Real_Store_vi <bits<8> op, SM_Pseudo ps> : SMEM_Real_vi <op, ps> {
526 // encoding
527 bits<7> sdata;
528
529 let sdst = ?;
530 let Inst{12-6} = !if(ps.has_sdst, sdata{6-0}, ?);
531}
532
Matt Arsenault7b647552016-10-28 21:55:15 +0000533multiclass SM_Real_Stores_vi<bits<8> op, string ps,
534 SM_Store_Pseudo immPs = !cast<SM_Store_Pseudo>(ps#_IMM),
535 SM_Store_Pseudo sgprPs = !cast<SM_Store_Pseudo>(ps#_SGPR)> {
536 // FIXME: The operand name $offset is inconsistent with $soff used
537 // in the pseudo
Sam Kolton83102d92016-12-05 09:58:51 +0000538 def _IMM_vi : SMEM_Real_Store_vi <op, immPs> {
Artem Tamazov54bfd542016-10-31 16:07:39 +0000539 let InOperandList = (ins immPs.SrcClass:$sdata, immPs.BaseClass:$sbase, smrd_offset_20:$offset, GLC:$glc);
Matt Arsenault7b647552016-10-28 21:55:15 +0000540 }
541
Sam Kolton83102d92016-12-05 09:58:51 +0000542 def _SGPR_vi : SMEM_Real_Store_vi <op, sgprPs> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000543 let InOperandList = (ins sgprPs.SrcClass:$sdata, sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000544 }
545}
546
547defm S_LOAD_DWORD : SM_Real_Loads_vi <0x00, "S_LOAD_DWORD">;
548defm S_LOAD_DWORDX2 : SM_Real_Loads_vi <0x01, "S_LOAD_DWORDX2">;
549defm S_LOAD_DWORDX4 : SM_Real_Loads_vi <0x02, "S_LOAD_DWORDX4">;
550defm S_LOAD_DWORDX8 : SM_Real_Loads_vi <0x03, "S_LOAD_DWORDX8">;
551defm S_LOAD_DWORDX16 : SM_Real_Loads_vi <0x04, "S_LOAD_DWORDX16">;
552defm S_BUFFER_LOAD_DWORD : SM_Real_Loads_vi <0x08, "S_BUFFER_LOAD_DWORD">;
553defm S_BUFFER_LOAD_DWORDX2 : SM_Real_Loads_vi <0x09, "S_BUFFER_LOAD_DWORDX2">;
554defm S_BUFFER_LOAD_DWORDX4 : SM_Real_Loads_vi <0x0a, "S_BUFFER_LOAD_DWORDX4">;
555defm S_BUFFER_LOAD_DWORDX8 : SM_Real_Loads_vi <0x0b, "S_BUFFER_LOAD_DWORDX8">;
556defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_vi <0x0c, "S_BUFFER_LOAD_DWORDX16">;
557
Matt Arsenault7b647552016-10-28 21:55:15 +0000558defm S_STORE_DWORD : SM_Real_Stores_vi <0x10, "S_STORE_DWORD">;
559defm S_STORE_DWORDX2 : SM_Real_Stores_vi <0x11, "S_STORE_DWORDX2">;
560defm S_STORE_DWORDX4 : SM_Real_Stores_vi <0x12, "S_STORE_DWORDX4">;
561
562defm S_BUFFER_STORE_DWORD : SM_Real_Stores_vi <0x18, "S_BUFFER_STORE_DWORD">;
563defm S_BUFFER_STORE_DWORDX2 : SM_Real_Stores_vi <0x19, "S_BUFFER_STORE_DWORDX2">;
564defm S_BUFFER_STORE_DWORDX4 : SM_Real_Stores_vi <0x1a, "S_BUFFER_STORE_DWORDX4">;
565
Sam Kolton83102d92016-12-05 09:58:51 +0000566// These instructions use same encoding
Valery Pykhtin1b138862016-09-01 09:56:47 +0000567def S_DCACHE_INV_vi : SMEM_Real_vi <0x20, S_DCACHE_INV>;
568def S_DCACHE_WB_vi : SMEM_Real_vi <0x21, S_DCACHE_WB>;
569def S_DCACHE_INV_VOL_vi : SMEM_Real_vi <0x22, S_DCACHE_INV_VOL>;
570def S_DCACHE_WB_VOL_vi : SMEM_Real_vi <0x23, S_DCACHE_WB_VOL>;
571def S_MEMTIME_vi : SMEM_Real_vi <0x24, S_MEMTIME>;
572def S_MEMREALTIME_vi : SMEM_Real_vi <0x25, S_MEMREALTIME>;
573
Dmitry Preobrazhenskydd2b9292018-03-28 14:08:03 +0000574defm S_SCRATCH_LOAD_DWORD : SM_Real_Loads_vi <0x05, "S_SCRATCH_LOAD_DWORD">;
575defm S_SCRATCH_LOAD_DWORDX2 : SM_Real_Loads_vi <0x06, "S_SCRATCH_LOAD_DWORDX2">;
576defm S_SCRATCH_LOAD_DWORDX4 : SM_Real_Loads_vi <0x07, "S_SCRATCH_LOAD_DWORDX4">;
577
578defm S_SCRATCH_STORE_DWORD : SM_Real_Stores_vi <0x15, "S_SCRATCH_STORE_DWORD">;
579defm S_SCRATCH_STORE_DWORDX2 : SM_Real_Stores_vi <0x16, "S_SCRATCH_STORE_DWORDX2">;
580defm S_SCRATCH_STORE_DWORDX4 : SM_Real_Stores_vi <0x17, "S_SCRATCH_STORE_DWORDX4">;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000581
582//===----------------------------------------------------------------------===//
Dmitry Preobrazhensky6bad04e2018-04-02 16:10:25 +0000583// GFX9
584//===----------------------------------------------------------------------===//
585
586class SMEM_Atomic_Real_vi <bits<8> op, SM_Atomic_Pseudo ps>
587 : SMEM_Real_vi <op, ps> {
588
589 bits<7> sdata;
590
591 let Constraints = ps.Constraints;
592 let DisableEncoding = ps.DisableEncoding;
593
594 let glc = ps.glc;
595 let Inst{12-6} = !if(glc, sdst{6-0}, sdata{6-0});
596}
597
598multiclass SM_Real_Atomics_vi<bits<8> op, string ps> {
599 def _IMM_vi : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_IMM)>;
600 def _SGPR_vi : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR)>;
601 def _IMM_RTN_vi : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_IMM_RTN)>;
602 def _SGPR_RTN_vi : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR_RTN)>;
603}
604
605defm S_BUFFER_ATOMIC_SWAP : SM_Real_Atomics_vi <0x40, "S_BUFFER_ATOMIC_SWAP">;
606defm S_BUFFER_ATOMIC_CMPSWAP : SM_Real_Atomics_vi <0x41, "S_BUFFER_ATOMIC_CMPSWAP">;
607defm S_BUFFER_ATOMIC_ADD : SM_Real_Atomics_vi <0x42, "S_BUFFER_ATOMIC_ADD">;
608defm S_BUFFER_ATOMIC_SUB : SM_Real_Atomics_vi <0x43, "S_BUFFER_ATOMIC_SUB">;
609defm S_BUFFER_ATOMIC_SMIN : SM_Real_Atomics_vi <0x44, "S_BUFFER_ATOMIC_SMIN">;
610defm S_BUFFER_ATOMIC_UMIN : SM_Real_Atomics_vi <0x45, "S_BUFFER_ATOMIC_UMIN">;
611defm S_BUFFER_ATOMIC_SMAX : SM_Real_Atomics_vi <0x46, "S_BUFFER_ATOMIC_SMAX">;
612defm S_BUFFER_ATOMIC_UMAX : SM_Real_Atomics_vi <0x47, "S_BUFFER_ATOMIC_UMAX">;
613defm S_BUFFER_ATOMIC_AND : SM_Real_Atomics_vi <0x48, "S_BUFFER_ATOMIC_AND">;
614defm S_BUFFER_ATOMIC_OR : SM_Real_Atomics_vi <0x49, "S_BUFFER_ATOMIC_OR">;
615defm S_BUFFER_ATOMIC_XOR : SM_Real_Atomics_vi <0x4a, "S_BUFFER_ATOMIC_XOR">;
616defm S_BUFFER_ATOMIC_INC : SM_Real_Atomics_vi <0x4b, "S_BUFFER_ATOMIC_INC">;
617defm S_BUFFER_ATOMIC_DEC : SM_Real_Atomics_vi <0x4c, "S_BUFFER_ATOMIC_DEC">;
618
619defm S_BUFFER_ATOMIC_SWAP_X2 : SM_Real_Atomics_vi <0x60, "S_BUFFER_ATOMIC_SWAP_X2">;
620defm S_BUFFER_ATOMIC_CMPSWAP_X2 : SM_Real_Atomics_vi <0x61, "S_BUFFER_ATOMIC_CMPSWAP_X2">;
621defm S_BUFFER_ATOMIC_ADD_X2 : SM_Real_Atomics_vi <0x62, "S_BUFFER_ATOMIC_ADD_X2">;
622defm S_BUFFER_ATOMIC_SUB_X2 : SM_Real_Atomics_vi <0x63, "S_BUFFER_ATOMIC_SUB_X2">;
623defm S_BUFFER_ATOMIC_SMIN_X2 : SM_Real_Atomics_vi <0x64, "S_BUFFER_ATOMIC_SMIN_X2">;
624defm S_BUFFER_ATOMIC_UMIN_X2 : SM_Real_Atomics_vi <0x65, "S_BUFFER_ATOMIC_UMIN_X2">;
625defm S_BUFFER_ATOMIC_SMAX_X2 : SM_Real_Atomics_vi <0x66, "S_BUFFER_ATOMIC_SMAX_X2">;
626defm S_BUFFER_ATOMIC_UMAX_X2 : SM_Real_Atomics_vi <0x67, "S_BUFFER_ATOMIC_UMAX_X2">;
627defm S_BUFFER_ATOMIC_AND_X2 : SM_Real_Atomics_vi <0x68, "S_BUFFER_ATOMIC_AND_X2">;
628defm S_BUFFER_ATOMIC_OR_X2 : SM_Real_Atomics_vi <0x69, "S_BUFFER_ATOMIC_OR_X2">;
629defm S_BUFFER_ATOMIC_XOR_X2 : SM_Real_Atomics_vi <0x6a, "S_BUFFER_ATOMIC_XOR_X2">;
630defm S_BUFFER_ATOMIC_INC_X2 : SM_Real_Atomics_vi <0x6b, "S_BUFFER_ATOMIC_INC_X2">;
631defm S_BUFFER_ATOMIC_DEC_X2 : SM_Real_Atomics_vi <0x6c, "S_BUFFER_ATOMIC_DEC_X2">;
632
633defm S_ATOMIC_SWAP : SM_Real_Atomics_vi <0x80, "S_ATOMIC_SWAP">;
634defm S_ATOMIC_CMPSWAP : SM_Real_Atomics_vi <0x81, "S_ATOMIC_CMPSWAP">;
635defm S_ATOMIC_ADD : SM_Real_Atomics_vi <0x82, "S_ATOMIC_ADD">;
636defm S_ATOMIC_SUB : SM_Real_Atomics_vi <0x83, "S_ATOMIC_SUB">;
637defm S_ATOMIC_SMIN : SM_Real_Atomics_vi <0x84, "S_ATOMIC_SMIN">;
638defm S_ATOMIC_UMIN : SM_Real_Atomics_vi <0x85, "S_ATOMIC_UMIN">;
639defm S_ATOMIC_SMAX : SM_Real_Atomics_vi <0x86, "S_ATOMIC_SMAX">;
640defm S_ATOMIC_UMAX : SM_Real_Atomics_vi <0x87, "S_ATOMIC_UMAX">;
641defm S_ATOMIC_AND : SM_Real_Atomics_vi <0x88, "S_ATOMIC_AND">;
642defm S_ATOMIC_OR : SM_Real_Atomics_vi <0x89, "S_ATOMIC_OR">;
643defm S_ATOMIC_XOR : SM_Real_Atomics_vi <0x8a, "S_ATOMIC_XOR">;
644defm S_ATOMIC_INC : SM_Real_Atomics_vi <0x8b, "S_ATOMIC_INC">;
645defm S_ATOMIC_DEC : SM_Real_Atomics_vi <0x8c, "S_ATOMIC_DEC">;
646
647defm S_ATOMIC_SWAP_X2 : SM_Real_Atomics_vi <0xa0, "S_ATOMIC_SWAP_X2">;
648defm S_ATOMIC_CMPSWAP_X2 : SM_Real_Atomics_vi <0xa1, "S_ATOMIC_CMPSWAP_X2">;
649defm S_ATOMIC_ADD_X2 : SM_Real_Atomics_vi <0xa2, "S_ATOMIC_ADD_X2">;
650defm S_ATOMIC_SUB_X2 : SM_Real_Atomics_vi <0xa3, "S_ATOMIC_SUB_X2">;
651defm S_ATOMIC_SMIN_X2 : SM_Real_Atomics_vi <0xa4, "S_ATOMIC_SMIN_X2">;
652defm S_ATOMIC_UMIN_X2 : SM_Real_Atomics_vi <0xa5, "S_ATOMIC_UMIN_X2">;
653defm S_ATOMIC_SMAX_X2 : SM_Real_Atomics_vi <0xa6, "S_ATOMIC_SMAX_X2">;
654defm S_ATOMIC_UMAX_X2 : SM_Real_Atomics_vi <0xa7, "S_ATOMIC_UMAX_X2">;
655defm S_ATOMIC_AND_X2 : SM_Real_Atomics_vi <0xa8, "S_ATOMIC_AND_X2">;
656defm S_ATOMIC_OR_X2 : SM_Real_Atomics_vi <0xa9, "S_ATOMIC_OR_X2">;
657defm S_ATOMIC_XOR_X2 : SM_Real_Atomics_vi <0xaa, "S_ATOMIC_XOR_X2">;
658defm S_ATOMIC_INC_X2 : SM_Real_Atomics_vi <0xab, "S_ATOMIC_INC_X2">;
659defm S_ATOMIC_DEC_X2 : SM_Real_Atomics_vi <0xac, "S_ATOMIC_DEC_X2">;
660
Dmitry Preobrazhensky4732d872018-04-06 15:08:42 +0000661multiclass SM_Real_Discard_vi<bits<8> op, string ps> {
662 def _IMM_vi : SMEM_Real_vi <op, !cast<SM_Discard_Pseudo>(ps#_IMM)>;
663 def _SGPR_vi : SMEM_Real_vi <op, !cast<SM_Discard_Pseudo>(ps#_SGPR)>;
664}
665
666defm S_DCACHE_DISCARD : SM_Real_Discard_vi <0x28, "S_DCACHE_DISCARD">;
667defm S_DCACHE_DISCARD_X2 : SM_Real_Discard_vi <0x29, "S_DCACHE_DISCARD_X2">;
668
Dmitry Preobrazhensky6bad04e2018-04-02 16:10:25 +0000669//===----------------------------------------------------------------------===//
Valery Pykhtin1b138862016-09-01 09:56:47 +0000670// CI
671//===----------------------------------------------------------------------===//
672
673def smrd_literal_offset : NamedOperandU32<"SMRDLiteralOffset",
674 NamedMatchClass<"SMRDLiteralOffset">> {
675 let OperandType = "OPERAND_IMMEDIATE";
676}
677
678class SMRD_Real_Load_IMM_ci <bits<5> op, SM_Load_Pseudo ps> :
679 SM_Real<ps>,
680 Enc64 {
681
682 let AssemblerPredicates = [isCIOnly];
683 let DecoderNamespace = "CI";
Matt Arsenault7b647552016-10-28 21:55:15 +0000684 let InOperandList = (ins ps.BaseClass:$sbase, smrd_literal_offset:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000685
686 let LGKM_CNT = ps.LGKM_CNT;
687 let SMRD = ps.SMRD;
688 let mayLoad = ps.mayLoad;
689 let mayStore = ps.mayStore;
690 let hasSideEffects = ps.hasSideEffects;
691 let SchedRW = ps.SchedRW;
692 let UseNamedOperandTable = ps.UseNamedOperandTable;
693
694 let Inst{7-0} = 0xff;
695 let Inst{8} = 0;
696 let Inst{14-9} = sbase{6-1};
697 let Inst{21-15} = sdst{6-0};
698 let Inst{26-22} = op;
699 let Inst{31-27} = 0x18; //encoding
700 let Inst{63-32} = offset{31-0};
701}
702
703def S_LOAD_DWORD_IMM_ci : SMRD_Real_Load_IMM_ci <0x00, S_LOAD_DWORD_IMM>;
704def S_LOAD_DWORDX2_IMM_ci : SMRD_Real_Load_IMM_ci <0x01, S_LOAD_DWORDX2_IMM>;
705def S_LOAD_DWORDX4_IMM_ci : SMRD_Real_Load_IMM_ci <0x02, S_LOAD_DWORDX4_IMM>;
706def S_LOAD_DWORDX8_IMM_ci : SMRD_Real_Load_IMM_ci <0x03, S_LOAD_DWORDX8_IMM>;
707def S_LOAD_DWORDX16_IMM_ci : SMRD_Real_Load_IMM_ci <0x04, S_LOAD_DWORDX16_IMM>;
708def S_BUFFER_LOAD_DWORD_IMM_ci : SMRD_Real_Load_IMM_ci <0x08, S_BUFFER_LOAD_DWORD_IMM>;
709def S_BUFFER_LOAD_DWORDX2_IMM_ci : SMRD_Real_Load_IMM_ci <0x09, S_BUFFER_LOAD_DWORDX2_IMM>;
710def S_BUFFER_LOAD_DWORDX4_IMM_ci : SMRD_Real_Load_IMM_ci <0x0a, S_BUFFER_LOAD_DWORDX4_IMM>;
711def S_BUFFER_LOAD_DWORDX8_IMM_ci : SMRD_Real_Load_IMM_ci <0x0b, S_BUFFER_LOAD_DWORDX8_IMM>;
712def S_BUFFER_LOAD_DWORDX16_IMM_ci : SMRD_Real_Load_IMM_ci <0x0c, S_BUFFER_LOAD_DWORDX16_IMM>;
713
714class SMRD_Real_ci <bits<5> op, SM_Pseudo ps>
715 : SM_Real<ps>
716 , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
717 , Enc32 {
718
719 let AssemblerPredicates = [isCIOnly];
720 let DecoderNamespace = "CI";
721
722 let Inst{7-0} = !if(ps.has_offset, offset{7-0}, ?);
723 let Inst{8} = imm;
724 let Inst{14-9} = !if(ps.has_sbase, sbase{6-1}, ?);
725 let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
726 let Inst{26-22} = op;
727 let Inst{31-27} = 0x18; //encoding
728}
729
730def S_DCACHE_INV_VOL_ci : SMRD_Real_ci <0x1d, S_DCACHE_INV_VOL>;
Marek Olsak8973a0a2017-05-24 14:53:50 +0000731
732let AddedComplexity = SM_LOAD_PATTERN.AddedComplexity in {
733
Matt Arsenault90c75932017-10-03 00:06:41 +0000734class SMRD_Pattern_ci <string Instr, ValueType vt> : GCNPat <
Marek Olsak8973a0a2017-05-24 14:53:50 +0000735 (smrd_load (SMRDImm32 i64:$sbase, i32:$offset)),
Nicolai Haehnle4186cc72018-03-19 14:14:20 +0000736 (vt (!cast<InstSI>(Instr#"_IMM_ci") $sbase, $offset, 0))> {
Matt Arsenault90c75932017-10-03 00:06:41 +0000737 let OtherPredicates = [isCIOnly];
Marek Olsak8973a0a2017-05-24 14:53:50 +0000738}
739
740def : SMRD_Pattern_ci <"S_LOAD_DWORD", i32>;
741def : SMRD_Pattern_ci <"S_LOAD_DWORDX2", v2i32>;
742def : SMRD_Pattern_ci <"S_LOAD_DWORDX4", v4i32>;
743def : SMRD_Pattern_ci <"S_LOAD_DWORDX8", v8i32>;
744def : SMRD_Pattern_ci <"S_LOAD_DWORDX16", v16i32>;
745
Matt Arsenault90c75932017-10-03 00:06:41 +0000746def : GCNPat <
Marek Olsak8973a0a2017-05-24 14:53:50 +0000747 (SIload_constant v4i32:$sbase, (SMRDBufferImm32 i32:$offset)),
748 (S_BUFFER_LOAD_DWORD_IMM_ci $sbase, $offset, 0)> {
Matt Arsenault90c75932017-10-03 00:06:41 +0000749 let OtherPredicates = [isCI]; // should this be isCIOnly?
Marek Olsak8973a0a2017-05-24 14:53:50 +0000750}
751
752} // End let AddedComplexity = SM_LOAD_PATTERN.AddedComplexity
753