blob: 75e0133135c0d55a52381eb844afb84777c799fb [file] [log] [blame]
Valery Pykhtin1b138862016-09-01 09:56:47 +00001//===---- SMInstructions.td - Scalar Memory Instruction Defintions --------===//
2//
Chandler Carruth2946cd72019-01-19 08:50:56 +00003// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Valery Pykhtin1b138862016-09-01 09:56:47 +00006//
7//===----------------------------------------------------------------------===//
8
Artem Tamazov54bfd542016-10-31 16:07:39 +00009def smrd_offset_8 : NamedOperandU32<"SMRDOffset8",
10 NamedMatchClass<"SMRDOffset8">> {
Valery Pykhtin1b138862016-09-01 09:56:47 +000011 let OperandType = "OPERAND_IMMEDIATE";
12}
13
Artem Tamazov54bfd542016-10-31 16:07:39 +000014def smrd_offset_20 : NamedOperandU32<"SMRDOffset20",
15 NamedMatchClass<"SMRDOffset20">> {
16 let OperandType = "OPERAND_IMMEDIATE";
17}
Valery Pykhtin1b138862016-09-01 09:56:47 +000018
19//===----------------------------------------------------------------------===//
20// Scalar Memory classes
21//===----------------------------------------------------------------------===//
22
23class SM_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]> :
24 InstSI <outs, ins, "", pattern>,
25 SIMCInstr<opName, SIEncodingFamily.NONE> {
26 let isPseudo = 1;
27 let isCodeGenOnly = 1;
28
29 let LGKM_CNT = 1;
30 let SMRD = 1;
31 let mayStore = 0;
32 let mayLoad = 1;
33 let hasSideEffects = 0;
34 let UseNamedOperandTable = 1;
35 let SchedRW = [WriteSMEM];
36 let SubtargetPredicate = isGCN;
37
38 string Mnemonic = opName;
39 string AsmOperands = asmOps;
40
41 bits<1> has_sbase = 1;
42 bits<1> has_sdst = 1;
Matt Arsenault7b647552016-10-28 21:55:15 +000043 bit has_glc = 0;
Valery Pykhtin1b138862016-09-01 09:56:47 +000044 bits<1> has_offset = 1;
45 bits<1> offset_is_imm = 0;
46}
47
48class SM_Real <SM_Pseudo ps>
49 : InstSI<ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []> {
50
51 let isPseudo = 0;
52 let isCodeGenOnly = 0;
53
54 // copy relevant pseudo op flags
55 let SubtargetPredicate = ps.SubtargetPredicate;
56 let AsmMatchConverter = ps.AsmMatchConverter;
57
58 // encoding
59 bits<7> sbase;
60 bits<7> sdst;
61 bits<32> offset;
Matt Arsenault7b647552016-10-28 21:55:15 +000062 bits<1> imm = !if(ps.has_offset, ps.offset_is_imm, 0);
Valery Pykhtin1b138862016-09-01 09:56:47 +000063}
64
Dmitry Preobrazhensky59399ae2018-04-06 15:48:39 +000065class SM_Probe_Pseudo <string opName, dag ins, bit isImm>
66 : SM_Pseudo<opName, (outs), ins, " $sdata, $sbase, $offset"> {
67 let mayLoad = 0;
68 let mayStore = 0;
69 let has_glc = 0;
70 let LGKM_CNT = 0;
71 let ScalarStore = 0;
72 let hasSideEffects = 1;
73 let offset_is_imm = isImm;
74 let PseudoInstr = opName # !if(isImm, "_IMM", "_SGPR");
75}
76
Valery Pykhtin1b138862016-09-01 09:56:47 +000077class SM_Load_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]>
78 : SM_Pseudo<opName, outs, ins, asmOps, pattern> {
79 RegisterClass BaseClass;
Matt Arsenault7b647552016-10-28 21:55:15 +000080 let mayLoad = 1;
81 let mayStore = 0;
82 let has_glc = 1;
83}
84
85class SM_Store_Pseudo <string opName, dag ins, string asmOps, list<dag> pattern = []>
86 : SM_Pseudo<opName, (outs), ins, asmOps, pattern> {
87 RegisterClass BaseClass;
88 RegisterClass SrcClass;
89 let mayLoad = 0;
90 let mayStore = 1;
91 let has_glc = 1;
92 let ScalarStore = 1;
Valery Pykhtin1b138862016-09-01 09:56:47 +000093}
94
Dmitry Preobrazhensky4732d872018-04-06 15:08:42 +000095class SM_Discard_Pseudo <string opName, dag ins, bit isImm>
96 : SM_Pseudo<opName, (outs), ins, " $sbase, $offset"> {
97 let mayLoad = 0;
98 let mayStore = 0;
99 let has_glc = 0;
100 let has_sdst = 0;
101 let ScalarStore = 0;
102 let hasSideEffects = 1;
103 let offset_is_imm = isImm;
104 let PseudoInstr = opName # !if(isImm, "_IMM", "_SGPR");
105}
106
Valery Pykhtin1b138862016-09-01 09:56:47 +0000107multiclass SM_Pseudo_Loads<string opName,
108 RegisterClass baseClass,
109 RegisterClass dstClass> {
110 def _IMM : SM_Load_Pseudo <opName,
111 (outs dstClass:$sdst),
Matt Arsenault7b647552016-10-28 21:55:15 +0000112 (ins baseClass:$sbase, i32imm:$offset, i1imm:$glc),
113 " $sdst, $sbase, $offset$glc", []> {
Valery Pykhtin1b138862016-09-01 09:56:47 +0000114 let offset_is_imm = 1;
115 let BaseClass = baseClass;
116 let PseudoInstr = opName # "_IMM";
Matt Arsenault7b647552016-10-28 21:55:15 +0000117 let has_glc = 1;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000118 }
Matt Arsenault7b647552016-10-28 21:55:15 +0000119
Valery Pykhtin1b138862016-09-01 09:56:47 +0000120 def _SGPR : SM_Load_Pseudo <opName,
121 (outs dstClass:$sdst),
Matt Arsenault7b647552016-10-28 21:55:15 +0000122 (ins baseClass:$sbase, SReg_32:$soff, i1imm:$glc),
123 " $sdst, $sbase, $offset$glc", []> {
Valery Pykhtin1b138862016-09-01 09:56:47 +0000124 let BaseClass = baseClass;
125 let PseudoInstr = opName # "_SGPR";
Matt Arsenault7b647552016-10-28 21:55:15 +0000126 let has_glc = 1;
127 }
128}
129
130multiclass SM_Pseudo_Stores<string opName,
131 RegisterClass baseClass,
132 RegisterClass srcClass> {
133 def _IMM : SM_Store_Pseudo <opName,
134 (ins srcClass:$sdata, baseClass:$sbase, i32imm:$offset, i1imm:$glc),
135 " $sdata, $sbase, $offset$glc", []> {
136 let offset_is_imm = 1;
137 let BaseClass = baseClass;
138 let SrcClass = srcClass;
139 let PseudoInstr = opName # "_IMM";
140 }
141
142 def _SGPR : SM_Store_Pseudo <opName,
143 (ins srcClass:$sdata, baseClass:$sbase, SReg_32:$soff, i1imm:$glc),
144 " $sdata, $sbase, $offset$glc", []> {
145 let BaseClass = baseClass;
146 let SrcClass = srcClass;
147 let PseudoInstr = opName # "_SGPR";
Valery Pykhtin1b138862016-09-01 09:56:47 +0000148 }
149}
150
Dmitry Preobrazhensky4732d872018-04-06 15:08:42 +0000151multiclass SM_Pseudo_Discards<string opName> {
152 def _IMM : SM_Discard_Pseudo <opName, (ins SReg_64:$sbase, smrd_offset_20:$offset), 1>;
153 def _SGPR : SM_Discard_Pseudo <opName, (ins SReg_64:$sbase, SReg_32:$offset), 0>;
154}
155
Valery Pykhtin1b138862016-09-01 09:56:47 +0000156class SM_Time_Pseudo<string opName, SDPatternOperator node> : SM_Pseudo<
Matt Arsenault640c44b2016-11-29 19:39:53 +0000157 opName, (outs SReg_64_XEXEC:$sdst), (ins),
Valery Pykhtin1b138862016-09-01 09:56:47 +0000158 " $sdst", [(set i64:$sdst, (node))]> {
159 let hasSideEffects = 1;
Matt Arsenault73ce93b2017-12-08 20:01:02 +0000160 let mayStore = 0;
161 let mayLoad = 1;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000162 let has_sbase = 0;
163 let has_offset = 0;
164}
165
166class SM_Inval_Pseudo <string opName, SDPatternOperator node> : SM_Pseudo<
167 opName, (outs), (ins), "", [(node)]> {
168 let hasSideEffects = 1;
169 let mayStore = 1;
170 let has_sdst = 0;
171 let has_sbase = 0;
172 let has_offset = 0;
173}
174
Dmitry Preobrazhensky59399ae2018-04-06 15:48:39 +0000175multiclass SM_Pseudo_Probe<string opName, RegisterClass baseClass> {
176 def _IMM : SM_Probe_Pseudo <opName, (ins i8imm:$sdata, baseClass:$sbase, smrd_offset_20:$offset), 1>;
177 def _SGPR : SM_Probe_Pseudo <opName, (ins i8imm:$sdata, baseClass:$sbase, SReg_32:$offset), 0>;
178}
179
Dmitry Preobrazhensky6bad04e2018-04-02 16:10:25 +0000180//===----------------------------------------------------------------------===//
181// Scalar Atomic Memory Classes
182//===----------------------------------------------------------------------===//
183
184class SM_Atomic_Pseudo <string opName,
185 dag outs, dag ins, string asmOps, bit isRet>
186 : SM_Pseudo<opName, outs, ins, asmOps, []> {
187
188 bit glc = isRet;
189
190 let mayLoad = 1;
191 let mayStore = 1;
192 let has_glc = 1;
193
194 // Should these be set?
195 let ScalarStore = 1;
196 let hasSideEffects = 1;
197 let maybeAtomic = 1;
198}
199
200class SM_Pseudo_Atomic<string opName,
201 RegisterClass baseClass,
202 RegisterClass dataClass,
203 bit isImm,
204 bit isRet> :
205 SM_Atomic_Pseudo<opName,
206 !if(isRet, (outs dataClass:$sdst), (outs)),
207 !if(isImm,
208 (ins dataClass:$sdata, baseClass:$sbase, smrd_offset_20:$offset),
209 (ins dataClass:$sdata, baseClass:$sbase, SReg_32:$offset)),
210 !if(isRet, " $sdst", " $sdata") # ", $sbase, $offset" # !if(isRet, " glc", ""),
211 isRet> {
212 let offset_is_imm = isImm;
213 let PseudoInstr = opName # !if(isImm,
214 !if(isRet, "_IMM_RTN", "_IMM"),
215 !if(isRet, "_SGPR_RTN", "_SGPR"));
216
217 let Constraints = !if(isRet, "$sdst = $sdata", "");
218 let DisableEncoding = !if(isRet, "$sdata", "");
219}
220
221multiclass SM_Pseudo_Atomics<string opName,
222 RegisterClass baseClass,
223 RegisterClass dataClass> {
224 def _IMM : SM_Pseudo_Atomic <opName, baseClass, dataClass, 1, 0>;
225 def _SGPR : SM_Pseudo_Atomic <opName, baseClass, dataClass, 0, 0>;
226 def _IMM_RTN : SM_Pseudo_Atomic <opName, baseClass, dataClass, 1, 1>;
227 def _SGPR_RTN : SM_Pseudo_Atomic <opName, baseClass, dataClass, 0, 1>;
228}
Valery Pykhtin1b138862016-09-01 09:56:47 +0000229
230//===----------------------------------------------------------------------===//
231// Scalar Memory Instructions
232//===----------------------------------------------------------------------===//
233
234// We are using the SReg_32_XM0 and not the SReg_32 register class for 32-bit
235// SMRD instructions, because the SReg_32_XM0 register class does not include M0
236// and writing to M0 from an SMRD instruction will hang the GPU.
Matt Arsenault640c44b2016-11-29 19:39:53 +0000237
238// XXX - SMEM instructions do not allow exec for data operand, but
239// does sdst for SMRD on SI/CI?
240defm S_LOAD_DWORD : SM_Pseudo_Loads <"s_load_dword", SReg_64, SReg_32_XM0_XEXEC>;
241defm S_LOAD_DWORDX2 : SM_Pseudo_Loads <"s_load_dwordx2", SReg_64, SReg_64_XEXEC>;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000242defm S_LOAD_DWORDX4 : SM_Pseudo_Loads <"s_load_dwordx4", SReg_64, SReg_128>;
243defm S_LOAD_DWORDX8 : SM_Pseudo_Loads <"s_load_dwordx8", SReg_64, SReg_256>;
244defm S_LOAD_DWORDX16 : SM_Pseudo_Loads <"s_load_dwordx16", SReg_64, SReg_512>;
245
246defm S_BUFFER_LOAD_DWORD : SM_Pseudo_Loads <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000247 "s_buffer_load_dword", SReg_128, SReg_32_XM0_XEXEC
Valery Pykhtin1b138862016-09-01 09:56:47 +0000248>;
249
Matt Arsenault640c44b2016-11-29 19:39:53 +0000250// FIXME: exec_lo/exec_hi appear to be allowed for SMRD loads on
251// SI/CI, bit disallowed for SMEM on VI.
Valery Pykhtin1b138862016-09-01 09:56:47 +0000252defm S_BUFFER_LOAD_DWORDX2 : SM_Pseudo_Loads <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000253 "s_buffer_load_dwordx2", SReg_128, SReg_64_XEXEC
Valery Pykhtin1b138862016-09-01 09:56:47 +0000254>;
255
256defm S_BUFFER_LOAD_DWORDX4 : SM_Pseudo_Loads <
257 "s_buffer_load_dwordx4", SReg_128, SReg_128
258>;
259
260defm S_BUFFER_LOAD_DWORDX8 : SM_Pseudo_Loads <
261 "s_buffer_load_dwordx8", SReg_128, SReg_256
262>;
263
264defm S_BUFFER_LOAD_DWORDX16 : SM_Pseudo_Loads <
265 "s_buffer_load_dwordx16", SReg_128, SReg_512
266>;
267
Matt Arsenault640c44b2016-11-29 19:39:53 +0000268defm S_STORE_DWORD : SM_Pseudo_Stores <"s_store_dword", SReg_64, SReg_32_XM0_XEXEC>;
269defm S_STORE_DWORDX2 : SM_Pseudo_Stores <"s_store_dwordx2", SReg_64, SReg_64_XEXEC>;
Matt Arsenault7b647552016-10-28 21:55:15 +0000270defm S_STORE_DWORDX4 : SM_Pseudo_Stores <"s_store_dwordx4", SReg_64, SReg_128>;
271
272defm S_BUFFER_STORE_DWORD : SM_Pseudo_Stores <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000273 "s_buffer_store_dword", SReg_128, SReg_32_XM0_XEXEC
Matt Arsenault7b647552016-10-28 21:55:15 +0000274>;
275
276defm S_BUFFER_STORE_DWORDX2 : SM_Pseudo_Stores <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000277 "s_buffer_store_dwordx2", SReg_128, SReg_64_XEXEC
Matt Arsenault7b647552016-10-28 21:55:15 +0000278>;
279
280defm S_BUFFER_STORE_DWORDX4 : SM_Pseudo_Stores <
281 "s_buffer_store_dwordx4", SReg_128, SReg_128
282>;
283
284
Valery Pykhtin1b138862016-09-01 09:56:47 +0000285def S_MEMTIME : SM_Time_Pseudo <"s_memtime", int_amdgcn_s_memtime>;
286def S_DCACHE_INV : SM_Inval_Pseudo <"s_dcache_inv", int_amdgcn_s_dcache_inv>;
287
288let SubtargetPredicate = isCIVI in {
289def S_DCACHE_INV_VOL : SM_Inval_Pseudo <"s_dcache_inv_vol", int_amdgcn_s_dcache_inv_vol>;
290} // let SubtargetPredicate = isCIVI
291
292let SubtargetPredicate = isVI in {
293def S_DCACHE_WB : SM_Inval_Pseudo <"s_dcache_wb", int_amdgcn_s_dcache_wb>;
294def S_DCACHE_WB_VOL : SM_Inval_Pseudo <"s_dcache_wb_vol", int_amdgcn_s_dcache_wb_vol>;
295def S_MEMREALTIME : SM_Time_Pseudo <"s_memrealtime", int_amdgcn_s_memrealtime>;
Dmitry Preobrazhensky59399ae2018-04-06 15:48:39 +0000296
297defm S_ATC_PROBE : SM_Pseudo_Probe <"s_atc_probe", SReg_64>;
298defm S_ATC_PROBE_BUFFER : SM_Pseudo_Probe <"s_atc_probe_buffer", SReg_128>;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000299} // SubtargetPredicate = isVI
300
Dmitry Preobrazhenskydd2b9292018-03-28 14:08:03 +0000301let SubtargetPredicate = HasFlatScratchInsts, Uses = [FLAT_SCR] in {
302defm S_SCRATCH_LOAD_DWORD : SM_Pseudo_Loads <"s_scratch_load_dword", SReg_64, SReg_32_XM0_XEXEC>;
303defm S_SCRATCH_LOAD_DWORDX2 : SM_Pseudo_Loads <"s_scratch_load_dwordx2", SReg_64, SReg_64_XEXEC>;
304defm S_SCRATCH_LOAD_DWORDX4 : SM_Pseudo_Loads <"s_scratch_load_dwordx4", SReg_64, SReg_128>;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000305
Dmitry Preobrazhenskydd2b9292018-03-28 14:08:03 +0000306defm S_SCRATCH_STORE_DWORD : SM_Pseudo_Stores <"s_scratch_store_dword", SReg_64, SReg_32_XM0_XEXEC>;
307defm S_SCRATCH_STORE_DWORDX2 : SM_Pseudo_Stores <"s_scratch_store_dwordx2", SReg_64, SReg_64_XEXEC>;
308defm S_SCRATCH_STORE_DWORDX4 : SM_Pseudo_Stores <"s_scratch_store_dwordx4", SReg_64, SReg_128>;
309} // SubtargetPredicate = HasFlatScratchInsts
Valery Pykhtin1b138862016-09-01 09:56:47 +0000310
Dmitry Preobrazhensky6bad04e2018-04-02 16:10:25 +0000311let SubtargetPredicate = HasScalarAtomics in {
312
313defm S_BUFFER_ATOMIC_SWAP : SM_Pseudo_Atomics <"s_buffer_atomic_swap", SReg_128, SReg_32_XM0_XEXEC>;
314defm S_BUFFER_ATOMIC_CMPSWAP : SM_Pseudo_Atomics <"s_buffer_atomic_cmpswap", SReg_128, SReg_64_XEXEC>;
315defm S_BUFFER_ATOMIC_ADD : SM_Pseudo_Atomics <"s_buffer_atomic_add", SReg_128, SReg_32_XM0_XEXEC>;
316defm S_BUFFER_ATOMIC_SUB : SM_Pseudo_Atomics <"s_buffer_atomic_sub", SReg_128, SReg_32_XM0_XEXEC>;
317defm S_BUFFER_ATOMIC_SMIN : SM_Pseudo_Atomics <"s_buffer_atomic_smin", SReg_128, SReg_32_XM0_XEXEC>;
318defm S_BUFFER_ATOMIC_UMIN : SM_Pseudo_Atomics <"s_buffer_atomic_umin", SReg_128, SReg_32_XM0_XEXEC>;
319defm S_BUFFER_ATOMIC_SMAX : SM_Pseudo_Atomics <"s_buffer_atomic_smax", SReg_128, SReg_32_XM0_XEXEC>;
320defm S_BUFFER_ATOMIC_UMAX : SM_Pseudo_Atomics <"s_buffer_atomic_umax", SReg_128, SReg_32_XM0_XEXEC>;
321defm S_BUFFER_ATOMIC_AND : SM_Pseudo_Atomics <"s_buffer_atomic_and", SReg_128, SReg_32_XM0_XEXEC>;
322defm S_BUFFER_ATOMIC_OR : SM_Pseudo_Atomics <"s_buffer_atomic_or", SReg_128, SReg_32_XM0_XEXEC>;
323defm S_BUFFER_ATOMIC_XOR : SM_Pseudo_Atomics <"s_buffer_atomic_xor", SReg_128, SReg_32_XM0_XEXEC>;
324defm S_BUFFER_ATOMIC_INC : SM_Pseudo_Atomics <"s_buffer_atomic_inc", SReg_128, SReg_32_XM0_XEXEC>;
325defm S_BUFFER_ATOMIC_DEC : SM_Pseudo_Atomics <"s_buffer_atomic_dec", SReg_128, SReg_32_XM0_XEXEC>;
326
327defm S_BUFFER_ATOMIC_SWAP_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_swap_x2", SReg_128, SReg_64_XEXEC>;
328defm S_BUFFER_ATOMIC_CMPSWAP_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_cmpswap_x2", SReg_128, SReg_128>;
329defm S_BUFFER_ATOMIC_ADD_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_add_x2", SReg_128, SReg_64_XEXEC>;
330defm S_BUFFER_ATOMIC_SUB_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_sub_x2", SReg_128, SReg_64_XEXEC>;
331defm S_BUFFER_ATOMIC_SMIN_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_smin_x2", SReg_128, SReg_64_XEXEC>;
332defm S_BUFFER_ATOMIC_UMIN_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_umin_x2", SReg_128, SReg_64_XEXEC>;
333defm S_BUFFER_ATOMIC_SMAX_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_smax_x2", SReg_128, SReg_64_XEXEC>;
334defm S_BUFFER_ATOMIC_UMAX_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_umax_x2", SReg_128, SReg_64_XEXEC>;
335defm S_BUFFER_ATOMIC_AND_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_and_x2", SReg_128, SReg_64_XEXEC>;
336defm S_BUFFER_ATOMIC_OR_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_or_x2", SReg_128, SReg_64_XEXEC>;
337defm S_BUFFER_ATOMIC_XOR_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_xor_x2", SReg_128, SReg_64_XEXEC>;
338defm S_BUFFER_ATOMIC_INC_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_inc_x2", SReg_128, SReg_64_XEXEC>;
339defm S_BUFFER_ATOMIC_DEC_X2 : SM_Pseudo_Atomics <"s_buffer_atomic_dec_x2", SReg_128, SReg_64_XEXEC>;
340
341defm S_ATOMIC_SWAP : SM_Pseudo_Atomics <"s_atomic_swap", SReg_64, SReg_32_XM0_XEXEC>;
342defm S_ATOMIC_CMPSWAP : SM_Pseudo_Atomics <"s_atomic_cmpswap", SReg_64, SReg_64_XEXEC>;
343defm S_ATOMIC_ADD : SM_Pseudo_Atomics <"s_atomic_add", SReg_64, SReg_32_XM0_XEXEC>;
344defm S_ATOMIC_SUB : SM_Pseudo_Atomics <"s_atomic_sub", SReg_64, SReg_32_XM0_XEXEC>;
345defm S_ATOMIC_SMIN : SM_Pseudo_Atomics <"s_atomic_smin", SReg_64, SReg_32_XM0_XEXEC>;
346defm S_ATOMIC_UMIN : SM_Pseudo_Atomics <"s_atomic_umin", SReg_64, SReg_32_XM0_XEXEC>;
347defm S_ATOMIC_SMAX : SM_Pseudo_Atomics <"s_atomic_smax", SReg_64, SReg_32_XM0_XEXEC>;
348defm S_ATOMIC_UMAX : SM_Pseudo_Atomics <"s_atomic_umax", SReg_64, SReg_32_XM0_XEXEC>;
349defm S_ATOMIC_AND : SM_Pseudo_Atomics <"s_atomic_and", SReg_64, SReg_32_XM0_XEXEC>;
350defm S_ATOMIC_OR : SM_Pseudo_Atomics <"s_atomic_or", SReg_64, SReg_32_XM0_XEXEC>;
351defm S_ATOMIC_XOR : SM_Pseudo_Atomics <"s_atomic_xor", SReg_64, SReg_32_XM0_XEXEC>;
352defm S_ATOMIC_INC : SM_Pseudo_Atomics <"s_atomic_inc", SReg_64, SReg_32_XM0_XEXEC>;
353defm S_ATOMIC_DEC : SM_Pseudo_Atomics <"s_atomic_dec", SReg_64, SReg_32_XM0_XEXEC>;
354
355defm S_ATOMIC_SWAP_X2 : SM_Pseudo_Atomics <"s_atomic_swap_x2", SReg_64, SReg_64_XEXEC>;
356defm S_ATOMIC_CMPSWAP_X2 : SM_Pseudo_Atomics <"s_atomic_cmpswap_x2", SReg_64, SReg_128>;
357defm S_ATOMIC_ADD_X2 : SM_Pseudo_Atomics <"s_atomic_add_x2", SReg_64, SReg_64_XEXEC>;
358defm S_ATOMIC_SUB_X2 : SM_Pseudo_Atomics <"s_atomic_sub_x2", SReg_64, SReg_64_XEXEC>;
359defm S_ATOMIC_SMIN_X2 : SM_Pseudo_Atomics <"s_atomic_smin_x2", SReg_64, SReg_64_XEXEC>;
360defm S_ATOMIC_UMIN_X2 : SM_Pseudo_Atomics <"s_atomic_umin_x2", SReg_64, SReg_64_XEXEC>;
361defm S_ATOMIC_SMAX_X2 : SM_Pseudo_Atomics <"s_atomic_smax_x2", SReg_64, SReg_64_XEXEC>;
362defm S_ATOMIC_UMAX_X2 : SM_Pseudo_Atomics <"s_atomic_umax_x2", SReg_64, SReg_64_XEXEC>;
363defm S_ATOMIC_AND_X2 : SM_Pseudo_Atomics <"s_atomic_and_x2", SReg_64, SReg_64_XEXEC>;
364defm S_ATOMIC_OR_X2 : SM_Pseudo_Atomics <"s_atomic_or_x2", SReg_64, SReg_64_XEXEC>;
365defm S_ATOMIC_XOR_X2 : SM_Pseudo_Atomics <"s_atomic_xor_x2", SReg_64, SReg_64_XEXEC>;
366defm S_ATOMIC_INC_X2 : SM_Pseudo_Atomics <"s_atomic_inc_x2", SReg_64, SReg_64_XEXEC>;
367defm S_ATOMIC_DEC_X2 : SM_Pseudo_Atomics <"s_atomic_dec_x2", SReg_64, SReg_64_XEXEC>;
368
369} // let SubtargetPredicate = HasScalarAtomics
370
Dmitry Preobrazhensky4732d872018-04-06 15:08:42 +0000371let SubtargetPredicate = isGFX9 in {
372defm S_DCACHE_DISCARD : SM_Pseudo_Discards <"s_dcache_discard">;
373defm S_DCACHE_DISCARD_X2 : SM_Pseudo_Discards <"s_dcache_discard_x2">;
374}
375
Valery Pykhtin1b138862016-09-01 09:56:47 +0000376//===----------------------------------------------------------------------===//
Valery Pykhtin1b138862016-09-01 09:56:47 +0000377// Targets
378//===----------------------------------------------------------------------===//
379
380//===----------------------------------------------------------------------===//
381// SI
382//===----------------------------------------------------------------------===//
383
384class SMRD_Real_si <bits<5> op, SM_Pseudo ps>
385 : SM_Real<ps>
386 , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
387 , Enc32 {
388
389 let AssemblerPredicates = [isSICI];
390 let DecoderNamespace = "SICI";
391
392 let Inst{7-0} = !if(ps.has_offset, offset{7-0}, ?);
393 let Inst{8} = imm;
394 let Inst{14-9} = !if(ps.has_sbase, sbase{6-1}, ?);
395 let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
396 let Inst{26-22} = op;
397 let Inst{31-27} = 0x18; //encoding
398}
399
Matt Arsenault7b647552016-10-28 21:55:15 +0000400// FIXME: Assembler should reject trying to use glc on SMRD
401// instructions on SI.
Valery Pykhtin1b138862016-09-01 09:56:47 +0000402multiclass SM_Real_Loads_si<bits<5> op, string ps,
403 SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
404 SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000405
Valery Pykhtin1b138862016-09-01 09:56:47 +0000406 def _IMM_si : SMRD_Real_si <op, immPs> {
Artem Tamazov54bfd542016-10-31 16:07:39 +0000407 let InOperandList = (ins immPs.BaseClass:$sbase, smrd_offset_8:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000408 }
Matt Arsenault7b647552016-10-28 21:55:15 +0000409
410 // FIXME: The operand name $offset is inconsistent with $soff used
411 // in the pseudo
Valery Pykhtin1b138862016-09-01 09:56:47 +0000412 def _SGPR_si : SMRD_Real_si <op, sgprPs> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000413 let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000414 }
Matt Arsenault7b647552016-10-28 21:55:15 +0000415
Valery Pykhtin1b138862016-09-01 09:56:47 +0000416}
417
418defm S_LOAD_DWORD : SM_Real_Loads_si <0x00, "S_LOAD_DWORD">;
419defm S_LOAD_DWORDX2 : SM_Real_Loads_si <0x01, "S_LOAD_DWORDX2">;
420defm S_LOAD_DWORDX4 : SM_Real_Loads_si <0x02, "S_LOAD_DWORDX4">;
421defm S_LOAD_DWORDX8 : SM_Real_Loads_si <0x03, "S_LOAD_DWORDX8">;
422defm S_LOAD_DWORDX16 : SM_Real_Loads_si <0x04, "S_LOAD_DWORDX16">;
423defm S_BUFFER_LOAD_DWORD : SM_Real_Loads_si <0x08, "S_BUFFER_LOAD_DWORD">;
424defm S_BUFFER_LOAD_DWORDX2 : SM_Real_Loads_si <0x09, "S_BUFFER_LOAD_DWORDX2">;
425defm S_BUFFER_LOAD_DWORDX4 : SM_Real_Loads_si <0x0a, "S_BUFFER_LOAD_DWORDX4">;
426defm S_BUFFER_LOAD_DWORDX8 : SM_Real_Loads_si <0x0b, "S_BUFFER_LOAD_DWORDX8">;
427defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_si <0x0c, "S_BUFFER_LOAD_DWORDX16">;
428
429def S_MEMTIME_si : SMRD_Real_si <0x1e, S_MEMTIME>;
430def S_DCACHE_INV_si : SMRD_Real_si <0x1f, S_DCACHE_INV>;
431
432
433//===----------------------------------------------------------------------===//
434// VI
435//===----------------------------------------------------------------------===//
436
437class SMEM_Real_vi <bits<8> op, SM_Pseudo ps>
438 : SM_Real<ps>
439 , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.VI>
440 , Enc64 {
Matt Arsenault7b647552016-10-28 21:55:15 +0000441 bit glc;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000442
443 let AssemblerPredicates = [isVI];
444 let DecoderNamespace = "VI";
445
446 let Inst{5-0} = !if(ps.has_sbase, sbase{6-1}, ?);
447 let Inst{12-6} = !if(ps.has_sdst, sdst{6-0}, ?);
448
Matt Arsenault7b647552016-10-28 21:55:15 +0000449 let Inst{16} = !if(ps.has_glc, glc, ?);
450 let Inst{17} = imm;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000451 let Inst{25-18} = op;
452 let Inst{31-26} = 0x30; //encoding
453 let Inst{51-32} = !if(ps.has_offset, offset{19-0}, ?);
454}
455
456multiclass SM_Real_Loads_vi<bits<8> op, string ps,
457 SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
458 SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
459 def _IMM_vi : SMEM_Real_vi <op, immPs> {
Artem Tamazov54bfd542016-10-31 16:07:39 +0000460 let InOperandList = (ins immPs.BaseClass:$sbase, smrd_offset_20:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000461 }
462 def _SGPR_vi : SMEM_Real_vi <op, sgprPs> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000463 let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc);
464 }
465}
466
Sam Kolton83102d92016-12-05 09:58:51 +0000467class SMEM_Real_Store_vi <bits<8> op, SM_Pseudo ps> : SMEM_Real_vi <op, ps> {
468 // encoding
469 bits<7> sdata;
470
471 let sdst = ?;
472 let Inst{12-6} = !if(ps.has_sdst, sdata{6-0}, ?);
473}
474
Matt Arsenault7b647552016-10-28 21:55:15 +0000475multiclass SM_Real_Stores_vi<bits<8> op, string ps,
476 SM_Store_Pseudo immPs = !cast<SM_Store_Pseudo>(ps#_IMM),
477 SM_Store_Pseudo sgprPs = !cast<SM_Store_Pseudo>(ps#_SGPR)> {
478 // FIXME: The operand name $offset is inconsistent with $soff used
479 // in the pseudo
Sam Kolton83102d92016-12-05 09:58:51 +0000480 def _IMM_vi : SMEM_Real_Store_vi <op, immPs> {
Artem Tamazov54bfd542016-10-31 16:07:39 +0000481 let InOperandList = (ins immPs.SrcClass:$sdata, immPs.BaseClass:$sbase, smrd_offset_20:$offset, GLC:$glc);
Matt Arsenault7b647552016-10-28 21:55:15 +0000482 }
483
Sam Kolton83102d92016-12-05 09:58:51 +0000484 def _SGPR_vi : SMEM_Real_Store_vi <op, sgprPs> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000485 let InOperandList = (ins sgprPs.SrcClass:$sdata, sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000486 }
487}
488
Dmitry Preobrazhensky59399ae2018-04-06 15:48:39 +0000489multiclass SM_Real_Probe_vi<bits<8> op, string ps> {
490 def _IMM_vi : SMEM_Real_Store_vi <op, !cast<SM_Probe_Pseudo>(ps#_IMM)>;
491 def _SGPR_vi : SMEM_Real_Store_vi <op, !cast<SM_Probe_Pseudo>(ps#_SGPR)>;
492}
493
Valery Pykhtin1b138862016-09-01 09:56:47 +0000494defm S_LOAD_DWORD : SM_Real_Loads_vi <0x00, "S_LOAD_DWORD">;
495defm S_LOAD_DWORDX2 : SM_Real_Loads_vi <0x01, "S_LOAD_DWORDX2">;
496defm S_LOAD_DWORDX4 : SM_Real_Loads_vi <0x02, "S_LOAD_DWORDX4">;
497defm S_LOAD_DWORDX8 : SM_Real_Loads_vi <0x03, "S_LOAD_DWORDX8">;
498defm S_LOAD_DWORDX16 : SM_Real_Loads_vi <0x04, "S_LOAD_DWORDX16">;
499defm S_BUFFER_LOAD_DWORD : SM_Real_Loads_vi <0x08, "S_BUFFER_LOAD_DWORD">;
500defm S_BUFFER_LOAD_DWORDX2 : SM_Real_Loads_vi <0x09, "S_BUFFER_LOAD_DWORDX2">;
501defm S_BUFFER_LOAD_DWORDX4 : SM_Real_Loads_vi <0x0a, "S_BUFFER_LOAD_DWORDX4">;
502defm S_BUFFER_LOAD_DWORDX8 : SM_Real_Loads_vi <0x0b, "S_BUFFER_LOAD_DWORDX8">;
503defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_vi <0x0c, "S_BUFFER_LOAD_DWORDX16">;
504
Matt Arsenault7b647552016-10-28 21:55:15 +0000505defm S_STORE_DWORD : SM_Real_Stores_vi <0x10, "S_STORE_DWORD">;
506defm S_STORE_DWORDX2 : SM_Real_Stores_vi <0x11, "S_STORE_DWORDX2">;
507defm S_STORE_DWORDX4 : SM_Real_Stores_vi <0x12, "S_STORE_DWORDX4">;
508
509defm S_BUFFER_STORE_DWORD : SM_Real_Stores_vi <0x18, "S_BUFFER_STORE_DWORD">;
510defm S_BUFFER_STORE_DWORDX2 : SM_Real_Stores_vi <0x19, "S_BUFFER_STORE_DWORDX2">;
511defm S_BUFFER_STORE_DWORDX4 : SM_Real_Stores_vi <0x1a, "S_BUFFER_STORE_DWORDX4">;
512
Sam Kolton83102d92016-12-05 09:58:51 +0000513// These instructions use same encoding
Valery Pykhtin1b138862016-09-01 09:56:47 +0000514def S_DCACHE_INV_vi : SMEM_Real_vi <0x20, S_DCACHE_INV>;
515def S_DCACHE_WB_vi : SMEM_Real_vi <0x21, S_DCACHE_WB>;
516def S_DCACHE_INV_VOL_vi : SMEM_Real_vi <0x22, S_DCACHE_INV_VOL>;
517def S_DCACHE_WB_VOL_vi : SMEM_Real_vi <0x23, S_DCACHE_WB_VOL>;
518def S_MEMTIME_vi : SMEM_Real_vi <0x24, S_MEMTIME>;
519def S_MEMREALTIME_vi : SMEM_Real_vi <0x25, S_MEMREALTIME>;
520
Dmitry Preobrazhenskydd2b9292018-03-28 14:08:03 +0000521defm S_SCRATCH_LOAD_DWORD : SM_Real_Loads_vi <0x05, "S_SCRATCH_LOAD_DWORD">;
522defm S_SCRATCH_LOAD_DWORDX2 : SM_Real_Loads_vi <0x06, "S_SCRATCH_LOAD_DWORDX2">;
523defm S_SCRATCH_LOAD_DWORDX4 : SM_Real_Loads_vi <0x07, "S_SCRATCH_LOAD_DWORDX4">;
524
525defm S_SCRATCH_STORE_DWORD : SM_Real_Stores_vi <0x15, "S_SCRATCH_STORE_DWORD">;
526defm S_SCRATCH_STORE_DWORDX2 : SM_Real_Stores_vi <0x16, "S_SCRATCH_STORE_DWORDX2">;
527defm S_SCRATCH_STORE_DWORDX4 : SM_Real_Stores_vi <0x17, "S_SCRATCH_STORE_DWORDX4">;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000528
Dmitry Preobrazhensky59399ae2018-04-06 15:48:39 +0000529defm S_ATC_PROBE : SM_Real_Probe_vi <0x26, "S_ATC_PROBE">;
530defm S_ATC_PROBE_BUFFER : SM_Real_Probe_vi <0x27, "S_ATC_PROBE_BUFFER">;
531
Valery Pykhtin1b138862016-09-01 09:56:47 +0000532//===----------------------------------------------------------------------===//
Dmitry Preobrazhensky6bad04e2018-04-02 16:10:25 +0000533// GFX9
534//===----------------------------------------------------------------------===//
535
536class SMEM_Atomic_Real_vi <bits<8> op, SM_Atomic_Pseudo ps>
537 : SMEM_Real_vi <op, ps> {
538
539 bits<7> sdata;
540
541 let Constraints = ps.Constraints;
542 let DisableEncoding = ps.DisableEncoding;
543
544 let glc = ps.glc;
545 let Inst{12-6} = !if(glc, sdst{6-0}, sdata{6-0});
546}
547
548multiclass SM_Real_Atomics_vi<bits<8> op, string ps> {
549 def _IMM_vi : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_IMM)>;
550 def _SGPR_vi : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR)>;
551 def _IMM_RTN_vi : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_IMM_RTN)>;
552 def _SGPR_RTN_vi : SMEM_Atomic_Real_vi <op, !cast<SM_Atomic_Pseudo>(ps#_SGPR_RTN)>;
553}
554
555defm S_BUFFER_ATOMIC_SWAP : SM_Real_Atomics_vi <0x40, "S_BUFFER_ATOMIC_SWAP">;
556defm S_BUFFER_ATOMIC_CMPSWAP : SM_Real_Atomics_vi <0x41, "S_BUFFER_ATOMIC_CMPSWAP">;
557defm S_BUFFER_ATOMIC_ADD : SM_Real_Atomics_vi <0x42, "S_BUFFER_ATOMIC_ADD">;
558defm S_BUFFER_ATOMIC_SUB : SM_Real_Atomics_vi <0x43, "S_BUFFER_ATOMIC_SUB">;
559defm S_BUFFER_ATOMIC_SMIN : SM_Real_Atomics_vi <0x44, "S_BUFFER_ATOMIC_SMIN">;
560defm S_BUFFER_ATOMIC_UMIN : SM_Real_Atomics_vi <0x45, "S_BUFFER_ATOMIC_UMIN">;
561defm S_BUFFER_ATOMIC_SMAX : SM_Real_Atomics_vi <0x46, "S_BUFFER_ATOMIC_SMAX">;
562defm S_BUFFER_ATOMIC_UMAX : SM_Real_Atomics_vi <0x47, "S_BUFFER_ATOMIC_UMAX">;
563defm S_BUFFER_ATOMIC_AND : SM_Real_Atomics_vi <0x48, "S_BUFFER_ATOMIC_AND">;
564defm S_BUFFER_ATOMIC_OR : SM_Real_Atomics_vi <0x49, "S_BUFFER_ATOMIC_OR">;
565defm S_BUFFER_ATOMIC_XOR : SM_Real_Atomics_vi <0x4a, "S_BUFFER_ATOMIC_XOR">;
566defm S_BUFFER_ATOMIC_INC : SM_Real_Atomics_vi <0x4b, "S_BUFFER_ATOMIC_INC">;
567defm S_BUFFER_ATOMIC_DEC : SM_Real_Atomics_vi <0x4c, "S_BUFFER_ATOMIC_DEC">;
568
569defm S_BUFFER_ATOMIC_SWAP_X2 : SM_Real_Atomics_vi <0x60, "S_BUFFER_ATOMIC_SWAP_X2">;
570defm S_BUFFER_ATOMIC_CMPSWAP_X2 : SM_Real_Atomics_vi <0x61, "S_BUFFER_ATOMIC_CMPSWAP_X2">;
571defm S_BUFFER_ATOMIC_ADD_X2 : SM_Real_Atomics_vi <0x62, "S_BUFFER_ATOMIC_ADD_X2">;
572defm S_BUFFER_ATOMIC_SUB_X2 : SM_Real_Atomics_vi <0x63, "S_BUFFER_ATOMIC_SUB_X2">;
573defm S_BUFFER_ATOMIC_SMIN_X2 : SM_Real_Atomics_vi <0x64, "S_BUFFER_ATOMIC_SMIN_X2">;
574defm S_BUFFER_ATOMIC_UMIN_X2 : SM_Real_Atomics_vi <0x65, "S_BUFFER_ATOMIC_UMIN_X2">;
575defm S_BUFFER_ATOMIC_SMAX_X2 : SM_Real_Atomics_vi <0x66, "S_BUFFER_ATOMIC_SMAX_X2">;
576defm S_BUFFER_ATOMIC_UMAX_X2 : SM_Real_Atomics_vi <0x67, "S_BUFFER_ATOMIC_UMAX_X2">;
577defm S_BUFFER_ATOMIC_AND_X2 : SM_Real_Atomics_vi <0x68, "S_BUFFER_ATOMIC_AND_X2">;
578defm S_BUFFER_ATOMIC_OR_X2 : SM_Real_Atomics_vi <0x69, "S_BUFFER_ATOMIC_OR_X2">;
579defm S_BUFFER_ATOMIC_XOR_X2 : SM_Real_Atomics_vi <0x6a, "S_BUFFER_ATOMIC_XOR_X2">;
580defm S_BUFFER_ATOMIC_INC_X2 : SM_Real_Atomics_vi <0x6b, "S_BUFFER_ATOMIC_INC_X2">;
581defm S_BUFFER_ATOMIC_DEC_X2 : SM_Real_Atomics_vi <0x6c, "S_BUFFER_ATOMIC_DEC_X2">;
582
583defm S_ATOMIC_SWAP : SM_Real_Atomics_vi <0x80, "S_ATOMIC_SWAP">;
584defm S_ATOMIC_CMPSWAP : SM_Real_Atomics_vi <0x81, "S_ATOMIC_CMPSWAP">;
585defm S_ATOMIC_ADD : SM_Real_Atomics_vi <0x82, "S_ATOMIC_ADD">;
586defm S_ATOMIC_SUB : SM_Real_Atomics_vi <0x83, "S_ATOMIC_SUB">;
587defm S_ATOMIC_SMIN : SM_Real_Atomics_vi <0x84, "S_ATOMIC_SMIN">;
588defm S_ATOMIC_UMIN : SM_Real_Atomics_vi <0x85, "S_ATOMIC_UMIN">;
589defm S_ATOMIC_SMAX : SM_Real_Atomics_vi <0x86, "S_ATOMIC_SMAX">;
590defm S_ATOMIC_UMAX : SM_Real_Atomics_vi <0x87, "S_ATOMIC_UMAX">;
591defm S_ATOMIC_AND : SM_Real_Atomics_vi <0x88, "S_ATOMIC_AND">;
592defm S_ATOMIC_OR : SM_Real_Atomics_vi <0x89, "S_ATOMIC_OR">;
593defm S_ATOMIC_XOR : SM_Real_Atomics_vi <0x8a, "S_ATOMIC_XOR">;
594defm S_ATOMIC_INC : SM_Real_Atomics_vi <0x8b, "S_ATOMIC_INC">;
595defm S_ATOMIC_DEC : SM_Real_Atomics_vi <0x8c, "S_ATOMIC_DEC">;
596
597defm S_ATOMIC_SWAP_X2 : SM_Real_Atomics_vi <0xa0, "S_ATOMIC_SWAP_X2">;
598defm S_ATOMIC_CMPSWAP_X2 : SM_Real_Atomics_vi <0xa1, "S_ATOMIC_CMPSWAP_X2">;
599defm S_ATOMIC_ADD_X2 : SM_Real_Atomics_vi <0xa2, "S_ATOMIC_ADD_X2">;
600defm S_ATOMIC_SUB_X2 : SM_Real_Atomics_vi <0xa3, "S_ATOMIC_SUB_X2">;
601defm S_ATOMIC_SMIN_X2 : SM_Real_Atomics_vi <0xa4, "S_ATOMIC_SMIN_X2">;
602defm S_ATOMIC_UMIN_X2 : SM_Real_Atomics_vi <0xa5, "S_ATOMIC_UMIN_X2">;
603defm S_ATOMIC_SMAX_X2 : SM_Real_Atomics_vi <0xa6, "S_ATOMIC_SMAX_X2">;
604defm S_ATOMIC_UMAX_X2 : SM_Real_Atomics_vi <0xa7, "S_ATOMIC_UMAX_X2">;
605defm S_ATOMIC_AND_X2 : SM_Real_Atomics_vi <0xa8, "S_ATOMIC_AND_X2">;
606defm S_ATOMIC_OR_X2 : SM_Real_Atomics_vi <0xa9, "S_ATOMIC_OR_X2">;
607defm S_ATOMIC_XOR_X2 : SM_Real_Atomics_vi <0xaa, "S_ATOMIC_XOR_X2">;
608defm S_ATOMIC_INC_X2 : SM_Real_Atomics_vi <0xab, "S_ATOMIC_INC_X2">;
609defm S_ATOMIC_DEC_X2 : SM_Real_Atomics_vi <0xac, "S_ATOMIC_DEC_X2">;
610
Dmitry Preobrazhensky4732d872018-04-06 15:08:42 +0000611multiclass SM_Real_Discard_vi<bits<8> op, string ps> {
612 def _IMM_vi : SMEM_Real_vi <op, !cast<SM_Discard_Pseudo>(ps#_IMM)>;
613 def _SGPR_vi : SMEM_Real_vi <op, !cast<SM_Discard_Pseudo>(ps#_SGPR)>;
614}
615
616defm S_DCACHE_DISCARD : SM_Real_Discard_vi <0x28, "S_DCACHE_DISCARD">;
617defm S_DCACHE_DISCARD_X2 : SM_Real_Discard_vi <0x29, "S_DCACHE_DISCARD_X2">;
618
Dmitry Preobrazhensky6bad04e2018-04-02 16:10:25 +0000619//===----------------------------------------------------------------------===//
Valery Pykhtin1b138862016-09-01 09:56:47 +0000620// CI
621//===----------------------------------------------------------------------===//
622
623def smrd_literal_offset : NamedOperandU32<"SMRDLiteralOffset",
624 NamedMatchClass<"SMRDLiteralOffset">> {
625 let OperandType = "OPERAND_IMMEDIATE";
626}
627
628class SMRD_Real_Load_IMM_ci <bits<5> op, SM_Load_Pseudo ps> :
629 SM_Real<ps>,
630 Enc64 {
631
632 let AssemblerPredicates = [isCIOnly];
633 let DecoderNamespace = "CI";
Matt Arsenault7b647552016-10-28 21:55:15 +0000634 let InOperandList = (ins ps.BaseClass:$sbase, smrd_literal_offset:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000635
636 let LGKM_CNT = ps.LGKM_CNT;
637 let SMRD = ps.SMRD;
638 let mayLoad = ps.mayLoad;
639 let mayStore = ps.mayStore;
640 let hasSideEffects = ps.hasSideEffects;
641 let SchedRW = ps.SchedRW;
642 let UseNamedOperandTable = ps.UseNamedOperandTable;
643
644 let Inst{7-0} = 0xff;
645 let Inst{8} = 0;
646 let Inst{14-9} = sbase{6-1};
647 let Inst{21-15} = sdst{6-0};
648 let Inst{26-22} = op;
649 let Inst{31-27} = 0x18; //encoding
650 let Inst{63-32} = offset{31-0};
651}
652
653def S_LOAD_DWORD_IMM_ci : SMRD_Real_Load_IMM_ci <0x00, S_LOAD_DWORD_IMM>;
654def S_LOAD_DWORDX2_IMM_ci : SMRD_Real_Load_IMM_ci <0x01, S_LOAD_DWORDX2_IMM>;
655def S_LOAD_DWORDX4_IMM_ci : SMRD_Real_Load_IMM_ci <0x02, S_LOAD_DWORDX4_IMM>;
656def S_LOAD_DWORDX8_IMM_ci : SMRD_Real_Load_IMM_ci <0x03, S_LOAD_DWORDX8_IMM>;
657def S_LOAD_DWORDX16_IMM_ci : SMRD_Real_Load_IMM_ci <0x04, S_LOAD_DWORDX16_IMM>;
658def S_BUFFER_LOAD_DWORD_IMM_ci : SMRD_Real_Load_IMM_ci <0x08, S_BUFFER_LOAD_DWORD_IMM>;
659def S_BUFFER_LOAD_DWORDX2_IMM_ci : SMRD_Real_Load_IMM_ci <0x09, S_BUFFER_LOAD_DWORDX2_IMM>;
660def S_BUFFER_LOAD_DWORDX4_IMM_ci : SMRD_Real_Load_IMM_ci <0x0a, S_BUFFER_LOAD_DWORDX4_IMM>;
661def S_BUFFER_LOAD_DWORDX8_IMM_ci : SMRD_Real_Load_IMM_ci <0x0b, S_BUFFER_LOAD_DWORDX8_IMM>;
662def S_BUFFER_LOAD_DWORDX16_IMM_ci : SMRD_Real_Load_IMM_ci <0x0c, S_BUFFER_LOAD_DWORDX16_IMM>;
663
664class SMRD_Real_ci <bits<5> op, SM_Pseudo ps>
665 : SM_Real<ps>
666 , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
667 , Enc32 {
668
669 let AssemblerPredicates = [isCIOnly];
670 let DecoderNamespace = "CI";
671
672 let Inst{7-0} = !if(ps.has_offset, offset{7-0}, ?);
673 let Inst{8} = imm;
674 let Inst{14-9} = !if(ps.has_sbase, sbase{6-1}, ?);
675 let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
676 let Inst{26-22} = op;
677 let Inst{31-27} = 0x18; //encoding
678}
679
680def S_DCACHE_INV_VOL_ci : SMRD_Real_ci <0x1d, S_DCACHE_INV_VOL>;
Marek Olsak8973a0a2017-05-24 14:53:50 +0000681
Tom Stellard251ee082018-10-06 03:32:43 +0000682//===----------------------------------------------------------------------===//
683// Scalar Memory Patterns
684//===----------------------------------------------------------------------===//
Marek Olsak8973a0a2017-05-24 14:53:50 +0000685
Tom Stellard251ee082018-10-06 03:32:43 +0000686def smrd_load : PatFrag <(ops node:$ptr), (load node:$ptr), [{ return isUniformLoad(N);}]>;
687
688def SMRDImm : ComplexPattern<i64, 2, "SelectSMRDImm">;
689def SMRDImm32 : ComplexPattern<i64, 2, "SelectSMRDImm32">;
690def SMRDSgpr : ComplexPattern<i64, 2, "SelectSMRDSgpr">;
691def SMRDBufferImm : ComplexPattern<i32, 1, "SelectSMRDBufferImm">;
692def SMRDBufferImm32 : ComplexPattern<i32, 1, "SelectSMRDBufferImm32">;
693
694multiclass SMRD_Pattern <string Instr, ValueType vt> {
695
696 // 1. IMM offset
697 def : GCNPat <
698 (smrd_load (SMRDImm i64:$sbase, i32:$offset)),
699 (vt (!cast<SM_Pseudo>(Instr#"_IMM") $sbase, $offset, 0))
700 >;
701
702 // 2. 32-bit IMM offset on CI
703 def : GCNPat <
704 (smrd_load (SMRDImm32 i64:$sbase, i32:$offset)),
705 (vt (!cast<InstSI>(Instr#"_IMM_ci") $sbase, $offset, 0))> {
706 let OtherPredicates = [isCIOnly];
707 }
708
709 // 3. SGPR offset
710 def : GCNPat <
711 (smrd_load (SMRDSgpr i64:$sbase, i32:$offset)),
712 (vt (!cast<SM_Pseudo>(Instr#"_SGPR") $sbase, $offset, 0))
713 >;
Marek Olsak8973a0a2017-05-24 14:53:50 +0000714}
715
Tom Stellard251ee082018-10-06 03:32:43 +0000716multiclass SMLoad_Pattern <string Instr, ValueType vt> {
717 // 1. Offset as an immediate
718 def : GCNPat <
719 (SIsbuffer_load v4i32:$sbase, (SMRDBufferImm i32:$offset), i1:$glc),
720 (vt (!cast<SM_Pseudo>(Instr#"_IMM") $sbase, $offset, (as_i1imm $glc)))
721 >;
Marek Olsak8973a0a2017-05-24 14:53:50 +0000722
Tom Stellard251ee082018-10-06 03:32:43 +0000723 // 2. 32-bit IMM offset on CI
724 def : GCNPat <
725 (vt (SIsbuffer_load v4i32:$sbase, (SMRDBufferImm32 i32:$offset), i1:$glc)),
726 (!cast<InstSI>(Instr#"_IMM_ci") $sbase, $offset, (as_i1imm $glc))> {
727 let OtherPredicates = [isCIOnly];
728 }
729
730 // 3. Offset loaded in an 32bit SGPR
731 def : GCNPat <
732 (SIsbuffer_load v4i32:$sbase, i32:$offset, i1:$glc),
733 (vt (!cast<SM_Pseudo>(Instr#"_SGPR") $sbase, $offset, (as_i1imm $glc)))
734 >;
Marek Olsak8973a0a2017-05-24 14:53:50 +0000735}
736
Tom Stellard251ee082018-10-06 03:32:43 +0000737// Global and constant loads can be selected to either MUBUF or SMRD
738// instructions, but SMRD instructions are faster so we want the instruction
739// selector to prefer those.
740let AddedComplexity = 100 in {
Tim Renouf904343f2018-08-25 14:53:17 +0000741
Tom Stellard251ee082018-10-06 03:32:43 +0000742defm : SMRD_Pattern <"S_LOAD_DWORD", i32>;
743defm : SMRD_Pattern <"S_LOAD_DWORDX2", v2i32>;
744defm : SMRD_Pattern <"S_LOAD_DWORDX4", v4i32>;
745defm : SMRD_Pattern <"S_LOAD_DWORDX8", v8i32>;
746defm : SMRD_Pattern <"S_LOAD_DWORDX16", v16i32>;
Marek Olsak8973a0a2017-05-24 14:53:50 +0000747
Tom Stellard251ee082018-10-06 03:32:43 +0000748defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORD", i32>;
749defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX2", v2i32>;
750defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX4", v4i32>;
751defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX8", v8i32>;
752defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX16", v16i32>;
Matt Arsenaultce2e0532018-12-07 18:41:39 +0000753
754defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORD", f32>;
755defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX2", v2f32>;
756defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX4", v4f32>;
757defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX8", v8f32>;
758defm : SMLoad_Pattern <"S_BUFFER_LOAD_DWORDX16", v16f32>;
Tom Stellard251ee082018-10-06 03:32:43 +0000759} // End let AddedComplexity = 100
760
761let OtherPredicates = [isSICI] in {
762def : GCNPat <
763 (i64 (readcyclecounter)),
764 (S_MEMTIME)
765>;
766}
767
768let OtherPredicates = [isVI] in {
769
770def : GCNPat <
771 (i64 (readcyclecounter)),
772 (S_MEMREALTIME)
773>;
774
775} // let OtherPredicates = [isVI]