blob: c543814cae0db9efbf4c939fbe4e7ea25658c20a [file] [log] [blame]
Marek Olsak5df00d62014-12-07 12:18:57 +00001//===-- CIInstructions.td - CI Instruction Defintions ---------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9// Instruction definitions for CI and newer.
10//===----------------------------------------------------------------------===//
Matt Arsenault6adf07a2015-08-22 00:16:34 +000011// Remaining instructions:
Matt Arsenault6adf07a2015-08-22 00:16:34 +000012// S_CBRANCH_CDBGUSER
13// S_CBRANCH_CDBGSYS
14// S_CBRANCH_CDBGSYS_OR_USER
15// S_CBRANCH_CDBGSYS_AND_USER
Matt Arsenault6adf07a2015-08-22 00:16:34 +000016// DS_NOP
17// DS_GWS_SEMA_RELEASE_ALL
18// DS_WRAP_RTN_B32
19// DS_CNDXCHG32_RTN_B64
20// DS_WRITE_B96
21// DS_WRITE_B128
22// DS_CONDXCHG32_RTN_B128
23// DS_READ_B96
24// DS_READ_B128
25// BUFFER_LOAD_DWORDX3
26// BUFFER_STORE_DWORDX3
Marek Olsak5df00d62014-12-07 12:18:57 +000027
28
29def isCIVI : Predicate <
Eric Christopher7792e322015-01-30 23:24:40 +000030 "Subtarget->getGeneration() == AMDGPUSubtarget::SEA_ISLANDS || "
31 "Subtarget->getGeneration() == AMDGPUSubtarget::VOLCANIC_ISLANDS"
Tom Stellardd1f0f022015-04-23 19:33:54 +000032>, AssemblerPredicate<"FeatureCIInsts">;
Marek Olsak5df00d62014-12-07 12:18:57 +000033
Tom Stellard731c9272015-06-11 14:51:49 +000034def HasFlatAddressSpace : Predicate<"Subtarget->hasFlatAddressSpace()">;
35
Marek Olsak5df00d62014-12-07 12:18:57 +000036//===----------------------------------------------------------------------===//
37// VOP1 Instructions
38//===----------------------------------------------------------------------===//
39
40let SubtargetPredicate = isCIVI in {
41
Matt Arsenaulte8df8792015-08-22 00:50:41 +000042let SchedRW = [WriteDoubleAdd] in {
Marek Olsak5df00d62014-12-07 12:18:57 +000043defm V_TRUNC_F64 : VOP1Inst <vop1<0x17>, "v_trunc_f64",
44 VOP_F64_F64, ftrunc
45>;
46defm V_CEIL_F64 : VOP1Inst <vop1<0x18>, "v_ceil_f64",
47 VOP_F64_F64, fceil
48>;
49defm V_FLOOR_F64 : VOP1Inst <vop1<0x1A>, "v_floor_f64",
50 VOP_F64_F64, ffloor
51>;
52defm V_RNDNE_F64 : VOP1Inst <vop1<0x19>, "v_rndne_f64",
53 VOP_F64_F64, frint
54>;
Matt Arsenaulte8df8792015-08-22 00:50:41 +000055} // End SchedRW = [WriteDoubleAdd]
56
57let SchedRW = [WriteQuarterRate32] in {
Marek Olsak5df00d62014-12-07 12:18:57 +000058defm V_LOG_LEGACY_F32 : VOP1Inst <vop1<0x45, 0x4c>, "v_log_legacy_f32",
59 VOP_F32_F32
60>;
61defm V_EXP_LEGACY_F32 : VOP1Inst <vop1<0x46, 0x4b>, "v_exp_legacy_f32",
62 VOP_F32_F32
63>;
Matt Arsenaulte8df8792015-08-22 00:50:41 +000064} // End SchedRW = [WriteQuarterRate32]
Tom Stellard731c9272015-06-11 14:51:49 +000065
66//===----------------------------------------------------------------------===//
Matt Arsenault6adf07a2015-08-22 00:16:34 +000067// VOP3 Instructions
68//===----------------------------------------------------------------------===//
69
70defm V_QSAD_PK_U16_U8 : VOP3Inst <vop3<0x173>, "v_qsad_pk_u16_u8",
71 VOP_I32_I32_I32
72>;
73defm V_MQSAD_U16_U8 : VOP3Inst <vop3<0x172>, "v_mqsad_u16_u8",
74 VOP_I32_I32_I32
75>;
76defm V_MQSAD_U32_U8 : VOP3Inst <vop3<0x175>, "v_mqsad_u32_u8",
77 VOP_I32_I32_I32
78>;
79
80let isCommutable = 1 in {
81defm V_MAD_U64_U32 : VOP3Inst <vop3<0x176>, "v_mad_u64_u32",
82 VOP_I64_I32_I32_I64
83>;
84
85// XXX - Does this set VCC?
86defm V_MAD_I64_I32 : VOP3Inst <vop3<0x177>, "v_mad_i64_i32",
87 VOP_I64_I32_I32_I64
88>;
89} // End isCommutable = 1
90
91
92//===----------------------------------------------------------------------===//
93// DS Instructions
94//===----------------------------------------------------------------------===//
95defm DS_WRAP_RTN_F32 : DS_1A1D_RET <0x34, "ds_wrap_rtn_f32", VGPR_32, "ds_wrap_f32">;
96
97// DS_CONDXCHG32_RTN_B64
98// DS_CONDXCHG32_RTN_B128
99
100//===----------------------------------------------------------------------===//
Matt Arsenaulte66621b2015-09-24 19:52:27 +0000101// SMRD Instructions
102//===----------------------------------------------------------------------===//
103
104defm S_DCACHE_INV_VOL : SMRD_Inval <smrd<0x1d, 0x22>,
105 "s_dcache_inv_vol", int_amdgcn_s_dcache_inv_vol>;
106
107//===----------------------------------------------------------------------===//
Matt Arsenaultd6adfb42015-09-24 19:52:21 +0000108// MUBUF Instructions
109//===----------------------------------------------------------------------===//
110
111defm BUFFER_WBINVL1_VOL : MUBUF_Invalidate <mubuf<0x70, 0x3f>,
112 "buffer_wbinvl1_vol", int_amdgcn_buffer_wbinvl1_vol
113>;
114
115//===----------------------------------------------------------------------===//
Tom Stellard731c9272015-06-11 14:51:49 +0000116// Flat Instructions
117//===----------------------------------------------------------------------===//
118
Tom Stellard5ebdfbe2015-12-24 03:18:18 +0000119defm FLAT_LOAD_UBYTE : FLAT_Load_Helper <
120 flat<0x8, 0x10>, "flat_load_ubyte", VGPR_32
Tom Stellard731c9272015-06-11 14:51:49 +0000121>;
Tom Stellard5ebdfbe2015-12-24 03:18:18 +0000122defm FLAT_LOAD_SBYTE : FLAT_Load_Helper <
123 flat<0x9, 0x11>, "flat_load_sbyte", VGPR_32
Tom Stellard731c9272015-06-11 14:51:49 +0000124>;
Tom Stellard5ebdfbe2015-12-24 03:18:18 +0000125defm FLAT_LOAD_USHORT : FLAT_Load_Helper <
126 flat<0xa, 0x12>, "flat_load_ushort", VGPR_32
Tom Stellard731c9272015-06-11 14:51:49 +0000127>;
Tom Stellard5ebdfbe2015-12-24 03:18:18 +0000128defm FLAT_LOAD_SSHORT : FLAT_Load_Helper <
129 flat<0xb, 0x13>, "flat_load_sshort", VGPR_32>
130;
131defm FLAT_LOAD_DWORD : FLAT_Load_Helper <
132 flat<0xc, 0x14>, "flat_load_dword", VGPR_32
133>;
134defm FLAT_LOAD_DWORDX2 : FLAT_Load_Helper <
135 flat<0xd, 0x15>, "flat_load_dwordx2", VReg_64
136>;
137defm FLAT_LOAD_DWORDX4 : FLAT_Load_Helper <
138 flat<0xe, 0x17>, "flat_load_dwordx4", VReg_128
139>;
140defm FLAT_LOAD_DWORDX3 : FLAT_Load_Helper <
141 flat<0xf, 0x16>, "flat_load_dwordx3", VReg_96
142>;
143defm FLAT_STORE_BYTE : FLAT_Store_Helper <
144 flat<0x18>, "flat_store_byte", VGPR_32
145>;
146defm FLAT_STORE_SHORT : FLAT_Store_Helper <
147 flat <0x1a>, "flat_store_short", VGPR_32
148>;
149defm FLAT_STORE_DWORD : FLAT_Store_Helper <
150 flat<0x1c>, "flat_store_dword", VGPR_32
151>;
152defm FLAT_STORE_DWORDX2 : FLAT_Store_Helper <
153 flat<0x1d>, "flat_store_dwordx2", VReg_64
154>;
155defm FLAT_STORE_DWORDX4 : FLAT_Store_Helper <
156 flat<0x1e, 0x1f>, "flat_store_dwordx4", VReg_128
157>;
158defm FLAT_STORE_DWORDX3 : FLAT_Store_Helper <
159 flat<0x1f, 0x1e>, "flat_store_dwordx3", VReg_96
160>;
161defm FLAT_ATOMIC_SWAP : FLAT_ATOMIC <
162 flat<0x30, 0x40>, "flat_atomic_swap", VGPR_32
163>;
Tom Stellard12a19102015-06-12 20:47:06 +0000164defm FLAT_ATOMIC_CMPSWAP : FLAT_ATOMIC <
Tom Stellard5ebdfbe2015-12-24 03:18:18 +0000165 flat<0x31, 0x41>, "flat_atomic_cmpswap", VGPR_32, VReg_64
Tom Stellard12a19102015-06-12 20:47:06 +0000166>;
Tom Stellard5ebdfbe2015-12-24 03:18:18 +0000167defm FLAT_ATOMIC_ADD : FLAT_ATOMIC <
168 flat<0x32, 0x42>, "flat_atomic_add", VGPR_32
Tom Stellard12a19102015-06-12 20:47:06 +0000169>;
Tom Stellard5ebdfbe2015-12-24 03:18:18 +0000170defm FLAT_ATOMIC_SUB : FLAT_ATOMIC <
171 flat<0x33, 0x43>, "flat_atomic_sub", VGPR_32
172>;
173defm FLAT_ATOMIC_SMIN : FLAT_ATOMIC <
174 flat<0x35, 0x44>, "flat_atomic_smin", VGPR_32
175>;
176defm FLAT_ATOMIC_UMIN : FLAT_ATOMIC <
177 flat<0x36, 0x45>, "flat_atomic_umin", VGPR_32
178>;
179defm FLAT_ATOMIC_SMAX : FLAT_ATOMIC <
180 flat<0x37, 0x46>, "flat_atomic_smax", VGPR_32
181>;
182defm FLAT_ATOMIC_UMAX : FLAT_ATOMIC <
183 flat<0x38, 0x47>, "flat_atomic_umax", VGPR_32
184>;
185defm FLAT_ATOMIC_AND : FLAT_ATOMIC <
186 flat<0x39, 0x48>, "flat_atomic_and", VGPR_32
187>;
188defm FLAT_ATOMIC_OR : FLAT_ATOMIC <
189 flat<0x3a, 0x49>, "flat_atomic_or", VGPR_32
190>;
191defm FLAT_ATOMIC_XOR : FLAT_ATOMIC <
192 flat<0x3b, 0x4a>, "flat_atomic_xor", VGPR_32
193>;
194defm FLAT_ATOMIC_INC : FLAT_ATOMIC <
195 flat<0x3c, 0x4b>, "flat_atomic_inc", VGPR_32
196>;
197defm FLAT_ATOMIC_DEC : FLAT_ATOMIC <
198 flat<0x3d, 0x4c>, "flat_atomic_dec", VGPR_32
199>;
200defm FLAT_ATOMIC_SWAP_X2 : FLAT_ATOMIC <
201 flat<0x50, 0x60>, "flat_atomic_swap_x2", VReg_64
202>;
Tom Stellard12a19102015-06-12 20:47:06 +0000203defm FLAT_ATOMIC_CMPSWAP_X2 : FLAT_ATOMIC <
Tom Stellard5ebdfbe2015-12-24 03:18:18 +0000204 flat<0x51, 0x61>, "flat_atomic_cmpswap_x2", VReg_64, VReg_128
Tom Stellard12a19102015-06-12 20:47:06 +0000205>;
Tom Stellard5ebdfbe2015-12-24 03:18:18 +0000206defm FLAT_ATOMIC_ADD_X2 : FLAT_ATOMIC <
207 flat<0x52, 0x62>, "flat_atomic_add_x2", VReg_64
Tom Stellard12a19102015-06-12 20:47:06 +0000208>;
Tom Stellard5ebdfbe2015-12-24 03:18:18 +0000209defm FLAT_ATOMIC_SUB_X2 : FLAT_ATOMIC <
210 flat<0x53, 0x63>, "flat_atomic_sub_x2", VReg_64
211>;
212defm FLAT_ATOMIC_SMIN_X2 : FLAT_ATOMIC <
213 flat<0x55, 0x64>, "flat_atomic_smin_x2", VReg_64
214>;
215defm FLAT_ATOMIC_UMIN_X2 : FLAT_ATOMIC <
216 flat<0x56, 0x65>, "flat_atomic_umin_x2", VReg_64
217>;
218defm FLAT_ATOMIC_SMAX_X2 : FLAT_ATOMIC <
219 flat<0x57, 0x66>, "flat_atomic_smax_x2", VReg_64
220>;
221defm FLAT_ATOMIC_UMAX_X2 : FLAT_ATOMIC <
222 flat<0x58, 0x67>, "flat_atomic_umax_x2", VReg_64
223>;
224defm FLAT_ATOMIC_AND_X2 : FLAT_ATOMIC <
225 flat<0x59, 0x68>, "flat_atomic_and_x2", VReg_64
226>;
227defm FLAT_ATOMIC_OR_X2 : FLAT_ATOMIC <
228 flat<0x5a, 0x69>, "flat_atomic_or_x2", VReg_64
229>;
230defm FLAT_ATOMIC_XOR_X2 : FLAT_ATOMIC <
231 flat<0x5b, 0x6a>, "flat_atomic_xor_x2", VReg_64
232>;
233defm FLAT_ATOMIC_INC_X2 : FLAT_ATOMIC <
234 flat<0x5c, 0x6b>, "flat_atomic_inc_x2", VReg_64
235>;
236defm FLAT_ATOMIC_DEC_X2 : FLAT_ATOMIC <
237 flat<0x5d, 0x6c>, "flat_atomic_dec_x2", VReg_64
238>;
Tom Stellard731c9272015-06-11 14:51:49 +0000239
Tom Stellard12a19102015-06-12 20:47:06 +0000240} // End SubtargetPredicate = isCIVI
Tom Stellard731c9272015-06-11 14:51:49 +0000241
Tom Stellard5ebdfbe2015-12-24 03:18:18 +0000242// CI Only flat instructions
243
244let SubtargetPredicate = isCI, VIAssemblerPredicate = DisableInst in {
245
246defm FLAT_ATOMIC_FCMPSWAP : FLAT_ATOMIC <
247 flat<0x3e>, "flat_atomic_fcmpswap", VGPR_32, VReg_64
248>;
249defm FLAT_ATOMIC_FMIN : FLAT_ATOMIC <
250 flat<0x3f>, "flat_atomic_fmin", VGPR_32
251>;
252defm FLAT_ATOMIC_FMAX : FLAT_ATOMIC <
253 flat<0x40>, "flat_atomic_fmax", VGPR_32
254>;
255defm FLAT_ATOMIC_FCMPSWAP_X2 : FLAT_ATOMIC <
256 flat<0x5e>, "flat_atomic_fcmpswap_x2", VReg_64, VReg_128
257>;
258defm FLAT_ATOMIC_FMIN_X2 : FLAT_ATOMIC <
259 flat<0x5f>, "flat_atomic_fmin_x2", VReg_64
260>;
261defm FLAT_ATOMIC_FMAX_X2 : FLAT_ATOMIC <
262 flat<0x60>, "flat_atomic_fmax_x2", VReg_64
263>;
264
265} // End let SubtargetPredicate = isCI, VIAssemblerPredicate = DisableInst
266
Matt Arsenault6adf07a2015-08-22 00:16:34 +0000267let Predicates = [isCI] in {
268
269// Convert (x - floor(x)) to fract(x)
270def : Pat <
271 (f32 (fsub (f32 (VOP3Mods f32:$x, i32:$mods)),
272 (f32 (ffloor (f32 (VOP3Mods f32:$x, i32:$mods)))))),
273 (V_FRACT_F32_e64 $mods, $x, DSTCLAMP.NONE, DSTOMOD.NONE)
274>;
275
276// Convert (x + (-floor(x))) to fract(x)
277def : Pat <
278 (f64 (fadd (f64 (VOP3Mods f64:$x, i32:$mods)),
279 (f64 (fneg (f64 (ffloor (f64 (VOP3Mods f64:$x, i32:$mods)))))))),
280 (V_FRACT_F64_e64 $mods, $x, DSTCLAMP.NONE, DSTOMOD.NONE)
281>;
282
283} // End Predicates = [isCI]
Changpeng Fangb41574a2015-12-22 20:55:23 +0000284
285
286//===----------------------------------------------------------------------===//
Tom Stellard2c82ee62016-01-05 02:26:37 +0000287// Flat Patterns
Changpeng Fangb41574a2015-12-22 20:55:23 +0000288//===----------------------------------------------------------------------===//
289
Tom Stellard2c82ee62016-01-05 02:26:37 +0000290let Predicates = [isCIVI] in {
Changpeng Fangb41574a2015-12-22 20:55:23 +0000291
Changpeng Fangb41574a2015-12-22 20:55:23 +0000292// Patterns for global loads with no offset
293class FlatLoadPat <FLAT inst, SDPatternOperator node, ValueType vt> : Pat <
294 (vt (node i64:$addr)),
295 (inst $addr, 0, 0, 0)
296>;
297
Tom Stellard2c82ee62016-01-05 02:26:37 +0000298def : FlatLoadPat <FLAT_LOAD_UBYTE, flat_az_extloadi8, i32>;
299def : FlatLoadPat <FLAT_LOAD_SBYTE, flat_sextloadi8, i32>;
300def : FlatLoadPat <FLAT_LOAD_USHORT, flat_az_extloadi16, i32>;
301def : FlatLoadPat <FLAT_LOAD_SSHORT, flat_sextloadi16, i32>;
302def : FlatLoadPat <FLAT_LOAD_DWORD, flat_load, i32>;
303def : FlatLoadPat <FLAT_LOAD_DWORDX2, flat_load, v2i32>;
304def : FlatLoadPat <FLAT_LOAD_DWORDX4, flat_load, v4i32>;
Changpeng Fangb41574a2015-12-22 20:55:23 +0000305
306class FlatStorePat <FLAT inst, SDPatternOperator node, ValueType vt> : Pat <
307 (node vt:$data, i64:$addr),
308 (inst $data, $addr, 0, 0, 0)
309>;
310
Tom Stellard2c82ee62016-01-05 02:26:37 +0000311def : FlatStorePat <FLAT_STORE_BYTE, flat_truncstorei8, i32>;
312def : FlatStorePat <FLAT_STORE_SHORT, flat_truncstorei16, i32>;
313def : FlatStorePat <FLAT_STORE_DWORD, flat_store, i32>;
314def : FlatStorePat <FLAT_STORE_DWORDX2, flat_store, v2i32>;
315def : FlatStorePat <FLAT_STORE_DWORDX4, flat_store, v4i32>;
Changpeng Fangb41574a2015-12-22 20:55:23 +0000316
317class FlatAtomicPat <FLAT inst, SDPatternOperator node, ValueType vt> : Pat <
318 (vt (node i64:$addr, vt:$data)),
319 (inst $addr, $data, 0, 0)
320>;
321
322def : FlatAtomicPat <FLAT_ATOMIC_ADD_RTN, atomic_add_global, i32>;
323def : FlatAtomicPat <FLAT_ATOMIC_AND_RTN, atomic_and_global, i32>;
324def : FlatAtomicPat <FLAT_ATOMIC_SUB_RTN, atomic_sub_global, i32>;
325def : FlatAtomicPat <FLAT_ATOMIC_SMAX_RTN, atomic_max_global, i32>;
326def : FlatAtomicPat <FLAT_ATOMIC_UMAX_RTN, atomic_umax_global, i32>;
327def : FlatAtomicPat <FLAT_ATOMIC_SMIN_RTN, atomic_min_global, i32>;
328def : FlatAtomicPat <FLAT_ATOMIC_UMIN_RTN, atomic_umin_global, i32>;
329def : FlatAtomicPat <FLAT_ATOMIC_OR_RTN, atomic_or_global, i32>;
330def : FlatAtomicPat <FLAT_ATOMIC_SWAP_RTN, atomic_swap_global, i32>;
331def : FlatAtomicPat <FLAT_ATOMIC_XOR_RTN, atomic_xor_global, i32>;
332
Tom Stellard2c82ee62016-01-05 02:26:37 +0000333} // End Predicates = [isCIVI]