blob: 9ec6fd124993ef2c3600297cfc81e1ffc4bc7361 [file] [log] [blame]
Marek Olsak5df00d62014-12-07 12:18:57 +00001//===-- CIInstructions.td - CI Instruction Defintions ---------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9// Instruction definitions for CI and newer.
10//===----------------------------------------------------------------------===//
Matt Arsenault6adf07a2015-08-22 00:16:34 +000011// Remaining instructions:
12// FLAT_*
13// S_CBRANCH_CDBGUSER
14// S_CBRANCH_CDBGSYS
15// S_CBRANCH_CDBGSYS_OR_USER
16// S_CBRANCH_CDBGSYS_AND_USER
17// S_DCACHE_INV_VOL
18// DS_NOP
19// DS_GWS_SEMA_RELEASE_ALL
20// DS_WRAP_RTN_B32
21// DS_CNDXCHG32_RTN_B64
22// DS_WRITE_B96
23// DS_WRITE_B128
24// DS_CONDXCHG32_RTN_B128
25// DS_READ_B96
26// DS_READ_B128
27// BUFFER_LOAD_DWORDX3
28// BUFFER_STORE_DWORDX3
Marek Olsak5df00d62014-12-07 12:18:57 +000029
30
31def isCIVI : Predicate <
Eric Christopher7792e322015-01-30 23:24:40 +000032 "Subtarget->getGeneration() == AMDGPUSubtarget::SEA_ISLANDS || "
33 "Subtarget->getGeneration() == AMDGPUSubtarget::VOLCANIC_ISLANDS"
Tom Stellardd1f0f022015-04-23 19:33:54 +000034>, AssemblerPredicate<"FeatureCIInsts">;
Marek Olsak5df00d62014-12-07 12:18:57 +000035
Tom Stellard731c9272015-06-11 14:51:49 +000036def HasFlatAddressSpace : Predicate<"Subtarget->hasFlatAddressSpace()">;
37
Marek Olsak5df00d62014-12-07 12:18:57 +000038//===----------------------------------------------------------------------===//
39// VOP1 Instructions
40//===----------------------------------------------------------------------===//
41
42let SubtargetPredicate = isCIVI in {
43
Matt Arsenaulte8df8792015-08-22 00:50:41 +000044let SchedRW = [WriteDoubleAdd] in {
Marek Olsak5df00d62014-12-07 12:18:57 +000045defm V_TRUNC_F64 : VOP1Inst <vop1<0x17>, "v_trunc_f64",
46 VOP_F64_F64, ftrunc
47>;
48defm V_CEIL_F64 : VOP1Inst <vop1<0x18>, "v_ceil_f64",
49 VOP_F64_F64, fceil
50>;
51defm V_FLOOR_F64 : VOP1Inst <vop1<0x1A>, "v_floor_f64",
52 VOP_F64_F64, ffloor
53>;
54defm V_RNDNE_F64 : VOP1Inst <vop1<0x19>, "v_rndne_f64",
55 VOP_F64_F64, frint
56>;
Matt Arsenaulte8df8792015-08-22 00:50:41 +000057} // End SchedRW = [WriteDoubleAdd]
58
59let SchedRW = [WriteQuarterRate32] in {
Marek Olsak5df00d62014-12-07 12:18:57 +000060defm V_LOG_LEGACY_F32 : VOP1Inst <vop1<0x45, 0x4c>, "v_log_legacy_f32",
61 VOP_F32_F32
62>;
63defm V_EXP_LEGACY_F32 : VOP1Inst <vop1<0x46, 0x4b>, "v_exp_legacy_f32",
64 VOP_F32_F32
65>;
Matt Arsenaulte8df8792015-08-22 00:50:41 +000066} // End SchedRW = [WriteQuarterRate32]
Tom Stellard731c9272015-06-11 14:51:49 +000067
68//===----------------------------------------------------------------------===//
Matt Arsenault6adf07a2015-08-22 00:16:34 +000069// VOP3 Instructions
70//===----------------------------------------------------------------------===//
71
72defm V_QSAD_PK_U16_U8 : VOP3Inst <vop3<0x173>, "v_qsad_pk_u16_u8",
73 VOP_I32_I32_I32
74>;
75defm V_MQSAD_U16_U8 : VOP3Inst <vop3<0x172>, "v_mqsad_u16_u8",
76 VOP_I32_I32_I32
77>;
78defm V_MQSAD_U32_U8 : VOP3Inst <vop3<0x175>, "v_mqsad_u32_u8",
79 VOP_I32_I32_I32
80>;
81
82let isCommutable = 1 in {
83defm V_MAD_U64_U32 : VOP3Inst <vop3<0x176>, "v_mad_u64_u32",
84 VOP_I64_I32_I32_I64
85>;
86
87// XXX - Does this set VCC?
88defm V_MAD_I64_I32 : VOP3Inst <vop3<0x177>, "v_mad_i64_i32",
89 VOP_I64_I32_I32_I64
90>;
91} // End isCommutable = 1
92
93
94//===----------------------------------------------------------------------===//
95// DS Instructions
96//===----------------------------------------------------------------------===//
97defm DS_WRAP_RTN_F32 : DS_1A1D_RET <0x34, "ds_wrap_rtn_f32", VGPR_32, "ds_wrap_f32">;
98
99// DS_CONDXCHG32_RTN_B64
100// DS_CONDXCHG32_RTN_B128
101
102//===----------------------------------------------------------------------===//
Tom Stellard731c9272015-06-11 14:51:49 +0000103// Flat Instructions
104//===----------------------------------------------------------------------===//
105
Tom Stellard12a19102015-06-12 20:47:06 +0000106def FLAT_LOAD_UBYTE : FLAT_Load_Helper <0x8, "flat_load_ubyte", VGPR_32>;
107def FLAT_LOAD_SBYTE : FLAT_Load_Helper <0x9, "flat_load_sbyte", VGPR_32>;
108def FLAT_LOAD_USHORT : FLAT_Load_Helper <0xa, "flat_load_ushort", VGPR_32>;
109def FLAT_LOAD_SSHORT : FLAT_Load_Helper <0xb, "flat_load_sshort", VGPR_32>;
110def FLAT_LOAD_DWORD : FLAT_Load_Helper <0xc, "flat_load_dword", VGPR_32>;
111def FLAT_LOAD_DWORDX2 : FLAT_Load_Helper <0xd, "flat_load_dwordx2", VReg_64>;
112def FLAT_LOAD_DWORDX4 : FLAT_Load_Helper <0xe, "flat_load_dwordx4", VReg_128>;
113def FLAT_LOAD_DWORDX3 : FLAT_Load_Helper <0xf, "flat_load_dwordx3", VReg_96>;
114def FLAT_STORE_BYTE : FLAT_Store_Helper <0x18, "flat_store_byte", VGPR_32>;
115def FLAT_STORE_SHORT : FLAT_Store_Helper <0x1a, "flat_store_short", VGPR_32>;
116def FLAT_STORE_DWORD : FLAT_Store_Helper <0x1c, "flat_store_dword", VGPR_32>;
Tom Stellard731c9272015-06-11 14:51:49 +0000117def FLAT_STORE_DWORDX2 : FLAT_Store_Helper <
Tom Stellard12a19102015-06-12 20:47:06 +0000118 0x1d, "flat_store_dwordx2", VReg_64
Tom Stellard731c9272015-06-11 14:51:49 +0000119>;
Tom Stellard731c9272015-06-11 14:51:49 +0000120def FLAT_STORE_DWORDX4 : FLAT_Store_Helper <
Tom Stellard12a19102015-06-12 20:47:06 +0000121 0x1e, "flat_store_dwordx4", VReg_128
Tom Stellard731c9272015-06-11 14:51:49 +0000122>;
Tom Stellard731c9272015-06-11 14:51:49 +0000123def FLAT_STORE_DWORDX3 : FLAT_Store_Helper <
Tom Stellard12a19102015-06-12 20:47:06 +0000124 0x1f, "flat_store_dwordx3", VReg_96
Tom Stellard731c9272015-06-11 14:51:49 +0000125>;
Tom Stellard12a19102015-06-12 20:47:06 +0000126defm FLAT_ATOMIC_SWAP : FLAT_ATOMIC <0x30, "flat_atomic_swap", VGPR_32>;
127defm FLAT_ATOMIC_CMPSWAP : FLAT_ATOMIC <
128 0x31, "flat_atomic_cmpswap", VGPR_32, VReg_64
129>;
130defm FLAT_ATOMIC_ADD : FLAT_ATOMIC <0x32, "flat_atomic_add", VGPR_32>;
131defm FLAT_ATOMIC_SUB : FLAT_ATOMIC <0x33, "flat_atomic_sub", VGPR_32>;
132defm FLAT_ATOMIC_RSUB : FLAT_ATOMIC <0x34, "flat_atomic_rsub", VGPR_32>;
133defm FLAT_ATOMIC_SMIN : FLAT_ATOMIC <0x35, "flat_atomic_smin", VGPR_32>;
134defm FLAT_ATOMIC_UMIN : FLAT_ATOMIC <0x36, "flat_atomic_umin", VGPR_32>;
135defm FLAT_ATOMIC_SMAX : FLAT_ATOMIC <0x37, "flat_atomic_smax", VGPR_32>;
136defm FLAT_ATOMIC_UMAX : FLAT_ATOMIC <0x38, "flat_atomic_umax", VGPR_32>;
137defm FLAT_ATOMIC_AND : FLAT_ATOMIC <0x39, "flat_atomic_and", VGPR_32>;
138defm FLAT_ATOMIC_OR : FLAT_ATOMIC <0x3a, "flat_atomic_or", VGPR_32>;
139defm FLAT_ATOMIC_XOR : FLAT_ATOMIC <0x3b, "flat_atomic_xor", VGPR_32>;
140defm FLAT_ATOMIC_INC : FLAT_ATOMIC <0x3c, "flat_atomic_inc", VGPR_32>;
141defm FLAT_ATOMIC_DEC : FLAT_ATOMIC <0x3d, "flat_atomic_dec", VGPR_32>;
142defm FLAT_ATOMIC_FCMPSWAP : FLAT_ATOMIC <
143 0x3e, "flat_atomic_fcmpswap", VGPR_32, VReg_64
144>;
145defm FLAT_ATOMIC_FMIN : FLAT_ATOMIC <0x3f, "flat_atomic_fmin", VGPR_32>;
146defm FLAT_ATOMIC_FMAX : FLAT_ATOMIC <0x40, "flat_atomic_fmax", VGPR_32>;
147defm FLAT_ATOMIC_SWAP_X2 : FLAT_ATOMIC <0x50, "flat_atomic_swap_x2", VReg_64>;
148defm FLAT_ATOMIC_CMPSWAP_X2 : FLAT_ATOMIC <
149 0x51, "flat_atomic_cmpswap_x2", VReg_64, VReg_128
150>;
151defm FLAT_ATOMIC_ADD_X2 : FLAT_ATOMIC <0x52, "flat_atomic_add_x2", VReg_64>;
152defm FLAT_ATOMIC_SUB_X2 : FLAT_ATOMIC <0x53, "flat_atomic_sub_x2", VReg_64>;
153defm FLAT_ATOMIC_RSUB_X2 : FLAT_ATOMIC <0x54, "flat_atomic_rsub_x2", VReg_64>;
154defm FLAT_ATOMIC_SMIN_X2 : FLAT_ATOMIC <0x55, "flat_atomic_smin_x2", VReg_64>;
155defm FLAT_ATOMIC_UMIN_X2 : FLAT_ATOMIC <0x56, "flat_atomic_umin_x2", VReg_64>;
156defm FLAT_ATOMIC_SMAX_X2 : FLAT_ATOMIC <0x57, "flat_atomic_smax_x2", VReg_64>;
157defm FLAT_ATOMIC_UMAX_X2 : FLAT_ATOMIC <0x58, "flat_atomic_umax_x2", VReg_64>;
158defm FLAT_ATOMIC_AND_X2 : FLAT_ATOMIC <0x59, "flat_atomic_and_x2", VReg_64>;
159defm FLAT_ATOMIC_OR_X2 : FLAT_ATOMIC <0x5a, "flat_atomic_or_x2", VReg_64>;
160defm FLAT_ATOMIC_XOR_X2 : FLAT_ATOMIC <0x5b, "flat_atomic_xor_x2", VReg_64>;
161defm FLAT_ATOMIC_INC_X2 : FLAT_ATOMIC <0x5c, "flat_atomic_inc_x2", VReg_64>;
162defm FLAT_ATOMIC_DEC_X2 : FLAT_ATOMIC <0x5d, "flat_atomic_dec_x2", VReg_64>;
163defm FLAT_ATOMIC_FCMPSWAP_X2 : FLAT_ATOMIC <
164 0x5e, "flat_atomic_fcmpswap_x2", VReg_64, VReg_128
165>;
166defm FLAT_ATOMIC_FMIN_X2 : FLAT_ATOMIC <0x5f, "flat_atomic_fmin_x2", VReg_64>;
167defm FLAT_ATOMIC_FMAX_X2 : FLAT_ATOMIC <0x60, "flat_atomic_fmax_x2", VReg_64>;
Tom Stellard731c9272015-06-11 14:51:49 +0000168
Tom Stellard12a19102015-06-12 20:47:06 +0000169} // End SubtargetPredicate = isCIVI
Tom Stellard731c9272015-06-11 14:51:49 +0000170
171//===----------------------------------------------------------------------===//
172// Flat Patterns
173//===----------------------------------------------------------------------===//
174
Tom Stellard12a19102015-06-12 20:47:06 +0000175let Predicates = [HasFlatAddressSpace] in {
176
Tom Stellard731c9272015-06-11 14:51:49 +0000177class FLATLoad_Pattern <FLAT Instr_ADDR64, ValueType vt,
178 PatFrag flat_ld> :
179 Pat <(vt (flat_ld i64:$ptr)),
Tom Stellard12a19102015-06-12 20:47:06 +0000180 (Instr_ADDR64 $ptr, 0, 0, 0)
Tom Stellard731c9272015-06-11 14:51:49 +0000181>;
182
183def : FLATLoad_Pattern <FLAT_LOAD_SBYTE, i32, sextloadi8_flat>;
184def : FLATLoad_Pattern <FLAT_LOAD_UBYTE, i32, az_extloadi8_flat>;
185def : FLATLoad_Pattern <FLAT_LOAD_SSHORT, i32, sextloadi16_flat>;
186def : FLATLoad_Pattern <FLAT_LOAD_USHORT, i32, az_extloadi16_flat>;
187def : FLATLoad_Pattern <FLAT_LOAD_DWORD, i32, flat_load>;
188def : FLATLoad_Pattern <FLAT_LOAD_DWORDX2, i64, flat_load>;
189def : FLATLoad_Pattern <FLAT_LOAD_DWORDX2, i64, az_extloadi32_flat>;
190def : FLATLoad_Pattern <FLAT_LOAD_DWORDX2, v2i32, flat_load>;
191def : FLATLoad_Pattern <FLAT_LOAD_DWORDX4, v4i32, flat_load>;
192
193class FLATStore_Pattern <FLAT Instr, ValueType vt, PatFrag st> :
194 Pat <(st vt:$value, i64:$ptr),
Tom Stellard12a19102015-06-12 20:47:06 +0000195 (Instr $value, $ptr, 0, 0, 0)
Tom Stellard731c9272015-06-11 14:51:49 +0000196 >;
197
198def : FLATStore_Pattern <FLAT_STORE_BYTE, i32, truncstorei8_flat>;
199def : FLATStore_Pattern <FLAT_STORE_SHORT, i32, truncstorei16_flat>;
200def : FLATStore_Pattern <FLAT_STORE_DWORD, i32, flat_store>;
201def : FLATStore_Pattern <FLAT_STORE_DWORDX2, i64, flat_store>;
202def : FLATStore_Pattern <FLAT_STORE_DWORDX2, v2i32, flat_store>;
203def : FLATStore_Pattern <FLAT_STORE_DWORDX4, v4i32, flat_store>;
204
205} // End HasFlatAddressSpace predicate
206
Matt Arsenault6adf07a2015-08-22 00:16:34 +0000207let Predicates = [isCI] in {
208
209// Convert (x - floor(x)) to fract(x)
210def : Pat <
211 (f32 (fsub (f32 (VOP3Mods f32:$x, i32:$mods)),
212 (f32 (ffloor (f32 (VOP3Mods f32:$x, i32:$mods)))))),
213 (V_FRACT_F32_e64 $mods, $x, DSTCLAMP.NONE, DSTOMOD.NONE)
214>;
215
216// Convert (x + (-floor(x))) to fract(x)
217def : Pat <
218 (f64 (fadd (f64 (VOP3Mods f64:$x, i32:$mods)),
219 (f64 (fneg (f64 (ffloor (f64 (VOP3Mods f64:$x, i32:$mods)))))))),
220 (V_FRACT_F64_e64 $mods, $x, DSTCLAMP.NONE, DSTOMOD.NONE)
221>;
222
223} // End Predicates = [isCI]