blob: 4caa8a997066cfa3534dedd91037c70930ef0595 [file] [log] [blame]
Valery Pykhtina34fb492016-08-30 15:20:31 +00001//===-- SOPInstructions.td - SOP Instruction Defintions -------------------===//
2//
Chandler Carruth2946cd72019-01-19 08:50:56 +00003// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Valery Pykhtina34fb492016-08-30 15:20:31 +00006//
7//===----------------------------------------------------------------------===//
8
Matt Arsenaultcc88ce32016-10-12 18:00:51 +00009def GPRIdxModeMatchClass : AsmOperandClass {
10 let Name = "GPRIdxMode";
11 let PredicateMethod = "isGPRIdxMode";
Dmitry Preobrazhenskyef920352019-02-27 13:12:12 +000012 let ParserMethod = "parseGPRIdxMode";
Matt Arsenaultcc88ce32016-10-12 18:00:51 +000013 let RenderMethod = "addImmOperands";
14}
15
16def GPRIdxMode : Operand<i32> {
17 let PrintMethod = "printVGPRIndexMode";
18 let ParserMatchClass = GPRIdxModeMatchClass;
19 let OperandType = "OPERAND_IMMEDIATE";
20}
21
Nicolai Haehnle4f850ea2018-03-26 13:56:53 +000022class SOP_Pseudo<string opName, dag outs, dag ins, string asmOps,
23 list<dag> pattern=[]> :
24 InstSI<outs, ins, "", pattern>,
25 SIMCInstr<opName, SIEncodingFamily.NONE> {
26
27 let isPseudo = 1;
28 let isCodeGenOnly = 1;
Nicolai Haehnle4f850ea2018-03-26 13:56:53 +000029
30 string Mnemonic = opName;
31 string AsmOperands = asmOps;
32
33 bits<1> has_sdst = 0;
34}
35
Valery Pykhtina34fb492016-08-30 15:20:31 +000036//===----------------------------------------------------------------------===//
37// SOP1 Instructions
38//===----------------------------------------------------------------------===//
39
40class SOP1_Pseudo <string opName, dag outs, dag ins,
41 string asmOps, list<dag> pattern=[]> :
Nicolai Haehnle4f850ea2018-03-26 13:56:53 +000042 SOP_Pseudo<opName, outs, ins, asmOps, pattern> {
Valery Pykhtina34fb492016-08-30 15:20:31 +000043
44 let mayLoad = 0;
45 let mayStore = 0;
46 let hasSideEffects = 0;
47 let SALU = 1;
48 let SOP1 = 1;
49 let SchedRW = [WriteSALU];
Matt Arsenault6bc43d82016-10-06 16:20:41 +000050 let Size = 4;
Tom Stellard2add8a12016-09-06 20:00:26 +000051 let UseNamedOperandTable = 1;
Valery Pykhtina34fb492016-08-30 15:20:31 +000052
Valery Pykhtina34fb492016-08-30 15:20:31 +000053 bits<1> has_src0 = 1;
54 bits<1> has_sdst = 1;
55}
56
57class SOP1_Real<bits<8> op, SOP1_Pseudo ps> :
58 InstSI <ps.OutOperandList, ps.InOperandList,
59 ps.Mnemonic # " " # ps.AsmOperands, []>,
60 Enc32 {
61
62 let isPseudo = 0;
63 let isCodeGenOnly = 0;
Matt Arsenault6bc43d82016-10-06 16:20:41 +000064 let Size = 4;
Valery Pykhtina34fb492016-08-30 15:20:31 +000065
66 // copy relevant pseudo op flags
67 let SubtargetPredicate = ps.SubtargetPredicate;
68 let AsmMatchConverter = ps.AsmMatchConverter;
69
70 // encoding
71 bits<7> sdst;
72 bits<8> src0;
73
74 let Inst{7-0} = !if(ps.has_src0, src0, ?);
75 let Inst{15-8} = op;
76 let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
77 let Inst{31-23} = 0x17d; //encoding;
78}
79
Matt Arsenaultfd6fd002019-02-25 19:24:46 +000080class SOP1_32 <string opName, list<dag> pattern=[], bit tied_in = 0> : SOP1_Pseudo <
81 opName, (outs SReg_32:$sdst),
82 !if(tied_in, (ins SSrc_b32:$src0, SReg_32:$sdst_in),
83 (ins SSrc_b32:$src0)),
84 "$sdst, $src0", pattern> {
85 let Constraints = !if(tied_in, "$sdst = $sdst_in", "");
86}
Valery Pykhtina34fb492016-08-30 15:20:31 +000087
Matt Arsenaultcc88ce32016-10-12 18:00:51 +000088// 32-bit input, no output.
89class SOP1_0_32 <string opName, list<dag> pattern = []> : SOP1_Pseudo <
90 opName, (outs), (ins SSrc_b32:$src0),
91 "$src0", pattern> {
92 let has_sdst = 0;
93}
94
Dmitry Preobrazhensky12194e92017-04-12 12:40:19 +000095class SOP1_0_32R <string opName, list<dag> pattern = []> : SOP1_Pseudo <
96 opName, (outs), (ins SReg_32:$src0),
97 "$src0", pattern> {
98 let has_sdst = 0;
99}
100
Valery Pykhtina34fb492016-08-30 15:20:31 +0000101class SOP1_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000102 opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000103 "$sdst, $src0", pattern
104>;
105
106// 64-bit input, 32-bit output.
107class SOP1_32_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000108 opName, (outs SReg_32:$sdst), (ins SSrc_b64:$src0),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000109 "$sdst, $src0", pattern
110>;
111
112// 32-bit input, 64-bit output.
Matt Arsenaultfd6fd002019-02-25 19:24:46 +0000113class SOP1_64_32 <string opName, list<dag> pattern=[], bit tied_in = 0> : SOP1_Pseudo <
114 opName, (outs SReg_64:$sdst),
115 !if(tied_in, (ins SSrc_b32:$src0, SReg_64:$sdst_in),
116 (ins SSrc_b32:$src0)),
117 "$sdst, $src0", pattern> {
118 let Constraints = !if(tied_in, "$sdst = $sdst_in", "");
119}
Valery Pykhtina34fb492016-08-30 15:20:31 +0000120
121// no input, 64-bit output.
122class SOP1_64_0 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
123 opName, (outs SReg_64:$sdst), (ins), "$sdst", pattern> {
124 let has_src0 = 0;
125}
126
127// 64-bit input, no output
128class SOP1_1 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
129 opName, (outs), (ins SReg_64:$src0), "$src0", pattern> {
130 let has_sdst = 0;
131}
132
133
134let isMoveImm = 1 in {
135 let isReMaterializable = 1, isAsCheapAsAMove = 1 in {
136 def S_MOV_B32 : SOP1_32 <"s_mov_b32">;
137 def S_MOV_B64 : SOP1_64 <"s_mov_b64">;
138 } // End isRematerializeable = 1
139
140 let Uses = [SCC] in {
141 def S_CMOV_B32 : SOP1_32 <"s_cmov_b32">;
142 def S_CMOV_B64 : SOP1_64 <"s_cmov_b64">;
143 } // End Uses = [SCC]
144} // End isMoveImm = 1
145
146let Defs = [SCC] in {
147 def S_NOT_B32 : SOP1_32 <"s_not_b32",
148 [(set i32:$sdst, (not i32:$src0))]
149 >;
150
151 def S_NOT_B64 : SOP1_64 <"s_not_b64",
152 [(set i64:$sdst, (not i64:$src0))]
153 >;
154 def S_WQM_B32 : SOP1_32 <"s_wqm_b32">;
Marek Olsak2114fc32017-10-24 10:26:59 +0000155 def S_WQM_B64 : SOP1_64 <"s_wqm_b64",
156 [(set i1:$sdst, (int_amdgcn_wqm_vote i1:$src0))]
157 >;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000158} // End Defs = [SCC]
159
160
161def S_BREV_B32 : SOP1_32 <"s_brev_b32",
162 [(set i32:$sdst, (bitreverse i32:$src0))]
163>;
164def S_BREV_B64 : SOP1_64 <"s_brev_b64">;
165
166let Defs = [SCC] in {
167def S_BCNT0_I32_B32 : SOP1_32 <"s_bcnt0_i32_b32">;
168def S_BCNT0_I32_B64 : SOP1_32_64 <"s_bcnt0_i32_b64">;
169def S_BCNT1_I32_B32 : SOP1_32 <"s_bcnt1_i32_b32",
170 [(set i32:$sdst, (ctpop i32:$src0))]
171>;
172def S_BCNT1_I32_B64 : SOP1_32_64 <"s_bcnt1_i32_b64">;
173} // End Defs = [SCC]
174
175def S_FF0_I32_B32 : SOP1_32 <"s_ff0_i32_b32">;
176def S_FF0_I32_B64 : SOP1_32_64 <"s_ff0_i32_b64">;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000177def S_FF1_I32_B64 : SOP1_32_64 <"s_ff1_i32_b64">;
178
Wei Ding5676aca2017-10-12 19:37:14 +0000179def S_FF1_I32_B32 : SOP1_32 <"s_ff1_i32_b32",
180 [(set i32:$sdst, (AMDGPUffbl_b32 i32:$src0))]
181>;
182
Valery Pykhtina34fb492016-08-30 15:20:31 +0000183def S_FLBIT_I32_B32 : SOP1_32 <"s_flbit_i32_b32",
184 [(set i32:$sdst, (AMDGPUffbh_u32 i32:$src0))]
185>;
186
187def S_FLBIT_I32_B64 : SOP1_32_64 <"s_flbit_i32_b64">;
188def S_FLBIT_I32 : SOP1_32 <"s_flbit_i32",
189 [(set i32:$sdst, (AMDGPUffbh_i32 i32:$src0))]
190>;
191def S_FLBIT_I32_I64 : SOP1_32_64 <"s_flbit_i32_i64">;
192def S_SEXT_I32_I8 : SOP1_32 <"s_sext_i32_i8",
193 [(set i32:$sdst, (sext_inreg i32:$src0, i8))]
194>;
195def S_SEXT_I32_I16 : SOP1_32 <"s_sext_i32_i16",
196 [(set i32:$sdst, (sext_inreg i32:$src0, i16))]
197>;
198
Matt Arsenaultfd6fd002019-02-25 19:24:46 +0000199def S_BITSET0_B32 : SOP1_32 <"s_bitset0_b32", [], 1>;
200def S_BITSET0_B64 : SOP1_64_32 <"s_bitset0_b64", [], 1>;
201def S_BITSET1_B32 : SOP1_32 <"s_bitset1_b32", [], 1>;
202def S_BITSET1_B64 : SOP1_64_32 <"s_bitset1_b64", [], 1>;
Konstantin Zhuravlyovb2ff8df2017-05-26 20:38:26 +0000203def S_GETPC_B64 : SOP1_64_0 <"s_getpc_b64",
204 [(set i64:$sdst, (int_amdgcn_s_getpc))]
205>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000206
Matt Arsenault2b1f9aa2017-05-17 21:56:25 +0000207let isTerminator = 1, isBarrier = 1, SchedRW = [WriteBranch] in {
208
209let isBranch = 1, isIndirectBranch = 1 in {
Valery Pykhtina34fb492016-08-30 15:20:31 +0000210def S_SETPC_B64 : SOP1_1 <"s_setpc_b64">;
Matt Arsenault2b1f9aa2017-05-17 21:56:25 +0000211} // End isBranch = 1, isIndirectBranch = 1
212
213let isReturn = 1 in {
214// Define variant marked as return rather than branch.
215def S_SETPC_B64_return : SOP1_1<"", [(AMDGPUret_flag i64:$src0)]>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000216}
Matt Arsenault2b1f9aa2017-05-17 21:56:25 +0000217} // End isTerminator = 1, isBarrier = 1
218
219let isCall = 1 in {
220def S_SWAPPC_B64 : SOP1_64 <"s_swappc_b64"
221>;
222}
223
Valery Pykhtina34fb492016-08-30 15:20:31 +0000224def S_RFE_B64 : SOP1_1 <"s_rfe_b64">;
225
226let hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC] in {
227
228def S_AND_SAVEEXEC_B64 : SOP1_64 <"s_and_saveexec_b64">;
229def S_OR_SAVEEXEC_B64 : SOP1_64 <"s_or_saveexec_b64">;
230def S_XOR_SAVEEXEC_B64 : SOP1_64 <"s_xor_saveexec_b64">;
231def S_ANDN2_SAVEEXEC_B64 : SOP1_64 <"s_andn2_saveexec_b64">;
232def S_ORN2_SAVEEXEC_B64 : SOP1_64 <"s_orn2_saveexec_b64">;
233def S_NAND_SAVEEXEC_B64 : SOP1_64 <"s_nand_saveexec_b64">;
234def S_NOR_SAVEEXEC_B64 : SOP1_64 <"s_nor_saveexec_b64">;
235def S_XNOR_SAVEEXEC_B64 : SOP1_64 <"s_xnor_saveexec_b64">;
236
237} // End hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC]
238
239def S_QUADMASK_B32 : SOP1_32 <"s_quadmask_b32">;
240def S_QUADMASK_B64 : SOP1_64 <"s_quadmask_b64">;
241
242let Uses = [M0] in {
243def S_MOVRELS_B32 : SOP1_32 <"s_movrels_b32">;
244def S_MOVRELS_B64 : SOP1_64 <"s_movrels_b64">;
245def S_MOVRELD_B32 : SOP1_32 <"s_movreld_b32">;
246def S_MOVRELD_B64 : SOP1_64 <"s_movreld_b64">;
247} // End Uses = [M0]
248
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000249let SubtargetPredicate = isGFX6GFX7GFX8GFX9 in {
Dmitry Preobrazhensky12194e92017-04-12 12:40:19 +0000250def S_CBRANCH_JOIN : SOP1_0_32R <"s_cbranch_join">;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000251def S_MOV_REGRD_B32 : SOP1_32 <"s_mov_regrd_b32">;
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000252} // End SubtargetPredicate = isGFX6GFX7GFX8GFX9
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000253
Valery Pykhtina34fb492016-08-30 15:20:31 +0000254let Defs = [SCC] in {
255def S_ABS_I32 : SOP1_32 <"s_abs_i32">;
256} // End Defs = [SCC]
257def S_MOV_FED_B32 : SOP1_32 <"s_mov_fed_b32">;
258
Matt Arsenaultcc88ce32016-10-12 18:00:51 +0000259let SubtargetPredicate = HasVGPRIndexMode in {
260def S_SET_GPR_IDX_IDX : SOP1_0_32<"s_set_gpr_idx_idx"> {
261 let Uses = [M0];
262 let Defs = [M0];
263}
264}
Valery Pykhtina34fb492016-08-30 15:20:31 +0000265
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000266let SubtargetPredicate = isGFX9Plus in {
Dmitry Preobrazhenskyf20aff52018-04-06 16:35:11 +0000267 let hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] in {
268 def S_ANDN1_SAVEEXEC_B64 : SOP1_64<"s_andn1_saveexec_b64">;
269 def S_ORN1_SAVEEXEC_B64 : SOP1_64<"s_orn1_saveexec_b64">;
270 def S_ANDN1_WREXEC_B64 : SOP1_64<"s_andn1_wrexec_b64">;
271 def S_ANDN2_WREXEC_B64 : SOP1_64<"s_andn2_wrexec_b64">;
272 } // End hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC]
273
274 def S_BITREPLICATE_B64_B32 : SOP1_64_32<"s_bitreplicate_b64_b32">;
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000275} // End SubtargetPredicate = isGFX9Plus
Dmitry Preobrazhenskyf20aff52018-04-06 16:35:11 +0000276
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000277let SubtargetPredicate = isGFX10Plus in {
Stanislav Mekhanoshin8bcc9bb2019-06-13 19:18:29 +0000278 let hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] in {
279 def S_AND_SAVEEXEC_B32 : SOP1_32<"s_and_saveexec_b32">;
280 def S_OR_SAVEEXEC_B32 : SOP1_32<"s_or_saveexec_b32">;
281 def S_XOR_SAVEEXEC_B32 : SOP1_32<"s_xor_saveexec_b32">;
282 def S_ANDN2_SAVEEXEC_B32 : SOP1_32<"s_andn2_saveexec_b32">;
283 def S_ORN2_SAVEEXEC_B32 : SOP1_32<"s_orn2_saveexec_b32">;
284 def S_NAND_SAVEEXEC_B32 : SOP1_32<"s_nand_saveexec_b32">;
285 def S_NOR_SAVEEXEC_B32 : SOP1_32<"s_nor_saveexec_b32">;
286 def S_XNOR_SAVEEXEC_B32 : SOP1_32<"s_xnor_saveexec_b32">;
287 def S_ANDN1_SAVEEXEC_B32 : SOP1_32<"s_andn1_saveexec_b32">;
288 def S_ORN1_SAVEEXEC_B32 : SOP1_32<"s_orn1_saveexec_b32">;
289 def S_ANDN1_WREXEC_B32 : SOP1_32<"s_andn1_wrexec_b32">;
290 def S_ANDN2_WREXEC_B32 : SOP1_32<"s_andn2_wrexec_b32">;
291 } // End hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC]
292
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000293 let Uses = [M0] in {
294 def S_MOVRELSD_2_B32 : SOP1_32<"s_movrelsd_2_b32">;
295 } // End Uses = [M0]
296} // End SubtargetPredicate = isGFX10Plus
297
Valery Pykhtina34fb492016-08-30 15:20:31 +0000298//===----------------------------------------------------------------------===//
299// SOP2 Instructions
300//===----------------------------------------------------------------------===//
301
302class SOP2_Pseudo<string opName, dag outs, dag ins,
303 string asmOps, list<dag> pattern=[]> :
Nicolai Haehnle4f850ea2018-03-26 13:56:53 +0000304 SOP_Pseudo<opName, outs, ins, asmOps, pattern> {
305
Valery Pykhtina34fb492016-08-30 15:20:31 +0000306 let mayLoad = 0;
307 let mayStore = 0;
308 let hasSideEffects = 0;
309 let SALU = 1;
310 let SOP2 = 1;
311 let SchedRW = [WriteSALU];
312 let UseNamedOperandTable = 1;
313
Nicolai Haehnle4f850ea2018-03-26 13:56:53 +0000314 let has_sdst = 1;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000315
316 // Pseudo instructions have no encodings, but adding this field here allows
317 // us to do:
318 // let sdst = xxx in {
319 // for multiclasses that include both real and pseudo instructions.
320 // field bits<7> sdst = 0;
321 // let Size = 4; // Do we need size here?
322}
323
Nicolai Haehnle4f850ea2018-03-26 13:56:53 +0000324class SOP2_Real<bits<7> op, SOP_Pseudo ps> :
Valery Pykhtina34fb492016-08-30 15:20:31 +0000325 InstSI <ps.OutOperandList, ps.InOperandList,
326 ps.Mnemonic # " " # ps.AsmOperands, []>,
327 Enc32 {
328 let isPseudo = 0;
329 let isCodeGenOnly = 0;
330
331 // copy relevant pseudo op flags
332 let SubtargetPredicate = ps.SubtargetPredicate;
333 let AsmMatchConverter = ps.AsmMatchConverter;
Dmitry Preobrazhensky61105ba2019-01-18 13:57:43 +0000334 let UseNamedOperandTable = ps.UseNamedOperandTable;
335 let TSFlags = ps.TSFlags;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000336
337 // encoding
338 bits<7> sdst;
339 bits<8> src0;
340 bits<8> src1;
341
342 let Inst{7-0} = src0;
343 let Inst{15-8} = src1;
344 let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
345 let Inst{29-23} = op;
346 let Inst{31-30} = 0x2; // encoding
347}
348
349
350class SOP2_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000351 opName, (outs SReg_32:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000352 "$sdst, $src0, $src1", pattern
353>;
354
355class SOP2_64 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000356 opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b64:$src1),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000357 "$sdst, $src0, $src1", pattern
358>;
359
360class SOP2_64_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000361 opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b32:$src1),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000362 "$sdst, $src0, $src1", pattern
363>;
364
365class SOP2_64_32_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000366 opName, (outs SReg_64:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000367 "$sdst, $src0, $src1", pattern
368>;
369
Graham Sellers04f7a4d2018-11-29 16:05:38 +0000370class UniformUnaryFrag<SDPatternOperator Op> : PatFrag <
371 (ops node:$src0),
372 (Op $src0),
373 [{ return !N->isDivergent(); }]
374>;
375
Alexander Timofeev36617f012018-09-21 10:31:22 +0000376class UniformBinFrag<SDPatternOperator Op> : PatFrag <
377 (ops node:$src0, node:$src1),
378 (Op $src0, $src1),
379 [{ return !N->isDivergent(); }]
380>;
381
Valery Pykhtina34fb492016-08-30 15:20:31 +0000382let Defs = [SCC] in { // Carry out goes to SCC
383let isCommutable = 1 in {
384def S_ADD_U32 : SOP2_32 <"s_add_u32">;
385def S_ADD_I32 : SOP2_32 <"s_add_i32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000386 [(set i32:$sdst, (UniformBinFrag<add> SSrc_b32:$src0, SSrc_b32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000387>;
388} // End isCommutable = 1
389
390def S_SUB_U32 : SOP2_32 <"s_sub_u32">;
391def S_SUB_I32 : SOP2_32 <"s_sub_i32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000392 [(set i32:$sdst, (UniformBinFrag<sub> SSrc_b32:$src0, SSrc_b32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000393>;
394
395let Uses = [SCC] in { // Carry in comes from SCC
396let isCommutable = 1 in {
397def S_ADDC_U32 : SOP2_32 <"s_addc_u32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000398 [(set i32:$sdst, (UniformBinFrag<adde> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000399} // End isCommutable = 1
400
401def S_SUBB_U32 : SOP2_32 <"s_subb_u32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000402 [(set i32:$sdst, (UniformBinFrag<sube> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000403} // End Uses = [SCC]
404
Matt Arsenault479ba3a2016-09-07 06:25:55 +0000405
406let isCommutable = 1 in {
Valery Pykhtina34fb492016-08-30 15:20:31 +0000407def S_MIN_I32 : SOP2_32 <"s_min_i32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000408 [(set i32:$sdst, (UniformBinFrag<smin> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000409>;
410def S_MIN_U32 : SOP2_32 <"s_min_u32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000411 [(set i32:$sdst, (UniformBinFrag<umin> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000412>;
413def S_MAX_I32 : SOP2_32 <"s_max_i32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000414 [(set i32:$sdst, (UniformBinFrag<smax> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000415>;
416def S_MAX_U32 : SOP2_32 <"s_max_u32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000417 [(set i32:$sdst, (UniformBinFrag<umax> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000418>;
Matt Arsenault479ba3a2016-09-07 06:25:55 +0000419} // End isCommutable = 1
Valery Pykhtina34fb492016-08-30 15:20:31 +0000420} // End Defs = [SCC]
421
422
423let Uses = [SCC] in {
424 def S_CSELECT_B32 : SOP2_32 <"s_cselect_b32">;
425 def S_CSELECT_B64 : SOP2_64 <"s_cselect_b64">;
426} // End Uses = [SCC]
427
428let Defs = [SCC] in {
Matt Arsenault479ba3a2016-09-07 06:25:55 +0000429let isCommutable = 1 in {
Valery Pykhtina34fb492016-08-30 15:20:31 +0000430def S_AND_B32 : SOP2_32 <"s_and_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000431 [(set i32:$sdst, (UniformBinFrag<and> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000432>;
433
434def S_AND_B64 : SOP2_64 <"s_and_b64",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000435 [(set i64:$sdst, (UniformBinFrag<and> i64:$src0, i64:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000436>;
437
438def S_OR_B32 : SOP2_32 <"s_or_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000439 [(set i32:$sdst, (UniformBinFrag<or> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000440>;
441
442def S_OR_B64 : SOP2_64 <"s_or_b64",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000443 [(set i64:$sdst, (UniformBinFrag<or> i64:$src0, i64:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000444>;
445
446def S_XOR_B32 : SOP2_32 <"s_xor_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000447 [(set i32:$sdst, (UniformBinFrag<xor> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000448>;
449
450def S_XOR_B64 : SOP2_64 <"s_xor_b64",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000451 [(set i64:$sdst, (UniformBinFrag<xor> i64:$src0, i64:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000452>;
Konstantin Zhuravlyovca8946a2017-09-18 21:22:45 +0000453
454def S_XNOR_B32 : SOP2_32 <"s_xnor_b32",
455 [(set i32:$sdst, (not (xor_oneuse i32:$src0, i32:$src1)))]
456>;
457
458def S_XNOR_B64 : SOP2_64 <"s_xnor_b64",
459 [(set i64:$sdst, (not (xor_oneuse i64:$src0, i64:$src1)))]
460>;
Graham Sellers04f7a4d2018-11-29 16:05:38 +0000461
462def S_NAND_B32 : SOP2_32 <"s_nand_b32",
463 [(set i32:$sdst, (not (and_oneuse i32:$src0, i32:$src1)))]
464>;
465
466def S_NAND_B64 : SOP2_64 <"s_nand_b64",
467 [(set i64:$sdst, (not (and_oneuse i64:$src0, i64:$src1)))]
468>;
469
470def S_NOR_B32 : SOP2_32 <"s_nor_b32",
471 [(set i32:$sdst, (not (or_oneuse i32:$src0, i32:$src1)))]
472>;
473
474def S_NOR_B64 : SOP2_64 <"s_nor_b64",
475 [(set i64:$sdst, (not (or_oneuse i64:$src0, i64:$src1)))]
476>;
Matt Arsenault479ba3a2016-09-07 06:25:55 +0000477} // End isCommutable = 1
478
Graham Sellers04f7a4d2018-11-29 16:05:38 +0000479def S_ANDN2_B32 : SOP2_32 <"s_andn2_b32",
480 [(set i32:$sdst, (UniformBinFrag<and> i32:$src0, (UniformUnaryFrag<not> i32:$src1)))]
481>;
482
483def S_ANDN2_B64 : SOP2_64 <"s_andn2_b64",
484 [(set i64:$sdst, (UniformBinFrag<and> i64:$src0, (UniformUnaryFrag<not> i64:$src1)))]
485>;
486
487def S_ORN2_B32 : SOP2_32 <"s_orn2_b32",
488 [(set i32:$sdst, (UniformBinFrag<or> i32:$src0, (UniformUnaryFrag<not> i32:$src1)))]
489>;
490
491def S_ORN2_B64 : SOP2_64 <"s_orn2_b64",
492 [(set i64:$sdst, (UniformBinFrag<or> i64:$src0, (UniformUnaryFrag<not> i64:$src1)))]
493>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000494} // End Defs = [SCC]
495
496// Use added complexity so these patterns are preferred to the VALU patterns.
497let AddedComplexity = 1 in {
498
499let Defs = [SCC] in {
Alexander Timofeev36617f012018-09-21 10:31:22 +0000500// TODO: b64 versions require VOP3 change since v_lshlrev_b64 is VOP3
Valery Pykhtina34fb492016-08-30 15:20:31 +0000501def S_LSHL_B32 : SOP2_32 <"s_lshl_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000502 [(set i32:$sdst, (UniformBinFrag<shl> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000503>;
504def S_LSHL_B64 : SOP2_64_32 <"s_lshl_b64",
Alexander Timofeevb048fa32018-10-01 11:06:35 +0000505 [(set i64:$sdst, (UniformBinFrag<shl> i64:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000506>;
507def S_LSHR_B32 : SOP2_32 <"s_lshr_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000508 [(set i32:$sdst, (UniformBinFrag<srl> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000509>;
510def S_LSHR_B64 : SOP2_64_32 <"s_lshr_b64",
Alexander Timofeevb048fa32018-10-01 11:06:35 +0000511 [(set i64:$sdst, (UniformBinFrag<srl> i64:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000512>;
513def S_ASHR_I32 : SOP2_32 <"s_ashr_i32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000514 [(set i32:$sdst, (UniformBinFrag<sra> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000515>;
516def S_ASHR_I64 : SOP2_64_32 <"s_ashr_i64",
Alexander Timofeevb048fa32018-10-01 11:06:35 +0000517 [(set i64:$sdst, (UniformBinFrag<sra> i64:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000518>;
519} // End Defs = [SCC]
520
521def S_BFM_B32 : SOP2_32 <"s_bfm_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000522 [(set i32:$sdst, (UniformBinFrag<AMDGPUbfm> i32:$src0, i32:$src1))]>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000523def S_BFM_B64 : SOP2_64_32_32 <"s_bfm_b64">;
Alexander Timofeev36617f012018-09-21 10:31:22 +0000524
525// TODO: S_MUL_I32 require V_MUL_LO_I32 from VOP3 change
Valery Pykhtina34fb492016-08-30 15:20:31 +0000526def S_MUL_I32 : SOP2_32 <"s_mul_i32",
Matt Arsenault479ba3a2016-09-07 06:25:55 +0000527 [(set i32:$sdst, (mul i32:$src0, i32:$src1))]> {
528 let isCommutable = 1;
529}
Valery Pykhtina34fb492016-08-30 15:20:31 +0000530
531} // End AddedComplexity = 1
532
533let Defs = [SCC] in {
534def S_BFE_U32 : SOP2_32 <"s_bfe_u32">;
535def S_BFE_I32 : SOP2_32 <"s_bfe_i32">;
536def S_BFE_U64 : SOP2_64_32 <"s_bfe_u64">;
537def S_BFE_I64 : SOP2_64_32 <"s_bfe_i64">;
538} // End Defs = [SCC]
539
540def S_CBRANCH_G_FORK : SOP2_Pseudo <
541 "s_cbranch_g_fork", (outs),
Dmitry Preobrazhensky57148602017-04-14 11:52:26 +0000542 (ins SCSrc_b64:$src0, SCSrc_b64:$src1),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000543 "$src0, $src1"
544> {
545 let has_sdst = 0;
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000546 let SubtargetPredicate = isGFX6GFX7GFX8GFX9;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000547}
548
549let Defs = [SCC] in {
550def S_ABSDIFF_I32 : SOP2_32 <"s_absdiff_i32">;
551} // End Defs = [SCC]
552
Stanislav Mekhanoshin51823022019-04-06 09:20:48 +0000553let SubtargetPredicate = isGFX8GFX9 in {
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +0000554 def S_RFE_RESTORE_B64 : SOP2_Pseudo <
555 "s_rfe_restore_b64", (outs),
556 (ins SSrc_b64:$src0, SSrc_b32:$src1),
557 "$src0, $src1"
558 > {
559 let hasSideEffects = 1;
560 let has_sdst = 0;
561 }
562}
563
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000564let SubtargetPredicate = isGFX9Plus in {
Matt Arsenault9be7b0d2017-02-27 18:49:11 +0000565 def S_PACK_LL_B32_B16 : SOP2_32<"s_pack_ll_b32_b16">;
566 def S_PACK_LH_B32_B16 : SOP2_32<"s_pack_lh_b32_b16">;
567 def S_PACK_HH_B32_B16 : SOP2_32<"s_pack_hh_b32_b16">;
Dmitry Preobrazhensky2f8e1462018-04-09 13:10:33 +0000568
569 let Defs = [SCC] in {
570 def S_LSHL1_ADD_U32 : SOP2_32<"s_lshl1_add_u32">;
571 def S_LSHL2_ADD_U32 : SOP2_32<"s_lshl2_add_u32">;
572 def S_LSHL3_ADD_U32 : SOP2_32<"s_lshl3_add_u32">;
573 def S_LSHL4_ADD_U32 : SOP2_32<"s_lshl4_add_u32">;
574 } // End Defs = [SCC]
575
Konstantin Zhuravlyovfe23ed22019-05-28 21:18:34 +0000576 def S_MUL_HI_U32 : SOP2_32<"s_mul_hi_u32">;
577 def S_MUL_HI_I32 : SOP2_32<"s_mul_hi_i32">;
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000578} // End SubtargetPredicate = isGFX9Plus
Valery Pykhtina34fb492016-08-30 15:20:31 +0000579
580//===----------------------------------------------------------------------===//
581// SOPK Instructions
582//===----------------------------------------------------------------------===//
583
584class SOPK_Pseudo <string opName, dag outs, dag ins,
585 string asmOps, list<dag> pattern=[]> :
586 InstSI <outs, ins, "", pattern>,
587 SIMCInstr<opName, SIEncodingFamily.NONE> {
588 let isPseudo = 1;
589 let isCodeGenOnly = 1;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000590 let mayLoad = 0;
591 let mayStore = 0;
592 let hasSideEffects = 0;
593 let SALU = 1;
594 let SOPK = 1;
595 let SchedRW = [WriteSALU];
596 let UseNamedOperandTable = 1;
597 string Mnemonic = opName;
598 string AsmOperands = asmOps;
599
600 bits<1> has_sdst = 1;
601}
602
603class SOPK_Real<bits<5> op, SOPK_Pseudo ps> :
604 InstSI <ps.OutOperandList, ps.InOperandList,
605 ps.Mnemonic # " " # ps.AsmOperands, []> {
606 let isPseudo = 0;
607 let isCodeGenOnly = 0;
608
609 // copy relevant pseudo op flags
610 let SubtargetPredicate = ps.SubtargetPredicate;
611 let AsmMatchConverter = ps.AsmMatchConverter;
612 let DisableEncoding = ps.DisableEncoding;
613 let Constraints = ps.Constraints;
614
615 // encoding
616 bits<7> sdst;
617 bits<16> simm16;
618 bits<32> imm;
619}
620
621class SOPK_Real32<bits<5> op, SOPK_Pseudo ps> :
622 SOPK_Real <op, ps>,
623 Enc32 {
624 let Inst{15-0} = simm16;
625 let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
626 let Inst{27-23} = op;
627 let Inst{31-28} = 0xb; //encoding
628}
629
630class SOPK_Real64<bits<5> op, SOPK_Pseudo ps> :
631 SOPK_Real<op, ps>,
632 Enc64 {
633 let Inst{15-0} = simm16;
634 let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
635 let Inst{27-23} = op;
636 let Inst{31-28} = 0xb; //encoding
637 let Inst{63-32} = imm;
638}
639
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000640class SOPKInstTable <bit is_sopk, string cmpOp = ""> {
641 bit IsSOPK = is_sopk;
642 string BaseCmpOp = cmpOp;
643}
644
Valery Pykhtina34fb492016-08-30 15:20:31 +0000645class SOPK_32 <string opName, list<dag> pattern=[]> : SOPK_Pseudo <
646 opName,
647 (outs SReg_32:$sdst),
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000648 (ins s16imm:$simm16),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000649 "$sdst, $simm16",
650 pattern>;
651
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000652class SOPK_32_BR <string opName, list<dag> pattern=[]> : SOPK_Pseudo <
653 opName,
654 (outs),
655 (ins sopp_brtarget:$simm16, SReg_32:$sdst),
656 "$sdst, $simm16",
657 pattern> {
658 let Defs = [EXEC];
659 let Uses = [EXEC];
660 let isBranch = 1;
661 let isTerminator = 1;
662 let SchedRW = [WriteBranch];
663}
664
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000665class SOPK_SCC <string opName, string base_op, bit isSignExt> : SOPK_Pseudo <
Valery Pykhtina34fb492016-08-30 15:20:31 +0000666 opName,
667 (outs),
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000668 !if(isSignExt,
669 (ins SReg_32:$sdst, s16imm:$simm16),
670 (ins SReg_32:$sdst, u16imm:$simm16)),
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000671 "$sdst, $simm16", []>,
672 SOPKInstTable<1, base_op>{
Valery Pykhtina34fb492016-08-30 15:20:31 +0000673 let Defs = [SCC];
674}
675
676class SOPK_32TIE <string opName, list<dag> pattern=[]> : SOPK_Pseudo <
677 opName,
678 (outs SReg_32:$sdst),
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000679 (ins SReg_32:$src0, s16imm:$simm16),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000680 "$sdst, $simm16",
681 pattern
682>;
683
684let isReMaterializable = 1, isMoveImm = 1 in {
685def S_MOVK_I32 : SOPK_32 <"s_movk_i32">;
686} // End isReMaterializable = 1
687let Uses = [SCC] in {
688def S_CMOVK_I32 : SOPK_32 <"s_cmovk_i32">;
689}
690
691let isCompare = 1 in {
692
693// This instruction is disabled for now until we can figure out how to teach
694// the instruction selector to correctly use the S_CMP* vs V_CMP*
695// instructions.
696//
697// When this instruction is enabled the code generator sometimes produces this
698// invalid sequence:
699//
700// SCC = S_CMPK_EQ_I32 SGPR0, imm
701// VCC = COPY SCC
702// VGPR0 = V_CNDMASK VCC, VGPR0, VGPR1
703//
704// def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32",
705// [(set i1:$dst, (setcc i32:$src0, imm:$src1, SETEQ))]
706// >;
707
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000708def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32", "s_cmp_eq_i32", 1>;
709def S_CMPK_LG_I32 : SOPK_SCC <"s_cmpk_lg_i32", "s_cmp_lg_i32", 1>;
710def S_CMPK_GT_I32 : SOPK_SCC <"s_cmpk_gt_i32", "s_cmp_gt_i32", 1>;
711def S_CMPK_GE_I32 : SOPK_SCC <"s_cmpk_ge_i32", "s_cmp_ge_i32", 1>;
712def S_CMPK_LT_I32 : SOPK_SCC <"s_cmpk_lt_i32", "s_cmp_lt_i32", 1>;
713def S_CMPK_LE_I32 : SOPK_SCC <"s_cmpk_le_i32", "s_cmp_le_i32", 1>;
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000714
715let SOPKZext = 1 in {
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000716def S_CMPK_EQ_U32 : SOPK_SCC <"s_cmpk_eq_u32", "s_cmp_eq_u32", 0>;
717def S_CMPK_LG_U32 : SOPK_SCC <"s_cmpk_lg_u32", "s_cmp_lg_u32", 0>;
718def S_CMPK_GT_U32 : SOPK_SCC <"s_cmpk_gt_u32", "s_cmp_gt_u32", 0>;
719def S_CMPK_GE_U32 : SOPK_SCC <"s_cmpk_ge_u32", "s_cmp_ge_u32", 0>;
720def S_CMPK_LT_U32 : SOPK_SCC <"s_cmpk_lt_u32", "s_cmp_lt_u32", 0>;
721def S_CMPK_LE_U32 : SOPK_SCC <"s_cmpk_le_u32", "s_cmp_le_u32", 0>;
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000722} // End SOPKZext = 1
Valery Pykhtina34fb492016-08-30 15:20:31 +0000723} // End isCompare = 1
724
725let Defs = [SCC], isCommutable = 1, DisableEncoding = "$src0",
726 Constraints = "$sdst = $src0" in {
727 def S_ADDK_I32 : SOPK_32TIE <"s_addk_i32">;
728 def S_MULK_I32 : SOPK_32TIE <"s_mulk_i32">;
729}
730
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000731let SubtargetPredicate = isGFX6GFX7GFX8GFX9 in
Valery Pykhtina34fb492016-08-30 15:20:31 +0000732def S_CBRANCH_I_FORK : SOPK_Pseudo <
733 "s_cbranch_i_fork",
Dmitry Preobrazhensky5ae31132019-05-17 14:57:04 +0000734 (outs), (ins SReg_64:$sdst, sopp_brtarget:$simm16),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000735 "$sdst, $simm16"
736>;
737
738let mayLoad = 1 in {
739def S_GETREG_B32 : SOPK_Pseudo <
740 "s_getreg_b32",
741 (outs SReg_32:$sdst), (ins hwreg:$simm16),
742 "$sdst, $simm16"
743>;
744}
745
Tom Stellard8485fa02016-12-07 02:42:15 +0000746let hasSideEffects = 1 in {
747
Valery Pykhtina34fb492016-08-30 15:20:31 +0000748def S_SETREG_B32 : SOPK_Pseudo <
749 "s_setreg_b32",
750 (outs), (ins SReg_32:$sdst, hwreg:$simm16),
Tom Stellard8485fa02016-12-07 02:42:15 +0000751 "$simm16, $sdst",
752 [(AMDGPUsetreg i32:$sdst, (i16 timm:$simm16))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000753>;
754
755// FIXME: Not on SI?
756//def S_GETREG_REGRD_B32 : SOPK_32 <sopk<0x14, 0x13>, "s_getreg_regrd_b32">;
757
758def S_SETREG_IMM32_B32 : SOPK_Pseudo <
759 "s_setreg_imm32_b32",
760 (outs), (ins i32imm:$imm, hwreg:$simm16),
Matt Arsenault10c17ca2016-10-06 10:13:23 +0000761 "$simm16, $imm"> {
762 let Size = 8; // Unlike every other SOPK instruction.
Valery Pykhtina34fb492016-08-30 15:20:31 +0000763 let has_sdst = 0;
764}
765
Tom Stellard8485fa02016-12-07 02:42:15 +0000766} // End hasSideEffects = 1
Valery Pykhtina34fb492016-08-30 15:20:31 +0000767
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000768class SOPK_WAITCNT<string opName, list<dag> pat=[]> :
769 SOPK_Pseudo<
770 opName,
771 (outs),
772 (ins SReg_32:$sdst, s16imm:$simm16),
773 "$sdst, $simm16",
774 pat> {
775 let hasSideEffects = 1;
776 let mayLoad = 1;
777 let mayStore = 1;
778 let has_sdst = 1; // First source takes place of sdst in encoding
779}
780
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000781let SubtargetPredicate = isGFX9Plus in {
Dmitry Preobrazhenskyae312232018-04-06 18:24:49 +0000782 def S_CALL_B64 : SOPK_Pseudo<
783 "s_call_b64",
784 (outs SReg_64:$sdst),
Dmitry Preobrazhensky5ae31132019-05-17 14:57:04 +0000785 (ins sopp_brtarget:$simm16),
Dmitry Preobrazhenskyae312232018-04-06 18:24:49 +0000786 "$sdst, $simm16"> {
787 let isCall = 1;
788 }
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000789} // End SubtargetPredicate = isGFX9Plus
Dmitry Preobrazhenskyae312232018-04-06 18:24:49 +0000790
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000791let SubtargetPredicate = isGFX10Plus in {
792 def S_VERSION : SOPK_Pseudo<
793 "s_version",
794 (outs),
795 (ins s16imm:$simm16),
796 "$simm16"> {
797 let has_sdst = 0;
798 }
799
Stanislav Mekhanoshin8bcc9bb2019-06-13 19:18:29 +0000800 def S_SUBVECTOR_LOOP_BEGIN : SOPK_32_BR<"s_subvector_loop_begin">;
801 def S_SUBVECTOR_LOOP_END : SOPK_32_BR<"s_subvector_loop_end">;
802
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000803 def S_WAITCNT_VSCNT : SOPK_WAITCNT<"s_waitcnt_vscnt">;
804 def S_WAITCNT_VMCNT : SOPK_WAITCNT<"s_waitcnt_vmcnt">;
805 def S_WAITCNT_EXPCNT : SOPK_WAITCNT<"s_waitcnt_expcnt">;
806 def S_WAITCNT_LGKMCNT : SOPK_WAITCNT<"s_waitcnt_lgkmcnt">;
807} // End SubtargetPredicate = isGFX10Plus
808
Valery Pykhtina34fb492016-08-30 15:20:31 +0000809//===----------------------------------------------------------------------===//
810// SOPC Instructions
811//===----------------------------------------------------------------------===//
812
813class SOPCe <bits<7> op> : Enc32 {
814 bits<8> src0;
815 bits<8> src1;
816
817 let Inst{7-0} = src0;
818 let Inst{15-8} = src1;
819 let Inst{22-16} = op;
820 let Inst{31-23} = 0x17e;
821}
822
Matt Arsenaultcc88ce32016-10-12 18:00:51 +0000823class SOPC <bits<7> op, dag outs, dag ins, string asm,
824 list<dag> pattern = []> :
Valery Pykhtina34fb492016-08-30 15:20:31 +0000825 InstSI<outs, ins, asm, pattern>, SOPCe <op> {
826 let mayLoad = 0;
827 let mayStore = 0;
828 let hasSideEffects = 0;
829 let SALU = 1;
830 let SOPC = 1;
831 let isCodeGenOnly = 0;
832 let Defs = [SCC];
833 let SchedRW = [WriteSALU];
834 let UseNamedOperandTable = 1;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000835}
836
837class SOPC_Base <bits<7> op, RegisterOperand rc0, RegisterOperand rc1,
838 string opName, list<dag> pattern = []> : SOPC <
839 op, (outs), (ins rc0:$src0, rc1:$src1),
840 opName#" $src0, $src1", pattern > {
841 let Defs = [SCC];
842}
843class SOPC_Helper <bits<7> op, RegisterOperand rc, ValueType vt,
844 string opName, PatLeaf cond> : SOPC_Base <
845 op, rc, rc, opName,
846 [(set SCC, (si_setcc_uniform vt:$src0, vt:$src1, cond))] > {
847}
848
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000849class SOPC_CMP_32<bits<7> op, string opName,
850 PatLeaf cond = COND_NULL, string revOp = opName>
851 : SOPC_Helper<op, SSrc_b32, i32, opName, cond>,
852 Commutable_REV<revOp, !eq(revOp, opName)>,
853 SOPKInstTable<0, opName> {
854 let isCompare = 1;
855 let isCommutable = 1;
856}
Valery Pykhtina34fb492016-08-30 15:20:31 +0000857
Matt Arsenault7b1dc2c2016-09-17 02:02:19 +0000858class SOPC_CMP_64<bits<7> op, string opName,
859 PatLeaf cond = COND_NULL, string revOp = opName>
860 : SOPC_Helper<op, SSrc_b64, i64, opName, cond>,
861 Commutable_REV<revOp, !eq(revOp, opName)> {
862 let isCompare = 1;
863 let isCommutable = 1;
864}
865
Valery Pykhtina34fb492016-08-30 15:20:31 +0000866class SOPC_32<bits<7> op, string opName, list<dag> pattern = []>
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000867 : SOPC_Base<op, SSrc_b32, SSrc_b32, opName, pattern>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000868
869class SOPC_64_32<bits<7> op, string opName, list<dag> pattern = []>
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000870 : SOPC_Base<op, SSrc_b64, SSrc_b32, opName, pattern>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000871
Matt Arsenault5d8eb252016-09-30 01:50:20 +0000872def S_CMP_EQ_I32 : SOPC_CMP_32 <0x00, "s_cmp_eq_i32">;
873def S_CMP_LG_I32 : SOPC_CMP_32 <0x01, "s_cmp_lg_i32">;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000874def S_CMP_GT_I32 : SOPC_CMP_32 <0x02, "s_cmp_gt_i32", COND_SGT>;
875def S_CMP_GE_I32 : SOPC_CMP_32 <0x03, "s_cmp_ge_i32", COND_SGE>;
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000876def S_CMP_LT_I32 : SOPC_CMP_32 <0x04, "s_cmp_lt_i32", COND_SLT, "s_cmp_gt_i32">;
877def S_CMP_LE_I32 : SOPC_CMP_32 <0x05, "s_cmp_le_i32", COND_SLE, "s_cmp_ge_i32">;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000878def S_CMP_EQ_U32 : SOPC_CMP_32 <0x06, "s_cmp_eq_u32", COND_EQ>;
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000879def S_CMP_LG_U32 : SOPC_CMP_32 <0x07, "s_cmp_lg_u32", COND_NE>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000880def S_CMP_GT_U32 : SOPC_CMP_32 <0x08, "s_cmp_gt_u32", COND_UGT>;
881def S_CMP_GE_U32 : SOPC_CMP_32 <0x09, "s_cmp_ge_u32", COND_UGE>;
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000882def S_CMP_LT_U32 : SOPC_CMP_32 <0x0a, "s_cmp_lt_u32", COND_ULT, "s_cmp_gt_u32">;
883def S_CMP_LE_U32 : SOPC_CMP_32 <0x0b, "s_cmp_le_u32", COND_ULE, "s_cmp_ge_u32">;
884
Valery Pykhtina34fb492016-08-30 15:20:31 +0000885def S_BITCMP0_B32 : SOPC_32 <0x0c, "s_bitcmp0_b32">;
886def S_BITCMP1_B32 : SOPC_32 <0x0d, "s_bitcmp1_b32">;
887def S_BITCMP0_B64 : SOPC_64_32 <0x0e, "s_bitcmp0_b64">;
888def S_BITCMP1_B64 : SOPC_64_32 <0x0f, "s_bitcmp1_b64">;
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000889let SubtargetPredicate = isGFX6GFX7GFX8GFX9 in
Valery Pykhtina34fb492016-08-30 15:20:31 +0000890def S_SETVSKIP : SOPC_32 <0x10, "s_setvskip">;
891
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000892let SubtargetPredicate = isGFX8Plus in {
Matt Arsenault7b1dc2c2016-09-17 02:02:19 +0000893def S_CMP_EQ_U64 : SOPC_CMP_64 <0x12, "s_cmp_eq_u64", COND_EQ>;
894def S_CMP_LG_U64 : SOPC_CMP_64 <0x13, "s_cmp_lg_u64", COND_NE>;
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000895} // End SubtargetPredicate = isGFX8Plus
Valery Pykhtina34fb492016-08-30 15:20:31 +0000896
Matt Arsenaultcc88ce32016-10-12 18:00:51 +0000897let SubtargetPredicate = HasVGPRIndexMode in {
898def S_SET_GPR_IDX_ON : SOPC <0x11,
899 (outs),
900 (ins SSrc_b32:$src0, GPRIdxMode:$src1),
901 "s_set_gpr_idx_on $src0,$src1"> {
902 let Defs = [M0]; // No scc def
903 let Uses = [M0]; // Other bits of m0 unmodified.
904 let hasSideEffects = 1; // Sets mode.gpr_idx_en
Matt Arsenault2d8c2892016-11-01 20:42:24 +0000905 let FixedSize = 1;
Matt Arsenaultcc88ce32016-10-12 18:00:51 +0000906}
907}
908
Valery Pykhtina34fb492016-08-30 15:20:31 +0000909//===----------------------------------------------------------------------===//
910// SOPP Instructions
911//===----------------------------------------------------------------------===//
912
913class SOPPe <bits<7> op> : Enc32 {
914 bits <16> simm16;
915
916 let Inst{15-0} = simm16;
917 let Inst{22-16} = op;
918 let Inst{31-23} = 0x17f; // encoding
919}
920
921class SOPP <bits<7> op, dag ins, string asm, list<dag> pattern = []> :
922 InstSI <(outs), ins, asm, pattern >, SOPPe <op> {
923
924 let mayLoad = 0;
925 let mayStore = 0;
926 let hasSideEffects = 0;
927 let SALU = 1;
928 let SOPP = 1;
Matt Arsenault10c17ca2016-10-06 10:13:23 +0000929 let Size = 4;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000930 let SchedRW = [WriteSALU];
931
932 let UseNamedOperandTable = 1;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000933}
934
935
936def S_NOP : SOPP <0x00000000, (ins i16imm:$simm16), "s_nop $simm16">;
937
938let isTerminator = 1 in {
939
Matt Arsenault74d67c22019-06-14 13:26:29 +0000940def S_ENDPGM : SOPP <0x00000001, (ins EndpgmImm:$simm16), "s_endpgm$simm16"> {
Valery Pykhtina34fb492016-08-30 15:20:31 +0000941 let isBarrier = 1;
Matt Arsenault4e9c1e32016-10-28 23:00:38 +0000942 let isReturn = 1;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000943}
944
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +0000945def S_ENDPGM_SAVED : SOPP <0x0000001B, (ins), "s_endpgm_saved"> {
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000946 let SubtargetPredicate = isGFX8Plus;
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +0000947 let simm16 = 0;
948 let isBarrier = 1;
949 let isReturn = 1;
950}
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +0000951
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000952let SubtargetPredicate = isGFX9Plus in {
Dmitry Preobrazhensky306b1a02018-04-06 17:25:00 +0000953 let isBarrier = 1, isReturn = 1, simm16 = 0 in {
954 def S_ENDPGM_ORDERED_PS_DONE :
955 SOPP<0x01e, (ins), "s_endpgm_ordered_ps_done">;
956 } // End isBarrier = 1, isReturn = 1, simm16 = 0
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +0000957} // End SubtargetPredicate = isGFX9Plus
Dmitry Preobrazhensky306b1a02018-04-06 17:25:00 +0000958
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +0000959let SubtargetPredicate = isGFX10Plus in {
960 let isBarrier = 1, isReturn = 1, simm16 = 0 in {
961 def S_CODE_END :
962 SOPP<0x01f, (ins), "s_code_end">;
963 } // End isBarrier = 1, isReturn = 1, simm16 = 0
964} // End SubtargetPredicate = isGFX10Plus
965
Valery Pykhtina34fb492016-08-30 15:20:31 +0000966let isBranch = 1, SchedRW = [WriteBranch] in {
967def S_BRANCH : SOPP <
968 0x00000002, (ins sopp_brtarget:$simm16), "s_branch $simm16",
969 [(br bb:$simm16)]> {
970 let isBarrier = 1;
971}
972
973let Uses = [SCC] in {
974def S_CBRANCH_SCC0 : SOPP <
975 0x00000004, (ins sopp_brtarget:$simm16),
976 "s_cbranch_scc0 $simm16"
977>;
978def S_CBRANCH_SCC1 : SOPP <
979 0x00000005, (ins sopp_brtarget:$simm16),
Matt Arsenaultd674e0a2017-10-10 20:34:49 +0000980 "s_cbranch_scc1 $simm16"
Valery Pykhtina34fb492016-08-30 15:20:31 +0000981>;
982} // End Uses = [SCC]
983
984let Uses = [VCC] in {
985def S_CBRANCH_VCCZ : SOPP <
986 0x00000006, (ins sopp_brtarget:$simm16),
987 "s_cbranch_vccz $simm16"
988>;
989def S_CBRANCH_VCCNZ : SOPP <
990 0x00000007, (ins sopp_brtarget:$simm16),
991 "s_cbranch_vccnz $simm16"
992>;
993} // End Uses = [VCC]
994
995let Uses = [EXEC] in {
996def S_CBRANCH_EXECZ : SOPP <
997 0x00000008, (ins sopp_brtarget:$simm16),
998 "s_cbranch_execz $simm16"
999>;
1000def S_CBRANCH_EXECNZ : SOPP <
1001 0x00000009, (ins sopp_brtarget:$simm16),
1002 "s_cbranch_execnz $simm16"
1003>;
1004} // End Uses = [EXEC]
1005
Dmitry Preobrazhensky3ac63112017-04-05 17:26:45 +00001006def S_CBRANCH_CDBGSYS : SOPP <
1007 0x00000017, (ins sopp_brtarget:$simm16),
1008 "s_cbranch_cdbgsys $simm16"
1009>;
1010
1011def S_CBRANCH_CDBGSYS_AND_USER : SOPP <
1012 0x0000001A, (ins sopp_brtarget:$simm16),
1013 "s_cbranch_cdbgsys_and_user $simm16"
1014>;
1015
1016def S_CBRANCH_CDBGSYS_OR_USER : SOPP <
1017 0x00000019, (ins sopp_brtarget:$simm16),
1018 "s_cbranch_cdbgsys_or_user $simm16"
1019>;
1020
1021def S_CBRANCH_CDBGUSER : SOPP <
1022 0x00000018, (ins sopp_brtarget:$simm16),
1023 "s_cbranch_cdbguser $simm16"
1024>;
Valery Pykhtina34fb492016-08-30 15:20:31 +00001025
1026} // End isBranch = 1
1027} // End isTerminator = 1
1028
1029let hasSideEffects = 1 in {
1030def S_BARRIER : SOPP <0x0000000a, (ins), "s_barrier",
1031 [(int_amdgcn_s_barrier)]> {
1032 let SchedRW = [WriteBarrier];
1033 let simm16 = 0;
1034 let mayLoad = 1;
1035 let mayStore = 1;
1036 let isConvergent = 1;
1037}
1038
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +00001039def S_WAKEUP : SOPP <0x00000003, (ins), "s_wakeup"> {
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +00001040 let SubtargetPredicate = isGFX8Plus;
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +00001041 let simm16 = 0;
1042 let mayLoad = 1;
1043 let mayStore = 1;
1044}
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +00001045
Valery Pykhtina34fb492016-08-30 15:20:31 +00001046let mayLoad = 1, mayStore = 1, hasSideEffects = 1 in
1047def S_WAITCNT : SOPP <0x0000000c, (ins WAIT_FLAG:$simm16), "s_waitcnt $simm16">;
1048def S_SETHALT : SOPP <0x0000000d, (ins i16imm:$simm16), "s_sethalt $simm16">;
Dmitry Preobrazhensky3ac63112017-04-05 17:26:45 +00001049def S_SETKILL : SOPP <0x0000000b, (ins i16imm:$simm16), "s_setkill $simm16">;
Valery Pykhtina34fb492016-08-30 15:20:31 +00001050
1051// On SI the documentation says sleep for approximately 64 * low 2
1052// bits, consistent with the reported maximum of 448. On VI the
1053// maximum reported is 960 cycles, so 960 / 64 = 15 max, so is the
1054// maximum really 15 on VI?
1055def S_SLEEP : SOPP <0x0000000e, (ins i32imm:$simm16),
1056 "s_sleep $simm16", [(int_amdgcn_s_sleep SIMM16bit:$simm16)]> {
1057 let hasSideEffects = 1;
1058 let mayLoad = 1;
1059 let mayStore = 1;
1060}
1061
1062def S_SETPRIO : SOPP <0x0000000f, (ins i16imm:$simm16), "s_setprio $simm16">;
1063
1064let Uses = [EXEC, M0] in {
1065// FIXME: Should this be mayLoad+mayStore?
1066def S_SENDMSG : SOPP <0x00000010, (ins SendMsgImm:$simm16), "s_sendmsg $simm16",
1067 [(AMDGPUsendmsg (i32 imm:$simm16))]
1068>;
Jan Veselyd48445d2017-01-04 18:06:55 +00001069
1070def S_SENDMSGHALT : SOPP <0x00000011, (ins SendMsgImm:$simm16), "s_sendmsghalt $simm16",
1071 [(AMDGPUsendmsghalt (i32 imm:$simm16))]
1072>;
Valery Pykhtina34fb492016-08-30 15:20:31 +00001073} // End Uses = [EXEC, M0]
1074
Valery Pykhtina34fb492016-08-30 15:20:31 +00001075def S_TRAP : SOPP <0x00000012, (ins i16imm:$simm16), "s_trap $simm16">;
1076def S_ICACHE_INV : SOPP <0x00000013, (ins), "s_icache_inv"> {
1077 let simm16 = 0;
1078}
1079def S_INCPERFLEVEL : SOPP <0x00000014, (ins i32imm:$simm16), "s_incperflevel $simm16",
1080 [(int_amdgcn_s_incperflevel SIMM16bit:$simm16)]> {
1081 let hasSideEffects = 1;
1082 let mayLoad = 1;
1083 let mayStore = 1;
1084}
1085def S_DECPERFLEVEL : SOPP <0x00000015, (ins i32imm:$simm16), "s_decperflevel $simm16",
1086 [(int_amdgcn_s_decperflevel SIMM16bit:$simm16)]> {
1087 let hasSideEffects = 1;
1088 let mayLoad = 1;
1089 let mayStore = 1;
1090}
1091def S_TTRACEDATA : SOPP <0x00000016, (ins), "s_ttracedata"> {
1092 let simm16 = 0;
1093}
Matt Arsenaultcc88ce32016-10-12 18:00:51 +00001094
1095let SubtargetPredicate = HasVGPRIndexMode in {
1096def S_SET_GPR_IDX_OFF : SOPP<0x1c, (ins), "s_set_gpr_idx_off"> {
1097 let simm16 = 0;
1098}
1099}
Valery Pykhtina34fb492016-08-30 15:20:31 +00001100} // End hasSideEffects
1101
Matt Arsenaultcc88ce32016-10-12 18:00:51 +00001102let SubtargetPredicate = HasVGPRIndexMode in {
1103def S_SET_GPR_IDX_MODE : SOPP<0x1d, (ins GPRIdxMode:$simm16),
1104 "s_set_gpr_idx_mode$simm16"> {
1105 let Defs = [M0];
1106}
1107}
Valery Pykhtina34fb492016-08-30 15:20:31 +00001108
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +00001109let SubtargetPredicate = isGFX10Plus in {
1110 def S_INST_PREFETCH :
1111 SOPP<0x020, (ins s16imm:$simm16), "s_inst_prefetch $simm16">;
1112 def S_CLAUSE :
1113 SOPP<0x021, (ins s16imm:$simm16), "s_clause $simm16">;
1114 def S_WAITCNT_IDLE :
1115 SOPP <0x022, (ins), "s_wait_idle"> {
1116 let simm16 = 0;
1117 }
1118 def S_WAITCNT_DEPCTR :
1119 SOPP <0x023, (ins s16imm:$simm16), "s_waitcnt_depctr $simm16">;
1120 def S_ROUND_MODE :
1121 SOPP<0x024, (ins s16imm:$simm16), "s_round_mode $simm16">;
1122 def S_DENORM_MODE :
1123 SOPP<0x025, (ins s16imm:$simm16), "s_denorm_mode $simm16">;
1124 def S_TTRACEDATA_IMM :
1125 SOPP<0x028, (ins s16imm:$simm16), "s_ttracedata_imm $simm16">;
1126} // End SubtargetPredicate = isGFX10Plus
1127
Valery Pykhtina34fb492016-08-30 15:20:31 +00001128//===----------------------------------------------------------------------===//
1129// S_GETREG_B32 Intrinsic Pattern.
1130//===----------------------------------------------------------------------===//
Matt Arsenault90c75932017-10-03 00:06:41 +00001131def : GCNPat <
Valery Pykhtina34fb492016-08-30 15:20:31 +00001132 (int_amdgcn_s_getreg imm:$simm16),
1133 (S_GETREG_B32 (as_i16imm $simm16))
1134>;
1135
1136//===----------------------------------------------------------------------===//
1137// SOP1 Patterns
1138//===----------------------------------------------------------------------===//
1139
Matt Arsenault90c75932017-10-03 00:06:41 +00001140def : GCNPat <
David Stuttard20ea21c2019-03-12 09:52:58 +00001141 (AMDGPUendpgm),
1142 (S_ENDPGM (i16 0))
1143>;
1144
1145def : GCNPat <
Valery Pykhtina34fb492016-08-30 15:20:31 +00001146 (i64 (ctpop i64:$src)),
1147 (i64 (REG_SEQUENCE SReg_64,
1148 (i32 (COPY_TO_REGCLASS (S_BCNT1_I32_B64 $src), SReg_32)), sub0,
Tom Stellard115a6152016-11-10 16:02:37 +00001149 (S_MOV_B32 (i32 0)), sub1))
Valery Pykhtina34fb492016-08-30 15:20:31 +00001150>;
1151
Matt Arsenault90c75932017-10-03 00:06:41 +00001152def : GCNPat <
Valery Pykhtina34fb492016-08-30 15:20:31 +00001153 (i32 (smax i32:$x, (i32 (ineg i32:$x)))),
1154 (S_ABS_I32 $x)
1155>;
1156
Matt Arsenault90c75932017-10-03 00:06:41 +00001157def : GCNPat <
Tom Stellard115a6152016-11-10 16:02:37 +00001158 (i16 imm:$imm),
1159 (S_MOV_B32 imm:$imm)
1160>;
1161
1162// Same as a 32-bit inreg
Matt Arsenault90c75932017-10-03 00:06:41 +00001163def : GCNPat<
Tom Stellard115a6152016-11-10 16:02:37 +00001164 (i32 (sext i16:$src)),
1165 (S_SEXT_I32_I16 $src)
1166>;
1167
1168
Valery Pykhtina34fb492016-08-30 15:20:31 +00001169//===----------------------------------------------------------------------===//
1170// SOP2 Patterns
1171//===----------------------------------------------------------------------===//
1172
1173// V_ADD_I32_e32/S_ADD_U32 produces carry in VCC/SCC. For the vector
1174// case, the sgpr-copies pass will fix this to use the vector version.
Matt Arsenault90c75932017-10-03 00:06:41 +00001175def : GCNPat <
Valery Pykhtina34fb492016-08-30 15:20:31 +00001176 (i32 (addc i32:$src0, i32:$src1)),
1177 (S_ADD_U32 $src0, $src1)
1178>;
1179
Tom Stellard115a6152016-11-10 16:02:37 +00001180// FIXME: We need to use COPY_TO_REGCLASS to work-around the fact that
1181// REG_SEQUENCE patterns don't support instructions with multiple
1182// outputs.
Matt Arsenault90c75932017-10-03 00:06:41 +00001183def : GCNPat<
Tom Stellard115a6152016-11-10 16:02:37 +00001184 (i64 (zext i16:$src)),
1185 (REG_SEQUENCE SReg_64,
1186 (i32 (COPY_TO_REGCLASS (S_AND_B32 $src, (S_MOV_B32 (i32 0xffff))), SGPR_32)), sub0,
1187 (S_MOV_B32 (i32 0)), sub1)
1188>;
1189
Matt Arsenault90c75932017-10-03 00:06:41 +00001190def : GCNPat <
Tom Stellard115a6152016-11-10 16:02:37 +00001191 (i64 (sext i16:$src)),
1192 (REG_SEQUENCE SReg_64, (i32 (S_SEXT_I32_I16 $src)), sub0,
1193 (i32 (COPY_TO_REGCLASS (S_ASHR_I32 (i32 (S_SEXT_I32_I16 $src)), (S_MOV_B32 (i32 31))), SGPR_32)), sub1)
1194>;
1195
Matt Arsenault90c75932017-10-03 00:06:41 +00001196def : GCNPat<
Tom Stellard115a6152016-11-10 16:02:37 +00001197 (i32 (zext i16:$src)),
1198 (S_AND_B32 (S_MOV_B32 (i32 0xffff)), $src)
1199>;
1200
1201
1202
Valery Pykhtina34fb492016-08-30 15:20:31 +00001203//===----------------------------------------------------------------------===//
1204// SOPP Patterns
1205//===----------------------------------------------------------------------===//
1206
Matt Arsenault90c75932017-10-03 00:06:41 +00001207def : GCNPat <
Valery Pykhtina34fb492016-08-30 15:20:31 +00001208 (int_amdgcn_s_waitcnt i32:$simm16),
1209 (S_WAITCNT (as_i16imm $simm16))
1210>;
1211
Valery Pykhtina34fb492016-08-30 15:20:31 +00001212
1213//===----------------------------------------------------------------------===//
Stanislav Mekhanoshin7895c032019-04-05 18:24:34 +00001214// Target-specific instruction encodings.
Valery Pykhtina34fb492016-08-30 15:20:31 +00001215//===----------------------------------------------------------------------===//
1216
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +00001217//===----------------------------------------------------------------------===//
1218// SOP1 - GFX10.
1219//===----------------------------------------------------------------------===//
1220
1221class Select_gfx10<string opName> : SIMCInstr<opName, SIEncodingFamily.GFX10> {
1222 Predicate AssemblerPredicate = isGFX10Plus;
1223 string DecoderNamespace = "GFX10";
Valery Pykhtina34fb492016-08-30 15:20:31 +00001224}
1225
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +00001226multiclass SOP1_Real_gfx10<bits<8> op> {
1227 def _gfx10 : SOP1_Real<op, !cast<SOP1_Pseudo>(NAME)>,
1228 Select_gfx10<!cast<SOP1_Pseudo>(NAME).Mnemonic>;
1229}
Valery Pykhtina34fb492016-08-30 15:20:31 +00001230
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +00001231defm S_ANDN1_SAVEEXEC_B64 : SOP1_Real_gfx10<0x037>;
1232defm S_ORN1_SAVEEXEC_B64 : SOP1_Real_gfx10<0x038>;
1233defm S_ANDN1_WREXEC_B64 : SOP1_Real_gfx10<0x039>;
1234defm S_ANDN2_WREXEC_B64 : SOP1_Real_gfx10<0x03a>;
1235defm S_BITREPLICATE_B64_B32 : SOP1_Real_gfx10<0x03b>;
Stanislav Mekhanoshin8bcc9bb2019-06-13 19:18:29 +00001236defm S_AND_SAVEEXEC_B32 : SOP1_Real_gfx10<0x03c>;
1237defm S_OR_SAVEEXEC_B32 : SOP1_Real_gfx10<0x03d>;
1238defm S_XOR_SAVEEXEC_B32 : SOP1_Real_gfx10<0x03e>;
1239defm S_ANDN2_SAVEEXEC_B32 : SOP1_Real_gfx10<0x03f>;
1240defm S_ORN2_SAVEEXEC_B32 : SOP1_Real_gfx10<0x040>;
1241defm S_NAND_SAVEEXEC_B32 : SOP1_Real_gfx10<0x041>;
1242defm S_NOR_SAVEEXEC_B32 : SOP1_Real_gfx10<0x042>;
1243defm S_XNOR_SAVEEXEC_B32 : SOP1_Real_gfx10<0x043>;
1244defm S_ANDN1_SAVEEXEC_B32 : SOP1_Real_gfx10<0x044>;
1245defm S_ORN1_SAVEEXEC_B32 : SOP1_Real_gfx10<0x045>;
1246defm S_ANDN1_WREXEC_B32 : SOP1_Real_gfx10<0x046>;
1247defm S_ANDN2_WREXEC_B32 : SOP1_Real_gfx10<0x047>;
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +00001248defm S_MOVRELSD_2_B32 : SOP1_Real_gfx10<0x049>;
Valery Pykhtina34fb492016-08-30 15:20:31 +00001249
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +00001250//===----------------------------------------------------------------------===//
1251// SOP1 - GFX6, GFX7.
1252//===----------------------------------------------------------------------===//
Valery Pykhtina34fb492016-08-30 15:20:31 +00001253
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +00001254class Select_gfx6_gfx7<string opName> : SIMCInstr<opName, SIEncodingFamily.SI> {
1255 Predicate AssemblerPredicate = isGFX6GFX7;
1256 string DecoderNamespace = "GFX6GFX7";
1257}
Valery Pykhtina34fb492016-08-30 15:20:31 +00001258
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +00001259multiclass SOP1_Real_gfx6_gfx7<bits<8> op> {
1260 def _gfx6_gfx7 : SOP1_Real<op, !cast<SOP1_Pseudo>(NAME)>,
1261 Select_gfx6_gfx7<!cast<SOP1_Pseudo>(NAME).Mnemonic>;
1262}
Valery Pykhtina34fb492016-08-30 15:20:31 +00001263
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +00001264multiclass SOP1_Real_gfx6_gfx7_gfx10<bits<8> op> :
1265 SOP1_Real_gfx6_gfx7<op>, SOP1_Real_gfx10<op>;
Valery Pykhtina34fb492016-08-30 15:20:31 +00001266
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +00001267defm S_CBRANCH_JOIN : SOP1_Real_gfx6_gfx7<0x032>;
1268defm S_MOV_REGRD_B32 : SOP1_Real_gfx6_gfx7<0x033>;
1269
1270defm S_MOV_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x003>;
1271defm S_MOV_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x004>;
1272defm S_CMOV_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x005>;
1273defm S_CMOV_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x006>;
1274defm S_NOT_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x007>;
1275defm S_NOT_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x008>;
1276defm S_WQM_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x009>;
1277defm S_WQM_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x00a>;
1278defm S_BREV_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x00b>;
1279defm S_BREV_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x00c>;
1280defm S_BCNT0_I32_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x00d>;
1281defm S_BCNT0_I32_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x00e>;
1282defm S_BCNT1_I32_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x00f>;
1283defm S_BCNT1_I32_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x010>;
1284defm S_FF0_I32_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x011>;
1285defm S_FF0_I32_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x012>;
1286defm S_FF1_I32_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x013>;
1287defm S_FF1_I32_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x014>;
1288defm S_FLBIT_I32_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x015>;
1289defm S_FLBIT_I32_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x016>;
1290defm S_FLBIT_I32 : SOP1_Real_gfx6_gfx7_gfx10<0x017>;
1291defm S_FLBIT_I32_I64 : SOP1_Real_gfx6_gfx7_gfx10<0x018>;
1292defm S_SEXT_I32_I8 : SOP1_Real_gfx6_gfx7_gfx10<0x019>;
1293defm S_SEXT_I32_I16 : SOP1_Real_gfx6_gfx7_gfx10<0x01a>;
1294defm S_BITSET0_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x01b>;
1295defm S_BITSET0_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x01c>;
1296defm S_BITSET1_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x01d>;
1297defm S_BITSET1_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x01e>;
1298defm S_GETPC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x01f>;
1299defm S_SETPC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x020>;
1300defm S_SWAPPC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x021>;
1301defm S_RFE_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x022>;
1302defm S_AND_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x024>;
1303defm S_OR_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x025>;
1304defm S_XOR_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x026>;
1305defm S_ANDN2_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x027>;
1306defm S_ORN2_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x028>;
1307defm S_NAND_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x029>;
1308defm S_NOR_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x02a>;
1309defm S_XNOR_SAVEEXEC_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x02b>;
1310defm S_QUADMASK_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x02c>;
1311defm S_QUADMASK_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x02d>;
1312defm S_MOVRELS_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x02e>;
1313defm S_MOVRELS_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x02f>;
1314defm S_MOVRELD_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x030>;
1315defm S_MOVRELD_B64 : SOP1_Real_gfx6_gfx7_gfx10<0x031>;
1316defm S_ABS_I32 : SOP1_Real_gfx6_gfx7_gfx10<0x034>;
1317defm S_MOV_FED_B32 : SOP1_Real_gfx6_gfx7_gfx10<0x035>;
1318
1319//===----------------------------------------------------------------------===//
1320// SOP2 - GFX10.
1321//===----------------------------------------------------------------------===//
1322
1323multiclass SOP2_Real_gfx10<bits<7> op> {
1324 def _gfx10 : SOP2_Real<op, !cast<SOP2_Pseudo>(NAME)>,
1325 Select_gfx10<!cast<SOP2_Pseudo>(NAME).Mnemonic>;
1326}
1327
1328defm S_LSHL1_ADD_U32 : SOP2_Real_gfx10<0x02e>;
1329defm S_LSHL2_ADD_U32 : SOP2_Real_gfx10<0x02f>;
1330defm S_LSHL3_ADD_U32 : SOP2_Real_gfx10<0x030>;
1331defm S_LSHL4_ADD_U32 : SOP2_Real_gfx10<0x031>;
1332defm S_PACK_LL_B32_B16 : SOP2_Real_gfx10<0x032>;
1333defm S_PACK_LH_B32_B16 : SOP2_Real_gfx10<0x033>;
1334defm S_PACK_HH_B32_B16 : SOP2_Real_gfx10<0x034>;
1335defm S_MUL_HI_U32 : SOP2_Real_gfx10<0x035>;
1336defm S_MUL_HI_I32 : SOP2_Real_gfx10<0x036>;
1337
1338//===----------------------------------------------------------------------===//
1339// SOP2 - GFX6, GFX7.
1340//===----------------------------------------------------------------------===//
1341
1342multiclass SOP2_Real_gfx6_gfx7<bits<7> op> {
1343 def _gfx6_gfx7 : SOP2_Real<op, !cast<SOP_Pseudo>(NAME)>,
1344 Select_gfx6_gfx7<!cast<SOP_Pseudo>(NAME).Mnemonic>;
1345}
1346
1347multiclass SOP2_Real_gfx6_gfx7_gfx10<bits<7> op> :
1348 SOP2_Real_gfx6_gfx7<op>, SOP2_Real_gfx10<op>;
1349
1350defm S_CBRANCH_G_FORK : SOP2_Real_gfx6_gfx7<0x02b>;
1351
1352defm S_ADD_U32 : SOP2_Real_gfx6_gfx7_gfx10<0x000>;
1353defm S_SUB_U32 : SOP2_Real_gfx6_gfx7_gfx10<0x001>;
1354defm S_ADD_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x002>;
1355defm S_SUB_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x003>;
1356defm S_ADDC_U32 : SOP2_Real_gfx6_gfx7_gfx10<0x004>;
1357defm S_SUBB_U32 : SOP2_Real_gfx6_gfx7_gfx10<0x005>;
1358defm S_MIN_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x006>;
1359defm S_MIN_U32 : SOP2_Real_gfx6_gfx7_gfx10<0x007>;
1360defm S_MAX_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x008>;
1361defm S_MAX_U32 : SOP2_Real_gfx6_gfx7_gfx10<0x009>;
1362defm S_CSELECT_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x00a>;
1363defm S_CSELECT_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x00b>;
1364defm S_AND_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x00e>;
1365defm S_AND_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x00f>;
1366defm S_OR_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x010>;
1367defm S_OR_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x011>;
1368defm S_XOR_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x012>;
1369defm S_XOR_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x013>;
1370defm S_ANDN2_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x014>;
1371defm S_ANDN2_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x015>;
1372defm S_ORN2_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x016>;
1373defm S_ORN2_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x017>;
1374defm S_NAND_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x018>;
1375defm S_NAND_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x019>;
1376defm S_NOR_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x01a>;
1377defm S_NOR_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x01b>;
1378defm S_XNOR_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x01c>;
1379defm S_XNOR_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x01d>;
1380defm S_LSHL_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x01e>;
1381defm S_LSHL_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x01f>;
1382defm S_LSHR_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x020>;
1383defm S_LSHR_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x021>;
1384defm S_ASHR_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x022>;
1385defm S_ASHR_I64 : SOP2_Real_gfx6_gfx7_gfx10<0x023>;
1386defm S_BFM_B32 : SOP2_Real_gfx6_gfx7_gfx10<0x024>;
1387defm S_BFM_B64 : SOP2_Real_gfx6_gfx7_gfx10<0x025>;
1388defm S_MUL_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x026>;
1389defm S_BFE_U32 : SOP2_Real_gfx6_gfx7_gfx10<0x027>;
1390defm S_BFE_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x028>;
1391defm S_BFE_U64 : SOP2_Real_gfx6_gfx7_gfx10<0x029>;
1392defm S_BFE_I64 : SOP2_Real_gfx6_gfx7_gfx10<0x02a>;
1393defm S_ABSDIFF_I32 : SOP2_Real_gfx6_gfx7_gfx10<0x02c>;
1394
1395//===----------------------------------------------------------------------===//
1396// SOPK - GFX10.
1397//===----------------------------------------------------------------------===//
1398
1399multiclass SOPK_Real32_gfx10<bits<5> op> {
1400 def _gfx10 : SOPK_Real32<op, !cast<SOPK_Pseudo>(NAME)>,
1401 Select_gfx10<!cast<SOPK_Pseudo>(NAME).Mnemonic>;
1402}
1403
1404multiclass SOPK_Real64_gfx10<bits<5> op> {
1405 def _gfx10 : SOPK_Real64<op, !cast<SOPK_Pseudo>(NAME)>,
1406 Select_gfx10<!cast<SOPK_Pseudo>(NAME).Mnemonic>;
1407}
1408
1409defm S_VERSION : SOPK_Real32_gfx10<0x001>;
1410defm S_CALL_B64 : SOPK_Real32_gfx10<0x016>;
1411defm S_WAITCNT_VSCNT : SOPK_Real32_gfx10<0x017>;
1412defm S_WAITCNT_VMCNT : SOPK_Real32_gfx10<0x018>;
1413defm S_WAITCNT_EXPCNT : SOPK_Real32_gfx10<0x019>;
1414defm S_WAITCNT_LGKMCNT : SOPK_Real32_gfx10<0x01a>;
Stanislav Mekhanoshin8bcc9bb2019-06-13 19:18:29 +00001415defm S_SUBVECTOR_LOOP_BEGIN : SOPK_Real32_gfx10<0x01b>;
1416defm S_SUBVECTOR_LOOP_END : SOPK_Real32_gfx10<0x01c>;
Stanislav Mekhanoshin9d287352019-04-24 20:44:34 +00001417
1418//===----------------------------------------------------------------------===//
1419// SOPK - GFX6, GFX7.
1420//===----------------------------------------------------------------------===//
1421
1422multiclass SOPK_Real32_gfx6_gfx7<bits<5> op> {
1423 def _gfx6_gfx7 : SOPK_Real32<op, !cast<SOPK_Pseudo>(NAME)>,
1424 Select_gfx6_gfx7<!cast<SOPK_Pseudo>(NAME).Mnemonic>;
1425}
1426
1427multiclass SOPK_Real64_gfx6_gfx7<bits<5> op> {
1428 def _gfx6_gfx7 : SOPK_Real64<op, !cast<SOPK_Pseudo>(NAME)>,
1429 Select_gfx6_gfx7<!cast<SOPK_Pseudo>(NAME).Mnemonic>;
1430}
1431
1432multiclass SOPK_Real32_gfx6_gfx7_gfx10<bits<5> op> :
1433 SOPK_Real32_gfx6_gfx7<op>, SOPK_Real32_gfx10<op>;
1434
1435multiclass SOPK_Real64_gfx6_gfx7_gfx10<bits<5> op> :
1436 SOPK_Real64_gfx6_gfx7<op>, SOPK_Real64_gfx10<op>;
1437
1438defm S_CBRANCH_I_FORK : SOPK_Real32_gfx6_gfx7<0x011>;
1439
1440defm S_MOVK_I32 : SOPK_Real32_gfx6_gfx7_gfx10<0x000>;
1441defm S_CMOVK_I32 : SOPK_Real32_gfx6_gfx7_gfx10<0x002>;
1442defm S_CMPK_EQ_I32 : SOPK_Real32_gfx6_gfx7_gfx10<0x003>;
1443defm S_CMPK_LG_I32 : SOPK_Real32_gfx6_gfx7_gfx10<0x004>;
1444defm S_CMPK_GT_I32 : SOPK_Real32_gfx6_gfx7_gfx10<0x005>;
1445defm S_CMPK_GE_I32 : SOPK_Real32_gfx6_gfx7_gfx10<0x006>;
1446defm S_CMPK_LT_I32 : SOPK_Real32_gfx6_gfx7_gfx10<0x007>;
1447defm S_CMPK_LE_I32 : SOPK_Real32_gfx6_gfx7_gfx10<0x008>;
1448defm S_CMPK_EQ_U32 : SOPK_Real32_gfx6_gfx7_gfx10<0x009>;
1449defm S_CMPK_LG_U32 : SOPK_Real32_gfx6_gfx7_gfx10<0x00a>;
1450defm S_CMPK_GT_U32 : SOPK_Real32_gfx6_gfx7_gfx10<0x00b>;
1451defm S_CMPK_GE_U32 : SOPK_Real32_gfx6_gfx7_gfx10<0x00c>;
1452defm S_CMPK_LT_U32 : SOPK_Real32_gfx6_gfx7_gfx10<0x00d>;
1453defm S_CMPK_LE_U32 : SOPK_Real32_gfx6_gfx7_gfx10<0x00e>;
1454defm S_ADDK_I32 : SOPK_Real32_gfx6_gfx7_gfx10<0x00f>;
1455defm S_MULK_I32 : SOPK_Real32_gfx6_gfx7_gfx10<0x010>;
1456defm S_GETREG_B32 : SOPK_Real32_gfx6_gfx7_gfx10<0x012>;
1457defm S_SETREG_B32 : SOPK_Real32_gfx6_gfx7_gfx10<0x013>;
1458defm S_SETREG_IMM32_B32 : SOPK_Real64_gfx6_gfx7_gfx10<0x015>;
1459
1460//===----------------------------------------------------------------------===//
1461// GFX8, GFX9 (VI).
1462//===----------------------------------------------------------------------===//
Valery Pykhtina34fb492016-08-30 15:20:31 +00001463
1464class Select_vi<string opName> :
1465 SIMCInstr<opName, SIEncodingFamily.VI> {
Stanislav Mekhanoshin51823022019-04-06 09:20:48 +00001466 list<Predicate> AssemblerPredicates = [isGFX8GFX9];
1467 string DecoderNamespace = "GFX8";
Valery Pykhtina34fb492016-08-30 15:20:31 +00001468}
1469
1470class SOP1_Real_vi<bits<8> op, SOP1_Pseudo ps> :
1471 SOP1_Real<op, ps>,
1472 Select_vi<ps.Mnemonic>;
1473
1474
1475class SOP2_Real_vi<bits<7> op, SOP2_Pseudo ps> :
1476 SOP2_Real<op, ps>,
1477 Select_vi<ps.Mnemonic>;
1478
1479class SOPK_Real_vi<bits<5> op, SOPK_Pseudo ps> :
1480 SOPK_Real32<op, ps>,
1481 Select_vi<ps.Mnemonic>;
1482
1483def S_MOV_B32_vi : SOP1_Real_vi <0x00, S_MOV_B32>;
1484def S_MOV_B64_vi : SOP1_Real_vi <0x01, S_MOV_B64>;
1485def S_CMOV_B32_vi : SOP1_Real_vi <0x02, S_CMOV_B32>;
1486def S_CMOV_B64_vi : SOP1_Real_vi <0x03, S_CMOV_B64>;
1487def S_NOT_B32_vi : SOP1_Real_vi <0x04, S_NOT_B32>;
1488def S_NOT_B64_vi : SOP1_Real_vi <0x05, S_NOT_B64>;
1489def S_WQM_B32_vi : SOP1_Real_vi <0x06, S_WQM_B32>;
1490def S_WQM_B64_vi : SOP1_Real_vi <0x07, S_WQM_B64>;
1491def S_BREV_B32_vi : SOP1_Real_vi <0x08, S_BREV_B32>;
1492def S_BREV_B64_vi : SOP1_Real_vi <0x09, S_BREV_B64>;
1493def S_BCNT0_I32_B32_vi : SOP1_Real_vi <0x0a, S_BCNT0_I32_B32>;
1494def S_BCNT0_I32_B64_vi : SOP1_Real_vi <0x0b, S_BCNT0_I32_B64>;
1495def S_BCNT1_I32_B32_vi : SOP1_Real_vi <0x0c, S_BCNT1_I32_B32>;
1496def S_BCNT1_I32_B64_vi : SOP1_Real_vi <0x0d, S_BCNT1_I32_B64>;
1497def S_FF0_I32_B32_vi : SOP1_Real_vi <0x0e, S_FF0_I32_B32>;
1498def S_FF0_I32_B64_vi : SOP1_Real_vi <0x0f, S_FF0_I32_B64>;
1499def S_FF1_I32_B32_vi : SOP1_Real_vi <0x10, S_FF1_I32_B32>;
1500def S_FF1_I32_B64_vi : SOP1_Real_vi <0x11, S_FF1_I32_B64>;
1501def S_FLBIT_I32_B32_vi : SOP1_Real_vi <0x12, S_FLBIT_I32_B32>;
1502def S_FLBIT_I32_B64_vi : SOP1_Real_vi <0x13, S_FLBIT_I32_B64>;
1503def S_FLBIT_I32_vi : SOP1_Real_vi <0x14, S_FLBIT_I32>;
1504def S_FLBIT_I32_I64_vi : SOP1_Real_vi <0x15, S_FLBIT_I32_I64>;
1505def S_SEXT_I32_I8_vi : SOP1_Real_vi <0x16, S_SEXT_I32_I8>;
1506def S_SEXT_I32_I16_vi : SOP1_Real_vi <0x17, S_SEXT_I32_I16>;
1507def S_BITSET0_B32_vi : SOP1_Real_vi <0x18, S_BITSET0_B32>;
1508def S_BITSET0_B64_vi : SOP1_Real_vi <0x19, S_BITSET0_B64>;
1509def S_BITSET1_B32_vi : SOP1_Real_vi <0x1a, S_BITSET1_B32>;
1510def S_BITSET1_B64_vi : SOP1_Real_vi <0x1b, S_BITSET1_B64>;
1511def S_GETPC_B64_vi : SOP1_Real_vi <0x1c, S_GETPC_B64>;
1512def S_SETPC_B64_vi : SOP1_Real_vi <0x1d, S_SETPC_B64>;
1513def S_SWAPPC_B64_vi : SOP1_Real_vi <0x1e, S_SWAPPC_B64>;
1514def S_RFE_B64_vi : SOP1_Real_vi <0x1f, S_RFE_B64>;
1515def S_AND_SAVEEXEC_B64_vi : SOP1_Real_vi <0x20, S_AND_SAVEEXEC_B64>;
1516def S_OR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x21, S_OR_SAVEEXEC_B64>;
1517def S_XOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x22, S_XOR_SAVEEXEC_B64>;
1518def S_ANDN2_SAVEEXEC_B64_vi: SOP1_Real_vi <0x23, S_ANDN2_SAVEEXEC_B64>;
1519def S_ORN2_SAVEEXEC_B64_vi : SOP1_Real_vi <0x24, S_ORN2_SAVEEXEC_B64>;
1520def S_NAND_SAVEEXEC_B64_vi : SOP1_Real_vi <0x25, S_NAND_SAVEEXEC_B64>;
1521def S_NOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x26, S_NOR_SAVEEXEC_B64>;
1522def S_XNOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x27, S_XNOR_SAVEEXEC_B64>;
1523def S_QUADMASK_B32_vi : SOP1_Real_vi <0x28, S_QUADMASK_B32>;
1524def S_QUADMASK_B64_vi : SOP1_Real_vi <0x29, S_QUADMASK_B64>;
1525def S_MOVRELS_B32_vi : SOP1_Real_vi <0x2a, S_MOVRELS_B32>;
1526def S_MOVRELS_B64_vi : SOP1_Real_vi <0x2b, S_MOVRELS_B64>;
1527def S_MOVRELD_B32_vi : SOP1_Real_vi <0x2c, S_MOVRELD_B32>;
1528def S_MOVRELD_B64_vi : SOP1_Real_vi <0x2d, S_MOVRELD_B64>;
1529def S_CBRANCH_JOIN_vi : SOP1_Real_vi <0x2e, S_CBRANCH_JOIN>;
1530def S_MOV_REGRD_B32_vi : SOP1_Real_vi <0x2f, S_MOV_REGRD_B32>;
1531def S_ABS_I32_vi : SOP1_Real_vi <0x30, S_ABS_I32>;
1532def S_MOV_FED_B32_vi : SOP1_Real_vi <0x31, S_MOV_FED_B32>;
Matt Arsenaultcc88ce32016-10-12 18:00:51 +00001533def S_SET_GPR_IDX_IDX_vi : SOP1_Real_vi <0x32, S_SET_GPR_IDX_IDX>;
Valery Pykhtina34fb492016-08-30 15:20:31 +00001534
1535def S_ADD_U32_vi : SOP2_Real_vi <0x00, S_ADD_U32>;
1536def S_ADD_I32_vi : SOP2_Real_vi <0x02, S_ADD_I32>;
1537def S_SUB_U32_vi : SOP2_Real_vi <0x01, S_SUB_U32>;
1538def S_SUB_I32_vi : SOP2_Real_vi <0x03, S_SUB_I32>;
1539def S_ADDC_U32_vi : SOP2_Real_vi <0x04, S_ADDC_U32>;
1540def S_SUBB_U32_vi : SOP2_Real_vi <0x05, S_SUBB_U32>;
1541def S_MIN_I32_vi : SOP2_Real_vi <0x06, S_MIN_I32>;
1542def S_MIN_U32_vi : SOP2_Real_vi <0x07, S_MIN_U32>;
1543def S_MAX_I32_vi : SOP2_Real_vi <0x08, S_MAX_I32>;
1544def S_MAX_U32_vi : SOP2_Real_vi <0x09, S_MAX_U32>;
1545def S_CSELECT_B32_vi : SOP2_Real_vi <0x0a, S_CSELECT_B32>;
1546def S_CSELECT_B64_vi : SOP2_Real_vi <0x0b, S_CSELECT_B64>;
1547def S_AND_B32_vi : SOP2_Real_vi <0x0c, S_AND_B32>;
1548def S_AND_B64_vi : SOP2_Real_vi <0x0d, S_AND_B64>;
1549def S_OR_B32_vi : SOP2_Real_vi <0x0e, S_OR_B32>;
1550def S_OR_B64_vi : SOP2_Real_vi <0x0f, S_OR_B64>;
1551def S_XOR_B32_vi : SOP2_Real_vi <0x10, S_XOR_B32>;
1552def S_XOR_B64_vi : SOP2_Real_vi <0x11, S_XOR_B64>;
1553def S_ANDN2_B32_vi : SOP2_Real_vi <0x12, S_ANDN2_B32>;
1554def S_ANDN2_B64_vi : SOP2_Real_vi <0x13, S_ANDN2_B64>;
1555def S_ORN2_B32_vi : SOP2_Real_vi <0x14, S_ORN2_B32>;
1556def S_ORN2_B64_vi : SOP2_Real_vi <0x15, S_ORN2_B64>;
1557def S_NAND_B32_vi : SOP2_Real_vi <0x16, S_NAND_B32>;
1558def S_NAND_B64_vi : SOP2_Real_vi <0x17, S_NAND_B64>;
1559def S_NOR_B32_vi : SOP2_Real_vi <0x18, S_NOR_B32>;
1560def S_NOR_B64_vi : SOP2_Real_vi <0x19, S_NOR_B64>;
1561def S_XNOR_B32_vi : SOP2_Real_vi <0x1a, S_XNOR_B32>;
1562def S_XNOR_B64_vi : SOP2_Real_vi <0x1b, S_XNOR_B64>;
1563def S_LSHL_B32_vi : SOP2_Real_vi <0x1c, S_LSHL_B32>;
1564def S_LSHL_B64_vi : SOP2_Real_vi <0x1d, S_LSHL_B64>;
1565def S_LSHR_B32_vi : SOP2_Real_vi <0x1e, S_LSHR_B32>;
1566def S_LSHR_B64_vi : SOP2_Real_vi <0x1f, S_LSHR_B64>;
1567def S_ASHR_I32_vi : SOP2_Real_vi <0x20, S_ASHR_I32>;
1568def S_ASHR_I64_vi : SOP2_Real_vi <0x21, S_ASHR_I64>;
1569def S_BFM_B32_vi : SOP2_Real_vi <0x22, S_BFM_B32>;
1570def S_BFM_B64_vi : SOP2_Real_vi <0x23, S_BFM_B64>;
1571def S_MUL_I32_vi : SOP2_Real_vi <0x24, S_MUL_I32>;
1572def S_BFE_U32_vi : SOP2_Real_vi <0x25, S_BFE_U32>;
1573def S_BFE_I32_vi : SOP2_Real_vi <0x26, S_BFE_I32>;
1574def S_BFE_U64_vi : SOP2_Real_vi <0x27, S_BFE_U64>;
1575def S_BFE_I64_vi : SOP2_Real_vi <0x28, S_BFE_I64>;
1576def S_CBRANCH_G_FORK_vi : SOP2_Real_vi <0x29, S_CBRANCH_G_FORK>;
1577def S_ABSDIFF_I32_vi : SOP2_Real_vi <0x2a, S_ABSDIFF_I32>;
Matt Arsenault9be7b0d2017-02-27 18:49:11 +00001578def S_PACK_LL_B32_B16_vi : SOP2_Real_vi <0x32, S_PACK_LL_B32_B16>;
1579def S_PACK_LH_B32_B16_vi : SOP2_Real_vi <0x33, S_PACK_LH_B32_B16>;
1580def S_PACK_HH_B32_B16_vi : SOP2_Real_vi <0x34, S_PACK_HH_B32_B16>;
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +00001581def S_RFE_RESTORE_B64_vi : SOP2_Real_vi <0x2b, S_RFE_RESTORE_B64>;
Valery Pykhtina34fb492016-08-30 15:20:31 +00001582
1583def S_MOVK_I32_vi : SOPK_Real_vi <0x00, S_MOVK_I32>;
1584def S_CMOVK_I32_vi : SOPK_Real_vi <0x01, S_CMOVK_I32>;
1585def S_CMPK_EQ_I32_vi : SOPK_Real_vi <0x02, S_CMPK_EQ_I32>;
1586def S_CMPK_LG_I32_vi : SOPK_Real_vi <0x03, S_CMPK_LG_I32>;
1587def S_CMPK_GT_I32_vi : SOPK_Real_vi <0x04, S_CMPK_GT_I32>;
1588def S_CMPK_GE_I32_vi : SOPK_Real_vi <0x05, S_CMPK_GE_I32>;
1589def S_CMPK_LT_I32_vi : SOPK_Real_vi <0x06, S_CMPK_LT_I32>;
1590def S_CMPK_LE_I32_vi : SOPK_Real_vi <0x07, S_CMPK_LE_I32>;
1591def S_CMPK_EQ_U32_vi : SOPK_Real_vi <0x08, S_CMPK_EQ_U32>;
1592def S_CMPK_LG_U32_vi : SOPK_Real_vi <0x09, S_CMPK_LG_U32>;
1593def S_CMPK_GT_U32_vi : SOPK_Real_vi <0x0A, S_CMPK_GT_U32>;
1594def S_CMPK_GE_U32_vi : SOPK_Real_vi <0x0B, S_CMPK_GE_U32>;
1595def S_CMPK_LT_U32_vi : SOPK_Real_vi <0x0C, S_CMPK_LT_U32>;
1596def S_CMPK_LE_U32_vi : SOPK_Real_vi <0x0D, S_CMPK_LE_U32>;
1597def S_ADDK_I32_vi : SOPK_Real_vi <0x0E, S_ADDK_I32>;
1598def S_MULK_I32_vi : SOPK_Real_vi <0x0F, S_MULK_I32>;
1599def S_CBRANCH_I_FORK_vi : SOPK_Real_vi <0x10, S_CBRANCH_I_FORK>;
1600def S_GETREG_B32_vi : SOPK_Real_vi <0x11, S_GETREG_B32>;
1601def S_SETREG_B32_vi : SOPK_Real_vi <0x12, S_SETREG_B32>;
1602//def S_GETREG_REGRD_B32_vi : SOPK_Real_vi <0x13, S_GETREG_REGRD_B32>; // see pseudo for comments
1603def S_SETREG_IMM32_B32_vi : SOPK_Real64<0x14, S_SETREG_IMM32_B32>,
Tom Stellard2add8a12016-09-06 20:00:26 +00001604 Select_vi<S_SETREG_IMM32_B32.Mnemonic>;
Dmitry Preobrazhenskyf20aff52018-04-06 16:35:11 +00001605
Dmitry Preobrazhenskyae312232018-04-06 18:24:49 +00001606def S_CALL_B64_vi : SOPK_Real_vi <0x15, S_CALL_B64>;
1607
Dmitry Preobrazhenskyf20aff52018-04-06 16:35:11 +00001608//===----------------------------------------------------------------------===//
1609// SOP1 - GFX9.
1610//===----------------------------------------------------------------------===//
1611
1612def S_ANDN1_SAVEEXEC_B64_vi : SOP1_Real_vi<0x33, S_ANDN1_SAVEEXEC_B64>;
1613def S_ORN1_SAVEEXEC_B64_vi : SOP1_Real_vi<0x34, S_ORN1_SAVEEXEC_B64>;
1614def S_ANDN1_WREXEC_B64_vi : SOP1_Real_vi<0x35, S_ANDN1_WREXEC_B64>;
1615def S_ANDN2_WREXEC_B64_vi : SOP1_Real_vi<0x36, S_ANDN2_WREXEC_B64>;
1616def S_BITREPLICATE_B64_B32_vi : SOP1_Real_vi<0x37, S_BITREPLICATE_B64_B32>;
Dmitry Preobrazhensky2f8e1462018-04-09 13:10:33 +00001617
1618//===----------------------------------------------------------------------===//
1619// SOP2 - GFX9.
1620//===----------------------------------------------------------------------===//
1621
1622def S_LSHL1_ADD_U32_vi : SOP2_Real_vi<0x2e, S_LSHL1_ADD_U32>;
1623def S_LSHL2_ADD_U32_vi : SOP2_Real_vi<0x2f, S_LSHL2_ADD_U32>;
1624def S_LSHL3_ADD_U32_vi : SOP2_Real_vi<0x30, S_LSHL3_ADD_U32>;
1625def S_LSHL4_ADD_U32_vi : SOP2_Real_vi<0x31, S_LSHL4_ADD_U32>;
1626def S_MUL_HI_U32_vi : SOP2_Real_vi<0x2c, S_MUL_HI_U32>;
1627def S_MUL_HI_I32_vi : SOP2_Real_vi<0x2d, S_MUL_HI_I32>;