blob: ee72d28dd6c30edb90b9750221ad601cfb2ab48a [file] [log] [blame]
Valery Pykhtina34fb492016-08-30 15:20:31 +00001//===-- SOPInstructions.td - SOP Instruction Defintions -------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
Matt Arsenaultcc88ce32016-10-12 18:00:51 +000010def GPRIdxModeMatchClass : AsmOperandClass {
11 let Name = "GPRIdxMode";
12 let PredicateMethod = "isGPRIdxMode";
13 let RenderMethod = "addImmOperands";
14}
15
16def GPRIdxMode : Operand<i32> {
17 let PrintMethod = "printVGPRIndexMode";
18 let ParserMatchClass = GPRIdxModeMatchClass;
19 let OperandType = "OPERAND_IMMEDIATE";
20}
21
Nicolai Haehnle4f850ea2018-03-26 13:56:53 +000022class SOP_Pseudo<string opName, dag outs, dag ins, string asmOps,
23 list<dag> pattern=[]> :
24 InstSI<outs, ins, "", pattern>,
25 SIMCInstr<opName, SIEncodingFamily.NONE> {
26
27 let isPseudo = 1;
28 let isCodeGenOnly = 1;
29 let SubtargetPredicate = isGCN;
30
31 string Mnemonic = opName;
32 string AsmOperands = asmOps;
33
34 bits<1> has_sdst = 0;
35}
36
Valery Pykhtina34fb492016-08-30 15:20:31 +000037//===----------------------------------------------------------------------===//
38// SOP1 Instructions
39//===----------------------------------------------------------------------===//
40
41class SOP1_Pseudo <string opName, dag outs, dag ins,
42 string asmOps, list<dag> pattern=[]> :
Nicolai Haehnle4f850ea2018-03-26 13:56:53 +000043 SOP_Pseudo<opName, outs, ins, asmOps, pattern> {
Valery Pykhtina34fb492016-08-30 15:20:31 +000044
45 let mayLoad = 0;
46 let mayStore = 0;
47 let hasSideEffects = 0;
48 let SALU = 1;
49 let SOP1 = 1;
50 let SchedRW = [WriteSALU];
Matt Arsenault6bc43d82016-10-06 16:20:41 +000051 let Size = 4;
Tom Stellard2add8a12016-09-06 20:00:26 +000052 let UseNamedOperandTable = 1;
Valery Pykhtina34fb492016-08-30 15:20:31 +000053
Valery Pykhtina34fb492016-08-30 15:20:31 +000054 bits<1> has_src0 = 1;
55 bits<1> has_sdst = 1;
56}
57
58class SOP1_Real<bits<8> op, SOP1_Pseudo ps> :
59 InstSI <ps.OutOperandList, ps.InOperandList,
60 ps.Mnemonic # " " # ps.AsmOperands, []>,
61 Enc32 {
62
63 let isPseudo = 0;
64 let isCodeGenOnly = 0;
Matt Arsenault6bc43d82016-10-06 16:20:41 +000065 let Size = 4;
Valery Pykhtina34fb492016-08-30 15:20:31 +000066
67 // copy relevant pseudo op flags
68 let SubtargetPredicate = ps.SubtargetPredicate;
69 let AsmMatchConverter = ps.AsmMatchConverter;
70
71 // encoding
72 bits<7> sdst;
73 bits<8> src0;
74
75 let Inst{7-0} = !if(ps.has_src0, src0, ?);
76 let Inst{15-8} = op;
77 let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
78 let Inst{31-23} = 0x17d; //encoding;
79}
80
81class SOP1_32 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +000082 opName, (outs SReg_32:$sdst), (ins SSrc_b32:$src0),
Valery Pykhtina34fb492016-08-30 15:20:31 +000083 "$sdst, $src0", pattern
84>;
85
Matt Arsenaultcc88ce32016-10-12 18:00:51 +000086// 32-bit input, no output.
87class SOP1_0_32 <string opName, list<dag> pattern = []> : SOP1_Pseudo <
88 opName, (outs), (ins SSrc_b32:$src0),
89 "$src0", pattern> {
90 let has_sdst = 0;
91}
92
Dmitry Preobrazhensky12194e92017-04-12 12:40:19 +000093class SOP1_0_32R <string opName, list<dag> pattern = []> : SOP1_Pseudo <
94 opName, (outs), (ins SReg_32:$src0),
95 "$src0", pattern> {
96 let has_sdst = 0;
97}
98
Valery Pykhtina34fb492016-08-30 15:20:31 +000099class SOP1_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000100 opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000101 "$sdst, $src0", pattern
102>;
103
104// 64-bit input, 32-bit output.
105class SOP1_32_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000106 opName, (outs SReg_32:$sdst), (ins SSrc_b64:$src0),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000107 "$sdst, $src0", pattern
108>;
109
110// 32-bit input, 64-bit output.
111class SOP1_64_32 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000112 opName, (outs SReg_64:$sdst), (ins SSrc_b32:$src0),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000113 "$sdst, $src0", pattern
114>;
115
116// no input, 64-bit output.
117class SOP1_64_0 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
118 opName, (outs SReg_64:$sdst), (ins), "$sdst", pattern> {
119 let has_src0 = 0;
120}
121
122// 64-bit input, no output
123class SOP1_1 <string opName, list<dag> pattern=[]> : SOP1_Pseudo <
124 opName, (outs), (ins SReg_64:$src0), "$src0", pattern> {
125 let has_sdst = 0;
126}
127
128
129let isMoveImm = 1 in {
130 let isReMaterializable = 1, isAsCheapAsAMove = 1 in {
131 def S_MOV_B32 : SOP1_32 <"s_mov_b32">;
132 def S_MOV_B64 : SOP1_64 <"s_mov_b64">;
133 } // End isRematerializeable = 1
134
135 let Uses = [SCC] in {
136 def S_CMOV_B32 : SOP1_32 <"s_cmov_b32">;
137 def S_CMOV_B64 : SOP1_64 <"s_cmov_b64">;
138 } // End Uses = [SCC]
139} // End isMoveImm = 1
140
141let Defs = [SCC] in {
142 def S_NOT_B32 : SOP1_32 <"s_not_b32",
143 [(set i32:$sdst, (not i32:$src0))]
144 >;
145
146 def S_NOT_B64 : SOP1_64 <"s_not_b64",
147 [(set i64:$sdst, (not i64:$src0))]
148 >;
149 def S_WQM_B32 : SOP1_32 <"s_wqm_b32">;
Marek Olsak2114fc32017-10-24 10:26:59 +0000150 def S_WQM_B64 : SOP1_64 <"s_wqm_b64",
151 [(set i1:$sdst, (int_amdgcn_wqm_vote i1:$src0))]
152 >;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000153} // End Defs = [SCC]
154
155
156def S_BREV_B32 : SOP1_32 <"s_brev_b32",
157 [(set i32:$sdst, (bitreverse i32:$src0))]
158>;
159def S_BREV_B64 : SOP1_64 <"s_brev_b64">;
160
161let Defs = [SCC] in {
162def S_BCNT0_I32_B32 : SOP1_32 <"s_bcnt0_i32_b32">;
163def S_BCNT0_I32_B64 : SOP1_32_64 <"s_bcnt0_i32_b64">;
164def S_BCNT1_I32_B32 : SOP1_32 <"s_bcnt1_i32_b32",
165 [(set i32:$sdst, (ctpop i32:$src0))]
166>;
167def S_BCNT1_I32_B64 : SOP1_32_64 <"s_bcnt1_i32_b64">;
168} // End Defs = [SCC]
169
170def S_FF0_I32_B32 : SOP1_32 <"s_ff0_i32_b32">;
171def S_FF0_I32_B64 : SOP1_32_64 <"s_ff0_i32_b64">;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000172def S_FF1_I32_B64 : SOP1_32_64 <"s_ff1_i32_b64">;
173
Wei Ding5676aca2017-10-12 19:37:14 +0000174def S_FF1_I32_B32 : SOP1_32 <"s_ff1_i32_b32",
175 [(set i32:$sdst, (AMDGPUffbl_b32 i32:$src0))]
176>;
177
Valery Pykhtina34fb492016-08-30 15:20:31 +0000178def S_FLBIT_I32_B32 : SOP1_32 <"s_flbit_i32_b32",
179 [(set i32:$sdst, (AMDGPUffbh_u32 i32:$src0))]
180>;
181
182def S_FLBIT_I32_B64 : SOP1_32_64 <"s_flbit_i32_b64">;
183def S_FLBIT_I32 : SOP1_32 <"s_flbit_i32",
184 [(set i32:$sdst, (AMDGPUffbh_i32 i32:$src0))]
185>;
186def S_FLBIT_I32_I64 : SOP1_32_64 <"s_flbit_i32_i64">;
187def S_SEXT_I32_I8 : SOP1_32 <"s_sext_i32_i8",
188 [(set i32:$sdst, (sext_inreg i32:$src0, i8))]
189>;
190def S_SEXT_I32_I16 : SOP1_32 <"s_sext_i32_i16",
191 [(set i32:$sdst, (sext_inreg i32:$src0, i16))]
192>;
193
194def S_BITSET0_B32 : SOP1_32 <"s_bitset0_b32">;
195def S_BITSET0_B64 : SOP1_64_32 <"s_bitset0_b64">;
196def S_BITSET1_B32 : SOP1_32 <"s_bitset1_b32">;
197def S_BITSET1_B64 : SOP1_64_32 <"s_bitset1_b64">;
Konstantin Zhuravlyovb2ff8df2017-05-26 20:38:26 +0000198def S_GETPC_B64 : SOP1_64_0 <"s_getpc_b64",
199 [(set i64:$sdst, (int_amdgcn_s_getpc))]
200>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000201
Matt Arsenault2b1f9aa2017-05-17 21:56:25 +0000202let isTerminator = 1, isBarrier = 1, SchedRW = [WriteBranch] in {
203
204let isBranch = 1, isIndirectBranch = 1 in {
Valery Pykhtina34fb492016-08-30 15:20:31 +0000205def S_SETPC_B64 : SOP1_1 <"s_setpc_b64">;
Matt Arsenault2b1f9aa2017-05-17 21:56:25 +0000206} // End isBranch = 1, isIndirectBranch = 1
207
208let isReturn = 1 in {
209// Define variant marked as return rather than branch.
210def S_SETPC_B64_return : SOP1_1<"", [(AMDGPUret_flag i64:$src0)]>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000211}
Matt Arsenault2b1f9aa2017-05-17 21:56:25 +0000212} // End isTerminator = 1, isBarrier = 1
213
214let isCall = 1 in {
215def S_SWAPPC_B64 : SOP1_64 <"s_swappc_b64"
216>;
217}
218
Valery Pykhtina34fb492016-08-30 15:20:31 +0000219def S_RFE_B64 : SOP1_1 <"s_rfe_b64">;
220
221let hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC] in {
222
223def S_AND_SAVEEXEC_B64 : SOP1_64 <"s_and_saveexec_b64">;
224def S_OR_SAVEEXEC_B64 : SOP1_64 <"s_or_saveexec_b64">;
225def S_XOR_SAVEEXEC_B64 : SOP1_64 <"s_xor_saveexec_b64">;
226def S_ANDN2_SAVEEXEC_B64 : SOP1_64 <"s_andn2_saveexec_b64">;
227def S_ORN2_SAVEEXEC_B64 : SOP1_64 <"s_orn2_saveexec_b64">;
228def S_NAND_SAVEEXEC_B64 : SOP1_64 <"s_nand_saveexec_b64">;
229def S_NOR_SAVEEXEC_B64 : SOP1_64 <"s_nor_saveexec_b64">;
230def S_XNOR_SAVEEXEC_B64 : SOP1_64 <"s_xnor_saveexec_b64">;
231
232} // End hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC]
233
234def S_QUADMASK_B32 : SOP1_32 <"s_quadmask_b32">;
235def S_QUADMASK_B64 : SOP1_64 <"s_quadmask_b64">;
236
237let Uses = [M0] in {
238def S_MOVRELS_B32 : SOP1_32 <"s_movrels_b32">;
239def S_MOVRELS_B64 : SOP1_64 <"s_movrels_b64">;
240def S_MOVRELD_B32 : SOP1_32 <"s_movreld_b32">;
241def S_MOVRELD_B64 : SOP1_64 <"s_movreld_b64">;
242} // End Uses = [M0]
243
Dmitry Preobrazhensky12194e92017-04-12 12:40:19 +0000244def S_CBRANCH_JOIN : SOP1_0_32R <"s_cbranch_join">;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000245def S_MOV_REGRD_B32 : SOP1_32 <"s_mov_regrd_b32">;
246let Defs = [SCC] in {
247def S_ABS_I32 : SOP1_32 <"s_abs_i32">;
248} // End Defs = [SCC]
249def S_MOV_FED_B32 : SOP1_32 <"s_mov_fed_b32">;
250
Matt Arsenaultcc88ce32016-10-12 18:00:51 +0000251let SubtargetPredicate = HasVGPRIndexMode in {
252def S_SET_GPR_IDX_IDX : SOP1_0_32<"s_set_gpr_idx_idx"> {
253 let Uses = [M0];
254 let Defs = [M0];
255}
256}
Valery Pykhtina34fb492016-08-30 15:20:31 +0000257
Dmitry Preobrazhenskyf20aff52018-04-06 16:35:11 +0000258let SubtargetPredicate = isGFX9 in {
259 let hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] in {
260 def S_ANDN1_SAVEEXEC_B64 : SOP1_64<"s_andn1_saveexec_b64">;
261 def S_ORN1_SAVEEXEC_B64 : SOP1_64<"s_orn1_saveexec_b64">;
262 def S_ANDN1_WREXEC_B64 : SOP1_64<"s_andn1_wrexec_b64">;
263 def S_ANDN2_WREXEC_B64 : SOP1_64<"s_andn2_wrexec_b64">;
264 } // End hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC]
265
266 def S_BITREPLICATE_B64_B32 : SOP1_64_32<"s_bitreplicate_b64_b32">;
267} // End SubtargetPredicate = isGFX9
268
Valery Pykhtina34fb492016-08-30 15:20:31 +0000269//===----------------------------------------------------------------------===//
270// SOP2 Instructions
271//===----------------------------------------------------------------------===//
272
273class SOP2_Pseudo<string opName, dag outs, dag ins,
274 string asmOps, list<dag> pattern=[]> :
Nicolai Haehnle4f850ea2018-03-26 13:56:53 +0000275 SOP_Pseudo<opName, outs, ins, asmOps, pattern> {
276
Valery Pykhtina34fb492016-08-30 15:20:31 +0000277 let mayLoad = 0;
278 let mayStore = 0;
279 let hasSideEffects = 0;
280 let SALU = 1;
281 let SOP2 = 1;
282 let SchedRW = [WriteSALU];
283 let UseNamedOperandTable = 1;
284
Nicolai Haehnle4f850ea2018-03-26 13:56:53 +0000285 let has_sdst = 1;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000286
287 // Pseudo instructions have no encodings, but adding this field here allows
288 // us to do:
289 // let sdst = xxx in {
290 // for multiclasses that include both real and pseudo instructions.
291 // field bits<7> sdst = 0;
292 // let Size = 4; // Do we need size here?
293}
294
Nicolai Haehnle4f850ea2018-03-26 13:56:53 +0000295class SOP2_Real<bits<7> op, SOP_Pseudo ps> :
Valery Pykhtina34fb492016-08-30 15:20:31 +0000296 InstSI <ps.OutOperandList, ps.InOperandList,
297 ps.Mnemonic # " " # ps.AsmOperands, []>,
298 Enc32 {
299 let isPseudo = 0;
300 let isCodeGenOnly = 0;
301
302 // copy relevant pseudo op flags
303 let SubtargetPredicate = ps.SubtargetPredicate;
304 let AsmMatchConverter = ps.AsmMatchConverter;
Dmitry Preobrazhensky61105ba2019-01-18 13:57:43 +0000305 let UseNamedOperandTable = ps.UseNamedOperandTable;
306 let TSFlags = ps.TSFlags;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000307
308 // encoding
309 bits<7> sdst;
310 bits<8> src0;
311 bits<8> src1;
312
313 let Inst{7-0} = src0;
314 let Inst{15-8} = src1;
315 let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
316 let Inst{29-23} = op;
317 let Inst{31-30} = 0x2; // encoding
318}
319
320
321class SOP2_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000322 opName, (outs SReg_32:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000323 "$sdst, $src0, $src1", pattern
324>;
325
326class SOP2_64 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000327 opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b64:$src1),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000328 "$sdst, $src0, $src1", pattern
329>;
330
331class SOP2_64_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000332 opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b32:$src1),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000333 "$sdst, $src0, $src1", pattern
334>;
335
336class SOP2_64_32_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo <
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000337 opName, (outs SReg_64:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000338 "$sdst, $src0, $src1", pattern
339>;
340
Graham Sellers04f7a4d2018-11-29 16:05:38 +0000341class UniformUnaryFrag<SDPatternOperator Op> : PatFrag <
342 (ops node:$src0),
343 (Op $src0),
344 [{ return !N->isDivergent(); }]
345>;
346
Alexander Timofeev36617f012018-09-21 10:31:22 +0000347class UniformBinFrag<SDPatternOperator Op> : PatFrag <
348 (ops node:$src0, node:$src1),
349 (Op $src0, $src1),
350 [{ return !N->isDivergent(); }]
351>;
352
Valery Pykhtina34fb492016-08-30 15:20:31 +0000353let Defs = [SCC] in { // Carry out goes to SCC
354let isCommutable = 1 in {
355def S_ADD_U32 : SOP2_32 <"s_add_u32">;
356def S_ADD_I32 : SOP2_32 <"s_add_i32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000357 [(set i32:$sdst, (UniformBinFrag<add> SSrc_b32:$src0, SSrc_b32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000358>;
359} // End isCommutable = 1
360
361def S_SUB_U32 : SOP2_32 <"s_sub_u32">;
362def S_SUB_I32 : SOP2_32 <"s_sub_i32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000363 [(set i32:$sdst, (UniformBinFrag<sub> SSrc_b32:$src0, SSrc_b32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000364>;
365
366let Uses = [SCC] in { // Carry in comes from SCC
367let isCommutable = 1 in {
368def S_ADDC_U32 : SOP2_32 <"s_addc_u32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000369 [(set i32:$sdst, (UniformBinFrag<adde> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000370} // End isCommutable = 1
371
372def S_SUBB_U32 : SOP2_32 <"s_subb_u32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000373 [(set i32:$sdst, (UniformBinFrag<sube> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000374} // End Uses = [SCC]
375
Matt Arsenault479ba3a2016-09-07 06:25:55 +0000376
377let isCommutable = 1 in {
Valery Pykhtina34fb492016-08-30 15:20:31 +0000378def S_MIN_I32 : SOP2_32 <"s_min_i32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000379 [(set i32:$sdst, (UniformBinFrag<smin> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000380>;
381def S_MIN_U32 : SOP2_32 <"s_min_u32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000382 [(set i32:$sdst, (UniformBinFrag<umin> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000383>;
384def S_MAX_I32 : SOP2_32 <"s_max_i32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000385 [(set i32:$sdst, (UniformBinFrag<smax> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000386>;
387def S_MAX_U32 : SOP2_32 <"s_max_u32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000388 [(set i32:$sdst, (UniformBinFrag<umax> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000389>;
Matt Arsenault479ba3a2016-09-07 06:25:55 +0000390} // End isCommutable = 1
Valery Pykhtina34fb492016-08-30 15:20:31 +0000391} // End Defs = [SCC]
392
393
394let Uses = [SCC] in {
395 def S_CSELECT_B32 : SOP2_32 <"s_cselect_b32">;
396 def S_CSELECT_B64 : SOP2_64 <"s_cselect_b64">;
397} // End Uses = [SCC]
398
399let Defs = [SCC] in {
Matt Arsenault479ba3a2016-09-07 06:25:55 +0000400let isCommutable = 1 in {
Valery Pykhtina34fb492016-08-30 15:20:31 +0000401def S_AND_B32 : SOP2_32 <"s_and_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000402 [(set i32:$sdst, (UniformBinFrag<and> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000403>;
404
405def S_AND_B64 : SOP2_64 <"s_and_b64",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000406 [(set i64:$sdst, (UniformBinFrag<and> i64:$src0, i64:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000407>;
408
409def S_OR_B32 : SOP2_32 <"s_or_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000410 [(set i32:$sdst, (UniformBinFrag<or> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000411>;
412
413def S_OR_B64 : SOP2_64 <"s_or_b64",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000414 [(set i64:$sdst, (UniformBinFrag<or> i64:$src0, i64:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000415>;
416
417def S_XOR_B32 : SOP2_32 <"s_xor_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000418 [(set i32:$sdst, (UniformBinFrag<xor> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000419>;
420
421def S_XOR_B64 : SOP2_64 <"s_xor_b64",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000422 [(set i64:$sdst, (UniformBinFrag<xor> i64:$src0, i64:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000423>;
Konstantin Zhuravlyovca8946a2017-09-18 21:22:45 +0000424
425def S_XNOR_B32 : SOP2_32 <"s_xnor_b32",
426 [(set i32:$sdst, (not (xor_oneuse i32:$src0, i32:$src1)))]
427>;
428
429def S_XNOR_B64 : SOP2_64 <"s_xnor_b64",
430 [(set i64:$sdst, (not (xor_oneuse i64:$src0, i64:$src1)))]
431>;
Graham Sellers04f7a4d2018-11-29 16:05:38 +0000432
433def S_NAND_B32 : SOP2_32 <"s_nand_b32",
434 [(set i32:$sdst, (not (and_oneuse i32:$src0, i32:$src1)))]
435>;
436
437def S_NAND_B64 : SOP2_64 <"s_nand_b64",
438 [(set i64:$sdst, (not (and_oneuse i64:$src0, i64:$src1)))]
439>;
440
441def S_NOR_B32 : SOP2_32 <"s_nor_b32",
442 [(set i32:$sdst, (not (or_oneuse i32:$src0, i32:$src1)))]
443>;
444
445def S_NOR_B64 : SOP2_64 <"s_nor_b64",
446 [(set i64:$sdst, (not (or_oneuse i64:$src0, i64:$src1)))]
447>;
Matt Arsenault479ba3a2016-09-07 06:25:55 +0000448} // End isCommutable = 1
449
Graham Sellers04f7a4d2018-11-29 16:05:38 +0000450def S_ANDN2_B32 : SOP2_32 <"s_andn2_b32",
451 [(set i32:$sdst, (UniformBinFrag<and> i32:$src0, (UniformUnaryFrag<not> i32:$src1)))]
452>;
453
454def S_ANDN2_B64 : SOP2_64 <"s_andn2_b64",
455 [(set i64:$sdst, (UniformBinFrag<and> i64:$src0, (UniformUnaryFrag<not> i64:$src1)))]
456>;
457
458def S_ORN2_B32 : SOP2_32 <"s_orn2_b32",
459 [(set i32:$sdst, (UniformBinFrag<or> i32:$src0, (UniformUnaryFrag<not> i32:$src1)))]
460>;
461
462def S_ORN2_B64 : SOP2_64 <"s_orn2_b64",
463 [(set i64:$sdst, (UniformBinFrag<or> i64:$src0, (UniformUnaryFrag<not> i64:$src1)))]
464>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000465} // End Defs = [SCC]
466
467// Use added complexity so these patterns are preferred to the VALU patterns.
468let AddedComplexity = 1 in {
469
470let Defs = [SCC] in {
Alexander Timofeev36617f012018-09-21 10:31:22 +0000471// TODO: b64 versions require VOP3 change since v_lshlrev_b64 is VOP3
Valery Pykhtina34fb492016-08-30 15:20:31 +0000472def S_LSHL_B32 : SOP2_32 <"s_lshl_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000473 [(set i32:$sdst, (UniformBinFrag<shl> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000474>;
475def S_LSHL_B64 : SOP2_64_32 <"s_lshl_b64",
Alexander Timofeevb048fa32018-10-01 11:06:35 +0000476 [(set i64:$sdst, (UniformBinFrag<shl> i64:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000477>;
478def S_LSHR_B32 : SOP2_32 <"s_lshr_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000479 [(set i32:$sdst, (UniformBinFrag<srl> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000480>;
481def S_LSHR_B64 : SOP2_64_32 <"s_lshr_b64",
Alexander Timofeevb048fa32018-10-01 11:06:35 +0000482 [(set i64:$sdst, (UniformBinFrag<srl> i64:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000483>;
484def S_ASHR_I32 : SOP2_32 <"s_ashr_i32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000485 [(set i32:$sdst, (UniformBinFrag<sra> i32:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000486>;
487def S_ASHR_I64 : SOP2_64_32 <"s_ashr_i64",
Alexander Timofeevb048fa32018-10-01 11:06:35 +0000488 [(set i64:$sdst, (UniformBinFrag<sra> i64:$src0, i32:$src1))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000489>;
490} // End Defs = [SCC]
491
492def S_BFM_B32 : SOP2_32 <"s_bfm_b32",
Alexander Timofeev36617f012018-09-21 10:31:22 +0000493 [(set i32:$sdst, (UniformBinFrag<AMDGPUbfm> i32:$src0, i32:$src1))]>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000494def S_BFM_B64 : SOP2_64_32_32 <"s_bfm_b64">;
Alexander Timofeev36617f012018-09-21 10:31:22 +0000495
496// TODO: S_MUL_I32 require V_MUL_LO_I32 from VOP3 change
Valery Pykhtina34fb492016-08-30 15:20:31 +0000497def S_MUL_I32 : SOP2_32 <"s_mul_i32",
Matt Arsenault479ba3a2016-09-07 06:25:55 +0000498 [(set i32:$sdst, (mul i32:$src0, i32:$src1))]> {
499 let isCommutable = 1;
500}
Valery Pykhtina34fb492016-08-30 15:20:31 +0000501
502} // End AddedComplexity = 1
503
504let Defs = [SCC] in {
505def S_BFE_U32 : SOP2_32 <"s_bfe_u32">;
506def S_BFE_I32 : SOP2_32 <"s_bfe_i32">;
507def S_BFE_U64 : SOP2_64_32 <"s_bfe_u64">;
508def S_BFE_I64 : SOP2_64_32 <"s_bfe_i64">;
509} // End Defs = [SCC]
510
511def S_CBRANCH_G_FORK : SOP2_Pseudo <
512 "s_cbranch_g_fork", (outs),
Dmitry Preobrazhensky57148602017-04-14 11:52:26 +0000513 (ins SCSrc_b64:$src0, SCSrc_b64:$src1),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000514 "$src0, $src1"
515> {
516 let has_sdst = 0;
517}
518
519let Defs = [SCC] in {
520def S_ABSDIFF_I32 : SOP2_32 <"s_absdiff_i32">;
521} // End Defs = [SCC]
522
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +0000523let SubtargetPredicate = isVI in {
524 def S_RFE_RESTORE_B64 : SOP2_Pseudo <
525 "s_rfe_restore_b64", (outs),
526 (ins SSrc_b64:$src0, SSrc_b32:$src1),
527 "$src0, $src1"
528 > {
529 let hasSideEffects = 1;
530 let has_sdst = 0;
531 }
532}
533
Matt Arsenault9be7b0d2017-02-27 18:49:11 +0000534let SubtargetPredicate = isGFX9 in {
535 def S_PACK_LL_B32_B16 : SOP2_32<"s_pack_ll_b32_b16">;
536 def S_PACK_LH_B32_B16 : SOP2_32<"s_pack_lh_b32_b16">;
537 def S_PACK_HH_B32_B16 : SOP2_32<"s_pack_hh_b32_b16">;
Dmitry Preobrazhensky2f8e1462018-04-09 13:10:33 +0000538
539 let Defs = [SCC] in {
540 def S_LSHL1_ADD_U32 : SOP2_32<"s_lshl1_add_u32">;
541 def S_LSHL2_ADD_U32 : SOP2_32<"s_lshl2_add_u32">;
542 def S_LSHL3_ADD_U32 : SOP2_32<"s_lshl3_add_u32">;
543 def S_LSHL4_ADD_U32 : SOP2_32<"s_lshl4_add_u32">;
544 } // End Defs = [SCC]
545
546 def S_MUL_HI_U32 : SOP2_32<"s_mul_hi_u32">;
547 def S_MUL_HI_I32 : SOP2_32<"s_mul_hi_i32">;
Matt Arsenault9be7b0d2017-02-27 18:49:11 +0000548}
Valery Pykhtina34fb492016-08-30 15:20:31 +0000549
550//===----------------------------------------------------------------------===//
551// SOPK Instructions
552//===----------------------------------------------------------------------===//
553
554class SOPK_Pseudo <string opName, dag outs, dag ins,
555 string asmOps, list<dag> pattern=[]> :
556 InstSI <outs, ins, "", pattern>,
557 SIMCInstr<opName, SIEncodingFamily.NONE> {
558 let isPseudo = 1;
559 let isCodeGenOnly = 1;
560 let SubtargetPredicate = isGCN;
561 let mayLoad = 0;
562 let mayStore = 0;
563 let hasSideEffects = 0;
564 let SALU = 1;
565 let SOPK = 1;
566 let SchedRW = [WriteSALU];
567 let UseNamedOperandTable = 1;
568 string Mnemonic = opName;
569 string AsmOperands = asmOps;
570
571 bits<1> has_sdst = 1;
572}
573
574class SOPK_Real<bits<5> op, SOPK_Pseudo ps> :
575 InstSI <ps.OutOperandList, ps.InOperandList,
576 ps.Mnemonic # " " # ps.AsmOperands, []> {
577 let isPseudo = 0;
578 let isCodeGenOnly = 0;
579
580 // copy relevant pseudo op flags
581 let SubtargetPredicate = ps.SubtargetPredicate;
582 let AsmMatchConverter = ps.AsmMatchConverter;
583 let DisableEncoding = ps.DisableEncoding;
584 let Constraints = ps.Constraints;
585
586 // encoding
587 bits<7> sdst;
588 bits<16> simm16;
589 bits<32> imm;
590}
591
592class SOPK_Real32<bits<5> op, SOPK_Pseudo ps> :
593 SOPK_Real <op, ps>,
594 Enc32 {
595 let Inst{15-0} = simm16;
596 let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
597 let Inst{27-23} = op;
598 let Inst{31-28} = 0xb; //encoding
599}
600
601class SOPK_Real64<bits<5> op, SOPK_Pseudo ps> :
602 SOPK_Real<op, ps>,
603 Enc64 {
604 let Inst{15-0} = simm16;
605 let Inst{22-16} = !if(ps.has_sdst, sdst, ?);
606 let Inst{27-23} = op;
607 let Inst{31-28} = 0xb; //encoding
608 let Inst{63-32} = imm;
609}
610
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000611class SOPKInstTable <bit is_sopk, string cmpOp = ""> {
612 bit IsSOPK = is_sopk;
613 string BaseCmpOp = cmpOp;
614}
615
Valery Pykhtina34fb492016-08-30 15:20:31 +0000616class SOPK_32 <string opName, list<dag> pattern=[]> : SOPK_Pseudo <
617 opName,
618 (outs SReg_32:$sdst),
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000619 (ins s16imm:$simm16),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000620 "$sdst, $simm16",
621 pattern>;
622
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000623class SOPK_SCC <string opName, string base_op, bit isSignExt> : SOPK_Pseudo <
Valery Pykhtina34fb492016-08-30 15:20:31 +0000624 opName,
625 (outs),
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000626 !if(isSignExt,
627 (ins SReg_32:$sdst, s16imm:$simm16),
628 (ins SReg_32:$sdst, u16imm:$simm16)),
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000629 "$sdst, $simm16", []>,
630 SOPKInstTable<1, base_op>{
Valery Pykhtina34fb492016-08-30 15:20:31 +0000631 let Defs = [SCC];
632}
633
634class SOPK_32TIE <string opName, list<dag> pattern=[]> : SOPK_Pseudo <
635 opName,
636 (outs SReg_32:$sdst),
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000637 (ins SReg_32:$src0, s16imm:$simm16),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000638 "$sdst, $simm16",
639 pattern
640>;
641
642let isReMaterializable = 1, isMoveImm = 1 in {
643def S_MOVK_I32 : SOPK_32 <"s_movk_i32">;
644} // End isReMaterializable = 1
645let Uses = [SCC] in {
646def S_CMOVK_I32 : SOPK_32 <"s_cmovk_i32">;
647}
648
649let isCompare = 1 in {
650
651// This instruction is disabled for now until we can figure out how to teach
652// the instruction selector to correctly use the S_CMP* vs V_CMP*
653// instructions.
654//
655// When this instruction is enabled the code generator sometimes produces this
656// invalid sequence:
657//
658// SCC = S_CMPK_EQ_I32 SGPR0, imm
659// VCC = COPY SCC
660// VGPR0 = V_CNDMASK VCC, VGPR0, VGPR1
661//
662// def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32",
663// [(set i1:$dst, (setcc i32:$src0, imm:$src1, SETEQ))]
664// >;
665
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000666def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32", "s_cmp_eq_i32", 1>;
667def S_CMPK_LG_I32 : SOPK_SCC <"s_cmpk_lg_i32", "s_cmp_lg_i32", 1>;
668def S_CMPK_GT_I32 : SOPK_SCC <"s_cmpk_gt_i32", "s_cmp_gt_i32", 1>;
669def S_CMPK_GE_I32 : SOPK_SCC <"s_cmpk_ge_i32", "s_cmp_ge_i32", 1>;
670def S_CMPK_LT_I32 : SOPK_SCC <"s_cmpk_lt_i32", "s_cmp_lt_i32", 1>;
671def S_CMPK_LE_I32 : SOPK_SCC <"s_cmpk_le_i32", "s_cmp_le_i32", 1>;
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000672
673let SOPKZext = 1 in {
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000674def S_CMPK_EQ_U32 : SOPK_SCC <"s_cmpk_eq_u32", "s_cmp_eq_u32", 0>;
675def S_CMPK_LG_U32 : SOPK_SCC <"s_cmpk_lg_u32", "s_cmp_lg_u32", 0>;
676def S_CMPK_GT_U32 : SOPK_SCC <"s_cmpk_gt_u32", "s_cmp_gt_u32", 0>;
677def S_CMPK_GE_U32 : SOPK_SCC <"s_cmpk_ge_u32", "s_cmp_ge_u32", 0>;
678def S_CMPK_LT_U32 : SOPK_SCC <"s_cmpk_lt_u32", "s_cmp_lt_u32", 0>;
679def S_CMPK_LE_U32 : SOPK_SCC <"s_cmpk_le_u32", "s_cmp_le_u32", 0>;
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000680} // End SOPKZext = 1
Valery Pykhtina34fb492016-08-30 15:20:31 +0000681} // End isCompare = 1
682
683let Defs = [SCC], isCommutable = 1, DisableEncoding = "$src0",
684 Constraints = "$sdst = $src0" in {
685 def S_ADDK_I32 : SOPK_32TIE <"s_addk_i32">;
686 def S_MULK_I32 : SOPK_32TIE <"s_mulk_i32">;
687}
688
689def S_CBRANCH_I_FORK : SOPK_Pseudo <
690 "s_cbranch_i_fork",
Dmitry Preobrazhenskyc7d35a02017-04-26 15:34:19 +0000691 (outs), (ins SReg_64:$sdst, s16imm:$simm16),
Valery Pykhtina34fb492016-08-30 15:20:31 +0000692 "$sdst, $simm16"
693>;
694
695let mayLoad = 1 in {
696def S_GETREG_B32 : SOPK_Pseudo <
697 "s_getreg_b32",
698 (outs SReg_32:$sdst), (ins hwreg:$simm16),
699 "$sdst, $simm16"
700>;
701}
702
Tom Stellard8485fa02016-12-07 02:42:15 +0000703let hasSideEffects = 1 in {
704
Valery Pykhtina34fb492016-08-30 15:20:31 +0000705def S_SETREG_B32 : SOPK_Pseudo <
706 "s_setreg_b32",
707 (outs), (ins SReg_32:$sdst, hwreg:$simm16),
Tom Stellard8485fa02016-12-07 02:42:15 +0000708 "$simm16, $sdst",
709 [(AMDGPUsetreg i32:$sdst, (i16 timm:$simm16))]
Valery Pykhtina34fb492016-08-30 15:20:31 +0000710>;
711
712// FIXME: Not on SI?
713//def S_GETREG_REGRD_B32 : SOPK_32 <sopk<0x14, 0x13>, "s_getreg_regrd_b32">;
714
715def S_SETREG_IMM32_B32 : SOPK_Pseudo <
716 "s_setreg_imm32_b32",
717 (outs), (ins i32imm:$imm, hwreg:$simm16),
Matt Arsenault10c17ca2016-10-06 10:13:23 +0000718 "$simm16, $imm"> {
719 let Size = 8; // Unlike every other SOPK instruction.
Valery Pykhtina34fb492016-08-30 15:20:31 +0000720 let has_sdst = 0;
721}
722
Tom Stellard8485fa02016-12-07 02:42:15 +0000723} // End hasSideEffects = 1
Valery Pykhtina34fb492016-08-30 15:20:31 +0000724
Dmitry Preobrazhenskyae312232018-04-06 18:24:49 +0000725let SubtargetPredicate = isGFX9 in {
726 def S_CALL_B64 : SOPK_Pseudo<
727 "s_call_b64",
728 (outs SReg_64:$sdst),
729 (ins s16imm:$simm16),
730 "$sdst, $simm16"> {
731 let isCall = 1;
732 }
733}
734
Valery Pykhtina34fb492016-08-30 15:20:31 +0000735//===----------------------------------------------------------------------===//
736// SOPC Instructions
737//===----------------------------------------------------------------------===//
738
739class SOPCe <bits<7> op> : Enc32 {
740 bits<8> src0;
741 bits<8> src1;
742
743 let Inst{7-0} = src0;
744 let Inst{15-8} = src1;
745 let Inst{22-16} = op;
746 let Inst{31-23} = 0x17e;
747}
748
Matt Arsenaultcc88ce32016-10-12 18:00:51 +0000749class SOPC <bits<7> op, dag outs, dag ins, string asm,
750 list<dag> pattern = []> :
Valery Pykhtina34fb492016-08-30 15:20:31 +0000751 InstSI<outs, ins, asm, pattern>, SOPCe <op> {
752 let mayLoad = 0;
753 let mayStore = 0;
754 let hasSideEffects = 0;
755 let SALU = 1;
756 let SOPC = 1;
757 let isCodeGenOnly = 0;
758 let Defs = [SCC];
759 let SchedRW = [WriteSALU];
760 let UseNamedOperandTable = 1;
761 let SubtargetPredicate = isGCN;
762}
763
764class SOPC_Base <bits<7> op, RegisterOperand rc0, RegisterOperand rc1,
765 string opName, list<dag> pattern = []> : SOPC <
766 op, (outs), (ins rc0:$src0, rc1:$src1),
767 opName#" $src0, $src1", pattern > {
768 let Defs = [SCC];
769}
770class SOPC_Helper <bits<7> op, RegisterOperand rc, ValueType vt,
771 string opName, PatLeaf cond> : SOPC_Base <
772 op, rc, rc, opName,
773 [(set SCC, (si_setcc_uniform vt:$src0, vt:$src1, cond))] > {
774}
775
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000776class SOPC_CMP_32<bits<7> op, string opName,
777 PatLeaf cond = COND_NULL, string revOp = opName>
778 : SOPC_Helper<op, SSrc_b32, i32, opName, cond>,
779 Commutable_REV<revOp, !eq(revOp, opName)>,
780 SOPKInstTable<0, opName> {
781 let isCompare = 1;
782 let isCommutable = 1;
783}
Valery Pykhtina34fb492016-08-30 15:20:31 +0000784
Matt Arsenault7b1dc2c2016-09-17 02:02:19 +0000785class SOPC_CMP_64<bits<7> op, string opName,
786 PatLeaf cond = COND_NULL, string revOp = opName>
787 : SOPC_Helper<op, SSrc_b64, i64, opName, cond>,
788 Commutable_REV<revOp, !eq(revOp, opName)> {
789 let isCompare = 1;
790 let isCommutable = 1;
791}
792
Valery Pykhtina34fb492016-08-30 15:20:31 +0000793class SOPC_32<bits<7> op, string opName, list<dag> pattern = []>
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000794 : SOPC_Base<op, SSrc_b32, SSrc_b32, opName, pattern>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000795
796class SOPC_64_32<bits<7> op, string opName, list<dag> pattern = []>
Sam Kolton1eeb11b2016-09-09 14:44:04 +0000797 : SOPC_Base<op, SSrc_b64, SSrc_b32, opName, pattern>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000798
Matt Arsenault5d8eb252016-09-30 01:50:20 +0000799def S_CMP_EQ_I32 : SOPC_CMP_32 <0x00, "s_cmp_eq_i32">;
800def S_CMP_LG_I32 : SOPC_CMP_32 <0x01, "s_cmp_lg_i32">;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000801def S_CMP_GT_I32 : SOPC_CMP_32 <0x02, "s_cmp_gt_i32", COND_SGT>;
802def S_CMP_GE_I32 : SOPC_CMP_32 <0x03, "s_cmp_ge_i32", COND_SGE>;
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000803def S_CMP_LT_I32 : SOPC_CMP_32 <0x04, "s_cmp_lt_i32", COND_SLT, "s_cmp_gt_i32">;
804def S_CMP_LE_I32 : SOPC_CMP_32 <0x05, "s_cmp_le_i32", COND_SLE, "s_cmp_ge_i32">;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000805def S_CMP_EQ_U32 : SOPC_CMP_32 <0x06, "s_cmp_eq_u32", COND_EQ>;
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000806def S_CMP_LG_U32 : SOPC_CMP_32 <0x07, "s_cmp_lg_u32", COND_NE>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000807def S_CMP_GT_U32 : SOPC_CMP_32 <0x08, "s_cmp_gt_u32", COND_UGT>;
808def S_CMP_GE_U32 : SOPC_CMP_32 <0x09, "s_cmp_ge_u32", COND_UGE>;
Matt Arsenault7ccf6cd2016-09-16 21:41:16 +0000809def S_CMP_LT_U32 : SOPC_CMP_32 <0x0a, "s_cmp_lt_u32", COND_ULT, "s_cmp_gt_u32">;
810def S_CMP_LE_U32 : SOPC_CMP_32 <0x0b, "s_cmp_le_u32", COND_ULE, "s_cmp_ge_u32">;
811
Valery Pykhtina34fb492016-08-30 15:20:31 +0000812def S_BITCMP0_B32 : SOPC_32 <0x0c, "s_bitcmp0_b32">;
813def S_BITCMP1_B32 : SOPC_32 <0x0d, "s_bitcmp1_b32">;
814def S_BITCMP0_B64 : SOPC_64_32 <0x0e, "s_bitcmp0_b64">;
815def S_BITCMP1_B64 : SOPC_64_32 <0x0f, "s_bitcmp1_b64">;
816def S_SETVSKIP : SOPC_32 <0x10, "s_setvskip">;
817
Matt Arsenault7b1dc2c2016-09-17 02:02:19 +0000818let SubtargetPredicate = isVI in {
819def S_CMP_EQ_U64 : SOPC_CMP_64 <0x12, "s_cmp_eq_u64", COND_EQ>;
820def S_CMP_LG_U64 : SOPC_CMP_64 <0x13, "s_cmp_lg_u64", COND_NE>;
821}
Valery Pykhtina34fb492016-08-30 15:20:31 +0000822
Matt Arsenaultcc88ce32016-10-12 18:00:51 +0000823let SubtargetPredicate = HasVGPRIndexMode in {
824def S_SET_GPR_IDX_ON : SOPC <0x11,
825 (outs),
826 (ins SSrc_b32:$src0, GPRIdxMode:$src1),
827 "s_set_gpr_idx_on $src0,$src1"> {
828 let Defs = [M0]; // No scc def
829 let Uses = [M0]; // Other bits of m0 unmodified.
830 let hasSideEffects = 1; // Sets mode.gpr_idx_en
Matt Arsenault2d8c2892016-11-01 20:42:24 +0000831 let FixedSize = 1;
Matt Arsenaultcc88ce32016-10-12 18:00:51 +0000832}
833}
834
Valery Pykhtina34fb492016-08-30 15:20:31 +0000835//===----------------------------------------------------------------------===//
836// SOPP Instructions
837//===----------------------------------------------------------------------===//
838
839class SOPPe <bits<7> op> : Enc32 {
840 bits <16> simm16;
841
842 let Inst{15-0} = simm16;
843 let Inst{22-16} = op;
844 let Inst{31-23} = 0x17f; // encoding
845}
846
847class SOPP <bits<7> op, dag ins, string asm, list<dag> pattern = []> :
848 InstSI <(outs), ins, asm, pattern >, SOPPe <op> {
849
850 let mayLoad = 0;
851 let mayStore = 0;
852 let hasSideEffects = 0;
853 let SALU = 1;
854 let SOPP = 1;
Matt Arsenault10c17ca2016-10-06 10:13:23 +0000855 let Size = 4;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000856 let SchedRW = [WriteSALU];
857
858 let UseNamedOperandTable = 1;
859 let SubtargetPredicate = isGCN;
860}
861
862
863def S_NOP : SOPP <0x00000000, (ins i16imm:$simm16), "s_nop $simm16">;
864
865let isTerminator = 1 in {
866
867def S_ENDPGM : SOPP <0x00000001, (ins), "s_endpgm",
868 [(AMDGPUendpgm)]> {
869 let simm16 = 0;
870 let isBarrier = 1;
Matt Arsenault4e9c1e32016-10-28 23:00:38 +0000871 let isReturn = 1;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000872}
873
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +0000874let SubtargetPredicate = isVI in {
875def S_ENDPGM_SAVED : SOPP <0x0000001B, (ins), "s_endpgm_saved"> {
876 let simm16 = 0;
877 let isBarrier = 1;
878 let isReturn = 1;
879}
880}
881
Dmitry Preobrazhensky306b1a02018-04-06 17:25:00 +0000882let SubtargetPredicate = isGFX9 in {
883 let isBarrier = 1, isReturn = 1, simm16 = 0 in {
884 def S_ENDPGM_ORDERED_PS_DONE :
885 SOPP<0x01e, (ins), "s_endpgm_ordered_ps_done">;
886 } // End isBarrier = 1, isReturn = 1, simm16 = 0
887} // End SubtargetPredicate = isGFX9
888
Valery Pykhtina34fb492016-08-30 15:20:31 +0000889let isBranch = 1, SchedRW = [WriteBranch] in {
890def S_BRANCH : SOPP <
891 0x00000002, (ins sopp_brtarget:$simm16), "s_branch $simm16",
892 [(br bb:$simm16)]> {
893 let isBarrier = 1;
894}
895
896let Uses = [SCC] in {
897def S_CBRANCH_SCC0 : SOPP <
898 0x00000004, (ins sopp_brtarget:$simm16),
899 "s_cbranch_scc0 $simm16"
900>;
901def S_CBRANCH_SCC1 : SOPP <
902 0x00000005, (ins sopp_brtarget:$simm16),
Matt Arsenaultd674e0a2017-10-10 20:34:49 +0000903 "s_cbranch_scc1 $simm16"
Valery Pykhtina34fb492016-08-30 15:20:31 +0000904>;
905} // End Uses = [SCC]
906
907let Uses = [VCC] in {
908def S_CBRANCH_VCCZ : SOPP <
909 0x00000006, (ins sopp_brtarget:$simm16),
910 "s_cbranch_vccz $simm16"
911>;
912def S_CBRANCH_VCCNZ : SOPP <
913 0x00000007, (ins sopp_brtarget:$simm16),
914 "s_cbranch_vccnz $simm16"
915>;
916} // End Uses = [VCC]
917
918let Uses = [EXEC] in {
919def S_CBRANCH_EXECZ : SOPP <
920 0x00000008, (ins sopp_brtarget:$simm16),
921 "s_cbranch_execz $simm16"
922>;
923def S_CBRANCH_EXECNZ : SOPP <
924 0x00000009, (ins sopp_brtarget:$simm16),
925 "s_cbranch_execnz $simm16"
926>;
927} // End Uses = [EXEC]
928
Dmitry Preobrazhensky3ac63112017-04-05 17:26:45 +0000929def S_CBRANCH_CDBGSYS : SOPP <
930 0x00000017, (ins sopp_brtarget:$simm16),
931 "s_cbranch_cdbgsys $simm16"
932>;
933
934def S_CBRANCH_CDBGSYS_AND_USER : SOPP <
935 0x0000001A, (ins sopp_brtarget:$simm16),
936 "s_cbranch_cdbgsys_and_user $simm16"
937>;
938
939def S_CBRANCH_CDBGSYS_OR_USER : SOPP <
940 0x00000019, (ins sopp_brtarget:$simm16),
941 "s_cbranch_cdbgsys_or_user $simm16"
942>;
943
944def S_CBRANCH_CDBGUSER : SOPP <
945 0x00000018, (ins sopp_brtarget:$simm16),
946 "s_cbranch_cdbguser $simm16"
947>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000948
949} // End isBranch = 1
950} // End isTerminator = 1
951
952let hasSideEffects = 1 in {
953def S_BARRIER : SOPP <0x0000000a, (ins), "s_barrier",
954 [(int_amdgcn_s_barrier)]> {
955 let SchedRW = [WriteBarrier];
956 let simm16 = 0;
957 let mayLoad = 1;
958 let mayStore = 1;
959 let isConvergent = 1;
960}
961
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +0000962let SubtargetPredicate = isVI in {
963def S_WAKEUP : SOPP <0x00000003, (ins), "s_wakeup"> {
964 let simm16 = 0;
965 let mayLoad = 1;
966 let mayStore = 1;
967}
968}
969
Valery Pykhtina34fb492016-08-30 15:20:31 +0000970let mayLoad = 1, mayStore = 1, hasSideEffects = 1 in
971def S_WAITCNT : SOPP <0x0000000c, (ins WAIT_FLAG:$simm16), "s_waitcnt $simm16">;
972def S_SETHALT : SOPP <0x0000000d, (ins i16imm:$simm16), "s_sethalt $simm16">;
Dmitry Preobrazhensky3ac63112017-04-05 17:26:45 +0000973def S_SETKILL : SOPP <0x0000000b, (ins i16imm:$simm16), "s_setkill $simm16">;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000974
975// On SI the documentation says sleep for approximately 64 * low 2
976// bits, consistent with the reported maximum of 448. On VI the
977// maximum reported is 960 cycles, so 960 / 64 = 15 max, so is the
978// maximum really 15 on VI?
979def S_SLEEP : SOPP <0x0000000e, (ins i32imm:$simm16),
980 "s_sleep $simm16", [(int_amdgcn_s_sleep SIMM16bit:$simm16)]> {
981 let hasSideEffects = 1;
982 let mayLoad = 1;
983 let mayStore = 1;
984}
985
986def S_SETPRIO : SOPP <0x0000000f, (ins i16imm:$simm16), "s_setprio $simm16">;
987
988let Uses = [EXEC, M0] in {
989// FIXME: Should this be mayLoad+mayStore?
990def S_SENDMSG : SOPP <0x00000010, (ins SendMsgImm:$simm16), "s_sendmsg $simm16",
991 [(AMDGPUsendmsg (i32 imm:$simm16))]
992>;
Jan Veselyd48445d2017-01-04 18:06:55 +0000993
994def S_SENDMSGHALT : SOPP <0x00000011, (ins SendMsgImm:$simm16), "s_sendmsghalt $simm16",
995 [(AMDGPUsendmsghalt (i32 imm:$simm16))]
996>;
Valery Pykhtina34fb492016-08-30 15:20:31 +0000997} // End Uses = [EXEC, M0]
998
Valery Pykhtina34fb492016-08-30 15:20:31 +0000999def S_TRAP : SOPP <0x00000012, (ins i16imm:$simm16), "s_trap $simm16">;
1000def S_ICACHE_INV : SOPP <0x00000013, (ins), "s_icache_inv"> {
1001 let simm16 = 0;
1002}
1003def S_INCPERFLEVEL : SOPP <0x00000014, (ins i32imm:$simm16), "s_incperflevel $simm16",
1004 [(int_amdgcn_s_incperflevel SIMM16bit:$simm16)]> {
1005 let hasSideEffects = 1;
1006 let mayLoad = 1;
1007 let mayStore = 1;
1008}
1009def S_DECPERFLEVEL : SOPP <0x00000015, (ins i32imm:$simm16), "s_decperflevel $simm16",
1010 [(int_amdgcn_s_decperflevel SIMM16bit:$simm16)]> {
1011 let hasSideEffects = 1;
1012 let mayLoad = 1;
1013 let mayStore = 1;
1014}
1015def S_TTRACEDATA : SOPP <0x00000016, (ins), "s_ttracedata"> {
1016 let simm16 = 0;
1017}
Matt Arsenaultcc88ce32016-10-12 18:00:51 +00001018
1019let SubtargetPredicate = HasVGPRIndexMode in {
1020def S_SET_GPR_IDX_OFF : SOPP<0x1c, (ins), "s_set_gpr_idx_off"> {
1021 let simm16 = 0;
1022}
1023}
Valery Pykhtina34fb492016-08-30 15:20:31 +00001024} // End hasSideEffects
1025
Matt Arsenaultcc88ce32016-10-12 18:00:51 +00001026let SubtargetPredicate = HasVGPRIndexMode in {
1027def S_SET_GPR_IDX_MODE : SOPP<0x1d, (ins GPRIdxMode:$simm16),
1028 "s_set_gpr_idx_mode$simm16"> {
1029 let Defs = [M0];
1030}
1031}
Valery Pykhtina34fb492016-08-30 15:20:31 +00001032
Valery Pykhtina34fb492016-08-30 15:20:31 +00001033//===----------------------------------------------------------------------===//
1034// S_GETREG_B32 Intrinsic Pattern.
1035//===----------------------------------------------------------------------===//
Matt Arsenault90c75932017-10-03 00:06:41 +00001036def : GCNPat <
Valery Pykhtina34fb492016-08-30 15:20:31 +00001037 (int_amdgcn_s_getreg imm:$simm16),
1038 (S_GETREG_B32 (as_i16imm $simm16))
1039>;
1040
1041//===----------------------------------------------------------------------===//
1042// SOP1 Patterns
1043//===----------------------------------------------------------------------===//
1044
Matt Arsenault90c75932017-10-03 00:06:41 +00001045def : GCNPat <
Valery Pykhtina34fb492016-08-30 15:20:31 +00001046 (i64 (ctpop i64:$src)),
1047 (i64 (REG_SEQUENCE SReg_64,
1048 (i32 (COPY_TO_REGCLASS (S_BCNT1_I32_B64 $src), SReg_32)), sub0,
Tom Stellard115a6152016-11-10 16:02:37 +00001049 (S_MOV_B32 (i32 0)), sub1))
Valery Pykhtina34fb492016-08-30 15:20:31 +00001050>;
1051
Matt Arsenault90c75932017-10-03 00:06:41 +00001052def : GCNPat <
Valery Pykhtina34fb492016-08-30 15:20:31 +00001053 (i32 (smax i32:$x, (i32 (ineg i32:$x)))),
1054 (S_ABS_I32 $x)
1055>;
1056
Matt Arsenault90c75932017-10-03 00:06:41 +00001057def : GCNPat <
Tom Stellard115a6152016-11-10 16:02:37 +00001058 (i16 imm:$imm),
1059 (S_MOV_B32 imm:$imm)
1060>;
1061
1062// Same as a 32-bit inreg
Matt Arsenault90c75932017-10-03 00:06:41 +00001063def : GCNPat<
Tom Stellard115a6152016-11-10 16:02:37 +00001064 (i32 (sext i16:$src)),
1065 (S_SEXT_I32_I16 $src)
1066>;
1067
1068
Valery Pykhtina34fb492016-08-30 15:20:31 +00001069//===----------------------------------------------------------------------===//
1070// SOP2 Patterns
1071//===----------------------------------------------------------------------===//
1072
1073// V_ADD_I32_e32/S_ADD_U32 produces carry in VCC/SCC. For the vector
1074// case, the sgpr-copies pass will fix this to use the vector version.
Matt Arsenault90c75932017-10-03 00:06:41 +00001075def : GCNPat <
Valery Pykhtina34fb492016-08-30 15:20:31 +00001076 (i32 (addc i32:$src0, i32:$src1)),
1077 (S_ADD_U32 $src0, $src1)
1078>;
1079
Tom Stellard115a6152016-11-10 16:02:37 +00001080// FIXME: We need to use COPY_TO_REGCLASS to work-around the fact that
1081// REG_SEQUENCE patterns don't support instructions with multiple
1082// outputs.
Matt Arsenault90c75932017-10-03 00:06:41 +00001083def : GCNPat<
Tom Stellard115a6152016-11-10 16:02:37 +00001084 (i64 (zext i16:$src)),
1085 (REG_SEQUENCE SReg_64,
1086 (i32 (COPY_TO_REGCLASS (S_AND_B32 $src, (S_MOV_B32 (i32 0xffff))), SGPR_32)), sub0,
1087 (S_MOV_B32 (i32 0)), sub1)
1088>;
1089
Matt Arsenault90c75932017-10-03 00:06:41 +00001090def : GCNPat <
Tom Stellard115a6152016-11-10 16:02:37 +00001091 (i64 (sext i16:$src)),
1092 (REG_SEQUENCE SReg_64, (i32 (S_SEXT_I32_I16 $src)), sub0,
1093 (i32 (COPY_TO_REGCLASS (S_ASHR_I32 (i32 (S_SEXT_I32_I16 $src)), (S_MOV_B32 (i32 31))), SGPR_32)), sub1)
1094>;
1095
Matt Arsenault90c75932017-10-03 00:06:41 +00001096def : GCNPat<
Tom Stellard115a6152016-11-10 16:02:37 +00001097 (i32 (zext i16:$src)),
1098 (S_AND_B32 (S_MOV_B32 (i32 0xffff)), $src)
1099>;
1100
1101
1102
Valery Pykhtina34fb492016-08-30 15:20:31 +00001103//===----------------------------------------------------------------------===//
1104// SOPP Patterns
1105//===----------------------------------------------------------------------===//
1106
Matt Arsenault90c75932017-10-03 00:06:41 +00001107def : GCNPat <
Valery Pykhtina34fb492016-08-30 15:20:31 +00001108 (int_amdgcn_s_waitcnt i32:$simm16),
1109 (S_WAITCNT (as_i16imm $simm16))
1110>;
1111
Valery Pykhtina34fb492016-08-30 15:20:31 +00001112
1113//===----------------------------------------------------------------------===//
1114// Real target instructions, move this to the appropriate subtarget TD file
1115//===----------------------------------------------------------------------===//
1116
1117class Select_si<string opName> :
1118 SIMCInstr<opName, SIEncodingFamily.SI> {
1119 list<Predicate> AssemblerPredicates = [isSICI];
1120 string DecoderNamespace = "SICI";
1121}
1122
1123class SOP1_Real_si<bits<8> op, SOP1_Pseudo ps> :
1124 SOP1_Real<op, ps>,
1125 Select_si<ps.Mnemonic>;
1126
1127class SOP2_Real_si<bits<7> op, SOP2_Pseudo ps> :
1128 SOP2_Real<op, ps>,
1129 Select_si<ps.Mnemonic>;
1130
1131class SOPK_Real_si<bits<5> op, SOPK_Pseudo ps> :
1132 SOPK_Real32<op, ps>,
1133 Select_si<ps.Mnemonic>;
1134
1135def S_MOV_B32_si : SOP1_Real_si <0x03, S_MOV_B32>;
1136def S_MOV_B64_si : SOP1_Real_si <0x04, S_MOV_B64>;
1137def S_CMOV_B32_si : SOP1_Real_si <0x05, S_CMOV_B32>;
1138def S_CMOV_B64_si : SOP1_Real_si <0x06, S_CMOV_B64>;
1139def S_NOT_B32_si : SOP1_Real_si <0x07, S_NOT_B32>;
1140def S_NOT_B64_si : SOP1_Real_si <0x08, S_NOT_B64>;
1141def S_WQM_B32_si : SOP1_Real_si <0x09, S_WQM_B32>;
1142def S_WQM_B64_si : SOP1_Real_si <0x0a, S_WQM_B64>;
1143def S_BREV_B32_si : SOP1_Real_si <0x0b, S_BREV_B32>;
1144def S_BREV_B64_si : SOP1_Real_si <0x0c, S_BREV_B64>;
1145def S_BCNT0_I32_B32_si : SOP1_Real_si <0x0d, S_BCNT0_I32_B32>;
1146def S_BCNT0_I32_B64_si : SOP1_Real_si <0x0e, S_BCNT0_I32_B64>;
1147def S_BCNT1_I32_B32_si : SOP1_Real_si <0x0f, S_BCNT1_I32_B32>;
1148def S_BCNT1_I32_B64_si : SOP1_Real_si <0x10, S_BCNT1_I32_B64>;
1149def S_FF0_I32_B32_si : SOP1_Real_si <0x11, S_FF0_I32_B32>;
1150def S_FF0_I32_B64_si : SOP1_Real_si <0x12, S_FF0_I32_B64>;
1151def S_FF1_I32_B32_si : SOP1_Real_si <0x13, S_FF1_I32_B32>;
1152def S_FF1_I32_B64_si : SOP1_Real_si <0x14, S_FF1_I32_B64>;
1153def S_FLBIT_I32_B32_si : SOP1_Real_si <0x15, S_FLBIT_I32_B32>;
1154def S_FLBIT_I32_B64_si : SOP1_Real_si <0x16, S_FLBIT_I32_B64>;
1155def S_FLBIT_I32_si : SOP1_Real_si <0x17, S_FLBIT_I32>;
1156def S_FLBIT_I32_I64_si : SOP1_Real_si <0x18, S_FLBIT_I32_I64>;
1157def S_SEXT_I32_I8_si : SOP1_Real_si <0x19, S_SEXT_I32_I8>;
1158def S_SEXT_I32_I16_si : SOP1_Real_si <0x1a, S_SEXT_I32_I16>;
1159def S_BITSET0_B32_si : SOP1_Real_si <0x1b, S_BITSET0_B32>;
1160def S_BITSET0_B64_si : SOP1_Real_si <0x1c, S_BITSET0_B64>;
1161def S_BITSET1_B32_si : SOP1_Real_si <0x1d, S_BITSET1_B32>;
1162def S_BITSET1_B64_si : SOP1_Real_si <0x1e, S_BITSET1_B64>;
1163def S_GETPC_B64_si : SOP1_Real_si <0x1f, S_GETPC_B64>;
1164def S_SETPC_B64_si : SOP1_Real_si <0x20, S_SETPC_B64>;
1165def S_SWAPPC_B64_si : SOP1_Real_si <0x21, S_SWAPPC_B64>;
1166def S_RFE_B64_si : SOP1_Real_si <0x22, S_RFE_B64>;
1167def S_AND_SAVEEXEC_B64_si : SOP1_Real_si <0x24, S_AND_SAVEEXEC_B64>;
1168def S_OR_SAVEEXEC_B64_si : SOP1_Real_si <0x25, S_OR_SAVEEXEC_B64>;
1169def S_XOR_SAVEEXEC_B64_si : SOP1_Real_si <0x26, S_XOR_SAVEEXEC_B64>;
1170def S_ANDN2_SAVEEXEC_B64_si: SOP1_Real_si <0x27, S_ANDN2_SAVEEXEC_B64>;
1171def S_ORN2_SAVEEXEC_B64_si : SOP1_Real_si <0x28, S_ORN2_SAVEEXEC_B64>;
1172def S_NAND_SAVEEXEC_B64_si : SOP1_Real_si <0x29, S_NAND_SAVEEXEC_B64>;
1173def S_NOR_SAVEEXEC_B64_si : SOP1_Real_si <0x2a, S_NOR_SAVEEXEC_B64>;
1174def S_XNOR_SAVEEXEC_B64_si : SOP1_Real_si <0x2b, S_XNOR_SAVEEXEC_B64>;
1175def S_QUADMASK_B32_si : SOP1_Real_si <0x2c, S_QUADMASK_B32>;
1176def S_QUADMASK_B64_si : SOP1_Real_si <0x2d, S_QUADMASK_B64>;
1177def S_MOVRELS_B32_si : SOP1_Real_si <0x2e, S_MOVRELS_B32>;
1178def S_MOVRELS_B64_si : SOP1_Real_si <0x2f, S_MOVRELS_B64>;
1179def S_MOVRELD_B32_si : SOP1_Real_si <0x30, S_MOVRELD_B32>;
1180def S_MOVRELD_B64_si : SOP1_Real_si <0x31, S_MOVRELD_B64>;
1181def S_CBRANCH_JOIN_si : SOP1_Real_si <0x32, S_CBRANCH_JOIN>;
1182def S_MOV_REGRD_B32_si : SOP1_Real_si <0x33, S_MOV_REGRD_B32>;
1183def S_ABS_I32_si : SOP1_Real_si <0x34, S_ABS_I32>;
1184def S_MOV_FED_B32_si : SOP1_Real_si <0x35, S_MOV_FED_B32>;
1185
1186def S_ADD_U32_si : SOP2_Real_si <0x00, S_ADD_U32>;
1187def S_ADD_I32_si : SOP2_Real_si <0x02, S_ADD_I32>;
1188def S_SUB_U32_si : SOP2_Real_si <0x01, S_SUB_U32>;
1189def S_SUB_I32_si : SOP2_Real_si <0x03, S_SUB_I32>;
1190def S_ADDC_U32_si : SOP2_Real_si <0x04, S_ADDC_U32>;
1191def S_SUBB_U32_si : SOP2_Real_si <0x05, S_SUBB_U32>;
1192def S_MIN_I32_si : SOP2_Real_si <0x06, S_MIN_I32>;
1193def S_MIN_U32_si : SOP2_Real_si <0x07, S_MIN_U32>;
1194def S_MAX_I32_si : SOP2_Real_si <0x08, S_MAX_I32>;
1195def S_MAX_U32_si : SOP2_Real_si <0x09, S_MAX_U32>;
1196def S_CSELECT_B32_si : SOP2_Real_si <0x0a, S_CSELECT_B32>;
1197def S_CSELECT_B64_si : SOP2_Real_si <0x0b, S_CSELECT_B64>;
1198def S_AND_B32_si : SOP2_Real_si <0x0e, S_AND_B32>;
1199def S_AND_B64_si : SOP2_Real_si <0x0f, S_AND_B64>;
1200def S_OR_B32_si : SOP2_Real_si <0x10, S_OR_B32>;
1201def S_OR_B64_si : SOP2_Real_si <0x11, S_OR_B64>;
1202def S_XOR_B32_si : SOP2_Real_si <0x12, S_XOR_B32>;
1203def S_XOR_B64_si : SOP2_Real_si <0x13, S_XOR_B64>;
1204def S_ANDN2_B32_si : SOP2_Real_si <0x14, S_ANDN2_B32>;
1205def S_ANDN2_B64_si : SOP2_Real_si <0x15, S_ANDN2_B64>;
1206def S_ORN2_B32_si : SOP2_Real_si <0x16, S_ORN2_B32>;
1207def S_ORN2_B64_si : SOP2_Real_si <0x17, S_ORN2_B64>;
1208def S_NAND_B32_si : SOP2_Real_si <0x18, S_NAND_B32>;
1209def S_NAND_B64_si : SOP2_Real_si <0x19, S_NAND_B64>;
1210def S_NOR_B32_si : SOP2_Real_si <0x1a, S_NOR_B32>;
1211def S_NOR_B64_si : SOP2_Real_si <0x1b, S_NOR_B64>;
1212def S_XNOR_B32_si : SOP2_Real_si <0x1c, S_XNOR_B32>;
1213def S_XNOR_B64_si : SOP2_Real_si <0x1d, S_XNOR_B64>;
1214def S_LSHL_B32_si : SOP2_Real_si <0x1e, S_LSHL_B32>;
1215def S_LSHL_B64_si : SOP2_Real_si <0x1f, S_LSHL_B64>;
1216def S_LSHR_B32_si : SOP2_Real_si <0x20, S_LSHR_B32>;
1217def S_LSHR_B64_si : SOP2_Real_si <0x21, S_LSHR_B64>;
1218def S_ASHR_I32_si : SOP2_Real_si <0x22, S_ASHR_I32>;
1219def S_ASHR_I64_si : SOP2_Real_si <0x23, S_ASHR_I64>;
1220def S_BFM_B32_si : SOP2_Real_si <0x24, S_BFM_B32>;
1221def S_BFM_B64_si : SOP2_Real_si <0x25, S_BFM_B64>;
1222def S_MUL_I32_si : SOP2_Real_si <0x26, S_MUL_I32>;
1223def S_BFE_U32_si : SOP2_Real_si <0x27, S_BFE_U32>;
1224def S_BFE_I32_si : SOP2_Real_si <0x28, S_BFE_I32>;
1225def S_BFE_U64_si : SOP2_Real_si <0x29, S_BFE_U64>;
1226def S_BFE_I64_si : SOP2_Real_si <0x2a, S_BFE_I64>;
1227def S_CBRANCH_G_FORK_si : SOP2_Real_si <0x2b, S_CBRANCH_G_FORK>;
1228def S_ABSDIFF_I32_si : SOP2_Real_si <0x2c, S_ABSDIFF_I32>;
1229
1230def S_MOVK_I32_si : SOPK_Real_si <0x00, S_MOVK_I32>;
1231def S_CMOVK_I32_si : SOPK_Real_si <0x02, S_CMOVK_I32>;
1232def S_CMPK_EQ_I32_si : SOPK_Real_si <0x03, S_CMPK_EQ_I32>;
1233def S_CMPK_LG_I32_si : SOPK_Real_si <0x04, S_CMPK_LG_I32>;
1234def S_CMPK_GT_I32_si : SOPK_Real_si <0x05, S_CMPK_GT_I32>;
1235def S_CMPK_GE_I32_si : SOPK_Real_si <0x06, S_CMPK_GE_I32>;
1236def S_CMPK_LT_I32_si : SOPK_Real_si <0x07, S_CMPK_LT_I32>;
1237def S_CMPK_LE_I32_si : SOPK_Real_si <0x08, S_CMPK_LE_I32>;
1238def S_CMPK_EQ_U32_si : SOPK_Real_si <0x09, S_CMPK_EQ_U32>;
1239def S_CMPK_LG_U32_si : SOPK_Real_si <0x0a, S_CMPK_LG_U32>;
1240def S_CMPK_GT_U32_si : SOPK_Real_si <0x0b, S_CMPK_GT_U32>;
1241def S_CMPK_GE_U32_si : SOPK_Real_si <0x0c, S_CMPK_GE_U32>;
1242def S_CMPK_LT_U32_si : SOPK_Real_si <0x0d, S_CMPK_LT_U32>;
1243def S_CMPK_LE_U32_si : SOPK_Real_si <0x0e, S_CMPK_LE_U32>;
1244def S_ADDK_I32_si : SOPK_Real_si <0x0f, S_ADDK_I32>;
1245def S_MULK_I32_si : SOPK_Real_si <0x10, S_MULK_I32>;
1246def S_CBRANCH_I_FORK_si : SOPK_Real_si <0x11, S_CBRANCH_I_FORK>;
1247def S_GETREG_B32_si : SOPK_Real_si <0x12, S_GETREG_B32>;
1248def S_SETREG_B32_si : SOPK_Real_si <0x13, S_SETREG_B32>;
1249//def S_GETREG_REGRD_B32_si : SOPK_Real_si <0x14, S_GETREG_REGRD_B32>; // see pseudo for comments
1250def S_SETREG_IMM32_B32_si : SOPK_Real64<0x15, S_SETREG_IMM32_B32>,
1251 Select_si<S_SETREG_IMM32_B32.Mnemonic>;
1252
1253
1254class Select_vi<string opName> :
1255 SIMCInstr<opName, SIEncodingFamily.VI> {
1256 list<Predicate> AssemblerPredicates = [isVI];
1257 string DecoderNamespace = "VI";
1258}
1259
1260class SOP1_Real_vi<bits<8> op, SOP1_Pseudo ps> :
1261 SOP1_Real<op, ps>,
1262 Select_vi<ps.Mnemonic>;
1263
1264
1265class SOP2_Real_vi<bits<7> op, SOP2_Pseudo ps> :
1266 SOP2_Real<op, ps>,
1267 Select_vi<ps.Mnemonic>;
1268
1269class SOPK_Real_vi<bits<5> op, SOPK_Pseudo ps> :
1270 SOPK_Real32<op, ps>,
1271 Select_vi<ps.Mnemonic>;
1272
1273def S_MOV_B32_vi : SOP1_Real_vi <0x00, S_MOV_B32>;
1274def S_MOV_B64_vi : SOP1_Real_vi <0x01, S_MOV_B64>;
1275def S_CMOV_B32_vi : SOP1_Real_vi <0x02, S_CMOV_B32>;
1276def S_CMOV_B64_vi : SOP1_Real_vi <0x03, S_CMOV_B64>;
1277def S_NOT_B32_vi : SOP1_Real_vi <0x04, S_NOT_B32>;
1278def S_NOT_B64_vi : SOP1_Real_vi <0x05, S_NOT_B64>;
1279def S_WQM_B32_vi : SOP1_Real_vi <0x06, S_WQM_B32>;
1280def S_WQM_B64_vi : SOP1_Real_vi <0x07, S_WQM_B64>;
1281def S_BREV_B32_vi : SOP1_Real_vi <0x08, S_BREV_B32>;
1282def S_BREV_B64_vi : SOP1_Real_vi <0x09, S_BREV_B64>;
1283def S_BCNT0_I32_B32_vi : SOP1_Real_vi <0x0a, S_BCNT0_I32_B32>;
1284def S_BCNT0_I32_B64_vi : SOP1_Real_vi <0x0b, S_BCNT0_I32_B64>;
1285def S_BCNT1_I32_B32_vi : SOP1_Real_vi <0x0c, S_BCNT1_I32_B32>;
1286def S_BCNT1_I32_B64_vi : SOP1_Real_vi <0x0d, S_BCNT1_I32_B64>;
1287def S_FF0_I32_B32_vi : SOP1_Real_vi <0x0e, S_FF0_I32_B32>;
1288def S_FF0_I32_B64_vi : SOP1_Real_vi <0x0f, S_FF0_I32_B64>;
1289def S_FF1_I32_B32_vi : SOP1_Real_vi <0x10, S_FF1_I32_B32>;
1290def S_FF1_I32_B64_vi : SOP1_Real_vi <0x11, S_FF1_I32_B64>;
1291def S_FLBIT_I32_B32_vi : SOP1_Real_vi <0x12, S_FLBIT_I32_B32>;
1292def S_FLBIT_I32_B64_vi : SOP1_Real_vi <0x13, S_FLBIT_I32_B64>;
1293def S_FLBIT_I32_vi : SOP1_Real_vi <0x14, S_FLBIT_I32>;
1294def S_FLBIT_I32_I64_vi : SOP1_Real_vi <0x15, S_FLBIT_I32_I64>;
1295def S_SEXT_I32_I8_vi : SOP1_Real_vi <0x16, S_SEXT_I32_I8>;
1296def S_SEXT_I32_I16_vi : SOP1_Real_vi <0x17, S_SEXT_I32_I16>;
1297def S_BITSET0_B32_vi : SOP1_Real_vi <0x18, S_BITSET0_B32>;
1298def S_BITSET0_B64_vi : SOP1_Real_vi <0x19, S_BITSET0_B64>;
1299def S_BITSET1_B32_vi : SOP1_Real_vi <0x1a, S_BITSET1_B32>;
1300def S_BITSET1_B64_vi : SOP1_Real_vi <0x1b, S_BITSET1_B64>;
1301def S_GETPC_B64_vi : SOP1_Real_vi <0x1c, S_GETPC_B64>;
1302def S_SETPC_B64_vi : SOP1_Real_vi <0x1d, S_SETPC_B64>;
1303def S_SWAPPC_B64_vi : SOP1_Real_vi <0x1e, S_SWAPPC_B64>;
1304def S_RFE_B64_vi : SOP1_Real_vi <0x1f, S_RFE_B64>;
1305def S_AND_SAVEEXEC_B64_vi : SOP1_Real_vi <0x20, S_AND_SAVEEXEC_B64>;
1306def S_OR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x21, S_OR_SAVEEXEC_B64>;
1307def S_XOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x22, S_XOR_SAVEEXEC_B64>;
1308def S_ANDN2_SAVEEXEC_B64_vi: SOP1_Real_vi <0x23, S_ANDN2_SAVEEXEC_B64>;
1309def S_ORN2_SAVEEXEC_B64_vi : SOP1_Real_vi <0x24, S_ORN2_SAVEEXEC_B64>;
1310def S_NAND_SAVEEXEC_B64_vi : SOP1_Real_vi <0x25, S_NAND_SAVEEXEC_B64>;
1311def S_NOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x26, S_NOR_SAVEEXEC_B64>;
1312def S_XNOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x27, S_XNOR_SAVEEXEC_B64>;
1313def S_QUADMASK_B32_vi : SOP1_Real_vi <0x28, S_QUADMASK_B32>;
1314def S_QUADMASK_B64_vi : SOP1_Real_vi <0x29, S_QUADMASK_B64>;
1315def S_MOVRELS_B32_vi : SOP1_Real_vi <0x2a, S_MOVRELS_B32>;
1316def S_MOVRELS_B64_vi : SOP1_Real_vi <0x2b, S_MOVRELS_B64>;
1317def S_MOVRELD_B32_vi : SOP1_Real_vi <0x2c, S_MOVRELD_B32>;
1318def S_MOVRELD_B64_vi : SOP1_Real_vi <0x2d, S_MOVRELD_B64>;
1319def S_CBRANCH_JOIN_vi : SOP1_Real_vi <0x2e, S_CBRANCH_JOIN>;
1320def S_MOV_REGRD_B32_vi : SOP1_Real_vi <0x2f, S_MOV_REGRD_B32>;
1321def S_ABS_I32_vi : SOP1_Real_vi <0x30, S_ABS_I32>;
1322def S_MOV_FED_B32_vi : SOP1_Real_vi <0x31, S_MOV_FED_B32>;
Matt Arsenaultcc88ce32016-10-12 18:00:51 +00001323def S_SET_GPR_IDX_IDX_vi : SOP1_Real_vi <0x32, S_SET_GPR_IDX_IDX>;
Valery Pykhtina34fb492016-08-30 15:20:31 +00001324
1325def S_ADD_U32_vi : SOP2_Real_vi <0x00, S_ADD_U32>;
1326def S_ADD_I32_vi : SOP2_Real_vi <0x02, S_ADD_I32>;
1327def S_SUB_U32_vi : SOP2_Real_vi <0x01, S_SUB_U32>;
1328def S_SUB_I32_vi : SOP2_Real_vi <0x03, S_SUB_I32>;
1329def S_ADDC_U32_vi : SOP2_Real_vi <0x04, S_ADDC_U32>;
1330def S_SUBB_U32_vi : SOP2_Real_vi <0x05, S_SUBB_U32>;
1331def S_MIN_I32_vi : SOP2_Real_vi <0x06, S_MIN_I32>;
1332def S_MIN_U32_vi : SOP2_Real_vi <0x07, S_MIN_U32>;
1333def S_MAX_I32_vi : SOP2_Real_vi <0x08, S_MAX_I32>;
1334def S_MAX_U32_vi : SOP2_Real_vi <0x09, S_MAX_U32>;
1335def S_CSELECT_B32_vi : SOP2_Real_vi <0x0a, S_CSELECT_B32>;
1336def S_CSELECT_B64_vi : SOP2_Real_vi <0x0b, S_CSELECT_B64>;
1337def S_AND_B32_vi : SOP2_Real_vi <0x0c, S_AND_B32>;
1338def S_AND_B64_vi : SOP2_Real_vi <0x0d, S_AND_B64>;
1339def S_OR_B32_vi : SOP2_Real_vi <0x0e, S_OR_B32>;
1340def S_OR_B64_vi : SOP2_Real_vi <0x0f, S_OR_B64>;
1341def S_XOR_B32_vi : SOP2_Real_vi <0x10, S_XOR_B32>;
1342def S_XOR_B64_vi : SOP2_Real_vi <0x11, S_XOR_B64>;
1343def S_ANDN2_B32_vi : SOP2_Real_vi <0x12, S_ANDN2_B32>;
1344def S_ANDN2_B64_vi : SOP2_Real_vi <0x13, S_ANDN2_B64>;
1345def S_ORN2_B32_vi : SOP2_Real_vi <0x14, S_ORN2_B32>;
1346def S_ORN2_B64_vi : SOP2_Real_vi <0x15, S_ORN2_B64>;
1347def S_NAND_B32_vi : SOP2_Real_vi <0x16, S_NAND_B32>;
1348def S_NAND_B64_vi : SOP2_Real_vi <0x17, S_NAND_B64>;
1349def S_NOR_B32_vi : SOP2_Real_vi <0x18, S_NOR_B32>;
1350def S_NOR_B64_vi : SOP2_Real_vi <0x19, S_NOR_B64>;
1351def S_XNOR_B32_vi : SOP2_Real_vi <0x1a, S_XNOR_B32>;
1352def S_XNOR_B64_vi : SOP2_Real_vi <0x1b, S_XNOR_B64>;
1353def S_LSHL_B32_vi : SOP2_Real_vi <0x1c, S_LSHL_B32>;
1354def S_LSHL_B64_vi : SOP2_Real_vi <0x1d, S_LSHL_B64>;
1355def S_LSHR_B32_vi : SOP2_Real_vi <0x1e, S_LSHR_B32>;
1356def S_LSHR_B64_vi : SOP2_Real_vi <0x1f, S_LSHR_B64>;
1357def S_ASHR_I32_vi : SOP2_Real_vi <0x20, S_ASHR_I32>;
1358def S_ASHR_I64_vi : SOP2_Real_vi <0x21, S_ASHR_I64>;
1359def S_BFM_B32_vi : SOP2_Real_vi <0x22, S_BFM_B32>;
1360def S_BFM_B64_vi : SOP2_Real_vi <0x23, S_BFM_B64>;
1361def S_MUL_I32_vi : SOP2_Real_vi <0x24, S_MUL_I32>;
1362def S_BFE_U32_vi : SOP2_Real_vi <0x25, S_BFE_U32>;
1363def S_BFE_I32_vi : SOP2_Real_vi <0x26, S_BFE_I32>;
1364def S_BFE_U64_vi : SOP2_Real_vi <0x27, S_BFE_U64>;
1365def S_BFE_I64_vi : SOP2_Real_vi <0x28, S_BFE_I64>;
1366def S_CBRANCH_G_FORK_vi : SOP2_Real_vi <0x29, S_CBRANCH_G_FORK>;
1367def S_ABSDIFF_I32_vi : SOP2_Real_vi <0x2a, S_ABSDIFF_I32>;
Matt Arsenault9be7b0d2017-02-27 18:49:11 +00001368def S_PACK_LL_B32_B16_vi : SOP2_Real_vi <0x32, S_PACK_LL_B32_B16>;
1369def S_PACK_LH_B32_B16_vi : SOP2_Real_vi <0x33, S_PACK_LH_B32_B16>;
1370def S_PACK_HH_B32_B16_vi : SOP2_Real_vi <0x34, S_PACK_HH_B32_B16>;
Dmitry Preobrazhensky14104e02017-04-12 17:10:07 +00001371def S_RFE_RESTORE_B64_vi : SOP2_Real_vi <0x2b, S_RFE_RESTORE_B64>;
Valery Pykhtina34fb492016-08-30 15:20:31 +00001372
1373def S_MOVK_I32_vi : SOPK_Real_vi <0x00, S_MOVK_I32>;
1374def S_CMOVK_I32_vi : SOPK_Real_vi <0x01, S_CMOVK_I32>;
1375def S_CMPK_EQ_I32_vi : SOPK_Real_vi <0x02, S_CMPK_EQ_I32>;
1376def S_CMPK_LG_I32_vi : SOPK_Real_vi <0x03, S_CMPK_LG_I32>;
1377def S_CMPK_GT_I32_vi : SOPK_Real_vi <0x04, S_CMPK_GT_I32>;
1378def S_CMPK_GE_I32_vi : SOPK_Real_vi <0x05, S_CMPK_GE_I32>;
1379def S_CMPK_LT_I32_vi : SOPK_Real_vi <0x06, S_CMPK_LT_I32>;
1380def S_CMPK_LE_I32_vi : SOPK_Real_vi <0x07, S_CMPK_LE_I32>;
1381def S_CMPK_EQ_U32_vi : SOPK_Real_vi <0x08, S_CMPK_EQ_U32>;
1382def S_CMPK_LG_U32_vi : SOPK_Real_vi <0x09, S_CMPK_LG_U32>;
1383def S_CMPK_GT_U32_vi : SOPK_Real_vi <0x0A, S_CMPK_GT_U32>;
1384def S_CMPK_GE_U32_vi : SOPK_Real_vi <0x0B, S_CMPK_GE_U32>;
1385def S_CMPK_LT_U32_vi : SOPK_Real_vi <0x0C, S_CMPK_LT_U32>;
1386def S_CMPK_LE_U32_vi : SOPK_Real_vi <0x0D, S_CMPK_LE_U32>;
1387def S_ADDK_I32_vi : SOPK_Real_vi <0x0E, S_ADDK_I32>;
1388def S_MULK_I32_vi : SOPK_Real_vi <0x0F, S_MULK_I32>;
1389def S_CBRANCH_I_FORK_vi : SOPK_Real_vi <0x10, S_CBRANCH_I_FORK>;
1390def S_GETREG_B32_vi : SOPK_Real_vi <0x11, S_GETREG_B32>;
1391def S_SETREG_B32_vi : SOPK_Real_vi <0x12, S_SETREG_B32>;
1392//def S_GETREG_REGRD_B32_vi : SOPK_Real_vi <0x13, S_GETREG_REGRD_B32>; // see pseudo for comments
1393def S_SETREG_IMM32_B32_vi : SOPK_Real64<0x14, S_SETREG_IMM32_B32>,
Tom Stellard2add8a12016-09-06 20:00:26 +00001394 Select_vi<S_SETREG_IMM32_B32.Mnemonic>;
Dmitry Preobrazhenskyf20aff52018-04-06 16:35:11 +00001395
Dmitry Preobrazhenskyae312232018-04-06 18:24:49 +00001396def S_CALL_B64_vi : SOPK_Real_vi <0x15, S_CALL_B64>;
1397
Dmitry Preobrazhenskyf20aff52018-04-06 16:35:11 +00001398//===----------------------------------------------------------------------===//
1399// SOP1 - GFX9.
1400//===----------------------------------------------------------------------===//
1401
1402def S_ANDN1_SAVEEXEC_B64_vi : SOP1_Real_vi<0x33, S_ANDN1_SAVEEXEC_B64>;
1403def S_ORN1_SAVEEXEC_B64_vi : SOP1_Real_vi<0x34, S_ORN1_SAVEEXEC_B64>;
1404def S_ANDN1_WREXEC_B64_vi : SOP1_Real_vi<0x35, S_ANDN1_WREXEC_B64>;
1405def S_ANDN2_WREXEC_B64_vi : SOP1_Real_vi<0x36, S_ANDN2_WREXEC_B64>;
1406def S_BITREPLICATE_B64_B32_vi : SOP1_Real_vi<0x37, S_BITREPLICATE_B64_B32>;
Dmitry Preobrazhensky2f8e1462018-04-09 13:10:33 +00001407
1408//===----------------------------------------------------------------------===//
1409// SOP2 - GFX9.
1410//===----------------------------------------------------------------------===//
1411
1412def S_LSHL1_ADD_U32_vi : SOP2_Real_vi<0x2e, S_LSHL1_ADD_U32>;
1413def S_LSHL2_ADD_U32_vi : SOP2_Real_vi<0x2f, S_LSHL2_ADD_U32>;
1414def S_LSHL3_ADD_U32_vi : SOP2_Real_vi<0x30, S_LSHL3_ADD_U32>;
1415def S_LSHL4_ADD_U32_vi : SOP2_Real_vi<0x31, S_LSHL4_ADD_U32>;
1416def S_MUL_HI_U32_vi : SOP2_Real_vi<0x2c, S_MUL_HI_U32>;
1417def S_MUL_HI_I32_vi : SOP2_Real_vi<0x2d, S_MUL_HI_I32>;