blob: 49df51f6111a01b98237865565c55a3424f8c596 [file] [log] [blame]
//===-- VOPInstructions.td - Vector Instruction Definitions ---------------===//
2//
Chandler Carruth2946cd72019-01-19 08:50:56 +00003// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Valery Pykhtin2828b9b2016-09-19 14:39:49 +00006//
7//===----------------------------------------------------------------------===//
8
// Dummy field declarations for use with an outer `let`.
// The class only declares the fields below and assigns none of them.
// NOTE(review): presumably mixed into records that are not instructions but
// are still wrapped by an enclosing `let ... in` - confirm against the users.
class LetDummies {
  // Instruction property bits.
  bit isCommutable;
  bit isConvertibleToThreeAddress;
  bit isMoveImm;
  bit isReMaterializable;
  bit isAsCheapAsAMove;
  bit VOPAsmPrefer32Bit;

  // Selection predicate and operand constraint strings.
  Predicate SubtargetPredicate;
  string Constraints;
  string DisableEncoding;

  // Scheduling information and implicit register lists.
  list<SchedReadWrite> SchedRW;
  list<Register> Uses;
  list<Register> Defs;
}
24
// Stores the operation name passed as `opName` in the `OpName` field.
class VOP <string opName> {
  string OpName = opName;
}
28
// Common base for VOP instructions built directly on InstSI.
// Marks the instruction as VALU, implicitly reading EXEC, with no memory
// access and no side effects, and requests the named operand table.
class VOPAnyCommon <dag outs, dag ins, string asm, list<dag> pattern> :
    InstSI <outs, ins, asm, pattern> {

  // No memory access and no unmodelled side effects.
  let mayLoad = 0;
  let mayStore = 0;
  let hasSideEffects = 0;

  let UseNamedOperandTable = 1;

  let VALU = 1;
  let Uses = [EXEC];
}
39
// Base class for VOP pseudo instructions.
//
//   opName  - base mnemonic; stored in `Mnemonic` and, via VOP, in `OpName`.
//   suffix  - appended to opName to form the SIMCInstr key and the
//             MnemonicAlias source name.
//   P       - operand/type profile, kept in `Pfl`.
//   outs, ins, asm, pattern - forwarded unchanged to InstSI.
//
// `AsmOperands` is declared here without a value; derived classes assign it.
class VOP_Pseudo <string opName, string suffix, VOPProfile P, dag outs, dag ins,
                  string asm, list<dag> pattern> :
    InstSI <outs, ins, asm, pattern>,
    VOP <opName>,
    SIMCInstr <opName#suffix, SIEncodingFamily.NONE>,
    MnemonicAlias<opName#suffix, opName> {

  // Pseudo: code generation only.
  let isPseudo = 1;
  let isCodeGenOnly = 1;
  let UseNamedOperandTable = 1;

  string Mnemonic = opName;
  VOPProfile Pfl = P;

  string AsmOperands;
}
56
// Common settings for VOP3 instructions defined on top of VOPAnyCommon.
//
//   HasMods  - when equal to 1 the "cvtVOP3" asm match converter is used,
//              otherwise no converter is set.
//   VOP3Only - accepted for interface compatibility; not referenced in this
//              class body.
class VOP3Common <dag outs, dag ins, string asm = "",
                  list<dag> pattern = [], bit HasMods = 0,
                  bit VOP3Only = 0> :
    VOPAnyCommon <outs, ins, asm, pattern> {

  let VOP3 = 1;
  let isCodeGenOnly = 0;

  int Size = 8;

  // Complex patterns give VOP3 patterns a very high complexity rating, yet
  // standalone patterns are almost always preferred, so the priority has to
  // be lowered. A large negative value is used to bring the complexity down
  // to zero (or below zero).
  let AddedComplexity = -1000;

  // Assembler configuration.
  let AsmVariantName = AMDGPUAsmVariants.VOP3;
  let AsmMatchConverter = !if(!eq(HasMods,1), "cvtVOP3", "");

  // SGPRs may be allowed when there are multiple operands, so a post-isel
  // hook is needed to insert copies and avoid violating constant bus
  // requirements.
  let hasPostISelHook = 1;
}
82
// Pseudo instruction for the 64-bit ("_e64") VOP3 form.
//
// The input operand list and the asm operand string are chosen from the
// profile in the same way:
//   isVop3OpSel set               -> P.InsVOP3OpSel / P.AsmVOP3OpSel
//   isVOP3P set and P.IsPacked    -> P.InsVOP3P     / P.AsmVOP3P
//   otherwise                     -> P.Ins64        / P.Asm64
//
// VOP3Only is accepted but not referenced in this class body.
class VOP3_Pseudo <string opName, VOPProfile P, list<dag> pattern = [],
                   bit VOP3Only = 0, bit isVOP3P = 0, bit isVop3OpSel = 0> :
    VOP_Pseudo <opName, "_e64", P, P.Outs64,
                !if(isVop3OpSel,
                    P.InsVOP3OpSel,
                    !if(!and(isVOP3P, P.IsPacked), P.InsVOP3P, P.Ins64)),
                "", pattern> {

  // Encoding-kind flags.
  let VOP3 = 1;
  let VALU = 1;
  let VOP3_OPSEL = isVop3OpSel;
  let IsPacked = P.IsPacked;

  let AsmOperands = !if(isVop3OpSel,
                        P.AsmVOP3OpSel,
                        !if(!and(isVOP3P, P.IsPacked), P.AsmVOP3P, P.Asm64));

  let Size = 8;
  let mayLoad = 0;
  let mayStore = 0;
  let hasSideEffects = 0;
  let SubtargetPredicate = isGCN;

  // SGPRs may be allowed when there are multiple operands, so a post-isel
  // hook is needed to insert copies and avoid violating constant bus
  // requirements.
  let hasPostISelHook = 1;

  // Complex patterns give VOP3 patterns a very high complexity rating, yet
  // standalone patterns are almost always preferred, so the priority has to
  // be lowered. A large negative value is used to bring the complexity down
  // to zero (or below zero).
  let AddedComplexity = -1000;

  // Clamp capabilities are taken from the profile.
  let FPClamp = P.HasFPClamp;
  let IntClamp = P.HasIntClamp;
  let ClampLo = P.HasClampLo;
  let ClampHi = P.HasClampHi;

  let Uses = [EXEC];

  // Assembler: isVOP3P selects "cvtVOP3P"; otherwise "cvtVOP3" is used when
  // the profile has modifiers, omod or an integer clamp, and no converter is
  // set when it has none of them.
  let AsmVariantName = AMDGPUAsmVariants.VOP3;
  let AsmMatchConverter =
    !if(isVOP3P,
        "cvtVOP3P",
        !if(!or(P.HasModifiers, !or(P.HasOMod, P.HasIntClamp)),
            "cvtVOP3",
            ""));
}
132
// VOP3P pseudo: a VOP3_Pseudo instantiated with VOP3Only = 1 and isVOP3P = 1
// (isVop3OpSel keeps its default of 0), additionally flagged with VOP3P.
class VOP3P_Pseudo <string opName, VOPProfile P, list<dag> pattern = []> :
    VOP3_Pseudo<opName, P, pattern, 1, 1> {
  let VOP3P = 1;
}
137
// Real (encodable) VOP3 instruction derived from the pseudo `ps`.
//
//   ps             - pseudo instruction supplying operand lists, mnemonic,
//                    asm operand string and the flags copied below.
//   EncodingFamily - encoding family passed to SIMCInstr together with
//                    ps.PseudoInstr.
//
// The asm string is ps.Mnemonic followed by ps.AsmOperands; no selection
// pattern is attached.
class VOP3_Real <VOP_Pseudo ps, int EncodingFamily> :
    InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []>,
    SIMCInstr <ps.PseudoInstr, EncodingFamily> {

  let isPseudo = 0;
  let isCodeGenOnly = 0;

  // Copy relevant pseudo op flags. Each field is assigned exactly once:
  // the earlier duplicate assignments of Constraints and DisableEncoding,
  // and the `UseNamedOperandTable = 1` that was overridden by the copy from
  // `ps`, have been dropped.
  let SubtargetPredicate = ps.SubtargetPredicate;
  let AsmMatchConverter = ps.AsmMatchConverter;
  let AsmVariantName = ps.AsmVariantName;
  let Constraints = ps.Constraints;
  let DisableEncoding = ps.DisableEncoding;
  let TSFlags = ps.TSFlags;
  let UseNamedOperandTable = ps.UseNamedOperandTable;
  let Uses = ps.Uses;
  let Defs = ps.Defs;

  VOPProfile Pfl = ps.Pfl;
}
162
// Real VOP3P instruction; adds nothing on top of VOP3_Real.
// XXX - Is there any reason to distinguish this from regular VOP3
// here?
class VOP3P_Real<VOP_Pseudo ps, int EncodingFamily> :
    VOP3_Real<ps, EncodingFamily>;
167
// Shared part of the 64-bit VOP3a encoding.
// Each field is emitted only when the profile `P` reports the matching
// operand or modifier; otherwise the bits are set to 0. The opcode, clamp and
// destination bits are assigned by derived classes.
class VOP3a<VOPProfile P> : Enc64 {
  bits<4> src0_modifiers;
  bits<9> src0;
  bits<3> src1_modifiers;
  bits<9> src1;
  bits<3> src2_modifiers;
  bits<9> src2;
  bits<1> clamp;
  bits<2> omod;

  // Bit 1 of each srcN_modifiers field.
  let Inst{8}     = !if(P.HasSrc0Mods, src0_modifiers{1}, 0);
  let Inst{9}     = !if(P.HasSrc1Mods, src1_modifiers{1}, 0);
  let Inst{10}    = !if(P.HasSrc2Mods, src2_modifiers{1}, 0);

  let Inst{31-26} = 0x34; // encoding

  // Source operands and output modifier.
  let Inst{40-32} = !if(P.HasSrc0, src0, 0);
  let Inst{49-41} = !if(P.HasSrc1, src1, 0);
  let Inst{58-50} = !if(P.HasSrc2, src2, 0);
  let Inst{60-59} = !if(P.HasOMod, omod, 0);

  // Bit 0 of each srcN_modifiers field.
  let Inst{61}    = !if(P.HasSrc0Mods, src0_modifiers{0}, 0);
  let Inst{62}    = !if(P.HasSrc1Mods, src1_modifiers{0}, 0);
  let Inst{63}    = !if(P.HasSrc2Mods, src2_modifiers{0}, 0);
}
191
// VOP3a "_si" variant: 9-bit opcode in bits 25-17, clamp in bit 11.
class VOP3a_si <bits<9> op, VOPProfile P> : VOP3a<P> {
  let Inst{11}    = !if(P.HasClamp, clamp{0}, 0);
  let Inst{25-17} = op;
}
196
// VOP3a "_vi" variant: 10-bit opcode in bits 25-16, clamp in bit 15.
class VOP3a_vi <bits<10> op, VOPProfile P> : VOP3a<P> {
  let Inst{15}    = !if(P.HasClamp, clamp{0}, 0);
  let Inst{25-16} = op;
}
201
// VOP3a_si plus the 8-bit vector destination in bits 7-0, emitted only when
// the profile sets EmitDst (0 otherwise).
class VOP3e_si <bits<9> op, VOPProfile P> : VOP3a_si <op, P> {
  bits<8> vdst;

  let Inst{7-0} = !if(P.EmitDst, vdst{7-0}, 0);
}
206
// VOP3a_vi plus the 8-bit vector destination in bits 7-0, emitted only when
// the profile sets EmitDst (0 otherwise).
class VOP3e_vi <bits<10> op, VOPProfile P> : VOP3a_vi <op, P> {
  bits<8> vdst;

  let Inst{7-0} = !if(P.EmitDst, vdst{7-0}, 0);
}
211
// VOP3e_vi extended with four extra bits in Inst{14-11}.
// Bit 2 of each srcN_modifiers field goes to bits 11-13 when that source
// exists; bit 3 of src0_modifiers goes to bit 14 when the profile has a
// destination.
// NOTE(review): going by the class name these are the op_sel bits - confirm.
class VOP3OpSel_gfx9 <bits<10> op, VOPProfile P> : VOP3e_vi <op, P> {
  let Inst{11} = !if(P.HasSrc0, src0_modifiers{2}, 0);
  let Inst{12} = !if(P.HasSrc1, src1_modifiers{2}, 0);
  let Inst{13} = !if(P.HasSrc2, src2_modifiers{2}, 0);
  let Inst{14} = !if(P.HasDst,  src0_modifiers{3}, 0);
}
218
// Encoding for the V_INTERP* opcodes on top of VOP3e_vi.
// NB: For V_INTERP* opcodes, src0 is encoded as src1 and vice versa, so the
// src0 value and its modifiers are written to the src1 bit positions below.
class VOP3Interp_vi <bits<10> op, VOPProfile P> : VOP3e_vi <op, P> {
  bits<2> attrchan;
  bits<6> attr;
  bits<1> high;

  // No modifiers for src0: its modifier bit positions are cleared.
  let Inst{8}     = 0;
  let Inst{61}    = 0;

  // src0_modifiers occupy the src1 modifier bit positions.
  let Inst{9}     = !if(P.HasSrc0Mods, src0_modifiers{1}, 0);
  let Inst{62}    = !if(P.HasSrc0Mods, src0_modifiers{0}, 0);

  // The src0 operand bits (40-32) carry attr, attrchan and high instead.
  let Inst{37-32} = attr;
  let Inst{39-38} = attrchan;
  let Inst{40}    = !if(P.HasHigh, high, 0);

  // src0 is placed in the src1 operand bits.
  let Inst{49-41} = src0;
}
237
// Shared part of the 64-bit VOP3b encoding: like VOP3a it carries three
// sources, omod and one modifier bit per source, but it always encodes a
// vector destination (bits 7-0) and a 7-bit scalar destination (bits 14-8).
// The opcode bits are assigned by derived classes.
class VOP3be <VOPProfile P> : Enc64 {
  bits<8> vdst;
  bits<2> src0_modifiers;
  bits<9> src0;
  bits<2> src1_modifiers;
  bits<9> src1;
  bits<2> src2_modifiers;
  bits<9> src2;
  bits<7> sdst;
  bits<2> omod;

  // Destinations are emitted unconditionally.
  let Inst{7-0}   = vdst;
  let Inst{14-8}  = sdst;

  let Inst{31-26} = 0x34; // encoding

  // Sources and output modifier, zeroed when absent from the profile.
  let Inst{40-32} = !if(P.HasSrc0, src0, 0);
  let Inst{49-41} = !if(P.HasSrc1, src1, 0);
  let Inst{58-50} = !if(P.HasSrc2, src2, 0);
  let Inst{60-59} = !if(P.HasOMod, omod, 0);

  // Only bit 0 of each srcN_modifiers field is encoded here.
  let Inst{61}    = !if(P.HasSrc0Mods, src0_modifiers{0}, 0);
  let Inst{62}    = !if(P.HasSrc1Mods, src1_modifiers{0}, 0);
  let Inst{63}    = !if(P.HasSrc2Mods, src2_modifiers{0}, 0);
}
260
// 64-bit VOP3P encoding with a 10-bit opcode in bits 25-16.
// Each 4-bit srcN_modifiers field packs, from bit 0 upwards:
// neg (lo), neg_hi, op_sel and op_sel_hi for that source.
class VOP3Pe <bits<10> op, VOPProfile P> : Enc64 {
  bits<8> vdst;
  // neg, neg_hi, op_sel put in srcN_modifiers
  bits<4> src0_modifiers;
  bits<9> src0;
  bits<4> src1_modifiers;
  bits<9> src1;
  bits<4> src2_modifiers;
  bits<9> src2;
  bits<1> clamp;

  let Inst{7-0}   = vdst;

  // neg_hi, one bit per source.
  let Inst{8}     = !if(P.HasSrc0Mods, src0_modifiers{1}, 0); // neg_hi src0
  let Inst{9}     = !if(P.HasSrc1Mods, src1_modifiers{1}, 0); // neg_hi src1
  let Inst{10}    = !if(P.HasSrc2Mods, src2_modifiers{1}, 0); // neg_hi src2

  // op_sel, emitted only when the source exists and the profile has op_sel.
  let Inst{11}    = !if(!and(P.HasSrc0, P.HasOpSel), src0_modifiers{2}, 0); // op_sel(0)
  let Inst{12}    = !if(!and(P.HasSrc1, P.HasOpSel), src1_modifiers{2}, 0); // op_sel(1)
  let Inst{13}    = !if(!and(P.HasSrc2, P.HasOpSel), src2_modifiers{2}, 0); // op_sel(2)

  // op_sel_hi for src2 sits in the low word; src0/src1 use bits 59/60.
  let Inst{14}    = !if(!and(P.HasSrc2, P.HasOpSel), src2_modifiers{3}, 0); // op_sel_hi(2)

  let Inst{15}    = !if(P.HasClamp, clamp{0}, 0);

  let Inst{25-16} = op;
  let Inst{31-26} = 0x34; // encoding

  let Inst{40-32} = !if(P.HasSrc0, src0, 0);
  let Inst{49-41} = !if(P.HasSrc1, src1, 0);
  let Inst{58-50} = !if(P.HasSrc2, src2, 0);

  let Inst{59}    = !if(!and(P.HasSrc0, P.HasOpSel), src0_modifiers{3}, 0); // op_sel_hi(0)
  let Inst{60}    = !if(!and(P.HasSrc1, P.HasOpSel), src1_modifiers{3}, 0); // op_sel_hi(1)

  let Inst{61}    = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); // neg (lo)
  let Inst{62}    = !if(P.HasSrc1Mods, src1_modifiers{0}, 0); // neg (lo)
  let Inst{63}    = !if(P.HasSrc2Mods, src2_modifiers{0}, 0); // neg (lo)
}
296
// VOP3be "_si" variant: 9-bit opcode in bits 25-17.
class VOP3be_si <bits<9> op, VOPProfile P> : VOP3be<P> {
  let Inst{25-17} = op;
}
300
// VOP3be "_vi" variant: 10-bit opcode in bits 25-16 and a clamp bit in
// bit 15, emitted only when the profile has a clamp.
class VOP3be_vi <bits<10> op, VOPProfile P> : VOP3be<P> {
  bits<1> clamp;

  let Inst{15}    = !if(P.HasClamp, clamp{0}, 0);
  let Inst{25-16} = op;
}
306
// Named integer constants for SDWA operand fields.
def SDWA {
  // sdwa_sel values
  int BYTE_0 = 0;
  int BYTE_1 = 1;
  int BYTE_2 = 2;
  int BYTE_3 = 3;
  int WORD_0 = 4;
  int WORD_1 = 5;
  int DWORD = 6;

  // dst_unused values
  int UNUSED_PAD = 0;
  int UNUSED_SEXT = 1;
  int UNUSED_PRESERVE = 2;
}
322
// Upper 32 bits of the SDWA encoding.
// Every field is gated on the profile `P`; bits for absent operands or
// modifiers are set to 0.
class VOP_SDWAe<VOPProfile P> : Enc64 {
  bits<8> src0;
  bits<3> src0_sel;
  bits<2> src0_modifiers; // float: {abs,neg}, int {sext}
  bits<3> src1_sel;
  bits<2> src1_modifiers;
  bits<3> dst_sel;
  bits<2> dst_unused;
  bits<1> clamp;

  let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0);

  // Destination selection and clamp.
  let Inst{42-40} = !if(P.EmitDst, dst_sel{2-0}, 0);
  let Inst{44-43} = !if(P.EmitDst, dst_unused{1-0}, 0);
  let Inst{45}    = !if(P.HasSDWAClamp, clamp{0}, 0);

  // src0 selection and modifiers. Bit 51 comes from the integer modifier;
  // the float modifiers then assign bits 53-52.
  let Inst{50-48} = !if(P.HasSrc0, src0_sel{2-0}, 0);
  let Inst{51}    = !if(P.HasSrc0IntMods, src0_modifiers{0}, 0);
  let Inst{53-52} = !if(P.HasSrc0FloatMods, src0_modifiers{1-0}, 0);

  // src1 selection and modifiers, laid out like src0.
  let Inst{58-56} = !if(P.HasSrc1, src1_sel{2-0}, 0);
  let Inst{59}    = !if(P.HasSrc1IntMods, src1_modifiers{0}, 0);
  let Inst{61-60} = !if(P.HasSrc1FloatMods, src1_modifiers{1-0}, 0);
}
344
Sam Kolton549c89d2017-06-21 08:53:38 +0000345// GFX9 adds two features to SDWA:
346// 1. Add 3 fields to the SDWA microcode word: S0, S1 and OMOD.
347// a. S0 and S1 indicate that source 0 and 1 respectively are SGPRs rather
348// than VGPRs (at most 1 can be an SGPR);
349// b. OMOD is the standard output modifier (result *2, *4, /2)
350// 2. Add a new version of the SDWA microcode word for VOPC: SDWAB. This
351// replaces OMOD and the dest fields with SD and SDST (SGPR destination)
352// field.
353// a. When SD=1, the SDST is used as the destination for the compare result;
354// b. When SD=0, VCC is used.
355//
356// In GFX9, V_MAC_F16, V_MAC_F32 opcodes cannot be used with SDWA
357
// gfx9 SDWA basic encoding
// Holds the source-operand part shared by the SDWA-A and SDWA-B forms; the
// destination-related bits (47-40) are assigned by the subclasses.
class VOP_SDWA9e<VOPProfile P> : Enc64 {
  bits<9> src0; // {src0_sgpr{0}, src0{7-0}}
  bits<3> src0_sel;
  bits<2> src0_modifiers; // float: {abs,neg}, int {sext}
  bits<3> src1_sel;
  bits<2> src1_modifiers;
  bits<1> src1_sgpr;

  // Low 8 bits of src0; bit 8 (the SGPR flag) goes to Inst{55} below.
  let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0);

  let Inst{50-48} = !if(P.HasSrc0, src0_sel{2-0}, 0);
  let Inst{51}    = !if(P.HasSrc0IntMods, src0_modifiers{0}, 0);
  let Inst{53-52} = !if(P.HasSrc0FloatMods, src0_modifiers{1-0}, 0);
  let Inst{55}    = !if(P.HasSrc0, src0{8}, 0);

  let Inst{58-56} = !if(P.HasSrc1, src1_sel{2-0}, 0);
  let Inst{59}    = !if(P.HasSrc1IntMods, src1_modifiers{0}, 0);
  let Inst{61-60} = !if(P.HasSrc1FloatMods, src1_modifiers{1-0}, 0);

  let Inst{63}    = 0; // src1_sgpr - should be specified in subclass
}
377
// gfx9 SDWA-A
// Adds destination select, dst_unused, clamp and omod in bits 47-40.
class VOP_SDWA9Ae<VOPProfile P> : VOP_SDWA9e<P> {
  bits<3> dst_sel;
  bits<2> dst_unused;
  bits<1> clamp;
  bits<2> omod;

  let Inst{42-40} = !if(P.EmitDst, dst_sel{2-0}, 0);
  let Inst{44-43} = !if(P.EmitDst, dst_unused{1-0}, 0);
  let Inst{45}    = !if(P.HasSDWAClamp, clamp{0}, 0);
  let Inst{47-46} = !if(P.HasSDWAOMod, omod{1-0}, 0);
}
390
// gfx9 SDWA-B
// Uses bits 47-40 for an 8-bit scalar destination field instead; both parts
// are emitted only when the profile sets EmitDst.
class VOP_SDWA9Be<VOPProfile P> : VOP_SDWA9e<P> {
  bits<8> sdst; // {vcc_sdst{0}, sdst{6-0}}

  let Inst{46-40} = !if(P.EmitDst, sdst{6-0}, 0);
  let Inst{47}    = !if(P.EmitDst, sdst{7}, 0);
}
398
// Pseudo instruction for the SDWA form of a VOP instruction.
//
//   opName  - base mnemonic; "_sdwa" is appended for the SIMCInstr key and
//             the MnemonicAlias source name.
//   P       - profile supplying the SDWA operand lists and asm strings.
//   pattern - selection patterns, forwarded to InstSI.
//
// When the profile lacks HasExtSDWA, the predicates become DisableInst and
// the asm variant becomes Disable.
class VOP_SDWA_Pseudo <string opName, VOPProfile P, list<dag> pattern=[]> :
    InstSI <P.OutsSDWA, P.InsSDWA, "", pattern>,
    VOP <opName>,
    SIMCInstr <opName#"_sdwa", SIEncodingFamily.NONE>,
    MnemonicAlias <opName#"_sdwa", opName> {

  // Pseudo: code generation only.
  let isPseudo = 1;
  let isCodeGenOnly = 1;
  let UseNamedOperandTable = 1;

  // Two asm operand strings are kept: AsmOperands and the gfx9 AsmOperands9.
  string Mnemonic = opName;
  string AsmOperands = P.AsmSDWA;
  string AsmOperands9 = P.AsmSDWA9;

  let Size = 8;
  let mayLoad = 0;
  let mayStore = 0;
  let hasSideEffects = 0;

  let VALU = 1;
  let SDWA = 1;
  let Uses = [EXEC];

  let SubtargetPredicate = !if(P.HasExtSDWA, HasSDWA, DisableInst);
  let AssemblerPredicate = !if(P.HasExtSDWA, HasSDWA, DisableInst);
  let AsmVariantName = !if(P.HasExtSDWA, AMDGPUAsmVariants.SDWA,
                                         AMDGPUAsmVariants.Disable);
  let DecoderNamespace = "SDWA";

  VOPProfile Pfl = P;
}
430
// Real (encodable) SDWA instruction derived from the pseudo `ps`, registered
// under SIEncodingFamily.SDWA. The asm string is ps.Mnemonic followed by
// ps.AsmOperands; no selection pattern is attached.
class VOP_SDWA_Real <VOP_SDWA_Pseudo ps> :
    InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []>,
    SIMCInstr <ps.PseudoInstr, SIEncodingFamily.SDWA> {

  let isPseudo = 0;
  let isCodeGenOnly = 0;

  let Defs = ps.Defs;
  let Uses = ps.Uses;
  let SchedRW = ps.SchedRW;
  let hasSideEffects = ps.hasSideEffects;

  // Copy relevant pseudo op flags. Constraints and DisableEncoding are
  // assigned once here; the duplicate assignments were removed.
  let Constraints = ps.Constraints;
  let DisableEncoding = ps.DisableEncoding;
  let SubtargetPredicate = ps.SubtargetPredicate;
  let AssemblerPredicate = ps.AssemblerPredicate;
  let AsmMatchConverter = ps.AsmMatchConverter;
  let AsmVariantName = ps.AsmVariantName;
  let UseNamedOperandTable = ps.UseNamedOperandTable;
  let DecoderNamespace = ps.DecoderNamespace;
  let TSFlags = ps.TSFlags;
}
457
// Real (encodable) gfx9 SDWA instruction derived from the pseudo `ps`,
// registered under SIEncodingFamily.SDWA9. The asm string is ps.Mnemonic
// followed by ps.AsmOperands9.
//
// The predicates, asm variant and decoder namespace are not copied from the
// pseudo. They are recomputed from ps.Pfl.HasExtSDWA9: without it the
// predicates become DisableInst and the asm variant becomes Disable.
class VOP_SDWA9_Real <VOP_SDWA_Pseudo ps> :
    InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands9, []>,
    SIMCInstr <ps.PseudoInstr, SIEncodingFamily.SDWA9> {

  let isPseudo = 0;
  let isCodeGenOnly = 0;

  let Defs = ps.Defs;
  let Uses = ps.Uses;
  let SchedRW = ps.SchedRW;
  let hasSideEffects = ps.hasSideEffects;

  let SubtargetPredicate = !if(ps.Pfl.HasExtSDWA9, HasSDWA9, DisableInst);
  let AssemblerPredicate = !if(ps.Pfl.HasExtSDWA9, HasSDWA9, DisableInst);
  let AsmVariantName = !if(ps.Pfl.HasExtSDWA9, AMDGPUAsmVariants.SDWA9,
                                               AMDGPUAsmVariants.Disable);
  let DecoderNamespace = "SDWA9";

  // Copy relevant pseudo op flags. Constraints and DisableEncoding are
  // assigned once here; the duplicate assignments were removed.
  let Constraints = ps.Constraints;
  let DisableEncoding = ps.DisableEncoding;
  let AsmMatchConverter = ps.AsmMatchConverter;
  let UseNamedOperandTable = ps.UseNamedOperandTable;
  let TSFlags = ps.TSFlags;
}
486
// Upper 32 bits of the DPP encoding.
// dpp_ctrl, bound_ctrl, bank_mask and row_mask are always emitted; src0 and
// the source modifiers are gated on the profile `P`.
class VOP_DPPe<VOPProfile P> : Enc64 {
  bits<2> src0_modifiers;
  bits<8> src0;
  bits<2> src1_modifiers;
  bits<9> dpp_ctrl;
  bits<1> bound_ctrl;
  bits<4> bank_mask;
  bits<4> row_mask;

  let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0);

  // DPP control fields.
  let Inst{48-40} = dpp_ctrl;
  let Inst{51}    = bound_ctrl;

  // Source modifiers: bit 0 is neg, bit 1 is abs.
  let Inst{52}    = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); // src0_neg
  let Inst{53}    = !if(P.HasSrc0Mods, src0_modifiers{1}, 0); // src0_abs
  let Inst{54}    = !if(P.HasSrc1Mods, src1_modifiers{0}, 0); // src1_neg
  let Inst{55}    = !if(P.HasSrc1Mods, src1_modifiers{1}, 0); // src1_abs

  // Masks.
  let Inst{59-56} = bank_mask;
  let Inst{63-60} = row_mask;
}
506
// Pseudo instruction for the DPP form of a VOP instruction.
//
//   OpName  - base mnemonic; "_dpp" is appended for the SIMCInstr key and the
//             MnemonicAlias source name.
//   P       - profile supplying the DPP operand lists and asm string.
//   pattern - selection patterns, forwarded to InstSI.
//
// SubtargetPredicate is always HasDPP. The assembler predicate and asm
// variant fall back to DisableInst / Disable when the profile lacks
// HasExtDPP.
class VOP_DPP_Pseudo <string OpName, VOPProfile P, list<dag> pattern=[]> :
    InstSI <P.OutsDPP, P.InsDPP, OpName#P.AsmDPP, pattern>,
    VOP <OpName>,
    SIMCInstr <OpName#"_dpp", SIEncodingFamily.NONE>,
    MnemonicAlias <OpName#"_dpp", OpName> {

  // Pseudo: code generation only.
  let isPseudo = 1;
  let isCodeGenOnly = 1;

  let mayLoad = 0;
  let mayStore = 0;
  let hasSideEffects = 0;
  let UseNamedOperandTable = 1;

  let VALU = 1;
  let DPP = 1;
  let Size = 8;
  let Uses = [EXEC];
  let isConvergent = 1;

  string Mnemonic = OpName;
  string AsmOperands = P.AsmDPP;

  // "cvtDPP" is used only when the profile has modifiers.
  let AsmMatchConverter = !if(!eq(P.HasModifiers,1), "cvtDPP", "");
  let SubtargetPredicate = HasDPP;
  let AssemblerPredicate = !if(P.HasExtDPP, HasDPP, DisableInst);
  let AsmVariantName = !if(P.HasExtDPP, AMDGPUAsmVariants.DPP,
                                        AMDGPUAsmVariants.Disable);

  // With at least one source argument, $old is tied to $vdst and left out of
  // the encoding.
  let Constraints = !if(P.NumSrcArgs, "$old = $vdst", "");
  let DisableEncoding = !if(P.NumSrcArgs, "$old", "");
  let DecoderNamespace = "DPP";

  VOPProfile Pfl = P;
}
541
// Real (encodable) DPP instruction derived from the pseudo `ps`.
//
//   ps             - pseudo instruction supplying operand lists, mnemonic,
//                    asm operand string and the flags copied below.
//   EncodingFamily - encoding family passed to SIMCInstr together with
//                    ps.PseudoInstr.
class VOP_DPP_Real <VOP_DPP_Pseudo ps, int EncodingFamily> :
    InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []>,
    SIMCInstr <ps.PseudoInstr, EncodingFamily> {

  let isPseudo = 0;
  let isCodeGenOnly = 0;

  let Defs = ps.Defs;
  let Uses = ps.Uses;
  let SchedRW = ps.SchedRW;
  let hasSideEffects = ps.hasSideEffects;

  // Copy relevant pseudo op flags. Constraints and DisableEncoding are
  // assigned once here; the duplicate assignments were removed.
  let Constraints = ps.Constraints;
  let DisableEncoding = ps.DisableEncoding;
  let isConvergent = ps.isConvergent;
  let SubtargetPredicate = ps.SubtargetPredicate;
  let AssemblerPredicate = ps.AssemblerPredicate;
  let AsmMatchConverter = ps.AsmMatchConverter;
  let AsmVariantName = ps.AsmVariantName;
  let UseNamedOperandTable = ps.UseNamedOperandTable;
  let DecoderNamespace = ps.DecoderNamespace;
  let TSFlags = ps.TSFlags;
}
569
// Helper: `ret` is the NumOperands value of the type profile of `Op`, after
// casting `Op` to an SDNode.
class getNumNodeArgs<SDPatternOperator Op> {
  SDNode N = !cast<SDNode>(Op);
  SDTypeProfile TP = N.TypeProfile;
  int ret = TP.NumOperands;
}
575
576
// Helper: `ret` is a PatFrag wrapping `Op` whose predicate code returns
// N->isDivergent(). The fragment takes one, two or three operands according
// to getNumNodeArgs<Op>; any count other than 1 or 2 yields the three-operand
// form.
class getDivergentFrag<SDPatternOperator Op> {

  int NumSrcArgs = getNumNodeArgs<Op>.ret;

  PatFrag ret = PatFrag <
    // Operand list of the fragment.
    !if(!eq(NumSrcArgs, 1),
        (ops node:$src0),
        !if(!eq(NumSrcArgs, 2),
            (ops node:$src0, node:$src1),
            (ops node:$src0, node:$src1, node:$src2))),
    // Fragment body: Op applied to the same operands.
    !if(!eq(NumSrcArgs, 1),
        (Op $src0),
        !if(!eq(NumSrcArgs, 2),
            (Op $src0, $src1),
            (Op $src0, $src1, $src2))),
    [{ return N->isDivergent(); }]
  >;
}
594
// Builds a selection pattern for `Op` from the 32-bit operand lists of the
// profile `P`; the result is the single-element list `ret`.
class VOPPatGen<SDPatternOperator Op, VOPProfile P> {

  // Divergent fragment wrapping Op.
  PatFrag Operator = getDivergentFrag < Op >.ret;

  // P.Ins32 with `ins` replaced by Operator and the source register classes
  // replaced by the source value types.
  dag Ins = !foreach(tmp, P.Ins32, !subst(ins, Operator,
                                   !subst(P.Src0RC32, P.Src0VT,
                                   !subst(P.Src1RC32, P.Src1VT, tmp))));

  // P.Outs32 with `outs` replaced by `set` and the destination register
  // class replaced by the destination value type.
  dag Outs = !foreach(tmp, P.Outs32, !subst(outs, set,
                                     !subst(P.DstRC, P.DstVT, tmp)));

  list<dag> ret = [!con(Outs, (set Ins))];
}
609
// `ret` is the generated pattern list from VOPPatGen unless the profile's
// NeedPatGen equals PatGenMode.NoPattern, in which case it is empty.
class VOPPatOrNull<SDPatternOperator Op, VOPProfile P> {
  list<dag> ret = !if(!ne(P.NeedPatGen,PatGenMode.NoPattern),
                      VOPPatGen<Op, P>.ret,
                      []);
}
613
// `ret` is the divergent fragment for `Op` when the profile's NeedPatGen
// equals PatGenMode.Pattern and `Op` is an SDNode; in every other case it is
// `Op` itself.
class DivergentFragOrOp<SDPatternOperator Op, VOPProfile P> {
  SDPatternOperator ret = !if(!eq(P.NeedPatGen,PatGenMode.Pattern),
                              !if(!isa<SDNode>(Op),
                                  getDivergentFrag<Op>.ret,
                                  Op),
                              Op);
}
618
Valery Pykhtin2828b9b2016-09-19 14:39:49 +0000619include "VOPCInstructions.td"
Valery Pykhtin355103f2016-09-23 09:08:07 +0000620include "VOP1Instructions.td"
621include "VOP2Instructions.td"
Valery Pykhtine330cfa2016-09-20 10:41:16 +0000622include "VOP3Instructions.td"
Matt Arsenault9be7b0d2017-02-27 18:49:11 +0000623include "VOP3PInstructions.td"