blob: acb5b0668966ec35c9211e3ac8f42af45ca8da0d [file] [log] [blame]
//===-- VOPInstructions.td - Vector Instruction Definitions ---------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
// Dummy field declarations for use with an outer `let`: every field below is
// declared without a value.
class LetDummies {
  // Single-bit flags.
  bit isCommutable;
  bit isConvertibleToThreeAddress;
  bit isMoveImm;
  bit isReMaterializable;
  bit isAsCheapAsAMove;
  bit VOPAsmPrefer32Bit;

  // Subtarget predicate.
  Predicate SubtargetPredicate;

  // Operand constraint / encoding strings.
  string Constraints;
  string DisableEncoding;

  // Scheduling information and implicit register lists.
  list<SchedReadWrite> SchedRW;
  list<Register> Uses;
  list<Register> Defs;
}
25
// Mixin that stores the template argument `opName` in the `OpName` field.
class VOP<string opName> {
  string OpName = opName;
}
29
// Shared base for VOP instruction definitions. Forwards the operand lists,
// asm string and selection pattern to InstSI and applies common defaults.
class VOPAnyCommon<dag outs, dag ins, string asm, list<dag> pattern>
    : InstSI<outs, ins, asm, pattern> {

  // Flagged as VALU, with EXEC as an implicit use.
  let VALU = 1;
  let Uses = [EXEC];

  // Memory and side-effect flags are all cleared.
  let hasSideEffects = 0;
  let mayStore = 0;
  let mayLoad = 0;

  let UseNamedOperandTable = 1;
}
40
// Common base for directly-defined VOP3 (64-bit encoding) instructions.
//
//   outs, ins, asm, pattern - forwarded unchanged to VOPAnyCommon.
//   HasMods  - when set (and VOP3Only is not), selects the "cvtVOP3_2_mod"
//              asm-match converter.
//   VOP3Only - when set, selects the "cvtVOP3" asm-match converter.
class VOP3Common <dag outs, dag ins, string asm = "",
                  list<dag> pattern = [], bit HasMods = 0,
                  bit VOP3Only = 0> :
  VOPAnyCommon <outs, ins, asm, pattern> {

  // Using complex patterns gives VOP3 patterns a very high complexity rating,
  // but standalone patterns are almost always preferred, so we need to adjust
  // the priority lower.  The goal is to use a high number to reduce complexity
  // to zero (or less than zero).
  let AddedComplexity = -1000;

  let VOP3 = 1;

  // VOP3Only takes precedence over HasMods; with neither set no converter is
  // installed.
  let AsmMatchConverter =
    !if(!eq(VOP3Only,1),
        "cvtVOP3",
        !if(!eq(HasMods,1), "cvtVOP3_2_mod", ""));

  let AsmVariantName = AMDGPUAsmVariants.VOP3;

  let isCodeGenOnly = 0;

  // Size is an inherited instruction field (the sibling VOP3_Pseudo class sets
  // it with `let` directly on InstSI), so override it with `let` instead of
  // re-declaring it.
  let Size = 8;

  // Because SGPRs may be allowed if there are multiple operands, we
  // need a post-isel hook to insert copies in order to avoid
  // violating constant bus requirements.
  let hasPostISelHook = 1;
}
70
// Pseudo instruction for the VOP3 form of an operation, described by the
// profile `P`.
//
//   opName   - base mnemonic; the MC name and mnemonic alias use opName#"_e64".
//   P        - profile supplying operand lists, asm operand strings and flags.
//   pattern  - selection pattern(s).
//   VOP3Only - influences which asm-match converter is chosen (see below).
//   isVOP3P  - together with P.IsPacked, switches the inputs and asm operands
//              to the VOP3P variants.
class VOP3_Pseudo<string opName, VOPProfile P, list<dag> pattern = [],
                  bit VOP3Only = 0, bit isVOP3P = 0>
    : InstSI<P.Outs64,
             !if(!and(isVOP3P, P.IsPacked), P.InsVOP3P, P.Ins64),
             "",
             pattern>,
      VOP<opName>,
      SIMCInstr<opName#"_e64", SIEncodingFamily.NONE>,
      MnemonicAlias<opName#"_e64", opName> {

  // A pseudo: code generation only, with an empty asm string of its own.
  let isPseudo = 1;
  let isCodeGenOnly = 1;
  let UseNamedOperandTable = 1;

  // Pieces the "real" instruction classes concatenate into their asm string.
  string Mnemonic = opName;
  string AsmOperands = !if(!and(isVOP3P, P.IsPacked), P.AsmVOP3P, P.Asm64);

  let Size = 8;
  let mayLoad = 0;
  let mayStore = 0;
  let hasSideEffects = 0;
  let SubtargetPredicate = isGCN;

  // SGPRs may be allowed when there are multiple operands, so a post-isel
  // hook is needed to insert copies and keep within the constant bus
  // requirements.
  let hasPostISelHook = 1;

  // Complex patterns give VOP3 patterns a very high complexity rating, yet
  // standalone patterns are almost always preferred.  Lower the priority with
  // a large negative adjustment so the complexity ends up at or below zero.
  let AddedComplexity = -1000;

  let VOP3 = 1;
  let VALU = 1;
  let FPClamp = P.HasFPClamp;
  let Uses = [EXEC];

  let AsmVariantName = AMDGPUAsmVariants.VOP3;

  // VOP3Only: "cvtVOP3P" for a packed profile with isVOP3P, else "cvtVOP3".
  // Otherwise: "cvtVOP3_2_mod" if the profile has modifiers, else none.
  let AsmMatchConverter =
    !if(!eq(VOP3Only,1),
        !if(!and(P.IsPacked, isVOP3P), "cvtVOP3P", "cvtVOP3"),
        !if(!eq(P.HasModifiers, 1), "cvtVOP3_2_mod", ""));

  // Keep the profile reachable from the record.
  VOPProfile Pfl = P;
}
115
// VOP3P pseudo: a VOP3_Pseudo instantiated with VOP3Only = 1 and isVOP3P = 1,
// additionally flagged as VOP3P.
class VOP3P_Pseudo<string opName, VOPProfile P, list<dag> pattern = []>
    : VOP3_Pseudo<opName, P, pattern, 1, 1> {
  let VOP3P = 1;
}
120
// Encodable ("real") counterpart of a VOP3_Pseudo for one encoding family.
//
//   ps             - the pseudo whose operand lists, mnemonic, asm operands
//                    and flags are reused.
//   EncodingFamily - encoding family passed on to SIMCInstr.
class VOP3_Real <VOP3_Pseudo ps, int EncodingFamily> :
  InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []>,
  SIMCInstr <ps.PseudoInstr, EncodingFamily> {

  let isPseudo = 0;
  let isCodeGenOnly = 0;
  let UseNamedOperandTable = 1;

  // Copy relevant pseudo op flags.  Constraints and DisableEncoding are each
  // copied exactly once.
  let SubtargetPredicate = ps.SubtargetPredicate;
  let AsmMatchConverter  = ps.AsmMatchConverter;
  let AsmVariantName     = ps.AsmVariantName;
  let Constraints        = ps.Constraints;
  let DisableEncoding    = ps.DisableEncoding;
  let TSFlags            = ps.TSFlags;
}
140
// XXX - Is there any reason to distinguish this from the regular VOP3 real
// class here?  It adds nothing beyond requiring a VOP3P_Pseudo argument.
class VOP3P_Real<VOP3P_Pseudo ps, int EncodingFamily>
    : VOP3_Real<ps, EncodingFamily>;
145
// 64-bit VOP3a encoding fields shared by the SI and VI variants.  Every
// profile-dependent field is encoded as 0 when the profile `P` lacks it.
// `clamp` is declared here but is not placed by this class; the VOP3a_si and
// VOP3a_vi subclasses assign its bit.
class VOP3a<VOPProfile P> : Enc64 {
  bits<2> src0_modifiers;
  bits<9> src0;
  bits<2> src1_modifiers;
  bits<9> src1;
  bits<2> src2_modifiers;
  bits<9> src2;
  bits<1> clamp;
  bits<2> omod;

  // Fixed encoding field.
  let Inst{31-26} = 0x34;

  // Bit 1 of each source-modifier operand.
  let Inst{8}  = !if(P.HasSrc0Mods, src0_modifiers{1}, 0);
  let Inst{9}  = !if(P.HasSrc1Mods, src1_modifiers{1}, 0);
  let Inst{10} = !if(P.HasSrc2Mods, src2_modifiers{1}, 0);

  // Source operands.
  let Inst{40-32} = !if(P.HasSrc0, src0, 0);
  let Inst{49-41} = !if(P.HasSrc1, src1, 0);
  let Inst{58-50} = !if(P.HasSrc2, src2, 0);

  // Output modifier.
  let Inst{60-59} = !if(P.HasOMod, omod, 0);

  // Bit 0 of each source-modifier operand.
  let Inst{61} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0);
  let Inst{62} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0);
  let Inst{63} = !if(P.HasSrc2Mods, src2_modifiers{0}, 0);
}
169
// VOP3a with the SI layout: 9-bit opcode in bits 25-17, clamp in bit 11.
class VOP3a_si<bits<9> op, VOPProfile P> : VOP3a<P> {
  let Inst{11}    = !if(P.HasClamp, clamp{0}, 0);
  let Inst{25-17} = op;
}
174
// VOP3a with the VI layout: 10-bit opcode in bits 25-16, clamp in bit 15.
class VOP3a_vi<bits<10> op, VOPProfile P> : VOP3a<P> {
  let Inst{15}    = !if(P.HasClamp, clamp{0}, 0);
  let Inst{25-16} = op;
}
179
// VOP3a_si plus an 8-bit vector destination in bits 7-0; the destination is
// encoded as 0 when the profile does not emit one.
class VOP3e_si<bits<9> op, VOPProfile P> : VOP3a_si<op, P> {
  bits<8> vdst;

  let Inst{7-0} = !if(P.EmitDst, vdst{7-0}, 0);
}
184
// VOP3a_vi plus an 8-bit vector destination in bits 7-0; the destination is
// encoded as 0 when the profile does not emit one.
class VOP3e_vi<bits<10> op, VOPProfile P> : VOP3a_vi<op, P> {
  bits<8> vdst;

  let Inst{7-0} = !if(P.EmitDst, vdst{7-0}, 0);
}
189
// 64-bit VOP3b encoding fields shared by the SI and VI variants.  Bits 14-8
// hold a 7-bit scalar destination (sdst).  Only bit 0 of each source-modifier
// operand is encoded here.  The opcode is assigned by the subclasses.
class VOP3be<VOPProfile P> : Enc64 {
  bits<8> vdst;
  bits<2> src0_modifiers;
  bits<9> src0;
  bits<2> src1_modifiers;
  bits<9> src1;
  bits<2> src2_modifiers;
  bits<9> src2;
  bits<7> sdst;
  bits<2> omod;

  // Destinations are always encoded.
  let Inst{7-0}  = vdst;
  let Inst{14-8} = sdst;

  // Fixed encoding field.
  let Inst{31-26} = 0x34;

  // Source operands and output modifier; 0 when absent from the profile.
  let Inst{40-32} = !if(P.HasSrc0, src0, 0);
  let Inst{49-41} = !if(P.HasSrc1, src1, 0);
  let Inst{58-50} = !if(P.HasSrc2, src2, 0);
  let Inst{60-59} = !if(P.HasOMod, omod, 0);

  // Bit 0 of each source-modifier operand.
  let Inst{61} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0);
  let Inst{62} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0);
  let Inst{63} = !if(P.HasSrc2Mods, src2_modifiers{0}, 0);
}
212
// 64-bit VOP3P encoding with a 10-bit opcode.
//
// neg, neg_hi, op_sel and op_sel_hi are all carried in the 4-bit
// srcN_modifiers operands and scattered into the instruction word as follows:
//   srcN_modifiers{0} -> neg (lo)
//   srcN_modifiers{1} -> neg_hi
//   srcN_modifiers{2} -> op_sel
//   srcN_modifiers{3} -> op_sel_hi
class VOP3Pe<bits<10> op, VOPProfile P> : Enc64 {
  bits<8> vdst;
  bits<4> src0_modifiers;
  bits<9> src0;
  bits<4> src1_modifiers;
  bits<9> src1;
  bits<4> src2_modifiers;
  bits<9> src2;
  bits<1> clamp;

  // Opcode and fixed encoding field.
  let Inst{25-16} = op;
  let Inst{31-26} = 0x34;

  // Destination (always encoded) and sources (0 when absent from the profile).
  let Inst{7-0}   = vdst;
  let Inst{40-32} = !if(P.HasSrc0, src0, 0);
  let Inst{49-41} = !if(P.HasSrc1, src1, 0);
  let Inst{58-50} = !if(P.HasSrc2, src2, 0);

  // neg_hi for src0..src2.
  let Inst{8}  = !if(P.HasSrc0Mods, src0_modifiers{1}, 0);
  let Inst{9}  = !if(P.HasSrc1Mods, src1_modifiers{1}, 0);
  let Inst{10} = !if(P.HasSrc2Mods, src2_modifiers{1}, 0);

  // op_sel(0..2).
  let Inst{11} = !if(P.HasOpSel, src0_modifiers{2}, 0);
  let Inst{12} = !if(P.HasOpSel, src1_modifiers{2}, 0);
  let Inst{13} = !if(P.HasOpSel, src2_modifiers{2}, 0);

  // op_sel_hi: operand 2 sits in bit 14, operands 0 and 1 in bits 59 and 60.
  let Inst{14} = !if(P.HasOpSel, src2_modifiers{3}, 0);
  let Inst{59} = !if(P.HasOpSel, src0_modifiers{3}, 0);
  let Inst{60} = !if(P.HasOpSel, src1_modifiers{3}, 0);

  let Inst{15} = !if(P.HasClamp, clamp{0}, 0);

  // neg (lo) for src0..src2.
  let Inst{61} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0);
  let Inst{62} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0);
  let Inst{63} = !if(P.HasSrc2Mods, src2_modifiers{0}, 0);
}
248
// VOP3be with the SI layout: 9-bit opcode in bits 25-17.
class VOP3be_si<bits<9> op, VOPProfile P> : VOP3be<P> {
  let Inst{25-17} = op;
}
252
// VOP3be with the VI layout: 10-bit opcode in bits 25-16, plus a clamp bit in
// bit 15 (encoded as 0 when the profile has no clamp).
class VOP3be_vi<bits<10> op, VOPProfile P> : VOP3be<P> {
  bits<1> clamp;

  let Inst{15}    = !if(P.HasClamp, clamp{0}, 0);
  let Inst{25-16} = op;
}
258
// Named integer constants for SDWA operand fields.
def SDWA {
  // sdwa_sel values.
  int BYTE_0 = 0;
  int BYTE_1 = 1;
  int BYTE_2 = 2;
  int BYTE_3 = 3;
  int WORD_0 = 4;
  int WORD_1 = 5;
  int DWORD  = 6;

  // dst_unused values.
  int UNUSED_PAD      = 0;
  int UNUSED_SEXT     = 1;
  int UNUSED_PRESERVE = 2;
}
274
// Upper 32 bits (Inst{63-32}) of the SDWA encoding.  Fields the profile `P`
// lacks fall back to fixed defaults: selectors to SDWA.DWORD, dst_unused to
// SDWA.UNUSED_PRESERVE, everything else to 0.
class VOP_SDWAe<VOPProfile P> : Enc64 {
  bits<8> src0;
  bits<3> src0_sel;
  bits<2> src0_modifiers; // float: {abs,neg}, int {sext}
  bits<3> src1_sel;
  bits<2> src1_modifiers; // same operand layout as src0_modifiers
  bits<3> dst_sel;
  bits<2> dst_unused;
  bits<1> clamp;

  // src0 register.
  let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0);

  // Destination selector, unused-bits policy and clamp.
  let Inst{42-40} = !if(P.EmitDst, dst_sel{2-0}, SDWA.DWORD);
  let Inst{44-43} = !if(P.EmitDst, dst_unused{1-0}, SDWA.UNUSED_PRESERVE);
  let Inst{45}    = !if(P.HasSDWAClamp, clamp{0}, 0);

  // src0: selector, integer modifier bit, float modifier bits.
  let Inst{50-48} = !if(P.HasSrc0, src0_sel{2-0}, SDWA.DWORD);
  let Inst{51}    = !if(P.HasSrc0IntMods, src0_modifiers{0}, 0);
  let Inst{53-52} = !if(P.HasSrc0FloatMods, src0_modifiers{1-0}, 0);

  // src1: selector, integer modifier bit, float modifier bits.
  let Inst{58-56} = !if(P.HasSrc1, src1_sel{2-0}, SDWA.DWORD);
  let Inst{59}    = !if(P.HasSrc1IntMods, src1_modifiers{0}, 0);
  let Inst{61-60} = !if(P.HasSrc1FloatMods, src1_modifiers{1-0}, 0);
}
296
// Pseudo instruction for the SDWA form of an operation, described by the
// profile `P`.
//
//   opName  - base mnemonic; the MC name and mnemonic alias use
//             opName#"_sdwa".
//   P       - profile supplying the SDWA operand lists and asm operands.
//   pattern - selection pattern(s).
class VOP_SDWA_Pseudo<string opName, VOPProfile P, list<dag> pattern = []>
    : InstSI<P.OutsSDWA, P.InsSDWA, "", pattern>,
      VOP<opName>,
      SIMCInstr<opName#"_sdwa", SIEncodingFamily.NONE>,
      MnemonicAlias<opName#"_sdwa", opName> {

  // A pseudo: code generation only, with an empty asm string of its own.
  let isPseudo = 1;
  let isCodeGenOnly = 1;
  let UseNamedOperandTable = 1;

  // Pieces VOP_SDWA_Real concatenates into its asm string.
  string Mnemonic = opName;
  string AsmOperands = P.AsmSDWA;

  let Size = 8;
  let mayLoad = 0;
  let mayStore = 0;
  let hasSideEffects = 0;

  let VALU = 1;
  let SDWA = 1;
  let Uses = [EXEC];

  let SubtargetPredicate = HasSDWA;

  // Profiles without HasExt get the DisableInst assembler predicate and the
  // Disable asm variant.
  let AssemblerPredicate = !if(P.HasExt, HasSDWA, DisableInst);
  let AsmVariantName = !if(P.HasExt, AMDGPUAsmVariants.SDWA,
                                     AMDGPUAsmVariants.Disable);
  let DecoderNamespace = "SDWA";

  // Keep the profile reachable from the record.
  VOPProfile Pfl = P;
}
327
// Encodable ("real") counterpart of a VOP_SDWA_Pseudo, registered under the
// VI encoding family.  Operand lists, the asm string and flags are taken from
// the pseudo `ps`.
class VOP_SDWA_Real <VOP_SDWA_Pseudo ps> :
  InstSI <ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []>,
  SIMCInstr <ps.PseudoInstr, SIEncodingFamily.VI> {

  let isPseudo = 0;
  let isCodeGenOnly = 0;

  // Implicit operands, scheduling info and side-effect flag.
  let Defs = ps.Defs;
  let Uses = ps.Uses;
  let SchedRW = ps.SchedRW;
  let hasSideEffects = ps.hasSideEffects;

  // Copy relevant pseudo op flags.  Constraints and DisableEncoding are each
  // copied exactly once.
  let SubtargetPredicate   = ps.SubtargetPredicate;
  let AssemblerPredicate   = ps.AssemblerPredicate;
  let AsmMatchConverter    = ps.AsmMatchConverter;
  let AsmVariantName       = ps.AsmVariantName;
  let UseNamedOperandTable = ps.UseNamedOperandTable;
  let DecoderNamespace     = ps.DecoderNamespace;
  let Constraints          = ps.Constraints;
  let DisableEncoding      = ps.DisableEncoding;
  let TSFlags              = ps.TSFlags;
}
354
// Upper 32 bits (Inst{63-32}) of the DPP encoding.  The src0 register and the
// source modifiers are encoded as 0 when the profile `P` lacks them; the DPP
// control fields are always encoded.
class VOP_DPPe<VOPProfile P> : Enc64 {
  bits<2> src0_modifiers;
  bits<8> src0;
  bits<2> src1_modifiers;
  bits<9> dpp_ctrl;
  bits<1> bound_ctrl;
  bits<4> bank_mask;
  bits<4> row_mask;

  // src0 register.
  let Inst{39-32} = !if(P.HasSrc0, src0{7-0}, 0);

  // DPP control fields.
  let Inst{48-40} = dpp_ctrl;
  let Inst{51}    = bound_ctrl;
  let Inst{59-56} = bank_mask;
  let Inst{63-60} = row_mask;

  // Source modifiers: bit 0 is neg, bit 1 is abs.
  let Inst{52} = !if(P.HasSrc0Mods, src0_modifiers{0}, 0); // src0_neg
  let Inst{53} = !if(P.HasSrc0Mods, src0_modifiers{1}, 0); // src0_abs
  let Inst{54} = !if(P.HasSrc1Mods, src1_modifiers{0}, 0); // src1_neg
  let Inst{55} = !if(P.HasSrc1Mods, src1_modifiers{1}, 0); // src1_abs
}
374
// DPP form of an operation: operand lists and asm operands come from the
// profile `P`, and the encoding fields from VOP_DPPe.
//
//   OpName - mnemonic, prepended to P.AsmDPP to form the asm string.
//   P      - profile supplying the DPP operand lists and flags.
class VOP_DPP<string OpName, VOPProfile P>
    : InstSI<P.OutsDPP, P.InsDPP, OpName#P.AsmDPP, []>,
      VOP_DPPe<P> {

  let VALU = 1;
  let DPP = 1;
  let Size = 8;

  let mayLoad = 0;
  let mayStore = 0;
  let hasSideEffects = 0;
  let UseNamedOperandTable = 1;

  // The "cvtDPP" converter is installed only for profiles with modifiers.
  let AsmMatchConverter = !if(!eq(P.HasModifiers,1), "cvtDPP", "");

  let SubtargetPredicate = HasDPP;

  // Profiles without HasExt get the DisableInst assembler predicate and the
  // Disable asm variant.
  let AssemblerPredicate = !if(P.HasExt, HasDPP, DisableInst);
  let AsmVariantName = !if(P.HasExt, AMDGPUAsmVariants.DPP,
                                     AMDGPUAsmVariants.Disable);
  let DecoderNamespace = "DPP";
}
395
396include "VOPCInstructions.td"
Valery Pykhtin355103f2016-09-23 09:08:07 +0000397include "VOP1Instructions.td"
398include "VOP2Instructions.td"
Valery Pykhtine330cfa2016-09-20 10:41:16 +0000399include "VOP3Instructions.td"
Matt Arsenault9be7b0d2017-02-27 18:49:11 +0000400include "VOP3PInstructions.td"