blob: 6bb5abd3b20802b0bcb486e405f4c9afafc44d9c [file] [log] [blame]
Valery Pykhtin1b138862016-09-01 09:56:47 +00001//===---- SMInstructions.td - Scalar Memory Instruction Defintions --------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
Artem Tamazov54bfd542016-10-31 16:07:39 +000010def smrd_offset_8 : NamedOperandU32<"SMRDOffset8",
11 NamedMatchClass<"SMRDOffset8">> {
Valery Pykhtin1b138862016-09-01 09:56:47 +000012 let OperandType = "OPERAND_IMMEDIATE";
13}
14
Artem Tamazov54bfd542016-10-31 16:07:39 +000015def smrd_offset_20 : NamedOperandU32<"SMRDOffset20",
16 NamedMatchClass<"SMRDOffset20">> {
17 let OperandType = "OPERAND_IMMEDIATE";
18}
Valery Pykhtin1b138862016-09-01 09:56:47 +000019
20//===----------------------------------------------------------------------===//
21// Scalar Memory classes
22//===----------------------------------------------------------------------===//
23
24class SM_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]> :
25 InstSI <outs, ins, "", pattern>,
26 SIMCInstr<opName, SIEncodingFamily.NONE> {
27 let isPseudo = 1;
28 let isCodeGenOnly = 1;
29
30 let LGKM_CNT = 1;
31 let SMRD = 1;
32 let mayStore = 0;
33 let mayLoad = 1;
34 let hasSideEffects = 0;
35 let UseNamedOperandTable = 1;
36 let SchedRW = [WriteSMEM];
37 let SubtargetPredicate = isGCN;
38
39 string Mnemonic = opName;
40 string AsmOperands = asmOps;
41
42 bits<1> has_sbase = 1;
43 bits<1> has_sdst = 1;
Matt Arsenault7b647552016-10-28 21:55:15 +000044 bit has_glc = 0;
Valery Pykhtin1b138862016-09-01 09:56:47 +000045 bits<1> has_offset = 1;
46 bits<1> offset_is_imm = 0;
47}
48
49class SM_Real <SM_Pseudo ps>
50 : InstSI<ps.OutOperandList, ps.InOperandList, ps.Mnemonic # ps.AsmOperands, []> {
51
52 let isPseudo = 0;
53 let isCodeGenOnly = 0;
54
55 // copy relevant pseudo op flags
56 let SubtargetPredicate = ps.SubtargetPredicate;
57 let AsmMatchConverter = ps.AsmMatchConverter;
58
59 // encoding
60 bits<7> sbase;
61 bits<7> sdst;
62 bits<32> offset;
Matt Arsenault7b647552016-10-28 21:55:15 +000063 bits<1> imm = !if(ps.has_offset, ps.offset_is_imm, 0);
Valery Pykhtin1b138862016-09-01 09:56:47 +000064}
65
66class SM_Load_Pseudo <string opName, dag outs, dag ins, string asmOps, list<dag> pattern=[]>
67 : SM_Pseudo<opName, outs, ins, asmOps, pattern> {
68 RegisterClass BaseClass;
Matt Arsenault7b647552016-10-28 21:55:15 +000069 let mayLoad = 1;
70 let mayStore = 0;
71 let has_glc = 1;
72}
73
74class SM_Store_Pseudo <string opName, dag ins, string asmOps, list<dag> pattern = []>
75 : SM_Pseudo<opName, (outs), ins, asmOps, pattern> {
76 RegisterClass BaseClass;
77 RegisterClass SrcClass;
78 let mayLoad = 0;
79 let mayStore = 1;
80 let has_glc = 1;
81 let ScalarStore = 1;
Valery Pykhtin1b138862016-09-01 09:56:47 +000082}
83
84multiclass SM_Pseudo_Loads<string opName,
85 RegisterClass baseClass,
86 RegisterClass dstClass> {
87 def _IMM : SM_Load_Pseudo <opName,
88 (outs dstClass:$sdst),
Matt Arsenault7b647552016-10-28 21:55:15 +000089 (ins baseClass:$sbase, i32imm:$offset, i1imm:$glc),
90 " $sdst, $sbase, $offset$glc", []> {
Valery Pykhtin1b138862016-09-01 09:56:47 +000091 let offset_is_imm = 1;
92 let BaseClass = baseClass;
93 let PseudoInstr = opName # "_IMM";
Matt Arsenault7b647552016-10-28 21:55:15 +000094 let has_glc = 1;
Valery Pykhtin1b138862016-09-01 09:56:47 +000095 }
Matt Arsenault7b647552016-10-28 21:55:15 +000096
Valery Pykhtin1b138862016-09-01 09:56:47 +000097 def _SGPR : SM_Load_Pseudo <opName,
98 (outs dstClass:$sdst),
Matt Arsenault7b647552016-10-28 21:55:15 +000099 (ins baseClass:$sbase, SReg_32:$soff, i1imm:$glc),
100 " $sdst, $sbase, $offset$glc", []> {
Valery Pykhtin1b138862016-09-01 09:56:47 +0000101 let BaseClass = baseClass;
102 let PseudoInstr = opName # "_SGPR";
Matt Arsenault7b647552016-10-28 21:55:15 +0000103 let has_glc = 1;
104 }
105}
106
107multiclass SM_Pseudo_Stores<string opName,
108 RegisterClass baseClass,
109 RegisterClass srcClass> {
110 def _IMM : SM_Store_Pseudo <opName,
111 (ins srcClass:$sdata, baseClass:$sbase, i32imm:$offset, i1imm:$glc),
112 " $sdata, $sbase, $offset$glc", []> {
113 let offset_is_imm = 1;
114 let BaseClass = baseClass;
115 let SrcClass = srcClass;
116 let PseudoInstr = opName # "_IMM";
117 }
118
119 def _SGPR : SM_Store_Pseudo <opName,
120 (ins srcClass:$sdata, baseClass:$sbase, SReg_32:$soff, i1imm:$glc),
121 " $sdata, $sbase, $offset$glc", []> {
122 let BaseClass = baseClass;
123 let SrcClass = srcClass;
124 let PseudoInstr = opName # "_SGPR";
Valery Pykhtin1b138862016-09-01 09:56:47 +0000125 }
126}
127
128class SM_Time_Pseudo<string opName, SDPatternOperator node> : SM_Pseudo<
Matt Arsenault640c44b2016-11-29 19:39:53 +0000129 opName, (outs SReg_64_XEXEC:$sdst), (ins),
Valery Pykhtin1b138862016-09-01 09:56:47 +0000130 " $sdst", [(set i64:$sdst, (node))]> {
131 let hasSideEffects = 1;
Matt Arsenault73ce93b2017-12-08 20:01:02 +0000132 let mayStore = 0;
133 let mayLoad = 1;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000134 let has_sbase = 0;
135 let has_offset = 0;
136}
137
138class SM_Inval_Pseudo <string opName, SDPatternOperator node> : SM_Pseudo<
139 opName, (outs), (ins), "", [(node)]> {
140 let hasSideEffects = 1;
141 let mayStore = 1;
142 let has_sdst = 0;
143 let has_sbase = 0;
144 let has_offset = 0;
145}
146
147
148//===----------------------------------------------------------------------===//
149// Scalar Memory Instructions
150//===----------------------------------------------------------------------===//
151
152// We are using the SReg_32_XM0 and not the SReg_32 register class for 32-bit
153// SMRD instructions, because the SReg_32_XM0 register class does not include M0
154// and writing to M0 from an SMRD instruction will hang the GPU.
Matt Arsenault640c44b2016-11-29 19:39:53 +0000155
156// XXX - SMEM instructions do not allow exec for data operand, but
157// does sdst for SMRD on SI/CI?
158defm S_LOAD_DWORD : SM_Pseudo_Loads <"s_load_dword", SReg_64, SReg_32_XM0_XEXEC>;
159defm S_LOAD_DWORDX2 : SM_Pseudo_Loads <"s_load_dwordx2", SReg_64, SReg_64_XEXEC>;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000160defm S_LOAD_DWORDX4 : SM_Pseudo_Loads <"s_load_dwordx4", SReg_64, SReg_128>;
161defm S_LOAD_DWORDX8 : SM_Pseudo_Loads <"s_load_dwordx8", SReg_64, SReg_256>;
162defm S_LOAD_DWORDX16 : SM_Pseudo_Loads <"s_load_dwordx16", SReg_64, SReg_512>;
163
164defm S_BUFFER_LOAD_DWORD : SM_Pseudo_Loads <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000165 "s_buffer_load_dword", SReg_128, SReg_32_XM0_XEXEC
Valery Pykhtin1b138862016-09-01 09:56:47 +0000166>;
167
Matt Arsenault640c44b2016-11-29 19:39:53 +0000168// FIXME: exec_lo/exec_hi appear to be allowed for SMRD loads on
169// SI/CI, bit disallowed for SMEM on VI.
Valery Pykhtin1b138862016-09-01 09:56:47 +0000170defm S_BUFFER_LOAD_DWORDX2 : SM_Pseudo_Loads <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000171 "s_buffer_load_dwordx2", SReg_128, SReg_64_XEXEC
Valery Pykhtin1b138862016-09-01 09:56:47 +0000172>;
173
174defm S_BUFFER_LOAD_DWORDX4 : SM_Pseudo_Loads <
175 "s_buffer_load_dwordx4", SReg_128, SReg_128
176>;
177
178defm S_BUFFER_LOAD_DWORDX8 : SM_Pseudo_Loads <
179 "s_buffer_load_dwordx8", SReg_128, SReg_256
180>;
181
182defm S_BUFFER_LOAD_DWORDX16 : SM_Pseudo_Loads <
183 "s_buffer_load_dwordx16", SReg_128, SReg_512
184>;
185
Matt Arsenault640c44b2016-11-29 19:39:53 +0000186defm S_STORE_DWORD : SM_Pseudo_Stores <"s_store_dword", SReg_64, SReg_32_XM0_XEXEC>;
187defm S_STORE_DWORDX2 : SM_Pseudo_Stores <"s_store_dwordx2", SReg_64, SReg_64_XEXEC>;
Matt Arsenault7b647552016-10-28 21:55:15 +0000188defm S_STORE_DWORDX4 : SM_Pseudo_Stores <"s_store_dwordx4", SReg_64, SReg_128>;
189
190defm S_BUFFER_STORE_DWORD : SM_Pseudo_Stores <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000191 "s_buffer_store_dword", SReg_128, SReg_32_XM0_XEXEC
Matt Arsenault7b647552016-10-28 21:55:15 +0000192>;
193
194defm S_BUFFER_STORE_DWORDX2 : SM_Pseudo_Stores <
Matt Arsenault640c44b2016-11-29 19:39:53 +0000195 "s_buffer_store_dwordx2", SReg_128, SReg_64_XEXEC
Matt Arsenault7b647552016-10-28 21:55:15 +0000196>;
197
198defm S_BUFFER_STORE_DWORDX4 : SM_Pseudo_Stores <
199 "s_buffer_store_dwordx4", SReg_128, SReg_128
200>;
201
202
Valery Pykhtin1b138862016-09-01 09:56:47 +0000203def S_MEMTIME : SM_Time_Pseudo <"s_memtime", int_amdgcn_s_memtime>;
204def S_DCACHE_INV : SM_Inval_Pseudo <"s_dcache_inv", int_amdgcn_s_dcache_inv>;
205
206let SubtargetPredicate = isCIVI in {
207def S_DCACHE_INV_VOL : SM_Inval_Pseudo <"s_dcache_inv_vol", int_amdgcn_s_dcache_inv_vol>;
208} // let SubtargetPredicate = isCIVI
209
210let SubtargetPredicate = isVI in {
211def S_DCACHE_WB : SM_Inval_Pseudo <"s_dcache_wb", int_amdgcn_s_dcache_wb>;
212def S_DCACHE_WB_VOL : SM_Inval_Pseudo <"s_dcache_wb_vol", int_amdgcn_s_dcache_wb_vol>;
213def S_MEMREALTIME : SM_Time_Pseudo <"s_memrealtime", int_amdgcn_s_memrealtime>;
214} // SubtargetPredicate = isVI
215
216
217
218//===----------------------------------------------------------------------===//
219// Scalar Memory Patterns
220//===----------------------------------------------------------------------===//
221
Alexander Timofeev18009562016-12-08 17:28:47 +0000222
Valery Pykhtin1b138862016-09-01 09:56:47 +0000223def smrd_load : PatFrag <(ops node:$ptr), (load node:$ptr), [{
224 auto Ld = cast<LoadSDNode>(N);
225 return Ld->getAlignment() >= 4 &&
Alexander Timofeev2e5eece2018-03-05 15:12:21 +0000226 ((((Ld->getAddressSpace() == AMDGPUASI.CONSTANT_ADDRESS) || (Ld->getAddressSpace() == AMDGPUASI.CONSTANT_ADDRESS_32BIT)) && !N->isDivergent()) ||
Yaxun Liu1a14bfa2017-03-27 14:04:01 +0000227 (Subtarget->getScalarizeGlobalBehavior() && Ld->getAddressSpace() == AMDGPUASI.GLOBAL_ADDRESS &&
Alexander Timofeev2e5eece2018-03-05 15:12:21 +0000228 !Ld->isVolatile() && !N->isDivergent() &&
Alexander Timofeev18009562016-12-08 17:28:47 +0000229 static_cast<const SITargetLowering *>(getTargetLowering())->isMemOpHasNoClobberedMemOperand(N)));
Valery Pykhtin1b138862016-09-01 09:56:47 +0000230}]>;
231
232def SMRDImm : ComplexPattern<i64, 2, "SelectSMRDImm">;
Marek Olsak8973a0a2017-05-24 14:53:50 +0000233def SMRDImm32 : ComplexPattern<i64, 2, "SelectSMRDImm32">;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000234def SMRDSgpr : ComplexPattern<i64, 2, "SelectSMRDSgpr">;
235def SMRDBufferImm : ComplexPattern<i32, 1, "SelectSMRDBufferImm">;
Marek Olsak8973a0a2017-05-24 14:53:50 +0000236def SMRDBufferImm32 : ComplexPattern<i32, 1, "SelectSMRDBufferImm32">;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000237
Valery Pykhtin1b138862016-09-01 09:56:47 +0000238multiclass SMRD_Pattern <string Instr, ValueType vt> {
239
240 // 1. IMM offset
Matt Arsenault90c75932017-10-03 00:06:41 +0000241 def : GCNPat <
Valery Pykhtin1b138862016-09-01 09:56:47 +0000242 (smrd_load (SMRDImm i64:$sbase, i32:$offset)),
Matt Arsenault7b647552016-10-28 21:55:15 +0000243 (vt (!cast<SM_Pseudo>(Instr#"_IMM") $sbase, $offset, 0))
Valery Pykhtin1b138862016-09-01 09:56:47 +0000244 >;
245
246 // 2. SGPR offset
Matt Arsenault90c75932017-10-03 00:06:41 +0000247 def : GCNPat <
Valery Pykhtin1b138862016-09-01 09:56:47 +0000248 (smrd_load (SMRDSgpr i64:$sbase, i32:$offset)),
Matt Arsenault7b647552016-10-28 21:55:15 +0000249 (vt (!cast<SM_Pseudo>(Instr#"_SGPR") $sbase, $offset, 0))
Valery Pykhtin1b138862016-09-01 09:56:47 +0000250 >;
251}
252
Matt Arsenault90c75932017-10-03 00:06:41 +0000253let OtherPredicates = [isSICI] in {
254def : GCNPat <
Valery Pykhtin1b138862016-09-01 09:56:47 +0000255 (i64 (readcyclecounter)),
256 (S_MEMTIME)
257>;
258}
259
260// Global and constant loads can be selected to either MUBUF or SMRD
261// instructions, but SMRD instructions are faster so we want the instruction
262// selector to prefer those.
263let AddedComplexity = 100 in {
264
265defm : SMRD_Pattern <"S_LOAD_DWORD", i32>;
266defm : SMRD_Pattern <"S_LOAD_DWORDX2", v2i32>;
267defm : SMRD_Pattern <"S_LOAD_DWORDX4", v4i32>;
268defm : SMRD_Pattern <"S_LOAD_DWORDX8", v8i32>;
269defm : SMRD_Pattern <"S_LOAD_DWORDX16", v16i32>;
270
271// 1. Offset as an immediate
Matt Arsenault90c75932017-10-03 00:06:41 +0000272def SM_LOAD_PATTERN : GCNPat < // name this pattern to reuse AddedComplexity on CI
Valery Pykhtin1b138862016-09-01 09:56:47 +0000273 (SIload_constant v4i32:$sbase, (SMRDBufferImm i32:$offset)),
Matt Arsenault7b647552016-10-28 21:55:15 +0000274 (S_BUFFER_LOAD_DWORD_IMM $sbase, $offset, 0)
Valery Pykhtin1b138862016-09-01 09:56:47 +0000275>;
276
277// 2. Offset loaded in an 32bit SGPR
Matt Arsenault90c75932017-10-03 00:06:41 +0000278def : GCNPat <
Marek Olsak5914ece2017-10-31 21:06:42 +0000279 (SIload_constant v4i32:$sbase, i32:$offset),
Matt Arsenault7b647552016-10-28 21:55:15 +0000280 (S_BUFFER_LOAD_DWORD_SGPR $sbase, $offset, 0)
Valery Pykhtin1b138862016-09-01 09:56:47 +0000281>;
282
283} // End let AddedComplexity = 100
284
Matt Arsenault90c75932017-10-03 00:06:41 +0000285let OtherPredicates = [isVI] in {
Valery Pykhtin1b138862016-09-01 09:56:47 +0000286
Matt Arsenault90c75932017-10-03 00:06:41 +0000287def : GCNPat <
Valery Pykhtin1b138862016-09-01 09:56:47 +0000288 (i64 (readcyclecounter)),
289 (S_MEMREALTIME)
290>;
291
Matt Arsenault90c75932017-10-03 00:06:41 +0000292} // let OtherPredicates = [isVI]
Valery Pykhtin1b138862016-09-01 09:56:47 +0000293
294
295//===----------------------------------------------------------------------===//
296// Targets
297//===----------------------------------------------------------------------===//
298
299//===----------------------------------------------------------------------===//
300// SI
301//===----------------------------------------------------------------------===//
302
303class SMRD_Real_si <bits<5> op, SM_Pseudo ps>
304 : SM_Real<ps>
305 , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
306 , Enc32 {
307
308 let AssemblerPredicates = [isSICI];
309 let DecoderNamespace = "SICI";
310
311 let Inst{7-0} = !if(ps.has_offset, offset{7-0}, ?);
312 let Inst{8} = imm;
313 let Inst{14-9} = !if(ps.has_sbase, sbase{6-1}, ?);
314 let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
315 let Inst{26-22} = op;
316 let Inst{31-27} = 0x18; //encoding
317}
318
Matt Arsenault7b647552016-10-28 21:55:15 +0000319// FIXME: Assembler should reject trying to use glc on SMRD
320// instructions on SI.
Valery Pykhtin1b138862016-09-01 09:56:47 +0000321multiclass SM_Real_Loads_si<bits<5> op, string ps,
322 SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
323 SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000324
Valery Pykhtin1b138862016-09-01 09:56:47 +0000325 def _IMM_si : SMRD_Real_si <op, immPs> {
Artem Tamazov54bfd542016-10-31 16:07:39 +0000326 let InOperandList = (ins immPs.BaseClass:$sbase, smrd_offset_8:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000327 }
Matt Arsenault7b647552016-10-28 21:55:15 +0000328
329 // FIXME: The operand name $offset is inconsistent with $soff used
330 // in the pseudo
Valery Pykhtin1b138862016-09-01 09:56:47 +0000331 def _SGPR_si : SMRD_Real_si <op, sgprPs> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000332 let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000333 }
Matt Arsenault7b647552016-10-28 21:55:15 +0000334
Valery Pykhtin1b138862016-09-01 09:56:47 +0000335}
336
337defm S_LOAD_DWORD : SM_Real_Loads_si <0x00, "S_LOAD_DWORD">;
338defm S_LOAD_DWORDX2 : SM_Real_Loads_si <0x01, "S_LOAD_DWORDX2">;
339defm S_LOAD_DWORDX4 : SM_Real_Loads_si <0x02, "S_LOAD_DWORDX4">;
340defm S_LOAD_DWORDX8 : SM_Real_Loads_si <0x03, "S_LOAD_DWORDX8">;
341defm S_LOAD_DWORDX16 : SM_Real_Loads_si <0x04, "S_LOAD_DWORDX16">;
342defm S_BUFFER_LOAD_DWORD : SM_Real_Loads_si <0x08, "S_BUFFER_LOAD_DWORD">;
343defm S_BUFFER_LOAD_DWORDX2 : SM_Real_Loads_si <0x09, "S_BUFFER_LOAD_DWORDX2">;
344defm S_BUFFER_LOAD_DWORDX4 : SM_Real_Loads_si <0x0a, "S_BUFFER_LOAD_DWORDX4">;
345defm S_BUFFER_LOAD_DWORDX8 : SM_Real_Loads_si <0x0b, "S_BUFFER_LOAD_DWORDX8">;
346defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_si <0x0c, "S_BUFFER_LOAD_DWORDX16">;
347
348def S_MEMTIME_si : SMRD_Real_si <0x1e, S_MEMTIME>;
349def S_DCACHE_INV_si : SMRD_Real_si <0x1f, S_DCACHE_INV>;
350
351
352//===----------------------------------------------------------------------===//
353// VI
354//===----------------------------------------------------------------------===//
355
356class SMEM_Real_vi <bits<8> op, SM_Pseudo ps>
357 : SM_Real<ps>
358 , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.VI>
359 , Enc64 {
Matt Arsenault7b647552016-10-28 21:55:15 +0000360 bit glc;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000361
362 let AssemblerPredicates = [isVI];
363 let DecoderNamespace = "VI";
364
365 let Inst{5-0} = !if(ps.has_sbase, sbase{6-1}, ?);
366 let Inst{12-6} = !if(ps.has_sdst, sdst{6-0}, ?);
367
Matt Arsenault7b647552016-10-28 21:55:15 +0000368 let Inst{16} = !if(ps.has_glc, glc, ?);
369 let Inst{17} = imm;
Valery Pykhtin1b138862016-09-01 09:56:47 +0000370 let Inst{25-18} = op;
371 let Inst{31-26} = 0x30; //encoding
372 let Inst{51-32} = !if(ps.has_offset, offset{19-0}, ?);
373}
374
375multiclass SM_Real_Loads_vi<bits<8> op, string ps,
376 SM_Load_Pseudo immPs = !cast<SM_Load_Pseudo>(ps#_IMM),
377 SM_Load_Pseudo sgprPs = !cast<SM_Load_Pseudo>(ps#_SGPR)> {
378 def _IMM_vi : SMEM_Real_vi <op, immPs> {
Artem Tamazov54bfd542016-10-31 16:07:39 +0000379 let InOperandList = (ins immPs.BaseClass:$sbase, smrd_offset_20:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000380 }
381 def _SGPR_vi : SMEM_Real_vi <op, sgprPs> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000382 let InOperandList = (ins sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc);
383 }
384}
385
Sam Kolton83102d92016-12-05 09:58:51 +0000386class SMEM_Real_Store_vi <bits<8> op, SM_Pseudo ps> : SMEM_Real_vi <op, ps> {
387 // encoding
388 bits<7> sdata;
389
390 let sdst = ?;
391 let Inst{12-6} = !if(ps.has_sdst, sdata{6-0}, ?);
392}
393
Matt Arsenault7b647552016-10-28 21:55:15 +0000394multiclass SM_Real_Stores_vi<bits<8> op, string ps,
395 SM_Store_Pseudo immPs = !cast<SM_Store_Pseudo>(ps#_IMM),
396 SM_Store_Pseudo sgprPs = !cast<SM_Store_Pseudo>(ps#_SGPR)> {
397 // FIXME: The operand name $offset is inconsistent with $soff used
398 // in the pseudo
Sam Kolton83102d92016-12-05 09:58:51 +0000399 def _IMM_vi : SMEM_Real_Store_vi <op, immPs> {
Artem Tamazov54bfd542016-10-31 16:07:39 +0000400 let InOperandList = (ins immPs.SrcClass:$sdata, immPs.BaseClass:$sbase, smrd_offset_20:$offset, GLC:$glc);
Matt Arsenault7b647552016-10-28 21:55:15 +0000401 }
402
Sam Kolton83102d92016-12-05 09:58:51 +0000403 def _SGPR_vi : SMEM_Real_Store_vi <op, sgprPs> {
Matt Arsenault7b647552016-10-28 21:55:15 +0000404 let InOperandList = (ins sgprPs.SrcClass:$sdata, sgprPs.BaseClass:$sbase, SReg_32:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000405 }
406}
407
408defm S_LOAD_DWORD : SM_Real_Loads_vi <0x00, "S_LOAD_DWORD">;
409defm S_LOAD_DWORDX2 : SM_Real_Loads_vi <0x01, "S_LOAD_DWORDX2">;
410defm S_LOAD_DWORDX4 : SM_Real_Loads_vi <0x02, "S_LOAD_DWORDX4">;
411defm S_LOAD_DWORDX8 : SM_Real_Loads_vi <0x03, "S_LOAD_DWORDX8">;
412defm S_LOAD_DWORDX16 : SM_Real_Loads_vi <0x04, "S_LOAD_DWORDX16">;
413defm S_BUFFER_LOAD_DWORD : SM_Real_Loads_vi <0x08, "S_BUFFER_LOAD_DWORD">;
414defm S_BUFFER_LOAD_DWORDX2 : SM_Real_Loads_vi <0x09, "S_BUFFER_LOAD_DWORDX2">;
415defm S_BUFFER_LOAD_DWORDX4 : SM_Real_Loads_vi <0x0a, "S_BUFFER_LOAD_DWORDX4">;
416defm S_BUFFER_LOAD_DWORDX8 : SM_Real_Loads_vi <0x0b, "S_BUFFER_LOAD_DWORDX8">;
417defm S_BUFFER_LOAD_DWORDX16 : SM_Real_Loads_vi <0x0c, "S_BUFFER_LOAD_DWORDX16">;
418
Matt Arsenault7b647552016-10-28 21:55:15 +0000419defm S_STORE_DWORD : SM_Real_Stores_vi <0x10, "S_STORE_DWORD">;
420defm S_STORE_DWORDX2 : SM_Real_Stores_vi <0x11, "S_STORE_DWORDX2">;
421defm S_STORE_DWORDX4 : SM_Real_Stores_vi <0x12, "S_STORE_DWORDX4">;
422
423defm S_BUFFER_STORE_DWORD : SM_Real_Stores_vi <0x18, "S_BUFFER_STORE_DWORD">;
424defm S_BUFFER_STORE_DWORDX2 : SM_Real_Stores_vi <0x19, "S_BUFFER_STORE_DWORDX2">;
425defm S_BUFFER_STORE_DWORDX4 : SM_Real_Stores_vi <0x1a, "S_BUFFER_STORE_DWORDX4">;
426
Sam Kolton83102d92016-12-05 09:58:51 +0000427// These instructions use same encoding
Valery Pykhtin1b138862016-09-01 09:56:47 +0000428def S_DCACHE_INV_vi : SMEM_Real_vi <0x20, S_DCACHE_INV>;
429def S_DCACHE_WB_vi : SMEM_Real_vi <0x21, S_DCACHE_WB>;
430def S_DCACHE_INV_VOL_vi : SMEM_Real_vi <0x22, S_DCACHE_INV_VOL>;
431def S_DCACHE_WB_VOL_vi : SMEM_Real_vi <0x23, S_DCACHE_WB_VOL>;
432def S_MEMTIME_vi : SMEM_Real_vi <0x24, S_MEMTIME>;
433def S_MEMREALTIME_vi : SMEM_Real_vi <0x25, S_MEMREALTIME>;
434
435
436//===----------------------------------------------------------------------===//
437// CI
438//===----------------------------------------------------------------------===//
439
440def smrd_literal_offset : NamedOperandU32<"SMRDLiteralOffset",
441 NamedMatchClass<"SMRDLiteralOffset">> {
442 let OperandType = "OPERAND_IMMEDIATE";
443}
444
445class SMRD_Real_Load_IMM_ci <bits<5> op, SM_Load_Pseudo ps> :
446 SM_Real<ps>,
447 Enc64 {
448
449 let AssemblerPredicates = [isCIOnly];
450 let DecoderNamespace = "CI";
Matt Arsenault7b647552016-10-28 21:55:15 +0000451 let InOperandList = (ins ps.BaseClass:$sbase, smrd_literal_offset:$offset, GLC:$glc);
Valery Pykhtin1b138862016-09-01 09:56:47 +0000452
453 let LGKM_CNT = ps.LGKM_CNT;
454 let SMRD = ps.SMRD;
455 let mayLoad = ps.mayLoad;
456 let mayStore = ps.mayStore;
457 let hasSideEffects = ps.hasSideEffects;
458 let SchedRW = ps.SchedRW;
459 let UseNamedOperandTable = ps.UseNamedOperandTable;
460
461 let Inst{7-0} = 0xff;
462 let Inst{8} = 0;
463 let Inst{14-9} = sbase{6-1};
464 let Inst{21-15} = sdst{6-0};
465 let Inst{26-22} = op;
466 let Inst{31-27} = 0x18; //encoding
467 let Inst{63-32} = offset{31-0};
468}
469
470def S_LOAD_DWORD_IMM_ci : SMRD_Real_Load_IMM_ci <0x00, S_LOAD_DWORD_IMM>;
471def S_LOAD_DWORDX2_IMM_ci : SMRD_Real_Load_IMM_ci <0x01, S_LOAD_DWORDX2_IMM>;
472def S_LOAD_DWORDX4_IMM_ci : SMRD_Real_Load_IMM_ci <0x02, S_LOAD_DWORDX4_IMM>;
473def S_LOAD_DWORDX8_IMM_ci : SMRD_Real_Load_IMM_ci <0x03, S_LOAD_DWORDX8_IMM>;
474def S_LOAD_DWORDX16_IMM_ci : SMRD_Real_Load_IMM_ci <0x04, S_LOAD_DWORDX16_IMM>;
475def S_BUFFER_LOAD_DWORD_IMM_ci : SMRD_Real_Load_IMM_ci <0x08, S_BUFFER_LOAD_DWORD_IMM>;
476def S_BUFFER_LOAD_DWORDX2_IMM_ci : SMRD_Real_Load_IMM_ci <0x09, S_BUFFER_LOAD_DWORDX2_IMM>;
477def S_BUFFER_LOAD_DWORDX4_IMM_ci : SMRD_Real_Load_IMM_ci <0x0a, S_BUFFER_LOAD_DWORDX4_IMM>;
478def S_BUFFER_LOAD_DWORDX8_IMM_ci : SMRD_Real_Load_IMM_ci <0x0b, S_BUFFER_LOAD_DWORDX8_IMM>;
479def S_BUFFER_LOAD_DWORDX16_IMM_ci : SMRD_Real_Load_IMM_ci <0x0c, S_BUFFER_LOAD_DWORDX16_IMM>;
480
481class SMRD_Real_ci <bits<5> op, SM_Pseudo ps>
482 : SM_Real<ps>
483 , SIMCInstr<ps.PseudoInstr, SIEncodingFamily.SI>
484 , Enc32 {
485
486 let AssemblerPredicates = [isCIOnly];
487 let DecoderNamespace = "CI";
488
489 let Inst{7-0} = !if(ps.has_offset, offset{7-0}, ?);
490 let Inst{8} = imm;
491 let Inst{14-9} = !if(ps.has_sbase, sbase{6-1}, ?);
492 let Inst{21-15} = !if(ps.has_sdst, sdst{6-0}, ?);
493 let Inst{26-22} = op;
494 let Inst{31-27} = 0x18; //encoding
495}
496
497def S_DCACHE_INV_VOL_ci : SMRD_Real_ci <0x1d, S_DCACHE_INV_VOL>;
Marek Olsak8973a0a2017-05-24 14:53:50 +0000498
499let AddedComplexity = SM_LOAD_PATTERN.AddedComplexity in {
500
Matt Arsenault90c75932017-10-03 00:06:41 +0000501class SMRD_Pattern_ci <string Instr, ValueType vt> : GCNPat <
Marek Olsak8973a0a2017-05-24 14:53:50 +0000502 (smrd_load (SMRDImm32 i64:$sbase, i32:$offset)),
503 (vt (!cast<SM_Pseudo>(Instr#"_IMM_ci") $sbase, $offset, 0))> {
Matt Arsenault90c75932017-10-03 00:06:41 +0000504 let OtherPredicates = [isCIOnly];
Marek Olsak8973a0a2017-05-24 14:53:50 +0000505}
506
507def : SMRD_Pattern_ci <"S_LOAD_DWORD", i32>;
508def : SMRD_Pattern_ci <"S_LOAD_DWORDX2", v2i32>;
509def : SMRD_Pattern_ci <"S_LOAD_DWORDX4", v4i32>;
510def : SMRD_Pattern_ci <"S_LOAD_DWORDX8", v8i32>;
511def : SMRD_Pattern_ci <"S_LOAD_DWORDX16", v16i32>;
512
Matt Arsenault90c75932017-10-03 00:06:41 +0000513def : GCNPat <
Marek Olsak8973a0a2017-05-24 14:53:50 +0000514 (SIload_constant v4i32:$sbase, (SMRDBufferImm32 i32:$offset)),
515 (S_BUFFER_LOAD_DWORD_IMM_ci $sbase, $offset, 0)> {
Matt Arsenault90c75932017-10-03 00:06:41 +0000516 let OtherPredicates = [isCI]; // should this be isCIOnly?
Marek Olsak8973a0a2017-05-24 14:53:50 +0000517}
518
519} // End let AddedComplexity = SM_LOAD_PATTERN.AddedComplexity
520