blob: b25e35e3add0573d0c641e403f1327e3ce0a71cd [file] [log] [blame]
Matt Arsenaultdf90c022013-10-15 23:44:45 +00001//===-- SIInstrInfo.h - SI Instruction Info Interface -----------*- C++ -*-===//
Tom Stellard75aadc22012-12-11 21:25:42 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11/// \brief Interface definition for SIInstrInfo.
12//
13//===----------------------------------------------------------------------===//
14
15
Benjamin Kramera7c40ef2014-08-13 16:26:38 +000016#ifndef LLVM_LIB_TARGET_R600_SIINSTRINFO_H
17#define LLVM_LIB_TARGET_R600_SIINSTRINFO_H
Tom Stellard75aadc22012-12-11 21:25:42 +000018
19#include "AMDGPUInstrInfo.h"
Matt Arsenaultc5f174d2014-12-01 15:52:46 +000020#include "SIDefines.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000021#include "SIRegisterInfo.h"
22
23namespace llvm {
24
25class SIInstrInfo : public AMDGPUInstrInfo {
26private:
27 const SIRegisterInfo RI;
28
Tom Stellard15834092014-03-21 15:51:57 +000029 unsigned buildExtractSubReg(MachineBasicBlock::iterator MI,
30 MachineRegisterInfo &MRI,
31 MachineOperand &SuperReg,
32 const TargetRegisterClass *SuperRC,
33 unsigned SubIdx,
34 const TargetRegisterClass *SubRC) const;
Matt Arsenault248b7b62014-03-24 20:08:09 +000035 MachineOperand buildExtractSubRegOrImm(MachineBasicBlock::iterator MI,
36 MachineRegisterInfo &MRI,
37 MachineOperand &SuperReg,
38 const TargetRegisterClass *SuperRC,
39 unsigned SubIdx,
40 const TargetRegisterClass *SubRC) const;
Tom Stellard15834092014-03-21 15:51:57 +000041
Matt Arsenaultbd995802014-03-24 18:26:52 +000042 unsigned split64BitImm(SmallVectorImpl<MachineInstr *> &Worklist,
43 MachineBasicBlock::iterator MI,
44 MachineRegisterInfo &MRI,
45 const TargetRegisterClass *RC,
46 const MachineOperand &Op) const;
47
Marek Olsakbe047802014-12-07 12:19:03 +000048 void swapOperands(MachineBasicBlock::iterator Inst) const;
49
Matt Arsenault689f3252014-06-09 16:36:31 +000050 void splitScalar64BitUnaryOp(SmallVectorImpl<MachineInstr *> &Worklist,
51 MachineInstr *Inst, unsigned Opcode) const;
52
53 void splitScalar64BitBinaryOp(SmallVectorImpl<MachineInstr *> &Worklist,
54 MachineInstr *Inst, unsigned Opcode) const;
Matt Arsenaultf35182c2014-03-24 20:08:05 +000055
Matt Arsenault8333e432014-06-10 19:18:24 +000056 void splitScalar64BitBCNT(SmallVectorImpl<MachineInstr *> &Worklist,
57 MachineInstr *Inst) const;
Matt Arsenault94812212014-11-14 18:18:16 +000058 void splitScalar64BitBFE(SmallVectorImpl<MachineInstr *> &Worklist,
59 MachineInstr *Inst) const;
Matt Arsenault8333e432014-06-10 19:18:24 +000060
Matt Arsenault27cc9582014-04-18 01:53:18 +000061 void addDescImplicitUseDef(const MCInstrDesc &Desc, MachineInstr *MI) const;
Matt Arsenaultf35182c2014-03-24 20:08:05 +000062
Matt Arsenaultc09cc3c2014-11-19 00:01:31 +000063 bool checkInstOffsetsDoNotOverlap(MachineInstr *MIa,
64 MachineInstr *MIb) const;
65
Matt Arsenaultee522bf2014-09-26 17:55:06 +000066 unsigned findUsedSGPR(const MachineInstr *MI, int OpIndices[3]) const;
67
Tom Stellard75aadc22012-12-11 21:25:42 +000068public:
Tom Stellard2e59a452014-06-13 01:32:00 +000069 explicit SIInstrInfo(const AMDGPUSubtarget &st);
Tom Stellard75aadc22012-12-11 21:25:42 +000070
Craig Topper5656db42014-04-29 07:57:24 +000071 const SIRegisterInfo &getRegisterInfo() const override {
Matt Arsenault6dde3032014-03-11 00:01:34 +000072 return RI;
73 }
Tom Stellard75aadc22012-12-11 21:25:42 +000074
Matt Arsenaultc10853f2014-08-06 00:29:43 +000075 bool areLoadsFromSameBasePtr(SDNode *Load1, SDNode *Load2,
76 int64_t &Offset1,
77 int64_t &Offset2) const override;
78
Matt Arsenault1acc72f2014-07-29 21:34:55 +000079 bool getLdStBaseRegImmOfs(MachineInstr *LdSt,
80 unsigned &BaseReg, unsigned &Offset,
81 const TargetRegisterInfo *TRI) const final;
82
Matt Arsenault0e75a062014-09-17 17:48:30 +000083 bool shouldClusterLoads(MachineInstr *FirstLdSt,
84 MachineInstr *SecondLdSt,
85 unsigned NumLoads) const final;
86
Craig Topper5656db42014-04-29 07:57:24 +000087 void copyPhysReg(MachineBasicBlock &MBB,
88 MachineBasicBlock::iterator MI, DebugLoc DL,
89 unsigned DestReg, unsigned SrcReg,
90 bool KillSrc) const override;
Tom Stellard75aadc22012-12-11 21:25:42 +000091
Tom Stellard96468902014-09-24 01:33:17 +000092 unsigned calculateLDSSpillAddress(MachineBasicBlock &MBB,
93 MachineBasicBlock::iterator MI,
94 RegScavenger *RS,
95 unsigned TmpReg,
96 unsigned Offset,
97 unsigned Size) const;
98
Tom Stellardc149dc02013-11-27 21:23:35 +000099 void storeRegToStackSlot(MachineBasicBlock &MBB,
100 MachineBasicBlock::iterator MI,
101 unsigned SrcReg, bool isKill, int FrameIndex,
102 const TargetRegisterClass *RC,
Craig Topper5656db42014-04-29 07:57:24 +0000103 const TargetRegisterInfo *TRI) const override;
Tom Stellardc149dc02013-11-27 21:23:35 +0000104
105 void loadRegFromStackSlot(MachineBasicBlock &MBB,
106 MachineBasicBlock::iterator MI,
107 unsigned DestReg, int FrameIndex,
108 const TargetRegisterClass *RC,
Craig Topper5656db42014-04-29 07:57:24 +0000109 const TargetRegisterInfo *TRI) const override;
Tom Stellardc149dc02013-11-27 21:23:35 +0000110
Benjamin Kramer8c90fd72014-09-03 11:41:21 +0000111 bool expandPostRAPseudo(MachineBasicBlock::iterator MI) const override;
Tom Stellardeba61072014-05-02 15:41:42 +0000112
Tom Stellardef3b8642015-01-07 19:56:17 +0000113 // \brief Returns an opcode that can be used to move a value to a \p DstRC
114 // register. If there is no hardware instruction that can store to \p
115 // DstRC, then AMDGPU::COPY is returned.
116 unsigned getMovOpcode(const TargetRegisterClass *DstRC) const;
Christian Konig3c145802013-03-27 09:12:59 +0000117 unsigned commuteOpcode(unsigned Opcode) const;
118
Craig Topper5656db42014-04-29 07:57:24 +0000119 MachineInstr *commuteInstruction(MachineInstr *MI,
Matt Arsenault92befe72014-09-26 17:54:54 +0000120 bool NewMI = false) const override;
121 bool findCommutedOpIndices(MachineInstr *MI,
122 unsigned &SrcOpIdx1,
123 unsigned &SrcOpIdx2) const override;
Christian Konig76edd4f2013-02-26 17:52:29 +0000124
Tom Stellard30f59412014-03-31 14:01:56 +0000125 bool isTriviallyReMaterializable(const MachineInstr *MI,
Craig Toppere73658d2014-04-28 04:05:08 +0000126 AliasAnalysis *AA = nullptr) const;
Tom Stellard30f59412014-03-31 14:01:56 +0000127
Matt Arsenaultc09cc3c2014-11-19 00:01:31 +0000128 bool areMemAccessesTriviallyDisjoint(
129 MachineInstr *MIa, MachineInstr *MIb,
130 AliasAnalysis *AA = nullptr) const override;
131
Tom Stellard26a3b672013-10-22 18:19:10 +0000132 MachineInstr *buildMovInstr(MachineBasicBlock *MBB,
133 MachineBasicBlock::iterator I,
Craig Topper5656db42014-04-29 07:57:24 +0000134 unsigned DstReg, unsigned SrcReg) const override;
135 bool isMov(unsigned Opcode) const override;
Tom Stellard75aadc22012-12-11 21:25:42 +0000136
Craig Topper5656db42014-04-29 07:57:24 +0000137 bool isSafeToMoveRegClassDefs(const TargetRegisterClass *RC) const override;
Matt Arsenaultc5f174d2014-12-01 15:52:46 +0000138
139 bool isSALU(uint16_t Opcode) const {
140 return get(Opcode).TSFlags & SIInstrFlags::SALU;
141 }
142
143 bool isVALU(uint16_t Opcode) const {
144 return get(Opcode).TSFlags & SIInstrFlags::VALU;
145 }
146
147 bool isSOP1(uint16_t Opcode) const {
148 return get(Opcode).TSFlags & SIInstrFlags::SOP1;
149 }
150
151 bool isSOP2(uint16_t Opcode) const {
152 return get(Opcode).TSFlags & SIInstrFlags::SOP2;
153 }
154
155 bool isSOPC(uint16_t Opcode) const {
156 return get(Opcode).TSFlags & SIInstrFlags::SOPC;
157 }
158
159 bool isSOPK(uint16_t Opcode) const {
160 return get(Opcode).TSFlags & SIInstrFlags::SOPK;
161 }
162
163 bool isSOPP(uint16_t Opcode) const {
164 return get(Opcode).TSFlags & SIInstrFlags::SOPP;
165 }
166
167 bool isVOP1(uint16_t Opcode) const {
168 return get(Opcode).TSFlags & SIInstrFlags::VOP1;
169 }
170
171 bool isVOP2(uint16_t Opcode) const {
172 return get(Opcode).TSFlags & SIInstrFlags::VOP2;
173 }
174
175 bool isVOP3(uint16_t Opcode) const {
176 return get(Opcode).TSFlags & SIInstrFlags::VOP3;
177 }
178
179 bool isVOPC(uint16_t Opcode) const {
180 return get(Opcode).TSFlags & SIInstrFlags::VOPC;
181 }
182
183 bool isMUBUF(uint16_t Opcode) const {
184 return get(Opcode).TSFlags & SIInstrFlags::MUBUF;
185 }
186
187 bool isMTBUF(uint16_t Opcode) const {
188 return get(Opcode).TSFlags & SIInstrFlags::MTBUF;
189 }
190
191 bool isSMRD(uint16_t Opcode) const {
192 return get(Opcode).TSFlags & SIInstrFlags::SMRD;
193 }
194
195 bool isDS(uint16_t Opcode) const {
196 return get(Opcode).TSFlags & SIInstrFlags::DS;
197 }
198
199 bool isMIMG(uint16_t Opcode) const {
200 return get(Opcode).TSFlags & SIInstrFlags::MIMG;
201 }
202
203 bool isFLAT(uint16_t Opcode) const {
204 return get(Opcode).TSFlags & SIInstrFlags::FLAT;
205 }
Matt Arsenaultc09cc3c2014-11-19 00:01:31 +0000206
Michel Danzer494391b2015-02-06 02:51:20 +0000207 bool isWQM(uint16_t Opcode) const {
208 return get(Opcode).TSFlags & SIInstrFlags::WQM;
209 }
210
Matt Arsenaultd7bdcc42014-03-31 19:54:27 +0000211 bool isInlineConstant(const APInt &Imm) const;
Tom Stellard93fabce2013-10-10 17:11:55 +0000212 bool isInlineConstant(const MachineOperand &MO) const;
213 bool isLiteralConstant(const MachineOperand &MO) const;
Tom Stellardf3b2a1e2013-02-06 17:32:29 +0000214
Tom Stellardb02094e2014-07-21 15:45:01 +0000215 bool isImmOperandLegal(const MachineInstr *MI, unsigned OpNo,
216 const MachineOperand &MO) const;
217
Matt Arsenaultb2baffa2014-08-15 17:49:05 +0000218 /// \brief Return true if the given offset Size in bytes can be folded into
219 /// the immediate offsets of a memory instruction for the given address space.
Marek Olsak58f61a82014-12-07 17:17:38 +0000220 bool canFoldOffset(unsigned OffsetSize, unsigned AS) const;
Matt Arsenaultb2baffa2014-08-15 17:49:05 +0000221
Tom Stellard86d12eb2014-08-01 00:32:28 +0000222 /// \brief Return true if this 64-bit VALU instruction has a 32-bit encoding.
223 /// This function will return false if you pass it a 32-bit instruction.
224 bool hasVALU32BitEncoding(unsigned Opcode) const;
225
Tom Stellard73ae1cb2014-09-23 21:26:25 +0000226 /// \brief Returns true if this operand uses the constant bus.
227 bool usesConstantBus(const MachineRegisterInfo &MRI,
228 const MachineOperand &MO) const;
229
Tom Stellardb4a313a2014-08-01 00:32:39 +0000230 /// \brief Return true if this instruction has any modifiers.
231 /// e.g. src[012]_mod, omod, clamp.
232 bool hasModifiers(unsigned Opcode) const;
Matt Arsenaultace5b762014-10-17 18:00:43 +0000233
234 bool hasModifiersSet(const MachineInstr &MI,
235 unsigned OpName) const;
236
Craig Topper5656db42014-04-29 07:57:24 +0000237 bool verifyInstruction(const MachineInstr *MI,
238 StringRef &ErrInfo) const override;
Tom Stellardf3b2a1e2013-02-06 17:32:29 +0000239
Matt Arsenaultf14032a2013-11-15 22:02:28 +0000240 static unsigned getVALUOp(const MachineInstr &MI);
Matt Arsenaultf35182c2014-03-24 20:08:05 +0000241
Tom Stellard82166022013-11-13 23:36:37 +0000242 bool isSALUOpSupportedOnVALU(const MachineInstr &MI) const;
243
244 /// \brief Return the correct register class for \p OpNo. For target-specific
245 /// instructions, this will return the register class that has been defined
246 /// in tablegen. For generic instructions, like REG_SEQUENCE it will return
247 /// the register class of its machine operand.
248 /// to infer the correct register class base on the other operands.
249 const TargetRegisterClass *getOpRegClass(const MachineInstr &MI,
250 unsigned OpNo) const;\
251
252 /// \returns true if it is legal for the operand at index \p OpNo
253 /// to read a VGPR.
254 bool canReadVGPR(const MachineInstr &MI, unsigned OpNo) const;
255
256 /// \brief Legalize the \p OpIndex operand of this instruction by inserting
257 /// a MOV. For example:
258 /// ADD_I32_e32 VGPR0, 15
259 /// to
260 /// MOV VGPR1, 15
261 /// ADD_I32_e32 VGPR0, VGPR1
262 ///
263 /// If the operand being legalized is a register, then a COPY will be used
264 /// instead of MOV.
265 void legalizeOpWithMove(MachineInstr *MI, unsigned OpIdx) const;
266
Tom Stellard0e975cf2014-08-01 00:32:35 +0000267 /// \brief Check if \p MO is a legal operand if it was the \p OpIdx Operand
268 /// for \p MI.
269 bool isOperandLegal(const MachineInstr *MI, unsigned OpIdx,
270 const MachineOperand *MO = nullptr) const;
271
Tom Stellard82166022013-11-13 23:36:37 +0000272 /// \brief Legalize all operands in this instruction. This function may
273 /// create new instruction and insert them before \p MI.
274 void legalizeOperands(MachineInstr *MI) const;
275
Tom Stellard745f2ed2014-08-21 20:41:00 +0000276 /// \brief Split an SMRD instruction into two smaller loads of half the
277 // size storing the results in \p Lo and \p Hi.
278 void splitSMRD(MachineInstr *MI, const TargetRegisterClass *HalfRC,
279 unsigned HalfImmOp, unsigned HalfSGPROp,
280 MachineInstr *&Lo, MachineInstr *&Hi) const;
281
Tom Stellard0c354f22014-04-30 15:31:29 +0000282 void moveSMRDToVALU(MachineInstr *MI, MachineRegisterInfo &MRI) const;
283
Tom Stellard82166022013-11-13 23:36:37 +0000284 /// \brief Replace this instruction's opcode with the equivalent VALU
285 /// opcode. This function will also move the users of \p MI to the
286 /// VALU if necessary.
287 void moveToVALU(MachineInstr &MI) const;
288
Craig Topper5656db42014-04-29 07:57:24 +0000289 unsigned calculateIndirectAddress(unsigned RegIndex,
290 unsigned Channel) const override;
Tom Stellardf3b2a1e2013-02-06 17:32:29 +0000291
Craig Topper5656db42014-04-29 07:57:24 +0000292 const TargetRegisterClass *getIndirectAddrRegClass() const override;
Tom Stellardf3b2a1e2013-02-06 17:32:29 +0000293
Craig Topper5656db42014-04-29 07:57:24 +0000294 MachineInstrBuilder buildIndirectWrite(MachineBasicBlock *MBB,
295 MachineBasicBlock::iterator I,
296 unsigned ValueReg,
297 unsigned Address,
298 unsigned OffsetReg) const override;
Tom Stellardf3b2a1e2013-02-06 17:32:29 +0000299
Craig Topper5656db42014-04-29 07:57:24 +0000300 MachineInstrBuilder buildIndirectRead(MachineBasicBlock *MBB,
301 MachineBasicBlock::iterator I,
302 unsigned ValueReg,
303 unsigned Address,
304 unsigned OffsetReg) const override;
Tom Stellard81d871d2013-11-13 23:36:50 +0000305 void reserveIndirectRegisters(BitVector &Reserved,
306 const MachineFunction &MF) const;
307
308 void LoadM0(MachineInstr *MoveRel, MachineBasicBlock::iterator I,
309 unsigned SavReg, unsigned IndexReg) const;
Tom Stellardeba61072014-05-02 15:41:42 +0000310
311 void insertNOPs(MachineBasicBlock::iterator MI, int Count) const;
Tom Stellard1aaad692014-07-21 16:55:33 +0000312
313 /// \brief Returns the operand named \p Op. If \p MI does not have an
314 /// operand named \c Op, this function returns nullptr.
Tom Stellard6407e1e2014-08-01 00:32:33 +0000315 MachineOperand *getNamedOperand(MachineInstr &MI, unsigned OperandName) const;
Matt Arsenaultace5b762014-10-17 18:00:43 +0000316
317 const MachineOperand *getNamedOperand(const MachineInstr &MI,
318 unsigned OpName) const {
319 return getNamedOperand(const_cast<MachineInstr &>(MI), OpName);
320 }
Tom Stellard794c8c02014-12-02 17:05:41 +0000321
322 uint64_t getDefaultRsrcDataFormat() const;
323
Tom Stellard81d871d2013-11-13 23:36:50 +0000324};
Tom Stellard75aadc22012-12-11 21:25:42 +0000325
Christian Konigf741fbf2013-02-26 17:52:42 +0000326namespace AMDGPU {
327
328 int getVOPe64(uint16_t Opcode);
Tom Stellard1aaad692014-07-21 16:55:33 +0000329 int getVOPe32(uint16_t Opcode);
Christian Konig3c145802013-03-27 09:12:59 +0000330 int getCommuteRev(uint16_t Opcode);
331 int getCommuteOrig(uint16_t Opcode);
Tom Stellard155bbb72014-08-11 22:18:17 +0000332 int getAddr64Inst(uint16_t Opcode);
Matt Arsenault9903ccf2014-09-08 15:07:27 +0000333 int getAtomicRetOp(uint16_t Opcode);
334 int getAtomicNoRetOp(uint16_t Opcode);
Christian Konigf741fbf2013-02-26 17:52:42 +0000335
Tom Stellard15834092014-03-21 15:51:57 +0000336 const uint64_t RSRC_DATA_FORMAT = 0xf00000000000LL;
Tom Stellardb02094e2014-07-21 15:45:01 +0000337 const uint64_t RSRC_TID_ENABLE = 1LL << 55;
Tom Stellard15834092014-03-21 15:51:57 +0000338
Christian Konigf741fbf2013-02-26 17:52:42 +0000339} // End namespace AMDGPU
340
Tom Stellardec2e43c2014-09-22 15:35:29 +0000341namespace SI {
342namespace KernelInputOffsets {
343
344/// Offsets in bytes from the start of the input buffer
345enum Offsets {
346 NGROUPS_X = 0,
347 NGROUPS_Y = 4,
348 NGROUPS_Z = 8,
349 GLOBAL_SIZE_X = 12,
350 GLOBAL_SIZE_Y = 16,
351 GLOBAL_SIZE_Z = 20,
352 LOCAL_SIZE_X = 24,
353 LOCAL_SIZE_Y = 28,
354 LOCAL_SIZE_Z = 32
355};
356
357} // End namespace KernelInputOffsets
358} // End namespace SI
359
Tom Stellard75aadc22012-12-11 21:25:42 +0000360} // End namespace llvm
361
Benjamin Kramera7c40ef2014-08-13 16:26:38 +0000362#endif