blob: ce32fd7fa65a5182b26407286bd0cf7048eab6f4 [file] [log] [blame]
//===-- SIInstrInfo.h - SI Instruction Info Interface -----------*- C++ -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
/// \file
/// \brief Interface definition for SIInstrInfo.
//
//===----------------------------------------------------------------------===//


#ifndef LLVM_LIB_TARGET_R600_SIINSTRINFO_H
#define LLVM_LIB_TARGET_R600_SIINSTRINFO_H

#include "AMDGPUInstrInfo.h"
#include "SIRegisterInfo.h"

namespace llvm {

24class SIInstrInfo : public AMDGPUInstrInfo {
25private:
26 const SIRegisterInfo RI;
27
Tom Stellard15834092014-03-21 15:51:57 +000028 unsigned buildExtractSubReg(MachineBasicBlock::iterator MI,
29 MachineRegisterInfo &MRI,
30 MachineOperand &SuperReg,
31 const TargetRegisterClass *SuperRC,
32 unsigned SubIdx,
33 const TargetRegisterClass *SubRC) const;
Matt Arsenault248b7b62014-03-24 20:08:09 +000034 MachineOperand buildExtractSubRegOrImm(MachineBasicBlock::iterator MI,
35 MachineRegisterInfo &MRI,
36 MachineOperand &SuperReg,
37 const TargetRegisterClass *SuperRC,
38 unsigned SubIdx,
39 const TargetRegisterClass *SubRC) const;
Tom Stellard15834092014-03-21 15:51:57 +000040
Matt Arsenaultbd995802014-03-24 18:26:52 +000041 unsigned split64BitImm(SmallVectorImpl<MachineInstr *> &Worklist,
42 MachineBasicBlock::iterator MI,
43 MachineRegisterInfo &MRI,
44 const TargetRegisterClass *RC,
45 const MachineOperand &Op) const;
46
Matt Arsenault689f3252014-06-09 16:36:31 +000047 void splitScalar64BitUnaryOp(SmallVectorImpl<MachineInstr *> &Worklist,
48 MachineInstr *Inst, unsigned Opcode) const;
49
50 void splitScalar64BitBinaryOp(SmallVectorImpl<MachineInstr *> &Worklist,
51 MachineInstr *Inst, unsigned Opcode) const;
Matt Arsenaultf35182c2014-03-24 20:08:05 +000052
Matt Arsenault8333e432014-06-10 19:18:24 +000053 void splitScalar64BitBCNT(SmallVectorImpl<MachineInstr *> &Worklist,
54 MachineInstr *Inst) const;
Matt Arsenault94812212014-11-14 18:18:16 +000055 void splitScalar64BitBFE(SmallVectorImpl<MachineInstr *> &Worklist,
56 MachineInstr *Inst) const;
Matt Arsenault8333e432014-06-10 19:18:24 +000057
Matt Arsenault27cc9582014-04-18 01:53:18 +000058 void addDescImplicitUseDef(const MCInstrDesc &Desc, MachineInstr *MI) const;
Matt Arsenaultf35182c2014-03-24 20:08:05 +000059
Matt Arsenaultee522bf2014-09-26 17:55:06 +000060 unsigned findUsedSGPR(const MachineInstr *MI, int OpIndices[3]) const;
61
Tom Stellard75aadc22012-12-11 21:25:42 +000062public:
Tom Stellard2e59a452014-06-13 01:32:00 +000063 explicit SIInstrInfo(const AMDGPUSubtarget &st);
Tom Stellard75aadc22012-12-11 21:25:42 +000064
Craig Topper5656db42014-04-29 07:57:24 +000065 const SIRegisterInfo &getRegisterInfo() const override {
Matt Arsenault6dde3032014-03-11 00:01:34 +000066 return RI;
67 }
Tom Stellard75aadc22012-12-11 21:25:42 +000068
Matt Arsenaultc10853f2014-08-06 00:29:43 +000069 bool areLoadsFromSameBasePtr(SDNode *Load1, SDNode *Load2,
70 int64_t &Offset1,
71 int64_t &Offset2) const override;
72
Matt Arsenault1acc72f2014-07-29 21:34:55 +000073 bool getLdStBaseRegImmOfs(MachineInstr *LdSt,
74 unsigned &BaseReg, unsigned &Offset,
75 const TargetRegisterInfo *TRI) const final;
76
Matt Arsenault0e75a062014-09-17 17:48:30 +000077 bool shouldClusterLoads(MachineInstr *FirstLdSt,
78 MachineInstr *SecondLdSt,
79 unsigned NumLoads) const final;
80
Craig Topper5656db42014-04-29 07:57:24 +000081 void copyPhysReg(MachineBasicBlock &MBB,
82 MachineBasicBlock::iterator MI, DebugLoc DL,
83 unsigned DestReg, unsigned SrcReg,
84 bool KillSrc) const override;
Tom Stellard75aadc22012-12-11 21:25:42 +000085
Tom Stellard96468902014-09-24 01:33:17 +000086 unsigned calculateLDSSpillAddress(MachineBasicBlock &MBB,
87 MachineBasicBlock::iterator MI,
88 RegScavenger *RS,
89 unsigned TmpReg,
90 unsigned Offset,
91 unsigned Size) const;
92
Tom Stellardc149dc02013-11-27 21:23:35 +000093 void storeRegToStackSlot(MachineBasicBlock &MBB,
94 MachineBasicBlock::iterator MI,
95 unsigned SrcReg, bool isKill, int FrameIndex,
96 const TargetRegisterClass *RC,
Craig Topper5656db42014-04-29 07:57:24 +000097 const TargetRegisterInfo *TRI) const override;
Tom Stellardc149dc02013-11-27 21:23:35 +000098
99 void loadRegFromStackSlot(MachineBasicBlock &MBB,
100 MachineBasicBlock::iterator MI,
101 unsigned DestReg, int FrameIndex,
102 const TargetRegisterClass *RC,
Craig Topper5656db42014-04-29 07:57:24 +0000103 const TargetRegisterInfo *TRI) const override;
Tom Stellardc149dc02013-11-27 21:23:35 +0000104
Benjamin Kramer8c90fd72014-09-03 11:41:21 +0000105 bool expandPostRAPseudo(MachineBasicBlock::iterator MI) const override;
Tom Stellardeba61072014-05-02 15:41:42 +0000106
Christian Konig3c145802013-03-27 09:12:59 +0000107 unsigned commuteOpcode(unsigned Opcode) const;
108
Craig Topper5656db42014-04-29 07:57:24 +0000109 MachineInstr *commuteInstruction(MachineInstr *MI,
Matt Arsenault92befe72014-09-26 17:54:54 +0000110 bool NewMI = false) const override;
111 bool findCommutedOpIndices(MachineInstr *MI,
112 unsigned &SrcOpIdx1,
113 unsigned &SrcOpIdx2) const override;
Christian Konig76edd4f2013-02-26 17:52:29 +0000114
Tom Stellard30f59412014-03-31 14:01:56 +0000115 bool isTriviallyReMaterializable(const MachineInstr *MI,
Craig Toppere73658d2014-04-28 04:05:08 +0000116 AliasAnalysis *AA = nullptr) const;
Tom Stellard30f59412014-03-31 14:01:56 +0000117
Tom Stellard26a3b672013-10-22 18:19:10 +0000118 MachineInstr *buildMovInstr(MachineBasicBlock *MBB,
119 MachineBasicBlock::iterator I,
Craig Topper5656db42014-04-29 07:57:24 +0000120 unsigned DstReg, unsigned SrcReg) const override;
121 bool isMov(unsigned Opcode) const override;
Tom Stellard75aadc22012-12-11 21:25:42 +0000122
Craig Topper5656db42014-04-29 07:57:24 +0000123 bool isSafeToMoveRegClassDefs(const TargetRegisterClass *RC) const override;
Tom Stellard5d7aaae2014-02-10 16:58:30 +0000124 bool isDS(uint16_t Opcode) const;
Matt Arsenaultb9f46ee2014-07-28 17:59:38 +0000125 bool isMIMG(uint16_t Opcode) const;
126 bool isSMRD(uint16_t Opcode) const;
Matt Arsenaulte2fabd32014-07-29 18:51:56 +0000127 bool isMUBUF(uint16_t Opcode) const;
128 bool isMTBUF(uint16_t Opcode) const;
Matt Arsenault3f981402014-09-15 15:41:53 +0000129 bool isFLAT(uint16_t Opcode) const;
Tom Stellard93fabce2013-10-10 17:11:55 +0000130 bool isVOP1(uint16_t Opcode) const;
131 bool isVOP2(uint16_t Opcode) const;
132 bool isVOP3(uint16_t Opcode) const;
133 bool isVOPC(uint16_t Opcode) const;
Matt Arsenaultd7bdcc42014-03-31 19:54:27 +0000134 bool isInlineConstant(const APInt &Imm) const;
Tom Stellard93fabce2013-10-10 17:11:55 +0000135 bool isInlineConstant(const MachineOperand &MO) const;
136 bool isLiteralConstant(const MachineOperand &MO) const;
Tom Stellardf3b2a1e2013-02-06 17:32:29 +0000137
Tom Stellardb02094e2014-07-21 15:45:01 +0000138 bool isImmOperandLegal(const MachineInstr *MI, unsigned OpNo,
139 const MachineOperand &MO) const;
140
Matt Arsenaultb2baffa2014-08-15 17:49:05 +0000141 /// \brief Return true if the given offset Size in bytes can be folded into
142 /// the immediate offsets of a memory instruction for the given address space.
143 static bool canFoldOffset(unsigned OffsetSize, unsigned AS) LLVM_READNONE;
144
Tom Stellard86d12eb2014-08-01 00:32:28 +0000145 /// \brief Return true if this 64-bit VALU instruction has a 32-bit encoding.
146 /// This function will return false if you pass it a 32-bit instruction.
147 bool hasVALU32BitEncoding(unsigned Opcode) const;
148
Tom Stellard73ae1cb2014-09-23 21:26:25 +0000149 /// \brief Returns true if this operand uses the constant bus.
150 bool usesConstantBus(const MachineRegisterInfo &MRI,
151 const MachineOperand &MO) const;
152
Tom Stellardb4a313a2014-08-01 00:32:39 +0000153 /// \brief Return true if this instruction has any modifiers.
154 /// e.g. src[012]_mod, omod, clamp.
155 bool hasModifiers(unsigned Opcode) const;
Matt Arsenaultace5b762014-10-17 18:00:43 +0000156
157 bool hasModifiersSet(const MachineInstr &MI,
158 unsigned OpName) const;
159
Craig Topper5656db42014-04-29 07:57:24 +0000160 bool verifyInstruction(const MachineInstr *MI,
161 StringRef &ErrInfo) const override;
Tom Stellardf3b2a1e2013-02-06 17:32:29 +0000162
Tom Stellard82166022013-11-13 23:36:37 +0000163 bool isSALUInstr(const MachineInstr &MI) const;
Matt Arsenaultf14032a2013-11-15 22:02:28 +0000164 static unsigned getVALUOp(const MachineInstr &MI);
Matt Arsenaultf35182c2014-03-24 20:08:05 +0000165
Tom Stellard82166022013-11-13 23:36:37 +0000166 bool isSALUOpSupportedOnVALU(const MachineInstr &MI) const;
167
168 /// \brief Return the correct register class for \p OpNo. For target-specific
169 /// instructions, this will return the register class that has been defined
170 /// in tablegen. For generic instructions, like REG_SEQUENCE it will return
171 /// the register class of its machine operand.
172 /// to infer the correct register class base on the other operands.
173 const TargetRegisterClass *getOpRegClass(const MachineInstr &MI,
174 unsigned OpNo) const;\
175
176 /// \returns true if it is legal for the operand at index \p OpNo
177 /// to read a VGPR.
178 bool canReadVGPR(const MachineInstr &MI, unsigned OpNo) const;
179
180 /// \brief Legalize the \p OpIndex operand of this instruction by inserting
181 /// a MOV. For example:
182 /// ADD_I32_e32 VGPR0, 15
183 /// to
184 /// MOV VGPR1, 15
185 /// ADD_I32_e32 VGPR0, VGPR1
186 ///
187 /// If the operand being legalized is a register, then a COPY will be used
188 /// instead of MOV.
189 void legalizeOpWithMove(MachineInstr *MI, unsigned OpIdx) const;
190
Tom Stellard0e975cf2014-08-01 00:32:35 +0000191 /// \brief Check if \p MO is a legal operand if it was the \p OpIdx Operand
192 /// for \p MI.
193 bool isOperandLegal(const MachineInstr *MI, unsigned OpIdx,
194 const MachineOperand *MO = nullptr) const;
195
Tom Stellard82166022013-11-13 23:36:37 +0000196 /// \brief Legalize all operands in this instruction. This function may
197 /// create new instruction and insert them before \p MI.
198 void legalizeOperands(MachineInstr *MI) const;
199
Tom Stellard745f2ed2014-08-21 20:41:00 +0000200 /// \brief Split an SMRD instruction into two smaller loads of half the
201 // size storing the results in \p Lo and \p Hi.
202 void splitSMRD(MachineInstr *MI, const TargetRegisterClass *HalfRC,
203 unsigned HalfImmOp, unsigned HalfSGPROp,
204 MachineInstr *&Lo, MachineInstr *&Hi) const;
205
Tom Stellard0c354f22014-04-30 15:31:29 +0000206 void moveSMRDToVALU(MachineInstr *MI, MachineRegisterInfo &MRI) const;
207
Tom Stellard82166022013-11-13 23:36:37 +0000208 /// \brief Replace this instruction's opcode with the equivalent VALU
209 /// opcode. This function will also move the users of \p MI to the
210 /// VALU if necessary.
211 void moveToVALU(MachineInstr &MI) const;
212
Craig Topper5656db42014-04-29 07:57:24 +0000213 unsigned calculateIndirectAddress(unsigned RegIndex,
214 unsigned Channel) const override;
Tom Stellardf3b2a1e2013-02-06 17:32:29 +0000215
Craig Topper5656db42014-04-29 07:57:24 +0000216 const TargetRegisterClass *getIndirectAddrRegClass() const override;
Tom Stellardf3b2a1e2013-02-06 17:32:29 +0000217
Craig Topper5656db42014-04-29 07:57:24 +0000218 MachineInstrBuilder buildIndirectWrite(MachineBasicBlock *MBB,
219 MachineBasicBlock::iterator I,
220 unsigned ValueReg,
221 unsigned Address,
222 unsigned OffsetReg) const override;
Tom Stellardf3b2a1e2013-02-06 17:32:29 +0000223
Craig Topper5656db42014-04-29 07:57:24 +0000224 MachineInstrBuilder buildIndirectRead(MachineBasicBlock *MBB,
225 MachineBasicBlock::iterator I,
226 unsigned ValueReg,
227 unsigned Address,
228 unsigned OffsetReg) const override;
Tom Stellard81d871d2013-11-13 23:36:50 +0000229 void reserveIndirectRegisters(BitVector &Reserved,
230 const MachineFunction &MF) const;
231
232 void LoadM0(MachineInstr *MoveRel, MachineBasicBlock::iterator I,
233 unsigned SavReg, unsigned IndexReg) const;
Tom Stellardeba61072014-05-02 15:41:42 +0000234
235 void insertNOPs(MachineBasicBlock::iterator MI, int Count) const;
Tom Stellard1aaad692014-07-21 16:55:33 +0000236
237 /// \brief Returns the operand named \p Op. If \p MI does not have an
238 /// operand named \c Op, this function returns nullptr.
Tom Stellard6407e1e2014-08-01 00:32:33 +0000239 MachineOperand *getNamedOperand(MachineInstr &MI, unsigned OperandName) const;
Matt Arsenaultace5b762014-10-17 18:00:43 +0000240
241 const MachineOperand *getNamedOperand(const MachineInstr &MI,
242 unsigned OpName) const {
243 return getNamedOperand(const_cast<MachineInstr &>(MI), OpName);
244 }
Tom Stellard81d871d2013-11-13 23:36:50 +0000245};
Tom Stellard75aadc22012-12-11 21:25:42 +0000246
namespace AMDGPU {

  // Opcode-to-opcode queries; declared here, defined elsewhere.
  // NOTE(review): the int return type suggests a negative "no mapping"
  // sentinel -- confirm against the definitions before relying on it.
  int getVOPe64(uint16_t Opcode);
  int getVOPe32(uint16_t Opcode);
  int getCommuteRev(uint16_t Opcode);
  int getCommuteOrig(uint16_t Opcode);
  int getMCOpcode(uint16_t Opcode, unsigned Gen);
  int getAddr64Inst(uint16_t Opcode);
  int getAtomicRetOp(uint16_t Opcode);
  int getAtomicNoRetOp(uint16_t Opcode);

  // 64-bit masks. The literals carry an unsigned suffix so that their type
  // matches the uint64_t constants they initialise.
  // NOTE(review): presumably fields of a buffer resource descriptor -- confirm.
  const uint64_t RSRC_DATA_FORMAT = 0xf00000000000ULL; // bits 44..47 set
  const uint64_t RSRC_TID_ENABLE = 1ULL << 55;         // bit 55 set

} // End namespace AMDGPU
namespace SI {
namespace KernelInputOffsets {

/// Offsets in bytes from the start of the input buffer.
/// Each entry is 4 bytes after the previous one, in X, Y, Z order within
/// each group.
enum Offsets {
  NGROUPS_X = 0,
  NGROUPS_Y = 4,
  NGROUPS_Z = 8,
  GLOBAL_SIZE_X = 12,
  GLOBAL_SIZE_Y = 16,
  GLOBAL_SIZE_Z = 20,
  LOCAL_SIZE_X = 24,
  LOCAL_SIZE_Y = 28,
  LOCAL_SIZE_Z = 32
};

} // End namespace KernelInputOffsets
} // End namespace SI
} // End namespace llvm

#endif