blob: 4c7f38a09a4844adc57f5f67ff9f49a88759b88e [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===- SIMachineFunctionInfo.h - SIMachineFunctionInfo interface -*- C++ -*-==//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11//
12//===----------------------------------------------------------------------===//
13
Matt Arsenault6b6a2c32016-03-11 08:00:27 +000014#ifndef LLVM_LIB_TARGET_AMDGPU_SIMACHINEFUNCTIONINFO_H
15#define LLVM_LIB_TARGET_AMDGPU_SIMACHINEFUNCTIONINFO_H
Tom Stellard75aadc22012-12-11 21:25:42 +000016
Vincent Lejeuneace6f732013-04-01 21:47:53 +000017#include "AMDGPUMachineFunction.h"
Matt Arsenault678e1112017-04-10 17:58:06 +000018#include "MCTargetDesc/AMDGPUMCTargetDesc.h"
Chandler Carruth6bda14b2017-06-06 11:49:48 +000019#include "SIRegisterInfo.h"
Eugene Zelenko66203762017-01-21 00:53:49 +000020#include "llvm/CodeGen/PseudoSourceValue.h"
21#include "llvm/MC/MCRegisterInfo.h"
22#include "llvm/Support/ErrorHandling.h"
NAKAMURA Takumi5cbd41e2016-06-27 10:26:43 +000023#include <array>
Eugene Zelenko66203762017-01-21 00:53:49 +000024#include <cassert>
Tom Stellardc149dc02013-11-27 21:23:35 +000025#include <map>
Eugene Zelenko66203762017-01-21 00:53:49 +000026#include <utility>
Tom Stellard75aadc22012-12-11 21:25:42 +000027
28namespace llvm {
29
Tom Stellard244891d2016-12-20 15:52:17 +000030class AMDGPUImagePseudoSourceValue : public PseudoSourceValue {
31public:
32 explicit AMDGPUImagePseudoSourceValue() :
33 PseudoSourceValue(PseudoSourceValue::TargetCustom) { }
34
35 bool isConstant(const MachineFrameInfo *) const override {
36 // This should probably be true for most images, but we will start by being
37 // conservative.
38 return false;
39 }
40
41 bool isAliased(const MachineFrameInfo *) const override {
42 // FIXME: If we ever change image intrinsics to accept fat pointers, then
43 // this could be true for some cases.
44 return false;
45 }
46
47 bool mayAlias(const MachineFrameInfo*) const override {
48 // FIXME: If we ever change image intrinsics to accept fat pointers, then
49 // this could be true for some cases.
50 return false;
51 }
52};
53
Tom Stellard6f9ef142016-12-20 17:19:44 +000054class AMDGPUBufferPseudoSourceValue : public PseudoSourceValue {
55public:
56 explicit AMDGPUBufferPseudoSourceValue() :
57 PseudoSourceValue(PseudoSourceValue::TargetCustom) { }
58
59 bool isConstant(const MachineFrameInfo *) const override {
60 // This should probably be true for most images, but we will start by being
61 // conservative.
62 return false;
63 }
64
65 bool isAliased(const MachineFrameInfo *) const override {
66 // FIXME: If we ever change image intrinsics to accept fat pointers, then
67 // this could be true for some cases.
68 return false;
69 }
70
71 bool mayAlias(const MachineFrameInfo*) const override {
72 // FIXME: If we ever change image intrinsics to accept fat pointers, then
73 // this could be true for some cases.
74 return false;
75 }
76};
Tom Stellard244891d2016-12-20 15:52:17 +000077
Tom Stellard75aadc22012-12-11 21:25:42 +000078/// This class keeps track of the SPI_SP_INPUT_ADDR config register, which
79/// tells the hardware which interpolation parameters to load.
Matt Arsenault6b6a2c32016-03-11 08:00:27 +000080class SIMachineFunctionInfo final : public AMDGPUMachineFunction {
Matt Arsenault26f8f3d2015-11-30 21:16:03 +000081 // FIXME: This should be removed and getPreloadedValue moved here.
Saleem Abdulrasool43e5fe32016-08-29 20:42:07 +000082 friend class SIRegisterInfo;
Tom Stellard96468902014-09-24 01:33:17 +000083
84 unsigned TIDReg;
Matt Arsenault26f8f3d2015-11-30 21:16:03 +000085
86 // Registers that may be reserved for spilling purposes. These may be the same
87 // as the input registers.
Matt Arsenault49affb82015-11-25 20:55:12 +000088 unsigned ScratchRSrcReg;
Matt Arsenault26f8f3d2015-11-30 21:16:03 +000089 unsigned ScratchWaveOffsetReg;
90
Matt Arsenault1c0ae392017-04-24 18:05:16 +000091 // This is the current function's incremented size from the kernel's scratch
92 // wave offset register. For an entry function, this is exactly the same as
93 // the ScratchWaveOffsetReg.
94 unsigned FrameOffsetReg;
95
96 // Top of the stack SGPR offset derived from the ScratchWaveOffsetReg.
97 unsigned StackPtrOffsetReg;
98
Tom Stellard2f3f9852017-01-25 01:25:13 +000099 // Input registers for non-HSA ABI
Matt Arsenault10fc0622017-06-26 03:01:31 +0000100 unsigned ImplicitBufferPtrUserSGPR;
Tom Stellard2f3f9852017-01-25 01:25:13 +0000101
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000102 // Input registers setup for the HSA ABI.
103 // User SGPRs in allocation order.
104 unsigned PrivateSegmentBufferUserSGPR;
105 unsigned DispatchPtrUserSGPR;
106 unsigned QueuePtrUserSGPR;
107 unsigned KernargSegmentPtrUserSGPR;
108 unsigned DispatchIDUserSGPR;
109 unsigned FlatScratchInitUserSGPR;
110 unsigned PrivateSegmentSizeUserSGPR;
111 unsigned GridWorkGroupCountXUserSGPR;
112 unsigned GridWorkGroupCountYUserSGPR;
113 unsigned GridWorkGroupCountZUserSGPR;
114
115 // System SGPRs in allocation order.
116 unsigned WorkGroupIDXSystemSGPR;
117 unsigned WorkGroupIDYSystemSGPR;
118 unsigned WorkGroupIDZSystemSGPR;
119 unsigned WorkGroupInfoSystemSGPR;
120 unsigned PrivateSegmentWaveByteOffsetSystemSGPR;
Matt Arsenault49affb82015-11-25 20:55:12 +0000121
Matt Arsenaulte15855d2017-07-17 22:35:50 +0000122 // VGPR inputs. These are always v0, v1 and v2 for entry functions.
123 unsigned WorkItemIDXVGPR;
124 unsigned WorkItemIDYVGPR;
125 unsigned WorkItemIDZVGPR;
126
Marek Olsakfccabaf2016-01-13 11:45:36 +0000127 // Graphics info.
128 unsigned PSInputAddr;
Matt Arsenaulte622dc32017-04-11 22:29:24 +0000129 unsigned PSInputEnable;
130
Marek Olsak8e9cc632016-01-13 17:23:09 +0000131 bool ReturnsVoid;
Marek Olsakfccabaf2016-01-13 11:45:36 +0000132
Konstantin Zhuravlyov1d650262016-09-06 20:22:28 +0000133 // A pair of default/requested minimum/maximum flat work group sizes.
134 // Minimum - first, maximum - second.
135 std::pair<unsigned, unsigned> FlatWorkGroupSizes;
Tom Stellard79a1fd72016-04-14 16:27:07 +0000136
Konstantin Zhuravlyov1d650262016-09-06 20:22:28 +0000137 // A pair of default/requested minimum/maximum number of waves per execution
138 // unit. Minimum - first, maximum - second.
139 std::pair<unsigned, unsigned> WavesPerEU;
140
Konstantin Zhuravlyovf2f3d142016-06-25 03:11:28 +0000141 // Stack object indices for work group IDs.
NAKAMURA Takumi5cbd41e2016-06-27 10:26:43 +0000142 std::array<int, 3> DebuggerWorkGroupIDStackObjectIndices;
Konstantin Zhuravlyovf2f3d142016-06-25 03:11:28 +0000143 // Stack object indices for work item IDs.
NAKAMURA Takumi5cbd41e2016-06-27 10:26:43 +0000144 std::array<int, 3> DebuggerWorkItemIDStackObjectIndices;
Konstantin Zhuravlyov71515e52016-04-26 17:24:40 +0000145
Tom Stellard6f9ef142016-12-20 17:19:44 +0000146 AMDGPUBufferPseudoSourceValue BufferPSV;
Tom Stellardbb138882016-12-20 17:26:34 +0000147 AMDGPUImagePseudoSourceValue ImagePSV;
Tom Stellard244891d2016-12-20 15:52:17 +0000148
Matt Arsenault161e2b42017-04-18 20:59:40 +0000149private:
Matt Arsenault49affb82015-11-25 20:55:12 +0000150 unsigned LDSWaveSpillSize;
Matt Arsenault49affb82015-11-25 20:55:12 +0000151 unsigned ScratchOffsetReg;
152 unsigned NumUserSGPRs;
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000153 unsigned NumSystemSGPRs;
Matt Arsenault49affb82015-11-25 20:55:12 +0000154
Matt Arsenault5b22dfa2015-11-05 05:27:10 +0000155 bool HasSpilledSGPRs;
Tom Stellard42fb60e2015-01-14 15:42:31 +0000156 bool HasSpilledVGPRs;
Matt Arsenault296b8492016-02-12 06:31:30 +0000157 bool HasNonSpillStackObjects;
Tom Stellard96468902014-09-24 01:33:17 +0000158
Marek Olsak0532c192016-07-13 17:35:15 +0000159 unsigned NumSpilledSGPRs;
160 unsigned NumSpilledVGPRs;
161
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000162 // Feature bits required for inputs passed in user SGPRs.
163 bool PrivateSegmentBuffer : 1;
Matt Arsenault49affb82015-11-25 20:55:12 +0000164 bool DispatchPtr : 1;
165 bool QueuePtr : 1;
Matt Arsenault49affb82015-11-25 20:55:12 +0000166 bool KernargSegmentPtr : 1;
Matt Arsenault8d718dc2016-07-22 17:01:30 +0000167 bool DispatchID : 1;
Matt Arsenault49affb82015-11-25 20:55:12 +0000168 bool FlatScratchInit : 1;
169 bool GridWorkgroupCountX : 1;
170 bool GridWorkgroupCountY : 1;
171 bool GridWorkgroupCountZ : 1;
Tom Stellardc149dc02013-11-27 21:23:35 +0000172
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000173 // Feature bits required for inputs passed in system SGPRs.
Matt Arsenault49affb82015-11-25 20:55:12 +0000174 bool WorkGroupIDX : 1; // Always initialized.
175 bool WorkGroupIDY : 1;
176 bool WorkGroupIDZ : 1;
177 bool WorkGroupInfo : 1;
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000178 bool PrivateSegmentWaveByteOffset : 1;
Matt Arsenault49affb82015-11-25 20:55:12 +0000179
180 bool WorkItemIDX : 1; // Always initialized.
181 bool WorkItemIDY : 1;
182 bool WorkItemIDZ : 1;
183
Tom Stellard2f3f9852017-01-25 01:25:13 +0000184 // Private memory buffer
185 // Compute directly in sgpr[0:1]
186 // Other shaders indirect 64-bits at sgpr[0:1]
Matt Arsenault10fc0622017-06-26 03:01:31 +0000187 bool ImplicitBufferPtr : 1;
Tom Stellard2f3f9852017-01-25 01:25:13 +0000188
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000189 MCPhysReg getNextUserSGPR() const {
190 assert(NumSystemSGPRs == 0 && "System SGPRs must be added after user SGPRs");
191 return AMDGPU::SGPR0 + NumUserSGPRs;
192 }
193
194 MCPhysReg getNextSystemSGPR() const {
195 return AMDGPU::SGPR0 + NumUserSGPRs + NumSystemSGPRs;
196 }
197
Matt Arsenault49affb82015-11-25 20:55:12 +0000198public:
Tom Stellardc149dc02013-11-27 21:23:35 +0000199 struct SpilledReg {
Eugene Zelenko66203762017-01-21 00:53:49 +0000200 unsigned VGPR = AMDGPU::NoRegister;
201 int Lane = -1;
202
203 SpilledReg() = default;
Tom Stellardc149dc02013-11-27 21:23:35 +0000204 SpilledReg(unsigned R, int L) : VGPR (R), Lane (L) { }
Eugene Zelenko66203762017-01-21 00:53:49 +0000205
Tom Stellardc149dc02013-11-27 21:23:35 +0000206 bool hasLane() { return Lane != -1;}
Tom Stellard649b5db2016-03-04 18:31:18 +0000207 bool hasReg() { return VGPR != AMDGPU::NoRegister;}
Tom Stellardc149dc02013-11-27 21:23:35 +0000208 };
209
Matt Arsenaulte0bf7d02017-02-21 19:12:08 +0000210private:
211 // SGPR->VGPR spilling support.
212 typedef std::pair<unsigned, unsigned> SpillRegMask;
213
214 // Track VGPR + wave index for each subregister of the SGPR spilled to
215 // frameindex key.
216 DenseMap<int, std::vector<SpilledReg>> SGPRToVGPRSpills;
217 unsigned NumVGPRSpillLanes = 0;
218 SmallVector<unsigned, 2> SpillVGPRs;
219
220public:
Tom Stellardc149dc02013-11-27 21:23:35 +0000221
Tom Stellard75aadc22012-12-11 21:25:42 +0000222 SIMachineFunctionInfo(const MachineFunction &MF);
Eugene Zelenko66203762017-01-21 00:53:49 +0000223
Matt Arsenaulte0bf7d02017-02-21 19:12:08 +0000224 ArrayRef<SpilledReg> getSGPRToVGPRSpills(int FrameIndex) const {
225 auto I = SGPRToVGPRSpills.find(FrameIndex);
226 return (I == SGPRToVGPRSpills.end()) ?
227 ArrayRef<SpilledReg>() : makeArrayRef(I->second);
228 }
229
230 bool allocateSGPRSpillToVGPR(MachineFunction &MF, int FI);
231 void removeSGPRToVGPRFrameIndices(MachineFrameInfo &MFI);
232
Tom Stellard96468902014-09-24 01:33:17 +0000233 bool hasCalculatedTID() const { return TIDReg != AMDGPU::NoRegister; };
234 unsigned getTIDReg() const { return TIDReg; };
235 void setTIDReg(unsigned Reg) { TIDReg = Reg; }
Matt Arsenault5b22dfa2015-11-05 05:27:10 +0000236
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000237 // Add user SGPRs.
238 unsigned addPrivateSegmentBuffer(const SIRegisterInfo &TRI);
239 unsigned addDispatchPtr(const SIRegisterInfo &TRI);
240 unsigned addQueuePtr(const SIRegisterInfo &TRI);
241 unsigned addKernargSegmentPtr(const SIRegisterInfo &TRI);
Matt Arsenault8d718dc2016-07-22 17:01:30 +0000242 unsigned addDispatchID(const SIRegisterInfo &TRI);
Matt Arsenault296b8492016-02-12 06:31:30 +0000243 unsigned addFlatScratchInit(const SIRegisterInfo &TRI);
Matt Arsenault10fc0622017-06-26 03:01:31 +0000244 unsigned addImplicitBufferPtr(const SIRegisterInfo &TRI);
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000245
246 // Add system SGPRs.
247 unsigned addWorkGroupIDX() {
248 WorkGroupIDXSystemSGPR = getNextSystemSGPR();
249 NumSystemSGPRs += 1;
250 return WorkGroupIDXSystemSGPR;
251 }
252
253 unsigned addWorkGroupIDY() {
254 WorkGroupIDYSystemSGPR = getNextSystemSGPR();
255 NumSystemSGPRs += 1;
256 return WorkGroupIDYSystemSGPR;
257 }
258
259 unsigned addWorkGroupIDZ() {
260 WorkGroupIDZSystemSGPR = getNextSystemSGPR();
261 NumSystemSGPRs += 1;
262 return WorkGroupIDZSystemSGPR;
263 }
264
265 unsigned addWorkGroupInfo() {
266 WorkGroupInfoSystemSGPR = getNextSystemSGPR();
267 NumSystemSGPRs += 1;
268 return WorkGroupInfoSystemSGPR;
269 }
270
271 unsigned addPrivateSegmentWaveByteOffset() {
272 PrivateSegmentWaveByteOffsetSystemSGPR = getNextSystemSGPR();
273 NumSystemSGPRs += 1;
274 return PrivateSegmentWaveByteOffsetSystemSGPR;
275 }
276
Tom Stellardf110f8f2016-04-14 16:27:03 +0000277 void setPrivateSegmentWaveByteOffset(unsigned Reg) {
278 PrivateSegmentWaveByteOffsetSystemSGPR = Reg;
279 }
280
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000281 bool hasPrivateSegmentBuffer() const {
282 return PrivateSegmentBuffer;
283 }
284
Matt Arsenault49affb82015-11-25 20:55:12 +0000285 bool hasDispatchPtr() const {
286 return DispatchPtr;
287 }
288
289 bool hasQueuePtr() const {
290 return QueuePtr;
291 }
292
Matt Arsenault49affb82015-11-25 20:55:12 +0000293 bool hasKernargSegmentPtr() const {
294 return KernargSegmentPtr;
295 }
296
Matt Arsenault8d718dc2016-07-22 17:01:30 +0000297 bool hasDispatchID() const {
298 return DispatchID;
299 }
300
Matt Arsenault49affb82015-11-25 20:55:12 +0000301 bool hasFlatScratchInit() const {
302 return FlatScratchInit;
303 }
304
305 bool hasGridWorkgroupCountX() const {
306 return GridWorkgroupCountX;
307 }
308
309 bool hasGridWorkgroupCountY() const {
310 return GridWorkgroupCountY;
311 }
312
313 bool hasGridWorkgroupCountZ() const {
314 return GridWorkgroupCountZ;
315 }
316
317 bool hasWorkGroupIDX() const {
318 return WorkGroupIDX;
319 }
320
321 bool hasWorkGroupIDY() const {
322 return WorkGroupIDY;
323 }
324
325 bool hasWorkGroupIDZ() const {
326 return WorkGroupIDZ;
327 }
328
329 bool hasWorkGroupInfo() const {
330 return WorkGroupInfo;
331 }
332
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000333 bool hasPrivateSegmentWaveByteOffset() const {
334 return PrivateSegmentWaveByteOffset;
335 }
336
Matt Arsenault49affb82015-11-25 20:55:12 +0000337 bool hasWorkItemIDX() const {
338 return WorkItemIDX;
339 }
340
341 bool hasWorkItemIDY() const {
342 return WorkItemIDY;
343 }
344
345 bool hasWorkItemIDZ() const {
346 return WorkItemIDZ;
347 }
348
Matt Arsenault10fc0622017-06-26 03:01:31 +0000349 bool hasImplicitBufferPtr() const {
350 return ImplicitBufferPtr;
Tom Stellard2f3f9852017-01-25 01:25:13 +0000351 }
352
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000353 unsigned getNumUserSGPRs() const {
354 return NumUserSGPRs;
355 }
356
357 unsigned getNumPreloadedSGPRs() const {
358 return NumUserSGPRs + NumSystemSGPRs;
359 }
360
361 unsigned getPrivateSegmentWaveByteOffsetSystemSGPR() const {
362 return PrivateSegmentWaveByteOffsetSystemSGPR;
363 }
364
Matt Arsenault49affb82015-11-25 20:55:12 +0000365 /// \brief Returns the physical register reserved for use as the resource
366 /// descriptor for scratch accesses.
367 unsigned getScratchRSrcReg() const {
368 return ScratchRSrcReg;
369 }
370
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000371 void setScratchRSrcReg(unsigned Reg) {
372 assert(Reg != AMDGPU::NoRegister && "Should never be unset");
373 ScratchRSrcReg = Reg;
374 }
375
376 unsigned getScratchWaveOffsetReg() const {
377 return ScratchWaveOffsetReg;
378 }
379
Matt Arsenault1c0ae392017-04-24 18:05:16 +0000380 unsigned getFrameOffsetReg() const {
381 return FrameOffsetReg;
382 }
383
384 void setStackPtrOffsetReg(unsigned Reg) {
Matt Arsenault1c0ae392017-04-24 18:05:16 +0000385 StackPtrOffsetReg = Reg;
386 }
387
Matt Arsenault1cc47f82017-07-18 16:44:56 +0000388 // Note the unset value for this is AMDGPU::SP_REG rather than
389 // NoRegister. This is mostly a workaround for MIR tests where state that
390 // can't be directly computed from the function is not preserved in serialized
391 // MIR.
Matt Arsenault1c0ae392017-04-24 18:05:16 +0000392 unsigned getStackPtrOffsetReg() const {
393 return StackPtrOffsetReg;
394 }
395
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000396 void setScratchWaveOffsetReg(unsigned Reg) {
397 assert(Reg != AMDGPU::NoRegister && "Should never be unset");
398 ScratchWaveOffsetReg = Reg;
Matt Arsenault2b1f9aa2017-05-17 21:56:25 +0000399 if (isEntryFunction())
400 FrameOffsetReg = ScratchWaveOffsetReg;
Matt Arsenault26f8f3d2015-11-30 21:16:03 +0000401 }
Matt Arsenault49affb82015-11-25 20:55:12 +0000402
Matt Arsenault99c14522016-04-25 19:27:24 +0000403 unsigned getQueuePtrUserSGPR() const {
404 return QueuePtrUserSGPR;
405 }
406
Matt Arsenault10fc0622017-06-26 03:01:31 +0000407 unsigned getImplicitBufferPtrUserSGPR() const {
408 return ImplicitBufferPtrUserSGPR;
Tom Stellard2f3f9852017-01-25 01:25:13 +0000409 }
410
Matt Arsenault5b22dfa2015-11-05 05:27:10 +0000411 bool hasSpilledSGPRs() const {
412 return HasSpilledSGPRs;
413 }
414
415 void setHasSpilledSGPRs(bool Spill = true) {
416 HasSpilledSGPRs = Spill;
417 }
418
419 bool hasSpilledVGPRs() const {
420 return HasSpilledVGPRs;
421 }
422
423 void setHasSpilledVGPRs(bool Spill = true) {
424 HasSpilledVGPRs = Spill;
425 }
Tom Stellard96468902014-09-24 01:33:17 +0000426
Matt Arsenault296b8492016-02-12 06:31:30 +0000427 bool hasNonSpillStackObjects() const {
428 return HasNonSpillStackObjects;
429 }
430
431 void setHasNonSpillStackObjects(bool StackObject = true) {
432 HasNonSpillStackObjects = StackObject;
433 }
434
Marek Olsak0532c192016-07-13 17:35:15 +0000435 unsigned getNumSpilledSGPRs() const {
436 return NumSpilledSGPRs;
437 }
438
439 unsigned getNumSpilledVGPRs() const {
440 return NumSpilledVGPRs;
441 }
442
443 void addToSpilledSGPRs(unsigned num) {
444 NumSpilledSGPRs += num;
445 }
446
447 void addToSpilledVGPRs(unsigned num) {
448 NumSpilledVGPRs += num;
449 }
450
Marek Olsakfccabaf2016-01-13 11:45:36 +0000451 unsigned getPSInputAddr() const {
452 return PSInputAddr;
453 }
454
Matt Arsenaulte622dc32017-04-11 22:29:24 +0000455 unsigned getPSInputEnable() const {
456 return PSInputEnable;
457 }
458
Marek Olsakfccabaf2016-01-13 11:45:36 +0000459 bool isPSInputAllocated(unsigned Index) const {
460 return PSInputAddr & (1 << Index);
461 }
462
463 void markPSInputAllocated(unsigned Index) {
464 PSInputAddr |= 1 << Index;
465 }
466
Matt Arsenaulte622dc32017-04-11 22:29:24 +0000467 void markPSInputEnabled(unsigned Index) {
468 PSInputEnable |= 1 << Index;
469 }
470
Marek Olsak8e9cc632016-01-13 17:23:09 +0000471 bool returnsVoid() const {
472 return ReturnsVoid;
473 }
474
475 void setIfReturnsVoid(bool Value) {
476 ReturnsVoid = Value;
477 }
478
Konstantin Zhuravlyov1d650262016-09-06 20:22:28 +0000479 /// \returns A pair of default/requested minimum/maximum flat work group sizes
480 /// for this function.
481 std::pair<unsigned, unsigned> getFlatWorkGroupSizes() const {
482 return FlatWorkGroupSizes;
483 }
484
485 /// \returns Default/requested minimum flat work group size for this function.
486 unsigned getMinFlatWorkGroupSize() const {
487 return FlatWorkGroupSizes.first;
488 }
489
490 /// \returns Default/requested maximum flat work group size for this function.
491 unsigned getMaxFlatWorkGroupSize() const {
492 return FlatWorkGroupSizes.second;
493 }
494
495 /// \returns A pair of default/requested minimum/maximum number of waves per
496 /// execution unit.
497 std::pair<unsigned, unsigned> getWavesPerEU() const {
498 return WavesPerEU;
499 }
500
501 /// \returns Default/requested minimum number of waves per execution unit.
502 unsigned getMinWavesPerEU() const {
503 return WavesPerEU.first;
504 }
505
506 /// \returns Default/requested maximum number of waves per execution unit.
507 unsigned getMaxWavesPerEU() const {
508 return WavesPerEU.second;
Konstantin Zhuravlyov71515e52016-04-26 17:24:40 +0000509 }
510
Konstantin Zhuravlyovf2f3d142016-06-25 03:11:28 +0000511 /// \returns Stack object index for \p Dim's work group ID.
512 int getDebuggerWorkGroupIDStackObjectIndex(unsigned Dim) const {
513 assert(Dim < 3);
514 return DebuggerWorkGroupIDStackObjectIndices[Dim];
515 }
516
517 /// \brief Sets stack object index for \p Dim's work group ID to \p ObjectIdx.
518 void setDebuggerWorkGroupIDStackObjectIndex(unsigned Dim, int ObjectIdx) {
519 assert(Dim < 3);
520 DebuggerWorkGroupIDStackObjectIndices[Dim] = ObjectIdx;
521 }
522
523 /// \returns Stack object index for \p Dim's work item ID.
524 int getDebuggerWorkItemIDStackObjectIndex(unsigned Dim) const {
525 assert(Dim < 3);
526 return DebuggerWorkItemIDStackObjectIndices[Dim];
527 }
528
529 /// \brief Sets stack object index for \p Dim's work item ID to \p ObjectIdx.
530 void setDebuggerWorkItemIDStackObjectIndex(unsigned Dim, int ObjectIdx) {
531 assert(Dim < 3);
532 DebuggerWorkItemIDStackObjectIndices[Dim] = ObjectIdx;
533 }
534
535 /// \returns SGPR used for \p Dim's work group ID.
536 unsigned getWorkGroupIDSGPR(unsigned Dim) const {
537 switch (Dim) {
538 case 0:
539 assert(hasWorkGroupIDX());
540 return WorkGroupIDXSystemSGPR;
541 case 1:
542 assert(hasWorkGroupIDY());
543 return WorkGroupIDYSystemSGPR;
544 case 2:
545 assert(hasWorkGroupIDZ());
546 return WorkGroupIDZSystemSGPR;
547 }
548 llvm_unreachable("unexpected dimension");
549 }
550
551 /// \returns VGPR used for \p Dim' work item ID.
552 unsigned getWorkItemIDVGPR(unsigned Dim) const {
553 switch (Dim) {
554 case 0:
555 assert(hasWorkItemIDX());
556 return AMDGPU::VGPR0;
557 case 1:
558 assert(hasWorkItemIDY());
559 return AMDGPU::VGPR1;
560 case 2:
561 assert(hasWorkItemIDZ());
562 return AMDGPU::VGPR2;
563 }
564 llvm_unreachable("unexpected dimension");
565 }
Tom Stellard244891d2016-12-20 15:52:17 +0000566
Matt Arsenault161e2b42017-04-18 20:59:40 +0000567 unsigned getLDSWaveSpillSize() const {
568 return LDSWaveSpillSize;
569 }
570
Tom Stellard6f9ef142016-12-20 17:19:44 +0000571 const AMDGPUBufferPseudoSourceValue *getBufferPSV() const {
572 return &BufferPSV;
573 }
574
Tom Stellardbb138882016-12-20 17:26:34 +0000575 const AMDGPUImagePseudoSourceValue *getImagePSV() const {
576 return &ImagePSV;
Tom Stellard244891d2016-12-20 15:52:17 +0000577 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000578};
579
Eugene Zelenko66203762017-01-21 00:53:49 +0000580} // end namespace llvm
Tom Stellard75aadc22012-12-11 21:25:42 +0000581
Eugene Zelenko66203762017-01-21 00:53:49 +0000582#endif // LLVM_LIB_TARGET_AMDGPU_SIMACHINEFUNCTIONINFO_H