Matt Arsenault | 6b6a2c3 | 2016-03-11 08:00:27 +0000 | [diff] [blame] | 1 | //===-- AMDGPUMachineFunction.h ---------------------------------*- C++ -*-===// |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 9 | |
Matt Arsenault | 6b6a2c3 | 2016-03-11 08:00:27 +0000 | [diff] [blame] | 10 | #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H |
| 11 | #define LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 12 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 13 | #include "llvm/ADT/DenseMap.h" |
Chandler Carruth | 6bda14b | 2017-06-06 11:49:48 +0000 | [diff] [blame] | 14 | #include "llvm/CodeGen/MachineFunction.h" |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 15 | |
| 16 | namespace llvm { |
| 17 | |
| 18 | class AMDGPUMachineFunction : public MachineFunctionInfo { |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 19 | /// A map to keep track of local memory objects and their offsets within the |
| 20 | /// local memory space. |
| 21 | SmallDenseMap<const GlobalValue *, unsigned, 4> LocalMemoryObjects; |
| 22 | |
Matt Arsenault | 1ea0402 | 2018-05-29 19:35:00 +0000 | [diff] [blame^] | 23 | protected: |
Matt Arsenault | e935f05 | 2016-06-18 05:15:53 +0000 | [diff] [blame] | 24 | uint64_t KernArgSize; |
| 25 | unsigned MaxKernArgAlign; |
| 26 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 27 | /// Number of bytes in the LDS that are being used. |
| 28 | unsigned LDSSize; |
| 29 | |
| 30 | // FIXME: This should probably be removed. |
| 31 | /// Start of implicit kernel args |
| 32 | unsigned ABIArgOffset; |
| 33 | |
Hiroshi Inoue | ae17900 | 2018-04-14 08:59:00 +0000 | [diff] [blame] | 34 | // Kernels + shaders. i.e. functions called by the driver and not called |
Matt Arsenault | 1074cb5 | 2017-03-30 23:58:04 +0000 | [diff] [blame] | 35 | // by other functions. |
| 36 | bool IsEntryFunction; |
| 37 | |
Matt Arsenault | 3cb3904 | 2017-02-27 19:35:42 +0000 | [diff] [blame] | 38 | bool NoSignedZerosFPMath; |
Matt Arsenault | 762af96 | 2014-07-13 03:06:39 +0000 | [diff] [blame] | 39 | |
Stanislav Mekhanoshin | 1c53842 | 2018-05-25 17:25:12 +0000 | [diff] [blame] | 40 | // Function may be memory bound. |
| 41 | bool MemoryBound; |
| 42 | |
| 43 | // Kernel may need limited waves per EU for better performance. |
| 44 | bool WaveLimiter; |
| 45 | |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 46 | public: |
| 47 | AMDGPUMachineFunction(const MachineFunction &MF); |
Matt Arsenault | e935f05 | 2016-06-18 05:15:53 +0000 | [diff] [blame] | 48 | |
| 49 | uint64_t allocateKernArg(uint64_t Size, unsigned Align) { |
| 50 | assert(isPowerOf2_32(Align)); |
| 51 | KernArgSize = alignTo(KernArgSize, Align); |
| 52 | |
| 53 | uint64_t Result = KernArgSize; |
| 54 | KernArgSize += Size; |
| 55 | |
| 56 | MaxKernArgAlign = std::max(Align, MaxKernArgAlign); |
| 57 | return Result; |
| 58 | } |
| 59 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 60 | uint64_t getKernArgSize() const { |
| 61 | return KernArgSize; |
| 62 | } |
Matt Arsenault | 762af96 | 2014-07-13 03:06:39 +0000 | [diff] [blame] | 63 | |
Tom Stellard | 175959e | 2016-12-06 21:53:10 +0000 | [diff] [blame] | 64 | unsigned getMaxKernArgAlign() const { |
| 65 | return MaxKernArgAlign; |
| 66 | } |
| 67 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 68 | void setABIArgOffset(unsigned NewOffset) { |
| 69 | ABIArgOffset = NewOffset; |
| 70 | } |
Jan Vesely | e5121f3 | 2014-10-14 20:05:26 +0000 | [diff] [blame] | 71 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 72 | unsigned getABIArgOffset() const { |
| 73 | return ABIArgOffset; |
| 74 | } |
Tom Stellard | 1e1b05d | 2015-11-06 11:45:14 +0000 | [diff] [blame] | 75 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 76 | unsigned getLDSSize() const { |
| 77 | return LDSSize; |
| 78 | } |
| 79 | |
Matt Arsenault | 1074cb5 | 2017-03-30 23:58:04 +0000 | [diff] [blame] | 80 | bool isEntryFunction() const { |
| 81 | return IsEntryFunction; |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 82 | } |
| 83 | |
Matt Arsenault | 3cb3904 | 2017-02-27 19:35:42 +0000 | [diff] [blame] | 84 | bool hasNoSignedZerosFPMath() const { |
| 85 | return NoSignedZerosFPMath; |
| 86 | } |
| 87 | |
Stanislav Mekhanoshin | 1c53842 | 2018-05-25 17:25:12 +0000 | [diff] [blame] | 88 | bool isMemoryBound() const { |
| 89 | return MemoryBound; |
| 90 | } |
| 91 | |
| 92 | bool needsWaveLimiter() const { |
| 93 | return WaveLimiter; |
| 94 | } |
| 95 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 96 | unsigned allocateLDSGlobal(const DataLayout &DL, const GlobalValue &GV); |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 97 | }; |
| 98 | |
Alexander Kornienko | f00654e | 2015-06-23 09:49:53 +0000 | [diff] [blame] | 99 | } |
Benjamin Kramer | a7c40ef | 2014-08-13 16:26:38 +0000 | [diff] [blame] | 100 | #endif |