Matt Arsenault | 6b6a2c3 | 2016-03-11 08:00:27 +0000 | [diff] [blame] | 1 | //===-- AMDGPUMachineFunctionInfo.h -------------------------------*- C++ -*-=// |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 9 | |
Matt Arsenault | 6b6a2c3 | 2016-03-11 08:00:27 +0000 | [diff] [blame] | 10 | #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H |
| 11 | #define LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 12 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 13 | #include "llvm/ADT/DenseMap.h" |
Chandler Carruth | 6bda14b | 2017-06-06 11:49:48 +0000 | [diff] [blame] | 14 | #include "llvm/CodeGen/MachineFunction.h" |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 15 | |
| 16 | namespace llvm { |
| 17 | |
| 18 | class AMDGPUMachineFunction : public MachineFunctionInfo { |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 19 | /// A map to keep track of local memory objects and their offsets within the |
| 20 | /// local memory space. |
| 21 | SmallDenseMap<const GlobalValue *, unsigned, 4> LocalMemoryObjects; |
| 22 | |
Matt Arsenault | e935f05 | 2016-06-18 05:15:53 +0000 | [diff] [blame] | 23 | uint64_t KernArgSize; |
| 24 | unsigned MaxKernArgAlign; |
| 25 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 26 | /// Number of bytes in the LDS that are being used. |
| 27 | unsigned LDSSize; |
| 28 | |
| 29 | // FIXME: This should probably be removed. |
| 30 | /// Start of implicit kernel args |
| 31 | unsigned ABIArgOffset; |
| 32 | |
Hiroshi Inoue | ae17900 | 2018-04-14 08:59:00 +0000 | [diff] [blame] | 33 | // Kernels + shaders. i.e. functions called by the driver and not called |
Matt Arsenault | 1074cb5 | 2017-03-30 23:58:04 +0000 | [diff] [blame] | 34 | // by other functions. |
| 35 | bool IsEntryFunction; |
| 36 | |
Matt Arsenault | 3cb3904 | 2017-02-27 19:35:42 +0000 | [diff] [blame] | 37 | bool NoSignedZerosFPMath; |
Matt Arsenault | 762af96 | 2014-07-13 03:06:39 +0000 | [diff] [blame] | 38 | |
Stanislav Mekhanoshin | 1c53842 | 2018-05-25 17:25:12 +0000 | [diff] [blame^] | 39 | // Function may be memory bound. |
| 40 | bool MemoryBound; |
| 41 | |
| 42 | // Kernel may need limited waves per EU for better performance. |
| 43 | bool WaveLimiter; |
| 44 | |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 45 | public: |
| 46 | AMDGPUMachineFunction(const MachineFunction &MF); |
Matt Arsenault | e935f05 | 2016-06-18 05:15:53 +0000 | [diff] [blame] | 47 | |
| 48 | uint64_t allocateKernArg(uint64_t Size, unsigned Align) { |
| 49 | assert(isPowerOf2_32(Align)); |
| 50 | KernArgSize = alignTo(KernArgSize, Align); |
| 51 | |
| 52 | uint64_t Result = KernArgSize; |
| 53 | KernArgSize += Size; |
| 54 | |
| 55 | MaxKernArgAlign = std::max(Align, MaxKernArgAlign); |
| 56 | return Result; |
| 57 | } |
| 58 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 59 | uint64_t getKernArgSize() const { |
| 60 | return KernArgSize; |
| 61 | } |
Matt Arsenault | 762af96 | 2014-07-13 03:06:39 +0000 | [diff] [blame] | 62 | |
Tom Stellard | 175959e | 2016-12-06 21:53:10 +0000 | [diff] [blame] | 63 | unsigned getMaxKernArgAlign() const { |
| 64 | return MaxKernArgAlign; |
| 65 | } |
| 66 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 67 | void setABIArgOffset(unsigned NewOffset) { |
| 68 | ABIArgOffset = NewOffset; |
| 69 | } |
Jan Vesely | e5121f3 | 2014-10-14 20:05:26 +0000 | [diff] [blame] | 70 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 71 | unsigned getABIArgOffset() const { |
| 72 | return ABIArgOffset; |
| 73 | } |
Tom Stellard | 1e1b05d | 2015-11-06 11:45:14 +0000 | [diff] [blame] | 74 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 75 | unsigned getLDSSize() const { |
| 76 | return LDSSize; |
| 77 | } |
| 78 | |
Matt Arsenault | 1074cb5 | 2017-03-30 23:58:04 +0000 | [diff] [blame] | 79 | bool isEntryFunction() const { |
| 80 | return IsEntryFunction; |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 81 | } |
| 82 | |
Matt Arsenault | 3cb3904 | 2017-02-27 19:35:42 +0000 | [diff] [blame] | 83 | bool hasNoSignedZerosFPMath() const { |
| 84 | return NoSignedZerosFPMath; |
| 85 | } |
| 86 | |
Stanislav Mekhanoshin | 1c53842 | 2018-05-25 17:25:12 +0000 | [diff] [blame^] | 87 | bool isMemoryBound() const { |
| 88 | return MemoryBound; |
| 89 | } |
| 90 | |
| 91 | bool needsWaveLimiter() const { |
| 92 | return WaveLimiter; |
| 93 | } |
| 94 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 95 | unsigned allocateLDSGlobal(const DataLayout &DL, const GlobalValue &GV); |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 96 | }; |
| 97 | |
Alexander Kornienko | f00654e | 2015-06-23 09:49:53 +0000 | [diff] [blame] | 98 | } |
Benjamin Kramer | a7c40ef | 2014-08-13 16:26:38 +0000 | [diff] [blame] | 99 | #endif |