Matt Arsenault | 6b6a2c3 | 2016-03-11 08:00:27 +0000 | [diff] [blame] | 1 | //===-- AMDGPUMachineFunctionInfo.h -------------------------------*- C++ -*-=// |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 9 | |
Matt Arsenault | 6b6a2c3 | 2016-03-11 08:00:27 +0000 | [diff] [blame] | 10 | #ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H |
| 11 | #define LLVM_LIB_TARGET_AMDGPU_AMDGPUMACHINEFUNCTION_H |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 12 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 13 | #include "llvm/ADT/DenseMap.h" |
Chandler Carruth | 6bda14b | 2017-06-06 11:49:48 +0000 | [diff] [blame] | 14 | #include "llvm/CodeGen/MachineFunction.h" |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 15 | |
| 16 | namespace llvm { |
| 17 | |
Matt Arsenault | 75e7192 | 2018-06-28 10:18:55 +0000 | [diff] [blame^] | 18 | class AMDGPUSubtarget; |
| 19 | |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 20 | class AMDGPUMachineFunction : public MachineFunctionInfo { |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 21 | /// A map to keep track of local memory objects and their offsets within the |
| 22 | /// local memory space. |
| 23 | SmallDenseMap<const GlobalValue *, unsigned, 4> LocalMemoryObjects; |
| 24 | |
Matt Arsenault | 1ea0402 | 2018-05-29 19:35:00 +0000 | [diff] [blame] | 25 | protected: |
Matt Arsenault | 75e7192 | 2018-06-28 10:18:55 +0000 | [diff] [blame^] | 26 | uint64_t ExplicitKernArgSize; |
Matt Arsenault | e935f05 | 2016-06-18 05:15:53 +0000 | [diff] [blame] | 27 | unsigned MaxKernArgAlign; |
| 28 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 29 | /// Number of bytes in the LDS that are being used. |
| 30 | unsigned LDSSize; |
| 31 | |
Hiroshi Inoue | ae17900 | 2018-04-14 08:59:00 +0000 | [diff] [blame] | 32 | // Kernels + shaders. i.e. functions called by the driver and not called |
Matt Arsenault | 1074cb5 | 2017-03-30 23:58:04 +0000 | [diff] [blame] | 33 | // by other functions. |
| 34 | bool IsEntryFunction; |
| 35 | |
Matt Arsenault | 3cb3904 | 2017-02-27 19:35:42 +0000 | [diff] [blame] | 36 | bool NoSignedZerosFPMath; |
Matt Arsenault | 762af96 | 2014-07-13 03:06:39 +0000 | [diff] [blame] | 37 | |
Stanislav Mekhanoshin | 1c53842 | 2018-05-25 17:25:12 +0000 | [diff] [blame] | 38 | // Function may be memory bound. |
| 39 | bool MemoryBound; |
| 40 | |
| 41 | // Kernel may need limited waves per EU for better performance. |
| 42 | bool WaveLimiter; |
| 43 | |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 44 | public: |
| 45 | AMDGPUMachineFunction(const MachineFunction &MF); |
Matt Arsenault | e935f05 | 2016-06-18 05:15:53 +0000 | [diff] [blame] | 46 | |
| 47 | uint64_t allocateKernArg(uint64_t Size, unsigned Align) { |
| 48 | assert(isPowerOf2_32(Align)); |
Matt Arsenault | 75e7192 | 2018-06-28 10:18:55 +0000 | [diff] [blame^] | 49 | ExplicitKernArgSize = alignTo(ExplicitKernArgSize, Align); |
Matt Arsenault | e935f05 | 2016-06-18 05:15:53 +0000 | [diff] [blame] | 50 | |
Matt Arsenault | 75e7192 | 2018-06-28 10:18:55 +0000 | [diff] [blame^] | 51 | uint64_t Result = ExplicitKernArgSize; |
| 52 | ExplicitKernArgSize += Size; |
Matt Arsenault | e935f05 | 2016-06-18 05:15:53 +0000 | [diff] [blame] | 53 | |
| 54 | MaxKernArgAlign = std::max(Align, MaxKernArgAlign); |
| 55 | return Result; |
| 56 | } |
| 57 | |
Matt Arsenault | 75e7192 | 2018-06-28 10:18:55 +0000 | [diff] [blame^] | 58 | uint64_t getExplicitKernArgSize() const { |
| 59 | return ExplicitKernArgSize; |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 60 | } |
Matt Arsenault | 762af96 | 2014-07-13 03:06:39 +0000 | [diff] [blame] | 61 | |
Tom Stellard | 175959e | 2016-12-06 21:53:10 +0000 | [diff] [blame] | 62 | unsigned getMaxKernArgAlign() const { |
| 63 | return MaxKernArgAlign; |
| 64 | } |
| 65 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 66 | unsigned getLDSSize() const { |
| 67 | return LDSSize; |
| 68 | } |
| 69 | |
Matt Arsenault | 1074cb5 | 2017-03-30 23:58:04 +0000 | [diff] [blame] | 70 | bool isEntryFunction() const { |
| 71 | return IsEntryFunction; |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 72 | } |
| 73 | |
Matt Arsenault | 3cb3904 | 2017-02-27 19:35:42 +0000 | [diff] [blame] | 74 | bool hasNoSignedZerosFPMath() const { |
| 75 | return NoSignedZerosFPMath; |
| 76 | } |
| 77 | |
Stanislav Mekhanoshin | 1c53842 | 2018-05-25 17:25:12 +0000 | [diff] [blame] | 78 | bool isMemoryBound() const { |
| 79 | return MemoryBound; |
| 80 | } |
| 81 | |
| 82 | bool needsWaveLimiter() const { |
| 83 | return WaveLimiter; |
| 84 | } |
| 85 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 86 | unsigned allocateLDSGlobal(const DataLayout &DL, const GlobalValue &GV); |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 87 | }; |
| 88 | |
Alexander Kornienko | f00654e | 2015-06-23 09:49:53 +0000 | [diff] [blame] | 89 | } |
Benjamin Kramer | a7c40ef | 2014-08-13 16:26:38 +0000 | [diff] [blame] | 90 | #endif |