Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 1 | //===-- AMDGPUMachineFunctionInfo.cpp ---------------------------------------=// |
| 2 | // |
Chandler Carruth | 2946cd7 | 2019-01-19 08:50:56 +0000 | [diff] [blame^] | 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 9 | #include "AMDGPUMachineFunction.h" |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 10 | #include "AMDGPUSubtarget.h" |
Stanislav Mekhanoshin | 1c53842 | 2018-05-25 17:25:12 +0000 | [diff] [blame] | 11 | #include "AMDGPUPerfHintAnalysis.h" |
| 12 | #include "llvm/CodeGen/MachineModuleInfo.h" |
Matt Arsenault | e935f05 | 2016-06-18 05:15:53 +0000 | [diff] [blame] | 13 | |
Craig Topper | 8fc4096 | 2013-07-17 00:31:35 +0000 | [diff] [blame] | 14 | using namespace llvm; |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 15 | |
Vincent Lejeune | ace6f73 | 2013-04-01 21:47:53 +0000 | [diff] [blame] | 16 | AMDGPUMachineFunction::AMDGPUMachineFunction(const MachineFunction &MF) : |
Matt Arsenault | 762af96 | 2014-07-13 03:06:39 +0000 | [diff] [blame] | 17 | MachineFunctionInfo(), |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 18 | LocalMemoryObjects(), |
Matt Arsenault | 75e7192 | 2018-06-28 10:18:55 +0000 | [diff] [blame] | 19 | ExplicitKernArgSize(0), |
Matt Arsenault | e935f05 | 2016-06-18 05:15:53 +0000 | [diff] [blame] | 20 | MaxKernArgAlign(0), |
Matt Arsenault | 3f98140 | 2014-09-15 15:41:53 +0000 | [diff] [blame] | 21 | LDSSize(0), |
Matthias Braun | f1caa28 | 2017-12-15 22:22:58 +0000 | [diff] [blame] | 22 | IsEntryFunction(AMDGPU::isEntryFunctionCC(MF.getFunction().getCallingConv())), |
Stanislav Mekhanoshin | 1c53842 | 2018-05-25 17:25:12 +0000 | [diff] [blame] | 23 | NoSignedZerosFPMath(MF.getTarget().Options.NoSignedZerosFPMath), |
| 24 | MemoryBound(false), |
| 25 | WaveLimiter(false) { |
Matt Arsenault | 4bec7d4 | 2018-07-20 09:05:08 +0000 | [diff] [blame] | 26 | const AMDGPUSubtarget &ST = AMDGPUSubtarget::get(MF); |
| 27 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 28 | // FIXME: Should initialize KernArgSize based on ExplicitKernelArgOffset, |
| 29 | // except reserved size is not correctly aligned. |
Matt Arsenault | 4bec7d4 | 2018-07-20 09:05:08 +0000 | [diff] [blame] | 30 | const Function &F = MF.getFunction(); |
Stanislav Mekhanoshin | 1c53842 | 2018-05-25 17:25:12 +0000 | [diff] [blame] | 31 | |
| 32 | if (auto *Resolver = MF.getMMI().getResolver()) { |
| 33 | if (AMDGPUPerfHintAnalysis *PHA = static_cast<AMDGPUPerfHintAnalysis*>( |
| 34 | Resolver->getAnalysisIfAvailable(&AMDGPUPerfHintAnalysisID, true))) { |
Matt Arsenault | 4bec7d4 | 2018-07-20 09:05:08 +0000 | [diff] [blame] | 35 | MemoryBound = PHA->isMemoryBound(&F); |
| 36 | WaveLimiter = PHA->needsWaveLimiter(&F); |
Stanislav Mekhanoshin | 1c53842 | 2018-05-25 17:25:12 +0000 | [diff] [blame] | 37 | } |
| 38 | } |
Matt Arsenault | 4bec7d4 | 2018-07-20 09:05:08 +0000 | [diff] [blame] | 39 | |
| 40 | CallingConv::ID CC = F.getCallingConv(); |
| 41 | if (CC == CallingConv::AMDGPU_KERNEL || CC == CallingConv::SPIR_KERNEL) |
| 42 | ExplicitKernArgSize = ST.getExplicitKernArgSize(F, MaxKernArgAlign); |
Nikolay Haustov | beb24f5 | 2016-07-01 10:00:58 +0000 | [diff] [blame] | 43 | } |
| 44 | |
Matt Arsenault | 52ef401 | 2016-07-26 16:45:58 +0000 | [diff] [blame] | 45 | unsigned AMDGPUMachineFunction::allocateLDSGlobal(const DataLayout &DL, |
| 46 | const GlobalValue &GV) { |
| 47 | auto Entry = LocalMemoryObjects.insert(std::make_pair(&GV, 0)); |
| 48 | if (!Entry.second) |
| 49 | return Entry.first->second; |
| 50 | |
| 51 | unsigned Align = GV.getAlignment(); |
| 52 | if (Align == 0) |
| 53 | Align = DL.getABITypeAlignment(GV.getValueType()); |
| 54 | |
| 55 | /// TODO: We should sort these to minimize wasted space due to alignment |
| 56 | /// padding. Currently the padding is decided by the first encountered use |
| 57 | /// during lowering. |
| 58 | unsigned Offset = LDSSize = alignTo(LDSSize, Align); |
| 59 | |
| 60 | Entry.first->second = Offset; |
| 61 | LDSSize += DL.getTypeAllocSize(GV.getValueType()); |
| 62 | |
| 63 | return Offset; |
Nikolay Haustov | beb24f5 | 2016-07-01 10:00:58 +0000 | [diff] [blame] | 64 | } |