blob: 0574c991ee6e9c1123d25f611e01d48986848330 [file] [log] [blame]
//===-- AMDGPUMachineFunctionInfo.cpp ---------------------------------------=//
//
// The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
9
Vincent Lejeuneace6f732013-04-01 21:47:53 +000010#include "AMDGPUMachineFunction.h"
Matt Arsenault52ef4012016-07-26 16:45:58 +000011#include "AMDGPUSubtarget.h"
Stanislav Mekhanoshin1c538422018-05-25 17:25:12 +000012#include "AMDGPUPerfHintAnalysis.h"
13#include "llvm/CodeGen/MachineModuleInfo.h"
Matt Arsenaulte935f052016-06-18 05:15:53 +000014
Craig Topper8fc40962013-07-17 00:31:35 +000015using namespace llvm;
Vincent Lejeuneace6f732013-04-01 21:47:53 +000016
Vincent Lejeuneace6f732013-04-01 21:47:53 +000017AMDGPUMachineFunction::AMDGPUMachineFunction(const MachineFunction &MF) :
Matt Arsenault762af962014-07-13 03:06:39 +000018 MachineFunctionInfo(),
Matt Arsenault52ef4012016-07-26 16:45:58 +000019 LocalMemoryObjects(),
Matt Arsenault75e71922018-06-28 10:18:55 +000020 ExplicitKernArgSize(0),
Matt Arsenaulte935f052016-06-18 05:15:53 +000021 MaxKernArgAlign(0),
Matt Arsenault3f981402014-09-15 15:41:53 +000022 LDSSize(0),
Matthias Braunf1caa282017-12-15 22:22:58 +000023 IsEntryFunction(AMDGPU::isEntryFunctionCC(MF.getFunction().getCallingConv())),
Stanislav Mekhanoshin1c538422018-05-25 17:25:12 +000024 NoSignedZerosFPMath(MF.getTarget().Options.NoSignedZerosFPMath),
25 MemoryBound(false),
26 WaveLimiter(false) {
Matt Arsenault52ef4012016-07-26 16:45:58 +000027 // FIXME: Should initialize KernArgSize based on ExplicitKernelArgOffset,
28 // except reserved size is not correctly aligned.
Stanislav Mekhanoshin1c538422018-05-25 17:25:12 +000029
30 if (auto *Resolver = MF.getMMI().getResolver()) {
31 if (AMDGPUPerfHintAnalysis *PHA = static_cast<AMDGPUPerfHintAnalysis*>(
32 Resolver->getAnalysisIfAvailable(&AMDGPUPerfHintAnalysisID, true))) {
33 MemoryBound = PHA->isMemoryBound(&MF.getFunction());
34 WaveLimiter = PHA->needsWaveLimiter(&MF.getFunction());
35 }
36 }
Nikolay Haustovbeb24f52016-07-01 10:00:58 +000037}
38
Matt Arsenault52ef4012016-07-26 16:45:58 +000039unsigned AMDGPUMachineFunction::allocateLDSGlobal(const DataLayout &DL,
40 const GlobalValue &GV) {
41 auto Entry = LocalMemoryObjects.insert(std::make_pair(&GV, 0));
42 if (!Entry.second)
43 return Entry.first->second;
44
45 unsigned Align = GV.getAlignment();
46 if (Align == 0)
47 Align = DL.getABITypeAlignment(GV.getValueType());
48
49 /// TODO: We should sort these to minimize wasted space due to alignment
50 /// padding. Currently the padding is decided by the first encountered use
51 /// during lowering.
52 unsigned Offset = LDSSize = alignTo(LDSSize, Align);
53
54 Entry.first->second = Offset;
55 LDSSize += DL.getTypeAllocSize(GV.getValueType());
56
57 return Offset;
Nikolay Haustovbeb24f52016-07-01 10:00:58 +000058}