blob: 08db0011e0912ec3f692e60a73b88773dd6d0410 [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11/// \brief The AMDGPU target machine contains all of the hardware specific
12/// information needed to emit code for R600 and SI GPUs.
13//
14//===----------------------------------------------------------------------===//
15
16#include "AMDGPUTargetMachine.h"
17#include "AMDGPU.h"
18#include "R600ISelLowering.h"
19#include "R600InstrInfo.h"
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000020#include "R600MachineScheduler.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000021#include "SIISelLowering.h"
22#include "SIInstrInfo.h"
23#include "llvm/Analysis/Passes.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000024#include "llvm/CodeGen/MachineFunctionAnalysis.h"
Aditya Nandakumara2719322014-11-13 09:26:31 +000025#include "llvm/CodeGen/TargetLoweringObjectFileImpl.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000026#include "llvm/CodeGen/MachineModuleInfo.h"
27#include "llvm/CodeGen/Passes.h"
Chandler Carruth5ad5f152014-01-13 09:26:24 +000028#include "llvm/IR/Verifier.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000029#include "llvm/MC/MCAsmInfo.h"
30#include "llvm/PassManager.h"
31#include "llvm/Support/TargetRegistry.h"
32#include "llvm/Support/raw_os_ostream.h"
33#include "llvm/Transforms/IPO.h"
34#include "llvm/Transforms/Scalar.h"
35#include <llvm/CodeGen/Passes.h>
36
37using namespace llvm;
38
39extern "C" void LLVMInitializeR600Target() {
40 // Register the target
41 RegisterTargetMachine<AMDGPUTargetMachine> X(TheAMDGPUTarget);
42}
43
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000044static ScheduleDAGInstrs *createR600MachineScheduler(MachineSchedContext *C) {
David Blaikie422b93d2014-04-21 20:32:32 +000045 return new ScheduleDAGMILive(C, make_unique<R600SchedStrategy>());
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000046}
47
48static MachineSchedRegistry
49SchedCustomRegistry("r600", "Run R600's custom scheduler",
50 createR600MachineScheduler);
51
Tom Stellard75aadc22012-12-11 21:25:42 +000052AMDGPUTargetMachine::AMDGPUTargetMachine(const Target &T, StringRef TT,
Eric Christopherac4b69e2014-07-25 22:22:39 +000053 StringRef CPU, StringRef FS,
54 TargetOptions Options, Reloc::Model RM,
55 CodeModel::Model CM,
56 CodeGenOpt::Level OptLevel)
57 : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OptLevel),
Aditya Nandakumara2719322014-11-13 09:26:31 +000058 TLOF(new TargetLoweringObjectFileELF()),
Eric Christopher34aaf972014-08-04 17:37:43 +000059 Subtarget(TT, CPU, FS, *this), IntrinsicInfo() {
Vincent Lejeune92b0a642013-12-07 01:49:19 +000060 setRequiresStructuredCFG(true);
Rafael Espindola227144c2013-05-13 01:16:13 +000061 initAsmInfo();
Tom Stellard75aadc22012-12-11 21:25:42 +000062}
63
64AMDGPUTargetMachine::~AMDGPUTargetMachine() {
Aditya Nandakumara2719322014-11-13 09:26:31 +000065 delete TLOF;
Tom Stellard75aadc22012-12-11 21:25:42 +000066}
67
68namespace {
69class AMDGPUPassConfig : public TargetPassConfig {
70public:
71 AMDGPUPassConfig(AMDGPUTargetMachine *TM, PassManagerBase &PM)
Andrew Trick978674b2013-09-20 05:14:41 +000072 : TargetPassConfig(TM, PM) {}
Tom Stellard75aadc22012-12-11 21:25:42 +000073
74 AMDGPUTargetMachine &getAMDGPUTargetMachine() const {
75 return getTM<AMDGPUTargetMachine>();
76 }
Andrew Trick978674b2013-09-20 05:14:41 +000077
Craig Topper5656db42014-04-29 07:57:24 +000078 ScheduleDAGInstrs *
79 createMachineScheduler(MachineSchedContext *C) const override {
Andrew Trick978674b2013-09-20 05:14:41 +000080 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
81 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
82 return createR600MachineScheduler(C);
Craig Topper062a2ba2014-04-25 05:30:21 +000083 return nullptr;
Andrew Trick978674b2013-09-20 05:14:41 +000084 }
85
Tom Stellard5cbb53c2014-11-03 19:49:05 +000086 void addIRPasses() override;
Benjamin Kramer8c90fd72014-09-03 11:41:21 +000087 void addCodeGenPrepare() override;
Craig Topper5656db42014-04-29 07:57:24 +000088 bool addPreISel() override;
89 bool addInstSelector() override;
90 bool addPreRegAlloc() override;
91 bool addPostRegAlloc() override;
92 bool addPreSched2() override;
93 bool addPreEmitPass() override;
Tom Stellard75aadc22012-12-11 21:25:42 +000094};
95} // End of anonymous namespace
96
97TargetPassConfig *AMDGPUTargetMachine::createPassConfig(PassManagerBase &PM) {
98 return new AMDGPUPassConfig(this, PM);
99}
100
Tom Stellard8b1e0212013-07-27 00:01:07 +0000101//===----------------------------------------------------------------------===//
102// AMDGPU Analysis Pass Setup
103//===----------------------------------------------------------------------===//
104
105void AMDGPUTargetMachine::addAnalysisPasses(PassManagerBase &PM) {
106 // Add first the target-independent BasicTTI pass, then our AMDGPU pass. This
107 // allows the AMDGPU pass to delegate to the target independent layer when
108 // appropriate.
109 PM.add(createBasicTargetTransformInfoPass(this));
110 PM.add(createAMDGPUTargetTransformInfoPass(this));
111}
112
Tom Stellard5cbb53c2014-11-03 19:49:05 +0000113void AMDGPUPassConfig::addIRPasses() {
114 // Function calls are not supported, so make sure we inline everything.
115 addPass(createAMDGPUAlwaysInlinePass());
116 addPass(createAlwaysInlinerPass());
117 // We need to add the barrier noop pass, otherwise adding the function
118 // inlining pass will cause all of the PassConfigs passes to be run
119 // one function at a time, which means if we have a nodule with two
120 // functions, then we will generate code for the first function
121 // without ever running any passes on the second.
122 addPass(createBarrierNoopPass());
123 TargetPassConfig::addIRPasses();
124}
125
Tom Stellard880a80a2014-06-17 16:53:14 +0000126void AMDGPUPassConfig::addCodeGenPrepare() {
127 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Matt Arsenaultd9a23ab2014-07-13 02:08:26 +0000128 if (ST.isPromoteAllocaEnabled()) {
129 addPass(createAMDGPUPromoteAlloca(ST));
130 addPass(createSROAPass());
131 }
132
Tom Stellard880a80a2014-06-17 16:53:14 +0000133 TargetPassConfig::addCodeGenPrepare();
134}
135
Tom Stellard75aadc22012-12-11 21:25:42 +0000136bool
137AMDGPUPassConfig::addPreISel() {
Tom Stellardf8794352012-12-19 22:10:31 +0000138 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellardaa664d92013-08-06 02:43:45 +0000139 addPass(createFlattenCFGPass());
Tom Stellard66df8a22013-11-18 19:43:44 +0000140 if (ST.IsIRStructurizerEnabled())
Tom Stellarded0ceec2013-10-10 17:11:12 +0000141 addPass(createStructurizeCFGPass());
Matt Arsenaultd0ce2bd2014-02-24 21:01:23 +0000142 if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) {
Vincent Lejeune4ee6dd62013-10-13 17:56:21 +0000143 addPass(createSinkingPass());
Tom Stellard9fa17912013-08-14 23:24:45 +0000144 addPass(createSITypeRewriter());
Tom Stellardf8794352012-12-19 22:10:31 +0000145 addPass(createSIAnnotateControlFlowPass());
Vincent Lejeuned3eed662013-05-17 16:50:20 +0000146 } else {
147 addPass(createR600TextureIntrinsicsReplacer());
Tom Stellardf8794352012-12-19 22:10:31 +0000148 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000149 return false;
150}
151
152bool AMDGPUPassConfig::addInstSelector() {
Matt Arsenault162c1012014-11-18 21:06:58 +0000153 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
154
Tom Stellard75aadc22012-12-11 21:25:42 +0000155 addPass(createAMDGPUISelDag(getAMDGPUTargetMachine()));
Matt Arsenault162c1012014-11-18 21:06:58 +0000156
157 if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) {
158 addPass(createSILowerI1CopiesPass());
159 addPass(createSIFixSGPRCopiesPass(*TM));
Matt Arsenault691ae3d2014-12-03 05:22:30 +0000160 addPass(createSIFoldOperandsPass());
Matt Arsenault162c1012014-11-18 21:06:58 +0000161 }
162
Tom Stellard75aadc22012-12-11 21:25:42 +0000163 return false;
164}
165
166bool AMDGPUPassConfig::addPreRegAlloc() {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000167 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000168
169 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000170 addPass(createR600VectorRegMerger(*TM));
Tom Stellard2f7cdda2013-08-06 23:08:28 +0000171 } else {
Matt Arsenault162c1012014-11-18 21:06:58 +0000172 if (getOptLevel() > CodeGenOpt::None && ST.loadStoreOptEnabled()) {
Matt Arsenault41033282014-10-10 22:01:59 +0000173 // Don't do this with no optimizations since it throws away debug info by
174 // merging nonadjacent loads.
175
176 // This should be run after scheduling, but before register allocation. It
177 // also need extra copies to the address operand to be eliminated.
178 initializeSILoadStoreOptimizerPass(*PassRegistry::getPassRegistry());
179 insertPass(&MachineSchedulerID, &SILoadStoreOptimizerID);
180 }
181
Tom Stellard1aaad692014-07-21 16:55:33 +0000182 addPass(createSIShrinkInstructionsPass());
Tom Stellard60024a02014-09-24 01:33:24 +0000183 addPass(createSIFixSGPRLiveRangesPass());
Vincent Lejeunedec18752013-06-05 21:38:04 +0000184 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000185 return false;
186}
187
188bool AMDGPUPassConfig::addPostRegAlloc() {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000189 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
190
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000191 if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellard92105e82014-12-03 18:27:05 +0000192 addPass(createSIShrinkInstructionsPass());
Tom Stellardc4cabef2013-01-18 21:15:53 +0000193 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000194 return false;
195}
196
197bool AMDGPUPassConfig::addPreSched2() {
Vincent Lejeunece499742013-07-09 15:03:33 +0000198 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellard75aadc22012-12-11 21:25:42 +0000199
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000200 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
Tom Stellard1de55822013-12-11 17:51:41 +0000201 addPass(createR600EmitClauseMarkers());
Tom Stellard783893a2013-11-18 19:43:33 +0000202 if (ST.isIfCvtEnabled())
203 addPass(&IfConverterID);
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000204 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
205 addPass(createR600ClauseMergePass(*TM));
Tom Stellard05cd4452014-12-03 18:27:08 +0000206 if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) {
207 addPass(createSIInsertWaits(*TM));
208 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000209 return false;
210}
211
212bool AMDGPUPassConfig::addPreEmitPass() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000213 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000214 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardf2ba9722013-12-11 17:51:47 +0000215 addPass(createAMDGPUCFGStructurizerPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000216 addPass(createR600ExpandSpecialInstrsPass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000217 addPass(&FinalizeMachineBundlesID);
Vincent Lejeune147700b2013-04-30 00:14:27 +0000218 addPass(createR600Packetizer(*TM));
219 addPass(createR600ControlFlowFinalizer(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000220 } else {
Tom Stellard75aadc22012-12-11 21:25:42 +0000221 addPass(createSILowerControlFlowPass(*TM));
222 }
223
224 return false;
225}