blob: ca4d0cae9b25cd70498bb59d47476e5314e8fb14 [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11/// \brief The AMDGPU target machine contains all of the hardware specific
12/// information needed to emit code for R600 and SI GPUs.
13//
14//===----------------------------------------------------------------------===//
15
16#include "AMDGPUTargetMachine.h"
17#include "AMDGPU.h"
18#include "R600ISelLowering.h"
19#include "R600InstrInfo.h"
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000020#include "R600MachineScheduler.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000021#include "SIISelLowering.h"
22#include "SIInstrInfo.h"
23#include "llvm/Analysis/Passes.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000024#include "llvm/CodeGen/MachineFunctionAnalysis.h"
25#include "llvm/CodeGen/MachineModuleInfo.h"
26#include "llvm/CodeGen/Passes.h"
Chandler Carruth5ad5f152014-01-13 09:26:24 +000027#include "llvm/IR/Verifier.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000028#include "llvm/MC/MCAsmInfo.h"
29#include "llvm/PassManager.h"
30#include "llvm/Support/TargetRegistry.h"
31#include "llvm/Support/raw_os_ostream.h"
32#include "llvm/Transforms/IPO.h"
33#include "llvm/Transforms/Scalar.h"
34#include <llvm/CodeGen/Passes.h>
35
36using namespace llvm;
37
38extern "C" void LLVMInitializeR600Target() {
39 // Register the target
40 RegisterTargetMachine<AMDGPUTargetMachine> X(TheAMDGPUTarget);
41}
42
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000043static ScheduleDAGInstrs *createR600MachineScheduler(MachineSchedContext *C) {
David Blaikie422b93d2014-04-21 20:32:32 +000044 return new ScheduleDAGMILive(C, make_unique<R600SchedStrategy>());
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000045}
46
47static MachineSchedRegistry
48SchedCustomRegistry("r600", "Run R600's custom scheduler",
49 createR600MachineScheduler);
50
Tom Stellard75aadc22012-12-11 21:25:42 +000051AMDGPUTargetMachine::AMDGPUTargetMachine(const Target &T, StringRef TT,
Eric Christopherac4b69e2014-07-25 22:22:39 +000052 StringRef CPU, StringRef FS,
53 TargetOptions Options, Reloc::Model RM,
54 CodeModel::Model CM,
55 CodeGenOpt::Level OptLevel)
56 : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OptLevel),
Eric Christopher34aaf972014-08-04 17:37:43 +000057 Subtarget(TT, CPU, FS, *this), IntrinsicInfo() {
Vincent Lejeune92b0a642013-12-07 01:49:19 +000058 setRequiresStructuredCFG(true);
Rafael Espindola227144c2013-05-13 01:16:13 +000059 initAsmInfo();
Tom Stellard75aadc22012-12-11 21:25:42 +000060}
61
62AMDGPUTargetMachine::~AMDGPUTargetMachine() {
63}
64
65namespace {
66class AMDGPUPassConfig : public TargetPassConfig {
67public:
68 AMDGPUPassConfig(AMDGPUTargetMachine *TM, PassManagerBase &PM)
Andrew Trick978674b2013-09-20 05:14:41 +000069 : TargetPassConfig(TM, PM) {}
Tom Stellard75aadc22012-12-11 21:25:42 +000070
71 AMDGPUTargetMachine &getAMDGPUTargetMachine() const {
72 return getTM<AMDGPUTargetMachine>();
73 }
Andrew Trick978674b2013-09-20 05:14:41 +000074
Craig Topper5656db42014-04-29 07:57:24 +000075 ScheduleDAGInstrs *
76 createMachineScheduler(MachineSchedContext *C) const override {
Andrew Trick978674b2013-09-20 05:14:41 +000077 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
78 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
79 return createR600MachineScheduler(C);
Craig Topper062a2ba2014-04-25 05:30:21 +000080 return nullptr;
Andrew Trick978674b2013-09-20 05:14:41 +000081 }
82
Tom Stellard5cbb53c2014-11-03 19:49:05 +000083 void addIRPasses() override;
Benjamin Kramer8c90fd72014-09-03 11:41:21 +000084 void addCodeGenPrepare() override;
Craig Topper5656db42014-04-29 07:57:24 +000085 bool addPreISel() override;
86 bool addInstSelector() override;
87 bool addPreRegAlloc() override;
88 bool addPostRegAlloc() override;
89 bool addPreSched2() override;
90 bool addPreEmitPass() override;
Tom Stellard75aadc22012-12-11 21:25:42 +000091};
92} // End of anonymous namespace
93
94TargetPassConfig *AMDGPUTargetMachine::createPassConfig(PassManagerBase &PM) {
95 return new AMDGPUPassConfig(this, PM);
96}
97
Tom Stellard8b1e0212013-07-27 00:01:07 +000098//===----------------------------------------------------------------------===//
99// AMDGPU Analysis Pass Setup
100//===----------------------------------------------------------------------===//
101
102void AMDGPUTargetMachine::addAnalysisPasses(PassManagerBase &PM) {
103 // Add first the target-independent BasicTTI pass, then our AMDGPU pass. This
104 // allows the AMDGPU pass to delegate to the target independent layer when
105 // appropriate.
106 PM.add(createBasicTargetTransformInfoPass(this));
107 PM.add(createAMDGPUTargetTransformInfoPass(this));
108}
109
Tom Stellard5cbb53c2014-11-03 19:49:05 +0000110void AMDGPUPassConfig::addIRPasses() {
111 // Function calls are not supported, so make sure we inline everything.
112 addPass(createAMDGPUAlwaysInlinePass());
113 addPass(createAlwaysInlinerPass());
114 // We need to add the barrier noop pass, otherwise adding the function
115 // inlining pass will cause all of the PassConfigs passes to be run
116 // one function at a time, which means if we have a nodule with two
117 // functions, then we will generate code for the first function
118 // without ever running any passes on the second.
119 addPass(createBarrierNoopPass());
120 TargetPassConfig::addIRPasses();
121}
122
Tom Stellard880a80a2014-06-17 16:53:14 +0000123void AMDGPUPassConfig::addCodeGenPrepare() {
124 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Matt Arsenaultd9a23ab2014-07-13 02:08:26 +0000125 if (ST.isPromoteAllocaEnabled()) {
126 addPass(createAMDGPUPromoteAlloca(ST));
127 addPass(createSROAPass());
128 }
129
Tom Stellard880a80a2014-06-17 16:53:14 +0000130 TargetPassConfig::addCodeGenPrepare();
131}
132
Tom Stellard75aadc22012-12-11 21:25:42 +0000133bool
134AMDGPUPassConfig::addPreISel() {
Tom Stellardf8794352012-12-19 22:10:31 +0000135 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellardaa664d92013-08-06 02:43:45 +0000136 addPass(createFlattenCFGPass());
Tom Stellard66df8a22013-11-18 19:43:44 +0000137 if (ST.IsIRStructurizerEnabled())
Tom Stellarded0ceec2013-10-10 17:11:12 +0000138 addPass(createStructurizeCFGPass());
Matt Arsenaultd0ce2bd2014-02-24 21:01:23 +0000139 if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) {
Vincent Lejeune4ee6dd62013-10-13 17:56:21 +0000140 addPass(createSinkingPass());
Tom Stellard9fa17912013-08-14 23:24:45 +0000141 addPass(createSITypeRewriter());
Tom Stellardf8794352012-12-19 22:10:31 +0000142 addPass(createSIAnnotateControlFlowPass());
Vincent Lejeuned3eed662013-05-17 16:50:20 +0000143 } else {
144 addPass(createR600TextureIntrinsicsReplacer());
Tom Stellardf8794352012-12-19 22:10:31 +0000145 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000146 return false;
147}
148
149bool AMDGPUPassConfig::addInstSelector() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000150 addPass(createAMDGPUISelDag(getAMDGPUTargetMachine()));
Tom Stellard1bd80722014-04-30 15:31:33 +0000151 addPass(createSILowerI1CopiesPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000152 return false;
153}
154
155bool AMDGPUPassConfig::addPreRegAlloc() {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000156 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000157
158 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000159 addPass(createR600VectorRegMerger(*TM));
Tom Stellard2f7cdda2013-08-06 23:08:28 +0000160 } else {
161 addPass(createSIFixSGPRCopiesPass(*TM));
Tom Stellard15834092014-03-21 15:51:57 +0000162 // SIFixSGPRCopies can generate a lot of duplicate instructions,
163 // so we need to run MachineCSE afterwards.
164 addPass(&MachineCSEID);
Matt Arsenault41033282014-10-10 22:01:59 +0000165
166 if (getOptLevel() > CodeGenOpt::None && ST.loadStoreOptEnabled()) {
167 // Don't do this with no optimizations since it throws away debug info by
168 // merging nonadjacent loads.
169
170 // This should be run after scheduling, but before register allocation. It
171 // also need extra copies to the address operand to be eliminated.
172 initializeSILoadStoreOptimizerPass(*PassRegistry::getPassRegistry());
173 insertPass(&MachineSchedulerID, &SILoadStoreOptimizerID);
174 }
175
Tom Stellard1aaad692014-07-21 16:55:33 +0000176 addPass(createSIShrinkInstructionsPass());
Tom Stellard60024a02014-09-24 01:33:24 +0000177 addPass(createSIFixSGPRLiveRangesPass());
Vincent Lejeunedec18752013-06-05 21:38:04 +0000178 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000179 return false;
180}
181
182bool AMDGPUPassConfig::addPostRegAlloc() {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000183 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
184
Tom Stellard1aaad692014-07-21 16:55:33 +0000185 addPass(createSIShrinkInstructionsPass());
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000186 if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000187 addPass(createSIInsertWaits(*TM));
188 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000189 return false;
190}
191
192bool AMDGPUPassConfig::addPreSched2() {
Vincent Lejeunece499742013-07-09 15:03:33 +0000193 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellard75aadc22012-12-11 21:25:42 +0000194
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000195 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
Tom Stellard1de55822013-12-11 17:51:41 +0000196 addPass(createR600EmitClauseMarkers());
Tom Stellard783893a2013-11-18 19:43:33 +0000197 if (ST.isIfCvtEnabled())
198 addPass(&IfConverterID);
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000199 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
200 addPass(createR600ClauseMergePass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000201 return false;
202}
203
204bool AMDGPUPassConfig::addPreEmitPass() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000205 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000206 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardf2ba9722013-12-11 17:51:47 +0000207 addPass(createAMDGPUCFGStructurizerPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000208 addPass(createR600ExpandSpecialInstrsPass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000209 addPass(&FinalizeMachineBundlesID);
Vincent Lejeune147700b2013-04-30 00:14:27 +0000210 addPass(createR600Packetizer(*TM));
211 addPass(createR600ControlFlowFinalizer(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000212 } else {
Tom Stellard75aadc22012-12-11 21:25:42 +0000213 addPass(createSILowerControlFlowPass(*TM));
214 }
215
216 return false;
217}