blob: 6a78b177e966dc35daf8f654bf1d2568396fb072 [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11/// \brief The AMDGPU target machine contains all of the hardware specific
12/// information needed to emit code for R600 and SI GPUs.
13//
14//===----------------------------------------------------------------------===//
15
16#include "AMDGPUTargetMachine.h"
17#include "AMDGPU.h"
18#include "R600ISelLowering.h"
19#include "R600InstrInfo.h"
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000020#include "R600MachineScheduler.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000021#include "SIISelLowering.h"
22#include "SIInstrInfo.h"
23#include "llvm/Analysis/Passes.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000024#include "llvm/CodeGen/MachineFunctionAnalysis.h"
25#include "llvm/CodeGen/MachineModuleInfo.h"
26#include "llvm/CodeGen/Passes.h"
Chandler Carruth5ad5f152014-01-13 09:26:24 +000027#include "llvm/IR/Verifier.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000028#include "llvm/MC/MCAsmInfo.h"
29#include "llvm/PassManager.h"
30#include "llvm/Support/TargetRegistry.h"
31#include "llvm/Support/raw_os_ostream.h"
32#include "llvm/Transforms/IPO.h"
33#include "llvm/Transforms/Scalar.h"
34#include <llvm/CodeGen/Passes.h>
35
36using namespace llvm;
37
38extern "C" void LLVMInitializeR600Target() {
39 // Register the target
40 RegisterTargetMachine<AMDGPUTargetMachine> X(TheAMDGPUTarget);
41}
42
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000043static ScheduleDAGInstrs *createR600MachineScheduler(MachineSchedContext *C) {
David Blaikie422b93d2014-04-21 20:32:32 +000044 return new ScheduleDAGMILive(C, make_unique<R600SchedStrategy>());
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000045}
46
47static MachineSchedRegistry
48SchedCustomRegistry("r600", "Run R600's custom scheduler",
49 createR600MachineScheduler);
50
Rafael Espindolaceb0c492013-12-14 06:13:44 +000051static std::string computeDataLayout(const AMDGPUSubtarget &ST) {
Rafael Espindola4fa79752013-12-19 16:51:03 +000052 std::string Ret = "e-p:32:32";
Rafael Espindolaceb0c492013-12-14 06:13:44 +000053
Matt Arsenaulta98cd6a2013-12-19 05:32:55 +000054 if (ST.is64bit()) {
55 // 32-bit private, local, and region pointers. 64-bit global and constant.
Matt Arsenault46b51b72014-05-22 18:27:07 +000056 Ret += "-p1:64:64-p2:64:64-p3:32:32-p4:64:64-p5:32:32-p24:64:64";
Matt Arsenaulta98cd6a2013-12-19 05:32:55 +000057 }
Rafael Espindolaceb0c492013-12-14 06:13:44 +000058
Rafael Espindolae89b4142013-12-16 19:31:14 +000059 Ret += "-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256"
60 "-v512:512-v1024:1024-v2048:2048-n32:64";
61
Rafael Espindola0eb1ebe2013-12-16 19:18:57 +000062 return Ret;
Rafael Espindolaceb0c492013-12-14 06:13:44 +000063}
64
Tom Stellard75aadc22012-12-11 21:25:42 +000065AMDGPUTargetMachine::AMDGPUTargetMachine(const Target &T, StringRef TT,
66 StringRef CPU, StringRef FS,
67 TargetOptions Options,
68 Reloc::Model RM, CodeModel::Model CM,
69 CodeGenOpt::Level OptLevel
70)
71:
72 LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OptLevel),
73 Subtarget(TT, CPU, FS),
Rafael Espindolaceb0c492013-12-14 06:13:44 +000074 Layout(computeDataLayout(Subtarget)),
Tom Stellardaf775432013-10-23 00:44:32 +000075 FrameLowering(TargetFrameLowering::StackGrowsUp,
76 64 * 16 // Maximum stack alignment (long16)
77 , 0),
Tom Stellard75aadc22012-12-11 21:25:42 +000078 IntrinsicInfo(this),
79 InstrItins(&Subtarget.getInstrItineraryData()) {
80 // TLInfo uses InstrInfo so it must be initialized after.
Tom Stellarda6c6e1b2013-06-07 20:37:48 +000081 if (Subtarget.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Rafael Espindola39aca622013-05-23 03:31:47 +000082 TLInfo.reset(new R600TargetLowering(*this));
Tom Stellard75aadc22012-12-11 21:25:42 +000083 } else {
Rafael Espindola39aca622013-05-23 03:31:47 +000084 TLInfo.reset(new SITargetLowering(*this));
Tom Stellard75aadc22012-12-11 21:25:42 +000085 }
Vincent Lejeune92b0a642013-12-07 01:49:19 +000086 setRequiresStructuredCFG(true);
Rafael Espindola227144c2013-05-13 01:16:13 +000087 initAsmInfo();
Tom Stellard75aadc22012-12-11 21:25:42 +000088}
89
90AMDGPUTargetMachine::~AMDGPUTargetMachine() {
91}
92
93namespace {
94class AMDGPUPassConfig : public TargetPassConfig {
95public:
96 AMDGPUPassConfig(AMDGPUTargetMachine *TM, PassManagerBase &PM)
Andrew Trick978674b2013-09-20 05:14:41 +000097 : TargetPassConfig(TM, PM) {}
Tom Stellard75aadc22012-12-11 21:25:42 +000098
99 AMDGPUTargetMachine &getAMDGPUTargetMachine() const {
100 return getTM<AMDGPUTargetMachine>();
101 }
Andrew Trick978674b2013-09-20 05:14:41 +0000102
Craig Topper5656db42014-04-29 07:57:24 +0000103 ScheduleDAGInstrs *
104 createMachineScheduler(MachineSchedContext *C) const override {
Andrew Trick978674b2013-09-20 05:14:41 +0000105 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
106 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
107 return createR600MachineScheduler(C);
Craig Topper062a2ba2014-04-25 05:30:21 +0000108 return nullptr;
Andrew Trick978674b2013-09-20 05:14:41 +0000109 }
110
Tom Stellard880a80a2014-06-17 16:53:14 +0000111 virtual void addCodeGenPrepare();
Craig Topper5656db42014-04-29 07:57:24 +0000112 bool addPreISel() override;
113 bool addInstSelector() override;
114 bool addPreRegAlloc() override;
115 bool addPostRegAlloc() override;
116 bool addPreSched2() override;
117 bool addPreEmitPass() override;
Tom Stellard75aadc22012-12-11 21:25:42 +0000118};
119} // End of anonymous namespace
120
121TargetPassConfig *AMDGPUTargetMachine::createPassConfig(PassManagerBase &PM) {
122 return new AMDGPUPassConfig(this, PM);
123}
124
Tom Stellard8b1e0212013-07-27 00:01:07 +0000125//===----------------------------------------------------------------------===//
126// AMDGPU Analysis Pass Setup
127//===----------------------------------------------------------------------===//
128
129void AMDGPUTargetMachine::addAnalysisPasses(PassManagerBase &PM) {
130 // Add first the target-independent BasicTTI pass, then our AMDGPU pass. This
131 // allows the AMDGPU pass to delegate to the target independent layer when
132 // appropriate.
133 PM.add(createBasicTargetTransformInfoPass(this));
134 PM.add(createAMDGPUTargetTransformInfoPass(this));
135}
136
Tom Stellard880a80a2014-06-17 16:53:14 +0000137void AMDGPUPassConfig::addCodeGenPrepare() {
138 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Matt Arsenaultd9a23ab2014-07-13 02:08:26 +0000139 if (ST.isPromoteAllocaEnabled()) {
140 addPass(createAMDGPUPromoteAlloca(ST));
141 addPass(createSROAPass());
142 }
143
Tom Stellard880a80a2014-06-17 16:53:14 +0000144 TargetPassConfig::addCodeGenPrepare();
145}
146
Tom Stellard75aadc22012-12-11 21:25:42 +0000147bool
148AMDGPUPassConfig::addPreISel() {
Tom Stellardf8794352012-12-19 22:10:31 +0000149 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellardaa664d92013-08-06 02:43:45 +0000150 addPass(createFlattenCFGPass());
Tom Stellard66df8a22013-11-18 19:43:44 +0000151 if (ST.IsIRStructurizerEnabled())
Tom Stellarded0ceec2013-10-10 17:11:12 +0000152 addPass(createStructurizeCFGPass());
Matt Arsenaultd0ce2bd2014-02-24 21:01:23 +0000153 if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) {
Vincent Lejeune4ee6dd62013-10-13 17:56:21 +0000154 addPass(createSinkingPass());
Tom Stellard9fa17912013-08-14 23:24:45 +0000155 addPass(createSITypeRewriter());
Tom Stellardf8794352012-12-19 22:10:31 +0000156 addPass(createSIAnnotateControlFlowPass());
Vincent Lejeuned3eed662013-05-17 16:50:20 +0000157 } else {
158 addPass(createR600TextureIntrinsicsReplacer());
Tom Stellardf8794352012-12-19 22:10:31 +0000159 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000160 return false;
161}
162
163bool AMDGPUPassConfig::addInstSelector() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000164 addPass(createAMDGPUISelDag(getAMDGPUTargetMachine()));
Tom Stellard1bd80722014-04-30 15:31:33 +0000165 addPass(createSILowerI1CopiesPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000166 return false;
167}
168
169bool AMDGPUPassConfig::addPreRegAlloc() {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000170 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000171
172 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000173 addPass(createR600VectorRegMerger(*TM));
Tom Stellard2f7cdda2013-08-06 23:08:28 +0000174 } else {
175 addPass(createSIFixSGPRCopiesPass(*TM));
Tom Stellard15834092014-03-21 15:51:57 +0000176 // SIFixSGPRCopies can generate a lot of duplicate instructions,
177 // so we need to run MachineCSE afterwards.
178 addPass(&MachineCSEID);
Tom Stellardb2de94e2014-07-02 20:53:48 +0000179 initializeSIFixSGPRLiveRangesPass(*PassRegistry::getPassRegistry());
180 insertPass(&RegisterCoalescerID, &SIFixSGPRLiveRangesID);
Vincent Lejeunedec18752013-06-05 21:38:04 +0000181 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000182 return false;
183}
184
185bool AMDGPUPassConfig::addPostRegAlloc() {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000186 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
187
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000188 if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000189 addPass(createSIInsertWaits(*TM));
190 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000191 return false;
192}
193
194bool AMDGPUPassConfig::addPreSched2() {
Vincent Lejeunece499742013-07-09 15:03:33 +0000195 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellard75aadc22012-12-11 21:25:42 +0000196
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000197 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
Tom Stellard1de55822013-12-11 17:51:41 +0000198 addPass(createR600EmitClauseMarkers());
Tom Stellard783893a2013-11-18 19:43:33 +0000199 if (ST.isIfCvtEnabled())
200 addPass(&IfConverterID);
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000201 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
202 addPass(createR600ClauseMergePass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000203 return false;
204}
205
206bool AMDGPUPassConfig::addPreEmitPass() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000207 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000208 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardf2ba9722013-12-11 17:51:47 +0000209 addPass(createAMDGPUCFGStructurizerPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000210 addPass(createR600ExpandSpecialInstrsPass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000211 addPass(&FinalizeMachineBundlesID);
Vincent Lejeune147700b2013-04-30 00:14:27 +0000212 addPass(createR600Packetizer(*TM));
213 addPass(createR600ControlFlowFinalizer(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000214 } else {
Tom Stellard75aadc22012-12-11 21:25:42 +0000215 addPass(createSILowerControlFlowPass(*TM));
216 }
217
218 return false;
219}