blob: 6b68c2abe367644f9b10da539296683daf1b7e25 [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11/// \brief The AMDGPU target machine contains all of the hardware specific
12/// information needed to emit code for R600 and SI GPUs.
13//
14//===----------------------------------------------------------------------===//
15
16#include "AMDGPUTargetMachine.h"
17#include "AMDGPU.h"
18#include "R600ISelLowering.h"
19#include "R600InstrInfo.h"
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000020#include "R600MachineScheduler.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000021#include "SIISelLowering.h"
22#include "SIInstrInfo.h"
23#include "llvm/Analysis/Passes.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000024#include "llvm/CodeGen/MachineFunctionAnalysis.h"
25#include "llvm/CodeGen/MachineModuleInfo.h"
26#include "llvm/CodeGen/Passes.h"
Chandler Carruth5ad5f152014-01-13 09:26:24 +000027#include "llvm/IR/Verifier.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000028#include "llvm/MC/MCAsmInfo.h"
29#include "llvm/PassManager.h"
30#include "llvm/Support/TargetRegistry.h"
31#include "llvm/Support/raw_os_ostream.h"
32#include "llvm/Transforms/IPO.h"
33#include "llvm/Transforms/Scalar.h"
34#include <llvm/CodeGen/Passes.h>
35
Tom Stellarded0ceec2013-10-10 17:11:12 +000036
Tom Stellard75aadc22012-12-11 21:25:42 +000037using namespace llvm;
38
39extern "C" void LLVMInitializeR600Target() {
40 // Register the target
41 RegisterTargetMachine<AMDGPUTargetMachine> X(TheAMDGPUTarget);
42}
43
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000044static ScheduleDAGInstrs *createR600MachineScheduler(MachineSchedContext *C) {
David Blaikie422b93d2014-04-21 20:32:32 +000045 return new ScheduleDAGMILive(C, make_unique<R600SchedStrategy>());
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000046}
47
48static MachineSchedRegistry
49SchedCustomRegistry("r600", "Run R600's custom scheduler",
50 createR600MachineScheduler);
51
Rafael Espindolaceb0c492013-12-14 06:13:44 +000052static std::string computeDataLayout(const AMDGPUSubtarget &ST) {
Rafael Espindola4fa79752013-12-19 16:51:03 +000053 std::string Ret = "e-p:32:32";
Rafael Espindolaceb0c492013-12-14 06:13:44 +000054
Matt Arsenaulta98cd6a2013-12-19 05:32:55 +000055 if (ST.is64bit()) {
56 // 32-bit private, local, and region pointers. 64-bit global and constant.
57 Ret += "-p1:64:64-p2:64:64-p3:32:32-p4:32:32-p5:64:64";
58 }
Rafael Espindolaceb0c492013-12-14 06:13:44 +000059
Rafael Espindolae89b4142013-12-16 19:31:14 +000060 Ret += "-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256"
61 "-v512:512-v1024:1024-v2048:2048-n32:64";
62
Rafael Espindola0eb1ebe2013-12-16 19:18:57 +000063 return Ret;
Rafael Espindolaceb0c492013-12-14 06:13:44 +000064}
65
Tom Stellard75aadc22012-12-11 21:25:42 +000066AMDGPUTargetMachine::AMDGPUTargetMachine(const Target &T, StringRef TT,
67 StringRef CPU, StringRef FS,
68 TargetOptions Options,
69 Reloc::Model RM, CodeModel::Model CM,
70 CodeGenOpt::Level OptLevel
71)
72:
73 LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OptLevel),
74 Subtarget(TT, CPU, FS),
Rafael Espindolaceb0c492013-12-14 06:13:44 +000075 Layout(computeDataLayout(Subtarget)),
Tom Stellardaf775432013-10-23 00:44:32 +000076 FrameLowering(TargetFrameLowering::StackGrowsUp,
77 64 * 16 // Maximum stack alignment (long16)
78 , 0),
Tom Stellard75aadc22012-12-11 21:25:42 +000079 IntrinsicInfo(this),
80 InstrItins(&Subtarget.getInstrItineraryData()) {
81 // TLInfo uses InstrInfo so it must be initialized after.
Tom Stellarda6c6e1b2013-06-07 20:37:48 +000082 if (Subtarget.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Rafael Espindola39aca622013-05-23 03:31:47 +000083 InstrInfo.reset(new R600InstrInfo(*this));
84 TLInfo.reset(new R600TargetLowering(*this));
Tom Stellard75aadc22012-12-11 21:25:42 +000085 } else {
Rafael Espindola39aca622013-05-23 03:31:47 +000086 InstrInfo.reset(new SIInstrInfo(*this));
87 TLInfo.reset(new SITargetLowering(*this));
Tom Stellard75aadc22012-12-11 21:25:42 +000088 }
Vincent Lejeune92b0a642013-12-07 01:49:19 +000089 setRequiresStructuredCFG(true);
Rafael Espindola227144c2013-05-13 01:16:13 +000090 initAsmInfo();
Tom Stellard75aadc22012-12-11 21:25:42 +000091}
92
93AMDGPUTargetMachine::~AMDGPUTargetMachine() {
94}
95
96namespace {
97class AMDGPUPassConfig : public TargetPassConfig {
98public:
99 AMDGPUPassConfig(AMDGPUTargetMachine *TM, PassManagerBase &PM)
Andrew Trick978674b2013-09-20 05:14:41 +0000100 : TargetPassConfig(TM, PM) {}
Tom Stellard75aadc22012-12-11 21:25:42 +0000101
102 AMDGPUTargetMachine &getAMDGPUTargetMachine() const {
103 return getTM<AMDGPUTargetMachine>();
104 }
Andrew Trick978674b2013-09-20 05:14:41 +0000105
Craig Topper5656db42014-04-29 07:57:24 +0000106 ScheduleDAGInstrs *
107 createMachineScheduler(MachineSchedContext *C) const override {
Andrew Trick978674b2013-09-20 05:14:41 +0000108 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
109 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
110 return createR600MachineScheduler(C);
Craig Topper062a2ba2014-04-25 05:30:21 +0000111 return nullptr;
Andrew Trick978674b2013-09-20 05:14:41 +0000112 }
113
Craig Topper5656db42014-04-29 07:57:24 +0000114 bool addPreISel() override;
115 bool addInstSelector() override;
116 bool addPreRegAlloc() override;
117 bool addPostRegAlloc() override;
118 bool addPreSched2() override;
119 bool addPreEmitPass() override;
Tom Stellard75aadc22012-12-11 21:25:42 +0000120};
121} // End of anonymous namespace
122
123TargetPassConfig *AMDGPUTargetMachine::createPassConfig(PassManagerBase &PM) {
124 return new AMDGPUPassConfig(this, PM);
125}
126
Tom Stellard8b1e0212013-07-27 00:01:07 +0000127//===----------------------------------------------------------------------===//
128// AMDGPU Analysis Pass Setup
129//===----------------------------------------------------------------------===//
130
131void AMDGPUTargetMachine::addAnalysisPasses(PassManagerBase &PM) {
132 // Add first the target-independent BasicTTI pass, then our AMDGPU pass. This
133 // allows the AMDGPU pass to delegate to the target independent layer when
134 // appropriate.
135 PM.add(createBasicTargetTransformInfoPass(this));
136 PM.add(createAMDGPUTargetTransformInfoPass(this));
137}
138
Tom Stellard75aadc22012-12-11 21:25:42 +0000139bool
140AMDGPUPassConfig::addPreISel() {
Tom Stellardf8794352012-12-19 22:10:31 +0000141 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellardaa664d92013-08-06 02:43:45 +0000142 addPass(createFlattenCFGPass());
Tom Stellard66df8a22013-11-18 19:43:44 +0000143 if (ST.IsIRStructurizerEnabled())
Tom Stellarded0ceec2013-10-10 17:11:12 +0000144 addPass(createStructurizeCFGPass());
Matt Arsenaultd0ce2bd2014-02-24 21:01:23 +0000145 if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) {
Vincent Lejeune4ee6dd62013-10-13 17:56:21 +0000146 addPass(createSinkingPass());
Tom Stellard9fa17912013-08-14 23:24:45 +0000147 addPass(createSITypeRewriter());
Tom Stellardf8794352012-12-19 22:10:31 +0000148 addPass(createSIAnnotateControlFlowPass());
Vincent Lejeuned3eed662013-05-17 16:50:20 +0000149 } else {
150 addPass(createR600TextureIntrinsicsReplacer());
Tom Stellardf8794352012-12-19 22:10:31 +0000151 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000152 return false;
153}
154
155bool AMDGPUPassConfig::addInstSelector() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000156 addPass(createAMDGPUISelDag(getAMDGPUTargetMachine()));
Tom Stellard1bd80722014-04-30 15:31:33 +0000157 addPass(createSILowerI1CopiesPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000158 return false;
159}
160
161bool AMDGPUPassConfig::addPreRegAlloc() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000162 addPass(createAMDGPUConvertToISAPass(*TM));
Vincent Lejeunedec18752013-06-05 21:38:04 +0000163 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000164
165 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000166 addPass(createR600VectorRegMerger(*TM));
Tom Stellard2f7cdda2013-08-06 23:08:28 +0000167 } else {
168 addPass(createSIFixSGPRCopiesPass(*TM));
Tom Stellard15834092014-03-21 15:51:57 +0000169 // SIFixSGPRCopies can generate a lot of duplicate instructions,
170 // so we need to run MachineCSE afterwards.
171 addPass(&MachineCSEID);
Vincent Lejeunedec18752013-06-05 21:38:04 +0000172 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000173 return false;
174}
175
176bool AMDGPUPassConfig::addPostRegAlloc() {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000177 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
178
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000179 if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000180 addPass(createSIInsertWaits(*TM));
181 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000182 return false;
183}
184
185bool AMDGPUPassConfig::addPreSched2() {
Vincent Lejeunece499742013-07-09 15:03:33 +0000186 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellard75aadc22012-12-11 21:25:42 +0000187
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000188 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
Tom Stellard1de55822013-12-11 17:51:41 +0000189 addPass(createR600EmitClauseMarkers());
Tom Stellard783893a2013-11-18 19:43:33 +0000190 if (ST.isIfCvtEnabled())
191 addPass(&IfConverterID);
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000192 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
193 addPass(createR600ClauseMergePass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000194 return false;
195}
196
197bool AMDGPUPassConfig::addPreEmitPass() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000198 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000199 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardf2ba9722013-12-11 17:51:47 +0000200 addPass(createAMDGPUCFGStructurizerPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000201 addPass(createR600ExpandSpecialInstrsPass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000202 addPass(&FinalizeMachineBundlesID);
Vincent Lejeune147700b2013-04-30 00:14:27 +0000203 addPass(createR600Packetizer(*TM));
204 addPass(createR600ControlFlowFinalizer(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000205 } else {
Tom Stellard75aadc22012-12-11 21:25:42 +0000206 addPass(createSILowerControlFlowPass(*TM));
207 }
208
209 return false;
210}