blob: 7f5042876e7f94919f0811b8a6fed72a9aa0c717 [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11/// \brief The AMDGPU target machine contains all of the hardware specific
12/// information needed to emit code for R600 and SI GPUs.
13//
14//===----------------------------------------------------------------------===//
15
16#include "AMDGPUTargetMachine.h"
17#include "AMDGPU.h"
18#include "R600ISelLowering.h"
19#include "R600InstrInfo.h"
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000020#include "R600MachineScheduler.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000021#include "SIISelLowering.h"
22#include "SIInstrInfo.h"
23#include "llvm/Analysis/Passes.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000024#include "llvm/CodeGen/MachineFunctionAnalysis.h"
25#include "llvm/CodeGen/MachineModuleInfo.h"
26#include "llvm/CodeGen/Passes.h"
Chandler Carruth5ad5f152014-01-13 09:26:24 +000027#include "llvm/IR/Verifier.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000028#include "llvm/MC/MCAsmInfo.h"
29#include "llvm/PassManager.h"
30#include "llvm/Support/TargetRegistry.h"
31#include "llvm/Support/raw_os_ostream.h"
32#include "llvm/Transforms/IPO.h"
33#include "llvm/Transforms/Scalar.h"
34#include <llvm/CodeGen/Passes.h>
35
Tom Stellarded0ceec2013-10-10 17:11:12 +000036
Tom Stellard75aadc22012-12-11 21:25:42 +000037using namespace llvm;
38
39extern "C" void LLVMInitializeR600Target() {
40 // Register the target
41 RegisterTargetMachine<AMDGPUTargetMachine> X(TheAMDGPUTarget);
42}
43
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000044static ScheduleDAGInstrs *createR600MachineScheduler(MachineSchedContext *C) {
Andrew Trickd7f890e2013-12-28 21:56:47 +000045 return new ScheduleDAGMILive(C, new R600SchedStrategy());
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000046}
47
48static MachineSchedRegistry
49SchedCustomRegistry("r600", "Run R600's custom scheduler",
50 createR600MachineScheduler);
51
Rafael Espindolaceb0c492013-12-14 06:13:44 +000052static std::string computeDataLayout(const AMDGPUSubtarget &ST) {
Rafael Espindola4fa79752013-12-19 16:51:03 +000053 std::string Ret = "e-p:32:32";
Rafael Espindolaceb0c492013-12-14 06:13:44 +000054
Matt Arsenaulta98cd6a2013-12-19 05:32:55 +000055 if (ST.is64bit()) {
56 // 32-bit private, local, and region pointers. 64-bit global and constant.
57 Ret += "-p1:64:64-p2:64:64-p3:32:32-p4:32:32-p5:64:64";
58 }
Rafael Espindolaceb0c492013-12-14 06:13:44 +000059
Rafael Espindolae89b4142013-12-16 19:31:14 +000060 Ret += "-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256"
61 "-v512:512-v1024:1024-v2048:2048-n32:64";
62
Rafael Espindola0eb1ebe2013-12-16 19:18:57 +000063 return Ret;
Rafael Espindolaceb0c492013-12-14 06:13:44 +000064}
65
Tom Stellard75aadc22012-12-11 21:25:42 +000066AMDGPUTargetMachine::AMDGPUTargetMachine(const Target &T, StringRef TT,
67 StringRef CPU, StringRef FS,
68 TargetOptions Options,
69 Reloc::Model RM, CodeModel::Model CM,
70 CodeGenOpt::Level OptLevel
71)
72:
73 LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OptLevel),
74 Subtarget(TT, CPU, FS),
Rafael Espindolaceb0c492013-12-14 06:13:44 +000075 Layout(computeDataLayout(Subtarget)),
Tom Stellardaf775432013-10-23 00:44:32 +000076 FrameLowering(TargetFrameLowering::StackGrowsUp,
77 64 * 16 // Maximum stack alignment (long16)
78 , 0),
Tom Stellard75aadc22012-12-11 21:25:42 +000079 IntrinsicInfo(this),
80 InstrItins(&Subtarget.getInstrItineraryData()) {
81 // TLInfo uses InstrInfo so it must be initialized after.
Tom Stellarda6c6e1b2013-06-07 20:37:48 +000082 if (Subtarget.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Rafael Espindola39aca622013-05-23 03:31:47 +000083 InstrInfo.reset(new R600InstrInfo(*this));
84 TLInfo.reset(new R600TargetLowering(*this));
Tom Stellard75aadc22012-12-11 21:25:42 +000085 } else {
Rafael Espindola39aca622013-05-23 03:31:47 +000086 InstrInfo.reset(new SIInstrInfo(*this));
87 TLInfo.reset(new SITargetLowering(*this));
Tom Stellard75aadc22012-12-11 21:25:42 +000088 }
Vincent Lejeune92b0a642013-12-07 01:49:19 +000089 setRequiresStructuredCFG(true);
Rafael Espindola227144c2013-05-13 01:16:13 +000090 initAsmInfo();
Tom Stellard75aadc22012-12-11 21:25:42 +000091}
92
93AMDGPUTargetMachine::~AMDGPUTargetMachine() {
94}
95
96namespace {
97class AMDGPUPassConfig : public TargetPassConfig {
98public:
99 AMDGPUPassConfig(AMDGPUTargetMachine *TM, PassManagerBase &PM)
Andrew Trick978674b2013-09-20 05:14:41 +0000100 : TargetPassConfig(TM, PM) {}
Tom Stellard75aadc22012-12-11 21:25:42 +0000101
102 AMDGPUTargetMachine &getAMDGPUTargetMachine() const {
103 return getTM<AMDGPUTargetMachine>();
104 }
Andrew Trick978674b2013-09-20 05:14:41 +0000105
106 virtual ScheduleDAGInstrs *
107 createMachineScheduler(MachineSchedContext *C) const {
108 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
109 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
110 return createR600MachineScheduler(C);
111 return 0;
112 }
113
Tom Stellard75aadc22012-12-11 21:25:42 +0000114 virtual bool addPreISel();
115 virtual bool addInstSelector();
116 virtual bool addPreRegAlloc();
117 virtual bool addPostRegAlloc();
118 virtual bool addPreSched2();
119 virtual bool addPreEmitPass();
120};
121} // End of anonymous namespace
122
123TargetPassConfig *AMDGPUTargetMachine::createPassConfig(PassManagerBase &PM) {
124 return new AMDGPUPassConfig(this, PM);
125}
126
Tom Stellard8b1e0212013-07-27 00:01:07 +0000127//===----------------------------------------------------------------------===//
128// AMDGPU Analysis Pass Setup
129//===----------------------------------------------------------------------===//
130
131void AMDGPUTargetMachine::addAnalysisPasses(PassManagerBase &PM) {
132 // Add first the target-independent BasicTTI pass, then our AMDGPU pass. This
133 // allows the AMDGPU pass to delegate to the target independent layer when
134 // appropriate.
135 PM.add(createBasicTargetTransformInfoPass(this));
136 PM.add(createAMDGPUTargetTransformInfoPass(this));
137}
138
Tom Stellard75aadc22012-12-11 21:25:42 +0000139bool
140AMDGPUPassConfig::addPreISel() {
Tom Stellardf8794352012-12-19 22:10:31 +0000141 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellardaa664d92013-08-06 02:43:45 +0000142 addPass(createFlattenCFGPass());
Tom Stellard66df8a22013-11-18 19:43:44 +0000143 if (ST.IsIRStructurizerEnabled())
Tom Stellarded0ceec2013-10-10 17:11:12 +0000144 addPass(createStructurizeCFGPass());
Matt Arsenaultd0ce2bd2014-02-24 21:01:23 +0000145 if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) {
Vincent Lejeune4ee6dd62013-10-13 17:56:21 +0000146 addPass(createSinkingPass());
Tom Stellard9fa17912013-08-14 23:24:45 +0000147 addPass(createSITypeRewriter());
Tom Stellardf8794352012-12-19 22:10:31 +0000148 addPass(createSIAnnotateControlFlowPass());
Vincent Lejeuned3eed662013-05-17 16:50:20 +0000149 } else {
150 addPass(createR600TextureIntrinsicsReplacer());
Tom Stellardf8794352012-12-19 22:10:31 +0000151 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000152 return false;
153}
154
155bool AMDGPUPassConfig::addInstSelector() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000156 addPass(createAMDGPUISelDag(getAMDGPUTargetMachine()));
157 return false;
158}
159
160bool AMDGPUPassConfig::addPreRegAlloc() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000161 addPass(createAMDGPUConvertToISAPass(*TM));
Vincent Lejeunedec18752013-06-05 21:38:04 +0000162 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000163
164 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000165 addPass(createR600VectorRegMerger(*TM));
Tom Stellard2f7cdda2013-08-06 23:08:28 +0000166 } else {
167 addPass(createSIFixSGPRCopiesPass(*TM));
Vincent Lejeunedec18752013-06-05 21:38:04 +0000168 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000169 return false;
170}
171
172bool AMDGPUPassConfig::addPostRegAlloc() {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000173 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
174
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000175 if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000176 addPass(createSIInsertWaits(*TM));
177 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000178 return false;
179}
180
181bool AMDGPUPassConfig::addPreSched2() {
Vincent Lejeunece499742013-07-09 15:03:33 +0000182 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellard75aadc22012-12-11 21:25:42 +0000183
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000184 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
Tom Stellard1de55822013-12-11 17:51:41 +0000185 addPass(createR600EmitClauseMarkers());
Tom Stellard783893a2013-11-18 19:43:33 +0000186 if (ST.isIfCvtEnabled())
187 addPass(&IfConverterID);
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000188 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
189 addPass(createR600ClauseMergePass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000190 return false;
191}
192
193bool AMDGPUPassConfig::addPreEmitPass() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000194 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000195 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardf2ba9722013-12-11 17:51:47 +0000196 addPass(createAMDGPUCFGStructurizerPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000197 addPass(createR600ExpandSpecialInstrsPass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000198 addPass(&FinalizeMachineBundlesID);
Vincent Lejeune147700b2013-04-30 00:14:27 +0000199 addPass(createR600Packetizer(*TM));
200 addPass(createR600ControlFlowFinalizer(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000201 } else {
Tom Stellard75aadc22012-12-11 21:25:42 +0000202 addPass(createSILowerControlFlowPass(*TM));
203 }
204
205 return false;
206}