blob: 762a17ae071a6df638f3a6704c4de2f4deae1380 [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11/// \brief The AMDGPU target machine contains all of the hardware specific
12/// information needed to emit code for R600 and SI GPUs.
13//
14//===----------------------------------------------------------------------===//
15
16#include "AMDGPUTargetMachine.h"
17#include "AMDGPU.h"
18#include "R600ISelLowering.h"
19#include "R600InstrInfo.h"
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000020#include "R600MachineScheduler.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000021#include "SIISelLowering.h"
22#include "SIInstrInfo.h"
23#include "llvm/Analysis/Passes.h"
24#include "llvm/Analysis/Verifier.h"
25#include "llvm/CodeGen/MachineFunctionAnalysis.h"
26#include "llvm/CodeGen/MachineModuleInfo.h"
27#include "llvm/CodeGen/Passes.h"
28#include "llvm/MC/MCAsmInfo.h"
29#include "llvm/PassManager.h"
30#include "llvm/Support/TargetRegistry.h"
31#include "llvm/Support/raw_os_ostream.h"
32#include "llvm/Transforms/IPO.h"
33#include "llvm/Transforms/Scalar.h"
34#include <llvm/CodeGen/Passes.h>
35
Tom Stellarded0ceec2013-10-10 17:11:12 +000036
Tom Stellard75aadc22012-12-11 21:25:42 +000037using namespace llvm;
38
39extern "C" void LLVMInitializeR600Target() {
40 // Register the target
41 RegisterTargetMachine<AMDGPUTargetMachine> X(TheAMDGPUTarget);
42}
43
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000044static ScheduleDAGInstrs *createR600MachineScheduler(MachineSchedContext *C) {
45 return new ScheduleDAGMI(C, new R600SchedStrategy());
46}
47
48static MachineSchedRegistry
49SchedCustomRegistry("r600", "Run R600's custom scheduler",
50 createR600MachineScheduler);
51
Rafael Espindolaceb0c492013-12-14 06:13:44 +000052static std::string computeDataLayout(const AMDGPUSubtarget &ST) {
53 std::string DataLayout = std::string(
54 "e"
55 "-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32"
56 "-v16:16:16-v24:32:32-v32:32:32-v48:64:64-v64:64:64-v96:128:128-v128:128:128"
57 "-v192:256:256-v256:256:256-v512:512:512-v1024:1024:1024-v2048:2048:2048"
58 "-n32:64"
59 );
60
61 if (ST.hasHWFP64())
62 DataLayout.append("-f64:64:64");
63
64 if (ST.is64bit())
65 DataLayout.append("-p:64:64:64");
66 else
67 DataLayout.append("-p:32:32:32");
68
69 if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS)
70 DataLayout.append("-p3:32:32:32");
71
72 return DataLayout;
73}
74
Tom Stellard75aadc22012-12-11 21:25:42 +000075AMDGPUTargetMachine::AMDGPUTargetMachine(const Target &T, StringRef TT,
76 StringRef CPU, StringRef FS,
77 TargetOptions Options,
78 Reloc::Model RM, CodeModel::Model CM,
79 CodeGenOpt::Level OptLevel
80)
81:
82 LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OptLevel),
83 Subtarget(TT, CPU, FS),
Rafael Espindolaceb0c492013-12-14 06:13:44 +000084 Layout(computeDataLayout(Subtarget)),
Tom Stellardaf775432013-10-23 00:44:32 +000085 FrameLowering(TargetFrameLowering::StackGrowsUp,
86 64 * 16 // Maximum stack alignment (long16)
87 , 0),
Tom Stellard75aadc22012-12-11 21:25:42 +000088 IntrinsicInfo(this),
89 InstrItins(&Subtarget.getInstrItineraryData()) {
90 // TLInfo uses InstrInfo so it must be initialized after.
Tom Stellarda6c6e1b2013-06-07 20:37:48 +000091 if (Subtarget.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Rafael Espindola39aca622013-05-23 03:31:47 +000092 InstrInfo.reset(new R600InstrInfo(*this));
93 TLInfo.reset(new R600TargetLowering(*this));
Tom Stellard75aadc22012-12-11 21:25:42 +000094 } else {
Rafael Espindola39aca622013-05-23 03:31:47 +000095 InstrInfo.reset(new SIInstrInfo(*this));
96 TLInfo.reset(new SITargetLowering(*this));
Tom Stellard75aadc22012-12-11 21:25:42 +000097 }
Vincent Lejeune92b0a642013-12-07 01:49:19 +000098 setRequiresStructuredCFG(true);
Rafael Espindola227144c2013-05-13 01:16:13 +000099 initAsmInfo();
Tom Stellard75aadc22012-12-11 21:25:42 +0000100}
101
102AMDGPUTargetMachine::~AMDGPUTargetMachine() {
103}
104
105namespace {
106class AMDGPUPassConfig : public TargetPassConfig {
107public:
108 AMDGPUPassConfig(AMDGPUTargetMachine *TM, PassManagerBase &PM)
Andrew Trick978674b2013-09-20 05:14:41 +0000109 : TargetPassConfig(TM, PM) {}
Tom Stellard75aadc22012-12-11 21:25:42 +0000110
111 AMDGPUTargetMachine &getAMDGPUTargetMachine() const {
112 return getTM<AMDGPUTargetMachine>();
113 }
Andrew Trick978674b2013-09-20 05:14:41 +0000114
115 virtual ScheduleDAGInstrs *
116 createMachineScheduler(MachineSchedContext *C) const {
117 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
118 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
119 return createR600MachineScheduler(C);
120 return 0;
121 }
122
Tom Stellard75aadc22012-12-11 21:25:42 +0000123 virtual bool addPreISel();
124 virtual bool addInstSelector();
125 virtual bool addPreRegAlloc();
126 virtual bool addPostRegAlloc();
127 virtual bool addPreSched2();
128 virtual bool addPreEmitPass();
129};
130} // End of anonymous namespace
131
132TargetPassConfig *AMDGPUTargetMachine::createPassConfig(PassManagerBase &PM) {
133 return new AMDGPUPassConfig(this, PM);
134}
135
Tom Stellard8b1e0212013-07-27 00:01:07 +0000136//===----------------------------------------------------------------------===//
137// AMDGPU Analysis Pass Setup
138//===----------------------------------------------------------------------===//
139
140void AMDGPUTargetMachine::addAnalysisPasses(PassManagerBase &PM) {
141 // Add first the target-independent BasicTTI pass, then our AMDGPU pass. This
142 // allows the AMDGPU pass to delegate to the target independent layer when
143 // appropriate.
144 PM.add(createBasicTargetTransformInfoPass(this));
145 PM.add(createAMDGPUTargetTransformInfoPass(this));
146}
147
Tom Stellard75aadc22012-12-11 21:25:42 +0000148bool
149AMDGPUPassConfig::addPreISel() {
Tom Stellardf8794352012-12-19 22:10:31 +0000150 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellardaa664d92013-08-06 02:43:45 +0000151 addPass(createFlattenCFGPass());
Tom Stellard66df8a22013-11-18 19:43:44 +0000152 if (ST.IsIRStructurizerEnabled())
Tom Stellarded0ceec2013-10-10 17:11:12 +0000153 addPass(createStructurizeCFGPass());
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000154 if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) {
Vincent Lejeune4ee6dd62013-10-13 17:56:21 +0000155 addPass(createSinkingPass());
Tom Stellard9fa17912013-08-14 23:24:45 +0000156 addPass(createSITypeRewriter());
Tom Stellardf8794352012-12-19 22:10:31 +0000157 addPass(createSIAnnotateControlFlowPass());
Vincent Lejeuned3eed662013-05-17 16:50:20 +0000158 } else {
159 addPass(createR600TextureIntrinsicsReplacer());
Tom Stellardf8794352012-12-19 22:10:31 +0000160 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000161 return false;
162}
163
164bool AMDGPUPassConfig::addInstSelector() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000165 addPass(createAMDGPUISelDag(getAMDGPUTargetMachine()));
166 return false;
167}
168
169bool AMDGPUPassConfig::addPreRegAlloc() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000170 addPass(createAMDGPUConvertToISAPass(*TM));
Vincent Lejeunedec18752013-06-05 21:38:04 +0000171 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000172
173 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000174 addPass(createR600VectorRegMerger(*TM));
Tom Stellard2f7cdda2013-08-06 23:08:28 +0000175 } else {
176 addPass(createSIFixSGPRCopiesPass(*TM));
Vincent Lejeunedec18752013-06-05 21:38:04 +0000177 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000178 return false;
179}
180
181bool AMDGPUPassConfig::addPostRegAlloc() {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000182 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
183
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000184 if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000185 addPass(createSIInsertWaits(*TM));
186 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000187 return false;
188}
189
190bool AMDGPUPassConfig::addPreSched2() {
Vincent Lejeunece499742013-07-09 15:03:33 +0000191 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellard75aadc22012-12-11 21:25:42 +0000192
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000193 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
Tom Stellard1de55822013-12-11 17:51:41 +0000194 addPass(createR600EmitClauseMarkers());
Tom Stellard783893a2013-11-18 19:43:33 +0000195 if (ST.isIfCvtEnabled())
196 addPass(&IfConverterID);
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000197 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
198 addPass(createR600ClauseMergePass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000199 return false;
200}
201
202bool AMDGPUPassConfig::addPreEmitPass() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000203 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000204 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardf2ba9722013-12-11 17:51:47 +0000205 addPass(createAMDGPUCFGStructurizerPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000206 addPass(createR600ExpandSpecialInstrsPass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000207 addPass(&FinalizeMachineBundlesID);
Vincent Lejeune147700b2013-04-30 00:14:27 +0000208 addPass(createR600Packetizer(*TM));
209 addPass(createR600ControlFlowFinalizer(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000210 } else {
Tom Stellard75aadc22012-12-11 21:25:42 +0000211 addPass(createSILowerControlFlowPass(*TM));
212 }
213
214 return false;
215}