blob: c5515e6dfa8942a88aa8165ede6c4b80c4126217 [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11/// \brief The AMDGPU target machine contains all of the hardware specific
12/// information needed to emit code for R600 and SI GPUs.
13//
14//===----------------------------------------------------------------------===//
15
16#include "AMDGPUTargetMachine.h"
17#include "AMDGPU.h"
18#include "R600ISelLowering.h"
19#include "R600InstrInfo.h"
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000020#include "R600MachineScheduler.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000021#include "SIISelLowering.h"
22#include "SIInstrInfo.h"
23#include "llvm/Analysis/Passes.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000024#include "llvm/CodeGen/MachineFunctionAnalysis.h"
25#include "llvm/CodeGen/MachineModuleInfo.h"
26#include "llvm/CodeGen/Passes.h"
Chandler Carruth5ad5f152014-01-13 09:26:24 +000027#include "llvm/IR/Verifier.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000028#include "llvm/MC/MCAsmInfo.h"
29#include "llvm/PassManager.h"
30#include "llvm/Support/TargetRegistry.h"
31#include "llvm/Support/raw_os_ostream.h"
32#include "llvm/Transforms/IPO.h"
33#include "llvm/Transforms/Scalar.h"
34#include <llvm/CodeGen/Passes.h>
35
36using namespace llvm;
37
38extern "C" void LLVMInitializeR600Target() {
39 // Register the target
40 RegisterTargetMachine<AMDGPUTargetMachine> X(TheAMDGPUTarget);
41}
42
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000043static ScheduleDAGInstrs *createR600MachineScheduler(MachineSchedContext *C) {
David Blaikie422b93d2014-04-21 20:32:32 +000044 return new ScheduleDAGMILive(C, make_unique<R600SchedStrategy>());
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000045}
46
47static MachineSchedRegistry
48SchedCustomRegistry("r600", "Run R600's custom scheduler",
49 createR600MachineScheduler);
50
Tom Stellard75aadc22012-12-11 21:25:42 +000051AMDGPUTargetMachine::AMDGPUTargetMachine(const Target &T, StringRef TT,
Eric Christopherac4b69e2014-07-25 22:22:39 +000052 StringRef CPU, StringRef FS,
53 TargetOptions Options, Reloc::Model RM,
54 CodeModel::Model CM,
55 CodeGenOpt::Level OptLevel)
56 : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OptLevel),
57 Subtarget(TT, CPU, FS, *this) {
Vincent Lejeune92b0a642013-12-07 01:49:19 +000058 setRequiresStructuredCFG(true);
Rafael Espindola227144c2013-05-13 01:16:13 +000059 initAsmInfo();
Tom Stellard75aadc22012-12-11 21:25:42 +000060}
61
62AMDGPUTargetMachine::~AMDGPUTargetMachine() {
63}
64
65namespace {
66class AMDGPUPassConfig : public TargetPassConfig {
67public:
68 AMDGPUPassConfig(AMDGPUTargetMachine *TM, PassManagerBase &PM)
Andrew Trick978674b2013-09-20 05:14:41 +000069 : TargetPassConfig(TM, PM) {}
Tom Stellard75aadc22012-12-11 21:25:42 +000070
71 AMDGPUTargetMachine &getAMDGPUTargetMachine() const {
72 return getTM<AMDGPUTargetMachine>();
73 }
Andrew Trick978674b2013-09-20 05:14:41 +000074
Craig Topper5656db42014-04-29 07:57:24 +000075 ScheduleDAGInstrs *
76 createMachineScheduler(MachineSchedContext *C) const override {
Andrew Trick978674b2013-09-20 05:14:41 +000077 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
78 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
79 return createR600MachineScheduler(C);
Craig Topper062a2ba2014-04-25 05:30:21 +000080 return nullptr;
Andrew Trick978674b2013-09-20 05:14:41 +000081 }
82
Tom Stellard880a80a2014-06-17 16:53:14 +000083 virtual void addCodeGenPrepare();
Craig Topper5656db42014-04-29 07:57:24 +000084 bool addPreISel() override;
85 bool addInstSelector() override;
86 bool addPreRegAlloc() override;
87 bool addPostRegAlloc() override;
88 bool addPreSched2() override;
89 bool addPreEmitPass() override;
Tom Stellard75aadc22012-12-11 21:25:42 +000090};
91} // End of anonymous namespace
92
93TargetPassConfig *AMDGPUTargetMachine::createPassConfig(PassManagerBase &PM) {
94 return new AMDGPUPassConfig(this, PM);
95}
96
Tom Stellard8b1e0212013-07-27 00:01:07 +000097//===----------------------------------------------------------------------===//
98// AMDGPU Analysis Pass Setup
99//===----------------------------------------------------------------------===//
100
101void AMDGPUTargetMachine::addAnalysisPasses(PassManagerBase &PM) {
102 // Add first the target-independent BasicTTI pass, then our AMDGPU pass. This
103 // allows the AMDGPU pass to delegate to the target independent layer when
104 // appropriate.
105 PM.add(createBasicTargetTransformInfoPass(this));
106 PM.add(createAMDGPUTargetTransformInfoPass(this));
107}
108
Tom Stellard880a80a2014-06-17 16:53:14 +0000109void AMDGPUPassConfig::addCodeGenPrepare() {
110 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Matt Arsenaultd9a23ab2014-07-13 02:08:26 +0000111 if (ST.isPromoteAllocaEnabled()) {
112 addPass(createAMDGPUPromoteAlloca(ST));
113 addPass(createSROAPass());
114 }
115
Tom Stellard880a80a2014-06-17 16:53:14 +0000116 TargetPassConfig::addCodeGenPrepare();
117}
118
Tom Stellard75aadc22012-12-11 21:25:42 +0000119bool
120AMDGPUPassConfig::addPreISel() {
Tom Stellardf8794352012-12-19 22:10:31 +0000121 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellardaa664d92013-08-06 02:43:45 +0000122 addPass(createFlattenCFGPass());
Tom Stellard66df8a22013-11-18 19:43:44 +0000123 if (ST.IsIRStructurizerEnabled())
Tom Stellarded0ceec2013-10-10 17:11:12 +0000124 addPass(createStructurizeCFGPass());
Matt Arsenaultd0ce2bd2014-02-24 21:01:23 +0000125 if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) {
Vincent Lejeune4ee6dd62013-10-13 17:56:21 +0000126 addPass(createSinkingPass());
Tom Stellard9fa17912013-08-14 23:24:45 +0000127 addPass(createSITypeRewriter());
Tom Stellardf8794352012-12-19 22:10:31 +0000128 addPass(createSIAnnotateControlFlowPass());
Vincent Lejeuned3eed662013-05-17 16:50:20 +0000129 } else {
130 addPass(createR600TextureIntrinsicsReplacer());
Tom Stellardf8794352012-12-19 22:10:31 +0000131 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000132 return false;
133}
134
135bool AMDGPUPassConfig::addInstSelector() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000136 addPass(createAMDGPUISelDag(getAMDGPUTargetMachine()));
Tom Stellard1bd80722014-04-30 15:31:33 +0000137 addPass(createSILowerI1CopiesPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000138 return false;
139}
140
141bool AMDGPUPassConfig::addPreRegAlloc() {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000142 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000143
144 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000145 addPass(createR600VectorRegMerger(*TM));
Tom Stellard2f7cdda2013-08-06 23:08:28 +0000146 } else {
147 addPass(createSIFixSGPRCopiesPass(*TM));
Tom Stellard15834092014-03-21 15:51:57 +0000148 // SIFixSGPRCopies can generate a lot of duplicate instructions,
149 // so we need to run MachineCSE afterwards.
150 addPass(&MachineCSEID);
Tom Stellard1aaad692014-07-21 16:55:33 +0000151 addPass(createSIShrinkInstructionsPass());
Tom Stellardb2de94e2014-07-02 20:53:48 +0000152 initializeSIFixSGPRLiveRangesPass(*PassRegistry::getPassRegistry());
153 insertPass(&RegisterCoalescerID, &SIFixSGPRLiveRangesID);
Vincent Lejeunedec18752013-06-05 21:38:04 +0000154 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000155 return false;
156}
157
158bool AMDGPUPassConfig::addPostRegAlloc() {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000159 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
160
Tom Stellard1aaad692014-07-21 16:55:33 +0000161 addPass(createSIShrinkInstructionsPass());
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000162 if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000163 addPass(createSIInsertWaits(*TM));
164 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000165 return false;
166}
167
168bool AMDGPUPassConfig::addPreSched2() {
Vincent Lejeunece499742013-07-09 15:03:33 +0000169 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellard75aadc22012-12-11 21:25:42 +0000170
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000171 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
Tom Stellard1de55822013-12-11 17:51:41 +0000172 addPass(createR600EmitClauseMarkers());
Tom Stellard783893a2013-11-18 19:43:33 +0000173 if (ST.isIfCvtEnabled())
174 addPass(&IfConverterID);
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000175 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
176 addPass(createR600ClauseMergePass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000177 return false;
178}
179
180bool AMDGPUPassConfig::addPreEmitPass() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000181 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000182 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardf2ba9722013-12-11 17:51:47 +0000183 addPass(createAMDGPUCFGStructurizerPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000184 addPass(createR600ExpandSpecialInstrsPass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000185 addPass(&FinalizeMachineBundlesID);
Vincent Lejeune147700b2013-04-30 00:14:27 +0000186 addPass(createR600Packetizer(*TM));
187 addPass(createR600ControlFlowFinalizer(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000188 } else {
Tom Stellard75aadc22012-12-11 21:25:42 +0000189 addPass(createSILowerControlFlowPass(*TM));
190 }
191
192 return false;
193}