blob: c95a9410ff6a9776f1c9a444ec9a3074a529babc [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11/// \brief The AMDGPU target machine contains all of the hardware specific
12/// information needed to emit code for R600 and SI GPUs.
13//
14//===----------------------------------------------------------------------===//
15
16#include "AMDGPUTargetMachine.h"
17#include "AMDGPU.h"
18#include "R600ISelLowering.h"
19#include "R600InstrInfo.h"
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000020#include "R600MachineScheduler.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000021#include "SIISelLowering.h"
22#include "SIInstrInfo.h"
23#include "llvm/Analysis/Passes.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000024#include "llvm/CodeGen/MachineFunctionAnalysis.h"
25#include "llvm/CodeGen/MachineModuleInfo.h"
26#include "llvm/CodeGen/Passes.h"
Chandler Carruth5ad5f152014-01-13 09:26:24 +000027#include "llvm/IR/Verifier.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000028#include "llvm/MC/MCAsmInfo.h"
29#include "llvm/PassManager.h"
30#include "llvm/Support/TargetRegistry.h"
31#include "llvm/Support/raw_os_ostream.h"
32#include "llvm/Transforms/IPO.h"
33#include "llvm/Transforms/Scalar.h"
34#include <llvm/CodeGen/Passes.h>
35
36using namespace llvm;
37
38extern "C" void LLVMInitializeR600Target() {
39 // Register the target
40 RegisterTargetMachine<AMDGPUTargetMachine> X(TheAMDGPUTarget);
41}
42
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000043static ScheduleDAGInstrs *createR600MachineScheduler(MachineSchedContext *C) {
David Blaikie422b93d2014-04-21 20:32:32 +000044 return new ScheduleDAGMILive(C, make_unique<R600SchedStrategy>());
Vincent Lejeune68b6b6d2013-03-05 18:41:32 +000045}
46
47static MachineSchedRegistry
48SchedCustomRegistry("r600", "Run R600's custom scheduler",
49 createR600MachineScheduler);
50
Tom Stellard75aadc22012-12-11 21:25:42 +000051AMDGPUTargetMachine::AMDGPUTargetMachine(const Target &T, StringRef TT,
Eric Christopherac4b69e2014-07-25 22:22:39 +000052 StringRef CPU, StringRef FS,
53 TargetOptions Options, Reloc::Model RM,
54 CodeModel::Model CM,
55 CodeGenOpt::Level OptLevel)
56 : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OptLevel),
Eric Christopher34aaf972014-08-04 17:37:43 +000057 Subtarget(TT, CPU, FS, *this), IntrinsicInfo() {
Vincent Lejeune92b0a642013-12-07 01:49:19 +000058 setRequiresStructuredCFG(true);
Rafael Espindola227144c2013-05-13 01:16:13 +000059 initAsmInfo();
Tom Stellard75aadc22012-12-11 21:25:42 +000060}
61
62AMDGPUTargetMachine::~AMDGPUTargetMachine() {
63}
64
65namespace {
66class AMDGPUPassConfig : public TargetPassConfig {
67public:
68 AMDGPUPassConfig(AMDGPUTargetMachine *TM, PassManagerBase &PM)
Andrew Trick978674b2013-09-20 05:14:41 +000069 : TargetPassConfig(TM, PM) {}
Tom Stellard75aadc22012-12-11 21:25:42 +000070
71 AMDGPUTargetMachine &getAMDGPUTargetMachine() const {
72 return getTM<AMDGPUTargetMachine>();
73 }
Andrew Trick978674b2013-09-20 05:14:41 +000074
Craig Topper5656db42014-04-29 07:57:24 +000075 ScheduleDAGInstrs *
76 createMachineScheduler(MachineSchedContext *C) const override {
Andrew Trick978674b2013-09-20 05:14:41 +000077 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
78 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
79 return createR600MachineScheduler(C);
Craig Topper062a2ba2014-04-25 05:30:21 +000080 return nullptr;
Andrew Trick978674b2013-09-20 05:14:41 +000081 }
82
Benjamin Kramer8c90fd72014-09-03 11:41:21 +000083 void addCodeGenPrepare() override;
Craig Topper5656db42014-04-29 07:57:24 +000084 bool addPreISel() override;
85 bool addInstSelector() override;
86 bool addPreRegAlloc() override;
87 bool addPostRegAlloc() override;
88 bool addPreSched2() override;
89 bool addPreEmitPass() override;
Tom Stellard75aadc22012-12-11 21:25:42 +000090};
91} // End of anonymous namespace
92
93TargetPassConfig *AMDGPUTargetMachine::createPassConfig(PassManagerBase &PM) {
94 return new AMDGPUPassConfig(this, PM);
95}
96
Tom Stellard8b1e0212013-07-27 00:01:07 +000097//===----------------------------------------------------------------------===//
98// AMDGPU Analysis Pass Setup
99//===----------------------------------------------------------------------===//
100
101void AMDGPUTargetMachine::addAnalysisPasses(PassManagerBase &PM) {
102 // Add first the target-independent BasicTTI pass, then our AMDGPU pass. This
103 // allows the AMDGPU pass to delegate to the target independent layer when
104 // appropriate.
105 PM.add(createBasicTargetTransformInfoPass(this));
106 PM.add(createAMDGPUTargetTransformInfoPass(this));
107}
108
Tom Stellard880a80a2014-06-17 16:53:14 +0000109void AMDGPUPassConfig::addCodeGenPrepare() {
110 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Matt Arsenaultd9a23ab2014-07-13 02:08:26 +0000111 if (ST.isPromoteAllocaEnabled()) {
112 addPass(createAMDGPUPromoteAlloca(ST));
113 addPass(createSROAPass());
114 }
115
Tom Stellard880a80a2014-06-17 16:53:14 +0000116 TargetPassConfig::addCodeGenPrepare();
117}
118
Tom Stellard75aadc22012-12-11 21:25:42 +0000119bool
120AMDGPUPassConfig::addPreISel() {
Tom Stellardf8794352012-12-19 22:10:31 +0000121 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellardaa664d92013-08-06 02:43:45 +0000122 addPass(createFlattenCFGPass());
Tom Stellard66df8a22013-11-18 19:43:44 +0000123 if (ST.IsIRStructurizerEnabled())
Tom Stellarded0ceec2013-10-10 17:11:12 +0000124 addPass(createStructurizeCFGPass());
Matt Arsenaultd0ce2bd2014-02-24 21:01:23 +0000125 if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) {
Vincent Lejeune4ee6dd62013-10-13 17:56:21 +0000126 addPass(createSinkingPass());
Tom Stellard9fa17912013-08-14 23:24:45 +0000127 addPass(createSITypeRewriter());
Tom Stellardf8794352012-12-19 22:10:31 +0000128 addPass(createSIAnnotateControlFlowPass());
Vincent Lejeuned3eed662013-05-17 16:50:20 +0000129 } else {
130 addPass(createR600TextureIntrinsicsReplacer());
Tom Stellardf8794352012-12-19 22:10:31 +0000131 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000132 return false;
133}
134
135bool AMDGPUPassConfig::addInstSelector() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000136 addPass(createAMDGPUISelDag(getAMDGPUTargetMachine()));
Tom Stellard1bd80722014-04-30 15:31:33 +0000137 addPass(createSILowerI1CopiesPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000138 return false;
139}
140
141bool AMDGPUPassConfig::addPreRegAlloc() {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000142 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000143
144 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Vincent Lejeunedec18752013-06-05 21:38:04 +0000145 addPass(createR600VectorRegMerger(*TM));
Tom Stellard2f7cdda2013-08-06 23:08:28 +0000146 } else {
147 addPass(createSIFixSGPRCopiesPass(*TM));
Tom Stellard15834092014-03-21 15:51:57 +0000148 // SIFixSGPRCopies can generate a lot of duplicate instructions,
149 // so we need to run MachineCSE afterwards.
150 addPass(&MachineCSEID);
Tom Stellard1aaad692014-07-21 16:55:33 +0000151 addPass(createSIShrinkInstructionsPass());
Tom Stellard60024a02014-09-24 01:33:24 +0000152 addPass(createSIFixSGPRLiveRangesPass());
Vincent Lejeunedec18752013-06-05 21:38:04 +0000153 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000154 return false;
155}
156
157bool AMDGPUPassConfig::addPostRegAlloc() {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000158 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
159
Tom Stellard1aaad692014-07-21 16:55:33 +0000160 addPass(createSIShrinkInstructionsPass());
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000161 if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardc4cabef2013-01-18 21:15:53 +0000162 addPass(createSIInsertWaits(*TM));
163 }
Tom Stellard75aadc22012-12-11 21:25:42 +0000164 return false;
165}
166
167bool AMDGPUPassConfig::addPreSched2() {
Vincent Lejeunece499742013-07-09 15:03:33 +0000168 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellard75aadc22012-12-11 21:25:42 +0000169
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000170 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
Tom Stellard1de55822013-12-11 17:51:41 +0000171 addPass(createR600EmitClauseMarkers());
Tom Stellard783893a2013-11-18 19:43:33 +0000172 if (ST.isIfCvtEnabled())
173 addPass(&IfConverterID);
Vincent Lejeunea4da6fb2013-10-01 19:32:58 +0000174 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS)
175 addPass(createR600ClauseMergePass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000176 return false;
177}
178
179bool AMDGPUPassConfig::addPreEmitPass() {
Tom Stellard75aadc22012-12-11 21:25:42 +0000180 const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>();
Tom Stellarda6c6e1b2013-06-07 20:37:48 +0000181 if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) {
Tom Stellardf2ba9722013-12-11 17:51:47 +0000182 addPass(createAMDGPUCFGStructurizerPass());
Tom Stellard75aadc22012-12-11 21:25:42 +0000183 addPass(createR600ExpandSpecialInstrsPass(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000184 addPass(&FinalizeMachineBundlesID);
Vincent Lejeune147700b2013-04-30 00:14:27 +0000185 addPass(createR600Packetizer(*TM));
186 addPass(createR600ControlFlowFinalizer(*TM));
Tom Stellard75aadc22012-12-11 21:25:42 +0000187 } else {
Tom Stellard75aadc22012-12-11 21:25:42 +0000188 addPass(createSILowerControlFlowPass(*TM));
189 }
190
191 return false;
192}