Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 1 | //===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | /// \file |
| 11 | /// \brief The AMDGPU target machine contains all of the hardware specific |
| 12 | /// information needed to emit code for R600 and SI GPUs. |
| 13 | // |
| 14 | //===----------------------------------------------------------------------===// |
| 15 | |
| 16 | #include "AMDGPUTargetMachine.h" |
| 17 | #include "AMDGPU.h" |
| 18 | #include "R600ISelLowering.h" |
| 19 | #include "R600InstrInfo.h" |
Vincent Lejeune | 68b6b6d | 2013-03-05 18:41:32 +0000 | [diff] [blame] | 20 | #include "R600MachineScheduler.h" |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 21 | #include "SIISelLowering.h" |
| 22 | #include "SIInstrInfo.h" |
| 23 | #include "llvm/Analysis/Passes.h" |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 24 | #include "llvm/CodeGen/MachineFunctionAnalysis.h" |
| 25 | #include "llvm/CodeGen/MachineModuleInfo.h" |
| 26 | #include "llvm/CodeGen/Passes.h" |
Chandler Carruth | 5ad5f15 | 2014-01-13 09:26:24 +0000 | [diff] [blame] | 27 | #include "llvm/IR/Verifier.h" |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 28 | #include "llvm/MC/MCAsmInfo.h" |
| 29 | #include "llvm/PassManager.h" |
| 30 | #include "llvm/Support/TargetRegistry.h" |
| 31 | #include "llvm/Support/raw_os_ostream.h" |
| 32 | #include "llvm/Transforms/IPO.h" |
| 33 | #include "llvm/Transforms/Scalar.h" |
| 34 | #include <llvm/CodeGen/Passes.h> |
| 35 | |
| 36 | using namespace llvm; |
| 37 | |
| 38 | extern "C" void LLVMInitializeR600Target() { |
| 39 | // Register the target |
| 40 | RegisterTargetMachine<AMDGPUTargetMachine> X(TheAMDGPUTarget); |
| 41 | } |
| 42 | |
Vincent Lejeune | 68b6b6d | 2013-03-05 18:41:32 +0000 | [diff] [blame] | 43 | static ScheduleDAGInstrs *createR600MachineScheduler(MachineSchedContext *C) { |
David Blaikie | 422b93d | 2014-04-21 20:32:32 +0000 | [diff] [blame] | 44 | return new ScheduleDAGMILive(C, make_unique<R600SchedStrategy>()); |
Vincent Lejeune | 68b6b6d | 2013-03-05 18:41:32 +0000 | [diff] [blame] | 45 | } |
| 46 | |
| 47 | static MachineSchedRegistry |
| 48 | SchedCustomRegistry("r600", "Run R600's custom scheduler", |
| 49 | createR600MachineScheduler); |
| 50 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 51 | AMDGPUTargetMachine::AMDGPUTargetMachine(const Target &T, StringRef TT, |
Eric Christopher | ac4b69e | 2014-07-25 22:22:39 +0000 | [diff] [blame] | 52 | StringRef CPU, StringRef FS, |
| 53 | TargetOptions Options, Reloc::Model RM, |
| 54 | CodeModel::Model CM, |
| 55 | CodeGenOpt::Level OptLevel) |
| 56 | : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OptLevel), |
Eric Christopher | 34aaf97 | 2014-08-04 17:37:43 +0000 | [diff] [blame] | 57 | Subtarget(TT, CPU, FS, *this), IntrinsicInfo() { |
Vincent Lejeune | 92b0a64 | 2013-12-07 01:49:19 +0000 | [diff] [blame] | 58 | setRequiresStructuredCFG(true); |
Rafael Espindola | 227144c | 2013-05-13 01:16:13 +0000 | [diff] [blame] | 59 | initAsmInfo(); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 60 | } |
| 61 | |
| 62 | AMDGPUTargetMachine::~AMDGPUTargetMachine() { |
| 63 | } |
| 64 | |
| 65 | namespace { |
| 66 | class AMDGPUPassConfig : public TargetPassConfig { |
| 67 | public: |
| 68 | AMDGPUPassConfig(AMDGPUTargetMachine *TM, PassManagerBase &PM) |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 69 | : TargetPassConfig(TM, PM) {} |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 70 | |
| 71 | AMDGPUTargetMachine &getAMDGPUTargetMachine() const { |
| 72 | return getTM<AMDGPUTargetMachine>(); |
| 73 | } |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 74 | |
Craig Topper | 5656db4 | 2014-04-29 07:57:24 +0000 | [diff] [blame] | 75 | ScheduleDAGInstrs * |
| 76 | createMachineScheduler(MachineSchedContext *C) const override { |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 77 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
| 78 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) |
| 79 | return createR600MachineScheduler(C); |
Craig Topper | 062a2ba | 2014-04-25 05:30:21 +0000 | [diff] [blame] | 80 | return nullptr; |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 81 | } |
| 82 | |
Tom Stellard | 5cbb53c | 2014-11-03 19:49:05 +0000 | [diff] [blame] | 83 | void addIRPasses() override; |
Benjamin Kramer | 8c90fd7 | 2014-09-03 11:41:21 +0000 | [diff] [blame] | 84 | void addCodeGenPrepare() override; |
Craig Topper | 5656db4 | 2014-04-29 07:57:24 +0000 | [diff] [blame] | 85 | bool addPreISel() override; |
| 86 | bool addInstSelector() override; |
| 87 | bool addPreRegAlloc() override; |
| 88 | bool addPostRegAlloc() override; |
| 89 | bool addPreSched2() override; |
| 90 | bool addPreEmitPass() override; |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 91 | }; |
| 92 | } // End of anonymous namespace |
| 93 | |
| 94 | TargetPassConfig *AMDGPUTargetMachine::createPassConfig(PassManagerBase &PM) { |
| 95 | return new AMDGPUPassConfig(this, PM); |
| 96 | } |
| 97 | |
Tom Stellard | 8b1e021 | 2013-07-27 00:01:07 +0000 | [diff] [blame] | 98 | //===----------------------------------------------------------------------===// |
| 99 | // AMDGPU Analysis Pass Setup |
| 100 | //===----------------------------------------------------------------------===// |
| 101 | |
| 102 | void AMDGPUTargetMachine::addAnalysisPasses(PassManagerBase &PM) { |
| 103 | // Add first the target-independent BasicTTI pass, then our AMDGPU pass. This |
| 104 | // allows the AMDGPU pass to delegate to the target independent layer when |
| 105 | // appropriate. |
| 106 | PM.add(createBasicTargetTransformInfoPass(this)); |
| 107 | PM.add(createAMDGPUTargetTransformInfoPass(this)); |
| 108 | } |
| 109 | |
Tom Stellard | 5cbb53c | 2014-11-03 19:49:05 +0000 | [diff] [blame] | 110 | void AMDGPUPassConfig::addIRPasses() { |
| 111 | // Function calls are not supported, so make sure we inline everything. |
| 112 | addPass(createAMDGPUAlwaysInlinePass()); |
| 113 | addPass(createAlwaysInlinerPass()); |
| 114 | // We need to add the barrier noop pass, otherwise adding the function |
| 115 | // inlining pass will cause all of the PassConfigs passes to be run |
| 116 | // one function at a time, which means if we have a nodule with two |
| 117 | // functions, then we will generate code for the first function |
| 118 | // without ever running any passes on the second. |
| 119 | addPass(createBarrierNoopPass()); |
| 120 | TargetPassConfig::addIRPasses(); |
| 121 | } |
| 122 | |
Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 123 | void AMDGPUPassConfig::addCodeGenPrepare() { |
| 124 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Matt Arsenault | d9a23ab | 2014-07-13 02:08:26 +0000 | [diff] [blame] | 125 | if (ST.isPromoteAllocaEnabled()) { |
| 126 | addPass(createAMDGPUPromoteAlloca(ST)); |
| 127 | addPass(createSROAPass()); |
| 128 | } |
| 129 | |
Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 130 | TargetPassConfig::addCodeGenPrepare(); |
| 131 | } |
| 132 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 133 | bool |
| 134 | AMDGPUPassConfig::addPreISel() { |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 135 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | aa664d9 | 2013-08-06 02:43:45 +0000 | [diff] [blame] | 136 | addPass(createFlattenCFGPass()); |
Tom Stellard | 66df8a2 | 2013-11-18 19:43:44 +0000 | [diff] [blame] | 137 | if (ST.IsIRStructurizerEnabled()) |
Tom Stellard | ed0ceec | 2013-10-10 17:11:12 +0000 | [diff] [blame] | 138 | addPass(createStructurizeCFGPass()); |
Matt Arsenault | d0ce2bd | 2014-02-24 21:01:23 +0000 | [diff] [blame] | 139 | if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) { |
Vincent Lejeune | 4ee6dd6 | 2013-10-13 17:56:21 +0000 | [diff] [blame] | 140 | addPass(createSinkingPass()); |
Tom Stellard | 9fa1791 | 2013-08-14 23:24:45 +0000 | [diff] [blame] | 141 | addPass(createSITypeRewriter()); |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 142 | addPass(createSIAnnotateControlFlowPass()); |
Vincent Lejeune | d3eed66 | 2013-05-17 16:50:20 +0000 | [diff] [blame] | 143 | } else { |
| 144 | addPass(createR600TextureIntrinsicsReplacer()); |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 145 | } |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 146 | return false; |
| 147 | } |
| 148 | |
| 149 | bool AMDGPUPassConfig::addInstSelector() { |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 150 | addPass(createAMDGPUISelDag(getAMDGPUTargetMachine())); |
Tom Stellard | 1bd8072 | 2014-04-30 15:31:33 +0000 | [diff] [blame] | 151 | addPass(createSILowerI1CopiesPass()); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 152 | return false; |
| 153 | } |
| 154 | |
| 155 | bool AMDGPUPassConfig::addPreRegAlloc() { |
Vincent Lejeune | dec1875 | 2013-06-05 21:38:04 +0000 | [diff] [blame] | 156 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 157 | |
| 158 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) { |
Vincent Lejeune | dec1875 | 2013-06-05 21:38:04 +0000 | [diff] [blame] | 159 | addPass(createR600VectorRegMerger(*TM)); |
Tom Stellard | 2f7cdda | 2013-08-06 23:08:28 +0000 | [diff] [blame] | 160 | } else { |
| 161 | addPass(createSIFixSGPRCopiesPass(*TM)); |
Tom Stellard | 1583409 | 2014-03-21 15:51:57 +0000 | [diff] [blame] | 162 | // SIFixSGPRCopies can generate a lot of duplicate instructions, |
| 163 | // so we need to run MachineCSE afterwards. |
| 164 | addPass(&MachineCSEID); |
Matt Arsenault | 4103328 | 2014-10-10 22:01:59 +0000 | [diff] [blame] | 165 | |
| 166 | if (getOptLevel() > CodeGenOpt::None && ST.loadStoreOptEnabled()) { |
| 167 | // Don't do this with no optimizations since it throws away debug info by |
| 168 | // merging nonadjacent loads. |
| 169 | |
| 170 | // This should be run after scheduling, but before register allocation. It |
| 171 | // also need extra copies to the address operand to be eliminated. |
| 172 | initializeSILoadStoreOptimizerPass(*PassRegistry::getPassRegistry()); |
| 173 | insertPass(&MachineSchedulerID, &SILoadStoreOptimizerID); |
| 174 | } |
| 175 | |
Tom Stellard | 1aaad69 | 2014-07-21 16:55:33 +0000 | [diff] [blame] | 176 | addPass(createSIShrinkInstructionsPass()); |
Tom Stellard | 60024a0 | 2014-09-24 01:33:24 +0000 | [diff] [blame] | 177 | addPass(createSIFixSGPRLiveRangesPass()); |
Vincent Lejeune | dec1875 | 2013-06-05 21:38:04 +0000 | [diff] [blame] | 178 | } |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 179 | return false; |
| 180 | } |
| 181 | |
| 182 | bool AMDGPUPassConfig::addPostRegAlloc() { |
Tom Stellard | c4cabef | 2013-01-18 21:15:53 +0000 | [diff] [blame] | 183 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
| 184 | |
Tom Stellard | 1aaad69 | 2014-07-21 16:55:33 +0000 | [diff] [blame] | 185 | addPass(createSIShrinkInstructionsPass()); |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 186 | if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) { |
Tom Stellard | c4cabef | 2013-01-18 21:15:53 +0000 | [diff] [blame] | 187 | addPass(createSIInsertWaits(*TM)); |
| 188 | } |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 189 | return false; |
| 190 | } |
| 191 | |
| 192 | bool AMDGPUPassConfig::addPreSched2() { |
Vincent Lejeune | ce49974 | 2013-07-09 15:03:33 +0000 | [diff] [blame] | 193 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 194 | |
Vincent Lejeune | a4da6fb | 2013-10-01 19:32:58 +0000 | [diff] [blame] | 195 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) |
Tom Stellard | 1de5582 | 2013-12-11 17:51:41 +0000 | [diff] [blame] | 196 | addPass(createR600EmitClauseMarkers()); |
Tom Stellard | 783893a | 2013-11-18 19:43:33 +0000 | [diff] [blame] | 197 | if (ST.isIfCvtEnabled()) |
| 198 | addPass(&IfConverterID); |
Vincent Lejeune | a4da6fb | 2013-10-01 19:32:58 +0000 | [diff] [blame] | 199 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) |
| 200 | addPass(createR600ClauseMergePass(*TM)); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 201 | return false; |
| 202 | } |
| 203 | |
| 204 | bool AMDGPUPassConfig::addPreEmitPass() { |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 205 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 206 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) { |
Tom Stellard | f2ba972 | 2013-12-11 17:51:47 +0000 | [diff] [blame] | 207 | addPass(createAMDGPUCFGStructurizerPass()); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 208 | addPass(createR600ExpandSpecialInstrsPass(*TM)); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 209 | addPass(&FinalizeMachineBundlesID); |
Vincent Lejeune | 147700b | 2013-04-30 00:14:27 +0000 | [diff] [blame] | 210 | addPass(createR600Packetizer(*TM)); |
| 211 | addPass(createR600ControlFlowFinalizer(*TM)); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 212 | } else { |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 213 | addPass(createSILowerControlFlowPass(*TM)); |
| 214 | } |
| 215 | |
| 216 | return false; |
| 217 | } |