Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 1 | //===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | /// \file |
| 11 | /// \brief The AMDGPU target machine contains all of the hardware specific |
| 12 | /// information needed to emit code for R600 and SI GPUs. |
| 13 | // |
| 14 | //===----------------------------------------------------------------------===// |
| 15 | |
| 16 | #include "AMDGPUTargetMachine.h" |
| 17 | #include "AMDGPU.h" |
| 18 | #include "R600ISelLowering.h" |
| 19 | #include "R600InstrInfo.h" |
Vincent Lejeune | 68b6b6d | 2013-03-05 18:41:32 +0000 | [diff] [blame] | 20 | #include "R600MachineScheduler.h" |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 21 | #include "SIISelLowering.h" |
| 22 | #include "SIInstrInfo.h" |
| 23 | #include "llvm/Analysis/Passes.h" |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 24 | #include "llvm/CodeGen/MachineFunctionAnalysis.h" |
Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 25 | #include "llvm/CodeGen/TargetLoweringObjectFileImpl.h" |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 26 | #include "llvm/CodeGen/MachineModuleInfo.h" |
| 27 | #include "llvm/CodeGen/Passes.h" |
Chandler Carruth | 5ad5f15 | 2014-01-13 09:26:24 +0000 | [diff] [blame] | 28 | #include "llvm/IR/Verifier.h" |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 29 | #include "llvm/MC/MCAsmInfo.h" |
| 30 | #include "llvm/PassManager.h" |
| 31 | #include "llvm/Support/TargetRegistry.h" |
| 32 | #include "llvm/Support/raw_os_ostream.h" |
| 33 | #include "llvm/Transforms/IPO.h" |
| 34 | #include "llvm/Transforms/Scalar.h" |
| 35 | #include <llvm/CodeGen/Passes.h> |
| 36 | |
| 37 | using namespace llvm; |
| 38 | |
| 39 | extern "C" void LLVMInitializeR600Target() { |
| 40 | // Register the target |
| 41 | RegisterTargetMachine<AMDGPUTargetMachine> X(TheAMDGPUTarget); |
| 42 | } |
| 43 | |
Vincent Lejeune | 68b6b6d | 2013-03-05 18:41:32 +0000 | [diff] [blame] | 44 | static ScheduleDAGInstrs *createR600MachineScheduler(MachineSchedContext *C) { |
David Blaikie | 422b93d | 2014-04-21 20:32:32 +0000 | [diff] [blame] | 45 | return new ScheduleDAGMILive(C, make_unique<R600SchedStrategy>()); |
Vincent Lejeune | 68b6b6d | 2013-03-05 18:41:32 +0000 | [diff] [blame] | 46 | } |
| 47 | |
| 48 | static MachineSchedRegistry |
| 49 | SchedCustomRegistry("r600", "Run R600's custom scheduler", |
| 50 | createR600MachineScheduler); |
| 51 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 52 | AMDGPUTargetMachine::AMDGPUTargetMachine(const Target &T, StringRef TT, |
Eric Christopher | ac4b69e | 2014-07-25 22:22:39 +0000 | [diff] [blame] | 53 | StringRef CPU, StringRef FS, |
| 54 | TargetOptions Options, Reloc::Model RM, |
| 55 | CodeModel::Model CM, |
| 56 | CodeGenOpt::Level OptLevel) |
| 57 | : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OptLevel), |
Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 58 | TLOF(new TargetLoweringObjectFileELF()), |
Eric Christopher | 34aaf97 | 2014-08-04 17:37:43 +0000 | [diff] [blame] | 59 | Subtarget(TT, CPU, FS, *this), IntrinsicInfo() { |
Vincent Lejeune | 92b0a64 | 2013-12-07 01:49:19 +0000 | [diff] [blame] | 60 | setRequiresStructuredCFG(true); |
Rafael Espindola | 227144c | 2013-05-13 01:16:13 +0000 | [diff] [blame] | 61 | initAsmInfo(); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 62 | } |
| 63 | |
| 64 | AMDGPUTargetMachine::~AMDGPUTargetMachine() { |
Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 65 | delete TLOF; |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 66 | } |
| 67 | |
| 68 | namespace { |
| 69 | class AMDGPUPassConfig : public TargetPassConfig { |
| 70 | public: |
| 71 | AMDGPUPassConfig(AMDGPUTargetMachine *TM, PassManagerBase &PM) |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 72 | : TargetPassConfig(TM, PM) {} |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 73 | |
| 74 | AMDGPUTargetMachine &getAMDGPUTargetMachine() const { |
| 75 | return getTM<AMDGPUTargetMachine>(); |
| 76 | } |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 77 | |
Craig Topper | 5656db4 | 2014-04-29 07:57:24 +0000 | [diff] [blame] | 78 | ScheduleDAGInstrs * |
| 79 | createMachineScheduler(MachineSchedContext *C) const override { |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 80 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
| 81 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) |
| 82 | return createR600MachineScheduler(C); |
Craig Topper | 062a2ba | 2014-04-25 05:30:21 +0000 | [diff] [blame] | 83 | return nullptr; |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 84 | } |
| 85 | |
Tom Stellard | 5cbb53c | 2014-11-03 19:49:05 +0000 | [diff] [blame] | 86 | void addIRPasses() override; |
Benjamin Kramer | 8c90fd7 | 2014-09-03 11:41:21 +0000 | [diff] [blame] | 87 | void addCodeGenPrepare() override; |
Craig Topper | 5656db4 | 2014-04-29 07:57:24 +0000 | [diff] [blame] | 88 | bool addPreISel() override; |
| 89 | bool addInstSelector() override; |
| 90 | bool addPreRegAlloc() override; |
| 91 | bool addPostRegAlloc() override; |
| 92 | bool addPreSched2() override; |
| 93 | bool addPreEmitPass() override; |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 94 | }; |
| 95 | } // End of anonymous namespace |
| 96 | |
| 97 | TargetPassConfig *AMDGPUTargetMachine::createPassConfig(PassManagerBase &PM) { |
| 98 | return new AMDGPUPassConfig(this, PM); |
| 99 | } |
| 100 | |
Tom Stellard | 8b1e021 | 2013-07-27 00:01:07 +0000 | [diff] [blame] | 101 | //===----------------------------------------------------------------------===// |
| 102 | // AMDGPU Analysis Pass Setup |
| 103 | //===----------------------------------------------------------------------===// |
| 104 | |
| 105 | void AMDGPUTargetMachine::addAnalysisPasses(PassManagerBase &PM) { |
| 106 | // Add first the target-independent BasicTTI pass, then our AMDGPU pass. This |
| 107 | // allows the AMDGPU pass to delegate to the target independent layer when |
| 108 | // appropriate. |
| 109 | PM.add(createBasicTargetTransformInfoPass(this)); |
| 110 | PM.add(createAMDGPUTargetTransformInfoPass(this)); |
| 111 | } |
| 112 | |
Tom Stellard | 5cbb53c | 2014-11-03 19:49:05 +0000 | [diff] [blame] | 113 | void AMDGPUPassConfig::addIRPasses() { |
| 114 | // Function calls are not supported, so make sure we inline everything. |
| 115 | addPass(createAMDGPUAlwaysInlinePass()); |
| 116 | addPass(createAlwaysInlinerPass()); |
| 117 | // We need to add the barrier noop pass, otherwise adding the function |
| 118 | // inlining pass will cause all of the PassConfigs passes to be run |
| 119 | // one function at a time, which means if we have a nodule with two |
| 120 | // functions, then we will generate code for the first function |
| 121 | // without ever running any passes on the second. |
| 122 | addPass(createBarrierNoopPass()); |
| 123 | TargetPassConfig::addIRPasses(); |
| 124 | } |
| 125 | |
Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 126 | void AMDGPUPassConfig::addCodeGenPrepare() { |
| 127 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Matt Arsenault | d9a23ab | 2014-07-13 02:08:26 +0000 | [diff] [blame] | 128 | if (ST.isPromoteAllocaEnabled()) { |
| 129 | addPass(createAMDGPUPromoteAlloca(ST)); |
| 130 | addPass(createSROAPass()); |
| 131 | } |
| 132 | |
Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 133 | TargetPassConfig::addCodeGenPrepare(); |
| 134 | } |
| 135 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 136 | bool |
| 137 | AMDGPUPassConfig::addPreISel() { |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 138 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | aa664d9 | 2013-08-06 02:43:45 +0000 | [diff] [blame] | 139 | addPass(createFlattenCFGPass()); |
Tom Stellard | 66df8a2 | 2013-11-18 19:43:44 +0000 | [diff] [blame] | 140 | if (ST.IsIRStructurizerEnabled()) |
Tom Stellard | ed0ceec | 2013-10-10 17:11:12 +0000 | [diff] [blame] | 141 | addPass(createStructurizeCFGPass()); |
Matt Arsenault | d0ce2bd | 2014-02-24 21:01:23 +0000 | [diff] [blame] | 142 | if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) { |
Vincent Lejeune | 4ee6dd6 | 2013-10-13 17:56:21 +0000 | [diff] [blame] | 143 | addPass(createSinkingPass()); |
Tom Stellard | 9fa1791 | 2013-08-14 23:24:45 +0000 | [diff] [blame] | 144 | addPass(createSITypeRewriter()); |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 145 | addPass(createSIAnnotateControlFlowPass()); |
Vincent Lejeune | d3eed66 | 2013-05-17 16:50:20 +0000 | [diff] [blame] | 146 | } else { |
| 147 | addPass(createR600TextureIntrinsicsReplacer()); |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 148 | } |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 149 | return false; |
| 150 | } |
| 151 | |
| 152 | bool AMDGPUPassConfig::addInstSelector() { |
Matt Arsenault | 162c101 | 2014-11-18 21:06:58 +0000 | [diff] [blame] | 153 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
| 154 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 155 | addPass(createAMDGPUISelDag(getAMDGPUTargetMachine())); |
Matt Arsenault | 162c101 | 2014-11-18 21:06:58 +0000 | [diff] [blame] | 156 | |
| 157 | if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) { |
| 158 | addPass(createSILowerI1CopiesPass()); |
| 159 | addPass(createSIFixSGPRCopiesPass(*TM)); |
Matt Arsenault | 691ae3d | 2014-12-03 05:22:30 +0000 | [diff] [blame] | 160 | addPass(createSIFoldOperandsPass()); |
Matt Arsenault | 162c101 | 2014-11-18 21:06:58 +0000 | [diff] [blame] | 161 | } |
| 162 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 163 | return false; |
| 164 | } |
| 165 | |
| 166 | bool AMDGPUPassConfig::addPreRegAlloc() { |
Vincent Lejeune | dec1875 | 2013-06-05 21:38:04 +0000 | [diff] [blame] | 167 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 168 | |
| 169 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) { |
Vincent Lejeune | dec1875 | 2013-06-05 21:38:04 +0000 | [diff] [blame] | 170 | addPass(createR600VectorRegMerger(*TM)); |
Tom Stellard | 2f7cdda | 2013-08-06 23:08:28 +0000 | [diff] [blame] | 171 | } else { |
Matt Arsenault | 162c101 | 2014-11-18 21:06:58 +0000 | [diff] [blame] | 172 | if (getOptLevel() > CodeGenOpt::None && ST.loadStoreOptEnabled()) { |
Matt Arsenault | 4103328 | 2014-10-10 22:01:59 +0000 | [diff] [blame] | 173 | // Don't do this with no optimizations since it throws away debug info by |
| 174 | // merging nonadjacent loads. |
| 175 | |
| 176 | // This should be run after scheduling, but before register allocation. It |
| 177 | // also need extra copies to the address operand to be eliminated. |
| 178 | initializeSILoadStoreOptimizerPass(*PassRegistry::getPassRegistry()); |
| 179 | insertPass(&MachineSchedulerID, &SILoadStoreOptimizerID); |
| 180 | } |
| 181 | |
Tom Stellard | 1aaad69 | 2014-07-21 16:55:33 +0000 | [diff] [blame] | 182 | addPass(createSIShrinkInstructionsPass()); |
Tom Stellard | 60024a0 | 2014-09-24 01:33:24 +0000 | [diff] [blame] | 183 | addPass(createSIFixSGPRLiveRangesPass()); |
Vincent Lejeune | dec1875 | 2013-06-05 21:38:04 +0000 | [diff] [blame] | 184 | } |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 185 | return false; |
| 186 | } |
| 187 | |
| 188 | bool AMDGPUPassConfig::addPostRegAlloc() { |
Tom Stellard | c4cabef | 2013-01-18 21:15:53 +0000 | [diff] [blame] | 189 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
| 190 | |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 191 | if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) { |
Tom Stellard | 92105e8 | 2014-12-03 18:27:05 +0000 | [diff] [blame] | 192 | addPass(createSIShrinkInstructionsPass()); |
Tom Stellard | c4cabef | 2013-01-18 21:15:53 +0000 | [diff] [blame] | 193 | } |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 194 | return false; |
| 195 | } |
| 196 | |
| 197 | bool AMDGPUPassConfig::addPreSched2() { |
Vincent Lejeune | ce49974 | 2013-07-09 15:03:33 +0000 | [diff] [blame] | 198 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 199 | |
Vincent Lejeune | a4da6fb | 2013-10-01 19:32:58 +0000 | [diff] [blame] | 200 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) |
Tom Stellard | 1de5582 | 2013-12-11 17:51:41 +0000 | [diff] [blame] | 201 | addPass(createR600EmitClauseMarkers()); |
Tom Stellard | 783893a | 2013-11-18 19:43:33 +0000 | [diff] [blame] | 202 | if (ST.isIfCvtEnabled()) |
| 203 | addPass(&IfConverterID); |
Vincent Lejeune | a4da6fb | 2013-10-01 19:32:58 +0000 | [diff] [blame] | 204 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) |
| 205 | addPass(createR600ClauseMergePass(*TM)); |
Tom Stellard | 05cd445 | 2014-12-03 18:27:08 +0000 | [diff] [blame] | 206 | if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) { |
| 207 | addPass(createSIInsertWaits(*TM)); |
| 208 | } |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 209 | return false; |
| 210 | } |
| 211 | |
| 212 | bool AMDGPUPassConfig::addPreEmitPass() { |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 213 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 214 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) { |
Tom Stellard | f2ba972 | 2013-12-11 17:51:47 +0000 | [diff] [blame] | 215 | addPass(createAMDGPUCFGStructurizerPass()); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 216 | addPass(createR600ExpandSpecialInstrsPass(*TM)); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 217 | addPass(&FinalizeMachineBundlesID); |
Vincent Lejeune | 147700b | 2013-04-30 00:14:27 +0000 | [diff] [blame] | 218 | addPass(createR600Packetizer(*TM)); |
| 219 | addPass(createR600ControlFlowFinalizer(*TM)); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 220 | } else { |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 221 | addPass(createSILowerControlFlowPass(*TM)); |
| 222 | } |
| 223 | |
| 224 | return false; |
| 225 | } |