Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 1 | //===-- AMDGPUTargetMachine.cpp - TargetMachine for hw codegen targets-----===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | /// \file |
| 11 | /// \brief The AMDGPU target machine contains all of the hardware specific |
| 12 | /// information needed to emit code for R600 and SI GPUs. |
| 13 | // |
| 14 | //===----------------------------------------------------------------------===// |
| 15 | |
| 16 | #include "AMDGPUTargetMachine.h" |
| 17 | #include "AMDGPU.h" |
| 18 | #include "R600ISelLowering.h" |
| 19 | #include "R600InstrInfo.h" |
Vincent Lejeune | 68b6b6d | 2013-03-05 18:41:32 +0000 | [diff] [blame] | 20 | #include "R600MachineScheduler.h" |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 21 | #include "SIISelLowering.h" |
| 22 | #include "SIInstrInfo.h" |
| 23 | #include "llvm/Analysis/Passes.h" |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 24 | #include "llvm/CodeGen/MachineFunctionAnalysis.h" |
| 25 | #include "llvm/CodeGen/MachineModuleInfo.h" |
| 26 | #include "llvm/CodeGen/Passes.h" |
Chandler Carruth | 5ad5f15 | 2014-01-13 09:26:24 +0000 | [diff] [blame] | 27 | #include "llvm/IR/Verifier.h" |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 28 | #include "llvm/MC/MCAsmInfo.h" |
| 29 | #include "llvm/PassManager.h" |
| 30 | #include "llvm/Support/TargetRegistry.h" |
| 31 | #include "llvm/Support/raw_os_ostream.h" |
| 32 | #include "llvm/Transforms/IPO.h" |
| 33 | #include "llvm/Transforms/Scalar.h" |
| 34 | #include <llvm/CodeGen/Passes.h> |
| 35 | |
Tom Stellard | ed0ceec | 2013-10-10 17:11:12 +0000 | [diff] [blame] | 36 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 37 | using namespace llvm; |
| 38 | |
| 39 | extern "C" void LLVMInitializeR600Target() { |
| 40 | // Register the target |
| 41 | RegisterTargetMachine<AMDGPUTargetMachine> X(TheAMDGPUTarget); |
| 42 | } |
| 43 | |
Vincent Lejeune | 68b6b6d | 2013-03-05 18:41:32 +0000 | [diff] [blame] | 44 | static ScheduleDAGInstrs *createR600MachineScheduler(MachineSchedContext *C) { |
David Blaikie | 422b93d | 2014-04-21 20:32:32 +0000 | [diff] [blame] | 45 | return new ScheduleDAGMILive(C, make_unique<R600SchedStrategy>()); |
Vincent Lejeune | 68b6b6d | 2013-03-05 18:41:32 +0000 | [diff] [blame] | 46 | } |
| 47 | |
| 48 | static MachineSchedRegistry |
| 49 | SchedCustomRegistry("r600", "Run R600's custom scheduler", |
| 50 | createR600MachineScheduler); |
| 51 | |
Rafael Espindola | ceb0c49 | 2013-12-14 06:13:44 +0000 | [diff] [blame] | 52 | static std::string computeDataLayout(const AMDGPUSubtarget &ST) { |
Rafael Espindola | 4fa7975 | 2013-12-19 16:51:03 +0000 | [diff] [blame] | 53 | std::string Ret = "e-p:32:32"; |
Rafael Espindola | ceb0c49 | 2013-12-14 06:13:44 +0000 | [diff] [blame] | 54 | |
Matt Arsenault | a98cd6a | 2013-12-19 05:32:55 +0000 | [diff] [blame] | 55 | if (ST.is64bit()) { |
| 56 | // 32-bit private, local, and region pointers. 64-bit global and constant. |
| 57 | Ret += "-p1:64:64-p2:64:64-p3:32:32-p4:32:32-p5:64:64"; |
| 58 | } |
Rafael Espindola | ceb0c49 | 2013-12-14 06:13:44 +0000 | [diff] [blame] | 59 | |
Rafael Espindola | e89b414 | 2013-12-16 19:31:14 +0000 | [diff] [blame] | 60 | Ret += "-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256" |
| 61 | "-v512:512-v1024:1024-v2048:2048-n32:64"; |
| 62 | |
Rafael Espindola | 0eb1ebe | 2013-12-16 19:18:57 +0000 | [diff] [blame] | 63 | return Ret; |
Rafael Espindola | ceb0c49 | 2013-12-14 06:13:44 +0000 | [diff] [blame] | 64 | } |
| 65 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 66 | AMDGPUTargetMachine::AMDGPUTargetMachine(const Target &T, StringRef TT, |
| 67 | StringRef CPU, StringRef FS, |
| 68 | TargetOptions Options, |
| 69 | Reloc::Model RM, CodeModel::Model CM, |
| 70 | CodeGenOpt::Level OptLevel |
| 71 | ) |
| 72 | : |
| 73 | LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OptLevel), |
| 74 | Subtarget(TT, CPU, FS), |
Rafael Espindola | ceb0c49 | 2013-12-14 06:13:44 +0000 | [diff] [blame] | 75 | Layout(computeDataLayout(Subtarget)), |
Tom Stellard | af77543 | 2013-10-23 00:44:32 +0000 | [diff] [blame] | 76 | FrameLowering(TargetFrameLowering::StackGrowsUp, |
| 77 | 64 * 16 // Maximum stack alignment (long16) |
| 78 | , 0), |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 79 | IntrinsicInfo(this), |
| 80 | InstrItins(&Subtarget.getInstrItineraryData()) { |
| 81 | // TLInfo uses InstrInfo so it must be initialized after. |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 82 | if (Subtarget.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) { |
Rafael Espindola | 39aca62 | 2013-05-23 03:31:47 +0000 | [diff] [blame] | 83 | InstrInfo.reset(new R600InstrInfo(*this)); |
| 84 | TLInfo.reset(new R600TargetLowering(*this)); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 85 | } else { |
Rafael Espindola | 39aca62 | 2013-05-23 03:31:47 +0000 | [diff] [blame] | 86 | InstrInfo.reset(new SIInstrInfo(*this)); |
| 87 | TLInfo.reset(new SITargetLowering(*this)); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 88 | } |
Vincent Lejeune | 92b0a64 | 2013-12-07 01:49:19 +0000 | [diff] [blame] | 89 | setRequiresStructuredCFG(true); |
Rafael Espindola | 227144c | 2013-05-13 01:16:13 +0000 | [diff] [blame] | 90 | initAsmInfo(); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 91 | } |
| 92 | |
| 93 | AMDGPUTargetMachine::~AMDGPUTargetMachine() { |
| 94 | } |
| 95 | |
| 96 | namespace { |
| 97 | class AMDGPUPassConfig : public TargetPassConfig { |
| 98 | public: |
| 99 | AMDGPUPassConfig(AMDGPUTargetMachine *TM, PassManagerBase &PM) |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 100 | : TargetPassConfig(TM, PM) {} |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 101 | |
| 102 | AMDGPUTargetMachine &getAMDGPUTargetMachine() const { |
| 103 | return getTM<AMDGPUTargetMachine>(); |
| 104 | } |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 105 | |
Craig Topper | 5656db4 | 2014-04-29 07:57:24 +0000 | [diff] [blame] | 106 | ScheduleDAGInstrs * |
| 107 | createMachineScheduler(MachineSchedContext *C) const override { |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 108 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
| 109 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) |
| 110 | return createR600MachineScheduler(C); |
Craig Topper | 062a2ba | 2014-04-25 05:30:21 +0000 | [diff] [blame] | 111 | return nullptr; |
Andrew Trick | 978674b | 2013-09-20 05:14:41 +0000 | [diff] [blame] | 112 | } |
| 113 | |
Craig Topper | 5656db4 | 2014-04-29 07:57:24 +0000 | [diff] [blame] | 114 | bool addPreISel() override; |
| 115 | bool addInstSelector() override; |
| 116 | bool addPreRegAlloc() override; |
| 117 | bool addPostRegAlloc() override; |
| 118 | bool addPreSched2() override; |
| 119 | bool addPreEmitPass() override; |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 120 | }; |
| 121 | } // End of anonymous namespace |
| 122 | |
| 123 | TargetPassConfig *AMDGPUTargetMachine::createPassConfig(PassManagerBase &PM) { |
| 124 | return new AMDGPUPassConfig(this, PM); |
| 125 | } |
| 126 | |
Tom Stellard | 8b1e021 | 2013-07-27 00:01:07 +0000 | [diff] [blame] | 127 | //===----------------------------------------------------------------------===// |
| 128 | // AMDGPU Analysis Pass Setup |
| 129 | //===----------------------------------------------------------------------===// |
| 130 | |
| 131 | void AMDGPUTargetMachine::addAnalysisPasses(PassManagerBase &PM) { |
| 132 | // Add first the target-independent BasicTTI pass, then our AMDGPU pass. This |
| 133 | // allows the AMDGPU pass to delegate to the target independent layer when |
| 134 | // appropriate. |
| 135 | PM.add(createBasicTargetTransformInfoPass(this)); |
| 136 | PM.add(createAMDGPUTargetTransformInfoPass(this)); |
| 137 | } |
| 138 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 139 | bool |
| 140 | AMDGPUPassConfig::addPreISel() { |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 141 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | aa664d9 | 2013-08-06 02:43:45 +0000 | [diff] [blame] | 142 | addPass(createFlattenCFGPass()); |
Tom Stellard | 66df8a2 | 2013-11-18 19:43:44 +0000 | [diff] [blame] | 143 | if (ST.IsIRStructurizerEnabled()) |
Tom Stellard | ed0ceec | 2013-10-10 17:11:12 +0000 | [diff] [blame] | 144 | addPass(createStructurizeCFGPass()); |
Matt Arsenault | d0ce2bd | 2014-02-24 21:01:23 +0000 | [diff] [blame] | 145 | if (ST.getGeneration() >= AMDGPUSubtarget::SOUTHERN_ISLANDS) { |
Vincent Lejeune | 4ee6dd6 | 2013-10-13 17:56:21 +0000 | [diff] [blame] | 146 | addPass(createSinkingPass()); |
Tom Stellard | 9fa1791 | 2013-08-14 23:24:45 +0000 | [diff] [blame] | 147 | addPass(createSITypeRewriter()); |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 148 | addPass(createSIAnnotateControlFlowPass()); |
Vincent Lejeune | d3eed66 | 2013-05-17 16:50:20 +0000 | [diff] [blame] | 149 | } else { |
| 150 | addPass(createR600TextureIntrinsicsReplacer()); |
Tom Stellard | f879435 | 2012-12-19 22:10:31 +0000 | [diff] [blame] | 151 | } |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 152 | return false; |
| 153 | } |
| 154 | |
| 155 | bool AMDGPUPassConfig::addInstSelector() { |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 156 | addPass(createAMDGPUISelDag(getAMDGPUTargetMachine())); |
Tom Stellard | 1bd8072 | 2014-04-30 15:31:33 +0000 | [diff] [blame^] | 157 | addPass(createSILowerI1CopiesPass()); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 158 | return false; |
| 159 | } |
| 160 | |
| 161 | bool AMDGPUPassConfig::addPreRegAlloc() { |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 162 | addPass(createAMDGPUConvertToISAPass(*TM)); |
Vincent Lejeune | dec1875 | 2013-06-05 21:38:04 +0000 | [diff] [blame] | 163 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 164 | |
| 165 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) { |
Vincent Lejeune | dec1875 | 2013-06-05 21:38:04 +0000 | [diff] [blame] | 166 | addPass(createR600VectorRegMerger(*TM)); |
Tom Stellard | 2f7cdda | 2013-08-06 23:08:28 +0000 | [diff] [blame] | 167 | } else { |
| 168 | addPass(createSIFixSGPRCopiesPass(*TM)); |
Tom Stellard | 1583409 | 2014-03-21 15:51:57 +0000 | [diff] [blame] | 169 | // SIFixSGPRCopies can generate a lot of duplicate instructions, |
| 170 | // so we need to run MachineCSE afterwards. |
| 171 | addPass(&MachineCSEID); |
Vincent Lejeune | dec1875 | 2013-06-05 21:38:04 +0000 | [diff] [blame] | 172 | } |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 173 | return false; |
| 174 | } |
| 175 | |
| 176 | bool AMDGPUPassConfig::addPostRegAlloc() { |
Tom Stellard | c4cabef | 2013-01-18 21:15:53 +0000 | [diff] [blame] | 177 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
| 178 | |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 179 | if (ST.getGeneration() > AMDGPUSubtarget::NORTHERN_ISLANDS) { |
Tom Stellard | c4cabef | 2013-01-18 21:15:53 +0000 | [diff] [blame] | 180 | addPass(createSIInsertWaits(*TM)); |
| 181 | } |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 182 | return false; |
| 183 | } |
| 184 | |
| 185 | bool AMDGPUPassConfig::addPreSched2() { |
Vincent Lejeune | ce49974 | 2013-07-09 15:03:33 +0000 | [diff] [blame] | 186 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 187 | |
Vincent Lejeune | a4da6fb | 2013-10-01 19:32:58 +0000 | [diff] [blame] | 188 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) |
Tom Stellard | 1de5582 | 2013-12-11 17:51:41 +0000 | [diff] [blame] | 189 | addPass(createR600EmitClauseMarkers()); |
Tom Stellard | 783893a | 2013-11-18 19:43:33 +0000 | [diff] [blame] | 190 | if (ST.isIfCvtEnabled()) |
| 191 | addPass(&IfConverterID); |
Vincent Lejeune | a4da6fb | 2013-10-01 19:32:58 +0000 | [diff] [blame] | 192 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) |
| 193 | addPass(createR600ClauseMergePass(*TM)); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 194 | return false; |
| 195 | } |
| 196 | |
| 197 | bool AMDGPUPassConfig::addPreEmitPass() { |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 198 | const AMDGPUSubtarget &ST = TM->getSubtarget<AMDGPUSubtarget>(); |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 199 | if (ST.getGeneration() <= AMDGPUSubtarget::NORTHERN_ISLANDS) { |
Tom Stellard | f2ba972 | 2013-12-11 17:51:47 +0000 | [diff] [blame] | 200 | addPass(createAMDGPUCFGStructurizerPass()); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 201 | addPass(createR600ExpandSpecialInstrsPass(*TM)); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 202 | addPass(&FinalizeMachineBundlesID); |
Vincent Lejeune | 147700b | 2013-04-30 00:14:27 +0000 | [diff] [blame] | 203 | addPass(createR600Packetizer(*TM)); |
| 204 | addPass(createR600ControlFlowFinalizer(*TM)); |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 205 | } else { |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 206 | addPass(createSILowerControlFlowPass(*TM)); |
| 207 | } |
| 208 | |
| 209 | return false; |
| 210 | } |