Nick Lewycky | f7a3c50 | 2010-09-07 18:14:24 +0000 | [diff] [blame] | 1 | //===-- PTXTargetMachine.cpp - Define TargetMachine for PTX ---------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // Top-level implementation for the PTX target. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | #include "PTX.h" |
| 15 | #include "PTXTargetMachine.h" |
Eric Christopher | 50880d0 | 2010-09-18 18:52:28 +0000 | [diff] [blame] | 16 | #include "llvm/PassManager.h" |
Justin Holewinski | 40466cc | 2011-09-22 16:45:37 +0000 | [diff] [blame] | 17 | #include "llvm/Analysis/Passes.h" |
| 18 | #include "llvm/Analysis/Verifier.h" |
| 19 | #include "llvm/Assembly/PrintModulePass.h" |
| 20 | #include "llvm/ADT/OwningPtr.h" |
| 21 | #include "llvm/CodeGen/AsmPrinter.h" |
| 22 | #include "llvm/CodeGen/MachineFunctionAnalysis.h" |
| 23 | #include "llvm/CodeGen/MachineModuleInfo.h" |
| 24 | #include "llvm/CodeGen/Passes.h" |
| 25 | #include "llvm/MC/MCAsmInfo.h" |
| 26 | #include "llvm/MC/MCInstrInfo.h" |
| 27 | #include "llvm/MC/MCStreamer.h" |
| 28 | #include "llvm/MC/MCSubtargetInfo.h" |
Evan Cheng | 3e74d6f | 2011-08-24 18:08:43 +0000 | [diff] [blame] | 29 | #include "llvm/Support/TargetRegistry.h" |
Che-Liang Chiou | f48817c | 2011-03-02 07:36:48 +0000 | [diff] [blame] | 30 | #include "llvm/Support/raw_ostream.h" |
Justin Holewinski | 40466cc | 2011-09-22 16:45:37 +0000 | [diff] [blame] | 31 | #include "llvm/Target/TargetData.h" |
| 32 | #include "llvm/Target/TargetInstrInfo.h" |
| 33 | #include "llvm/Target/TargetLowering.h" |
| 34 | #include "llvm/Target/TargetLoweringObjectFile.h" |
| 35 | #include "llvm/Target/TargetMachine.h" |
| 36 | #include "llvm/Target/TargetOptions.h" |
| 37 | #include "llvm/Target/TargetRegisterInfo.h" |
| 38 | #include "llvm/Target/TargetSubtargetInfo.h" |
| 39 | #include "llvm/Transforms/Scalar.h" |
| 40 | #include "llvm/Support/Debug.h" |
| 41 | #include "llvm/Support/TargetRegistry.h" |
| 42 | |
Nick Lewycky | f7a3c50 | 2010-09-07 18:14:24 +0000 | [diff] [blame] | 43 | |
| 44 | using namespace llvm; |
| 45 | |
Rafael Espindola | a484f2c | 2010-11-28 14:48:34 +0000 | [diff] [blame] | 46 | namespace llvm { |
| 47 | MCStreamer *createPTXAsmStreamer(MCContext &Ctx, formatted_raw_ostream &OS, |
Rafael Espindola | 89b9372 | 2010-12-10 07:39:47 +0000 | [diff] [blame] | 48 | bool isVerboseAsm, bool useLoc, |
Nick Lewycky | 44d798d | 2011-10-17 23:05:28 +0000 | [diff] [blame] | 49 | bool useCFI, bool useDwarfDirectory, |
Rafael Espindola | a484f2c | 2010-11-28 14:48:34 +0000 | [diff] [blame] | 50 | MCInstPrinter *InstPrint, |
| 51 | MCCodeEmitter *CE, |
Evan Cheng | 78c10ee | 2011-07-25 23:24:55 +0000 | [diff] [blame] | 52 | MCAsmBackend *MAB, |
Bill Wendling | e266ce6 | 2011-06-17 20:55:01 +0000 | [diff] [blame] | 53 | bool ShowInst); |
Rafael Espindola | a484f2c | 2010-11-28 14:48:34 +0000 | [diff] [blame] | 54 | } |
| 55 | |
Eric Christopher | 50880d0 | 2010-09-18 18:52:28 +0000 | [diff] [blame] | 56 | extern "C" void LLVMInitializePTXTarget() { |
Justin Holewinski | e1fee48 | 2011-04-20 15:37:17 +0000 | [diff] [blame] | 57 | |
| 58 | RegisterTargetMachine<PTX32TargetMachine> X(ThePTX32Target); |
| 59 | RegisterTargetMachine<PTX64TargetMachine> Y(ThePTX64Target); |
| 60 | |
Justin Holewinski | e1fee48 | 2011-04-20 15:37:17 +0000 | [diff] [blame] | 61 | TargetRegistry::RegisterAsmStreamer(ThePTX32Target, createPTXAsmStreamer); |
| 62 | TargetRegistry::RegisterAsmStreamer(ThePTX64Target, createPTXAsmStreamer); |
Nick Lewycky | f7a3c50 | 2010-09-07 18:14:24 +0000 | [diff] [blame] | 63 | } |
| 64 | |
namespace {
  // Data layout description strings for the two PTX targets.  The
  // PTXTargetMachine constructor selects one of them based on its is64Bit
  // argument.  The strings differ only in the pointer specification
  // (p:32:32 versus p:64:64).
  //
  // The pointers themselves are const as well as the characters they point
  // to: these are fixed tables and must never be reseated at run time.
  const char *const DataLayout32 =
    "e-p:32:32-i64:32:32-f64:32:32-v128:32:128-v64:32:64-n32:64";
  const char *const DataLayout64 =
    "e-p:64:64-i64:32:32-f64:32:32-v128:32:128-v64:32:64-n32:64";
}
| 71 | |
Anton Korobeynikov | 16c29b5 | 2011-01-10 12:39:04 +0000 | [diff] [blame] | 72 | // DataLayout and FrameLowering are filled with dummy data |
Nick Lewycky | f7a3c50 | 2010-09-07 18:14:24 +0000 | [diff] [blame] | 73 | PTXTargetMachine::PTXTargetMachine(const Target &T, |
Evan Cheng | 34ad6db | 2011-07-20 07:51:56 +0000 | [diff] [blame] | 74 | StringRef TT, StringRef CPU, StringRef FS, |
Nick Lewycky | 8a8d479 | 2011-12-02 22:16:29 +0000 | [diff] [blame] | 75 | const TargetOptions &Options, |
Evan Cheng | 34ad6db | 2011-07-20 07:51:56 +0000 | [diff] [blame] | 76 | Reloc::Model RM, CodeModel::Model CM, |
Evan Cheng | b95fc31 | 2011-11-16 08:38:26 +0000 | [diff] [blame] | 77 | CodeGenOpt::Level OL, |
Evan Cheng | 34ad6db | 2011-07-20 07:51:56 +0000 | [diff] [blame] | 78 | bool is64Bit) |
Nick Lewycky | 8a8d479 | 2011-12-02 22:16:29 +0000 | [diff] [blame] | 79 | : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL), |
Justin Holewinski | e1fee48 | 2011-04-20 15:37:17 +0000 | [diff] [blame] | 80 | DataLayout(is64Bit ? DataLayout64 : DataLayout32), |
Evan Cheng | 276365d | 2011-06-30 01:53:36 +0000 | [diff] [blame] | 81 | Subtarget(TT, CPU, FS, is64Bit), |
Anton Korobeynikov | 16c29b5 | 2011-01-10 12:39:04 +0000 | [diff] [blame] | 82 | FrameLowering(Subtarget), |
Che-Liang Chiou | 31c488c | 2011-03-02 07:58:46 +0000 | [diff] [blame] | 83 | InstrInfo(*this), |
Justin Holewinski | bc97f44 | 2011-09-26 18:57:27 +0000 | [diff] [blame] | 84 | TSInfo(*this), |
Che-Liang Chiou | 31c488c | 2011-03-02 07:58:46 +0000 | [diff] [blame] | 85 | TLInfo(*this) { |
Eric Christopher | 50880d0 | 2010-09-18 18:52:28 +0000 | [diff] [blame] | 86 | } |
| 87 | |
David Blaikie | 2d24e2a | 2011-12-20 02:50:00 +0000 | [diff] [blame] | 88 | void PTX32TargetMachine::anchor() { } |
| 89 | |
Evan Cheng | 4396613 | 2011-07-19 06:37:02 +0000 | [diff] [blame] | 90 | PTX32TargetMachine::PTX32TargetMachine(const Target &T, StringRef TT, |
| 91 | StringRef CPU, StringRef FS, |
Nick Lewycky | 8a8d479 | 2011-12-02 22:16:29 +0000 | [diff] [blame] | 92 | const TargetOptions &Options, |
Evan Cheng | b95fc31 | 2011-11-16 08:38:26 +0000 | [diff] [blame] | 93 | Reloc::Model RM, CodeModel::Model CM, |
| 94 | CodeGenOpt::Level OL) |
Nick Lewycky | 8a8d479 | 2011-12-02 22:16:29 +0000 | [diff] [blame] | 95 | : PTXTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, false) { |
Justin Holewinski | e1fee48 | 2011-04-20 15:37:17 +0000 | [diff] [blame] | 96 | } |
| 97 | |
David Blaikie | 2d24e2a | 2011-12-20 02:50:00 +0000 | [diff] [blame] | 98 | void PTX64TargetMachine::anchor() { } |
| 99 | |
Evan Cheng | 4396613 | 2011-07-19 06:37:02 +0000 | [diff] [blame] | 100 | PTX64TargetMachine::PTX64TargetMachine(const Target &T, StringRef TT, |
| 101 | StringRef CPU, StringRef FS, |
Nick Lewycky | 8a8d479 | 2011-12-02 22:16:29 +0000 | [diff] [blame] | 102 | const TargetOptions &Options, |
Evan Cheng | b95fc31 | 2011-11-16 08:38:26 +0000 | [diff] [blame] | 103 | Reloc::Model RM, CodeModel::Model CM, |
| 104 | CodeGenOpt::Level OL) |
Nick Lewycky | 8a8d479 | 2011-12-02 22:16:29 +0000 | [diff] [blame] | 105 | : PTXTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, true) { |
Justin Holewinski | e1fee48 | 2011-04-20 15:37:17 +0000 | [diff] [blame] | 106 | } |
| 107 | |
Andrew Trick | 6939fde | 2012-02-06 22:51:15 +0000 | [diff] [blame] | 108 | namespace llvm { |
Andrew Trick | 843ee2e | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 109 | /// PTX Code Generator Pass Configuration Options. |
| 110 | class PTXPassConfig : public TargetPassConfig { |
| 111 | public: |
Andrew Trick | 061efcf | 2012-02-04 02:56:59 +0000 | [diff] [blame] | 112 | PTXPassConfig(PTXTargetMachine *TM, PassManagerBase &PM) |
| 113 | : TargetPassConfig(TM, PM) {} |
Andrew Trick | 843ee2e | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 114 | |
| 115 | PTXTargetMachine &getPTXTargetMachine() const { |
| 116 | return getTM<PTXTargetMachine>(); |
| 117 | } |
| 118 | |
| 119 | bool addInstSelector(); |
Andrew Trick | 1e9bcb3 | 2012-02-10 04:10:40 +0000 | [diff] [blame] | 120 | FunctionPass *createTargetRegisterAllocator(bool); |
| 121 | void addOptimizedRegAlloc(FunctionPass *RegAllocPass); |
Andrew Trick | 843ee2e | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 122 | bool addPostRegAlloc(); |
Andrew Trick | 1e9bcb3 | 2012-02-10 04:10:40 +0000 | [diff] [blame] | 123 | void addMachineLateOptimization(); |
| 124 | bool addPreEmitPass(); |
Andrew Trick | 843ee2e | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 125 | }; |
| 126 | } // namespace |
| 127 | |
Andrew Trick | 061efcf | 2012-02-04 02:56:59 +0000 | [diff] [blame] | 128 | TargetPassConfig *PTXTargetMachine::createPassConfig(PassManagerBase &PM) { |
| 129 | return new PTXPassConfig(this, PM); |
Andrew Trick | 843ee2e | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 130 | } |
| 131 | |
| 132 | bool PTXPassConfig::addInstSelector() { |
| 133 | PM.add(createPTXISelDag(getPTXTargetMachine(), getOptLevel())); |
Che-Liang Chiou | ad83c1d | 2011-01-01 10:50:37 +0000 | [diff] [blame] | 134 | return false; |
| 135 | } |
| 136 | |
Andrew Trick | 1e9bcb3 | 2012-02-10 04:10:40 +0000 | [diff] [blame] | 137 | FunctionPass *PTXPassConfig::createTargetRegisterAllocator(bool /*Optimized*/) { |
| 138 | return createPTXRegisterAllocator(); |
| 139 | } |
| 140 | |
| 141 | // Modify the optimized compilation path to bypass optimized register alloction. |
| 142 | void PTXPassConfig::addOptimizedRegAlloc(FunctionPass *RegAllocPass) { |
| 143 | addFastRegAlloc(RegAllocPass); |
| 144 | } |
| 145 | |
Andrew Trick | 843ee2e | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 146 | bool PTXPassConfig::addPostRegAlloc() { |
Che-Liang Chiou | ad83c1d | 2011-01-01 10:50:37 +0000 | [diff] [blame] | 147 | // PTXMFInfoExtract must after register allocation! |
Andrew Trick | 843ee2e | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 148 | //PM.add(createPTXMFInfoExtract(getPTXTargetMachine())); |
Eric Christopher | 50880d0 | 2010-09-18 18:52:28 +0000 | [diff] [blame] | 149 | return false; |
Nick Lewycky | f7a3c50 | 2010-09-07 18:14:24 +0000 | [diff] [blame] | 150 | } |
Justin Holewinski | 40466cc | 2011-09-22 16:45:37 +0000 | [diff] [blame] | 151 | |
Andrew Trick | 1e9bcb3 | 2012-02-10 04:10:40 +0000 | [diff] [blame] | 152 | /// Add passes that optimize machine instructions after register allocation. |
| 153 | void PTXPassConfig::addMachineLateOptimization() { |
Andrew Trick | 5e108ee | 2012-02-15 03:21:47 +0000 | [diff] [blame^] | 154 | if (addPass(BranchFolderPassID) != &NoPassID) |
| 155 | printNoVerify("After BranchFolding"); |
Justin Holewinski | 40466cc | 2011-09-22 16:45:37 +0000 | [diff] [blame] | 156 | |
Andrew Trick | 5e108ee | 2012-02-15 03:21:47 +0000 | [diff] [blame^] | 157 | if (addPass(TailDuplicateID) != &NoPassID) |
| 158 | printNoVerify("After TailDuplicate"); |
Justin Holewinski | 40466cc | 2011-09-22 16:45:37 +0000 | [diff] [blame] | 159 | } |
| 160 | |
Andrew Trick | 1e9bcb3 | 2012-02-10 04:10:40 +0000 | [diff] [blame] | 161 | bool PTXPassConfig::addPreEmitPass() { |
Andrew Trick | 843ee2e | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 162 | PM.add(createPTXMFInfoExtract(getPTXTargetMachine(), getOptLevel())); |
| 163 | PM.add(createPTXFPRoundingModePass(getPTXTargetMachine(), getOptLevel())); |
Andrew Trick | 1e9bcb3 | 2012-02-10 04:10:40 +0000 | [diff] [blame] | 164 | return true; |
Justin Holewinski | 40466cc | 2011-09-22 16:45:37 +0000 | [diff] [blame] | 165 | } |