Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 1 | //===-- AArch64TargetMachine.cpp - Define TargetMachine for AArch64 -------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // |
| 11 | //===----------------------------------------------------------------------===// |
| 12 | |
| 13 | #include "AArch64.h" |
| 14 | #include "AArch64TargetMachine.h" |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 15 | #include "llvm/CodeGen/Passes.h" |
Arnaud A. de Grandmaison | c75dbbb | 2014-09-10 14:06:10 +0000 | [diff] [blame] | 16 | #include "llvm/CodeGen/RegAllocRegistry.h" |
Benjamin Kramer | 1f8930e | 2014-07-25 11:42:14 +0000 | [diff] [blame] | 17 | #include "llvm/PassManager.h" |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 18 | #include "llvm/Support/CommandLine.h" |
| 19 | #include "llvm/Support/TargetRegistry.h" |
| 20 | #include "llvm/Target/TargetOptions.h" |
| 21 | #include "llvm/Transforms/Scalar.h" |
| 22 | using namespace llvm; |
| 23 | |
| 24 | static cl::opt<bool> |
| 25 | EnableCCMP("aarch64-ccmp", cl::desc("Enable the CCMP formation pass"), |
| 26 | cl::init(true), cl::Hidden); |
| 27 | |
Gerolf Hoflehner | 97c383b | 2014-08-07 21:40:58 +0000 | [diff] [blame] | 28 | static cl::opt<bool> EnableMCR("aarch64-mcr", |
| 29 | cl::desc("Enable the machine combiner pass"), |
| 30 | cl::init(true), cl::Hidden); |
| 31 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 32 | static cl::opt<bool> |
| 33 | EnableStPairSuppress("aarch64-stp-suppress", cl::desc("Suppress STP for AArch64"), |
| 34 | cl::init(true), cl::Hidden); |
| 35 | |
| 36 | static cl::opt<bool> |
| 37 | EnableAdvSIMDScalar("aarch64-simd-scalar", cl::desc("Enable use of AdvSIMD scalar" |
| 38 | " integer instructions"), cl::init(false), cl::Hidden); |
| 39 | |
| 40 | static cl::opt<bool> |
| 41 | EnablePromoteConstant("aarch64-promote-const", cl::desc("Enable the promote " |
| 42 | "constant pass"), cl::init(true), cl::Hidden); |
| 43 | |
| 44 | static cl::opt<bool> |
| 45 | EnableCollectLOH("aarch64-collect-loh", cl::desc("Enable the pass that emits the" |
| 46 | " linker optimization hints (LOH)"), cl::init(true), |
| 47 | cl::Hidden); |
| 48 | |
| 49 | static cl::opt<bool> |
| 50 | EnableDeadRegisterElimination("aarch64-dead-def-elimination", cl::Hidden, |
| 51 | cl::desc("Enable the pass that removes dead" |
| 52 | " definitons and replaces stores to" |
| 53 | " them with stores to the zero" |
| 54 | " register"), |
| 55 | cl::init(true)); |
| 56 | |
| 57 | static cl::opt<bool> |
| 58 | EnableLoadStoreOpt("aarch64-load-store-opt", cl::desc("Enable the load/store pair" |
| 59 | " optimization pass"), cl::init(true), cl::Hidden); |
| 60 | |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 61 | static cl::opt<bool> |
| 62 | EnableAtomicTidy("aarch64-atomic-cfg-tidy", cl::Hidden, |
| 63 | cl::desc("Run SimplifyCFG after expanding atomic operations" |
| 64 | " to make use of cmpxchg flow-based information"), |
| 65 | cl::init(true)); |
| 66 | |
James Molloy | 9991794 | 2014-08-06 13:31:32 +0000 | [diff] [blame] | 67 | static cl::opt<bool> |
| 68 | EnableEarlyIfConversion("aarch64-enable-early-ifcvt", cl::Hidden, |
| 69 | cl::desc("Run early if-conversion"), |
| 70 | cl::init(true)); |
| 71 | |
Jiangning Liu | 1a486da | 2014-09-05 02:55:24 +0000 | [diff] [blame] | 72 | static cl::opt<bool> |
| 73 | EnableCondOpt("aarch64-condopt", |
| 74 | cl::desc("Enable the condition optimizer pass"), |
| 75 | cl::init(true), cl::Hidden); |
| 76 | |
Arnaud A. de Grandmaison | c75dbbb | 2014-09-10 14:06:10 +0000 | [diff] [blame] | 77 | static cl::opt<bool> |
| 78 | EnablePBQP("aarch64-pbqp", cl::Hidden, |
| 79 | cl::desc("Use PBQP register allocator (experimental)"), |
| 80 | cl::init(false)); |
James Molloy | 9991794 | 2014-08-06 13:31:32 +0000 | [diff] [blame] | 81 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 82 | extern "C" void LLVMInitializeAArch64Target() { |
| 83 | // Register the target. |
| 84 | RegisterTargetMachine<AArch64leTargetMachine> X(TheAArch64leTarget); |
| 85 | RegisterTargetMachine<AArch64beTargetMachine> Y(TheAArch64beTarget); |
Tim Northover | 35910d7 | 2014-07-23 12:58:11 +0000 | [diff] [blame] | 86 | RegisterTargetMachine<AArch64leTargetMachine> Z(TheARM64Target); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 87 | } |
| 88 | |
| 89 | /// TargetMachine ctor - Create an AArch64 architecture model. |
| 90 | /// |
| 91 | AArch64TargetMachine::AArch64TargetMachine(const Target &T, StringRef TT, |
| 92 | StringRef CPU, StringRef FS, |
| 93 | const TargetOptions &Options, |
| 94 | Reloc::Model RM, CodeModel::Model CM, |
| 95 | CodeGenOpt::Level OL, |
| 96 | bool LittleEndian) |
| 97 | : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL), |
Arnaud A. de Grandmaison | c75dbbb | 2014-09-10 14:06:10 +0000 | [diff] [blame] | 98 | Subtarget(TT, CPU, FS, *this, LittleEndian), |
| 99 | usingPBQP(false) { |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 100 | initAsmInfo(); |
Arnaud A. de Grandmaison | c75dbbb | 2014-09-10 14:06:10 +0000 | [diff] [blame] | 101 | |
| 102 | if (EnablePBQP && Subtarget.isCortexA57() && OL != CodeGenOpt::None) { |
| 103 | usingPBQP = true; |
| 104 | RegisterRegAlloc::setDefault(createAArch64A57PBQPRegAlloc); |
| 105 | } |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 106 | } |
| 107 | |
| 108 | void AArch64leTargetMachine::anchor() { } |
| 109 | |
| 110 | AArch64leTargetMachine:: |
| 111 | AArch64leTargetMachine(const Target &T, StringRef TT, |
| 112 | StringRef CPU, StringRef FS, const TargetOptions &Options, |
| 113 | Reloc::Model RM, CodeModel::Model CM, |
| 114 | CodeGenOpt::Level OL) |
| 115 | : AArch64TargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, true) {} |
| 116 | |
| 117 | void AArch64beTargetMachine::anchor() { } |
| 118 | |
| 119 | AArch64beTargetMachine:: |
| 120 | AArch64beTargetMachine(const Target &T, StringRef TT, |
| 121 | StringRef CPU, StringRef FS, const TargetOptions &Options, |
| 122 | Reloc::Model RM, CodeModel::Model CM, |
| 123 | CodeGenOpt::Level OL) |
| 124 | : AArch64TargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, false) {} |
| 125 | |
| 126 | namespace { |
| 127 | /// AArch64 Code Generator Pass Configuration Options. |
| 128 | class AArch64PassConfig : public TargetPassConfig { |
| 129 | public: |
| 130 | AArch64PassConfig(AArch64TargetMachine *TM, PassManagerBase &PM) |
Chad Rosier | 486e087 | 2014-09-12 17:40:39 +0000 | [diff] [blame] | 131 | : TargetPassConfig(TM, PM) { |
Chad Rosier | 347ed4e | 2014-09-12 22:17:28 +0000 | [diff] [blame] | 132 | if (TM->getOptLevel() != CodeGenOpt::None) |
| 133 | substitutePass(&PostRASchedulerID, &PostMachineSchedulerID); |
Chad Rosier | 486e087 | 2014-09-12 17:40:39 +0000 | [diff] [blame] | 134 | } |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 135 | |
| 136 | AArch64TargetMachine &getAArch64TargetMachine() const { |
| 137 | return getTM<AArch64TargetMachine>(); |
| 138 | } |
| 139 | |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 140 | void addIRPasses() override; |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 141 | bool addPreISel() override; |
| 142 | bool addInstSelector() override; |
| 143 | bool addILPOpts() override; |
| 144 | bool addPreRegAlloc() override; |
| 145 | bool addPostRegAlloc() override; |
| 146 | bool addPreSched2() override; |
| 147 | bool addPreEmitPass() override; |
| 148 | }; |
| 149 | } // namespace |
| 150 | |
| 151 | void AArch64TargetMachine::addAnalysisPasses(PassManagerBase &PM) { |
| 152 | // Add first the target-independent BasicTTI pass, then our AArch64 pass. This |
| 153 | // allows the AArch64 pass to delegate to the target independent layer when |
| 154 | // appropriate. |
| 155 | PM.add(createBasicTargetTransformInfoPass(this)); |
| 156 | PM.add(createAArch64TargetTransformInfoPass(this)); |
| 157 | } |
| 158 | |
| 159 | TargetPassConfig *AArch64TargetMachine::createPassConfig(PassManagerBase &PM) { |
| 160 | return new AArch64PassConfig(this, PM); |
| 161 | } |
| 162 | |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 163 | void AArch64PassConfig::addIRPasses() { |
| 164 | // Always expand atomic operations, we don't deal with atomicrmw or cmpxchg |
| 165 | // ourselves. |
Robin Morisset | 59c23cd | 2014-08-21 21:50:01 +0000 | [diff] [blame] | 166 | addPass(createAtomicExpandPass(TM)); |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 167 | |
| 168 | // Cmpxchg instructions are often used with a subsequent comparison to |
| 169 | // determine whether it succeeded. We can exploit existing control-flow in |
| 170 | // ldrex/strex loops to simplify this, but it needs tidying up. |
| 171 | if (TM->getOptLevel() != CodeGenOpt::None && EnableAtomicTidy) |
| 172 | addPass(createCFGSimplificationPass()); |
| 173 | |
| 174 | TargetPassConfig::addIRPasses(); |
| 175 | } |
| 176 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 177 | // Pass Pipeline Configuration |
| 178 | bool AArch64PassConfig::addPreISel() { |
| 179 | // Run promote constant before global merge, so that the promoted constants |
| 180 | // get a chance to be merged |
| 181 | if (TM->getOptLevel() != CodeGenOpt::None && EnablePromoteConstant) |
| 182 | addPass(createAArch64PromoteConstantPass()); |
| 183 | if (TM->getOptLevel() != CodeGenOpt::None) |
| 184 | addPass(createGlobalMergePass(TM)); |
Duncan P. N. Exon Smith | de58870 | 2014-07-02 18:17:40 +0000 | [diff] [blame] | 185 | if (TM->getOptLevel() != CodeGenOpt::None) |
| 186 | addPass(createAArch64AddressTypePromotionPass()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 187 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 188 | return false; |
| 189 | } |
| 190 | |
| 191 | bool AArch64PassConfig::addInstSelector() { |
| 192 | addPass(createAArch64ISelDag(getAArch64TargetMachine(), getOptLevel())); |
| 193 | |
| 194 | // For ELF, cleanup any local-dynamic TLS accesses (i.e. combine as many |
| 195 | // references to _TLS_MODULE_BASE_ as possible. |
| 196 | if (TM->getSubtarget<AArch64Subtarget>().isTargetELF() && |
| 197 | getOptLevel() != CodeGenOpt::None) |
| 198 | addPass(createAArch64CleanupLocalDynamicTLSPass()); |
| 199 | |
| 200 | return false; |
| 201 | } |
| 202 | |
| 203 | bool AArch64PassConfig::addILPOpts() { |
Jiangning Liu | 1a486da | 2014-09-05 02:55:24 +0000 | [diff] [blame] | 204 | if (EnableCondOpt) |
| 205 | addPass(createAArch64ConditionOptimizerPass()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 206 | if (EnableCCMP) |
| 207 | addPass(createAArch64ConditionalCompares()); |
Gerolf Hoflehner | 97c383b | 2014-08-07 21:40:58 +0000 | [diff] [blame] | 208 | if (EnableMCR) |
| 209 | addPass(&MachineCombinerID); |
James Molloy | 9991794 | 2014-08-06 13:31:32 +0000 | [diff] [blame] | 210 | if (EnableEarlyIfConversion) |
| 211 | addPass(&EarlyIfConverterID); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 212 | if (EnableStPairSuppress) |
| 213 | addPass(createAArch64StorePairSuppressPass()); |
| 214 | return true; |
| 215 | } |
| 216 | |
| 217 | bool AArch64PassConfig::addPreRegAlloc() { |
| 218 | // Use AdvSIMD scalar instructions whenever profitable. |
Quentin Colombet | 0c740d4 | 2014-08-21 18:10:07 +0000 | [diff] [blame] | 219 | if (TM->getOptLevel() != CodeGenOpt::None && EnableAdvSIMDScalar) { |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 220 | addPass(createAArch64AdvSIMDScalar()); |
Quentin Colombet | 0c740d4 | 2014-08-21 18:10:07 +0000 | [diff] [blame] | 221 | // The AdvSIMD pass may produce copies that can be rewritten to |
| 222 | // be register coaleascer friendly. |
| 223 | addPass(&PeepholeOptimizerID); |
| 224 | } |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 225 | return true; |
| 226 | } |
| 227 | |
| 228 | bool AArch64PassConfig::addPostRegAlloc() { |
| 229 | // Change dead register definitions to refer to the zero register. |
| 230 | if (TM->getOptLevel() != CodeGenOpt::None && EnableDeadRegisterElimination) |
| 231 | addPass(createAArch64DeadRegisterDefinitions()); |
James Molloy | 3feea9c | 2014-08-08 12:33:21 +0000 | [diff] [blame] | 232 | if (TM->getOptLevel() != CodeGenOpt::None && |
Arnaud A. de Grandmaison | c75dbbb | 2014-09-10 14:06:10 +0000 | [diff] [blame] | 233 | TM->getSubtarget<AArch64Subtarget>().isCortexA57() && |
| 234 | !static_cast<const AArch64TargetMachine *>(TM)->isPBQPUsed()) |
James Molloy | 3feea9c | 2014-08-08 12:33:21 +0000 | [diff] [blame] | 235 | // Improve performance for some FP/SIMD code for A57. |
| 236 | addPass(createAArch64A57FPLoadBalancing()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 237 | return true; |
| 238 | } |
| 239 | |
| 240 | bool AArch64PassConfig::addPreSched2() { |
| 241 | // Expand some pseudo instructions to allow proper scheduling. |
| 242 | addPass(createAArch64ExpandPseudoPass()); |
| 243 | // Use load/store pair instructions when possible. |
| 244 | if (TM->getOptLevel() != CodeGenOpt::None && EnableLoadStoreOpt) |
| 245 | addPass(createAArch64LoadStoreOptimizationPass()); |
| 246 | return true; |
| 247 | } |
| 248 | |
| 249 | bool AArch64PassConfig::addPreEmitPass() { |
| 250 | // Relax conditional branch instructions if they're otherwise out of |
| 251 | // range of their destination. |
| 252 | addPass(createAArch64BranchRelaxation()); |
| 253 | if (TM->getOptLevel() != CodeGenOpt::None && EnableCollectLOH && |
| 254 | TM->getSubtarget<AArch64Subtarget>().isTargetMachO()) |
| 255 | addPass(createAArch64CollectLOHPass()); |
| 256 | return true; |
| 257 | } |