Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 1 | //===-- AArch64TargetMachine.cpp - Define TargetMachine for AArch64 -------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // |
| 11 | //===----------------------------------------------------------------------===// |
| 12 | |
| 13 | #include "AArch64.h" |
| 14 | #include "AArch64TargetMachine.h" |
Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 15 | #include "AArch64TargetObjectFile.h" |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 16 | #include "llvm/CodeGen/Passes.h" |
Arnaud A. de Grandmaison | c75dbbb | 2014-09-10 14:06:10 +0000 | [diff] [blame] | 17 | #include "llvm/CodeGen/RegAllocRegistry.h" |
Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 18 | #include "llvm/IR/Function.h" |
Benjamin Kramer | 1f8930e | 2014-07-25 11:42:14 +0000 | [diff] [blame] | 19 | #include "llvm/PassManager.h" |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 20 | #include "llvm/Support/CommandLine.h" |
| 21 | #include "llvm/Support/TargetRegistry.h" |
| 22 | #include "llvm/Target/TargetOptions.h" |
| 23 | #include "llvm/Transforms/Scalar.h" |
| 24 | using namespace llvm; |
| 25 | |
| 26 | static cl::opt<bool> |
| 27 | EnableCCMP("aarch64-ccmp", cl::desc("Enable the CCMP formation pass"), |
| 28 | cl::init(true), cl::Hidden); |
| 29 | |
Gerolf Hoflehner | 97c383b | 2014-08-07 21:40:58 +0000 | [diff] [blame] | 30 | static cl::opt<bool> EnableMCR("aarch64-mcr", |
| 31 | cl::desc("Enable the machine combiner pass"), |
| 32 | cl::init(true), cl::Hidden); |
| 33 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 34 | static cl::opt<bool> |
| 35 | EnableStPairSuppress("aarch64-stp-suppress", cl::desc("Suppress STP for AArch64"), |
| 36 | cl::init(true), cl::Hidden); |
| 37 | |
| 38 | static cl::opt<bool> |
| 39 | EnableAdvSIMDScalar("aarch64-simd-scalar", cl::desc("Enable use of AdvSIMD scalar" |
| 40 | " integer instructions"), cl::init(false), cl::Hidden); |
| 41 | |
| 42 | static cl::opt<bool> |
| 43 | EnablePromoteConstant("aarch64-promote-const", cl::desc("Enable the promote " |
| 44 | "constant pass"), cl::init(true), cl::Hidden); |
| 45 | |
| 46 | static cl::opt<bool> |
| 47 | EnableCollectLOH("aarch64-collect-loh", cl::desc("Enable the pass that emits the" |
| 48 | " linker optimization hints (LOH)"), cl::init(true), |
| 49 | cl::Hidden); |
| 50 | |
| 51 | static cl::opt<bool> |
| 52 | EnableDeadRegisterElimination("aarch64-dead-def-elimination", cl::Hidden, |
| 53 | cl::desc("Enable the pass that removes dead" |
| 54 | " definitons and replaces stores to" |
| 55 | " them with stores to the zero" |
| 56 | " register"), |
| 57 | cl::init(true)); |
| 58 | |
| 59 | static cl::opt<bool> |
| 60 | EnableLoadStoreOpt("aarch64-load-store-opt", cl::desc("Enable the load/store pair" |
| 61 | " optimization pass"), cl::init(true), cl::Hidden); |
| 62 | |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 63 | static cl::opt<bool> |
| 64 | EnableAtomicTidy("aarch64-atomic-cfg-tidy", cl::Hidden, |
| 65 | cl::desc("Run SimplifyCFG after expanding atomic operations" |
| 66 | " to make use of cmpxchg flow-based information"), |
| 67 | cl::init(true)); |
| 68 | |
James Molloy | 9991794 | 2014-08-06 13:31:32 +0000 | [diff] [blame] | 69 | static cl::opt<bool> |
| 70 | EnableEarlyIfConversion("aarch64-enable-early-ifcvt", cl::Hidden, |
| 71 | cl::desc("Run early if-conversion"), |
| 72 | cl::init(true)); |
| 73 | |
Jiangning Liu | 1a486da | 2014-09-05 02:55:24 +0000 | [diff] [blame] | 74 | static cl::opt<bool> |
| 75 | EnableCondOpt("aarch64-condopt", |
| 76 | cl::desc("Enable the condition optimizer pass"), |
| 77 | cl::init(true), cl::Hidden); |
| 78 | |
Arnaud A. de Grandmaison | c75dbbb | 2014-09-10 14:06:10 +0000 | [diff] [blame] | 79 | static cl::opt<bool> |
Bradley Smith | f2a801d | 2014-10-13 10:12:35 +0000 | [diff] [blame] | 80 | EnableA53Fix835769("aarch64-fix-cortex-a53-835769", cl::Hidden, |
| 81 | cl::desc("Work around Cortex-A53 erratum 835769"), |
| 82 | cl::init(false)); |
| 83 | |
Hao Liu | fd46bea | 2014-11-19 06:39:53 +0000 | [diff] [blame] | 84 | static cl::opt<bool> |
| 85 | EnableGEPOpt("aarch64-gep-opt", cl::Hidden, |
| 86 | cl::desc("Enable optimizations on complex GEPs"), |
| 87 | cl::init(true)); |
| 88 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 89 | extern "C" void LLVMInitializeAArch64Target() { |
| 90 | // Register the target. |
| 91 | RegisterTargetMachine<AArch64leTargetMachine> X(TheAArch64leTarget); |
| 92 | RegisterTargetMachine<AArch64beTargetMachine> Y(TheAArch64beTarget); |
Tim Northover | 35910d7 | 2014-07-23 12:58:11 +0000 | [diff] [blame] | 93 | RegisterTargetMachine<AArch64leTargetMachine> Z(TheARM64Target); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 94 | } |
| 95 | |
Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 96 | //===----------------------------------------------------------------------===// |
| 97 | // AArch64 Lowering public interface. |
| 98 | //===----------------------------------------------------------------------===// |
| 99 | static std::unique_ptr<TargetLoweringObjectFile> createTLOF(const Triple &TT) { |
| 100 | if (TT.isOSBinFormatMachO()) |
| 101 | return make_unique<AArch64_MachoTargetObjectFile>(); |
| 102 | |
| 103 | return make_unique<AArch64_ELFTargetObjectFile>(); |
| 104 | } |
| 105 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 106 | /// TargetMachine ctor - Create an AArch64 architecture model. |
| 107 | /// |
| 108 | AArch64TargetMachine::AArch64TargetMachine(const Target &T, StringRef TT, |
| 109 | StringRef CPU, StringRef FS, |
| 110 | const TargetOptions &Options, |
| 111 | Reloc::Model RM, CodeModel::Model CM, |
| 112 | CodeGenOpt::Level OL, |
| 113 | bool LittleEndian) |
| 114 | : LLVMTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL), |
Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 115 | TLOF(createTLOF(Triple(getTargetTriple()))), |
Arnaud A. de Grandmaison | a61262f | 2014-10-21 20:47:22 +0000 | [diff] [blame] | 116 | Subtarget(TT, CPU, FS, *this, LittleEndian), isLittle(LittleEndian) { |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 117 | initAsmInfo(); |
| 118 | } |
| 119 | |
Reid Kleckner | 357600e | 2014-11-20 23:37:18 +0000 | [diff] [blame] | 120 | AArch64TargetMachine::~AArch64TargetMachine() {} |
| 121 | |
Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 122 | const AArch64Subtarget * |
| 123 | AArch64TargetMachine::getSubtargetImpl(const Function &F) const { |
| 124 | AttributeSet FnAttrs = F.getAttributes(); |
| 125 | Attribute CPUAttr = |
| 126 | FnAttrs.getAttribute(AttributeSet::FunctionIndex, "target-cpu"); |
| 127 | Attribute FSAttr = |
| 128 | FnAttrs.getAttribute(AttributeSet::FunctionIndex, "target-features"); |
| 129 | |
| 130 | std::string CPU = !CPUAttr.hasAttribute(Attribute::None) |
| 131 | ? CPUAttr.getValueAsString().str() |
| 132 | : TargetCPU; |
| 133 | std::string FS = !FSAttr.hasAttribute(Attribute::None) |
| 134 | ? FSAttr.getValueAsString().str() |
| 135 | : TargetFS; |
| 136 | |
| 137 | auto &I = SubtargetMap[CPU + FS]; |
| 138 | if (!I) { |
| 139 | // This needs to be done before we create a new subtarget since any |
| 140 | // creation will depend on the TM and the code generation flags on the |
| 141 | // function that reside in TargetOptions. |
| 142 | resetTargetOptions(F); |
| 143 | I = llvm::make_unique<AArch64Subtarget>(TargetTriple, CPU, FS, *this, isLittle); |
| 144 | } |
| 145 | return I.get(); |
| 146 | } |
| 147 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 148 | void AArch64leTargetMachine::anchor() { } |
| 149 | |
| 150 | AArch64leTargetMachine:: |
| 151 | AArch64leTargetMachine(const Target &T, StringRef TT, |
| 152 | StringRef CPU, StringRef FS, const TargetOptions &Options, |
| 153 | Reloc::Model RM, CodeModel::Model CM, |
| 154 | CodeGenOpt::Level OL) |
| 155 | : AArch64TargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, true) {} |
| 156 | |
| 157 | void AArch64beTargetMachine::anchor() { } |
| 158 | |
| 159 | AArch64beTargetMachine:: |
| 160 | AArch64beTargetMachine(const Target &T, StringRef TT, |
| 161 | StringRef CPU, StringRef FS, const TargetOptions &Options, |
| 162 | Reloc::Model RM, CodeModel::Model CM, |
| 163 | CodeGenOpt::Level OL) |
| 164 | : AArch64TargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, false) {} |
| 165 | |
| 166 | namespace { |
| 167 | /// AArch64 Code Generator Pass Configuration Options. |
| 168 | class AArch64PassConfig : public TargetPassConfig { |
| 169 | public: |
| 170 | AArch64PassConfig(AArch64TargetMachine *TM, PassManagerBase &PM) |
Chad Rosier | 486e087 | 2014-09-12 17:40:39 +0000 | [diff] [blame] | 171 | : TargetPassConfig(TM, PM) { |
Chad Rosier | 347ed4e | 2014-09-12 22:17:28 +0000 | [diff] [blame] | 172 | if (TM->getOptLevel() != CodeGenOpt::None) |
| 173 | substitutePass(&PostRASchedulerID, &PostMachineSchedulerID); |
Chad Rosier | 486e087 | 2014-09-12 17:40:39 +0000 | [diff] [blame] | 174 | } |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 175 | |
| 176 | AArch64TargetMachine &getAArch64TargetMachine() const { |
| 177 | return getTM<AArch64TargetMachine>(); |
| 178 | } |
| 179 | |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 180 | void addIRPasses() override; |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 181 | bool addPreISel() override; |
| 182 | bool addInstSelector() override; |
| 183 | bool addILPOpts() override; |
Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 184 | void addPreRegAlloc() override; |
| 185 | void addPostRegAlloc() override; |
| 186 | void addPreSched2() override; |
| 187 | void addPreEmitPass() override; |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 188 | }; |
| 189 | } // namespace |
| 190 | |
| 191 | void AArch64TargetMachine::addAnalysisPasses(PassManagerBase &PM) { |
| 192 | // Add first the target-independent BasicTTI pass, then our AArch64 pass. This |
| 193 | // allows the AArch64 pass to delegate to the target independent layer when |
| 194 | // appropriate. |
| 195 | PM.add(createBasicTargetTransformInfoPass(this)); |
| 196 | PM.add(createAArch64TargetTransformInfoPass(this)); |
| 197 | } |
| 198 | |
| 199 | TargetPassConfig *AArch64TargetMachine::createPassConfig(PassManagerBase &PM) { |
| 200 | return new AArch64PassConfig(this, PM); |
| 201 | } |
| 202 | |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 203 | void AArch64PassConfig::addIRPasses() { |
| 204 | // Always expand atomic operations, we don't deal with atomicrmw or cmpxchg |
| 205 | // ourselves. |
Robin Morisset | 59c23cd | 2014-08-21 21:50:01 +0000 | [diff] [blame] | 206 | addPass(createAtomicExpandPass(TM)); |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 207 | |
| 208 | // Cmpxchg instructions are often used with a subsequent comparison to |
| 209 | // determine whether it succeeded. We can exploit existing control-flow in |
| 210 | // ldrex/strex loops to simplify this, but it needs tidying up. |
| 211 | if (TM->getOptLevel() != CodeGenOpt::None && EnableAtomicTidy) |
| 212 | addPass(createCFGSimplificationPass()); |
| 213 | |
| 214 | TargetPassConfig::addIRPasses(); |
Hao Liu | fd46bea | 2014-11-19 06:39:53 +0000 | [diff] [blame] | 215 | |
| 216 | if (TM->getOptLevel() == CodeGenOpt::Aggressive && EnableGEPOpt) { |
| 217 | // Call SeparateConstOffsetFromGEP pass to extract constants within indices |
| 218 | // and lower a GEP with multiple indices to either arithmetic operations or |
| 219 | // multiple GEPs with single index. |
| 220 | addPass(createSeparateConstOffsetFromGEPPass(TM, true)); |
| 221 | // Call EarlyCSE pass to find and remove subexpressions in the lowered |
| 222 | // result. |
| 223 | addPass(createEarlyCSEPass()); |
| 224 | // Do loop invariant code motion in case part of the lowered result is |
| 225 | // invariant. |
| 226 | addPass(createLICMPass()); |
| 227 | } |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 228 | } |
| 229 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 230 | // Pass Pipeline Configuration |
| 231 | bool AArch64PassConfig::addPreISel() { |
| 232 | // Run promote constant before global merge, so that the promoted constants |
| 233 | // get a chance to be merged |
| 234 | if (TM->getOptLevel() != CodeGenOpt::None && EnablePromoteConstant) |
| 235 | addPass(createAArch64PromoteConstantPass()); |
| 236 | if (TM->getOptLevel() != CodeGenOpt::None) |
| 237 | addPass(createGlobalMergePass(TM)); |
Duncan P. N. Exon Smith | de58870 | 2014-07-02 18:17:40 +0000 | [diff] [blame] | 238 | if (TM->getOptLevel() != CodeGenOpt::None) |
| 239 | addPass(createAArch64AddressTypePromotionPass()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 240 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 241 | return false; |
| 242 | } |
| 243 | |
| 244 | bool AArch64PassConfig::addInstSelector() { |
| 245 | addPass(createAArch64ISelDag(getAArch64TargetMachine(), getOptLevel())); |
| 246 | |
| 247 | // For ELF, cleanup any local-dynamic TLS accesses (i.e. combine as many |
| 248 | // references to _TLS_MODULE_BASE_ as possible. |
| 249 | if (TM->getSubtarget<AArch64Subtarget>().isTargetELF() && |
| 250 | getOptLevel() != CodeGenOpt::None) |
| 251 | addPass(createAArch64CleanupLocalDynamicTLSPass()); |
| 252 | |
| 253 | return false; |
| 254 | } |
| 255 | |
| 256 | bool AArch64PassConfig::addILPOpts() { |
Jiangning Liu | 1a486da | 2014-09-05 02:55:24 +0000 | [diff] [blame] | 257 | if (EnableCondOpt) |
| 258 | addPass(createAArch64ConditionOptimizerPass()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 259 | if (EnableCCMP) |
| 260 | addPass(createAArch64ConditionalCompares()); |
Gerolf Hoflehner | 97c383b | 2014-08-07 21:40:58 +0000 | [diff] [blame] | 261 | if (EnableMCR) |
| 262 | addPass(&MachineCombinerID); |
James Molloy | 9991794 | 2014-08-06 13:31:32 +0000 | [diff] [blame] | 263 | if (EnableEarlyIfConversion) |
| 264 | addPass(&EarlyIfConverterID); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 265 | if (EnableStPairSuppress) |
| 266 | addPass(createAArch64StorePairSuppressPass()); |
| 267 | return true; |
| 268 | } |
| 269 | |
Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 270 | void AArch64PassConfig::addPreRegAlloc() { |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 271 | // Use AdvSIMD scalar instructions whenever profitable. |
Quentin Colombet | 0c740d4 | 2014-08-21 18:10:07 +0000 | [diff] [blame] | 272 | if (TM->getOptLevel() != CodeGenOpt::None && EnableAdvSIMDScalar) { |
Matthias Braun | b2f2388 | 2014-12-11 23:18:03 +0000 | [diff] [blame] | 273 | addPass(createAArch64AdvSIMDScalar()); |
Quentin Colombet | 0c740d4 | 2014-08-21 18:10:07 +0000 | [diff] [blame] | 274 | // The AdvSIMD pass may produce copies that can be rewritten to |
| 275 | // be register coaleascer friendly. |
| 276 | addPass(&PeepholeOptimizerID); |
| 277 | } |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 278 | } |
| 279 | |
Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 280 | void AArch64PassConfig::addPostRegAlloc() { |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 281 | // Change dead register definitions to refer to the zero register. |
| 282 | if (TM->getOptLevel() != CodeGenOpt::None && EnableDeadRegisterElimination) |
Matthias Braun | b2f2388 | 2014-12-11 23:18:03 +0000 | [diff] [blame] | 283 | addPass(createAArch64DeadRegisterDefinitions()); |
James Molloy | 3feea9c | 2014-08-08 12:33:21 +0000 | [diff] [blame] | 284 | if (TM->getOptLevel() != CodeGenOpt::None && |
Tim Northover | 0091789 | 2014-10-28 01:24:32 +0000 | [diff] [blame] | 285 | (TM->getSubtarget<AArch64Subtarget>().isCortexA53() || |
| 286 | TM->getSubtarget<AArch64Subtarget>().isCortexA57()) && |
Arnaud A. de Grandmaison | a61262f | 2014-10-21 20:47:22 +0000 | [diff] [blame] | 287 | usingDefaultRegAlloc()) |
James Molloy | 3feea9c | 2014-08-08 12:33:21 +0000 | [diff] [blame] | 288 | // Improve performance for some FP/SIMD code for A57. |
| 289 | addPass(createAArch64A57FPLoadBalancing()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 290 | } |
| 291 | |
Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 292 | void AArch64PassConfig::addPreSched2() { |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 293 | // Expand some pseudo instructions to allow proper scheduling. |
Matthias Braun | b2f2388 | 2014-12-11 23:18:03 +0000 | [diff] [blame] | 294 | addPass(createAArch64ExpandPseudoPass()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 295 | // Use load/store pair instructions when possible. |
| 296 | if (TM->getOptLevel() != CodeGenOpt::None && EnableLoadStoreOpt) |
| 297 | addPass(createAArch64LoadStoreOptimizationPass()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 298 | } |
| 299 | |
Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 300 | void AArch64PassConfig::addPreEmitPass() { |
Bradley Smith | f2a801d | 2014-10-13 10:12:35 +0000 | [diff] [blame] | 301 | if (EnableA53Fix835769) |
Matthias Braun | b2f2388 | 2014-12-11 23:18:03 +0000 | [diff] [blame] | 302 | addPass(createAArch64A53Fix835769()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 303 | // Relax conditional branch instructions if they're otherwise out of |
| 304 | // range of their destination. |
Matthias Braun | b2f2388 | 2014-12-11 23:18:03 +0000 | [diff] [blame] | 305 | addPass(createAArch64BranchRelaxation()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 306 | if (TM->getOptLevel() != CodeGenOpt::None && EnableCollectLOH && |
| 307 | TM->getSubtarget<AArch64Subtarget>().isTargetMachO()) |
| 308 | addPass(createAArch64CollectLOHPass()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 309 | } |