Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 1 | //===-- AArch64TargetMachine.cpp - Define TargetMachine for AArch64 -------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // |
| 11 | //===----------------------------------------------------------------------===// |
| 12 | |
Quentin Colombet | 7a43edd | 2017-05-27 01:34:07 +0000 | [diff] [blame] | 13 | #include "AArch64TargetMachine.h" |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 14 | #include "AArch64.h" |
Evandro Menezes | 94edf02 | 2017-02-01 02:54:34 +0000 | [diff] [blame] | 15 | #include "AArch64MacroFusion.h" |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 16 | #include "AArch64Subtarget.h" |
Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 17 | #include "AArch64TargetObjectFile.h" |
Chandler Carruth | 93dcdc4 | 2015-01-31 11:17:59 +0000 | [diff] [blame] | 18 | #include "AArch64TargetTransformInfo.h" |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 19 | #include "MCTargetDesc/AArch64MCTargetDesc.h" |
| 20 | #include "llvm/ADT/STLExtras.h" |
| 21 | #include "llvm/ADT/Triple.h" |
| 22 | #include "llvm/Analysis/TargetTransformInfo.h" |
Quentin Colombet | 846219a | 2016-04-07 21:24:40 +0000 | [diff] [blame] | 23 | #include "llvm/CodeGen/GlobalISel/IRTranslator.h" |
Ahmed Bougacha | 6756a2c | 2016-07-27 14:31:55 +0000 | [diff] [blame] | 24 | #include "llvm/CodeGen/GlobalISel/InstructionSelect.h" |
Tim Northover | 69fa84a | 2016-10-14 22:18:18 +0000 | [diff] [blame] | 25 | #include "llvm/CodeGen/GlobalISel/Legalizer.h" |
Quentin Colombet | 7a43edd | 2017-05-27 01:34:07 +0000 | [diff] [blame] | 26 | #include "llvm/CodeGen/GlobalISel/Localizer.h" |
Quentin Colombet | d413181 | 2016-04-07 20:27:33 +0000 | [diff] [blame] | 27 | #include "llvm/CodeGen/GlobalISel/RegBankSelect.h" |
Matthias Braun | 115efcd | 2016-11-28 20:11:54 +0000 | [diff] [blame] | 28 | #include "llvm/CodeGen/MachineScheduler.h" |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 29 | #include "llvm/CodeGen/Passes.h" |
Matthias Braun | 31d19d4 | 2016-05-10 03:21:59 +0000 | [diff] [blame] | 30 | #include "llvm/CodeGen/TargetPassConfig.h" |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 31 | #include "llvm/IR/Attributes.h" |
Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 32 | #include "llvm/IR/Function.h" |
Eli Friedman | 0917d0c | 2018-11-07 22:30:56 +0000 | [diff] [blame] | 33 | #include "llvm/MC/MCAsmInfo.h" |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 34 | #include "llvm/MC/MCTargetOptions.h" |
| 35 | #include "llvm/Pass.h" |
| 36 | #include "llvm/Support/CodeGen.h" |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 37 | #include "llvm/Support/CommandLine.h" |
| 38 | #include "llvm/Support/TargetRegistry.h" |
David Blaikie | 6054e65 | 2018-03-23 23:58:19 +0000 | [diff] [blame] | 39 | #include "llvm/Target/TargetLoweringObjectFile.h" |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 40 | #include "llvm/Target/TargetOptions.h" |
| 41 | #include "llvm/Transforms/Scalar.h" |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 42 | #include <memory> |
| 43 | #include <string> |
| 44 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 45 | using namespace llvm; |
| 46 | |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 47 | static cl::opt<bool> EnableCCMP("aarch64-enable-ccmp", |
| 48 | cl::desc("Enable the CCMP formation pass"), |
| 49 | cl::init(true), cl::Hidden); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 50 | |
Chad Rosier | 6db9ff6 | 2017-06-23 19:20:12 +0000 | [diff] [blame] | 51 | static cl::opt<bool> |
| 52 | EnableCondBrTuning("aarch64-enable-cond-br-tune", |
| 53 | cl::desc("Enable the conditional branch tuning pass"), |
| 54 | cl::init(true), cl::Hidden); |
| 55 | |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 56 | static cl::opt<bool> EnableMCR("aarch64-enable-mcr", |
Gerolf Hoflehner | 97c383b | 2014-08-07 21:40:58 +0000 | [diff] [blame] | 57 | cl::desc("Enable the machine combiner pass"), |
| 58 | cl::init(true), cl::Hidden); |
| 59 | |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 60 | static cl::opt<bool> EnableStPairSuppress("aarch64-enable-stp-suppress", |
| 61 | cl::desc("Suppress STP for AArch64"), |
| 62 | cl::init(true), cl::Hidden); |
| 63 | |
| 64 | static cl::opt<bool> EnableAdvSIMDScalar( |
| 65 | "aarch64-enable-simd-scalar", |
| 66 | cl::desc("Enable use of AdvSIMD scalar integer instructions"), |
| 67 | cl::init(false), cl::Hidden); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 68 | |
| 69 | static cl::opt<bool> |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 70 | EnablePromoteConstant("aarch64-enable-promote-const", |
| 71 | cl::desc("Enable the promote constant pass"), |
| 72 | cl::init(true), cl::Hidden); |
| 73 | |
| 74 | static cl::opt<bool> EnableCollectLOH( |
| 75 | "aarch64-enable-collect-loh", |
| 76 | cl::desc("Enable the pass that emits the linker optimization hints (LOH)"), |
| 77 | cl::init(true), cl::Hidden); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 78 | |
| 79 | static cl::opt<bool> |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 80 | EnableDeadRegisterElimination("aarch64-enable-dead-defs", cl::Hidden, |
| 81 | cl::desc("Enable the pass that removes dead" |
| 82 | " definitons and replaces stores to" |
| 83 | " them with stores to the zero" |
| 84 | " register"), |
| 85 | cl::init(true)); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 86 | |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 87 | static cl::opt<bool> EnableRedundantCopyElimination( |
| 88 | "aarch64-enable-copyelim", |
| 89 | cl::desc("Enable the redundant copy elimination pass"), cl::init(true), |
| 90 | cl::Hidden); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 91 | |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 92 | static cl::opt<bool> EnableLoadStoreOpt("aarch64-enable-ldst-opt", |
| 93 | cl::desc("Enable the load/store pair" |
| 94 | " optimization pass"), |
| 95 | cl::init(true), cl::Hidden); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 96 | |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 97 | static cl::opt<bool> EnableAtomicTidy( |
| 98 | "aarch64-enable-atomic-cfg-tidy", cl::Hidden, |
| 99 | cl::desc("Run SimplifyCFG after expanding atomic operations" |
| 100 | " to make use of cmpxchg flow-based information"), |
| 101 | cl::init(true)); |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 102 | |
James Molloy | 9991794 | 2014-08-06 13:31:32 +0000 | [diff] [blame] | 103 | static cl::opt<bool> |
| 104 | EnableEarlyIfConversion("aarch64-enable-early-ifcvt", cl::Hidden, |
| 105 | cl::desc("Run early if-conversion"), |
| 106 | cl::init(true)); |
| 107 | |
Jiangning Liu | 1a486da | 2014-09-05 02:55:24 +0000 | [diff] [blame] | 108 | static cl::opt<bool> |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 109 | EnableCondOpt("aarch64-enable-condopt", |
| 110 | cl::desc("Enable the condition optimizer pass"), |
| 111 | cl::init(true), cl::Hidden); |
Jiangning Liu | 1a486da | 2014-09-05 02:55:24 +0000 | [diff] [blame] | 112 | |
Arnaud A. de Grandmaison | c75dbbb | 2014-09-10 14:06:10 +0000 | [diff] [blame] | 113 | static cl::opt<bool> |
Bradley Smith | f2a801d | 2014-10-13 10:12:35 +0000 | [diff] [blame] | 114 | EnableA53Fix835769("aarch64-fix-cortex-a53-835769", cl::Hidden, |
| 115 | cl::desc("Work around Cortex-A53 erratum 835769"), |
| 116 | cl::init(false)); |
| 117 | |
Hao Liu | fd46bea | 2014-11-19 06:39:53 +0000 | [diff] [blame] | 118 | static cl::opt<bool> |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 119 | EnableGEPOpt("aarch64-enable-gep-opt", cl::Hidden, |
| 120 | cl::desc("Enable optimizations on complex GEPs"), |
| 121 | cl::init(false)); |
| 122 | |
| 123 | static cl::opt<bool> |
| 124 | BranchRelaxation("aarch64-enable-branch-relax", cl::Hidden, cl::init(true), |
| 125 | cl::desc("Relax out of range conditional branches")); |
Hao Liu | fd46bea | 2014-11-19 06:39:53 +0000 | [diff] [blame] | 126 | |
Tim Northover | 1c35341 | 2018-10-24 20:19:09 +0000 | [diff] [blame] | 127 | static cl::opt<bool> EnableCompressJumpTables( |
| 128 | "aarch64-enable-compress-jump-tables", cl::Hidden, cl::init(true), |
| 129 | cl::desc("Use smallest entry possible for jump tables")); |
| 130 | |
Ahmed Bougacha | b96444e | 2015-04-11 00:06:36 +0000 | [diff] [blame] | 131 | // FIXME: Unify control over GlobalMerge. |
| 132 | static cl::opt<cl::boolOrDefault> |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 133 | EnableGlobalMerge("aarch64-enable-global-merge", cl::Hidden, |
| 134 | cl::desc("Enable the global merge pass")); |
Ahmed Bougacha | b96444e | 2015-04-11 00:06:36 +0000 | [diff] [blame] | 135 | |
Adam Nemet | 53e758f | 2016-03-18 00:27:29 +0000 | [diff] [blame] | 136 | static cl::opt<bool> |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 137 | EnableLoopDataPrefetch("aarch64-enable-loop-data-prefetch", cl::Hidden, |
Adam Nemet | 53e758f | 2016-03-18 00:27:29 +0000 | [diff] [blame] | 138 | cl::desc("Enable the loop data prefetch pass"), |
Adam Nemet | fb8fbba5 | 2016-03-30 00:21:29 +0000 | [diff] [blame] | 139 | cl::init(true)); |
Adam Nemet | 53e758f | 2016-03-18 00:27:29 +0000 | [diff] [blame] | 140 | |
Ahmed Bougacha | 120ae22 | 2017-03-01 23:33:08 +0000 | [diff] [blame] | 141 | static cl::opt<int> EnableGlobalISelAtO( |
| 142 | "aarch64-enable-global-isel-at-O", cl::Hidden, |
| 143 | cl::desc("Enable GlobalISel at or below an opt level (-1 to disable)"), |
Amara Emerson | 854d10d | 2018-01-02 16:30:47 +0000 | [diff] [blame] | 144 | cl::init(0)); |
Ahmed Bougacha | 120ae22 | 2017-03-01 23:33:08 +0000 | [diff] [blame] | 145 | |
Geoff Berry | b1e8714 | 2017-07-14 21:44:12 +0000 | [diff] [blame] | 146 | static cl::opt<bool> EnableFalkorHWPFFix("aarch64-enable-falkor-hwpf-fix", |
| 147 | cl::init(true), cl::Hidden); |
| 148 | |
Oliver Stannard | 250e5a5 | 2018-10-08 14:04:24 +0000 | [diff] [blame] | 149 | static cl::opt<bool> |
| 150 | EnableBranchTargets("aarch64-enable-branch-targets", cl::Hidden, |
| 151 | cl::desc("Enable the AAcrh64 branch target pass"), |
| 152 | cl::init(true)); |
| 153 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 154 | extern "C" void LLVMInitializeAArch64Target() { |
| 155 | // Register the target. |
Mehdi Amini | f42454b | 2016-10-09 23:00:34 +0000 | [diff] [blame] | 156 | RegisterTargetMachine<AArch64leTargetMachine> X(getTheAArch64leTarget()); |
| 157 | RegisterTargetMachine<AArch64beTargetMachine> Y(getTheAArch64beTarget()); |
| 158 | RegisterTargetMachine<AArch64leTargetMachine> Z(getTheARM64Target()); |
Tim Northover | 5dad9df | 2016-04-01 23:14:52 +0000 | [diff] [blame] | 159 | auto PR = PassRegistry::getPassRegistry(); |
| 160 | initializeGlobalISel(*PR); |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 161 | initializeAArch64A53Fix835769Pass(*PR); |
| 162 | initializeAArch64A57FPLoadBalancingPass(*PR); |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 163 | initializeAArch64AdvSIMDScalarPass(*PR); |
Oliver Stannard | 250e5a5 | 2018-10-08 14:04:24 +0000 | [diff] [blame] | 164 | initializeAArch64BranchTargetsPass(*PR); |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 165 | initializeAArch64CollectLOHPass(*PR); |
Tim Northover | 1c35341 | 2018-10-24 20:19:09 +0000 | [diff] [blame] | 166 | initializeAArch64CompressJumpTablesPass(*PR); |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 167 | initializeAArch64ConditionalComparesPass(*PR); |
| 168 | initializeAArch64ConditionOptimizerPass(*PR); |
| 169 | initializeAArch64DeadRegisterDefinitionsPass(*PR); |
Tim Northover | 5dad9df | 2016-04-01 23:14:52 +0000 | [diff] [blame] | 170 | initializeAArch64ExpandPseudoPass(*PR); |
Geoff Berry | 24c81e8 | 2016-07-20 21:45:58 +0000 | [diff] [blame] | 171 | initializeAArch64LoadStoreOptPass(*PR); |
Abderrazek Zaafrani | 2c80e4c | 2017-12-08 00:58:49 +0000 | [diff] [blame] | 172 | initializeAArch64SIMDInstrOptPass(*PR); |
Daniel Sanders | c973ad1 | 2018-10-03 02:12:17 +0000 | [diff] [blame] | 173 | initializeAArch64PreLegalizerCombinerPass(*PR); |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 174 | initializeAArch64PromoteConstantPass(*PR); |
| 175 | initializeAArch64RedundantCopyEliminationPass(*PR); |
| 176 | initializeAArch64StorePairSuppressPass(*PR); |
Geoff Berry | 9962fae | 2017-07-18 16:14:22 +0000 | [diff] [blame] | 177 | initializeFalkorHWPFFixPass(*PR); |
Geoff Berry | b1e8714 | 2017-07-14 21:44:12 +0000 | [diff] [blame] | 178 | initializeFalkorMarkStridedAccessesLegacyPass(*PR); |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 179 | initializeLDTLSCleanupPass(*PR); |
Kristof Beyls | e66bc1f | 2018-12-18 08:50:02 +0000 | [diff] [blame] | 180 | initializeAArch64SpeculationHardeningPass(*PR); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 181 | } |
| 182 | |
Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 183 | //===----------------------------------------------------------------------===// |
| 184 | // AArch64 Lowering public interface. |
| 185 | //===----------------------------------------------------------------------===// |
| 186 | static std::unique_ptr<TargetLoweringObjectFile> createTLOF(const Triple &TT) { |
| 187 | if (TT.isOSBinFormatMachO()) |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 188 | return llvm::make_unique<AArch64_MachoTargetObjectFile>(); |
Mandeep Singh Grang | 0c72172 | 2017-06-27 23:58:19 +0000 | [diff] [blame] | 189 | if (TT.isOSBinFormatCOFF()) |
| 190 | return llvm::make_unique<AArch64_COFFTargetObjectFile>(); |
Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 191 | |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 192 | return llvm::make_unique<AArch64_ELFTargetObjectFile>(); |
Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 193 | } |
| 194 | |
Mehdi Amini | 93e1ea1 | 2015-03-12 00:07:24 +0000 | [diff] [blame] | 195 | // Helper function to build a DataLayout string |
Joel Jones | 504bf33 | 2016-10-24 13:37:13 +0000 | [diff] [blame] | 196 | static std::string computeDataLayout(const Triple &TT, |
| 197 | const MCTargetOptions &Options, |
| 198 | bool LittleEndian) { |
| 199 | if (Options.getABIName() == "ilp32") |
| 200 | return "e-m:e-p:32:32-i8:8-i16:16-i64:64-S128"; |
Daniel Sanders | ed64d62 | 2015-06-11 15:34:59 +0000 | [diff] [blame] | 201 | if (TT.isOSBinFormatMachO()) |
Mehdi Amini | 93e1ea1 | 2015-03-12 00:07:24 +0000 | [diff] [blame] | 202 | return "e-m:o-i64:64-i128:128-n32:64-S128"; |
Mandeep Singh Grang | 0c72172 | 2017-06-27 23:58:19 +0000 | [diff] [blame] | 203 | if (TT.isOSBinFormatCOFF()) |
Mandeep Singh Grang | 6d6f2fa | 2017-07-17 21:25:19 +0000 | [diff] [blame] | 204 | return "e-m:w-p:64:64-i32:32-i64:64-i128:128-n32:64-S128"; |
Mehdi Amini | 93e1ea1 | 2015-03-12 00:07:24 +0000 | [diff] [blame] | 205 | if (LittleEndian) |
Chad Rosier | 112d0e9 | 2016-07-07 20:02:18 +0000 | [diff] [blame] | 206 | return "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128"; |
| 207 | return "E-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128"; |
Mehdi Amini | 93e1ea1 | 2015-03-12 00:07:24 +0000 | [diff] [blame] | 208 | } |
| 209 | |
Rafael Espindola | 8c34dd8 | 2016-05-18 22:04:49 +0000 | [diff] [blame] | 210 | static Reloc::Model getEffectiveRelocModel(const Triple &TT, |
| 211 | Optional<Reloc::Model> RM) { |
| 212 | // AArch64 Darwin is always PIC. |
| 213 | if (TT.isOSDarwin()) |
| 214 | return Reloc::PIC_; |
| 215 | // On ELF platforms the default static relocation model has a smart enough |
| 216 | // linker to cope with referencing external symbols defined in a shared |
| 217 | // library. Hence DynamicNoPIC doesn't need to be promoted to PIC. |
| 218 | if (!RM.hasValue() || *RM == Reloc::DynamicNoPIC) |
| 219 | return Reloc::Static; |
| 220 | return *RM; |
| 221 | } |
| 222 | |
David Green | ca29c27 | 2018-12-07 12:10:23 +0000 | [diff] [blame] | 223 | static CodeModel::Model |
| 224 | getEffectiveAArch64CodeModel(const Triple &TT, Optional<CodeModel::Model> CM, |
| 225 | bool JIT) { |
Rafael Espindola | 79e238a | 2017-08-03 02:16:21 +0000 | [diff] [blame] | 226 | if (CM) { |
David Green | 9dd1d45 | 2018-08-22 11:31:39 +0000 | [diff] [blame] | 227 | if (*CM != CodeModel::Small && *CM != CodeModel::Tiny && |
| 228 | *CM != CodeModel::Large) { |
Rafael Espindola | 79e238a | 2017-08-03 02:16:21 +0000 | [diff] [blame] | 229 | if (!TT.isOSFuchsia()) |
| 230 | report_fatal_error( |
David Green | 9dd1d45 | 2018-08-22 11:31:39 +0000 | [diff] [blame] | 231 | "Only small, tiny and large code models are allowed on AArch64"); |
| 232 | else if (*CM != CodeModel::Kernel) |
| 233 | report_fatal_error("Only small, tiny, kernel, and large code models " |
| 234 | "are allowed on AArch64"); |
| 235 | } else if (*CM == CodeModel::Tiny && !TT.isOSBinFormatELF()) |
| 236 | report_fatal_error("tiny code model is only supported on ELF"); |
Rafael Espindola | 79e238a | 2017-08-03 02:16:21 +0000 | [diff] [blame] | 237 | return *CM; |
| 238 | } |
| 239 | // The default MCJIT memory managers make no guarantees about where they can |
| 240 | // find an executable page; JITed code needs to be able to refer to globals |
| 241 | // no matter how far away they are. |
| 242 | if (JIT) |
| 243 | return CodeModel::Large; |
| 244 | return CodeModel::Small; |
| 245 | } |
| 246 | |
Rafael Espindola | 38af4d6 | 2016-05-18 16:00:24 +0000 | [diff] [blame] | 247 | /// Create an AArch64 architecture model. |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 248 | /// |
Rafael Espindola | 79e238a | 2017-08-03 02:16:21 +0000 | [diff] [blame] | 249 | AArch64TargetMachine::AArch64TargetMachine(const Target &T, const Triple &TT, |
| 250 | StringRef CPU, StringRef FS, |
| 251 | const TargetOptions &Options, |
| 252 | Optional<Reloc::Model> RM, |
| 253 | Optional<CodeModel::Model> CM, |
| 254 | CodeGenOpt::Level OL, bool JIT, |
| 255 | bool LittleEndian) |
Matthias Braun | bb8507e | 2017-10-12 22:57:28 +0000 | [diff] [blame] | 256 | : LLVMTargetMachine(T, |
| 257 | computeDataLayout(TT, Options.MCOptions, LittleEndian), |
| 258 | TT, CPU, FS, Options, getEffectiveRelocModel(TT, RM), |
David Green | ca29c27 | 2018-12-07 12:10:23 +0000 | [diff] [blame] | 259 | getEffectiveAArch64CodeModel(TT, CM, JIT), OL), |
Rafael Espindola | 79e238a | 2017-08-03 02:16:21 +0000 | [diff] [blame] | 260 | TLOF(createTLOF(getTargetTriple())), isLittle(LittleEndian) { |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 261 | initAsmInfo(); |
Volkan Keles | a79b062 | 2018-01-17 22:34:21 +0000 | [diff] [blame] | 262 | |
Matthias Braun | da5e7e1 | 2018-06-28 17:00:45 +0000 | [diff] [blame] | 263 | if (TT.isOSBinFormatMachO()) { |
Tim Northover | 271d3d2 | 2018-04-13 22:25:20 +0000 | [diff] [blame] | 264 | this->Options.TrapUnreachable = true; |
Matthias Braun | da5e7e1 | 2018-06-28 17:00:45 +0000 | [diff] [blame] | 265 | this->Options.NoTrapAfterNoreturn = true; |
| 266 | } |
Tim Northover | 271d3d2 | 2018-04-13 22:25:20 +0000 | [diff] [blame] | 267 | |
Eli Friedman | 0917d0c | 2018-11-07 22:30:56 +0000 | [diff] [blame] | 268 | if (getMCAsmInfo()->usesWindowsCFI()) { |
Eli Friedman | d00fb2e | 2018-11-07 21:31:14 +0000 | [diff] [blame] | 269 | // Unwinding can get confused if the last instruction in an |
| 270 | // exception-handling region (function, funclet, try block, etc.) |
| 271 | // is a call. |
| 272 | // |
| 273 | // FIXME: We could elide the trap if the next instruction would be in |
| 274 | // the same region anyway. |
| 275 | this->Options.TrapUnreachable = true; |
| 276 | } |
| 277 | |
Volkan Keles | a79b062 | 2018-01-17 22:34:21 +0000 | [diff] [blame] | 278 | // Enable GlobalISel at or below EnableGlobalISelAt0. |
Petr Pavlu | e6406d5 | 2018-11-29 12:56:32 +0000 | [diff] [blame] | 279 | if (getOptLevel() <= EnableGlobalISelAtO) { |
Volkan Keles | a79b062 | 2018-01-17 22:34:21 +0000 | [diff] [blame] | 280 | setGlobalISel(true); |
Petr Pavlu | e6406d5 | 2018-11-29 12:56:32 +0000 | [diff] [blame] | 281 | setGlobalISelAbort(GlobalISelAbortMode::Disable); |
| 282 | } |
Jessica Paquette | dafa198 | 2018-06-28 17:45:43 +0000 | [diff] [blame] | 283 | |
| 284 | // AArch64 supports the MachineOutliner. |
| 285 | setMachineOutliner(true); |
Jessica Paquette | f90edbe | 2018-07-27 20:18:27 +0000 | [diff] [blame] | 286 | |
| 287 | // AArch64 supports default outlining behaviour. |
| 288 | setSupportsDefaultOutlining(true); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 289 | } |
| 290 | |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 291 | AArch64TargetMachine::~AArch64TargetMachine() = default; |
Reid Kleckner | 357600e | 2014-11-20 23:37:18 +0000 | [diff] [blame] | 292 | |
Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 293 | const AArch64Subtarget * |
| 294 | AArch64TargetMachine::getSubtargetImpl(const Function &F) const { |
Duncan P. N. Exon Smith | 003bb7d | 2015-02-14 02:09:06 +0000 | [diff] [blame] | 295 | Attribute CPUAttr = F.getFnAttribute("target-cpu"); |
| 296 | Attribute FSAttr = F.getFnAttribute("target-features"); |
Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 297 | |
| 298 | std::string CPU = !CPUAttr.hasAttribute(Attribute::None) |
| 299 | ? CPUAttr.getValueAsString().str() |
| 300 | : TargetCPU; |
| 301 | std::string FS = !FSAttr.hasAttribute(Attribute::None) |
| 302 | ? FSAttr.getValueAsString().str() |
| 303 | : TargetFS; |
| 304 | |
Daniel Sanders | a1b2db79 | 2017-05-19 11:08:33 +0000 | [diff] [blame] | 305 | auto &I = SubtargetMap[CPU + FS]; |
Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 306 | if (!I) { |
| 307 | // This needs to be done before we create a new subtarget since any |
| 308 | // creation will depend on the TM and the code generation flags on the |
| 309 | // function that reside in TargetOptions. |
| 310 | resetTargetOptions(F); |
Daniel Sanders | c81f450 | 2015-06-16 15:44:21 +0000 | [diff] [blame] | 311 | I = llvm::make_unique<AArch64Subtarget>(TargetTriple, CPU, FS, *this, |
Daniel Sanders | a1b2db79 | 2017-05-19 11:08:33 +0000 | [diff] [blame] | 312 | isLittle); |
Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 313 | } |
| 314 | return I.get(); |
| 315 | } |
| 316 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 317 | void AArch64leTargetMachine::anchor() { } |
| 318 | |
Daniel Sanders | 3e5de88 | 2015-06-11 19:41:26 +0000 | [diff] [blame] | 319 | AArch64leTargetMachine::AArch64leTargetMachine( |
| 320 | const Target &T, const Triple &TT, StringRef CPU, StringRef FS, |
Rafael Espindola | 8c34dd8 | 2016-05-18 22:04:49 +0000 | [diff] [blame] | 321 | const TargetOptions &Options, Optional<Reloc::Model> RM, |
Rafael Espindola | 79e238a | 2017-08-03 02:16:21 +0000 | [diff] [blame] | 322 | Optional<CodeModel::Model> CM, CodeGenOpt::Level OL, bool JIT) |
| 323 | : AArch64TargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, JIT, true) {} |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 324 | |
| 325 | void AArch64beTargetMachine::anchor() { } |
| 326 | |
Daniel Sanders | 3e5de88 | 2015-06-11 19:41:26 +0000 | [diff] [blame] | 327 | AArch64beTargetMachine::AArch64beTargetMachine( |
| 328 | const Target &T, const Triple &TT, StringRef CPU, StringRef FS, |
Rafael Espindola | 8c34dd8 | 2016-05-18 22:04:49 +0000 | [diff] [blame] | 329 | const TargetOptions &Options, Optional<Reloc::Model> RM, |
Rafael Espindola | 79e238a | 2017-08-03 02:16:21 +0000 | [diff] [blame] | 330 | Optional<CodeModel::Model> CM, CodeGenOpt::Level OL, bool JIT) |
| 331 | : AArch64TargetMachine(T, TT, CPU, FS, Options, RM, CM, OL, JIT, false) {} |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 332 | |
| 333 | namespace { |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 334 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 335 | /// AArch64 Code Generator Pass Configuration Options. |
| 336 | class AArch64PassConfig : public TargetPassConfig { |
| 337 | public: |
Matthias Braun | 5e394c3 | 2017-05-30 21:36:41 +0000 | [diff] [blame] | 338 | AArch64PassConfig(AArch64TargetMachine &TM, PassManagerBase &PM) |
Chad Rosier | 486e087 | 2014-09-12 17:40:39 +0000 | [diff] [blame] | 339 | : TargetPassConfig(TM, PM) { |
Matthias Braun | 5e394c3 | 2017-05-30 21:36:41 +0000 | [diff] [blame] | 340 | if (TM.getOptLevel() != CodeGenOpt::None) |
Chad Rosier | 347ed4e | 2014-09-12 22:17:28 +0000 | [diff] [blame] | 341 | substitutePass(&PostRASchedulerID, &PostMachineSchedulerID); |
Chad Rosier | 486e087 | 2014-09-12 17:40:39 +0000 | [diff] [blame] | 342 | } |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 343 | |
| 344 | AArch64TargetMachine &getAArch64TargetMachine() const { |
| 345 | return getTM<AArch64TargetMachine>(); |
| 346 | } |
| 347 | |
Matthias Braun | 115efcd | 2016-11-28 20:11:54 +0000 | [diff] [blame] | 348 | ScheduleDAGInstrs * |
| 349 | createMachineScheduler(MachineSchedContext *C) const override { |
Florian Hahn | 15be1ac | 2017-07-12 21:41:28 +0000 | [diff] [blame] | 350 | const AArch64Subtarget &ST = C->MF->getSubtarget<AArch64Subtarget>(); |
Matthias Braun | 115efcd | 2016-11-28 20:11:54 +0000 | [diff] [blame] | 351 | ScheduleDAGMILive *DAG = createGenericSchedLive(C); |
| 352 | DAG->addMutation(createLoadClusterDAGMutation(DAG->TII, DAG->TRI)); |
| 353 | DAG->addMutation(createStoreClusterDAGMutation(DAG->TII, DAG->TRI)); |
Florian Hahn | 15be1ac | 2017-07-12 21:41:28 +0000 | [diff] [blame] | 354 | if (ST.hasFusion()) |
| 355 | DAG->addMutation(createAArch64MacroFusionDAGMutation()); |
Matthias Braun | 115efcd | 2016-11-28 20:11:54 +0000 | [diff] [blame] | 356 | return DAG; |
| 357 | } |
| 358 | |
Evandro Menezes | 455382e | 2017-02-01 02:54:42 +0000 | [diff] [blame] | 359 | ScheduleDAGInstrs * |
| 360 | createPostMachineScheduler(MachineSchedContext *C) const override { |
| 361 | const AArch64Subtarget &ST = C->MF->getSubtarget<AArch64Subtarget>(); |
Florian Hahn | f934add | 2017-07-12 20:53:22 +0000 | [diff] [blame] | 362 | if (ST.hasFusion()) { |
Evandro Menezes | 455382e | 2017-02-01 02:54:42 +0000 | [diff] [blame] | 363 | // Run the Macro Fusion after RA again since literals are expanded from |
| 364 | // pseudos then (v. addPreSched2()). |
| 365 | ScheduleDAGMI *DAG = createGenericSchedPostRA(C); |
| 366 | DAG->addMutation(createAArch64MacroFusionDAGMutation()); |
| 367 | return DAG; |
| 368 | } |
| 369 | |
| 370 | return nullptr; |
| 371 | } |
| 372 | |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 373 | void addIRPasses() override; |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 374 | bool addPreISel() override; |
| 375 | bool addInstSelector() override; |
Quentin Colombet | d96f495 | 2016-02-11 19:35:06 +0000 | [diff] [blame] | 376 | bool addIRTranslator() override; |
Daniel Sanders | c973ad1 | 2018-10-03 02:12:17 +0000 | [diff] [blame] | 377 | void addPreLegalizeMachineIR() override; |
Tim Northover | 33b07d6 | 2016-07-22 20:03:43 +0000 | [diff] [blame] | 378 | bool addLegalizeMachineIR() override; |
Quentin Colombet | d413181 | 2016-04-07 20:27:33 +0000 | [diff] [blame] | 379 | bool addRegBankSelect() override; |
Quentin Colombet | 7a43edd | 2017-05-27 01:34:07 +0000 | [diff] [blame] | 380 | void addPreGlobalInstructionSelect() override; |
Ahmed Bougacha | 6756a2c | 2016-07-27 14:31:55 +0000 | [diff] [blame] | 381 | bool addGlobalInstructionSelect() override; |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 382 | bool addILPOpts() override; |
Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 383 | void addPreRegAlloc() override; |
| 384 | void addPostRegAlloc() override; |
| 385 | void addPreSched2() override; |
| 386 | void addPreEmitPass() override; |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 387 | }; |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 388 | |
| 389 | } // end anonymous namespace |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 390 | |
Sanjoy Das | 26d11ca | 2017-12-22 18:21:59 +0000 | [diff] [blame] | 391 | TargetTransformInfo |
| 392 | AArch64TargetMachine::getTargetTransformInfo(const Function &F) { |
| 393 | return TargetTransformInfo(AArch64TTIImpl(this, F)); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 394 | } |
| 395 | |
| 396 | TargetPassConfig *AArch64TargetMachine::createPassConfig(PassManagerBase &PM) { |
Matthias Braun | 5e394c3 | 2017-05-30 21:36:41 +0000 | [diff] [blame] | 397 | return new AArch64PassConfig(*this, PM); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 398 | } |
| 399 | |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 400 | void AArch64PassConfig::addIRPasses() { |
| 401 | // Always expand atomic operations, we don't deal with atomicrmw or cmpxchg |
| 402 | // ourselves. |
Francis Visoiu Mistrih | 8b61764 | 2017-05-18 17:21:13 +0000 | [diff] [blame] | 403 | addPass(createAtomicExpandPass()); |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 404 | |
| 405 | // Cmpxchg instructions are often used with a subsequent comparison to |
| 406 | // determine whether it succeeded. We can exploit existing control-flow in |
| 407 | // ldrex/strex loops to simplify this, but it needs tidying up. |
| 408 | if (TM->getOptLevel() != CodeGenOpt::None && EnableAtomicTidy) |
Sanjay Patel | 0ab0c1a | 2017-12-14 22:05:20 +0000 | [diff] [blame] | 409 | addPass(createCFGSimplificationPass(1, true, true, false, true)); |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 410 | |
Junmo Park | 384d376 | 2016-07-06 23:18:58 +0000 | [diff] [blame] | 411 | // Run LoopDataPrefetch |
Adam Nemet | 53e758f | 2016-03-18 00:27:29 +0000 | [diff] [blame] | 412 | // |
| 413 | // Run this before LSR to remove the multiplies involved in computing the |
| 414 | // pointer values N iterations ahead. |
Geoff Berry | b1e8714 | 2017-07-14 21:44:12 +0000 | [diff] [blame] | 415 | if (TM->getOptLevel() != CodeGenOpt::None) { |
| 416 | if (EnableLoopDataPrefetch) |
| 417 | addPass(createLoopDataPrefetchPass()); |
| 418 | if (EnableFalkorHWPFFix) |
| 419 | addPass(createFalkorMarkStridedAccessesPass()); |
| 420 | } |
Adam Nemet | 53e758f | 2016-03-18 00:27:29 +0000 | [diff] [blame] | 421 | |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 422 | TargetPassConfig::addIRPasses(); |
Hao Liu | fd46bea | 2014-11-19 06:39:53 +0000 | [diff] [blame] | 423 | |
Hao Liu | 7ec8ee3 | 2015-06-26 02:32:07 +0000 | [diff] [blame] | 424 | // Match interleaved memory accesses to ldN/stN intrinsics. |
Martin Elshuber | fef3036 | 2018-11-19 14:26:10 +0000 | [diff] [blame] | 425 | if (TM->getOptLevel() != CodeGenOpt::None) { |
| 426 | addPass(createInterleavedLoadCombinePass()); |
Francis Visoiu Mistrih | 8b61764 | 2017-05-18 17:21:13 +0000 | [diff] [blame] | 427 | addPass(createInterleavedAccessPass()); |
Martin Elshuber | fef3036 | 2018-11-19 14:26:10 +0000 | [diff] [blame] | 428 | } |
Hao Liu | 7ec8ee3 | 2015-06-26 02:32:07 +0000 | [diff] [blame] | 429 | |
Hao Liu | fd46bea | 2014-11-19 06:39:53 +0000 | [diff] [blame] | 430 | if (TM->getOptLevel() == CodeGenOpt::Aggressive && EnableGEPOpt) { |
| 431 | // Call SeparateConstOffsetFromGEP pass to extract constants within indices |
| 432 | // and lower a GEP with multiple indices to either arithmetic operations or |
| 433 | // multiple GEPs with single index. |
David Blaikie | 8ad9a97 | 2018-03-28 22:28:50 +0000 | [diff] [blame] | 434 | addPass(createSeparateConstOffsetFromGEPPass(true)); |
Hao Liu | fd46bea | 2014-11-19 06:39:53 +0000 | [diff] [blame] | 435 | // Call EarlyCSE pass to find and remove subexpressions in the lowered |
| 436 | // result. |
| 437 | addPass(createEarlyCSEPass()); |
| 438 | // Do loop invariant code motion in case part of the lowered result is |
| 439 | // invariant. |
| 440 | addPass(createLICMPass()); |
| 441 | } |
Tim Northover | b4ddc08 | 2014-05-30 10:09:59 +0000 | [diff] [blame] | 442 | } |
| 443 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 444 | // Pass Pipeline Configuration |
| 445 | bool AArch64PassConfig::addPreISel() { |
| 446 | // Run promote constant before global merge, so that the promoted constants |
| 447 | // get a chance to be merged |
| 448 | if (TM->getOptLevel() != CodeGenOpt::None && EnablePromoteConstant) |
| 449 | addPass(createAArch64PromoteConstantPass()); |
Eric Christopher | ed47b22 | 2015-02-23 19:28:45 +0000 | [diff] [blame] | 450 | // FIXME: On AArch64, this depends on the type. |
| 451 | // Basically, the addressable offsets are up to 4095 * Ty.getSizeInBytes(). |
| 452 | // and the offset has to be a multiple of the related size in bytes. |
Ahmed Bougacha | 8207641 | 2015-06-04 20:39:23 +0000 | [diff] [blame] | 453 | if ((TM->getOptLevel() != CodeGenOpt::None && |
Ahmed Bougacha | b96444e | 2015-04-11 00:06:36 +0000 | [diff] [blame] | 454 | EnableGlobalMerge == cl::BOU_UNSET) || |
Ahmed Bougacha | 8207641 | 2015-06-04 20:39:23 +0000 | [diff] [blame] | 455 | EnableGlobalMerge == cl::BOU_TRUE) { |
| 456 | bool OnlyOptimizeForSize = (TM->getOptLevel() < CodeGenOpt::Aggressive) && |
| 457 | (EnableGlobalMerge == cl::BOU_UNSET); |
| 458 | addPass(createGlobalMergePass(TM, 4095, OnlyOptimizeForSize)); |
| 459 | } |
| 460 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 461 | return false; |
| 462 | } |
| 463 | |
| 464 | bool AArch64PassConfig::addInstSelector() { |
| 465 | addPass(createAArch64ISelDag(getAArch64TargetMachine(), getOptLevel())); |
| 466 | |
| 467 | // For ELF, cleanup any local-dynamic TLS accesses (i.e. combine as many |
| 468 | // references to _TLS_MODULE_BASE_ as possible. |
Daniel Sanders | c81f450 | 2015-06-16 15:44:21 +0000 | [diff] [blame] | 469 | if (TM->getTargetTriple().isOSBinFormatELF() && |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 470 | getOptLevel() != CodeGenOpt::None) |
| 471 | addPass(createAArch64CleanupLocalDynamicTLSPass()); |
| 472 | |
| 473 | return false; |
| 474 | } |
| 475 | |
Quentin Colombet | d96f495 | 2016-02-11 19:35:06 +0000 | [diff] [blame] | 476 | bool AArch64PassConfig::addIRTranslator() { |
| 477 | addPass(new IRTranslator()); |
| 478 | return false; |
| 479 | } |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 480 | |
Daniel Sanders | c973ad1 | 2018-10-03 02:12:17 +0000 | [diff] [blame] | 481 | void AArch64PassConfig::addPreLegalizeMachineIR() { |
| 482 | addPass(createAArch64PreLegalizeCombiner()); |
| 483 | } |
| 484 | |
Tim Northover | 33b07d6 | 2016-07-22 20:03:43 +0000 | [diff] [blame] | 485 | bool AArch64PassConfig::addLegalizeMachineIR() { |
Tim Northover | 69fa84a | 2016-10-14 22:18:18 +0000 | [diff] [blame] | 486 | addPass(new Legalizer()); |
Tim Northover | 33b07d6 | 2016-07-22 20:03:43 +0000 | [diff] [blame] | 487 | return false; |
| 488 | } |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 489 | |
Quentin Colombet | d413181 | 2016-04-07 20:27:33 +0000 | [diff] [blame] | 490 | bool AArch64PassConfig::addRegBankSelect() { |
| 491 | addPass(new RegBankSelect()); |
| 492 | return false; |
| 493 | } |
Eugene Zelenko | 049b017 | 2017-01-06 00:30:53 +0000 | [diff] [blame] | 494 | |
Quentin Colombet | 7a43edd | 2017-05-27 01:34:07 +0000 | [diff] [blame] | 495 | void AArch64PassConfig::addPreGlobalInstructionSelect() { |
| 496 | // Workaround the deficiency of the fast register allocator. |
| 497 | if (TM->getOptLevel() == CodeGenOpt::None) |
| 498 | addPass(new Localizer()); |
| 499 | } |
| 500 | |
Ahmed Bougacha | 6756a2c | 2016-07-27 14:31:55 +0000 | [diff] [blame] | 501 | bool AArch64PassConfig::addGlobalInstructionSelect() { |
| 502 | addPass(new InstructionSelect()); |
| 503 | return false; |
| 504 | } |
Quentin Colombet | d96f495 | 2016-02-11 19:35:06 +0000 | [diff] [blame] | 505 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 506 | bool AArch64PassConfig::addILPOpts() { |
Jiangning Liu | 1a486da | 2014-09-05 02:55:24 +0000 | [diff] [blame] | 507 | if (EnableCondOpt) |
| 508 | addPass(createAArch64ConditionOptimizerPass()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 509 | if (EnableCCMP) |
| 510 | addPass(createAArch64ConditionalCompares()); |
Gerolf Hoflehner | 97c383b | 2014-08-07 21:40:58 +0000 | [diff] [blame] | 511 | if (EnableMCR) |
| 512 | addPass(&MachineCombinerID); |
Chad Rosier | 6db9ff6 | 2017-06-23 19:20:12 +0000 | [diff] [blame] | 513 | if (EnableCondBrTuning) |
| 514 | addPass(createAArch64CondBrTuning()); |
James Molloy | 9991794 | 2014-08-06 13:31:32 +0000 | [diff] [blame] | 515 | if (EnableEarlyIfConversion) |
| 516 | addPass(&EarlyIfConverterID); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 517 | if (EnableStPairSuppress) |
| 518 | addPass(createAArch64StorePairSuppressPass()); |
Abderrazek Zaafrani | 2c80e4c | 2017-12-08 00:58:49 +0000 | [diff] [blame] | 519 | addPass(createAArch64SIMDInstrOptPass()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 520 | return true; |
| 521 | } |
| 522 | |
Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 523 | void AArch64PassConfig::addPreRegAlloc() { |
Matthias Braun | 3d51cf0 | 2016-11-16 03:38:27 +0000 | [diff] [blame] | 524 | // Change dead register definitions to refer to the zero register. |
| 525 | if (TM->getOptLevel() != CodeGenOpt::None && EnableDeadRegisterElimination) |
| 526 | addPass(createAArch64DeadRegisterDefinitions()); |
| 527 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 528 | // Use AdvSIMD scalar instructions whenever profitable. |
Quentin Colombet | 0c740d4 | 2014-08-21 18:10:07 +0000 | [diff] [blame] | 529 | if (TM->getOptLevel() != CodeGenOpt::None && EnableAdvSIMDScalar) { |
Matthias Braun | b2f2388 | 2014-12-11 23:18:03 +0000 | [diff] [blame] | 530 | addPass(createAArch64AdvSIMDScalar()); |
Quentin Colombet | 0c740d4 | 2014-08-21 18:10:07 +0000 | [diff] [blame] | 531 | // The AdvSIMD pass may produce copies that can be rewritten to |
| 532 | // be register coaleascer friendly. |
| 533 | addPass(&PeepholeOptimizerID); |
| 534 | } |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 535 | } |
| 536 | |
Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 537 | void AArch64PassConfig::addPostRegAlloc() { |
Jun Bum Lim | b389d9b | 2016-02-16 20:02:39 +0000 | [diff] [blame] | 538 | // Remove redundant copy instructions. |
| 539 | if (TM->getOptLevel() != CodeGenOpt::None && EnableRedundantCopyElimination) |
| 540 | addPass(createAArch64RedundantCopyEliminationPass()); |
| 541 | |
Eric Christopher | 6f1e568 | 2015-03-03 23:22:40 +0000 | [diff] [blame] | 542 | if (TM->getOptLevel() != CodeGenOpt::None && usingDefaultRegAlloc()) |
James Molloy | 3feea9c | 2014-08-08 12:33:21 +0000 | [diff] [blame] | 543 | // Improve performance for some FP/SIMD code for A57. |
| 544 | addPass(createAArch64A57FPLoadBalancing()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 545 | } |
| 546 | |
Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 547 | void AArch64PassConfig::addPreSched2() { |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 548 | // Expand some pseudo instructions to allow proper scheduling. |
Matthias Braun | b2f2388 | 2014-12-11 23:18:03 +0000 | [diff] [blame] | 549 | addPass(createAArch64ExpandPseudoPass()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 550 | // Use load/store pair instructions when possible. |
Geoff Berry | 9962fae | 2017-07-18 16:14:22 +0000 | [diff] [blame] | 551 | if (TM->getOptLevel() != CodeGenOpt::None) { |
| 552 | if (EnableLoadStoreOpt) |
| 553 | addPass(createAArch64LoadStoreOptimizationPass()); |
Kristof Beyls | e66bc1f | 2018-12-18 08:50:02 +0000 | [diff] [blame] | 554 | } |
| 555 | |
| 556 | // The AArch64SpeculationHardeningPass destroys dominator tree and natural |
| 557 | // loop info, which is needed for the FalkorHWPFFixPass and also later on. |
| 558 | // Therefore, run the AArch64SpeculationHardeningPass before the |
| 559 | // FalkorHWPFFixPass to avoid recomputing dominator tree and natural loop |
| 560 | // info. |
| 561 | addPass(createAArch64SpeculationHardeningPass()); |
| 562 | |
| 563 | if (TM->getOptLevel() != CodeGenOpt::None) { |
Geoff Berry | 9962fae | 2017-07-18 16:14:22 +0000 | [diff] [blame] | 564 | if (EnableFalkorHWPFFix) |
| 565 | addPass(createFalkorHWPFFixPass()); |
| 566 | } |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 567 | } |
| 568 | |
Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 569 | void AArch64PassConfig::addPreEmitPass() { |
Alexandros Lamprineas | 490ae11 | 2018-12-17 10:45:43 +0000 | [diff] [blame] | 570 | // Machine Block Placement might have created new opportunities when run |
| 571 | // at O3, where the Tail Duplication Threshold is set to 4 instructions. |
| 572 | // Run the load/store optimizer once more. |
| 573 | if (TM->getOptLevel() >= CodeGenOpt::Aggressive && EnableLoadStoreOpt) |
| 574 | addPass(createAArch64LoadStoreOptimizationPass()); |
| 575 | |
Bradley Smith | f2a801d | 2014-10-13 10:12:35 +0000 | [diff] [blame] | 576 | if (EnableA53Fix835769) |
Matthias Braun | b2f2388 | 2014-12-11 23:18:03 +0000 | [diff] [blame] | 577 | addPass(createAArch64A53Fix835769()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 578 | // Relax conditional branch instructions if they're otherwise out of |
| 579 | // range of their destination. |
Diana Picus | 850043b | 2016-08-01 05:56:57 +0000 | [diff] [blame] | 580 | if (BranchRelaxation) |
Matt Arsenault | 36919a4 | 2016-10-06 15:38:53 +0000 | [diff] [blame] | 581 | addPass(&BranchRelaxationPassID); |
| 582 | |
Oliver Stannard | 250e5a5 | 2018-10-08 14:04:24 +0000 | [diff] [blame] | 583 | if (EnableBranchTargets) |
| 584 | addPass(createAArch64BranchTargetsPass()); |
| 585 | |
Tim Northover | 1c35341 | 2018-10-24 20:19:09 +0000 | [diff] [blame] | 586 | if (TM->getOptLevel() != CodeGenOpt::None && EnableCompressJumpTables) |
| 587 | addPass(createAArch64CompressJumpTablesPass()); |
| 588 | |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 589 | if (TM->getOptLevel() != CodeGenOpt::None && EnableCollectLOH && |
Daniel Sanders | c81f450 | 2015-06-16 15:44:21 +0000 | [diff] [blame] | 590 | TM->getTargetTriple().isOSBinFormatMachO()) |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 591 | addPass(createAArch64CollectLOHPass()); |
Tim Northover | 3b0846e | 2014-05-24 12:50:23 +0000 | [diff] [blame] | 592 | } |