| Nate Begeman | 6cca84e | 2005-10-16 05:39:50 +0000 | [diff] [blame] | 1 | //===-- PPCTargetMachine.cpp - Define TargetMachine for PowerPC -----------===// | 
| Misha Brukman | b440243 | 2005-04-21 23:30:14 +0000 | [diff] [blame] | 2 | // | 
| Misha Brukman | e05203f | 2004-06-21 16:55:25 +0000 | [diff] [blame] | 3 | //                     The LLVM Compiler Infrastructure | 
|  | 4 | // | 
| Chris Lattner | f3ebc3f | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source | 
|  | 6 | // License. See LICENSE.TXT for details. | 
| Misha Brukman | b440243 | 2005-04-21 23:30:14 +0000 | [diff] [blame] | 7 | // | 
| Misha Brukman | e05203f | 2004-06-21 16:55:25 +0000 | [diff] [blame] | 8 | //===----------------------------------------------------------------------===// | 
| Misha Brukman | b440243 | 2005-04-21 23:30:14 +0000 | [diff] [blame] | 9 | // | 
| Chris Lattner | 73785d2 | 2005-08-15 23:47:04 +0000 | [diff] [blame] | 10 | // Top-level implementation for the PowerPC target. | 
| Misha Brukman | e05203f | 2004-06-21 16:55:25 +0000 | [diff] [blame] | 11 | // | 
|  | 12 | //===----------------------------------------------------------------------===// | 
|  | 13 |  | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 14 | #include "MCTargetDesc/PPCMCTargetDesc.h" | 
| Craig Topper | b25fda9 | 2012-03-17 18:46:09 +0000 | [diff] [blame] | 15 | #include "PPC.h" | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 16 | #include "PPCSubtarget.h" | 
| Chandler Carruth | d990388 | 2015-01-14 11:23:27 +0000 | [diff] [blame] | 17 | #include "PPCTargetObjectFile.h" | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 18 | #include "PPCTargetMachine.h" | 
| Chandler Carruth | 93dcdc4 | 2015-01-31 11:17:59 +0000 | [diff] [blame] | 19 | #include "PPCTargetTransformInfo.h" | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 20 | #include "llvm/ADT/Optional.h" | 
|  | 21 | #include "llvm/ADT/STLExtras.h" | 
|  | 22 | #include "llvm/ADT/StringRef.h" | 
|  | 23 | #include "llvm/ADT/Triple.h" | 
|  | 24 | #include "llvm/Analysis/TargetTransformInfo.h" | 
| Andrew Trick | ccb6736 | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 25 | #include "llvm/CodeGen/Passes.h" | 
| Matthias Braun | 31d19d4 | 2016-05-10 03:21:59 +0000 | [diff] [blame] | 26 | #include "llvm/CodeGen/TargetPassConfig.h" | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 27 | #include "llvm/IR/Attributes.h" | 
|  | 28 | #include "llvm/IR/DataLayout.h" | 
| Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 29 | #include "llvm/IR/Function.h" | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 30 | #include "llvm/Pass.h" | 
|  | 31 | #include "llvm/Support/CodeGen.h" | 
| Hal Finkel | 96c2d4d | 2012-06-08 15:38:21 +0000 | [diff] [blame] | 32 | #include "llvm/Support/CommandLine.h" | 
| Evan Cheng | 2bb4035 | 2011-08-24 18:08:43 +0000 | [diff] [blame] | 33 | #include "llvm/Support/TargetRegistry.h" | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 34 | #include "llvm/Target/TargetLoweringObjectFile.h" | 
| Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 35 | #include "llvm/Target/TargetOptions.h" | 
| Hal Finkel | f413be1 | 2014-11-21 04:35:51 +0000 | [diff] [blame] | 36 | #include "llvm/Transforms/Scalar.h" | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 37 | #include <cassert> | 
|  | 38 | #include <memory> | 
|  | 39 | #include <string> | 
|  | 40 |  | 
| Misha Brukman | e05203f | 2004-06-21 16:55:25 +0000 | [diff] [blame] | 41 | using namespace llvm; | 
|  | 42 |  | 
| Hal Finkel | 96c2d4d | 2012-06-08 15:38:21 +0000 | [diff] [blame] | 43 | static cl:: | 
| Hal Finkel | c6b5deb | 2012-06-08 19:19:53 +0000 | [diff] [blame] | 44 | opt<bool> DisableCTRLoops("disable-ppc-ctrloops", cl::Hidden, | 
|  | 45 | cl::desc("Disable CTR loops for PPC")); | 
| Hal Finkel | 96c2d4d | 2012-06-08 15:38:21 +0000 | [diff] [blame] | 46 |  | 
| Hal Finkel | c9dd020 | 2015-02-05 18:43:00 +0000 | [diff] [blame] | 47 | static cl:: | 
|  | 48 | opt<bool> DisablePreIncPrep("disable-ppc-preinc-prep", cl::Hidden, | 
|  | 49 | cl::desc("Disable PPC loop preinc prep")); | 
|  | 50 |  | 
| Hal Finkel | 174e590 | 2014-03-25 23:29:21 +0000 | [diff] [blame] | 51 | static cl::opt<bool> | 
|  | 52 | VSXFMAMutateEarly("schedule-ppc-vsx-fma-mutation-early", | 
|  | 53 | cl::Hidden, cl::desc("Schedule VSX FMA instruction mutation early")); | 
|  | 54 |  | 
| Bill Schmidt | fe723b9 | 2015-04-27 19:57:34 +0000 | [diff] [blame] | 55 | static cl:: | 
|  | 56 | opt<bool> DisableVSXSwapRemoval("disable-ppc-vsx-swap-removal", cl::Hidden, | 
|  | 57 | cl::desc("Disable VSX Swap Removal for PPC")); | 
|  | 58 |  | 
| Bill Schmidt | 34af5e1 | 2015-11-10 21:38:26 +0000 | [diff] [blame] | 59 | static cl:: | 
| Hal Finkel | fc35391 | 2016-03-31 20:39:41 +0000 | [diff] [blame] | 60 | opt<bool> DisableQPXLoadSplat("disable-ppc-qpx-load-splat", cl::Hidden, | 
|  | 61 | cl::desc("Disable QPX load splat simplification")); | 
|  | 62 |  | 
|  | 63 | static cl:: | 
| Bill Schmidt | 34af5e1 | 2015-11-10 21:38:26 +0000 | [diff] [blame] | 64 | opt<bool> DisableMIPeephole("disable-ppc-peephole", cl::Hidden, | 
|  | 65 | cl::desc("Disable machine peepholes for PPC")); | 
|  | 66 |  | 
| Hal Finkel | f413be1 | 2014-11-21 04:35:51 +0000 | [diff] [blame] | 67 | static cl::opt<bool> | 
|  | 68 | EnableGEPOpt("ppc-gep-opt", cl::Hidden, | 
|  | 69 | cl::desc("Enable optimizations on complex GEPs"), | 
|  | 70 | cl::init(true)); | 
|  | 71 |  | 
| Hal Finkel | e5aaf3f | 2015-02-20 05:08:21 +0000 | [diff] [blame] | 72 | static cl::opt<bool> | 
|  | 73 | EnablePrefetch("enable-ppc-prefetching", | 
|  | 74 | cl::desc("disable software prefetching on PPC"), | 
|  | 75 | cl::init(false), cl::Hidden); | 
|  | 76 |  | 
| Hal Finkel | 8340de1 | 2015-05-18 06:25:59 +0000 | [diff] [blame] | 77 | static cl::opt<bool> | 
|  | 78 | EnableExtraTOCRegDeps("enable-ppc-extra-toc-reg-deps", | 
|  | 79 | cl::desc("Add extra TOC register dependencies"), | 
|  | 80 | cl::init(true), cl::Hidden); | 
|  | 81 |  | 
| Hal Finkel | 5d36b23 | 2015-07-15 08:23:05 +0000 | [diff] [blame] | 82 | static cl::opt<bool> | 
|  | 83 | EnableMachineCombinerPass("ppc-machine-combiner", | 
|  | 84 | cl::desc("Enable the machine combiner pass"), | 
|  | 85 | cl::init(true), cl::Hidden); | 
|  | 86 |  | 
| Daniel Dunbar | 5680b4f | 2009-07-25 06:49:55 +0000 | [diff] [blame] | 87 | extern "C" void LLVMInitializePowerPCTarget() { | 
|  | 88 | // Register the targets | 
| Mehdi Amini | f42454b | 2016-10-09 23:00:34 +0000 | [diff] [blame] | 89 | RegisterTargetMachine<PPC32TargetMachine> A(getThePPC32Target()); | 
|  | 90 | RegisterTargetMachine<PPC64TargetMachine> B(getThePPC64Target()); | 
|  | 91 | RegisterTargetMachine<PPC64TargetMachine> C(getThePPC64LETarget()); | 
| Kit Barton | a1c712f | 2015-12-07 20:50:29 +0000 | [diff] [blame] | 92 |  | 
|  | 93 | PassRegistry &PR = *PassRegistry::getPassRegistry(); | 
|  | 94 | initializePPCBoolRetToIntPass(PR); | 
| Tony Jiang | 8e8c444 | 2017-01-16 20:12:26 +0000 | [diff] [blame] | 95 | initializePPCExpandISELPass(PR); | 
| Daniel Dunbar | 5680b4f | 2009-07-25 06:49:55 +0000 | [diff] [blame] | 96 | } | 
| Douglas Gregor | 1b731d5 | 2009-06-16 20:12:29 +0000 | [diff] [blame] | 97 |  | 
| Eric Christopher | 8b77065 | 2015-01-26 19:03:15 +0000 | [diff] [blame] | 98 | /// Return the datalayout string of a subtarget. | 
|  | 99 | static std::string getDataLayoutString(const Triple &T) { | 
|  | 100 | bool is64Bit = T.getArch() == Triple::ppc64 || T.getArch() == Triple::ppc64le; | 
|  | 101 | std::string Ret; | 
|  | 102 |  | 
|  | 103 | // Most PPC* platforms are big endian, PPC64LE is little endian. | 
|  | 104 | if (T.getArch() == Triple::ppc64le) | 
|  | 105 | Ret = "e"; | 
|  | 106 | else | 
|  | 107 | Ret = "E"; | 
|  | 108 |  | 
|  | 109 | Ret += DataLayout::getManglingComponent(T); | 
|  | 110 |  | 
|  | 111 | // PPC32 has 32 bit pointers. The PS3 (OS Lv2) is a PPC64 machine with 32 bit | 
|  | 112 | // pointers. | 
|  | 113 | if (!is64Bit || T.getOS() == Triple::Lv2) | 
|  | 114 | Ret += "-p:32:32"; | 
|  | 115 |  | 
|  | 116 | // Note, the alignment values for f64 and i64 on ppc64 in Darwin | 
|  | 117 | // documentation are wrong; these are correct (i.e. "what gcc does"). | 
|  | 118 | if (is64Bit || !T.isOSDarwin()) | 
|  | 119 | Ret += "-i64:64"; | 
|  | 120 | else | 
|  | 121 | Ret += "-f64:32:64"; | 
|  | 122 |  | 
|  | 123 | // PPC64 has 32 and 64 bit registers, PPC32 has only 32 bit ones. | 
|  | 124 | if (is64Bit) | 
|  | 125 | Ret += "-n32:64"; | 
|  | 126 | else | 
|  | 127 | Ret += "-n32"; | 
|  | 128 |  | 
|  | 129 | return Ret; | 
|  | 130 | } | 
|  | 131 |  | 
| Daniel Sanders | 335487a | 2015-06-16 13:15:50 +0000 | [diff] [blame] | 132 | static std::string computeFSAdditions(StringRef FS, CodeGenOpt::Level OL, | 
|  | 133 | const Triple &TT) { | 
| Eric Christopher | 36448af | 2014-10-01 20:38:26 +0000 | [diff] [blame] | 134 | std::string FullFS = FS; | 
| Eric Christopher | 36448af | 2014-10-01 20:38:26 +0000 | [diff] [blame] | 135 |  | 
|  | 136 | // Make sure 64-bit features are available when CPUname is generic | 
| Daniel Sanders | 335487a | 2015-06-16 13:15:50 +0000 | [diff] [blame] | 137 | if (TT.getArch() == Triple::ppc64 || TT.getArch() == Triple::ppc64le) { | 
| Eric Christopher | 36448af | 2014-10-01 20:38:26 +0000 | [diff] [blame] | 138 | if (!FullFS.empty()) | 
|  | 139 | FullFS = "+64bit," + FullFS; | 
|  | 140 | else | 
|  | 141 | FullFS = "+64bit"; | 
|  | 142 | } | 
|  | 143 |  | 
|  | 144 | if (OL >= CodeGenOpt::Default) { | 
|  | 145 | if (!FullFS.empty()) | 
|  | 146 | FullFS = "+crbits," + FullFS; | 
|  | 147 | else | 
|  | 148 | FullFS = "+crbits"; | 
|  | 149 | } | 
| Hal Finkel | e2ab0f1 | 2015-01-15 21:17:34 +0000 | [diff] [blame] | 150 |  | 
|  | 151 | if (OL != CodeGenOpt::None) { | 
| NAKAMURA Takumi | 70ad98a | 2015-09-22 11:13:55 +0000 | [diff] [blame] | 152 | if (!FullFS.empty()) | 
| Hal Finkel | e2ab0f1 | 2015-01-15 21:17:34 +0000 | [diff] [blame] | 153 | FullFS = "+invariant-function-descriptors," + FullFS; | 
|  | 154 | else | 
|  | 155 | FullFS = "+invariant-function-descriptors"; | 
|  | 156 | } | 
|  | 157 |  | 
| Eric Christopher | 36448af | 2014-10-01 20:38:26 +0000 | [diff] [blame] | 158 | return FullFS; | 
|  | 159 | } | 
|  | 160 |  | 
| Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 161 | static std::unique_ptr<TargetLoweringObjectFile> createTLOF(const Triple &TT) { | 
|  | 162 | // If it isn't a Mach-O file then it's going to be a linux ELF | 
|  | 163 | // object file. | 
|  | 164 | if (TT.isOSDarwin()) | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 165 | return llvm::make_unique<TargetLoweringObjectFileMachO>(); | 
| Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 166 |  | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 167 | return llvm::make_unique<PPC64LinuxTargetObjectFile>(); | 
| Aditya Nandakumar | a271932 | 2014-11-13 09:26:31 +0000 | [diff] [blame] | 168 | } | 
|  | 169 |  | 
| Eric Christopher | fee6aaf | 2015-02-17 06:45:15 +0000 | [diff] [blame] | 170 | static PPCTargetMachine::PPCABI computeTargetABI(const Triple &TT, | 
|  | 171 | const TargetOptions &Options) { | 
|  | 172 | if (Options.MCOptions.getABIName().startswith("elfv1")) | 
|  | 173 | return PPCTargetMachine::PPC_ABI_ELFv1; | 
|  | 174 | else if (Options.MCOptions.getABIName().startswith("elfv2")) | 
|  | 175 | return PPCTargetMachine::PPC_ABI_ELFv2; | 
|  | 176 |  | 
|  | 177 | assert(Options.MCOptions.getABIName().empty() && | 
| NAKAMURA Takumi | 0a7d0ad | 2015-09-22 11:15:07 +0000 | [diff] [blame] | 178 | "Unknown target-abi option!"); | 
| Eric Christopher | fee6aaf | 2015-02-17 06:45:15 +0000 | [diff] [blame] | 179 |  | 
|  | 180 | if (!TT.isMacOSX()) { | 
|  | 181 | switch (TT.getArch()) { | 
|  | 182 | case Triple::ppc64le: | 
|  | 183 | return PPCTargetMachine::PPC_ABI_ELFv2; | 
|  | 184 | case Triple::ppc64: | 
|  | 185 | return PPCTargetMachine::PPC_ABI_ELFv1; | 
|  | 186 | default: | 
|  | 187 | // Fallthrough. | 
|  | 188 | ; | 
|  | 189 | } | 
|  | 190 | } | 
|  | 191 | return PPCTargetMachine::PPC_ABI_UNKNOWN; | 
|  | 192 | } | 
|  | 193 |  | 
| Rafael Espindola | 8c34dd8 | 2016-05-18 22:04:49 +0000 | [diff] [blame] | 194 | static Reloc::Model getEffectiveRelocModel(const Triple &TT, | 
|  | 195 | Optional<Reloc::Model> RM) { | 
|  | 196 | if (!RM.hasValue()) { | 
| Joerg Sonnenberger | 400e7b7 | 2016-12-15 00:01:53 +0000 | [diff] [blame] | 197 | if (TT.getArch() == Triple::ppc64 || TT.getArch() == Triple::ppc64le) { | 
|  | 198 | if (!TT.isOSBinFormatMachO() && !TT.isMacOSX()) | 
|  | 199 | return Reloc::PIC_; | 
|  | 200 | } | 
| Rafael Espindola | 8c34dd8 | 2016-05-18 22:04:49 +0000 | [diff] [blame] | 201 | if (TT.isOSDarwin()) | 
|  | 202 | return Reloc::DynamicNoPIC; | 
|  | 203 | return Reloc::Static; | 
|  | 204 | } | 
|  | 205 | return *RM; | 
|  | 206 | } | 
|  | 207 |  | 
| NAKAMURA Takumi | 8496503 | 2015-09-22 11:14:12 +0000 | [diff] [blame] | 208 | // The FeatureString here is a little subtle. We are modifying the feature | 
|  | 209 | // string with what are (currently) non-function specific overrides as it goes | 
|  | 210 | // into the LLVMTargetMachine constructor and then using the stored value in the | 
| Eric Christopher | 36448af | 2014-10-01 20:38:26 +0000 | [diff] [blame] | 211 | // Subtarget constructor below it. | 
| Daniel Sanders | 3e5de88 | 2015-06-11 19:41:26 +0000 | [diff] [blame] | 212 | PPCTargetMachine::PPCTargetMachine(const Target &T, const Triple &TT, | 
|  | 213 | StringRef CPU, StringRef FS, | 
|  | 214 | const TargetOptions &Options, | 
| Rafael Espindola | 8c34dd8 | 2016-05-18 22:04:49 +0000 | [diff] [blame] | 215 | Optional<Reloc::Model> RM, | 
|  | 216 | CodeModel::Model CM, CodeGenOpt::Level OL) | 
| Daniel Sanders | 3e5de88 | 2015-06-11 19:41:26 +0000 | [diff] [blame] | 217 | : LLVMTargetMachine(T, getDataLayoutString(TT), TT, CPU, | 
| Rafael Espindola | 8c34dd8 | 2016-05-18 22:04:49 +0000 | [diff] [blame] | 218 | computeFSAdditions(FS, OL, TT), Options, | 
|  | 219 | getEffectiveRelocModel(TT, RM), CM, OL), | 
| Daniel Sanders | c81f450 | 2015-06-16 15:44:21 +0000 | [diff] [blame] | 220 | TLOF(createTLOF(getTargetTriple())), | 
| Hal Finkel | cbf0892 | 2015-07-12 02:33:57 +0000 | [diff] [blame] | 221 | TargetABI(computeTargetABI(TT, Options)), | 
|  | 222 | Subtarget(TargetTriple, CPU, computeFSAdditions(FS, OL, TT), *this) { | 
|  | 223 |  | 
| Rafael Espindola | 227144c | 2013-05-13 01:16:13 +0000 | [diff] [blame] | 224 | initAsmInfo(); | 
| Nate Begeman | 6cca84e | 2005-10-16 05:39:50 +0000 | [diff] [blame] | 225 | } | 
|  | 226 |  | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 227 | PPCTargetMachine::~PPCTargetMachine() = default; | 
| Reid Kleckner | 357600e | 2014-11-20 23:37:18 +0000 | [diff] [blame] | 228 |  | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 229 | void PPC32TargetMachine::anchor() {} | 
| David Blaikie | a379b181 | 2011-12-20 02:50:00 +0000 | [diff] [blame] | 230 |  | 
| Daniel Sanders | 3e5de88 | 2015-06-11 19:41:26 +0000 | [diff] [blame] | 231 | PPC32TargetMachine::PPC32TargetMachine(const Target &T, const Triple &TT, | 
| Evan Cheng | efd9b42 | 2011-07-20 07:51:56 +0000 | [diff] [blame] | 232 | StringRef CPU, StringRef FS, | 
| Nick Lewycky | 50f02cb | 2011-12-02 22:16:29 +0000 | [diff] [blame] | 233 | const TargetOptions &Options, | 
| Rafael Espindola | 8c34dd8 | 2016-05-18 22:04:49 +0000 | [diff] [blame] | 234 | Optional<Reloc::Model> RM, | 
|  | 235 | CodeModel::Model CM, | 
| Evan Cheng | ecb2908 | 2011-11-16 08:38:26 +0000 | [diff] [blame] | 236 | CodeGenOpt::Level OL) | 
| Daniel Sanders | 3e5de88 | 2015-06-11 19:41:26 +0000 | [diff] [blame] | 237 | : PPCTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL) {} | 
| Chris Lattner | 0c4aa14 | 2006-06-16 01:37:27 +0000 | [diff] [blame] | 238 |  | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 239 | void PPC64TargetMachine::anchor() {} | 
| Chris Lattner | 0c4aa14 | 2006-06-16 01:37:27 +0000 | [diff] [blame] | 240 |  | 
| Daniel Sanders | 3e5de88 | 2015-06-11 19:41:26 +0000 | [diff] [blame] | 241 | PPC64TargetMachine::PPC64TargetMachine(const Target &T, const Triple &TT, | 
|  | 242 | StringRef CPU, StringRef FS, | 
| Nick Lewycky | 50f02cb | 2011-12-02 22:16:29 +0000 | [diff] [blame] | 243 | const TargetOptions &Options, | 
| Rafael Espindola | 8c34dd8 | 2016-05-18 22:04:49 +0000 | [diff] [blame] | 244 | Optional<Reloc::Model> RM, | 
|  | 245 | CodeModel::Model CM, | 
| Evan Cheng | ecb2908 | 2011-11-16 08:38:26 +0000 | [diff] [blame] | 246 | CodeGenOpt::Level OL) | 
| Daniel Sanders | 3e5de88 | 2015-06-11 19:41:26 +0000 | [diff] [blame] | 247 | : PPCTargetMachine(T, TT, CPU, FS, Options, RM, CM, OL) {} | 
| Chris Lattner | 0c4aa14 | 2006-06-16 01:37:27 +0000 | [diff] [blame] | 248 |  | 
| Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 249 | const PPCSubtarget * | 
|  | 250 | PPCTargetMachine::getSubtargetImpl(const Function &F) const { | 
| Duncan P. N. Exon Smith | 5bedaf93 | 2015-02-14 02:54:07 +0000 | [diff] [blame] | 251 | Attribute CPUAttr = F.getFnAttribute("target-cpu"); | 
|  | 252 | Attribute FSAttr = F.getFnAttribute("target-features"); | 
| Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 253 |  | 
|  | 254 | std::string CPU = !CPUAttr.hasAttribute(Attribute::None) | 
|  | 255 | ? CPUAttr.getValueAsString().str() | 
|  | 256 | : TargetCPU; | 
|  | 257 | std::string FS = !FSAttr.hasAttribute(Attribute::None) | 
|  | 258 | ? FSAttr.getValueAsString().str() | 
|  | 259 | : TargetFS; | 
|  | 260 |  | 
| Petar Jovanovic | 280f710 | 2015-12-14 17:57:33 +0000 | [diff] [blame] | 261 | // FIXME: This is related to the code below to reset the target options, | 
|  | 262 | // we need to know whether or not the soft float flag is set on the | 
|  | 263 | // function before we can generate a subtarget. We also need to use | 
|  | 264 | // it as a key for the subtarget since that can be the only difference | 
|  | 265 | // between two functions. | 
|  | 266 | bool SoftFloat = | 
| Nirav Dave | 8dd66e5 | 2016-03-30 15:41:12 +0000 | [diff] [blame] | 267 | F.getFnAttribute("use-soft-float").getValueAsString() == "true"; | 
| Petar Jovanovic | 280f710 | 2015-12-14 17:57:33 +0000 | [diff] [blame] | 268 | // If the soft float attribute is set on the function turn on the soft float | 
|  | 269 | // subtarget feature. | 
|  | 270 | if (SoftFloat) | 
| Hal Finkel | a932105 | 2016-10-02 02:10:20 +0000 | [diff] [blame] | 271 | FS += FS.empty() ? "-hard-float" : ",-hard-float"; | 
| Petar Jovanovic | 280f710 | 2015-12-14 17:57:33 +0000 | [diff] [blame] | 272 |  | 
| Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 273 | auto &I = SubtargetMap[CPU + FS]; | 
|  | 274 | if (!I) { | 
|  | 275 | // This needs to be done before we create a new subtarget since any | 
|  | 276 | // creation will depend on the TM and the code generation flags on the | 
|  | 277 | // function that reside in TargetOptions. | 
|  | 278 | resetTargetOptions(F); | 
| Eric Christopher | ed1042b | 2015-03-26 00:50:23 +0000 | [diff] [blame] | 279 | I = llvm::make_unique<PPCSubtarget>( | 
| Daniel Sanders | c81f450 | 2015-06-16 15:44:21 +0000 | [diff] [blame] | 280 | TargetTriple, CPU, | 
| Eric Christopher | ed1042b | 2015-03-26 00:50:23 +0000 | [diff] [blame] | 281 | // FIXME: It would be good to have the subtarget additions here | 
|  | 282 | // not necessary. Anything that turns them on/off (overrides) ends | 
|  | 283 | // up being put at the end of the feature string, but the defaults | 
|  | 284 | // shouldn't require adding them. Fixing this means pulling Feature64Bit | 
|  | 285 | // out of most of the target cpus in the .td file and making it set only | 
|  | 286 | // as part of initialization via the TargetTriple. | 
|  | 287 | computeFSAdditions(FS, getOptLevel(), getTargetTriple()), *this); | 
| Eric Christopher | 3faf2f1 | 2014-10-06 06:45:36 +0000 | [diff] [blame] | 288 | } | 
|  | 289 | return I.get(); | 
|  | 290 | } | 
| Misha Brukman | b440243 | 2005-04-21 23:30:14 +0000 | [diff] [blame] | 291 |  | 
| Chris Lattner | 12e9730 | 2006-09-04 04:14:57 +0000 | [diff] [blame] | 292 | //===----------------------------------------------------------------------===// | 
|  | 293 | // Pass Pipeline Configuration | 
|  | 294 | //===----------------------------------------------------------------------===// | 
| Nate Begeman | f17ea0f | 2004-08-11 07:40:04 +0000 | [diff] [blame] | 295 |  | 
| Andrew Trick | ccb6736 | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 296 | namespace { | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 297 |  | 
| Andrew Trick | ccb6736 | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 298 | /// PPC Code Generator Pass Configuration Options. | 
|  | 299 | class PPCPassConfig : public TargetPassConfig { | 
|  | 300 | public: | 
| Andrew Trick | f8ea108 | 2012-02-04 02:56:59 +0000 | [diff] [blame] | 301 | PPCPassConfig(PPCTargetMachine *TM, PassManagerBase &PM) | 
|  | 302 | : TargetPassConfig(TM, PM) {} | 
| Andrew Trick | ccb6736 | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 303 |  | 
|  | 304 | PPCTargetMachine &getPPCTargetMachine() const { | 
|  | 305 | return getTM<PPCTargetMachine>(); | 
|  | 306 | } | 
|  | 307 |  | 
| Robin Morisset | 2212996 | 2014-09-23 20:46:49 +0000 | [diff] [blame] | 308 | void addIRPasses() override; | 
| Craig Topper | 0d3fa92 | 2014-04-29 07:57:37 +0000 | [diff] [blame] | 309 | bool addPreISel() override; | 
|  | 310 | bool addILPOpts() override; | 
|  | 311 | bool addInstSelector() override; | 
| Bill Schmidt | fe723b9 | 2015-04-27 19:57:34 +0000 | [diff] [blame] | 312 | void addMachineSSAOptimization() override; | 
| Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 313 | void addPreRegAlloc() override; | 
|  | 314 | void addPreSched2() override; | 
|  | 315 | void addPreEmitPass() override; | 
| Andrew Trick | ccb6736 | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 316 | }; | 
| Eugene Zelenko | 8187c19 | 2017-01-13 00:58:58 +0000 | [diff] [blame] | 317 |  | 
|  | 318 | } // end anonymous namespace | 
| Andrew Trick | ccb6736 | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 319 |  | 
| Andrew Trick | f8ea108 | 2012-02-04 02:56:59 +0000 | [diff] [blame] | 320 | TargetPassConfig *PPCTargetMachine::createPassConfig(PassManagerBase &PM) { | 
| Hal Finkel | eb50c2d | 2012-06-09 03:14:50 +0000 | [diff] [blame] | 321 | return new PPCPassConfig(this, PM); | 
| Andrew Trick | ccb6736 | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 322 | } | 
|  | 323 |  | 
| Robin Morisset | 2212996 | 2014-09-23 20:46:49 +0000 | [diff] [blame] | 324 | void PPCPassConfig::addIRPasses() { | 
| Kit Barton | a1c712f | 2015-12-07 20:50:29 +0000 | [diff] [blame] | 325 | if (TM->getOptLevel() != CodeGenOpt::None) | 
|  | 326 | addPass(createPPCBoolRetToIntPass()); | 
| Robin Morisset | 2212996 | 2014-09-23 20:46:49 +0000 | [diff] [blame] | 327 | addPass(createAtomicExpandPass(&getPPCTargetMachine())); | 
| Hal Finkel | f413be1 | 2014-11-21 04:35:51 +0000 | [diff] [blame] | 328 |  | 
| Hal Finkel | e5aaf3f | 2015-02-20 05:08:21 +0000 | [diff] [blame] | 329 | // For the BG/Q (or if explicitly requested), add explicit data prefetch | 
|  | 330 | // intrinsics. | 
| Daniel Sanders | c81f450 | 2015-06-16 15:44:21 +0000 | [diff] [blame] | 331 | bool UsePrefetching = TM->getTargetTriple().getVendor() == Triple::BGQ && | 
|  | 332 | getOptLevel() != CodeGenOpt::None; | 
| Hal Finkel | e5aaf3f | 2015-02-20 05:08:21 +0000 | [diff] [blame] | 333 | if (EnablePrefetch.getNumOccurrences() > 0) | 
|  | 334 | UsePrefetching = EnablePrefetch; | 
|  | 335 | if (UsePrefetching) | 
| Adam Nemet | 9d9cb27 | 2016-02-18 21:38:19 +0000 | [diff] [blame] | 336 | addPass(createLoopDataPrefetchPass()); | 
| Hal Finkel | e5aaf3f | 2015-02-20 05:08:21 +0000 | [diff] [blame] | 337 |  | 
| Ehsan Amiri | 4701a91 | 2016-04-07 15:30:55 +0000 | [diff] [blame] | 338 | if (TM->getOptLevel() >= CodeGenOpt::Default && EnableGEPOpt) { | 
| Hal Finkel | f413be1 | 2014-11-21 04:35:51 +0000 | [diff] [blame] | 339 | // Call SeparateConstOffsetFromGEP pass to extract constants within indices | 
|  | 340 | // and lower a GEP with multiple indices to either arithmetic operations or | 
|  | 341 | // multiple GEPs with single index. | 
|  | 342 | addPass(createSeparateConstOffsetFromGEPPass(TM, true)); | 
|  | 343 | // Call EarlyCSE pass to find and remove subexpressions in the lowered | 
|  | 344 | // result. | 
|  | 345 | addPass(createEarlyCSEPass()); | 
|  | 346 | // Do loop invariant code motion in case part of the lowered result is | 
|  | 347 | // invariant. | 
|  | 348 | addPass(createLICMPass()); | 
|  | 349 | } | 
|  | 350 |  | 
| Robin Morisset | 2212996 | 2014-09-23 20:46:49 +0000 | [diff] [blame] | 351 | TargetPassConfig::addIRPasses(); | 
|  | 352 | } | 
|  | 353 |  | 
| Hal Finkel | 25c1992 | 2013-05-15 21:37:41 +0000 | [diff] [blame] | 354 | bool PPCPassConfig::addPreISel() { | 
| Hal Finkel | c9dd020 | 2015-02-05 18:43:00 +0000 | [diff] [blame] | 355 | if (!DisablePreIncPrep && getOptLevel() != CodeGenOpt::None) | 
|  | 356 | addPass(createPPCLoopPreIncPrepPass(getPPCTargetMachine())); | 
|  | 357 |  | 
| Hal Finkel | c6b5deb | 2012-06-08 19:19:53 +0000 | [diff] [blame] | 358 | if (!DisableCTRLoops && getOptLevel() != CodeGenOpt::None) | 
| Hal Finkel | 25c1992 | 2013-05-15 21:37:41 +0000 | [diff] [blame] | 359 | addPass(createPPCCTRLoops(getPPCTargetMachine())); | 
| Hal Finkel | 96c2d4d | 2012-06-08 15:38:21 +0000 | [diff] [blame] | 360 |  | 
|  | 361 | return false; | 
|  | 362 | } | 
|  | 363 |  | 
| Hal Finkel | ed6a285 | 2013-04-05 23:29:01 +0000 | [diff] [blame] | 364 | bool PPCPassConfig::addILPOpts() { | 
| Eric Christopher | 6b0fcfe | 2014-05-21 23:40:26 +0000 | [diff] [blame] | 365 | addPass(&EarlyIfConverterID); | 
| Hal Finkel | 5d36b23 | 2015-07-15 08:23:05 +0000 | [diff] [blame] | 366 |  | 
|  | 367 | if (EnableMachineCombinerPass) | 
|  | 368 | addPass(&MachineCombinerID); | 
|  | 369 |  | 
| Eric Christopher | 6b0fcfe | 2014-05-21 23:40:26 +0000 | [diff] [blame] | 370 | return true; | 
| Hal Finkel | ed6a285 | 2013-04-05 23:29:01 +0000 | [diff] [blame] | 371 | } | 
|  | 372 |  | 
| Andrew Trick | ccb6736 | 2012-02-03 05:12:41 +0000 | [diff] [blame] | 373 | bool PPCPassConfig::addInstSelector() { | 
| Chris Lattner | c6aa806 | 2005-08-17 19:33:30 +0000 | [diff] [blame] | 374 | // Install an instruction selector. | 
| Bob Wilson | bbd38dd | 2012-07-02 19:48:31 +0000 | [diff] [blame] | 375 | addPass(createPPCISelDag(getPPCTargetMachine())); | 
| Hal Finkel | 8ca3884 | 2013-05-20 16:08:17 +0000 | [diff] [blame] | 376 |  | 
|  | 377 | #ifndef NDEBUG | 
|  | 378 | if (!DisableCTRLoops && getOptLevel() != CodeGenOpt::None) | 
|  | 379 | addPass(createPPCCTRLoopsVerify()); | 
|  | 380 | #endif | 
|  | 381 |  | 
| Eric Christopher | d71e444 | 2014-05-22 01:21:35 +0000 | [diff] [blame] | 382 | addPass(createPPCVSXCopyPass()); | 
| Nate Begeman | f17ea0f | 2004-08-11 07:40:04 +0000 | [diff] [blame] | 383 | return false; | 
|  | 384 | } | 
|  | 385 |  | 
| Bill Schmidt | fe723b9 | 2015-04-27 19:57:34 +0000 | [diff] [blame] | 386 | void PPCPassConfig::addMachineSSAOptimization() { | 
|  | 387 | TargetPassConfig::addMachineSSAOptimization(); | 
|  | 388 | // For little endian, remove where possible the vector swap instructions | 
|  | 389 | // introduced at code generation to normalize vector element order. | 
| Daniel Sanders | c81f450 | 2015-06-16 15:44:21 +0000 | [diff] [blame] | 390 | if (TM->getTargetTriple().getArch() == Triple::ppc64le && | 
| Bill Schmidt | fe723b9 | 2015-04-27 19:57:34 +0000 | [diff] [blame] | 391 | !DisableVSXSwapRemoval) | 
|  | 392 | addPass(createPPCVSXSwapRemovalPass()); | 
| Bill Schmidt | 34af5e1 | 2015-11-10 21:38:26 +0000 | [diff] [blame] | 393 | // Target-specific peephole cleanups performed after instruction | 
|  | 394 | // selection. | 
|  | 395 | if (!DisableMIPeephole) { | 
|  | 396 | addPass(createPPCMIPeepholePass()); | 
|  | 397 | addPass(&DeadMachineInstructionElimID); | 
|  | 398 | } | 
| Bill Schmidt | fe723b9 | 2015-04-27 19:57:34 +0000 | [diff] [blame] | 399 | } | 
|  | 400 |  | 
| Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 401 | void PPCPassConfig::addPreRegAlloc() { | 
| Andrew Kaylor | 289bd5f | 2016-04-27 19:39:32 +0000 | [diff] [blame] | 402 | if (getOptLevel() != CodeGenOpt::None) { | 
|  | 403 | initializePPCVSXFMAMutatePass(*PassRegistry::getPassRegistry()); | 
|  | 404 | insertPass(VSXFMAMutateEarly ? &RegisterCoalescerID : &MachineSchedulerID, | 
|  | 405 | &PPCVSXFMAMutateID); | 
|  | 406 | } | 
| Rafael Espindola | 248cfb9 | 2016-06-28 12:49:12 +0000 | [diff] [blame] | 407 |  | 
|  | 408 | // FIXME: We probably don't need to run these for -fPIE. | 
|  | 409 | if (getPPCTargetMachine().isPositionIndependent()) { | 
| Matthias Braun | f84547c | 2016-04-28 23:42:51 +0000 | [diff] [blame] | 410 | // FIXME: LiveVariables should not be necessary here! | 
|  | 411 | // PPCTLSDYnamicCallPass uses LiveIntervals which previously dependet on | 
|  | 412 | // LiveVariables. This (unnecessary) dependency has been removed now, | 
|  | 413 | // however a stage-2 clang build fails without LiveVariables computed here. | 
|  | 414 | addPass(&LiveVariablesID, false); | 
| Bill Schmidt | 82f1c77 | 2015-02-10 19:09:05 +0000 | [diff] [blame] | 415 | addPass(createPPCTLSDynamicCallPass()); | 
| Matthias Braun | f84547c | 2016-04-28 23:42:51 +0000 | [diff] [blame] | 416 | } | 
| Hal Finkel | 8340de1 | 2015-05-18 06:25:59 +0000 | [diff] [blame] | 417 | if (EnableExtraTOCRegDeps) | 
|  | 418 | addPass(createPPCTOCRegDepsPass()); | 
| Hal Finkel | 174e590 | 2014-03-25 23:29:21 +0000 | [diff] [blame] | 419 | } | 
|  | 420 |  | 
| Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 421 | void PPCPassConfig::addPreSched2() { | 
| Hal Finkel | fc35391 | 2016-03-31 20:39:41 +0000 | [diff] [blame] | 422 | if (getOptLevel() != CodeGenOpt::None) { | 
| Hal Finkel | 5711eca | 2013-04-09 22:58:37 +0000 | [diff] [blame] | 423 | addPass(&IfConverterID); | 
| Hal Finkel | fc35391 | 2016-03-31 20:39:41 +0000 | [diff] [blame] | 424 |  | 
|  | 425 | // This optimization must happen after anything that might do store-to-load | 
|  | 426 | // forwarding. Here we're after RA (and, thus, when spills are inserted) | 
|  | 427 | // but before post-RA scheduling. | 
|  | 428 | if (!DisableQPXLoadSplat) | 
|  | 429 | addPass(createPPCQPXLoadSplatPass()); | 
|  | 430 | } | 
| Hal Finkel | 5711eca | 2013-04-09 22:58:37 +0000 | [diff] [blame] | 431 | } | 
|  | 432 |  | 
| Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 433 | void PPCPassConfig::addPreEmitPass() { | 
| Tony Jiang | 8e8c444 | 2017-01-16 20:12:26 +0000 | [diff] [blame] | 434 | addPass(createPPCExpandISELPass()); | 
|  | 435 |  | 
| Hal Finkel | b5aa7e5 | 2013-04-08 16:24:03 +0000 | [diff] [blame] | 436 | if (getOptLevel() != CodeGenOpt::None) | 
| Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 437 | addPass(createPPCEarlyReturnPass(), false); | 
| Chris Lattner | 12e9730 | 2006-09-04 04:14:57 +0000 | [diff] [blame] | 438 | // Must run branch selection immediately preceding the asm printer. | 
| Matthias Braun | 7e37a5f | 2014-12-11 21:26:47 +0000 | [diff] [blame] | 439 | addPass(createPPCBranchSelectionPass(), false); | 
| Chris Lattner | 12e9730 | 2006-09-04 04:14:57 +0000 | [diff] [blame] | 440 | } | 
|  | 441 |  | 
| Chandler Carruth | 8b04c0d | 2015-02-01 13:20:00 +0000 | [diff] [blame] | 442 | TargetIRAnalysis PPCTargetMachine::getTargetIRAnalysis() { | 
| Eric Christopher | a4e5d3c | 2015-09-16 23:38:13 +0000 | [diff] [blame] | 443 | return TargetIRAnalysis([this](const Function &F) { | 
|  | 444 | return TargetTransformInfo(PPCTTIImpl(this, F)); | 
|  | 445 | }); | 
| Hal Finkel | 4e5ca9e | 2013-01-25 23:05:59 +0000 | [diff] [blame] | 446 | } |