blob: e8a87e7f4437feb3f31fe08214bad161434c8a97 [file] [log] [blame]
Jia Liub22310f2012-02-18 12:03:15 +00001//===-- PowerPCSubtarget.cpp - PPC Subtarget Information ------------------===//
Nate Begeman3bcfcd92005-08-04 07:12:09 +00002//
3// The LLVM Compiler Infrastructure
4//
Chris Lattnerf3ebc3f2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Nate Begeman3bcfcd92005-08-04 07:12:09 +00007//
8//===----------------------------------------------------------------------===//
9//
Evan Cheng0d639a22011-07-01 21:01:15 +000010// This file implements the PPC specific subclass of TargetSubtargetInfo.
Nate Begeman3bcfcd92005-08-04 07:12:09 +000011//
12//===----------------------------------------------------------------------===//
13
Chris Lattnerbfca1ab2005-10-14 23:51:18 +000014#include "PPCSubtarget.h"
15#include "PPC.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000016#include "PPCRegisterInfo.h"
Eric Christopher8b770652015-01-26 19:03:15 +000017#include "PPCTargetMachine.h"
Hal Finkela0014a52013-07-15 22:29:40 +000018#include "llvm/CodeGen/MachineFunction.h"
Hal Finkel21442b22013-09-11 23:05:25 +000019#include "llvm/CodeGen/MachineScheduler.h"
Hal Finkela0014a52013-07-15 22:29:40 +000020#include "llvm/IR/Attributes.h"
Hal Finkela0014a52013-07-15 22:29:40 +000021#include "llvm/IR/Function.h"
Chandler Carruth8a8cd2b2014-01-07 11:48:04 +000022#include "llvm/IR/GlobalValue.h"
Hal Finkel5ff00b42015-01-09 02:03:11 +000023#include "llvm/Support/CommandLine.h"
Evan Cheng2bb40352011-08-24 18:08:43 +000024#include "llvm/Support/TargetRegistry.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000025#include "llvm/Target/TargetMachine.h"
Dan Gohman906152a2009-01-05 17:59:02 +000026#include <cstdlib>
Evan Cheng54b68e32011-07-01 20:45:01 +000027
Chandler Carruthd174b722014-04-22 02:03:14 +000028using namespace llvm;
29
Chandler Carruthe96dd892014-04-21 22:55:11 +000030#define DEBUG_TYPE "ppc-subtarget"
31
Evan Cheng54b68e32011-07-01 20:45:01 +000032#define GET_SUBTARGETINFO_TARGET_DESC
Evan Cheng4d1ca962011-07-08 01:53:10 +000033#define GET_SUBTARGETINFO_CTOR
Evan Chengc9c090d2011-07-01 22:36:09 +000034#include "PPCGenSubtargetInfo.inc"
Evan Cheng54b68e32011-07-01 20:45:01 +000035
Hal Finkel5ff00b42015-01-09 02:03:11 +000036static cl::opt<bool> UseSubRegLiveness("ppc-track-subreg-liveness",
37cl::desc("Enable subregister liveness tracking for PPC"), cl::Hidden);
38
Hal Finkelc93a9a22015-02-25 01:06:45 +000039static cl::opt<bool> QPXStackUnaligned("qpx-stack-unaligned",
40 cl::desc("Even when QPX is enabled the stack is not 32-byte aligned"),
41 cl::Hidden);
42
Eric Christopherd104c312014-06-12 20:54:11 +000043PPCSubtarget &PPCSubtarget::initializeSubtargetDependencies(StringRef CPU,
44 StringRef FS) {
45 initializeEnvironment();
Eric Christopherb68e2532014-09-03 20:36:31 +000046 initSubtargetFeatures(CPU, FS);
Eric Christopherd104c312014-06-12 20:54:11 +000047 return *this;
48}
49
Daniel Sandersa73f1fd2015-06-10 12:11:26 +000050PPCSubtarget::PPCSubtarget(const Triple &TT, const std::string &CPU,
Eric Christopherf6ed33e2014-10-01 21:36:28 +000051 const std::string &FS, const PPCTargetMachine &TM)
Daniel Sanders50f17232015-09-15 16:17:27 +000052 : PPCGenSubtargetInfo(TT, CPU, FS), TargetTriple(TT),
Eric Christopher3770cf52014-08-09 04:38:56 +000053 IsPPC64(TargetTriple.getArch() == Triple::ppc64 ||
54 TargetTriple.getArch() == Triple::ppc64le),
Eric Christopherfee6aaf2015-02-17 06:45:15 +000055 TM(TM), FrameLowering(initializeSubtargetDependencies(CPU, FS)),
Mehdi Amini157e5a62015-07-09 02:10:08 +000056 InstrInfo(*this), TLInfo(TM, *this) {}
Eric Christopherb9fd9ed2014-08-07 22:02:54 +000057
Hal Finkela0014a52013-07-15 22:29:40 +000058void PPCSubtarget::initializeEnvironment() {
59 StackAlignment = 16;
60 DarwinDirective = PPC::DIR_NONE;
61 HasMFOCRF = false;
62 Has64BitSupport = false;
63 Use64BitRegs = false;
Hal Finkel940ab932014-02-28 00:27:01 +000064 UseCRBits = false;
Hal Finkela9321052016-10-02 02:10:20 +000065 HasHardFloat = false;
Hal Finkela0014a52013-07-15 22:29:40 +000066 HasAltivec = false;
Joerg Sonnenberger39f095a2014-08-07 12:18:21 +000067 HasSPE = false;
Hal Finkela0014a52013-07-15 22:29:40 +000068 HasQPX = false;
Hal Finkel27774d92014-03-13 07:58:58 +000069 HasVSX = false;
Bill Schmidtdcce0232014-10-10 17:21:15 +000070 HasP8Vector = false;
Bill Schmidtfe88b182015-02-03 21:58:23 +000071 HasP8Altivec = false;
Nemanja Ivanovice8effe12015-03-04 20:44:33 +000072 HasP8Crypto = false;
Kit Barton93612ec2016-02-26 21:11:55 +000073 HasP9Vector = false;
74 HasP9Altivec = false;
Hal Finkeldbc78e12013-08-19 05:01:02 +000075 HasFCPSGN = false;
Hal Finkela0014a52013-07-15 22:29:40 +000076 HasFSQRT = false;
77 HasFRE = false;
78 HasFRES = false;
79 HasFRSQRTE = false;
80 HasFRSQRTES = false;
81 HasRecipPrec = false;
82 HasSTFIWX = false;
83 HasLFIWAX = false;
84 HasFPRND = false;
85 HasFPCVT = false;
86 HasISEL = false;
Nemanja Ivanovicc0904792015-04-09 23:54:37 +000087 HasBPERMD = false;
88 HasExtDiv = false;
Hal Finkel4edc66b2015-01-03 01:16:37 +000089 HasCMPB = false;
Hal Finkela0014a52013-07-15 22:29:40 +000090 HasLDBRX = false;
91 IsBookE = false;
Hal Finkelfe3368c2014-10-02 22:34:22 +000092 HasOnlyMSYNC = false;
Joerg Sonnenberger0b2ebcb2014-08-04 15:47:38 +000093 IsPPC4xx = false;
Joerg Sonnenberger74052102014-08-04 17:07:41 +000094 IsPPC6xx = false;
Joerg Sonnenberger0b2ebcb2014-08-04 15:47:38 +000095 IsE500 = false;
Kit Barton4f79f962015-06-16 16:01:15 +000096 FeatureMFTB = false;
Hal Finkel0096dbd2013-09-12 14:40:06 +000097 DeprecatedDST = false;
Hal Finkela0014a52013-07-15 22:29:40 +000098 HasLazyResolverStubs = false;
Bill Schmidt082cfc02015-01-14 20:17:10 +000099 HasICBT = false;
Hal Finkele2ab0f12015-01-15 21:17:34 +0000100 HasInvariantFunctionDescriptors = false;
Nemanja Ivanovic0adf26b2015-03-10 20:51:07 +0000101 HasPartwordAtomics = false;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +0000102 HasDirectMove = false;
Hal Finkelc93a9a22015-02-25 01:06:45 +0000103 IsQPXStackUnaligned = false;
Kit Barton535e69d2015-03-25 19:36:23 +0000104 HasHTM = false;
Eric Christopher25bf4a82015-11-20 22:38:20 +0000105 HasFusion = false;
Nemanja Ivanovicb033f672015-12-15 12:19:34 +0000106 HasFloat128 = false;
Nemanja Ivanovica621a7f2016-03-31 15:26:37 +0000107 IsISA3_0 = false;
Hal Finkelb074a602016-08-30 00:59:23 +0000108 UseLongCalls = false;
Hal Finkelfa7057a2016-03-29 01:36:01 +0000109
110 HasPOPCNTD = POPCNTD_Unavailable;
Hal Finkela0014a52013-07-15 22:29:40 +0000111}
112
Eric Christopherb68e2532014-09-03 20:36:31 +0000113void PPCSubtarget::initSubtargetFeatures(StringRef CPU, StringRef FS) {
Jim Laskey19058c32005-09-01 21:38:21 +0000114 // Determine default and user specified characteristics
Evan Chengfe6e4052011-06-30 01:53:36 +0000115 std::string CPUName = CPU;
Nemanja Ivanovic1a5706c2016-02-29 16:42:27 +0000116 if (CPUName.empty() || CPU == "generic") {
Bill Schmidt8cf15ce2015-01-29 15:59:09 +0000117 // If cross-compiling with -march=ppc64le without -mcpu
118 if (TargetTriple.getArch() == Triple::ppc64le)
119 CPUName = "ppc64le";
120 else
121 CPUName = "generic";
122 }
Jim Laskeya2b52352005-10-26 17:30:34 +0000123
Evan Cheng54b68e32011-07-01 20:45:01 +0000124 // Initialize scheduling itinerary for the specified CPU.
125 InstrItins = getInstrItineraryForCPU(CPUName);
126
Adhemerval Zanellaf2aceda2012-10-25 12:27:42 +0000127 // Parse features string.
Eric Christopher36448af2014-10-01 20:38:26 +0000128 ParseSubtargetFeatures(CPUName, FS);
Adhemerval Zanellaf2aceda2012-10-25 12:27:42 +0000129
Chris Lattner16682ff2006-06-16 17:50:12 +0000130 // If the user requested use of 64-bit regs, but the cpu selected doesn't
Dale Johannesen2e019122008-02-15 18:40:53 +0000131 // support it, ignore.
Eric Christopher36448af2014-10-01 20:38:26 +0000132 if (IsPPC64 && has64BitSupport())
133 Use64BitRegs = true;
Chris Lattnerf4646a72006-12-11 23:22:45 +0000134
135 // Set up darwin-specific properties.
Chris Lattnere6555212009-08-11 22:49:34 +0000136 if (isDarwin())
Chris Lattnerf4646a72006-12-11 23:22:45 +0000137 HasLazyResolverStubs = true;
Hal Finkele1df9092013-01-30 23:43:27 +0000138
139 // QPX requires a 32-byte aligned stack. Note that we need to do this if
140 // we're compiling for a BG/Q system regardless of whether or not QPX
141 // is enabled because external functions will assume this alignment.
Hal Finkelc93a9a22015-02-25 01:06:45 +0000142 IsQPXStackUnaligned = QPXStackUnaligned;
143 StackAlignment = getPlatformStackAlignment();
Bill Schmidt0a9170d2013-07-26 01:35:43 +0000144
145 // Determine endianness.
Eric Christopher75dc3902015-02-17 06:45:17 +0000146 // FIXME: Part of the TargetMachine.
Bill Schmidt0a9170d2013-07-26 01:35:43 +0000147 IsLittleEndian = (TargetTriple.getArch() == Triple::ppc64le);
Chris Lattnerf4646a72006-12-11 23:22:45 +0000148}
149
Rafael Espindola65787a92016-06-23 20:50:42 +0000150/// Return true if accesses to the specified global have to go through a dyld
151/// lazy resolution stub. This means that an extra load is required to get the
152/// address of the global.
Eric Christophere8dbfe12015-02-13 22:23:04 +0000153bool PPCSubtarget::hasLazyResolverStub(const GlobalValue *GV) const {
Rafael Espindola65787a92016-06-23 20:50:42 +0000154 if (!HasLazyResolverStubs)
Chris Lattnerf4646a72006-12-11 23:22:45 +0000155 return false;
Rafael Espindola3beef8d2016-06-27 23:15:57 +0000156 if (!TM.shouldAssumeDSOLocal(*GV->getParent(), GV))
Rafael Espindola65787a92016-06-23 20:50:42 +0000157 return true;
158 // 32 bit macho has no relocation for a-b if a is undefined, even if b is in
159 // the section that is being relocated. This means we have to use o load even
160 // for GVs that are known to be local to the dso.
161 if (GV->isDeclarationForLinker() || GV->hasCommonLinkage())
162 return true;
163 return false;
Nate Begeman3bcfcd92005-08-04 07:12:09 +0000164}
Hal Finkel58ca3602011-12-02 04:58:02 +0000165
Hal Finkel42daeae2013-11-30 20:55:12 +0000166// Embedded cores need aggressive scheduling (and some others also benefit).
Hal Finkel21442b22013-09-11 23:05:25 +0000167static bool needsAggressiveScheduling(unsigned Directive) {
168 switch (Directive) {
169 default: return false;
170 case PPC::DIR_440:
171 case PPC::DIR_A2:
172 case PPC::DIR_E500mc:
173 case PPC::DIR_E5500:
Hal Finkel42daeae2013-11-30 20:55:12 +0000174 case PPC::DIR_PWR7:
Will Schmidt970ff642014-06-26 13:36:19 +0000175 case PPC::DIR_PWR8:
Nemanja Ivanovic6e29baf2016-05-09 18:54:58 +0000176 // FIXME: Same as P8 until POWER9 scheduling info is available
177 case PPC::DIR_PWR9:
Hal Finkel21442b22013-09-11 23:05:25 +0000178 return true;
179 }
180}
181
182bool PPCSubtarget::enableMachineScheduler() const {
183 // Enable MI scheduling for the embedded cores.
184 // FIXME: Enable this for all cores (some additional modeling
185 // may be necessary).
186 return needsAggressiveScheduling(DarwinDirective);
187}
188
Sanjay Patela2f658d2014-07-15 22:39:58 +0000189// This overrides the PostRAScheduler bit in the SchedModel for each CPU.
Matthias Braun39a2afc2015-06-13 03:42:16 +0000190bool PPCSubtarget::enablePostRAScheduler() const { return true; }
Sanjay Patela2f658d2014-07-15 22:39:58 +0000191
192PPCGenSubtargetInfo::AntiDepBreakMode PPCSubtarget::getAntiDepBreakMode() const {
193 return TargetSubtargetInfo::ANTIDEP_ALL;
194}
195
196void PPCSubtarget::getCriticalPathRCs(RegClassVector &CriticalPathRCs) const {
197 CriticalPathRCs.clear();
198 CriticalPathRCs.push_back(isPPC64() ?
199 &PPC::G8RCRegClass : &PPC::GPRCRegClass);
200}
201
Hal Finkel21442b22013-09-11 23:05:25 +0000202void PPCSubtarget::overrideSchedPolicy(MachineSchedPolicy &Policy,
Hal Finkel21442b22013-09-11 23:05:25 +0000203 unsigned NumRegionInstrs) const {
204 if (needsAggressiveScheduling(DarwinDirective)) {
205 Policy.OnlyTopDown = false;
206 Policy.OnlyBottomUp = false;
207 }
208
209 // Spilling is generally expensive on all PPC cores, so always enable
210 // register-pressure tracking.
211 Policy.ShouldTrackPressure = true;
212}
213
214bool PPCSubtarget::useAA() const {
215 // Use AA during code generation for the embedded cores.
216 return needsAggressiveScheduling(DarwinDirective);
217}
218
Hal Finkel5ff00b42015-01-09 02:03:11 +0000219bool PPCSubtarget::enableSubRegLiveness() const {
220 return UseSubRegLiveness;
221}
222
Eric Christopherc1808362015-11-20 20:51:31 +0000223unsigned char PPCSubtarget::classifyGlobalReference(
224 const GlobalValue *GV) const {
225 // Note that currently we don't generate non-pic references.
226 // If a caller wants that, this will have to be updated.
227
228 // Large code model always uses the TOC even for local symbols.
229 if (TM.getCodeModel() == CodeModel::Large)
230 return PPCII::MO_PIC_FLAG | PPCII::MO_NLP_FLAG;
231
232 unsigned char flags = PPCII::MO_PIC_FLAG;
233
234 // Only if the relocation mode is PIC do we have to worry about
235 // interposition. In all other cases we can use a slightly looser standard to
236 // decide how to access the symbol.
237 if (TM.getRelocationModel() == Reloc::PIC_) {
238 // If it's local, or it's non-default, it can't be interposed.
239 if (!GV->hasLocalLinkage() &&
240 GV->hasDefaultVisibility()) {
241 flags |= PPCII::MO_NLP_FLAG;
242 }
243 return flags;
244 }
245
246 if (GV->isStrongDefinitionForLinker())
247 return flags;
248 return flags | PPCII::MO_NLP_FLAG;
249}
250
Eric Christopherfee6aaf2015-02-17 06:45:15 +0000251bool PPCSubtarget::isELFv2ABI() const { return TM.isELFv2ABI(); }
252bool PPCSubtarget::isPPC64() const { return TM.isPPC64(); }