blob: b0ce1335bd37ddb3acd650f42d74e75dbf3d26d3 [file] [log] [blame]
Bill Wendling2bce78e2010-12-04 23:57:24 +00001//===-- X86Subtarget.cpp - X86 Subtarget Information ----------------------===//
Nate Begemanf26625e2005-07-12 01:41:54 +00002//
3// The LLVM Compiler Infrastructure
4//
Chris Lattnerf3ebc3f2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Nate Begemanf26625e2005-07-12 01:41:54 +00007//
8//===----------------------------------------------------------------------===//
9//
Evan Cheng0d639a22011-07-01 21:01:15 +000010// This file implements the X86 specific subclass of TargetSubtargetInfo.
Nate Begemanf26625e2005-07-12 01:41:54 +000011//
12//===----------------------------------------------------------------------===//
13
Quentin Colombet8cf805a2017-07-01 00:45:50 +000014#include "X86.h"
15
Quentin Colombet8cf805a2017-07-01 00:45:50 +000016#include "X86CallLowering.h"
17#include "X86LegalizerInfo.h"
18#include "X86RegisterBankInfo.h"
Nate Begemanf26625e2005-07-12 01:41:54 +000019#include "X86Subtarget.h"
Chandler Carruth6bda14b2017-06-06 11:49:48 +000020#include "MCTargetDesc/X86BaseInfo.h"
Eric Christopher4629ed72014-08-09 01:07:25 +000021#include "X86TargetMachine.h"
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000022#include "llvm/ADT/Triple.h"
Quentin Colombet8cf805a2017-07-01 00:45:50 +000023#include "llvm/CodeGen/GlobalISel/CallLowering.h"
24#include "llvm/CodeGen/GlobalISel/InstructionSelect.h"
25#include "llvm/CodeGen/GlobalISel/Legalizer.h"
26#include "llvm/CodeGen/GlobalISel/RegBankSelect.h"
Bill Wendlingaef9c372013-02-15 22:31:27 +000027#include "llvm/IR/Attributes.h"
Peter Collingbournedc5e5832017-02-02 00:32:03 +000028#include "llvm/IR/ConstantRange.h"
Bill Wendlingaef9c372013-02-15 22:31:27 +000029#include "llvm/IR/Function.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000030#include "llvm/IR/GlobalValue.h"
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000031#include "llvm/Support/Casting.h"
32#include "llvm/Support/CodeGen.h"
Eric Christopher3470bbb2014-05-21 23:51:57 +000033#include "llvm/Support/CommandLine.h"
Evan Cheng9a3ec1b2009-01-03 04:04:46 +000034#include "llvm/Support/Debug.h"
Rafael Espindola65596562011-09-07 16:10:57 +000035#include "llvm/Support/ErrorHandling.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000036#include "llvm/Support/raw_ostream.h"
Anton Korobeynikov430e68a12006-12-22 22:29:05 +000037#include "llvm/Target/TargetMachine.h"
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000038#include <cassert>
39#include <string>
Evan Cheng54b68e32011-07-01 20:45:01 +000040
Chris Lattner3ad60b12009-04-25 18:27:23 +000041#if defined(_MSC_VER)
Bill Wendling6eecd562009-08-03 00:11:34 +000042#include <intrin.h>
Chris Lattner3ad60b12009-04-25 18:27:23 +000043#endif
44
Chandler Carruth84e68b22014-04-22 02:41:26 +000045using namespace llvm;
46
47#define DEBUG_TYPE "subtarget"
48
Chandler Carruthd174b722014-04-22 02:03:14 +000049#define GET_SUBTARGETINFO_TARGET_DESC
50#define GET_SUBTARGETINFO_CTOR
51#include "X86GenSubtargetInfo.inc"
52
Eric Christopher6b0fcfe2014-05-21 23:40:26 +000053// Temporary option to control early if-conversion for x86 while adding machine
54// models.
55static cl::opt<bool>
56X86EarlyIfConv("x86-early-ifcvt", cl::Hidden,
57 cl::desc("Enable early if-conversion on X86"));
58
59
Sanjay Patel2e753412015-08-14 15:11:42 +000060/// Classify a blockaddress reference for the current subtarget according to how
61/// we should reference it in a non-pcrel context.
Rafael Espindolacb2d2662016-05-19 18:34:20 +000062unsigned char X86Subtarget::classifyBlockAddressReference() const {
Rafael Espindolac7e98132016-05-20 12:20:10 +000063 return classifyLocalReference(nullptr);
64}
Chad Rosier24c19d22012-08-01 18:39:17 +000065
Sanjay Patel2e753412015-08-14 15:11:42 +000066/// Classify a global variable reference for the current subtarget according to
67/// how we should reference it in a non-pcrel context.
Rafael Espindolaab03eb02016-05-19 22:07:57 +000068unsigned char
69X86Subtarget::classifyGlobalReference(const GlobalValue *GV) const {
Rafael Espindolac7e98132016-05-20 12:20:10 +000070 return classifyGlobalReference(GV, *GV->getParent());
71}
Chris Lattnerdc842c02009-07-10 07:20:05 +000072
Rafael Espindolac7e98132016-05-20 12:20:10 +000073unsigned char
74X86Subtarget::classifyLocalReference(const GlobalValue *GV) const {
75 // 64 bits can use %rip addressing for anything local.
76 if (is64Bit())
Chris Lattnerdc842c02009-07-10 07:20:05 +000077 return X86II::MO_NO_FLAG;
Chad Rosier24c19d22012-08-01 18:39:17 +000078
Rafael Espindolac7e98132016-05-20 12:20:10 +000079 // If this is for a position dependent executable, the static linker can
80 // figure it out.
Davide Italianoef5d8be2016-06-18 00:03:20 +000081 if (!isPositionIndependent())
Rafael Espindolac7e98132016-05-20 12:20:10 +000082 return X86II::MO_NO_FLAG;
Sriraman Tallam3cb77342016-04-22 21:41:58 +000083
Rafael Espindolac7e98132016-05-20 12:20:10 +000084 // The COFF dynamic linker just patches the executable sections.
85 if (isTargetCOFF())
86 return X86II::MO_NO_FLAG;
Chad Rosier24c19d22012-08-01 18:39:17 +000087
Rafael Espindolac7e98132016-05-20 12:20:10 +000088 if (isTargetDarwin()) {
89 // 32 bit macho has no relocation for a-b if a is undefined, even if
90 // b is in the section that is being relocated.
91 // This means we have to use o load even for GVs that are known to be
92 // local to the dso.
93 if (GV && (GV->isDeclarationForLinker() || GV->hasCommonLinkage()))
Chris Lattnerbd3e5602009-07-10 20:53:38 +000094 return X86II::MO_DARWIN_NONLAZY_PIC_BASE;
Chad Rosier24c19d22012-08-01 18:39:17 +000095
Chris Lattnerbd3e5602009-07-10 20:53:38 +000096 return X86II::MO_PIC_BASE_OFFSET;
97 }
Chad Rosier24c19d22012-08-01 18:39:17 +000098
Rafael Espindolac7e98132016-05-20 12:20:10 +000099 return X86II::MO_GOTOFF;
100}
Chad Rosier24c19d22012-08-01 18:39:17 +0000101
Rafael Espindolac7e98132016-05-20 12:20:10 +0000102unsigned char X86Subtarget::classifyGlobalReference(const GlobalValue *GV,
103 const Module &M) const {
104 // Large model never uses stubs.
105 if (TM.getCodeModel() == CodeModel::Large)
Chris Lattnerbd3e5602009-07-10 20:53:38 +0000106 return X86II::MO_NO_FLAG;
Rafael Espindolac7e98132016-05-20 12:20:10 +0000107
Peter Collingbourne235c2752016-12-08 19:01:00 +0000108 // Absolute symbols can be referenced directly.
Peter Collingbournedc5e5832017-02-02 00:32:03 +0000109 if (GV) {
110 if (Optional<ConstantRange> CR = GV->getAbsoluteSymbolRange()) {
111 // See if we can use the 8-bit immediate form. Note that some instructions
112 // will sign extend the immediate operand, so to be conservative we only
113 // accept the range [0,128).
114 if (CR->getUnsignedMax().ult(128))
115 return X86II::MO_ABS8;
116 else
117 return X86II::MO_NO_FLAG;
118 }
119 }
Peter Collingbourne235c2752016-12-08 19:01:00 +0000120
Rafael Espindola2393c3b2017-10-27 21:18:48 +0000121 if (TM.shouldAssumeDSOLocal(M, GV))
Rafael Espindolac7e98132016-05-20 12:20:10 +0000122 return classifyLocalReference(GV);
123
124 if (isTargetCOFF())
125 return X86II::MO_DLLIMPORT;
126
127 if (is64Bit())
128 return X86II::MO_GOTPCREL;
129
130 if (isTargetDarwin()) {
Davide Italianoef5d8be2016-06-18 00:03:20 +0000131 if (!isPositionIndependent())
Rafael Espindolac7e98132016-05-20 12:20:10 +0000132 return X86II::MO_DARWIN_NONLAZY;
133 return X86II::MO_DARWIN_NONLAZY_PIC_BASE;
Chris Lattnerdc842c02009-07-10 07:20:05 +0000134 }
Chad Rosier24c19d22012-08-01 18:39:17 +0000135
Rafael Espindolac7e98132016-05-20 12:20:10 +0000136 return X86II::MO_GOT;
Chris Lattnerdc842c02009-07-10 07:20:05 +0000137}
138
Rafael Espindola46107b92016-05-19 18:49:29 +0000139unsigned char
140X86Subtarget::classifyGlobalFunctionReference(const GlobalValue *GV) const {
Rafael Espindolac7e98132016-05-20 12:20:10 +0000141 return classifyGlobalFunctionReference(GV, *GV->getParent());
142}
143
144unsigned char
145X86Subtarget::classifyGlobalFunctionReference(const GlobalValue *GV,
146 const Module &M) const {
Rafael Espindola3beef8d2016-06-27 23:15:57 +0000147 if (TM.shouldAssumeDSOLocal(M, GV))
Rafael Espindolac7e98132016-05-20 12:20:10 +0000148 return X86II::MO_NO_FLAG;
149
Reid Kleckner7662d502017-08-05 00:10:43 +0000150 if (isTargetCOFF()) {
151 assert(GV->hasDLLImportStorageClass() &&
152 "shouldAssumeDSOLocal gave inconsistent answer");
153 return X86II::MO_DLLIMPORT;
154 }
155
Oren Ben Simhon51de0332017-05-04 07:22:49 +0000156 const Function *F = dyn_cast_or_null<Function>(GV);
Rafael Espindolac7e98132016-05-20 12:20:10 +0000157
Oren Ben Simhon51de0332017-05-04 07:22:49 +0000158 if (isTargetELF()) {
159 if (is64Bit() && F && (CallingConv::X86_RegCall == F->getCallingConv()))
160 // According to psABI, PLT stub clobbers XMM8-XMM15.
161 // In Regcall calling convention those registers are used for passing
162 // parameters. Thus we need to prevent lazy binding in Regcall.
163 return X86II::MO_GOTPCREL;
Asaf Badouh89406d12016-04-20 08:32:57 +0000164 return X86II::MO_PLT;
Oren Ben Simhon51de0332017-05-04 07:22:49 +0000165 }
Rafael Espindolac7e98132016-05-20 12:20:10 +0000166
167 if (is64Bit()) {
Rafael Espindolac7e98132016-05-20 12:20:10 +0000168 if (F && F->hasFnAttribute(Attribute::NonLazyBind))
169 // If the function is marked as non-lazy, generate an indirect call
170 // which loads from the GOT directly. This avoids runtime overhead
171 // at the cost of eager binding (and one extra byte of encoding).
172 return X86II::MO_GOTPCREL;
173 return X86II::MO_NO_FLAG;
Asaf Badouh89406d12016-04-20 08:32:57 +0000174 }
175
176 return X86II::MO_NO_FLAG;
177}
Anton Korobeynikov6dbdfe22006-11-30 22:42:55 +0000178
Sanjay Patel2e753412015-08-14 15:11:42 +0000179/// This function returns the name of a function which has an interface like
180/// the non-standard bzero function, if such a function exists on the
181/// current subtarget and it is considered preferable over memset with zero
Bill Wendlingbd092622008-09-30 21:22:07 +0000182/// passed as the second argument. Otherwise it returns null.
Bill Wendling17825842008-09-30 22:05:33 +0000183const char *X86Subtarget::getBZeroEntry() const {
Dan Gohman980d7202008-04-01 20:38:36 +0000184 // Darwin 10 has a __bzero entry point for this purpose.
Daniel Dunbarcd01ed52011-04-20 00:14:25 +0000185 if (getTargetTriple().isMacOSX() &&
186 !getTargetTriple().isMacOSXVersionLT(10, 6))
Bill Wendling17825842008-09-30 22:05:33 +0000187 return "__bzero";
Dan Gohman980d7202008-04-01 20:38:36 +0000188
Craig Topper062a2ba2014-04-25 05:30:21 +0000189 return nullptr;
Dan Gohman980d7202008-04-01 20:38:36 +0000190}
191
Evan Cheng0e88c7d2013-01-29 02:32:37 +0000192bool X86Subtarget::hasSinCos() const {
Petr Hosek710479c2017-07-23 22:30:00 +0000193 if (getTargetTriple().isMacOSX()) {
194 return !getTargetTriple().isMacOSXVersionLT(10, 9) && is64Bit();
195 } else if (getTargetTriple().isOSFuchsia()) {
196 return true;
197 }
198 return false;
Evan Cheng0e88c7d2013-01-29 02:32:37 +0000199}
200
Sanjay Patel2e753412015-08-14 15:11:42 +0000201/// Return true if the subtarget allows calls to immediate address.
Rafael Espindola46107b92016-05-19 18:49:29 +0000202bool X86Subtarget::isLegalToCallImmediateAddr() const {
David Majnemer02f21882014-03-28 21:40:47 +0000203 // FIXME: I386 PE/COFF supports PC relative calls using IMAGE_REL_I386_REL32
204 // but WinCOFFObjectWriter::RecordRelocation cannot emit them. Once it does,
205 // the following check for Win32 should be removed.
206 if (In64BitMode || isTargetWin32())
Evan Cheng96098332009-05-20 04:53:57 +0000207 return false;
Rafael Espindolaab03eb02016-05-19 22:07:57 +0000208 return isTargetELF() || TM.getRelocationModel() == Reloc::Static;
Evan Cheng96098332009-05-20 04:53:57 +0000209}
210
Eric Christopherb68e2532014-09-03 20:36:31 +0000211void X86Subtarget::initSubtargetFeatures(StringRef CPU, StringRef FS) {
Nadav Rotem08ab8772013-02-27 05:56:20 +0000212 std::string CPUName = CPU;
Jim Grosbach48551fb2014-04-12 01:34:29 +0000213 if (CPUName.empty())
214 CPUName = "generic";
Evan Cheng964cb5f2011-07-08 21:14:14 +0000215
Jim Grosbach48551fb2014-04-12 01:34:29 +0000216 // Make sure 64-bit features are available in 64-bit mode. (But make sure
217 // SSE2 can be turned off explicitly.)
218 std::string FullFS = FS;
219 if (In64BitMode) {
220 if (!FullFS.empty())
221 FullFS = "+64bit,+sse2," + FullFS;
222 else
223 FullFS = "+64bit,+sse2";
Evan Cheng11b0a5d2006-09-08 06:48:29 +0000224 }
Evan Chengc5e6d2f2011-07-11 03:57:24 +0000225
Hans Wennborg5000ce82015-12-04 23:00:33 +0000226 // LAHF/SAHF are always supported in non-64-bit mode.
227 if (!In64BitMode) {
228 if (!FullFS.empty())
229 FullFS = "+sahf," + FullFS;
230 else
231 FullFS = "+sahf";
232 }
233
Duncan P. N. Exon Smithbb57d732015-07-10 22:33:01 +0000234 // Parse features string and set the CPU.
Jim Grosbach48551fb2014-04-12 01:34:29 +0000235 ParseSubtargetFeatures(CPUName, FullFS);
236
Sanjay Pateldeb8f822015-08-25 16:29:21 +0000237 // All CPUs that implement SSE4.2 or SSE4A support unaligned accesses of
238 // 16-bytes and under that are reasonably fast. These features were
239 // introduced with Intel's Nehalem/Silvermont and AMD's Family10h
240 // micro-architectures respectively.
241 if (hasSSE42() || hasSSE4A())
Sanjay Patel30145672015-09-01 20:51:51 +0000242 IsUAMem16Slow = false;
Sanjay Pateldeb8f822015-08-25 16:29:21 +0000243
Andrew Tricke0c83b12012-08-07 00:25:30 +0000244 InstrItins = getInstrItineraryForCPU(CPUName);
Andrew Trick8523b162012-02-01 23:20:51 +0000245
Evan Chengc5e6d2f2011-07-11 03:57:24 +0000246 // It's important to keep the MCSubtargetInfo feature bits in sync with
247 // target data structure which is shared with MC code emitter, etc.
248 if (In64BitMode)
249 ToggleFeature(X86::Mode64Bit);
Craig Topper3c80d622014-01-06 04:55:54 +0000250 else if (In32BitMode)
251 ToggleFeature(X86::Mode32Bit);
252 else if (In16BitMode)
253 ToggleFeature(X86::Mode16Bit);
254 else
255 llvm_unreachable("Not 16-bit, 32-bit or 64-bit mode!");
Evan Chengc5e6d2f2011-07-11 03:57:24 +0000256
David Greene00411812010-01-05 01:29:13 +0000257 DEBUG(dbgs() << "Subtarget features: SSELevel " << X86SSELevel
Bill Wendling6eecd562009-08-03 00:11:34 +0000258 << ", 3DNowLevel " << X863DNowLevel
259 << ", 64bit " << HasX86_64 << "\n");
Evan Cheng13bcc6c2011-07-07 21:06:52 +0000260 assert((!In64BitMode || HasX86_64) &&
Dan Gohman74037512009-02-03 00:04:43 +0000261 "64-bit code requested on a subtarget that doesn't support it!");
Evan Cheng11b0a5d2006-09-08 06:48:29 +0000262
Marcin Koscielnicki0275fac2016-05-05 11:35:51 +0000263 // Stack alignment is 16 bytes on Darwin, Linux, kFreeBSD and Solaris (both
Roman Divackye8a93fe82011-02-22 17:30:05 +0000264 // 32 and 64 bit) and for all 64-bit targets.
Evan Cheng3a0c5e52011-06-23 17:54:54 +0000265 if (StackAlignOverride)
266 stackAlignment = StackAlignOverride;
Roman Divacky22135672012-11-09 20:10:44 +0000267 else if (isTargetDarwin() || isTargetLinux() || isTargetSolaris() ||
Marcin Koscielnicki0275fac2016-05-05 11:35:51 +0000268 isTargetKFreeBSD() || In64BitMode)
Nate Begemanf26625e2005-07-12 01:41:54 +0000269 stackAlignment = 16;
Mohammed Agabariae9aebf22017-09-13 09:00:27 +0000270
271 // Gather is available since Haswell (AVX2 set). So technically, we can generate Gathers
272 // on all AVX2 processors. But the overhead on HSW is high. Skylake Client processor has
273 // faster Gathers than HSW and performance is similar to Skylake Server (AVX-512).
274 // The specified overhead is relative to the Load operation."2" is the number provided
275 // by Intel architects, This parameter is used for cost estimation of Gather Op and
276 // comparison with other alternatives.
277 if (X86ProcFamily == IntelSkylake || hasAVX512())
278 GatherOverhead = 2;
279 if (hasAVX512())
280 ScatterOverhead = 2;
Dan Gohmandc53f1c2010-05-27 18:43:40 +0000281}
Andrew Trick8523b162012-02-01 23:20:51 +0000282
Bill Wendling61375d82013-02-16 01:36:26 +0000283void X86Subtarget::initializeEnvironment() {
Eric Christopher11e59832015-10-08 20:10:06 +0000284 X86SSELevel = NoSSE;
Bill Wendling61375d82013-02-16 01:36:26 +0000285 X863DNowLevel = NoThreeDNow;
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000286 HasX87 = false;
Bill Wendling61375d82013-02-16 01:36:26 +0000287 HasCMov = false;
288 HasX86_64 = false;
289 HasPOPCNT = false;
290 HasSSE4A = false;
291 HasAES = false;
Craig Topper09b65982015-10-16 06:03:09 +0000292 HasFXSR = false;
Amjad Aboud1db6d7a2015-10-12 11:47:46 +0000293 HasXSAVE = false;
294 HasXSAVEOPT = false;
295 HasXSAVEC = false;
296 HasXSAVES = false;
Bill Wendling61375d82013-02-16 01:36:26 +0000297 HasPCLMUL = false;
298 HasFMA = false;
299 HasFMA4 = false;
300 HasXOP = false;
Yunzhong Gaodd36e932013-09-24 18:21:52 +0000301 HasTBM = false;
Simon Pilgrim99b925b2017-05-03 15:51:39 +0000302 HasLWP = false;
Bill Wendling61375d82013-02-16 01:36:26 +0000303 HasMOVBE = false;
304 HasRDRAND = false;
305 HasF16C = false;
306 HasFSGSBase = false;
307 HasLZCNT = false;
308 HasBMI = false;
309 HasBMI2 = false;
Michael Zuckerman97b6a6922016-01-17 13:42:12 +0000310 HasVBMI = false;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000311 HasIFMA = false;
Bill Wendling61375d82013-02-16 01:36:26 +0000312 HasRTM = false;
Elena Demikhovsky003e7d72013-07-28 08:28:38 +0000313 HasERI = false;
314 HasCDI = false;
Craig Topper7a8cf012013-08-20 05:23:59 +0000315 HasPFI = false;
Robert Khasanovbfa01312014-07-21 14:54:21 +0000316 HasDQI = false;
Oren Ben Simhon7bf27f02017-05-25 13:45:23 +0000317 HasVPOPCNTDQ = false;
Robert Khasanovbfa01312014-07-21 14:54:21 +0000318 HasBWI = false;
319 HasVLX = false;
Bill Wendling61375d82013-02-16 01:36:26 +0000320 HasADX = false;
Asaf Badouh5acf66f2015-12-15 13:35:29 +0000321 HasPKU = false;
Ben Langmuir16501752013-09-12 15:51:31 +0000322 HasSHA = false;
Michael Liao5173ee02013-03-26 17:47:11 +0000323 HasPRFCHW = false;
Michael Liaoa486a112013-03-28 23:41:26 +0000324 HasRDSEED = false;
Hans Wennborg5000ce82015-12-04 23:00:33 +0000325 HasLAHFSAHF = false;
Ashutosh Nema348af9c2016-05-18 11:59:12 +0000326 HasMWAITX = false;
Craig Topper50f3d142017-02-09 04:27:34 +0000327 HasCLZERO = false;
Elena Demikhovskyf7e641c2015-06-03 10:30:57 +0000328 HasMPX = false;
Tim Northover9bb69312017-05-01 17:50:15 +0000329 HasSGX = false;
330 HasCLFLUSHOPT = false;
331 HasCLWB = false;
Zvi Rackover8bc7e4d2016-12-06 19:35:20 +0000332 IsPMULLDSlow = false;
Ekaterina Romanovad5fa5542013-11-21 23:21:26 +0000333 IsSHLDSlow = false;
Sanjay Patel30145672015-09-01 20:51:51 +0000334 IsUAMem16Slow = false;
Sanjay Patel501890e2014-11-21 17:40:04 +0000335 IsUAMem32Slow = false;
Sanjay Patelffd039b2015-02-03 17:13:04 +0000336 HasSSEUnalignedMem = false;
Bill Wendling61375d82013-02-16 01:36:26 +0000337 HasCmpxchg16b = false;
338 UseLeaForSP = false;
Amjad Aboud4f977512017-03-03 09:03:24 +0000339 HasFastPartialYMMorZMMWrite = false;
Nikolai Bozhenovf6795302016-08-04 12:47:28 +0000340 HasFastScalarFSQRT = false;
341 HasFastVectorFSQRT = false;
Pierre Gousseaub6d652a2016-10-14 16:41:38 +0000342 HasFastLZCNT = false;
Craig Topperd88389a2017-02-21 06:39:13 +0000343 HasFastSHLDRotate = false;
Craig Topper641e2af2017-08-30 04:34:48 +0000344 HasMacroFusion = false;
Clement Courbet203fc172017-04-21 09:20:50 +0000345 HasERMSB = false;
Alexey Volkovfd1731d2014-11-21 11:19:34 +0000346 HasSlowDivide32 = false;
347 HasSlowDivide64 = false;
Bill Wendling61375d82013-02-16 01:36:26 +0000348 PadShortFunctions = false;
Craig Topper62c47a22017-08-29 05:14:27 +0000349 SlowTwoMemOps = false;
Preston Gurd8b7ab4b2013-04-25 20:29:37 +0000350 LEAUsesAG = false;
Alexey Volkov6226de62014-05-20 08:55:50 +0000351 SlowLEA = false;
Lama Saba2ea271b2017-05-18 08:11:50 +0000352 Slow3OpsLEA = false;
Alexey Volkov5260dba2014-06-09 11:40:41 +0000353 SlowIncDec = false;
Bill Wendling61375d82013-02-16 01:36:26 +0000354 stackAlignment = 4;
355 // FIXME: this is a known good value for Yonah. How about others?
356 MaxInlineSizeThreshold = 128;
Eric Christopher824f42f2015-05-12 01:26:05 +0000357 UseSoftFloat = false;
Mohammed Agabariae9aebf22017-09-13 09:00:27 +0000358 X86ProcFamily = Others;
359 GatherOverhead = 1024;
360 ScatterOverhead = 1024;
Bill Wendling61375d82013-02-16 01:36:26 +0000361}
362
Eric Christopher1a212032014-06-11 00:25:19 +0000363X86Subtarget &X86Subtarget::initializeSubtargetDependencies(StringRef CPU,
364 StringRef FS) {
365 initializeEnvironment();
Eric Christopherb68e2532014-09-03 20:36:31 +0000366 initSubtargetFeatures(CPU, FS);
Eric Christopher1a212032014-06-11 00:25:19 +0000367 return *this;
368}
369
David Majnemerca290232016-05-20 18:16:06 +0000370X86Subtarget::X86Subtarget(const Triple &TT, StringRef CPU, StringRef FS,
371 const X86TargetMachine &TM,
Daniel Sandersa1b2db792017-05-19 11:08:33 +0000372 unsigned StackAlignOverride)
Daniel Sanders50f17232015-09-15 16:17:27 +0000373 : X86GenSubtargetInfo(TT, CPU, FS), X86ProcFamily(Others),
Rafael Espindolaab03eb02016-05-19 22:07:57 +0000374 PICStyle(PICStyles::None), TM(TM), TargetTriple(TT),
Eric Christopherb8f97682014-05-07 21:05:47 +0000375 StackAlignOverride(StackAlignOverride),
376 In64BitMode(TargetTriple.getArch() == Triple::x86_64),
377 In32BitMode(TargetTriple.getArch() == Triple::x86 &&
378 TargetTriple.getEnvironment() != Triple::CODE16),
379 In16BitMode(TargetTriple.getArch() == Triple::x86 &&
Eric Christophera08f30b2014-06-09 17:08:19 +0000380 TargetTriple.getEnvironment() == Triple::CODE16),
Daniel Sanderse9fdba32017-04-29 17:30:09 +0000381 InstrInfo(initializeSubtargetDependencies(CPU, FS)), TLInfo(TM, *this),
Daniel Sandersa1b2db792017-05-19 11:08:33 +0000382 FrameLowering(*this, getStackAlignment()) {
Eric Christopher4629ed72014-08-09 01:07:25 +0000383 // Determine the PICStyle based on the target selected.
Rafael Espindola0d348262016-06-20 23:41:56 +0000384 if (!isPositionIndependent())
Eric Christopher4629ed72014-08-09 01:07:25 +0000385 setPICStyle(PICStyles::None);
Rafael Espindola0d348262016-06-20 23:41:56 +0000386 else if (is64Bit())
Eric Christopher4629ed72014-08-09 01:07:25 +0000387 setPICStyle(PICStyles::RIPRel);
Rafael Espindola0d348262016-06-20 23:41:56 +0000388 else if (isTargetCOFF())
Eric Christopher4629ed72014-08-09 01:07:25 +0000389 setPICStyle(PICStyles::None);
Rafael Espindola0d348262016-06-20 23:41:56 +0000390 else if (isTargetDarwin())
391 setPICStyle(PICStyles::StubPIC);
392 else if (isTargetELF())
Eric Christopher4629ed72014-08-09 01:07:25 +0000393 setPICStyle(PICStyles::GOT);
Quentin Colombet8cf805a2017-07-01 00:45:50 +0000394
Quentin Colombet61d71a12017-08-15 22:31:51 +0000395 CallLoweringInfo.reset(new X86CallLowering(*getTargetLowering()));
396 Legalizer.reset(new X86LegalizerInfo(*this, TM));
Quentin Colombet8cf805a2017-07-01 00:45:50 +0000397
398 auto *RBI = new X86RegisterBankInfo(*getRegisterInfo());
Quentin Colombet61d71a12017-08-15 22:31:51 +0000399 RegBankInfo.reset(RBI);
400 InstSelector.reset(createX86InstructionSelector(TM, *this, *RBI));
Eric Christopher4629ed72014-08-09 01:07:25 +0000401}
Bill Wendlingaef9c372013-02-15 22:31:27 +0000402
Zvi Rackover76dbf262016-11-15 06:34:33 +0000403const CallLowering *X86Subtarget::getCallLowering() const {
Quentin Colombet61d71a12017-08-15 22:31:51 +0000404 return CallLoweringInfo.get();
Zvi Rackover76dbf262016-11-15 06:34:33 +0000405}
406
407const InstructionSelector *X86Subtarget::getInstructionSelector() const {
Quentin Colombet61d71a12017-08-15 22:31:51 +0000408 return InstSelector.get();
Zvi Rackover76dbf262016-11-15 06:34:33 +0000409}
410
411const LegalizerInfo *X86Subtarget::getLegalizerInfo() const {
Quentin Colombet61d71a12017-08-15 22:31:51 +0000412 return Legalizer.get();
Zvi Rackover76dbf262016-11-15 06:34:33 +0000413}
414
415const RegisterBankInfo *X86Subtarget::getRegBankInfo() const {
Quentin Colombet61d71a12017-08-15 22:31:51 +0000416 return RegBankInfo.get();
Zvi Rackover76dbf262016-11-15 06:34:33 +0000417}
418
Sanjay Patela2f658d2014-07-15 22:39:58 +0000419bool X86Subtarget::enableEarlyIfConversion() const {
Eric Christopher3470bbb2014-05-21 23:51:57 +0000420 return hasCMov() && X86EarlyIfConv;
Eric Christopher6b0fcfe2014-05-21 23:40:26 +0000421}