blob: dd409d1457b6ae8cac62a33c92b0c16919851446 [file] [log] [blame]
Jia Liue1d61962012-02-19 02:03:36 +00001//===-- X86Subtarget.h - Define Subtarget for the X86 ----------*- C++ -*--===//
Nate Begemanf26625e2005-07-12 01:41:54 +00002//
3// The LLVM Compiler Infrastructure
4//
Chris Lattnerf3ebc3f2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Nate Begemanf26625e2005-07-12 01:41:54 +00007//
8//===----------------------------------------------------------------------===//
9//
Evan Cheng0d639a22011-07-01 21:01:15 +000010// This file declares the X86 specific subclass of TargetSubtargetInfo.
Nate Begemanf26625e2005-07-12 01:41:54 +000011//
12//===----------------------------------------------------------------------===//
13
Benjamin Kramera7c40ef2014-08-13 16:26:38 +000014#ifndef LLVM_LIB_TARGET_X86_X86SUBTARGET_H
15#define LLVM_LIB_TARGET_X86_X86SUBTARGET_H
Nate Begemanf26625e2005-07-12 01:41:54 +000016
Eric Christophera08f30b2014-06-09 17:08:19 +000017#include "X86FrameLowering.h"
18#include "X86ISelLowering.h"
19#include "X86InstrInfo.h"
Eric Christophera08f30b2014-06-09 17:08:19 +000020#include "X86SelectionDAGInfo.h"
Eric Christopherd4298462010-07-05 19:26:33 +000021#include "llvm/ADT/Triple.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000022#include "llvm/IR/CallingConv.h"
Evan Cheng0d639a22011-07-01 21:01:15 +000023#include "llvm/Target/TargetSubtargetInfo.h"
Jim Laskey19058c32005-09-01 21:38:21 +000024#include <string>
25
Evan Cheng54b68e32011-07-01 20:45:01 +000026#define GET_SUBTARGETINFO_HEADER
Evan Chengc9c090d2011-07-01 22:36:09 +000027#include "X86GenSubtargetInfo.inc"
Evan Cheng54b68e32011-07-01 20:45:01 +000028
Nate Begemanf26625e2005-07-12 01:41:54 +000029namespace llvm {
Anton Korobeynikov6dbdfe22006-11-30 22:42:55 +000030class GlobalValue;
Evan Cheng1a72add62011-07-07 07:07:08 +000031class StringRef;
Anton Korobeynikov430e68a12006-12-22 22:29:05 +000032class TargetMachine;
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +000033
Sanjay Patele63abfe2015-02-03 18:47:32 +000034/// The X86 backend supports a number of different styles of PIC.
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +000035///
Duncan Sands595a4422008-11-28 09:29:37 +000036namespace PICStyles {
Anton Korobeynikova0554d92007-01-12 19:20:47 +000037enum Style {
Chris Lattnerba4d7332009-07-10 20:58:47 +000038 StubPIC, // Used on i386-darwin in -fPIC mode.
39 StubDynamicNoPIC, // Used on i386-darwin in -mdynamic-no-pic mode.
40 GOT, // Used on many 32-bit unices in -fPIC mode.
41 RIPRel, // Used on X86-64 when not in -static mode.
42 None // Set when in -static mode (not PIC or DynamicNoPIC mode).
Anton Korobeynikova0554d92007-01-12 19:20:47 +000043};
44}
Nate Begemanf26625e2005-07-12 01:41:54 +000045
Craig Topperec828472014-03-31 06:53:13 +000046class X86Subtarget final : public X86GenSubtargetInfo {
Eric Christophera08f30b2014-06-09 17:08:19 +000047
Nate Begemanf26625e2005-07-12 01:41:54 +000048protected:
Evan Chengcde9e302006-01-27 08:10:46 +000049 enum X86SSEEnum {
Eric Christopher11e59832015-10-08 20:10:06 +000050 NoSSE, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, AVX, AVX2, AVX512F
Evan Chengcde9e302006-01-27 08:10:46 +000051 };
52
Evan Chengff1beda2006-10-06 09:17:41 +000053 enum X863DNowEnum {
Eric Christopher57a6e132015-11-14 03:04:00 +000054 NoThreeDNow, MMX, ThreeDNow, ThreeDNowA
Evan Chengff1beda2006-10-06 09:17:41 +000055 };
56
Andrew Trick8523b162012-02-01 23:20:51 +000057 enum X86ProcFamilyEnum {
Craig Topperf730a6b2016-02-13 21:35:37 +000058 Others, IntelAtom, IntelSLM
Andrew Trick8523b162012-02-01 23:20:51 +000059 };
60
Sanjay Patele63abfe2015-02-03 18:47:32 +000061 /// X86 processor family: Intel Atom, and others
Andrew Trick8523b162012-02-01 23:20:51 +000062 X86ProcFamilyEnum X86ProcFamily;
Chad Rosier24c19d22012-08-01 18:39:17 +000063
Sanjay Patele63abfe2015-02-03 18:47:32 +000064 /// Which PIC style to use
Duncan Sands595a4422008-11-28 09:29:37 +000065 PICStyles::Style PICStyle;
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +000066
Eric Christopher11e59832015-10-08 20:10:06 +000067 /// SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, or none supported.
Evan Chengcde9e302006-01-27 08:10:46 +000068 X86SSEEnum X86SSELevel;
69
Eric Christopher57a6e132015-11-14 03:04:00 +000070 /// MMX, 3DNow, 3DNow Athlon, or none supported.
Evan Chengff1beda2006-10-06 09:17:41 +000071 X863DNowEnum X863DNowLevel;
72
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +000073 /// True if the processor supports X87 instructions.
74 bool HasX87;
75
Sanjay Patele63abfe2015-02-03 18:47:32 +000076 /// True if this processor has conditional move instructions
Chris Lattnercc8c5812009-09-02 05:53:04 +000077 /// (generally pentium pro+).
78 bool HasCMov;
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +000079
Sanjay Patele63abfe2015-02-03 18:47:32 +000080 /// True if the processor supports X86-64 instructions.
Evan Cheng11b0a5d2006-09-08 06:48:29 +000081 bool HasX86_64;
Evan Cheng4c91aa32009-01-02 05:35:45 +000082
Sanjay Patele63abfe2015-02-03 18:47:32 +000083 /// True if the processor supports POPCNT.
Benjamin Kramer2f489232010-12-04 20:32:23 +000084 bool HasPOPCNT;
85
Sanjay Patele63abfe2015-02-03 18:47:32 +000086 /// True if the processor supports SSE4A instructions.
Stefanus Du Toit96180b52009-05-26 21:04:35 +000087 bool HasSSE4A;
88
Sanjay Patele63abfe2015-02-03 18:47:32 +000089 /// Target has AES instructions
Eric Christopher2ef63182010-04-02 21:54:27 +000090 bool HasAES;
91
Craig Topper09b65982015-10-16 06:03:09 +000092 /// Target has FXSAVE/FXRESTOR instructions
93 bool HasFXSR;
94
Amjad Aboud1db6d7a2015-10-12 11:47:46 +000095 /// Target has XSAVE instructions
96 bool HasXSAVE;
97 /// Target has XSAVEOPT instructions
98 bool HasXSAVEOPT;
99 /// Target has XSAVEC instructions
100 bool HasXSAVEC;
101 /// Target has XSAVES instructions
102 bool HasXSAVES;
103
Sanjay Patele63abfe2015-02-03 18:47:32 +0000104 /// Target has carry-less multiplication
Benjamin Kramera0396e42012-05-31 14:34:17 +0000105 bool HasPCLMUL;
Bruno Cardoso Lopes09dc24b2010-07-23 01:17:51 +0000106
Sanjay Patele63abfe2015-02-03 18:47:32 +0000107 /// Target has 3-operand fused multiply-add
Craig Topper79dbb0c2012-06-03 18:58:46 +0000108 bool HasFMA;
David Greene8f6f72c2009-06-26 22:46:54 +0000109
Sanjay Patele63abfe2015-02-03 18:47:32 +0000110 /// Target has 4-operand fused multiply-add
David Greene8f6f72c2009-06-26 22:46:54 +0000111 bool HasFMA4;
112
Sanjay Patele63abfe2015-02-03 18:47:32 +0000113 /// Target has XOP instructions
Jan Sjödin1280eb12011-12-02 15:14:37 +0000114 bool HasXOP;
115
Sanjay Patele63abfe2015-02-03 18:47:32 +0000116 /// Target has TBM instructions.
Yunzhong Gaodd36e932013-09-24 18:21:52 +0000117 bool HasTBM;
118
Sanjay Patele63abfe2015-02-03 18:47:32 +0000119 /// True if the processor has the MOVBE instruction.
Craig Topper786bdb92011-10-03 17:28:23 +0000120 bool HasMOVBE;
121
Sanjay Patele63abfe2015-02-03 18:47:32 +0000122 /// True if the processor has the RDRAND instruction.
Craig Topper786bdb92011-10-03 17:28:23 +0000123 bool HasRDRAND;
124
Sanjay Patele63abfe2015-02-03 18:47:32 +0000125 /// Processor has 16-bit floating point conversion instructions.
Craig Topperfe9179f2011-10-09 07:31:39 +0000126 bool HasF16C;
127
Sanjay Patele63abfe2015-02-03 18:47:32 +0000128 /// Processor has FS/GS base insturctions.
Craig Topper228d9132011-10-30 19:57:21 +0000129 bool HasFSGSBase;
130
Sanjay Patele63abfe2015-02-03 18:47:32 +0000131 /// Processor has LZCNT instruction.
Craig Topper271064e2011-10-11 06:44:02 +0000132 bool HasLZCNT;
133
Sanjay Patele63abfe2015-02-03 18:47:32 +0000134 /// Processor has BMI1 instructions.
Craig Topper3657fe42011-10-14 03:21:46 +0000135 bool HasBMI;
136
Sanjay Patele63abfe2015-02-03 18:47:32 +0000137 /// Processor has BMI2 instructions.
Craig Topperaea148c2011-10-16 07:55:05 +0000138 bool HasBMI2;
139
Michael Zuckerman97b6a6922016-01-17 13:42:12 +0000140 /// Processor has VBMI instructions.
141 bool HasVBMI;
142
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000143 /// Processor has Integer Fused Multiply Add
144 bool HasIFMA;
145
Sanjay Patele63abfe2015-02-03 18:47:32 +0000146 /// Processor has RTM instructions.
Michael Liao73cffdd2012-11-08 07:28:54 +0000147 bool HasRTM;
148
Sanjay Patele63abfe2015-02-03 18:47:32 +0000149 /// Processor has HLE.
Michael Liaoe344ec92013-03-26 22:46:02 +0000150 bool HasHLE;
151
Sanjay Patele63abfe2015-02-03 18:47:32 +0000152 /// Processor has ADX instructions.
Kay Tiong Khoof809c642013-02-14 19:08:21 +0000153 bool HasADX;
154
Sanjay Patele63abfe2015-02-03 18:47:32 +0000155 /// Processor has SHA instructions.
Ben Langmuir16501752013-09-12 15:51:31 +0000156 bool HasSHA;
157
Sanjay Patele63abfe2015-02-03 18:47:32 +0000158 /// Processor has PRFCHW instructions.
Michael Liao5173ee02013-03-26 17:47:11 +0000159 bool HasPRFCHW;
160
Sanjay Patele63abfe2015-02-03 18:47:32 +0000161 /// Processor has RDSEED instructions.
Michael Liaoa486a112013-03-28 23:41:26 +0000162 bool HasRDSEED;
163
Hans Wennborg5000ce82015-12-04 23:00:33 +0000164 /// Processor has LAHF/SAHF instructions.
165 bool HasLAHFSAHF;
166
Ashutosh Nema348af9c2016-05-18 11:59:12 +0000167 /// Processor has MONITORX/MWAITX instructions.
168 bool HasMWAITX;
169
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000170 /// Processor has Prefetch with intent to Write instruction
171 bool HasPFPREFETCHWT1;
172
Sanjay Patele63abfe2015-02-03 18:47:32 +0000173 /// True if BT (bit test) of memory instructions are slow.
David Greene8f6f72c2009-06-26 22:46:54 +0000174 bool IsBTMemSlow;
Evan Cheng4cf30b72009-12-18 07:40:29 +0000175
Sanjay Patele63abfe2015-02-03 18:47:32 +0000176 /// True if SHLD instructions are slow.
Ekaterina Romanovad5fa5542013-11-21 23:21:26 +0000177 bool IsSHLDSlow;
178
Sanjay Patel30145672015-09-01 20:51:51 +0000179 /// True if unaligned memory accesses of 16-bytes are slow.
180 bool IsUAMem16Slow;
Evan Cheng738b0f92010-04-01 05:58:17 +0000181
Sanjay Patel9e916dc2015-08-21 20:17:26 +0000182 /// True if unaligned memory accesses of 32-bytes are slow.
Sanjay Patel501890e2014-11-21 17:40:04 +0000183 bool IsUAMem32Slow;
Michael Liao5bf95782014-12-04 05:20:33 +0000184
Sanjay Patelffd039b2015-02-03 17:13:04 +0000185 /// True if SSE operations can have unaligned memory operands.
186 /// This may require setting a configuration bit in the processor.
187 bool HasSSEUnalignedMem;
David Greene206351a2010-01-11 16:29:42 +0000188
Sanjay Patele63abfe2015-02-03 18:47:32 +0000189 /// True if this processor has the CMPXCHG16B instruction;
Eli Friedman5e570422011-08-26 21:21:21 +0000190 /// this is true for most x86-64 chips, but not the first AMD chips.
191 bool HasCmpxchg16b;
192
Sanjay Patele63abfe2015-02-03 18:47:32 +0000193 /// True if the LEA instruction should be used for adjusting
Evan Cheng1b81fdd2012-02-07 22:50:41 +0000194 /// the stack pointer. This is an optimization for Intel Atom processors.
195 bool UseLeaForSP;
196
Yunzhong Gao0de36ec2016-02-12 23:37:57 +0000197 /// True if there is no performance penalty to writing only the lower parts
198 /// of a YMM register without clearing the upper part.
199 bool HasFastPartialYMMWrite;
200
Sanjay Patele63abfe2015-02-03 18:47:32 +0000201 /// True if 8-bit divisions are significantly faster than
Alexey Volkovfd1731d2014-11-21 11:19:34 +0000202 /// 32-bit divisions and should be used when possible.
203 bool HasSlowDivide32;
204
Sanjay Patele63abfe2015-02-03 18:47:32 +0000205 /// True if 16-bit divides are significantly faster than
Alexey Volkovfd1731d2014-11-21 11:19:34 +0000206 /// 64-bit divisions and should be used when possible.
207 bool HasSlowDivide64;
Preston Gurdcdf540d2012-09-04 18:22:17 +0000208
Sanjay Patele63abfe2015-02-03 18:47:32 +0000209 /// True if the short functions should be padded to prevent
Preston Gurda01daac2013-01-08 18:27:24 +0000210 /// a stall when returning too early.
211 bool PadShortFunctions;
212
Sanjay Patele63abfe2015-02-03 18:47:32 +0000213 /// True if the Calls with memory reference should be converted
Preston Gurd663e6f92013-03-27 19:14:02 +0000214 /// to a register-based indirect call.
215 bool CallRegIndirect;
Sanjay Patele63abfe2015-02-03 18:47:32 +0000216
217 /// True if the LEA instruction inputs have to be ready at address generation
218 /// (AG) time.
Preston Gurd8b7ab4b2013-04-25 20:29:37 +0000219 bool LEAUsesAG;
Preston Gurd663e6f92013-03-27 19:14:02 +0000220
Sanjay Patele63abfe2015-02-03 18:47:32 +0000221 /// True if the LEA instruction with certain arguments is slow
Alexey Volkov6226de62014-05-20 08:55:50 +0000222 bool SlowLEA;
223
Sanjay Patele63abfe2015-02-03 18:47:32 +0000224 /// True if INC and DEC instructions are slow when writing to flags
Alexey Volkov5260dba2014-06-09 11:40:41 +0000225 bool SlowIncDec;
226
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000227 /// Processor has AVX-512 PreFetch Instructions
228 bool HasPFI;
Robert Khasanovbfa01312014-07-21 14:54:21 +0000229
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000230 /// Processor has AVX-512 Exponential and Reciprocal Instructions
231 bool HasERI;
Robert Khasanovbfa01312014-07-21 14:54:21 +0000232
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000233 /// Processor has AVX-512 Conflict Detection Instructions
234 bool HasCDI;
Robert Khasanovbfa01312014-07-21 14:54:21 +0000235
236 /// Processor has AVX-512 Doubleword and Quadword instructions
237 bool HasDQI;
238
239 /// Processor has AVX-512 Byte and Word instructions
240 bool HasBWI;
241
242 /// Processor has AVX-512 Vector Length eXtenstions
243 bool HasVLX;
244
Asaf Badouh5acf66f2015-12-15 13:35:29 +0000245 /// Processor has PKU extenstions
246 bool HasPKU;
247
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000248 /// Processor supports MPX - Memory Protection Extensions
Elena Demikhovskyf7e641c2015-06-03 10:30:57 +0000249 bool HasMPX;
250
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000251 /// Processor supports Invalidate Process-Context Identifier
252 bool HasInvPCId;
253
254 /// Processor has VM Functions
255 bool HasVMFUNC;
256
257 /// Processor has Supervisor Mode Access Protection
258 bool HasSMAP;
259
260 /// Processor has Software Guard Extensions
261 bool HasSGX;
262
263 /// Processor supports Flush Cache Line instruction
264 bool HasCLFLUSHOPT;
265
266 /// Processor has Persistent Commit feature
267 bool HasPCOMMIT;
268
269 /// Processor supports Cache Line Write Back instruction
270 bool HasCLWB;
271
Eric Christopher824f42f2015-05-12 01:26:05 +0000272 /// Use software floating point for code generation.
273 bool UseSoftFloat;
274
Sanjay Patele63abfe2015-02-03 18:47:32 +0000275 /// The minimum alignment known to hold of the stack frame on
Chris Lattner351817b2005-07-12 02:36:10 +0000276 /// entry to the function and which must be maintained by every function.
Nate Begemanf26625e2005-07-12 01:41:54 +0000277 unsigned stackAlignment;
Jeff Cohen33a030e2005-07-27 05:53:44 +0000278
Rafael Espindola063f1772007-10-31 11:52:06 +0000279 /// Max. memset / memcpy size that is turned into rep/movs, rep/stos ops.
Evan Cheng763cdfd2007-08-01 23:45:51 +0000280 ///
Rafael Espindola063f1772007-10-31 11:52:06 +0000281 unsigned MaxInlineSizeThreshold;
NAKAMURA Takumi0544fe72011-02-17 12:23:50 +0000282
Sanjay Patele63abfe2015-02-03 18:47:32 +0000283 /// What processor and OS we're targeting.
Eric Christopherd4298462010-07-05 19:26:33 +0000284 Triple TargetTriple;
Chad Rosier24c19d22012-08-01 18:39:17 +0000285
Andrew Trick8523b162012-02-01 23:20:51 +0000286 /// Instruction itineraries for scheduling
287 InstrItineraryData InstrItins;
Evan Cheng03c1e6f2006-02-16 00:21:07 +0000288
Evan Cheng11b0a5d2006-09-08 06:48:29 +0000289private:
Eric Christophere950b672014-08-09 04:38:53 +0000290
Sanjay Patele63abfe2015-02-03 18:47:32 +0000291 /// Override the stack alignment.
Bill Wendlingaef9c372013-02-15 22:31:27 +0000292 unsigned StackAlignOverride;
293
Sanjay Patele63abfe2015-02-03 18:47:32 +0000294 /// True if compiling for 64-bit, false for 16-bit or 32-bit.
Evan Cheng13bcc6c2011-07-07 21:06:52 +0000295 bool In64BitMode;
Evan Cheng11b0a5d2006-09-08 06:48:29 +0000296
Sanjay Patele63abfe2015-02-03 18:47:32 +0000297 /// True if compiling for 32-bit, false for 16-bit or 64-bit.
Craig Topper3c80d622014-01-06 04:55:54 +0000298 bool In32BitMode;
299
Sanjay Patele63abfe2015-02-03 18:47:32 +0000300 /// True if compiling for 16-bit, false for 32-bit or 64-bit.
Craig Topper3c80d622014-01-06 04:55:54 +0000301 bool In16BitMode;
302
Eric Christophera08f30b2014-06-09 17:08:19 +0000303 X86SelectionDAGInfo TSInfo;
Eric Christopher1a212032014-06-11 00:25:19 +0000304 // Ordering here is important. X86InstrInfo initializes X86RegisterInfo which
305 // X86TargetLowering needs.
306 X86InstrInfo InstrInfo;
307 X86TargetLowering TLInfo;
308 X86FrameLowering FrameLowering;
Eric Christophera08f30b2014-06-09 17:08:19 +0000309
Nate Begemanf26625e2005-07-12 01:41:54 +0000310public:
Jeff Cohen33a030e2005-07-27 05:53:44 +0000311 /// This constructor initializes the data members to match that
Daniel Dunbar31b44e82009-08-02 22:11:08 +0000312 /// of the specified triple.
Nate Begemanf26625e2005-07-12 01:41:54 +0000313 ///
Daniel Sandersa73f1fd2015-06-10 12:11:26 +0000314 X86Subtarget(const Triple &TT, const std::string &CPU, const std::string &FS,
315 const X86TargetMachine &TM, unsigned StackAlignOverride);
Eric Christophera08f30b2014-06-09 17:08:19 +0000316
Eric Christopherd9134482014-08-04 21:25:23 +0000317 const X86TargetLowering *getTargetLowering() const override {
318 return &TLInfo;
319 }
320 const X86InstrInfo *getInstrInfo() const override { return &InstrInfo; }
Eric Christopherd9134482014-08-04 21:25:23 +0000321 const X86FrameLowering *getFrameLowering() const override {
322 return &FrameLowering;
323 }
324 const X86SelectionDAGInfo *getSelectionDAGInfo() const override {
325 return &TSInfo;
326 }
327 const X86RegisterInfo *getRegisterInfo() const override {
328 return &getInstrInfo()->getRegisterInfo();
329 }
Chris Lattner351817b2005-07-12 02:36:10 +0000330
Sanjay Patele63abfe2015-02-03 18:47:32 +0000331 /// Returns the minimum alignment known to hold of the
Chris Lattner351817b2005-07-12 02:36:10 +0000332 /// stack frame on entry to the function and which must be maintained by every
333 /// function for this subtarget.
Nate Begemanf26625e2005-07-12 01:41:54 +0000334 unsigned getStackAlignment() const { return stackAlignment; }
Jeff Cohen33a030e2005-07-27 05:53:44 +0000335
Sanjay Patele63abfe2015-02-03 18:47:32 +0000336 /// Returns the maximum memset / memcpy size
Rafael Espindola063f1772007-10-31 11:52:06 +0000337 /// that still makes it profitable to inline the call.
338 unsigned getMaxInlineSizeThreshold() const { return MaxInlineSizeThreshold; }
Anton Korobeynikov5b96cde2006-11-21 00:01:06 +0000339
340 /// ParseSubtargetFeatures - Parses features string setting specified
Evan Chengff1beda2006-10-06 09:17:41 +0000341 /// subtarget options. Definition of function is auto generated by tblgen.
Evan Cheng1a72add62011-07-07 07:07:08 +0000342 void ParseSubtargetFeatures(StringRef CPU, StringRef FS);
Evan Chengff1beda2006-10-06 09:17:41 +0000343
Bill Wendling61375d82013-02-16 01:36:26 +0000344private:
Sanjay Patele63abfe2015-02-03 18:47:32 +0000345 /// Initialize the full set of dependencies so we can use an initializer
Eric Christopher1a212032014-06-11 00:25:19 +0000346 /// list for X86Subtarget.
347 X86Subtarget &initializeSubtargetDependencies(StringRef CPU, StringRef FS);
Bill Wendling61375d82013-02-16 01:36:26 +0000348 void initializeEnvironment();
Eric Christopherb68e2532014-09-03 20:36:31 +0000349 void initSubtargetFeatures(StringRef CPU, StringRef FS);
Bill Wendling61375d82013-02-16 01:36:26 +0000350public:
Eli Bendersky597fc122013-01-25 22:07:43 +0000351 /// Is this x86_64? (disregarding specific ABI / programming model)
352 bool is64Bit() const {
353 return In64BitMode;
354 }
355
Craig Topper3c80d622014-01-06 04:55:54 +0000356 bool is32Bit() const {
357 return In32BitMode;
358 }
359
360 bool is16Bit() const {
361 return In16BitMode;
362 }
363
Eli Bendersky597fc122013-01-25 22:07:43 +0000364 /// Is this x86_64 with the ILP32 programming model (x32 ABI)?
365 bool isTarget64BitILP32() const {
Rafael Espindoladdb913c2013-12-19 00:44:37 +0000366 return In64BitMode && (TargetTriple.getEnvironment() == Triple::GNUX32 ||
Simon Pilgrima2794102014-11-22 19:12:10 +0000367 TargetTriple.isOSNaCl());
Eli Bendersky597fc122013-01-25 22:07:43 +0000368 }
369
370 /// Is this x86_64 with the LP64 programming model (standard AMD64, no x32)?
371 bool isTarget64BitLP64() const {
Pavel Chupinf55eb452014-08-07 09:41:19 +0000372 return In64BitMode && (TargetTriple.getEnvironment() != Triple::GNUX32 &&
Simon Pilgrima2794102014-11-22 19:12:10 +0000373 !TargetTriple.isOSNaCl());
Eli Bendersky597fc122013-01-25 22:07:43 +0000374 }
Evan Cheng54c13da2006-01-26 09:53:06 +0000375
Duncan Sands595a4422008-11-28 09:29:37 +0000376 PICStyles::Style getPICStyle() const { return PICStyle; }
377 void setPICStyle(PICStyles::Style Style) { PICStyle = Style; }
Anton Korobeynikova0554d92007-01-12 19:20:47 +0000378
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000379 bool hasX87() const { return HasX87; }
Chris Lattnera30d4ce2010-03-14 18:31:44 +0000380 bool hasCMov() const { return HasCMov; }
Craig Toppereb8f9e92012-01-10 06:30:56 +0000381 bool hasSSE1() const { return X86SSELevel >= SSE1; }
382 bool hasSSE2() const { return X86SSELevel >= SSE2; }
383 bool hasSSE3() const { return X86SSELevel >= SSE3; }
384 bool hasSSSE3() const { return X86SSELevel >= SSSE3; }
385 bool hasSSE41() const { return X86SSELevel >= SSE41; }
386 bool hasSSE42() const { return X86SSELevel >= SSE42; }
Craig Topperb0c0f722012-01-10 06:54:16 +0000387 bool hasAVX() const { return X86SSELevel >= AVX; }
388 bool hasAVX2() const { return X86SSELevel >= AVX2; }
Craig Topper5c94bb82013-08-21 03:57:57 +0000389 bool hasAVX512() const { return X86SSELevel >= AVX512F; }
Elena Demikhovskyeace43b2012-11-29 12:44:59 +0000390 bool hasFp256() const { return hasAVX(); }
391 bool hasInt256() const { return hasAVX2(); }
Stefanus Du Toit96180b52009-05-26 21:04:35 +0000392 bool hasSSE4A() const { return HasSSE4A; }
Eric Christopher57a6e132015-11-14 03:04:00 +0000393 bool hasMMX() const { return X863DNowLevel >= MMX; }
Evan Chengff1beda2006-10-06 09:17:41 +0000394 bool has3DNow() const { return X863DNowLevel >= ThreeDNow; }
395 bool has3DNowA() const { return X863DNowLevel >= ThreeDNowA; }
Benjamin Kramer2f489232010-12-04 20:32:23 +0000396 bool hasPOPCNT() const { return HasPOPCNT; }
Eric Christopher2ef63182010-04-02 21:54:27 +0000397 bool hasAES() const { return HasAES; }
Craig Topper09b65982015-10-16 06:03:09 +0000398 bool hasFXSR() const { return HasFXSR; }
Amjad Aboud1db6d7a2015-10-12 11:47:46 +0000399 bool hasXSAVE() const { return HasXSAVE; }
400 bool hasXSAVEOPT() const { return HasXSAVEOPT; }
401 bool hasXSAVEC() const { return HasXSAVEC; }
402 bool hasXSAVES() const { return HasXSAVES; }
Benjamin Kramera0396e42012-05-31 14:34:17 +0000403 bool hasPCLMUL() const { return HasPCLMUL; }
Simon Pilgrimdb26b3d2015-11-30 22:22:06 +0000404 // Prefer FMA4 to FMA - its better for commutation/memory folding and
405 // has equal or better performance on all supported targets.
406 bool hasFMA() const { return HasFMA && !HasFMA4; }
407 bool hasFMA4() const { return HasFMA4; }
Sanjay Patel60216f62015-12-01 17:27:55 +0000408 bool hasAnyFMA() const { return hasFMA() || hasFMA4() || hasAVX512(); }
Jan Sjödin1280eb12011-12-02 15:14:37 +0000409 bool hasXOP() const { return HasXOP; }
Yunzhong Gaodd36e932013-09-24 18:21:52 +0000410 bool hasTBM() const { return HasTBM; }
Craig Topper786bdb92011-10-03 17:28:23 +0000411 bool hasMOVBE() const { return HasMOVBE; }
412 bool hasRDRAND() const { return HasRDRAND; }
Craig Topperfe9179f2011-10-09 07:31:39 +0000413 bool hasF16C() const { return HasF16C; }
Craig Topper228d9132011-10-30 19:57:21 +0000414 bool hasFSGSBase() const { return HasFSGSBase; }
Craig Topper271064e2011-10-11 06:44:02 +0000415 bool hasLZCNT() const { return HasLZCNT; }
Craig Topper3657fe42011-10-14 03:21:46 +0000416 bool hasBMI() const { return HasBMI; }
Craig Topperaea148c2011-10-16 07:55:05 +0000417 bool hasBMI2() const { return HasBMI2; }
Michael Zuckerman97b6a6922016-01-17 13:42:12 +0000418 bool hasVBMI() const { return HasVBMI; }
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000419 bool hasIFMA() const { return HasIFMA; }
Michael Liao73cffdd2012-11-08 07:28:54 +0000420 bool hasRTM() const { return HasRTM; }
Michael Liaoe344ec92013-03-26 22:46:02 +0000421 bool hasHLE() const { return HasHLE; }
Kay Tiong Khoof809c642013-02-14 19:08:21 +0000422 bool hasADX() const { return HasADX; }
Ben Langmuir16501752013-09-12 15:51:31 +0000423 bool hasSHA() const { return HasSHA; }
Michael Liao5173ee02013-03-26 17:47:11 +0000424 bool hasPRFCHW() const { return HasPRFCHW; }
Michael Liaoa486a112013-03-28 23:41:26 +0000425 bool hasRDSEED() const { return HasRDSEED; }
Hans Wennborg5000ce82015-12-04 23:00:33 +0000426 bool hasLAHFSAHF() const { return HasLAHFSAHF; }
Ashutosh Nema348af9c2016-05-18 11:59:12 +0000427 bool hasMWAITX() const { return HasMWAITX; }
Evan Cheng4c91aa32009-01-02 05:35:45 +0000428 bool isBTMemSlow() const { return IsBTMemSlow; }
Ekaterina Romanovad5fa5542013-11-21 23:21:26 +0000429 bool isSHLDSlow() const { return IsSHLDSlow; }
Sanjay Patel30145672015-09-01 20:51:51 +0000430 bool isUnalignedMem16Slow() const { return IsUAMem16Slow; }
Sanjay Patel501890e2014-11-21 17:40:04 +0000431 bool isUnalignedMem32Slow() const { return IsUAMem32Slow; }
Sanjay Patelffd039b2015-02-03 17:13:04 +0000432 bool hasSSEUnalignedMem() const { return HasSSEUnalignedMem; }
Eli Friedman5e570422011-08-26 21:21:21 +0000433 bool hasCmpxchg16b() const { return HasCmpxchg16b; }
Evan Cheng1b81fdd2012-02-07 22:50:41 +0000434 bool useLeaForSP() const { return UseLeaForSP; }
Yunzhong Gao0de36ec2016-02-12 23:37:57 +0000435 bool hasFastPartialYMMWrite() const { return HasFastPartialYMMWrite; }
Alexey Volkovfd1731d2014-11-21 11:19:34 +0000436 bool hasSlowDivide32() const { return HasSlowDivide32; }
437 bool hasSlowDivide64() const { return HasSlowDivide64; }
Preston Gurda01daac2013-01-08 18:27:24 +0000438 bool padShortFunctions() const { return PadShortFunctions; }
Preston Gurd663e6f92013-03-27 19:14:02 +0000439 bool callRegIndirect() const { return CallRegIndirect; }
Preston Gurd8b7ab4b2013-04-25 20:29:37 +0000440 bool LEAusesAG() const { return LEAUsesAG; }
Alexey Volkov6226de62014-05-20 08:55:50 +0000441 bool slowLEA() const { return SlowLEA; }
Alexey Volkov5260dba2014-06-09 11:40:41 +0000442 bool slowIncDec() const { return SlowIncDec; }
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000443 bool hasCDI() const { return HasCDI; }
444 bool hasPFI() const { return HasPFI; }
445 bool hasERI() const { return HasERI; }
Robert Khasanovbfa01312014-07-21 14:54:21 +0000446 bool hasDQI() const { return HasDQI; }
447 bool hasBWI() const { return HasBWI; }
448 bool hasVLX() const { return HasVLX; }
Asaf Badouh5acf66f2015-12-15 13:35:29 +0000449 bool hasPKU() const { return HasPKU; }
Elena Demikhovskyf7e641c2015-06-03 10:30:57 +0000450 bool hasMPX() const { return HasMPX; }
Evan Cheng4c91aa32009-01-02 05:35:45 +0000451
Andrew Trick8523b162012-02-01 23:20:51 +0000452 bool isAtom() const { return X86ProcFamily == IntelAtom; }
Alexey Volkov6226de62014-05-20 08:55:50 +0000453 bool isSLM() const { return X86ProcFamily == IntelSLM; }
Eric Christopher824f42f2015-05-12 01:26:05 +0000454 bool useSoftFloat() const { return UseSoftFloat; }
Andrew Trick8523b162012-02-01 23:20:51 +0000455
Sanjay Patele9bf9932016-02-13 17:26:29 +0000456 /// Use mfence if we have SSE2 or we're on x86-64 (even if we asked for
457 /// no-sse2). There isn't any reason to disable it if the target processor
458 /// supports it.
459 bool hasMFence() const { return hasSSE2() || is64Bit(); }
460
Daniel Dunbar44b53032011-04-19 21:01:47 +0000461 const Triple &getTargetTriple() const { return TargetTriple; }
462
Daniel Dunbar2b9b0e32011-04-19 21:14:45 +0000463 bool isTargetDarwin() const { return TargetTriple.isOSDarwin(); }
Simon Pilgrima2794102014-11-22 19:12:10 +0000464 bool isTargetFreeBSD() const { return TargetTriple.isOSFreeBSD(); }
Rafael Espindola44eae722014-12-29 15:47:28 +0000465 bool isTargetDragonFly() const { return TargetTriple.isOSDragonFly(); }
Simon Pilgrima2794102014-11-22 19:12:10 +0000466 bool isTargetSolaris() const { return TargetTriple.isOSSolaris(); }
Alex Rosenbergb9fefdd2015-01-26 19:09:27 +0000467 bool isTargetPS4() const { return TargetTriple.isPS4(); }
Tim Northover9653eb52013-12-10 16:57:43 +0000468
469 bool isTargetELF() const { return TargetTriple.isOSBinFormatELF(); }
470 bool isTargetCOFF() const { return TargetTriple.isOSBinFormatCOFF(); }
Eric Christopher21895152014-12-05 00:22:38 +0000471 bool isTargetMachO() const { return TargetTriple.isOSBinFormatMachO(); }
Tim Northover9653eb52013-12-10 16:57:43 +0000472
Cameron Esfahani943908b2013-08-29 20:23:14 +0000473 bool isTargetLinux() const { return TargetTriple.isOSLinux(); }
Marcin Koscielnicki0275fac2016-05-05 11:35:51 +0000474 bool isTargetKFreeBSD() const { return TargetTriple.isOSKFreeBSD(); }
475 bool isTargetGlibc() const { return TargetTriple.isOSGlibc(); }
Evgeniy Stepanov5fe279e2015-10-08 21:21:24 +0000476 bool isTargetAndroid() const { return TargetTriple.isAndroid(); }
Cameron Esfahani943908b2013-08-29 20:23:14 +0000477 bool isTargetNaCl() const { return TargetTriple.isOSNaCl(); }
Nick Lewycky73df7e32011-09-05 21:51:43 +0000478 bool isTargetNaCl32() const { return isTargetNaCl() && !is64Bit(); }
479 bool isTargetNaCl64() const { return isTargetNaCl() && is64Bit(); }
Michael Kupersteine1194bd2015-10-27 07:23:59 +0000480 bool isTargetMCU() const { return TargetTriple.isOSIAMCU(); }
Yaron Keren28954962014-04-02 04:27:51 +0000481
482 bool isTargetWindowsMSVC() const {
483 return TargetTriple.isWindowsMSVCEnvironment();
484 }
485
Yaron Keren136fe7d2014-04-01 18:15:34 +0000486 bool isTargetKnownWindowsMSVC() const {
NAKAMURA Takumi09717bd2014-03-30 04:35:00 +0000487 return TargetTriple.isKnownWindowsMSVCEnvironment();
Saleem Abdulrasooledbdd2e2014-03-27 22:50:05 +0000488 }
Yaron Keren28954962014-04-02 04:27:51 +0000489
Pat Gavlinb3990952015-08-14 22:41:43 +0000490 bool isTargetWindowsCoreCLR() const {
491 return TargetTriple.isWindowsCoreCLREnvironment();
492 }
493
Yaron Keren28954962014-04-02 04:27:51 +0000494 bool isTargetWindowsCygwin() const {
Saleem Abdulrasooledbdd2e2014-03-27 22:50:05 +0000495 return TargetTriple.isWindowsCygwinEnvironment();
496 }
Yaron Keren28954962014-04-02 04:27:51 +0000497
498 bool isTargetWindowsGNU() const {
499 return TargetTriple.isWindowsGNUEnvironment();
500 }
501
Saleem Abdulrasool2f3b3f32014-11-20 18:01:26 +0000502 bool isTargetWindowsItanium() const {
503 return TargetTriple.isWindowsItaniumEnvironment();
504 }
505
Chandler Carruthebd90c52012-02-05 08:26:40 +0000506 bool isTargetCygMing() const { return TargetTriple.isOSCygMing(); }
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +0000507
Yaron Keren79bb2662013-10-23 23:37:01 +0000508 bool isOSWindows() const { return TargetTriple.isOSWindows(); }
509
Anton Korobeynikov7f125b22008-03-22 20:57:27 +0000510 bool isTargetWin64() const {
Chandler Carruthebd90c52012-02-05 08:26:40 +0000511 return In64BitMode && TargetTriple.isOSWindows();
Evan Chengd22a4a12011-02-01 01:14:13 +0000512 }
513
Anton Korobeynikova5a64552010-09-02 23:03:46 +0000514 bool isTargetWin32() const {
Yaron Keren136fe7d2014-04-01 18:15:34 +0000515 return !In64BitMode && (isTargetCygMing() || isTargetKnownWindowsMSVC());
Anton Korobeynikova5a64552010-09-02 23:03:46 +0000516 }
517
Duncan Sands595a4422008-11-28 09:29:37 +0000518 bool isPICStyleSet() const { return PICStyle != PICStyles::None; }
519 bool isPICStyleGOT() const { return PICStyle == PICStyles::GOT; }
Duncan Sands595a4422008-11-28 09:29:37 +0000520 bool isPICStyleRIPRel() const { return PICStyle == PICStyles::RIPRel; }
Chris Lattnere2f524f2009-07-10 20:47:30 +0000521
Chris Lattner21c29402009-07-10 21:00:45 +0000522 bool isPICStyleStubPIC() const {
Chris Lattnerba4d7332009-07-10 20:58:47 +0000523 return PICStyle == PICStyles::StubPIC;
524 }
525
Chris Lattner21c29402009-07-10 21:00:45 +0000526 bool isPICStyleStubNoDynamic() const {
Chris Lattnerba4d7332009-07-10 20:58:47 +0000527 return PICStyle == PICStyles::StubDynamicNoPIC;
528 }
529 bool isPICStyleStubAny() const {
530 return PICStyle == PICStyles::StubDynamicNoPIC ||
Charles Davise8f297c2013-07-12 06:02:35 +0000531 PICStyle == PICStyles::StubPIC;
532 }
533
534 bool isCallingConvWin64(CallingConv::ID CC) const {
Reid Kleckner4f21df22015-07-08 21:03:47 +0000535 switch (CC) {
536 // On Win64, all these conventions just use the default convention.
537 case CallingConv::C:
538 case CallingConv::Fast:
539 case CallingConv::X86_FastCall:
540 case CallingConv::X86_StdCall:
541 case CallingConv::X86_ThisCall:
542 case CallingConv::X86_VectorCall:
543 case CallingConv::Intel_OCL_BI:
544 return isTargetWin64();
545 // This convention allows using the Win64 convention on other targets.
546 case CallingConv::X86_64_Win64:
547 return true;
548 // This convention allows using the SysV convention on Windows targets.
549 case CallingConv::X86_64_SysV:
550 return false;
551 // Otherwise, who knows what this is.
552 default:
553 return false;
554 }
Charles Davise8f297c2013-07-12 06:02:35 +0000555 }
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +0000556
Sriraman Tallam3cb77342016-04-22 21:41:58 +0000557 /// Determine if this global is defined in a Position Independent
558 /// Executable (PIE) where its definition cannot be interposed.
559 bool isGlobalDefinedInPIE(const GlobalValue *GV,
560 const TargetMachine &TM) const {
Sriraman Tallam7da9b442016-04-29 21:19:16 +0000561 return GV->getParent()->getPIELevel() != PIELevel::Default &&
Sriraman Tallam3cb77342016-04-22 21:41:58 +0000562 !GV->isDeclarationForLinker();
563 }
564
Rafael Espindolacb2d2662016-05-19 18:34:20 +0000565 /// Classify a global variable reference for the current subtarget according
566 /// to how we should reference it in a non-pcrel context.
567 unsigned char classifyGlobalReference(const GlobalValue *GV,
Chris Lattnerdc842c02009-07-10 07:20:05 +0000568 const TargetMachine &TM)const;
Anton Korobeynikov93acb492006-12-20 01:03:20 +0000569
Rafael Espindolacb2d2662016-05-19 18:34:20 +0000570 /// Classify a global function reference for the current subtarget.
Asaf Badouh89406d12016-04-20 08:32:57 +0000571 unsigned char classifyGlobalFunctionReference(const GlobalValue *GV,
572 const TargetMachine &TM) const;
573
Sanjay Patele63abfe2015-02-03 18:47:32 +0000574 /// Classify a blockaddress reference for the current subtarget according to
575 /// how we should reference it in a non-pcrel context.
Rafael Espindolacb2d2662016-05-19 18:34:20 +0000576 unsigned char classifyBlockAddressReference() const;
Dan Gohman7a6611792009-11-20 23:18:13 +0000577
Sanjay Patele63abfe2015-02-03 18:47:32 +0000578 /// Return true if the subtarget allows calls to immediate address.
Rafael Espindolacb2d2662016-05-19 18:34:20 +0000579 bool isLegalToCallImmediateAddr(const TargetMachine &TM) const;
Evan Cheng96098332009-05-20 04:53:57 +0000580
Dan Gohman980d7202008-04-01 20:38:36 +0000581 /// This function returns the name of a function which has an interface
582 /// like the non-standard bzero function, if such a function exists on
583 /// the current subtarget and it is considered prefereable over
584 /// memset with zero passed as the second argument. Otherwise it
585 /// returns null.
Bill Wendling17825842008-09-30 22:05:33 +0000586 const char *getBZeroEntry() const;
Andrew Tricke97d8d62013-10-15 23:33:07 +0000587
Evan Cheng0e88c7d2013-01-29 02:32:37 +0000588 /// This function returns true if the target has sincos() routine in its
589 /// compiler runtime or math libraries.
590 bool hasSinCos() const;
Dan Gohmanb9a01212008-12-16 03:35:01 +0000591
Andrew Tricke97d8d62013-10-15 23:33:07 +0000592 /// Enable the MachineScheduler pass for all X86 subtargets.
Craig Topper73156022014-03-02 09:09:27 +0000593 bool enableMachineScheduler() const override { return true; }
Andrew Tricke97d8d62013-10-15 23:33:07 +0000594
Eric Christopher6b0fcfe2014-05-21 23:40:26 +0000595 bool enableEarlyIfConversion() const override;
596
Sanjay Patele63abfe2015-02-03 18:47:32 +0000597 /// Return the instruction itineraries based on the subtarget selection.
Eric Christopherd9134482014-08-04 21:25:23 +0000598 const InstrItineraryData *getInstrItineraryData() const override {
599 return &InstrItins;
600 }
Sanjay Patela2f658d2014-07-15 22:39:58 +0000601
602 AntiDepBreakMode getAntiDepBreakMode() const override {
603 return TargetSubtargetInfo::ANTIDEP_CRITICAL;
604 }
Evan Cheng47455a72009-09-03 04:37:05 +0000605};
Evan Chenga8b4aea2006-10-16 21:00:37 +0000606
Alexander Kornienkof00654e2015-06-23 09:49:53 +0000607} // End llvm namespace
Nate Begemanf26625e2005-07-12 01:41:54 +0000608
609#endif