blob: c61977e8eca681cd65a9b025e437af7fed820e12 [file] [log] [blame]
Jia Liue1d61962012-02-19 02:03:36 +00001//===-- X86Subtarget.h - Define Subtarget for the X86 ----------*- C++ -*--===//
Nate Begemanf26625e2005-07-12 01:41:54 +00002//
3// The LLVM Compiler Infrastructure
4//
Chris Lattnerf3ebc3f2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Nate Begemanf26625e2005-07-12 01:41:54 +00007//
8//===----------------------------------------------------------------------===//
9//
Evan Cheng0d639a22011-07-01 21:01:15 +000010// This file declares the X86 specific subclass of TargetSubtargetInfo.
Nate Begemanf26625e2005-07-12 01:41:54 +000011//
12//===----------------------------------------------------------------------===//
13
Benjamin Kramera7c40ef2014-08-13 16:26:38 +000014#ifndef LLVM_LIB_TARGET_X86_X86SUBTARGET_H
15#define LLVM_LIB_TARGET_X86_X86SUBTARGET_H
Nate Begemanf26625e2005-07-12 01:41:54 +000016
Eric Christophera08f30b2014-06-09 17:08:19 +000017#include "X86FrameLowering.h"
18#include "X86ISelLowering.h"
19#include "X86InstrInfo.h"
Eric Christophera08f30b2014-06-09 17:08:19 +000020#include "X86SelectionDAGInfo.h"
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000021#include "llvm/ADT/StringRef.h"
Eric Christopherd4298462010-07-05 19:26:33 +000022#include "llvm/ADT/Triple.h"
Quentin Colombet61d71a12017-08-15 22:31:51 +000023#include "llvm/CodeGen/GlobalISel/CallLowering.h"
24#include "llvm/CodeGen/GlobalISel/InstructionSelector.h"
25#include "llvm/CodeGen/GlobalISel/LegalizerInfo.h"
26#include "llvm/CodeGen/GlobalISel/RegisterBankInfo.h"
David Blaikieb3bde2e2017-11-17 01:07:10 +000027#include "llvm/CodeGen/TargetSubtargetInfo.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000028#include "llvm/IR/CallingConv.h"
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000029#include "llvm/MC/MCInstrItineraries.h"
30#include "llvm/Target/TargetMachine.h"
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000031#include <memory>
Jim Laskey19058c32005-09-01 21:38:21 +000032
Evan Cheng54b68e32011-07-01 20:45:01 +000033#define GET_SUBTARGETINFO_HEADER
Evan Chengc9c090d2011-07-01 22:36:09 +000034#include "X86GenSubtargetInfo.inc"
Evan Cheng54b68e32011-07-01 20:45:01 +000035
Nate Begemanf26625e2005-07-12 01:41:54 +000036namespace llvm {
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000037
Anton Korobeynikov6dbdfe22006-11-30 22:42:55 +000038class GlobalValue;
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +000039
Sanjay Patele63abfe2015-02-03 18:47:32 +000040/// The X86 backend supports a number of different styles of PIC.
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +000041///
Duncan Sands595a4422008-11-28 09:29:37 +000042namespace PICStyles {
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000043
Anton Korobeynikova0554d92007-01-12 19:20:47 +000044enum Style {
Rafael Espindola0d348262016-06-20 23:41:56 +000045 StubPIC, // Used on i386-darwin in pic mode.
46 GOT, // Used on 32 bit elf on when in pic mode.
47 RIPRel, // Used on X86-64 when in pic mode.
48 None // Set when not in pic mode.
Anton Korobeynikova0554d92007-01-12 19:20:47 +000049};
Eugene Zelenkofbd13c52017-02-02 22:55:55 +000050
51} // end namespace PICStyles
Nate Begemanf26625e2005-07-12 01:41:54 +000052
Craig Topperec828472014-03-31 06:53:13 +000053class X86Subtarget final : public X86GenSubtargetInfo {
Mohammed Agabaria115f68e2017-11-20 08:18:12 +000054public:
Andrew Trick8523b162012-02-01 23:20:51 +000055 enum X86ProcFamilyEnum {
Mohammed Agabaria115f68e2017-11-20 08:18:12 +000056 Others,
Mohammed Agabariae9aebf22017-09-13 09:00:27 +000057 IntelAtom,
58 IntelSLM,
59 IntelGLM,
60 IntelHaswell,
61 IntelBroadwell,
62 IntelSkylake,
63 IntelKNL,
64 IntelSKX,
Craig Topper81037f32017-11-19 01:12:00 +000065 IntelCannonlake,
66 IntelIcelake,
Andrew Trick8523b162012-02-01 23:20:51 +000067 };
68
Mohammed Agabaria115f68e2017-11-20 08:18:12 +000069protected:
70 enum X86SSEEnum {
71 NoSSE, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, AVX, AVX2, AVX512F
72 };
73
74 enum X863DNowEnum {
75 NoThreeDNow, MMX, ThreeDNow, ThreeDNowA
76 };
77
Sanjay Patele63abfe2015-02-03 18:47:32 +000078 /// X86 processor family: Intel Atom, and others
Andrew Trick8523b162012-02-01 23:20:51 +000079 X86ProcFamilyEnum X86ProcFamily;
Chad Rosier24c19d22012-08-01 18:39:17 +000080
Sanjay Patele63abfe2015-02-03 18:47:32 +000081 /// Which PIC style to use
Duncan Sands595a4422008-11-28 09:29:37 +000082 PICStyles::Style PICStyle;
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +000083
Rafael Espindolaab03eb02016-05-19 22:07:57 +000084 const TargetMachine &TM;
Rafael Espindola46107b92016-05-19 18:49:29 +000085
Eric Christopher11e59832015-10-08 20:10:06 +000086 /// SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, or none supported.
Evan Chengcde9e302006-01-27 08:10:46 +000087 X86SSEEnum X86SSELevel;
88
Eric Christopher57a6e132015-11-14 03:04:00 +000089 /// MMX, 3DNow, 3DNow Athlon, or none supported.
Evan Chengff1beda2006-10-06 09:17:41 +000090 X863DNowEnum X863DNowLevel;
91
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +000092 /// True if the processor supports X87 instructions.
93 bool HasX87;
94
Craig Topper505f38a2018-01-10 22:07:16 +000095 /// True if this processor has NOPL instruction
96 /// (generally pentium pro+).
97 bool HasNOPL;
98
Sanjay Patele63abfe2015-02-03 18:47:32 +000099 /// True if this processor has conditional move instructions
Chris Lattnercc8c5812009-09-02 05:53:04 +0000100 /// (generally pentium pro+).
101 bool HasCMov;
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +0000102
Sanjay Patele63abfe2015-02-03 18:47:32 +0000103 /// True if the processor supports X86-64 instructions.
Evan Cheng11b0a5d2006-09-08 06:48:29 +0000104 bool HasX86_64;
Evan Cheng4c91aa32009-01-02 05:35:45 +0000105
Sanjay Patele63abfe2015-02-03 18:47:32 +0000106 /// True if the processor supports POPCNT.
Benjamin Kramer2f489232010-12-04 20:32:23 +0000107 bool HasPOPCNT;
108
Sanjay Patele63abfe2015-02-03 18:47:32 +0000109 /// True if the processor supports SSE4A instructions.
Stefanus Du Toit96180b52009-05-26 21:04:35 +0000110 bool HasSSE4A;
111
Sanjay Patele63abfe2015-02-03 18:47:32 +0000112 /// Target has AES instructions
Eric Christopher2ef63182010-04-02 21:54:27 +0000113 bool HasAES;
Coby Tayree2a1c02f2017-11-21 09:11:41 +0000114 bool HasVAES;
Eric Christopher2ef63182010-04-02 21:54:27 +0000115
Craig Topper09b65982015-10-16 06:03:09 +0000116 /// Target has FXSAVE/FXRESTOR instructions
117 bool HasFXSR;
118
Amjad Aboud1db6d7a2015-10-12 11:47:46 +0000119 /// Target has XSAVE instructions
120 bool HasXSAVE;
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000121
Amjad Aboud1db6d7a2015-10-12 11:47:46 +0000122 /// Target has XSAVEOPT instructions
123 bool HasXSAVEOPT;
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000124
Amjad Aboud1db6d7a2015-10-12 11:47:46 +0000125 /// Target has XSAVEC instructions
126 bool HasXSAVEC;
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000127
Amjad Aboud1db6d7a2015-10-12 11:47:46 +0000128 /// Target has XSAVES instructions
129 bool HasXSAVES;
130
Sanjay Patele63abfe2015-02-03 18:47:32 +0000131 /// Target has carry-less multiplication
Benjamin Kramera0396e42012-05-31 14:34:17 +0000132 bool HasPCLMUL;
Coby Tayree7ca5e5872017-11-21 09:30:33 +0000133 bool HasVPCLMULQDQ;
Bruno Cardoso Lopes09dc24b2010-07-23 01:17:51 +0000134
Coby Tayreed8b17be2017-11-26 09:36:41 +0000135 /// Target has Galois Field Arithmetic instructions
136 bool HasGFNI;
137
Sanjay Patele63abfe2015-02-03 18:47:32 +0000138 /// Target has 3-operand fused multiply-add
Craig Topper79dbb0c2012-06-03 18:58:46 +0000139 bool HasFMA;
David Greene8f6f72c2009-06-26 22:46:54 +0000140
Sanjay Patele63abfe2015-02-03 18:47:32 +0000141 /// Target has 4-operand fused multiply-add
David Greene8f6f72c2009-06-26 22:46:54 +0000142 bool HasFMA4;
143
Sanjay Patele63abfe2015-02-03 18:47:32 +0000144 /// Target has XOP instructions
Jan Sjödin1280eb12011-12-02 15:14:37 +0000145 bool HasXOP;
146
Sanjay Patele63abfe2015-02-03 18:47:32 +0000147 /// Target has TBM instructions.
Yunzhong Gaodd36e932013-09-24 18:21:52 +0000148 bool HasTBM;
149
Simon Pilgrim99b925b2017-05-03 15:51:39 +0000150 /// Target has LWP instructions
151 bool HasLWP;
152
Sanjay Patele63abfe2015-02-03 18:47:32 +0000153 /// True if the processor has the MOVBE instruction.
Craig Topper786bdb92011-10-03 17:28:23 +0000154 bool HasMOVBE;
155
Sanjay Patele63abfe2015-02-03 18:47:32 +0000156 /// True if the processor has the RDRAND instruction.
Craig Topper786bdb92011-10-03 17:28:23 +0000157 bool HasRDRAND;
158
Sanjay Patele63abfe2015-02-03 18:47:32 +0000159 /// Processor has 16-bit floating point conversion instructions.
Craig Topperfe9179f2011-10-09 07:31:39 +0000160 bool HasF16C;
161
Sanjay Patele63abfe2015-02-03 18:47:32 +0000162 /// Processor has FS/GS base insturctions.
Craig Topper228d9132011-10-30 19:57:21 +0000163 bool HasFSGSBase;
164
Sanjay Patele63abfe2015-02-03 18:47:32 +0000165 /// Processor has LZCNT instruction.
Craig Topper271064e2011-10-11 06:44:02 +0000166 bool HasLZCNT;
167
Sanjay Patele63abfe2015-02-03 18:47:32 +0000168 /// Processor has BMI1 instructions.
Craig Topper3657fe42011-10-14 03:21:46 +0000169 bool HasBMI;
170
Sanjay Patele63abfe2015-02-03 18:47:32 +0000171 /// Processor has BMI2 instructions.
Craig Topperaea148c2011-10-16 07:55:05 +0000172 bool HasBMI2;
173
Michael Zuckerman97b6a6922016-01-17 13:42:12 +0000174 /// Processor has VBMI instructions.
175 bool HasVBMI;
176
Coby Tayree71e37cc2017-11-21 09:48:44 +0000177 /// Processor has VBMI2 instructions.
178 bool HasVBMI2;
179
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000180 /// Processor has Integer Fused Multiply Add
181 bool HasIFMA;
182
Sanjay Patele63abfe2015-02-03 18:47:32 +0000183 /// Processor has RTM instructions.
Michael Liao73cffdd2012-11-08 07:28:54 +0000184 bool HasRTM;
185
Sanjay Patele63abfe2015-02-03 18:47:32 +0000186 /// Processor has ADX instructions.
Kay Tiong Khoof809c642013-02-14 19:08:21 +0000187 bool HasADX;
188
Sanjay Patele63abfe2015-02-03 18:47:32 +0000189 /// Processor has SHA instructions.
Ben Langmuir16501752013-09-12 15:51:31 +0000190 bool HasSHA;
191
Sanjay Patele63abfe2015-02-03 18:47:32 +0000192 /// Processor has PRFCHW instructions.
Michael Liao5173ee02013-03-26 17:47:11 +0000193 bool HasPRFCHW;
194
Sanjay Patele63abfe2015-02-03 18:47:32 +0000195 /// Processor has RDSEED instructions.
Michael Liaoa486a112013-03-28 23:41:26 +0000196 bool HasRDSEED;
197
Hans Wennborg5000ce82015-12-04 23:00:33 +0000198 /// Processor has LAHF/SAHF instructions.
199 bool HasLAHFSAHF;
200
Ashutosh Nema348af9c2016-05-18 11:59:12 +0000201 /// Processor has MONITORX/MWAITX instructions.
202 bool HasMWAITX;
203
Craig Topper50f3d142017-02-09 04:27:34 +0000204 /// Processor has Cache Line Zero instruction
205 bool HasCLZERO;
206
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000207 /// Processor has Prefetch with intent to Write instruction
Craig Toppere2685982017-12-22 02:30:30 +0000208 bool HasPREFETCHWT1;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000209
Sanjay Patele63abfe2015-02-03 18:47:32 +0000210 /// True if SHLD instructions are slow.
Ekaterina Romanovad5fa5542013-11-21 23:21:26 +0000211 bool IsSHLDSlow;
212
Zvi Rackover8bc7e4d2016-12-06 19:35:20 +0000213 /// True if the PMULLD instruction is slow compared to PMULLW/PMULHW and
214 // PMULUDQ.
215 bool IsPMULLDSlow;
216
Sanjay Patel30145672015-09-01 20:51:51 +0000217 /// True if unaligned memory accesses of 16-bytes are slow.
218 bool IsUAMem16Slow;
Evan Cheng738b0f92010-04-01 05:58:17 +0000219
Sanjay Patel9e916dc2015-08-21 20:17:26 +0000220 /// True if unaligned memory accesses of 32-bytes are slow.
Sanjay Patel501890e2014-11-21 17:40:04 +0000221 bool IsUAMem32Slow;
Michael Liao5bf95782014-12-04 05:20:33 +0000222
Sanjay Patelffd039b2015-02-03 17:13:04 +0000223 /// True if SSE operations can have unaligned memory operands.
224 /// This may require setting a configuration bit in the processor.
225 bool HasSSEUnalignedMem;
David Greene206351a2010-01-11 16:29:42 +0000226
Sanjay Patele63abfe2015-02-03 18:47:32 +0000227 /// True if this processor has the CMPXCHG16B instruction;
Eli Friedman5e570422011-08-26 21:21:21 +0000228 /// this is true for most x86-64 chips, but not the first AMD chips.
229 bool HasCmpxchg16b;
230
Sanjay Patele63abfe2015-02-03 18:47:32 +0000231 /// True if the LEA instruction should be used for adjusting
Evan Cheng1b81fdd2012-02-07 22:50:41 +0000232 /// the stack pointer. This is an optimization for Intel Atom processors.
233 bool UseLeaForSP;
234
Marina Yatsina77a21db2018-01-22 10:07:01 +0000235 /// True if POPCNT instruction has a false dependency on the destination register.
236 bool HasPOPCNTFalseDeps;
237
238 /// True if LZCNT/TZCNT instructions have a false dependency on the destination register.
239 bool HasLZCNTFalseDeps;
240
Simon Pilgrimfd5df632017-12-19 13:16:43 +0000241 /// True if its preferable to combine to a single shuffle using a variable
242 /// mask over multiple fixed shuffles.
243 bool HasFastVariableShuffle;
244
Yunzhong Gao0de36ec2016-02-12 23:37:57 +0000245 /// True if there is no performance penalty to writing only the lower parts
Amjad Aboud4f977512017-03-03 09:03:24 +0000246 /// of a YMM or ZMM register without clearing the upper part.
247 bool HasFastPartialYMMorZMMWrite;
Yunzhong Gao0de36ec2016-02-12 23:37:57 +0000248
Simon Pilgrim02bdac52018-01-29 21:24:31 +0000249 /// True if there is no performance penalty for writing NOPs with up to
250 /// 11 bytes.
251 bool HasFast11ByteNOP;
252
253 /// True if there is no performance penalty for writing NOPs with up to
254 /// 15 bytes.
255 bool HasFast15ByteNOP;
256
Craig Topperea37e202017-11-25 18:09:37 +0000257 /// True if gather is reasonably fast. This is true for Skylake client and
258 /// all AVX-512 CPUs.
259 bool HasFastGather;
260
Nikolai Bozhenovf6795302016-08-04 12:47:28 +0000261 /// True if hardware SQRTSS instruction is at least as fast (latency) as
262 /// RSQRTSS followed by a Newton-Raphson iteration.
263 bool HasFastScalarFSQRT;
264
265 /// True if hardware SQRTPS/VSQRTPS instructions are at least as fast
266 /// (throughput) as RSQRTPS/VRSQRTPS followed by a Newton-Raphson iteration.
267 bool HasFastVectorFSQRT;
268
Sanjay Patele63abfe2015-02-03 18:47:32 +0000269 /// True if 8-bit divisions are significantly faster than
Alexey Volkovfd1731d2014-11-21 11:19:34 +0000270 /// 32-bit divisions and should be used when possible.
271 bool HasSlowDivide32;
272
Nikolai Bozhenov6bdf92c2017-01-12 19:34:15 +0000273 /// True if 32-bit divides are significantly faster than
Alexey Volkovfd1731d2014-11-21 11:19:34 +0000274 /// 64-bit divisions and should be used when possible.
275 bool HasSlowDivide64;
Preston Gurdcdf540d2012-09-04 18:22:17 +0000276
Pierre Gousseaub6d652a2016-10-14 16:41:38 +0000277 /// True if LZCNT instruction is fast.
278 bool HasFastLZCNT;
279
Craig Topperd88389a2017-02-21 06:39:13 +0000280 /// True if SHLD based rotate is fast.
281 bool HasFastSHLDRotate;
282
Craig Topper641e2af2017-08-30 04:34:48 +0000283 /// True if the processor supports macrofusion.
284 bool HasMacroFusion;
285
Clement Courbet203fc172017-04-21 09:20:50 +0000286 /// True if the processor has enhanced REP MOVSB/STOSB.
287 bool HasERMSB;
Clement Courbet1ce3b822017-04-21 09:20:39 +0000288
Sanjay Patele63abfe2015-02-03 18:47:32 +0000289 /// True if the short functions should be padded to prevent
Preston Gurda01daac2013-01-08 18:27:24 +0000290 /// a stall when returning too early.
291 bool PadShortFunctions;
292
Craig Topper62c47a22017-08-29 05:14:27 +0000293 /// True if two memory operand instructions should use a temporary register
294 /// instead.
295 bool SlowTwoMemOps;
Sanjay Patele63abfe2015-02-03 18:47:32 +0000296
297 /// True if the LEA instruction inputs have to be ready at address generation
298 /// (AG) time.
Preston Gurd8b7ab4b2013-04-25 20:29:37 +0000299 bool LEAUsesAG;
Preston Gurd663e6f92013-03-27 19:14:02 +0000300
Sanjay Patele63abfe2015-02-03 18:47:32 +0000301 /// True if the LEA instruction with certain arguments is slow
Alexey Volkov6226de62014-05-20 08:55:50 +0000302 bool SlowLEA;
303
Lama Saba2ea271b2017-05-18 08:11:50 +0000304 /// True if the LEA instruction has all three source operands: base, index,
305 /// and offset or if the LEA instruction uses base and index registers where
306 /// the base is EBP, RBP,or R13
307 bool Slow3OpsLEA;
308
Sanjay Patele63abfe2015-02-03 18:47:32 +0000309 /// True if INC and DEC instructions are slow when writing to flags
Alexey Volkov5260dba2014-06-09 11:40:41 +0000310 bool SlowIncDec;
311
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000312 /// Processor has AVX-512 PreFetch Instructions
313 bool HasPFI;
Robert Khasanovbfa01312014-07-21 14:54:21 +0000314
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000315 /// Processor has AVX-512 Exponential and Reciprocal Instructions
316 bool HasERI;
Robert Khasanovbfa01312014-07-21 14:54:21 +0000317
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000318 /// Processor has AVX-512 Conflict Detection Instructions
319 bool HasCDI;
Robert Khasanovbfa01312014-07-21 14:54:21 +0000320
Oren Ben Simhon7bf27f02017-05-25 13:45:23 +0000321 /// Processor has AVX-512 population count Instructions
322 bool HasVPOPCNTDQ;
323
Robert Khasanovbfa01312014-07-21 14:54:21 +0000324 /// Processor has AVX-512 Doubleword and Quadword instructions
325 bool HasDQI;
326
327 /// Processor has AVX-512 Byte and Word instructions
328 bool HasBWI;
329
330 /// Processor has AVX-512 Vector Length eXtenstions
331 bool HasVLX;
332
Asaf Badouh5acf66f2015-12-15 13:35:29 +0000333 /// Processor has PKU extenstions
334 bool HasPKU;
335
Coby Tayree3880f2a2017-11-21 10:04:28 +0000336 /// Processor has AVX-512 Vector Neural Network Instructions
337 bool HasVNNI;
338
Coby Tayree5c7fe5d2017-11-21 10:32:42 +0000339 /// Processor has AVX-512 Bit Algorithms instructions
340 bool HasBITALG;
341
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000342 /// Processor supports MPX - Memory Protection Extensions
Elena Demikhovskyf7e641c2015-06-03 10:30:57 +0000343 bool HasMPX;
344
Oren Ben Simhonfa582b02017-11-26 13:02:45 +0000345 /// Processor supports CET SHSTK - Control-Flow Enforcement Technology
346 /// using Shadow Stack
347 bool HasSHSTK;
348
349 /// Processor supports CET IBT - Control-Flow Enforcement Technology
350 /// using Indirect Branch Tracking
351 bool HasIBT;
352
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000353 /// Processor has Software Guard Extensions
354 bool HasSGX;
355
356 /// Processor supports Flush Cache Line instruction
357 bool HasCLFLUSHOPT;
358
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000359 /// Processor supports Cache Line Write Back instruction
360 bool HasCLWB;
361
Craig Topper84b26b92018-01-18 23:52:31 +0000362 /// Processor support RDPID instruction
363 bool HasRDPID;
364
Chandler Carruthc58f2162018-01-22 22:05:25 +0000365 /// Use a retpoline thunk rather than indirect calls to block speculative
366 /// execution.
367 bool UseRetpoline;
368
369 /// When using a retpoline thunk, call an externally provided thunk rather
370 /// than emitting one inside the compiler.
371 bool UseRetpolineExternalThunk;
372
Eric Christopher824f42f2015-05-12 01:26:05 +0000373 /// Use software floating point for code generation.
374 bool UseSoftFloat;
375
Sanjay Patele63abfe2015-02-03 18:47:32 +0000376 /// The minimum alignment known to hold of the stack frame on
Chris Lattner351817b2005-07-12 02:36:10 +0000377 /// entry to the function and which must be maintained by every function.
Nate Begemanf26625e2005-07-12 01:41:54 +0000378 unsigned stackAlignment;
Jeff Cohen33a030e2005-07-27 05:53:44 +0000379
Rafael Espindola063f1772007-10-31 11:52:06 +0000380 /// Max. memset / memcpy size that is turned into rep/movs, rep/stos ops.
Evan Cheng763cdfd2007-08-01 23:45:51 +0000381 ///
Rafael Espindola063f1772007-10-31 11:52:06 +0000382 unsigned MaxInlineSizeThreshold;
NAKAMURA Takumi0544fe72011-02-17 12:23:50 +0000383
Craig Topper0d797a32018-01-20 00:26:08 +0000384 /// Indicates target prefers 256 bit instructions.
385 bool Prefer256Bit;
386
Sanjay Patele63abfe2015-02-03 18:47:32 +0000387 /// What processor and OS we're targeting.
Eric Christopherd4298462010-07-05 19:26:33 +0000388 Triple TargetTriple;
Chad Rosier24c19d22012-08-01 18:39:17 +0000389
Andrew Trick8523b162012-02-01 23:20:51 +0000390 /// Instruction itineraries for scheduling
391 InstrItineraryData InstrItins;
Evan Cheng03c1e6f2006-02-16 00:21:07 +0000392
Quentin Colombet61d71a12017-08-15 22:31:51 +0000393 /// GlobalISel related APIs.
394 std::unique_ptr<CallLowering> CallLoweringInfo;
395 std::unique_ptr<LegalizerInfo> Legalizer;
396 std::unique_ptr<RegisterBankInfo> RegBankInfo;
397 std::unique_ptr<InstructionSelector> InstSelector;
Eric Christophere950b672014-08-09 04:38:53 +0000398
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000399private:
Sanjay Patele63abfe2015-02-03 18:47:32 +0000400 /// Override the stack alignment.
Bill Wendlingaef9c372013-02-15 22:31:27 +0000401 unsigned StackAlignOverride;
402
Craig Topper0d797a32018-01-20 00:26:08 +0000403 /// Preferred vector width from function attribute.
404 unsigned PreferVectorWidthOverride;
405
406 /// Resolved preferred vector width from function attribute and subtarget
407 /// features.
408 unsigned PreferVectorWidth;
409
Craig Topper24d3b282018-02-11 08:06:27 +0000410 /// Required vector width from function attribute.
411 unsigned RequiredVectorWidth;
412
Sanjay Patele63abfe2015-02-03 18:47:32 +0000413 /// True if compiling for 64-bit, false for 16-bit or 32-bit.
Evan Cheng13bcc6c2011-07-07 21:06:52 +0000414 bool In64BitMode;
Evan Cheng11b0a5d2006-09-08 06:48:29 +0000415
Sanjay Patele63abfe2015-02-03 18:47:32 +0000416 /// True if compiling for 32-bit, false for 16-bit or 64-bit.
Craig Topper3c80d622014-01-06 04:55:54 +0000417 bool In32BitMode;
418
Sanjay Patele63abfe2015-02-03 18:47:32 +0000419 /// True if compiling for 16-bit, false for 32-bit or 64-bit.
Craig Topper3c80d622014-01-06 04:55:54 +0000420 bool In16BitMode;
421
Mohammed Agabariae9aebf22017-09-13 09:00:27 +0000422 /// Contains the Overhead of gather\scatter instructions
423 int GatherOverhead;
424 int ScatterOverhead;
425
Eric Christophera08f30b2014-06-09 17:08:19 +0000426 X86SelectionDAGInfo TSInfo;
Eric Christopher1a212032014-06-11 00:25:19 +0000427 // Ordering here is important. X86InstrInfo initializes X86RegisterInfo which
428 // X86TargetLowering needs.
429 X86InstrInfo InstrInfo;
430 X86TargetLowering TLInfo;
431 X86FrameLowering FrameLowering;
Eric Christophera08f30b2014-06-09 17:08:19 +0000432
Nate Begemanf26625e2005-07-12 01:41:54 +0000433public:
Jeff Cohen33a030e2005-07-27 05:53:44 +0000434 /// This constructor initializes the data members to match that
Daniel Dunbar31b44e82009-08-02 22:11:08 +0000435 /// of the specified triple.
Nate Begemanf26625e2005-07-12 01:41:54 +0000436 ///
David Majnemerca290232016-05-20 18:16:06 +0000437 X86Subtarget(const Triple &TT, StringRef CPU, StringRef FS,
Craig Topper0d797a32018-01-20 00:26:08 +0000438 const X86TargetMachine &TM, unsigned StackAlignOverride,
Craig Topper24d3b282018-02-11 08:06:27 +0000439 unsigned PreferVectorWidthOverride,
440 unsigned RequiredVectorWidth);
Eric Christophera08f30b2014-06-09 17:08:19 +0000441
Eric Christopherd9134482014-08-04 21:25:23 +0000442 const X86TargetLowering *getTargetLowering() const override {
443 return &TLInfo;
444 }
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000445
Eric Christopherd9134482014-08-04 21:25:23 +0000446 const X86InstrInfo *getInstrInfo() const override { return &InstrInfo; }
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000447
Eric Christopherd9134482014-08-04 21:25:23 +0000448 const X86FrameLowering *getFrameLowering() const override {
449 return &FrameLowering;
450 }
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000451
Eric Christopherd9134482014-08-04 21:25:23 +0000452 const X86SelectionDAGInfo *getSelectionDAGInfo() const override {
453 return &TSInfo;
454 }
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000455
Eric Christopherd9134482014-08-04 21:25:23 +0000456 const X86RegisterInfo *getRegisterInfo() const override {
457 return &getInstrInfo()->getRegisterInfo();
458 }
Chris Lattner351817b2005-07-12 02:36:10 +0000459
Sanjay Patele63abfe2015-02-03 18:47:32 +0000460 /// Returns the minimum alignment known to hold of the
Chris Lattner351817b2005-07-12 02:36:10 +0000461 /// stack frame on entry to the function and which must be maintained by every
462 /// function for this subtarget.
Nate Begemanf26625e2005-07-12 01:41:54 +0000463 unsigned getStackAlignment() const { return stackAlignment; }
Jeff Cohen33a030e2005-07-27 05:53:44 +0000464
Sanjay Patele63abfe2015-02-03 18:47:32 +0000465 /// Returns the maximum memset / memcpy size
Rafael Espindola063f1772007-10-31 11:52:06 +0000466 /// that still makes it profitable to inline the call.
467 unsigned getMaxInlineSizeThreshold() const { return MaxInlineSizeThreshold; }
Anton Korobeynikov5b96cde2006-11-21 00:01:06 +0000468
469 /// ParseSubtargetFeatures - Parses features string setting specified
Evan Chengff1beda2006-10-06 09:17:41 +0000470 /// subtarget options. Definition of function is auto generated by tblgen.
Evan Cheng1a72add62011-07-07 07:07:08 +0000471 void ParseSubtargetFeatures(StringRef CPU, StringRef FS);
Evan Chengff1beda2006-10-06 09:17:41 +0000472
Zvi Rackover76dbf262016-11-15 06:34:33 +0000473 /// Methods used by Global ISel
474 const CallLowering *getCallLowering() const override;
475 const InstructionSelector *getInstructionSelector() const override;
476 const LegalizerInfo *getLegalizerInfo() const override;
477 const RegisterBankInfo *getRegBankInfo() const override;
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000478
Bill Wendling61375d82013-02-16 01:36:26 +0000479private:
Sanjay Patele63abfe2015-02-03 18:47:32 +0000480 /// Initialize the full set of dependencies so we can use an initializer
Eric Christopher1a212032014-06-11 00:25:19 +0000481 /// list for X86Subtarget.
482 X86Subtarget &initializeSubtargetDependencies(StringRef CPU, StringRef FS);
Bill Wendling61375d82013-02-16 01:36:26 +0000483 void initializeEnvironment();
Eric Christopherb68e2532014-09-03 20:36:31 +0000484 void initSubtargetFeatures(StringRef CPU, StringRef FS);
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000485
Bill Wendling61375d82013-02-16 01:36:26 +0000486public:
Eli Bendersky597fc122013-01-25 22:07:43 +0000487 /// Is this x86_64? (disregarding specific ABI / programming model)
488 bool is64Bit() const {
489 return In64BitMode;
490 }
491
Craig Topper3c80d622014-01-06 04:55:54 +0000492 bool is32Bit() const {
493 return In32BitMode;
494 }
495
496 bool is16Bit() const {
497 return In16BitMode;
498 }
499
Eli Bendersky597fc122013-01-25 22:07:43 +0000500 /// Is this x86_64 with the ILP32 programming model (x32 ABI)?
501 bool isTarget64BitILP32() const {
Rafael Espindoladdb913c2013-12-19 00:44:37 +0000502 return In64BitMode && (TargetTriple.getEnvironment() == Triple::GNUX32 ||
Simon Pilgrima2794102014-11-22 19:12:10 +0000503 TargetTriple.isOSNaCl());
Eli Bendersky597fc122013-01-25 22:07:43 +0000504 }
505
506 /// Is this x86_64 with the LP64 programming model (standard AMD64, no x32)?
507 bool isTarget64BitLP64() const {
Pavel Chupinf55eb452014-08-07 09:41:19 +0000508 return In64BitMode && (TargetTriple.getEnvironment() != Triple::GNUX32 &&
Simon Pilgrima2794102014-11-22 19:12:10 +0000509 !TargetTriple.isOSNaCl());
Eli Bendersky597fc122013-01-25 22:07:43 +0000510 }
Evan Cheng54c13da2006-01-26 09:53:06 +0000511
Duncan Sands595a4422008-11-28 09:29:37 +0000512 PICStyles::Style getPICStyle() const { return PICStyle; }
513 void setPICStyle(PICStyles::Style Style) { PICStyle = Style; }
Anton Korobeynikova0554d92007-01-12 19:20:47 +0000514
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000515 bool hasX87() const { return HasX87; }
Craig Topper505f38a2018-01-10 22:07:16 +0000516 bool hasNOPL() const { return HasNOPL; }
Chris Lattnera30d4ce2010-03-14 18:31:44 +0000517 bool hasCMov() const { return HasCMov; }
Craig Toppereb8f9e92012-01-10 06:30:56 +0000518 bool hasSSE1() const { return X86SSELevel >= SSE1; }
519 bool hasSSE2() const { return X86SSELevel >= SSE2; }
520 bool hasSSE3() const { return X86SSELevel >= SSE3; }
521 bool hasSSSE3() const { return X86SSELevel >= SSSE3; }
522 bool hasSSE41() const { return X86SSELevel >= SSE41; }
523 bool hasSSE42() const { return X86SSELevel >= SSE42; }
Craig Topperb0c0f722012-01-10 06:54:16 +0000524 bool hasAVX() const { return X86SSELevel >= AVX; }
525 bool hasAVX2() const { return X86SSELevel >= AVX2; }
Craig Topper5c94bb82013-08-21 03:57:57 +0000526 bool hasAVX512() const { return X86SSELevel >= AVX512F; }
Elena Demikhovskyeace43b2012-11-29 12:44:59 +0000527 bool hasInt256() const { return hasAVX2(); }
Stefanus Du Toit96180b52009-05-26 21:04:35 +0000528 bool hasSSE4A() const { return HasSSE4A; }
Eric Christopher57a6e132015-11-14 03:04:00 +0000529 bool hasMMX() const { return X863DNowLevel >= MMX; }
Evan Chengff1beda2006-10-06 09:17:41 +0000530 bool has3DNow() const { return X863DNowLevel >= ThreeDNow; }
531 bool has3DNowA() const { return X863DNowLevel >= ThreeDNowA; }
Benjamin Kramer2f489232010-12-04 20:32:23 +0000532 bool hasPOPCNT() const { return HasPOPCNT; }
Eric Christopher2ef63182010-04-02 21:54:27 +0000533 bool hasAES() const { return HasAES; }
Coby Tayree2a1c02f2017-11-21 09:11:41 +0000534 bool hasVAES() const { return HasVAES; }
Craig Topper09b65982015-10-16 06:03:09 +0000535 bool hasFXSR() const { return HasFXSR; }
Amjad Aboud1db6d7a2015-10-12 11:47:46 +0000536 bool hasXSAVE() const { return HasXSAVE; }
537 bool hasXSAVEOPT() const { return HasXSAVEOPT; }
538 bool hasXSAVEC() const { return HasXSAVEC; }
539 bool hasXSAVES() const { return HasXSAVES; }
Benjamin Kramera0396e42012-05-31 14:34:17 +0000540 bool hasPCLMUL() const { return HasPCLMUL; }
Coby Tayree7ca5e5872017-11-21 09:30:33 +0000541 bool hasVPCLMULQDQ() const { return HasVPCLMULQDQ; }
Coby Tayreed8b17be2017-11-26 09:36:41 +0000542 bool hasGFNI() const { return HasGFNI; }
Simon Pilgrimdb26b3d2015-11-30 22:22:06 +0000543 // Prefer FMA4 to FMA - its better for commutation/memory folding and
544 // has equal or better performance on all supported targets.
Craig Toppere4856312017-11-25 18:32:43 +0000545 bool hasFMA() const { return HasFMA; }
Simon Pilgrimdb26b3d2015-11-30 22:22:06 +0000546 bool hasFMA4() const { return HasFMA4; }
Craig Toppera8d40972017-03-17 07:37:31 +0000547 bool hasAnyFMA() const { return hasFMA() || hasFMA4(); }
Jan Sjödin1280eb12011-12-02 15:14:37 +0000548 bool hasXOP() const { return HasXOP; }
Yunzhong Gaodd36e932013-09-24 18:21:52 +0000549 bool hasTBM() const { return HasTBM; }
Simon Pilgrim99b925b2017-05-03 15:51:39 +0000550 bool hasLWP() const { return HasLWP; }
Craig Topper786bdb92011-10-03 17:28:23 +0000551 bool hasMOVBE() const { return HasMOVBE; }
552 bool hasRDRAND() const { return HasRDRAND; }
Craig Topperfe9179f2011-10-09 07:31:39 +0000553 bool hasF16C() const { return HasF16C; }
Craig Topper228d9132011-10-30 19:57:21 +0000554 bool hasFSGSBase() const { return HasFSGSBase; }
Craig Topper271064e2011-10-11 06:44:02 +0000555 bool hasLZCNT() const { return HasLZCNT; }
Craig Topper3657fe42011-10-14 03:21:46 +0000556 bool hasBMI() const { return HasBMI; }
Craig Topperaea148c2011-10-16 07:55:05 +0000557 bool hasBMI2() const { return HasBMI2; }
Michael Zuckerman97b6a6922016-01-17 13:42:12 +0000558 bool hasVBMI() const { return HasVBMI; }
Coby Tayree71e37cc2017-11-21 09:48:44 +0000559 bool hasVBMI2() const { return HasVBMI2; }
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000560 bool hasIFMA() const { return HasIFMA; }
Michael Liao73cffdd2012-11-08 07:28:54 +0000561 bool hasRTM() const { return HasRTM; }
Kay Tiong Khoof809c642013-02-14 19:08:21 +0000562 bool hasADX() const { return HasADX; }
Ben Langmuir16501752013-09-12 15:51:31 +0000563 bool hasSHA() const { return HasSHA; }
Craig Toppere2685982017-12-22 02:30:30 +0000564 bool hasPRFCHW() const { return HasPRFCHW || HasPREFETCHWT1; }
565 bool hasPREFETCHWT1() const { return HasPREFETCHWT1; }
566 bool hasSSEPrefetch() const {
567 // We implicitly enable these when we have a write prefix supporting cache
568 // level OR if we have prfchw, but don't already have a read prefetch from
569 // 3dnow.
570 return hasSSE1() || (hasPRFCHW() && !has3DNow()) || hasPREFETCHWT1();
571 }
Michael Liaoa486a112013-03-28 23:41:26 +0000572 bool hasRDSEED() const { return HasRDSEED; }
Hans Wennborg5000ce82015-12-04 23:00:33 +0000573 bool hasLAHFSAHF() const { return HasLAHFSAHF; }
Ashutosh Nema348af9c2016-05-18 11:59:12 +0000574 bool hasMWAITX() const { return HasMWAITX; }
Craig Topper50f3d142017-02-09 04:27:34 +0000575 bool hasCLZERO() const { return HasCLZERO; }
Ekaterina Romanovad5fa5542013-11-21 23:21:26 +0000576 bool isSHLDSlow() const { return IsSHLDSlow; }
Zvi Rackover8bc7e4d2016-12-06 19:35:20 +0000577 bool isPMULLDSlow() const { return IsPMULLDSlow; }
Sanjay Patel30145672015-09-01 20:51:51 +0000578 bool isUnalignedMem16Slow() const { return IsUAMem16Slow; }
Sanjay Patel501890e2014-11-21 17:40:04 +0000579 bool isUnalignedMem32Slow() const { return IsUAMem32Slow; }
Mohammed Agabariae9aebf22017-09-13 09:00:27 +0000580 int getGatherOverhead() const { return GatherOverhead; }
581 int getScatterOverhead() const { return ScatterOverhead; }
Sanjay Patelffd039b2015-02-03 17:13:04 +0000582 bool hasSSEUnalignedMem() const { return HasSSEUnalignedMem; }
Eli Friedman5e570422011-08-26 21:21:21 +0000583 bool hasCmpxchg16b() const { return HasCmpxchg16b; }
Evan Cheng1b81fdd2012-02-07 22:50:41 +0000584 bool useLeaForSP() const { return UseLeaForSP; }
Marina Yatsina77a21db2018-01-22 10:07:01 +0000585 bool hasPOPCNTFalseDeps() const { return HasPOPCNTFalseDeps; }
586 bool hasLZCNTFalseDeps() const { return HasLZCNTFalseDeps; }
Simon Pilgrimfd5df632017-12-19 13:16:43 +0000587 bool hasFastVariableShuffle() const {
588 return HasFastVariableShuffle;
589 }
Amjad Aboud4f977512017-03-03 09:03:24 +0000590 bool hasFastPartialYMMorZMMWrite() const {
591 return HasFastPartialYMMorZMMWrite;
592 }
Craig Topperea37e202017-11-25 18:09:37 +0000593 bool hasFastGather() const { return HasFastGather; }
Nikolai Bozhenovf6795302016-08-04 12:47:28 +0000594 bool hasFastScalarFSQRT() const { return HasFastScalarFSQRT; }
595 bool hasFastVectorFSQRT() const { return HasFastVectorFSQRT; }
Pierre Gousseaub6d652a2016-10-14 16:41:38 +0000596 bool hasFastLZCNT() const { return HasFastLZCNT; }
Craig Topperd88389a2017-02-21 06:39:13 +0000597 bool hasFastSHLDRotate() const { return HasFastSHLDRotate; }
Craig Topper641e2af2017-08-30 04:34:48 +0000598 bool hasMacroFusion() const { return HasMacroFusion; }
Clement Courbet203fc172017-04-21 09:20:50 +0000599 bool hasERMSB() const { return HasERMSB; }
Alexey Volkovfd1731d2014-11-21 11:19:34 +0000600 bool hasSlowDivide32() const { return HasSlowDivide32; }
601 bool hasSlowDivide64() const { return HasSlowDivide64; }
Preston Gurda01daac2013-01-08 18:27:24 +0000602 bool padShortFunctions() const { return PadShortFunctions; }
Craig Topper62c47a22017-08-29 05:14:27 +0000603 bool slowTwoMemOps() const { return SlowTwoMemOps; }
Preston Gurd8b7ab4b2013-04-25 20:29:37 +0000604 bool LEAusesAG() const { return LEAUsesAG; }
Alexey Volkov6226de62014-05-20 08:55:50 +0000605 bool slowLEA() const { return SlowLEA; }
Lama Saba2ea271b2017-05-18 08:11:50 +0000606 bool slow3OpsLEA() const { return Slow3OpsLEA; }
Alexey Volkov5260dba2014-06-09 11:40:41 +0000607 bool slowIncDec() const { return SlowIncDec; }
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000608 bool hasCDI() const { return HasCDI; }
Oren Ben Simhon7bf27f02017-05-25 13:45:23 +0000609 bool hasVPOPCNTDQ() const { return HasVPOPCNTDQ; }
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000610 bool hasPFI() const { return HasPFI; }
611 bool hasERI() const { return HasERI; }
Robert Khasanovbfa01312014-07-21 14:54:21 +0000612 bool hasDQI() const { return HasDQI; }
613 bool hasBWI() const { return HasBWI; }
614 bool hasVLX() const { return HasVLX; }
Asaf Badouh5acf66f2015-12-15 13:35:29 +0000615 bool hasPKU() const { return HasPKU; }
Coby Tayree3880f2a2017-11-21 10:04:28 +0000616 bool hasVNNI() const { return HasVNNI; }
Coby Tayree5c7fe5d2017-11-21 10:32:42 +0000617 bool hasBITALG() const { return HasBITALG; }
Elena Demikhovskyf7e641c2015-06-03 10:30:57 +0000618 bool hasMPX() const { return HasMPX; }
Oren Ben Simhonfa582b02017-11-26 13:02:45 +0000619 bool hasSHSTK() const { return HasSHSTK; }
620 bool hasIBT() const { return HasIBT; }
Craig Topper3fd463a2017-02-08 05:45:46 +0000621 bool hasCLFLUSHOPT() const { return HasCLFLUSHOPT; }
Craig Topper559f61e2017-08-29 23:13:36 +0000622 bool hasCLWB() const { return HasCLWB; }
Craig Topper84b26b92018-01-18 23:52:31 +0000623 bool hasRDPID() const { return HasRDPID; }
Chandler Carruthc58f2162018-01-22 22:05:25 +0000624 bool useRetpoline() const { return UseRetpoline; }
625 bool useRetpolineExternalThunk() const { return UseRetpolineExternalThunk; }
Evan Cheng4c91aa32009-01-02 05:35:45 +0000626
Craig Topper0d797a32018-01-20 00:26:08 +0000627 unsigned getPreferVectorWidth() const { return PreferVectorWidth; }
Craig Topper24d3b282018-02-11 08:06:27 +0000628 unsigned getRequiredVectorWidth() const { return RequiredVectorWidth; }
Craig Topper0d797a32018-01-20 00:26:08 +0000629
Craig Topper08bd1482018-01-20 00:26:12 +0000630 // Helper functions to determine when we should allow widening to 512-bit
631 // during codegen.
632 // TODO: Currently we're always allowing widening on CPUs without VLX,
633 // because for many cases we don't have a better option.
634 bool canExtendTo512DQ() const {
635 return hasAVX512() && (!hasVLX() || getPreferVectorWidth() >= 512);
636 }
637 bool canExtendTo512BW() const {
638 return hasBWI() && canExtendTo512DQ();
639 }
640
Craig Topper24d3b282018-02-11 08:06:27 +0000641 // If there are no 512-bit vectors and we prefer not to use 512-bit registers,
642 // disable them in the legalizer.
643 bool useAVX512Regs() const {
644 return hasAVX512() && (canExtendTo512DQ() || RequiredVectorWidth > 256);
645 }
646
647 bool useBWIRegs() const {
648 return hasBWI() && useAVX512Regs();
649 }
650
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000651 bool isXRaySupported() const override { return is64Bit(); }
Dean Michael Berris464015442016-09-19 00:54:35 +0000652
Mohammed Agabariae9aebf22017-09-13 09:00:27 +0000653 X86ProcFamilyEnum getProcFamily() const { return X86ProcFamily; }
654
655 /// TODO: to be removed later and replaced with suitable properties
Andrew Trick8523b162012-02-01 23:20:51 +0000656 bool isAtom() const { return X86ProcFamily == IntelAtom; }
Alexey Volkov6226de62014-05-20 08:55:50 +0000657 bool isSLM() const { return X86ProcFamily == IntelSLM; }
Eric Christopher824f42f2015-05-12 01:26:05 +0000658 bool useSoftFloat() const { return UseSoftFloat; }
Andrew Trick8523b162012-02-01 23:20:51 +0000659
Sanjay Patele9bf9932016-02-13 17:26:29 +0000660 /// Use mfence if we have SSE2 or we're on x86-64 (even if we asked for
661 /// no-sse2). There isn't any reason to disable it if the target processor
662 /// supports it.
663 bool hasMFence() const { return hasSSE2() || is64Bit(); }
664
Daniel Dunbar44b53032011-04-19 21:01:47 +0000665 const Triple &getTargetTriple() const { return TargetTriple; }
666
Daniel Dunbar2b9b0e32011-04-19 21:14:45 +0000667 bool isTargetDarwin() const { return TargetTriple.isOSDarwin(); }
Simon Pilgrima2794102014-11-22 19:12:10 +0000668 bool isTargetFreeBSD() const { return TargetTriple.isOSFreeBSD(); }
Rafael Espindola44eae722014-12-29 15:47:28 +0000669 bool isTargetDragonFly() const { return TargetTriple.isOSDragonFly(); }
Simon Pilgrima2794102014-11-22 19:12:10 +0000670 bool isTargetSolaris() const { return TargetTriple.isOSSolaris(); }
Paul Robinson78a69532016-11-30 23:14:27 +0000671 bool isTargetPS4() const { return TargetTriple.isPS4CPU(); }
Tim Northover9653eb52013-12-10 16:57:43 +0000672
673 bool isTargetELF() const { return TargetTriple.isOSBinFormatELF(); }
674 bool isTargetCOFF() const { return TargetTriple.isOSBinFormatCOFF(); }
Eric Christopher21895152014-12-05 00:22:38 +0000675 bool isTargetMachO() const { return TargetTriple.isOSBinFormatMachO(); }
Tim Northover9653eb52013-12-10 16:57:43 +0000676
Cameron Esfahani943908b2013-08-29 20:23:14 +0000677 bool isTargetLinux() const { return TargetTriple.isOSLinux(); }
Marcin Koscielnicki0275fac2016-05-05 11:35:51 +0000678 bool isTargetKFreeBSD() const { return TargetTriple.isOSKFreeBSD(); }
679 bool isTargetGlibc() const { return TargetTriple.isOSGlibc(); }
Evgeniy Stepanov5fe279e2015-10-08 21:21:24 +0000680 bool isTargetAndroid() const { return TargetTriple.isAndroid(); }
Cameron Esfahani943908b2013-08-29 20:23:14 +0000681 bool isTargetNaCl() const { return TargetTriple.isOSNaCl(); }
Nick Lewycky73df7e32011-09-05 21:51:43 +0000682 bool isTargetNaCl32() const { return isTargetNaCl() && !is64Bit(); }
683 bool isTargetNaCl64() const { return isTargetNaCl() && is64Bit(); }
Michael Kupersteine1194bd2015-10-27 07:23:59 +0000684 bool isTargetMCU() const { return TargetTriple.isOSIAMCU(); }
Petr Hoseka7d59162017-02-24 03:10:10 +0000685 bool isTargetFuchsia() const { return TargetTriple.isOSFuchsia(); }
Yaron Keren28954962014-04-02 04:27:51 +0000686
687 bool isTargetWindowsMSVC() const {
688 return TargetTriple.isWindowsMSVCEnvironment();
689 }
690
Yaron Keren136fe7d2014-04-01 18:15:34 +0000691 bool isTargetKnownWindowsMSVC() const {
NAKAMURA Takumi09717bd2014-03-30 04:35:00 +0000692 return TargetTriple.isKnownWindowsMSVCEnvironment();
Saleem Abdulrasooledbdd2e2014-03-27 22:50:05 +0000693 }
Yaron Keren28954962014-04-02 04:27:51 +0000694
Pat Gavlinb3990952015-08-14 22:41:43 +0000695 bool isTargetWindowsCoreCLR() const {
696 return TargetTriple.isWindowsCoreCLREnvironment();
697 }
698
Yaron Keren28954962014-04-02 04:27:51 +0000699 bool isTargetWindowsCygwin() const {
Saleem Abdulrasooledbdd2e2014-03-27 22:50:05 +0000700 return TargetTriple.isWindowsCygwinEnvironment();
701 }
Yaron Keren28954962014-04-02 04:27:51 +0000702
703 bool isTargetWindowsGNU() const {
704 return TargetTriple.isWindowsGNUEnvironment();
705 }
706
Saleem Abdulrasool2f3b3f32014-11-20 18:01:26 +0000707 bool isTargetWindowsItanium() const {
708 return TargetTriple.isWindowsItaniumEnvironment();
709 }
710
Chandler Carruthebd90c52012-02-05 08:26:40 +0000711 bool isTargetCygMing() const { return TargetTriple.isOSCygMing(); }
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +0000712
Yaron Keren79bb2662013-10-23 23:37:01 +0000713 bool isOSWindows() const { return TargetTriple.isOSWindows(); }
714
Reid Kleckner9cdd4df2017-10-11 21:24:33 +0000715 bool isTargetWin64() const { return In64BitMode && isOSWindows(); }
Evan Chengd22a4a12011-02-01 01:14:13 +0000716
Reid Kleckner9cdd4df2017-10-11 21:24:33 +0000717 bool isTargetWin32() const { return !In64BitMode && isOSWindows(); }
Anton Korobeynikova5a64552010-09-02 23:03:46 +0000718
Duncan Sands595a4422008-11-28 09:29:37 +0000719 bool isPICStyleGOT() const { return PICStyle == PICStyles::GOT; }
Duncan Sands595a4422008-11-28 09:29:37 +0000720 bool isPICStyleRIPRel() const { return PICStyle == PICStyles::RIPRel; }
Chris Lattnere2f524f2009-07-10 20:47:30 +0000721
Chris Lattner21c29402009-07-10 21:00:45 +0000722 bool isPICStyleStubPIC() const {
Chris Lattnerba4d7332009-07-10 20:58:47 +0000723 return PICStyle == PICStyles::StubPIC;
724 }
725
Rafael Espindolaf9e348b2016-06-27 21:33:08 +0000726 bool isPositionIndependent() const { return TM.isPositionIndependent(); }
Davide Italianoef5d8be2016-06-18 00:03:20 +0000727
Charles Davise8f297c2013-07-12 06:02:35 +0000728 bool isCallingConvWin64(CallingConv::ID CC) const {
Reid Kleckner4f21df22015-07-08 21:03:47 +0000729 switch (CC) {
730 // On Win64, all these conventions just use the default convention.
731 case CallingConv::C:
732 case CallingConv::Fast:
Saleem Abdulrasoolaff96d92017-09-20 21:00:40 +0000733 case CallingConv::Swift:
Reid Kleckner4f21df22015-07-08 21:03:47 +0000734 case CallingConv::X86_FastCall:
735 case CallingConv::X86_StdCall:
736 case CallingConv::X86_ThisCall:
737 case CallingConv::X86_VectorCall:
738 case CallingConv::Intel_OCL_BI:
739 return isTargetWin64();
740 // This convention allows using the Win64 convention on other targets.
Martin Storsjo2f24e932017-07-17 20:05:19 +0000741 case CallingConv::Win64:
Reid Kleckner4f21df22015-07-08 21:03:47 +0000742 return true;
743 // This convention allows using the SysV convention on Windows targets.
744 case CallingConv::X86_64_SysV:
745 return false;
746 // Otherwise, who knows what this is.
747 default:
748 return false;
749 }
Charles Davise8f297c2013-07-12 06:02:35 +0000750 }
Mikhail Glushenkovabd56bd2010-02-28 22:54:30 +0000751
Rafael Espindolacb2d2662016-05-19 18:34:20 +0000752 /// Classify a global variable reference for the current subtarget according
753 /// to how we should reference it in a non-pcrel context.
Rafael Espindolac7e98132016-05-20 12:20:10 +0000754 unsigned char classifyLocalReference(const GlobalValue *GV) const;
755
756 unsigned char classifyGlobalReference(const GlobalValue *GV,
757 const Module &M) const;
Rafael Espindolaab03eb02016-05-19 22:07:57 +0000758 unsigned char classifyGlobalReference(const GlobalValue *GV) const;
Anton Korobeynikov93acb492006-12-20 01:03:20 +0000759
Rafael Espindolacb2d2662016-05-19 18:34:20 +0000760 /// Classify a global function reference for the current subtarget.
Rafael Espindolac7e98132016-05-20 12:20:10 +0000761 unsigned char classifyGlobalFunctionReference(const GlobalValue *GV,
762 const Module &M) const;
Rafael Espindola46107b92016-05-19 18:49:29 +0000763 unsigned char classifyGlobalFunctionReference(const GlobalValue *GV) const;
Asaf Badouh89406d12016-04-20 08:32:57 +0000764
Sanjay Patele63abfe2015-02-03 18:47:32 +0000765 /// Classify a blockaddress reference for the current subtarget according to
766 /// how we should reference it in a non-pcrel context.
Rafael Espindolacb2d2662016-05-19 18:34:20 +0000767 unsigned char classifyBlockAddressReference() const;
Dan Gohman7a6611792009-11-20 23:18:13 +0000768
Sanjay Patele63abfe2015-02-03 18:47:32 +0000769 /// Return true if the subtarget allows calls to immediate address.
Rafael Espindola46107b92016-05-19 18:49:29 +0000770 bool isLegalToCallImmediateAddr() const;
Evan Cheng96098332009-05-20 04:53:57 +0000771
Chandler Carruthc58f2162018-01-22 22:05:25 +0000772 /// If we are using retpolines, we need to expand indirectbr to avoid it
773 /// lowering to an actual indirect jump.
774 bool enableIndirectBrExpand() const override { return useRetpoline(); }
775
Andrew Tricke97d8d62013-10-15 23:33:07 +0000776 /// Enable the MachineScheduler pass for all X86 subtargets.
Craig Topper73156022014-03-02 09:09:27 +0000777 bool enableMachineScheduler() const override { return true; }
Andrew Tricke97d8d62013-10-15 23:33:07 +0000778
Andrew V. Tischenko75745d02017-04-14 07:44:23 +0000779 // TODO: Update the regression tests and return true.
780 bool supportPrintSchedInfo() const override { return false; }
781
Eric Christopher6b0fcfe2014-05-21 23:40:26 +0000782 bool enableEarlyIfConversion() const override;
783
Sanjay Patele63abfe2015-02-03 18:47:32 +0000784 /// Return the instruction itineraries based on the subtarget selection.
Eric Christopherd9134482014-08-04 21:25:23 +0000785 const InstrItineraryData *getInstrItineraryData() const override {
786 return &InstrItins;
787 }
Sanjay Patela2f658d2014-07-15 22:39:58 +0000788
789 AntiDepBreakMode getAntiDepBreakMode() const override {
790 return TargetSubtargetInfo::ANTIDEP_CRITICAL;
791 }
Marina Yatsinaf9371d82017-10-22 17:59:38 +0000792
Benjamin Kramera7c822a2017-10-22 19:16:31 +0000793 bool enableAdvancedRASplitCost() const override { return true; }
Evan Cheng47455a72009-09-03 04:37:05 +0000794};
Evan Chenga8b4aea2006-10-16 21:00:37 +0000795
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000796} // end namespace llvm
Nate Begemanf26625e2005-07-12 01:41:54 +0000797
Eugene Zelenkofbd13c52017-02-02 22:55:55 +0000798#endif // LLVM_LIB_TARGET_X86_X86SUBTARGET_H