blob: f930806be6c7376e25a06cd683892f0906088d1b [file] [log] [blame]
Nate Begeman8c00f8c2005-08-04 07:12:09 +00001//=====---- X86Subtarget.h - Define Subtarget for the X86 -----*- C++ -*--====//
Nate Begemanfb5792f2005-07-12 01:41:54 +00002//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner4ee451d2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Nate Begemanfb5792f2005-07-12 01:41:54 +00007//
8//===----------------------------------------------------------------------===//
9//
Evan Cheng5b1b44892011-07-01 21:01:15 +000010// This file declares the X86 specific subclass of TargetSubtargetInfo.
Nate Begemanfb5792f2005-07-12 01:41:54 +000011//
12//===----------------------------------------------------------------------===//
13
14#ifndef X86SUBTARGET_H
15#define X86SUBTARGET_H
16
Eric Christopher62f35a22010-07-05 19:26:33 +000017#include "llvm/ADT/Triple.h"
Evan Cheng5b1b44892011-07-01 21:01:15 +000018#include "llvm/Target/TargetSubtargetInfo.h"
Dan Gohman4d3d6e12010-05-27 18:43:40 +000019#include "llvm/CallingConv.h"
Jim Laskeyb1e11802005-09-01 21:38:21 +000020#include <string>
21
Evan Cheng94214702011-07-01 20:45:01 +000022#define GET_SUBTARGETINFO_HEADER
Evan Cheng385e9302011-07-01 22:36:09 +000023#include "X86GenSubtargetInfo.inc"
Evan Cheng94214702011-07-01 20:45:01 +000024
Nate Begemanfb5792f2005-07-12 01:41:54 +000025namespace llvm {
Anton Korobeynikov7784ebc2006-11-30 22:42:55 +000026class GlobalValue;
Evan Cheng0ddff1b2011-07-07 07:07:08 +000027class StringRef;
Anton Korobeynikov2b2bc682006-12-22 22:29:05 +000028class TargetMachine;
Mikhail Glushenkov5d96eb82010-02-28 22:54:30 +000029
Chris Lattnere4df7562009-07-09 03:15:51 +000030/// PICStyles - The X86 backend supports a number of different styles of PIC.
Mikhail Glushenkov5d96eb82010-02-28 22:54:30 +000031///
Duncan Sandsf9a67a82008-11-28 09:29:37 +000032namespace PICStyles {
Anton Korobeynikov7f705592007-01-12 19:20:47 +000033enum Style {
Chris Lattner8097b652009-07-10 20:58:47 +000034 StubPIC, // Used on i386-darwin in -fPIC mode.
35 StubDynamicNoPIC, // Used on i386-darwin in -mdynamic-no-pic mode.
36 GOT, // Used on many 32-bit unices in -fPIC mode.
37 RIPRel, // Used on X86-64 when not in -static mode.
38 None // Set when in -static mode (not PIC or DynamicNoPIC mode).
Anton Korobeynikov7f705592007-01-12 19:20:47 +000039};
40}
Nate Begemanfb5792f2005-07-12 01:41:54 +000041
Evan Cheng94214702011-07-01 20:45:01 +000042class X86Subtarget : public X86GenSubtargetInfo {
Nate Begemanfb5792f2005-07-12 01:41:54 +000043protected:
Evan Cheng559806f2006-01-27 08:10:46 +000044 enum X86SSEEnum {
Craig Topper16de4632012-01-09 09:02:13 +000045 NoMMXSSE, MMX, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, AVX, AVX2
Evan Cheng559806f2006-01-27 08:10:46 +000046 };
47
Evan Chenga26eb5e2006-10-06 09:17:41 +000048 enum X863DNowEnum {
49 NoThreeDNow, ThreeDNow, ThreeDNowA
50 };
51
Andrew Trick922d3142012-02-01 23:20:51 +000052 enum X86ProcFamilyEnum {
53 Others, IntelAtom
54 };
55
56 /// X86ProcFamily - X86 processor family: Intel Atom, and others
57 X86ProcFamilyEnum X86ProcFamily;
58
Anton Korobeynikov7f705592007-01-12 19:20:47 +000059 /// PICStyle - Which PIC style to use
Evan Chengf6844ca2007-08-01 23:45:51 +000060 ///
Duncan Sandsf9a67a82008-11-28 09:29:37 +000061 PICStyles::Style PICStyle;
Mikhail Glushenkov5d96eb82010-02-28 22:54:30 +000062
Evan Chengadd25172008-02-12 07:59:55 +000063 /// X86SSELevel - MMX, SSE1, SSE2, SSE3, SSSE3, SSE41, SSE42, or
64 /// none supported.
Evan Cheng559806f2006-01-27 08:10:46 +000065 X86SSEEnum X86SSELevel;
66
Evan Chenga26eb5e2006-10-06 09:17:41 +000067 /// X863DNowLevel - 3DNow or 3DNow Athlon, or none supported.
Evan Chengf6844ca2007-08-01 23:45:51 +000068 ///
Evan Chenga26eb5e2006-10-06 09:17:41 +000069 X863DNowEnum X863DNowLevel;
70
Chris Lattner70084162009-09-02 05:53:04 +000071 /// HasCMov - True if this processor has conditional move instructions
72 /// (generally pentium pro+).
73 bool HasCMov;
Mikhail Glushenkov5d96eb82010-02-28 22:54:30 +000074
Evan Cheng25ab6902006-09-08 06:48:29 +000075 /// HasX86_64 - True if the processor supports X86-64 instructions.
Evan Chengf6844ca2007-08-01 23:45:51 +000076 ///
Evan Cheng25ab6902006-09-08 06:48:29 +000077 bool HasX86_64;
Evan Chengccb69762009-01-02 05:35:45 +000078
Benjamin Kramer1292c222010-12-04 20:32:23 +000079 /// HasPOPCNT - True if the processor supports POPCNT.
80 bool HasPOPCNT;
81
Stefanus Du Toit8cf5ab12009-05-26 21:04:35 +000082 /// HasSSE4A - True if the processor supports SSE4A instructions.
83 bool HasSSE4A;
84
Eric Christopher6d1cd1c2010-04-02 21:54:27 +000085 /// HasAES - Target has AES instructions
86 bool HasAES;
87
Bruno Cardoso Lopescdae7e82010-07-23 01:17:51 +000088 /// HasCLMUL - Target has carry-less multiplication
89 bool HasCLMUL;
90
David Greene343dadb2009-06-26 22:46:54 +000091 /// HasFMA3 - Target has 3-operand fused multiply-add
92 bool HasFMA3;
93
94 /// HasFMA4 - Target has 4-operand fused multiply-add
95 bool HasFMA4;
96
Jan Sjödince25d262011-12-02 15:14:37 +000097 /// HasXOP - Target has XOP instructions
98 bool HasXOP;
99
Craig Topperda394042011-10-09 07:31:39 +0000100 /// HasMOVBE - True if the processor has the MOVBE instruction.
Craig Topper581fe822011-10-03 17:28:23 +0000101 bool HasMOVBE;
102
Craig Topperda394042011-10-09 07:31:39 +0000103 /// HasRDRAND - True if the processor has the RDRAND instruction.
Craig Topper581fe822011-10-03 17:28:23 +0000104 bool HasRDRAND;
105
Craig Topperda394042011-10-09 07:31:39 +0000106 /// HasF16C - Processor has 16-bit floating point conversion instructions.
107 bool HasF16C;
108
Craig Toppere7b05502011-10-30 19:57:21 +0000109 /// HasFSGSBase - Processor has FS/GS base insturctions.
110 bool HasFSGSBase;
111
Craig Topper37f21672011-10-11 06:44:02 +0000112 /// HasLZCNT - Processor has LZCNT instruction.
113 bool HasLZCNT;
114
Craig Topper909652f2011-10-14 03:21:46 +0000115 /// HasBMI - Processor has BMI1 instructions.
116 bool HasBMI;
117
Craig Topperb53fa8b2011-10-16 07:55:05 +0000118 /// HasBMI2 - Processor has BMI2 instructions.
119 bool HasBMI2;
120
David Greene343dadb2009-06-26 22:46:54 +0000121 /// IsBTMemSlow - True if BT (bit test) of memory instructions are slow.
122 bool IsBTMemSlow;
Evan Cheng400073d2009-12-18 07:40:29 +0000123
Evan Cheng48c58bb2010-04-01 05:58:17 +0000124 /// IsUAMemFast - True if unaligned memory access is fast.
125 bool IsUAMemFast;
126
Mikhail Glushenkov5d96eb82010-02-28 22:54:30 +0000127 /// HasVectorUAMem - True if SIMD operations can have unaligned memory
Evan Cheng5528e7b2010-04-21 01:47:12 +0000128 /// operands. This may require setting a feature bit in the processor.
David Greene95eb2ee2010-01-11 16:29:42 +0000129 bool HasVectorUAMem;
130
Eli Friedman43f51ae2011-08-26 21:21:21 +0000131 /// HasCmpxchg16b - True if this processor has the CMPXCHG16B instruction;
132 /// this is true for most x86-64 chips, but not the first AMD chips.
133 bool HasCmpxchg16b;
134
Andrew Trick922d3142012-02-01 23:20:51 +0000135 /// PostRAScheduler - True if using post-register-allocation scheduler.
136 bool PostRAScheduler;
137
Chris Lattnerb151aca2005-07-12 02:36:10 +0000138 /// stackAlignment - The minimum alignment known to hold of the stack frame on
139 /// entry to the function and which must be maintained by every function.
Nate Begemanfb5792f2005-07-12 01:41:54 +0000140 unsigned stackAlignment;
Jeff Cohen9eb59ec2005-07-27 05:53:44 +0000141
Rafael Espindolafc05f402007-10-31 11:52:06 +0000142 /// Max. memset / memcpy size that is turned into rep/movs, rep/stos ops.
Evan Chengf6844ca2007-08-01 23:45:51 +0000143 ///
Rafael Espindolafc05f402007-10-31 11:52:06 +0000144 unsigned MaxInlineSizeThreshold;
NAKAMURA Takumie310b3a2011-02-17 12:23:50 +0000145
Eric Christopher62f35a22010-07-05 19:26:33 +0000146 /// TargetTriple - What processor and OS we're targeting.
147 Triple TargetTriple;
Andrew Trick922d3142012-02-01 23:20:51 +0000148
149 /// Instruction itineraries for scheduling
150 InstrItineraryData InstrItins;
Evan Cheng18a84522006-02-16 00:21:07 +0000151
Evan Cheng25ab6902006-09-08 06:48:29 +0000152private:
Evan Cheng18fb1d32011-07-07 21:06:52 +0000153 /// In64BitMode - True if compiling for 64-bit, false for 32-bit.
154 bool In64BitMode;
Evan Cheng25ab6902006-09-08 06:48:29 +0000155
Nate Begemanfb5792f2005-07-12 01:41:54 +0000156public:
Anton Korobeynikov12c49af2006-11-21 00:01:06 +0000157
Jeff Cohen9eb59ec2005-07-27 05:53:44 +0000158 /// This constructor initializes the data members to match that
Daniel Dunbar3be03402009-08-02 22:11:08 +0000159 /// of the specified triple.
Nate Begemanfb5792f2005-07-12 01:41:54 +0000160 ///
Evan Cheng276365d2011-06-30 01:53:36 +0000161 X86Subtarget(const std::string &TT, const std::string &CPU,
Evan Cheng18fb1d32011-07-07 21:06:52 +0000162 const std::string &FS,
Evan Cheng4d1a8dd2011-07-08 22:30:25 +0000163 unsigned StackAlignOverride, bool is64Bit);
Chris Lattnerb151aca2005-07-12 02:36:10 +0000164
165 /// getStackAlignment - Returns the minimum alignment known to hold of the
166 /// stack frame on entry to the function and which must be maintained by every
167 /// function for this subtarget.
Nate Begemanfb5792f2005-07-12 01:41:54 +0000168 unsigned getStackAlignment() const { return stackAlignment; }
Jeff Cohen9eb59ec2005-07-27 05:53:44 +0000169
Rafael Espindolafc05f402007-10-31 11:52:06 +0000170 /// getMaxInlineSizeThreshold - Returns the maximum memset / memcpy size
171 /// that still makes it profitable to inline the call.
172 unsigned getMaxInlineSizeThreshold() const { return MaxInlineSizeThreshold; }
Anton Korobeynikov12c49af2006-11-21 00:01:06 +0000173
174 /// ParseSubtargetFeatures - Parses features string setting specified
Evan Chenga26eb5e2006-10-06 09:17:41 +0000175 /// subtarget options. Definition of function is auto generated by tblgen.
Evan Cheng0ddff1b2011-07-07 07:07:08 +0000176 void ParseSubtargetFeatures(StringRef CPU, StringRef FS);
Evan Chenga26eb5e2006-10-06 09:17:41 +0000177
178 /// AutoDetectSubtargetFeatures - Auto-detect CPU features using CPUID
179 /// instruction.
180 void AutoDetectSubtargetFeatures();
Evan Cheng97c7fc32006-01-26 09:53:06 +0000181
Evan Cheng18fb1d32011-07-07 21:06:52 +0000182 bool is64Bit() const { return In64BitMode; }
Evan Cheng97c7fc32006-01-26 09:53:06 +0000183
Duncan Sandsf9a67a82008-11-28 09:29:37 +0000184 PICStyles::Style getPICStyle() const { return PICStyle; }
185 void setPICStyle(PICStyles::Style Style) { PICStyle = Style; }
Anton Korobeynikov7f705592007-01-12 19:20:47 +0000186
Chris Lattner314a1132010-03-14 18:31:44 +0000187 bool hasCMov() const { return HasCMov; }
Evan Cheng559806f2006-01-27 08:10:46 +0000188 bool hasMMX() const { return X86SSELevel >= MMX; }
Craig Topperc6d59952012-01-10 06:30:56 +0000189 bool hasSSE1() const { return X86SSELevel >= SSE1; }
190 bool hasSSE2() const { return X86SSELevel >= SSE2; }
191 bool hasSSE3() const { return X86SSELevel >= SSE3; }
192 bool hasSSSE3() const { return X86SSELevel >= SSSE3; }
193 bool hasSSE41() const { return X86SSELevel >= SSE41; }
194 bool hasSSE42() const { return X86SSELevel >= SSE42; }
Craig Topper1accb7e2012-01-10 06:54:16 +0000195 bool hasAVX() const { return X86SSELevel >= AVX; }
196 bool hasAVX2() const { return X86SSELevel >= AVX2; }
Stefanus Du Toit8cf5ab12009-05-26 21:04:35 +0000197 bool hasSSE4A() const { return HasSSE4A; }
Evan Chenga26eb5e2006-10-06 09:17:41 +0000198 bool has3DNow() const { return X863DNowLevel >= ThreeDNow; }
199 bool has3DNowA() const { return X863DNowLevel >= ThreeDNowA; }
Benjamin Kramer1292c222010-12-04 20:32:23 +0000200 bool hasPOPCNT() const { return HasPOPCNT; }
Eric Christopher6d1cd1c2010-04-02 21:54:27 +0000201 bool hasAES() const { return HasAES; }
Bruno Cardoso Lopescdae7e82010-07-23 01:17:51 +0000202 bool hasCLMUL() const { return HasCLMUL; }
David Greene343dadb2009-06-26 22:46:54 +0000203 bool hasFMA3() const { return HasFMA3; }
204 bool hasFMA4() const { return HasFMA4; }
Jan Sjödince25d262011-12-02 15:14:37 +0000205 bool hasXOP() const { return HasXOP; }
Craig Topper581fe822011-10-03 17:28:23 +0000206 bool hasMOVBE() const { return HasMOVBE; }
207 bool hasRDRAND() const { return HasRDRAND; }
Craig Topperda394042011-10-09 07:31:39 +0000208 bool hasF16C() const { return HasF16C; }
Craig Toppere7b05502011-10-30 19:57:21 +0000209 bool hasFSGSBase() const { return HasFSGSBase; }
Craig Topper37f21672011-10-11 06:44:02 +0000210 bool hasLZCNT() const { return HasLZCNT; }
Craig Topper909652f2011-10-14 03:21:46 +0000211 bool hasBMI() const { return HasBMI; }
Craig Topperb53fa8b2011-10-16 07:55:05 +0000212 bool hasBMI2() const { return HasBMI2; }
Evan Chengccb69762009-01-02 05:35:45 +0000213 bool isBTMemSlow() const { return IsBTMemSlow; }
Evan Cheng48c58bb2010-04-01 05:58:17 +0000214 bool isUnalignedMemAccessFast() const { return IsUAMemFast; }
David Greene95eb2ee2010-01-11 16:29:42 +0000215 bool hasVectorUAMem() const { return HasVectorUAMem; }
Eli Friedman43f51ae2011-08-26 21:21:21 +0000216 bool hasCmpxchg16b() const { return HasCmpxchg16b; }
Evan Chengccb69762009-01-02 05:35:45 +0000217
Andrew Trick922d3142012-02-01 23:20:51 +0000218 bool isAtom() const { return X86ProcFamily == IntelAtom; }
219
Daniel Dunbar24cfd062011-04-19 21:01:47 +0000220 const Triple &getTargetTriple() const { return TargetTriple; }
221
Daniel Dunbar912225e2011-04-19 21:14:45 +0000222 bool isTargetDarwin() const { return TargetTriple.isOSDarwin(); }
223 bool isTargetFreeBSD() const {
224 return TargetTriple.getOS() == Triple::FreeBSD;
225 }
226 bool isTargetSolaris() const {
227 return TargetTriple.getOS() == Triple::Solaris;
228 }
NAKAMURA Takumie310b3a2011-02-17 12:23:50 +0000229
Eric Christopher62f35a22010-07-05 19:26:33 +0000230 // ELF is a reasonably sane default and the only other X86 targets we
231 // support are Darwin and Windows. Just use "not those".
Chandler Carruth69f44692012-02-05 08:26:40 +0000232 bool isTargetELF() const { return TargetTriple.isOSBinFormatELF(); }
Eric Christopher62f35a22010-07-05 19:26:33 +0000233 bool isTargetLinux() const { return TargetTriple.getOS() == Triple::Linux; }
Nick Lewycky1fac6b52011-09-05 21:51:43 +0000234 bool isTargetNaCl() const {
235 return TargetTriple.getOS() == Triple::NativeClient;
236 }
237 bool isTargetNaCl32() const { return isTargetNaCl() && !is64Bit(); }
238 bool isTargetNaCl64() const { return isTargetNaCl() && is64Bit(); }
Eric Christopher62f35a22010-07-05 19:26:33 +0000239 bool isTargetWindows() const { return TargetTriple.getOS() == Triple::Win32; }
NAKAMURA Takumi6904f052011-02-17 12:24:17 +0000240 bool isTargetMingw() const { return TargetTriple.getOS() == Triple::MinGW32; }
Eric Christopher62f35a22010-07-05 19:26:33 +0000241 bool isTargetCygwin() const { return TargetTriple.getOS() == Triple::Cygwin; }
Chandler Carruth69f44692012-02-05 08:26:40 +0000242 bool isTargetCygMing() const { return TargetTriple.isOSCygMing(); }
243 bool isTargetCOFF() const { return TargetTriple.isOSBinFormatCOFF(); }
244 bool isTargetEnvMacho() const { return TargetTriple.isEnvironmentMachO(); }
Mikhail Glushenkov5d96eb82010-02-28 22:54:30 +0000245
Anton Korobeynikov1a979d92008-03-22 20:57:27 +0000246 bool isTargetWin64() const {
NAKAMURA Takumie3345c42011-07-20 04:02:20 +0000247 // FIXME: x86_64-cygwin has not been released yet.
Chandler Carruth69f44692012-02-05 08:26:40 +0000248 return In64BitMode && TargetTriple.isOSWindows();
Evan Cheng2bffee22011-02-01 01:14:13 +0000249 }
250
Anton Korobeynikovace53f22010-09-02 23:03:46 +0000251 bool isTargetWin32() const {
Chandler Carruth69f44692012-02-05 08:26:40 +0000252 // FIXME: Cygwin is included for isTargetWin64 -- should it be included
253 // here too?
Evan Cheng18fb1d32011-07-07 21:06:52 +0000254 return !In64BitMode && (isTargetMingw() || isTargetWindows());
Anton Korobeynikovace53f22010-09-02 23:03:46 +0000255 }
256
Duncan Sandsf9a67a82008-11-28 09:29:37 +0000257 bool isPICStyleSet() const { return PICStyle != PICStyles::None; }
258 bool isPICStyleGOT() const { return PICStyle == PICStyles::GOT; }
Duncan Sandsf9a67a82008-11-28 09:29:37 +0000259 bool isPICStyleRIPRel() const { return PICStyle == PICStyles::RIPRel; }
Chris Lattner3b67e9b2009-07-10 20:47:30 +0000260
Chris Lattnere2c92082009-07-10 21:00:45 +0000261 bool isPICStyleStubPIC() const {
Chris Lattner8097b652009-07-10 20:58:47 +0000262 return PICStyle == PICStyles::StubPIC;
263 }
264
Chris Lattnere2c92082009-07-10 21:00:45 +0000265 bool isPICStyleStubNoDynamic() const {
Chris Lattner8097b652009-07-10 20:58:47 +0000266 return PICStyle == PICStyles::StubDynamicNoPIC;
267 }
268 bool isPICStyleStubAny() const {
269 return PICStyle == PICStyles::StubDynamicNoPIC ||
270 PICStyle == PICStyles::StubPIC; }
Mikhail Glushenkov5d96eb82010-02-28 22:54:30 +0000271
Chris Lattnerd392bd92009-07-10 07:20:05 +0000272 /// ClassifyGlobalReference - Classify a global variable reference for the
273 /// current subtarget according to how we should reference it in a non-pcrel
274 /// context.
275 unsigned char ClassifyGlobalReference(const GlobalValue *GV,
276 const TargetMachine &TM)const;
Anton Korobeynikov15fccf12006-12-20 01:03:20 +0000277
Dan Gohman29cbade2009-11-20 23:18:13 +0000278 /// ClassifyBlockAddressReference - Classify a blockaddress reference for the
279 /// current subtarget according to how we should reference it in a non-pcrel
280 /// context.
281 unsigned char ClassifyBlockAddressReference() const;
282
Evan Chengd7f666a2009-05-20 04:53:57 +0000283 /// IsLegalToCallImmediateAddr - Return true if the subtarget allows calls
284 /// to immediate address.
285 bool IsLegalToCallImmediateAddr(const TargetMachine &TM) const;
286
Dan Gohman68d599d2008-04-01 20:38:36 +0000287 /// This function returns the name of a function which has an interface
288 /// like the non-standard bzero function, if such a function exists on
289 /// the current subtarget and it is considered prefereable over
290 /// memset with zero passed as the second argument. Otherwise it
291 /// returns null.
Bill Wendling6e087382008-09-30 22:05:33 +0000292 const char *getBZeroEntry() const;
Dan Gohman8749b612008-12-16 03:35:01 +0000293
294 /// getSpecialAddressLatency - For targets where it is beneficial to
295 /// backschedule instructions that compute addresses, return a value
296 /// indicating the number of scheduling cycles of backscheduling that
297 /// should be attempted.
298 unsigned getSpecialAddressLatency() const;
Andrew Trick922d3142012-02-01 23:20:51 +0000299
300 /// enablePostRAScheduler - run for Atom optimization.
301 bool enablePostRAScheduler(CodeGenOpt::Level OptLevel,
302 TargetSubtargetInfo::AntiDepBreakMode& Mode,
303 RegClassVector& CriticalPathRCs) const;
304
305 /// getInstrItins = Return the instruction itineraries based on the
306 /// subtarget selection.
307 const InstrItineraryData &getInstrItineraryData() const { return InstrItins; }
Evan Chengd0da6ff2009-09-03 04:37:05 +0000308};
Evan Cheng751c0e12006-10-16 21:00:37 +0000309
Nate Begemanfb5792f2005-07-12 01:41:54 +0000310} // End llvm namespace
311
312#endif