blob: 573d4413717f42c52163deaeaecc4417ce5120fe [file] [log] [blame]
Jia Liub22310f2012-02-18 12:03:15 +00001//===-- X86.td - Target definition file for the Intel X86 --*- tablegen -*-===//
Michael J. Spencerb88784c2011-04-14 14:33:36 +00002//
John Criswell29265fe2003-10-21 15:17:13 +00003// The LLVM Compiler Infrastructure
4//
Chris Lattnerf3ebc3f2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Michael J. Spencerb88784c2011-04-14 14:33:36 +00007//
John Criswell29265fe2003-10-21 15:17:13 +00008//===----------------------------------------------------------------------===//
Chris Lattner5da8e802003-08-03 15:47:49 +00009//
Craig Topper271064e2011-10-11 06:44:02 +000010// This is a target description file for the Intel i386 architecture, referred
11// to here as the "X86" architecture.
Chris Lattner5da8e802003-08-03 15:47:49 +000012//
13//===----------------------------------------------------------------------===//
14
Chris Lattner25510802003-08-04 04:59:56 +000015// Get the target-independent interfaces which we are implementing...
Chris Lattner5da8e802003-08-03 15:47:49 +000016//
Evan Cheng977e7be2008-11-24 07:34:46 +000017include "llvm/Target/Target.td"
Chris Lattner5da8e802003-08-03 15:47:49 +000018
19//===----------------------------------------------------------------------===//
Anitha Boyapati426feb62012-08-16 03:50:04 +000020// X86 Subtarget state
Evan Cheng13bcc6c2011-07-07 21:06:52 +000021//
22
// Operating-mode features. Each one sets the like-named In*BitMode subtarget
// attribute to "true".
def Mode64Bit : SubtargetFeature<
    "64bit-mode", "In64BitMode", "true",
    "64-bit mode (x86_64)">;
def Mode32Bit : SubtargetFeature<
    "32bit-mode", "In32BitMode", "true",
    "32-bit mode (80386)">;
def Mode16Bit : SubtargetFeature<
    "16bit-mode", "In16BitMode", "true",
    "16-bit mode (i8086)">;
Evan Cheng13bcc6c2011-07-07 21:06:52 +000029
30//===----------------------------------------------------------------------===//
Anitha Boyapati426feb62012-08-16 03:50:04 +000031// X86 Subtarget features
Bill Wendlinge6182262007-05-04 20:38:40 +000032//===----------------------------------------------------------------------===//
Chris Lattnercc8c5812009-09-02 05:53:04 +000033
// Basic ISA-extension features. None of these implies any other feature.
def FeatureX87 : SubtargetFeature<
    "x87", "HasX87", "true",
    "Enable X87 float instructions">;

def FeatureCMOV : SubtargetFeature<
    "cmov", "HasCMov", "true",
    "Enable conditional move instructions">;

def FeaturePOPCNT : SubtargetFeature<
    "popcnt", "HasPOPCNT", "true",
    "Support POPCNT instruction">;

def FeatureFXSR : SubtargetFeature<
    "fxsr", "HasFXSR", "true",
    "Support fxsave/fxrestore instructions">;

// The XSAVE family: one independent feature per instruction variant.
def FeatureXSAVE : SubtargetFeature<
    "xsave", "HasXSAVE", "true",
    "Support xsave instructions">;

def FeatureXSAVEOPT : SubtargetFeature<
    "xsaveopt", "HasXSAVEOPT", "true",
    "Support xsaveopt instructions">;

def FeatureXSAVEC : SubtargetFeature<
    "xsavec", "HasXSAVEC", "true",
    "Support xsavec instructions">;

def FeatureXSAVES : SubtargetFeature<
    "xsaves", "HasXSAVES", "true",
    "Support xsaves instructions">;
57
// The SSE levels form a chain: every level writes X86SSELevel and implies the
// level directly below it.
//
// SSE1 additionally implies CMOV: SSE codegen depends on cmovs, and all SSE1+
// processors support them.
def FeatureSSE1 : SubtargetFeature<
    "sse", "X86SSELevel", "SSE1",
    "Enable SSE instructions",
    [FeatureCMOV]>;
def FeatureSSE2 : SubtargetFeature<
    "sse2", "X86SSELevel", "SSE2",
    "Enable SSE2 instructions",
    [FeatureSSE1]>;
def FeatureSSE3 : SubtargetFeature<
    "sse3", "X86SSELevel", "SSE3",
    "Enable SSE3 instructions",
    [FeatureSSE2]>;
def FeatureSSSE3 : SubtargetFeature<
    "ssse3", "X86SSELevel", "SSSE3",
    "Enable SSSE3 instructions",
    [FeatureSSE3]>;
def FeatureSSE41 : SubtargetFeature<
    "sse4.1", "X86SSELevel", "SSE41",
    "Enable SSE 4.1 instructions",
    [FeatureSSSE3]>;
def FeatureSSE42 : SubtargetFeature<
    "sse4.2", "X86SSELevel", "SSE42",
    "Enable SSE 4.2 instructions",
    [FeatureSSE41]>;
// MMX is kept apart from the SSE feature chain: for odd compatibility reasons
// it must be possible to switch MMX off explicitly while SSE+ stays on.
// MMX, 3DNow! and 3DNow! Athlon all write X863DNowLevel and chain upwards.
def FeatureMMX : SubtargetFeature<
    "mmx", "X863DNowLevel", "MMX",
    "Enable MMX instructions">;
def Feature3DNow : SubtargetFeature<
    "3dnow", "X863DNowLevel", "ThreeDNow",
    "Enable 3DNow! instructions",
    [FeatureMMX]>;
def Feature3DNowA : SubtargetFeature<
    "3dnowa", "X863DNowLevel", "ThreeDNowA",
    "Enable 3DNow! Athlon instructions",
    [Feature3DNow]>;
// Every x86-64 part has SSE2, yet SSE2 is deliberately NOT implied here: it
// has to be possible to disable SSE2 (e.g. when compiling OS kernels) without
// also disabling 64-bit mode. Only CMOV is implied.
def Feature64Bit : SubtargetFeature<
    "64bit", "HasX86_64", "true",
    "Support 64-bit instructions",
    [FeatureCMOV]>;
def FeatureCMPXCHG16B : SubtargetFeature<
    "cx16", "HasCmpxchg16b", "true",
    "64-bit with cmpxchg16b",
    [Feature64Bit]>;
// Tuning flags for instructions / access patterns that are slow on some CPUs.
def FeatureSlowSHLD : SubtargetFeature<
    "slow-shld", "IsSHLDSlow", "true",
    "SHLD instruction is slow">;
def FeatureSlowPMULLD : SubtargetFeature<
    "slow-pmulld", "IsPMULLDSlow", "true",
    "PMULLD instruction is slow">;
// FIXME: This should not apply to CPUs that do not have SSE.
def FeatureSlowUAMem16 : SubtargetFeature<
    "slow-unaligned-mem-16", "IsUAMem16Slow", "true",
    "Slow unaligned 16-byte memory access">;
def FeatureSlowUAMem32 : SubtargetFeature<
    "slow-unaligned-mem-32", "IsUAMem32Slow", "true",
    "Slow unaligned 32-byte memory access">;

// SSE4a has its own flag (it does not write X86SSELevel) and implies SSE3.
def FeatureSSE4A : SubtargetFeature<
    "sse4a", "HasSSE4A", "true",
    "Support SSE 4a instructions",
    [FeatureSSE3]>;
Evan Chengff1beda2006-10-06 09:17:41 +0000112
// AVX continues the X86SSELevel chain on top of SSE4.2; AVX2 sits on AVX.
def FeatureAVX : SubtargetFeature<"avx", "X86SSELevel", "AVX",
                                  "Enable AVX instructions",
                                  [FeatureSSE42]>;
def FeatureAVX2 : SubtargetFeature<"avx2", "X86SSELevel", "AVX2",
                                   "Enable AVX2 instructions",
                                   [FeatureAVX]>;
// FMA and F16C are independent boolean features that both require AVX.
// The help text reads "multiply-add" (the operation is a fused multiply-add;
// the previous wording "multiple-add" was a typo).
def FeatureFMA : SubtargetFeature<"fma", "HasFMA", "true",
                                  "Enable three-operand fused multiply-add",
                                  [FeatureAVX]>;
def FeatureF16C : SubtargetFeature<"f16c", "HasF16C", "true",
                       "Support 16-bit floating point conversion instructions",
                       [FeatureAVX]>;
// AVX-512 Foundation: the next X86SSELevel step; implies AVX2, FMA and F16C.
def FeatureAVX512 : SubtargetFeature<"avx512f", "X86SSELevel", "AVX512F",
                                     "Enable AVX-512 instructions",
                                     [FeatureAVX2, FeatureFMA, FeatureF16C]>;
// AVX-512 extension sets. Unless noted otherwise each one implies the
// AVX-512 Foundation feature (FeatureAVX512).
def FeatureERI : SubtargetFeature<"avx512er", "HasERI", "true",
                      "Enable AVX-512 Exponential and Reciprocal Instructions",
                      [FeatureAVX512]>;
def FeatureCDI : SubtargetFeature<"avx512cd", "HasCDI", "true",
                      "Enable AVX-512 Conflict Detection Instructions",
                      [FeatureAVX512]>;
def FeatureVPOPCNTDQ : SubtargetFeature<"avx512vpopcntdq", "HasVPOPCNTDQ",
                      "true", "Enable AVX-512 Population Count Instructions",
                      [FeatureAVX512]>;
def FeaturePFI : SubtargetFeature<"avx512pf", "HasPFI", "true",
                      "Enable AVX-512 PreFetch Instructions",
                      [FeatureAVX512]>;
// PREFETCHWT1 implies nothing.
def FeaturePREFETCHWT1 : SubtargetFeature<"prefetchwt1", "HasPFPREFETCHWT1",
                      "true",
                      "Prefetch with Intent to Write and T1 Hint">;
def FeatureDQI : SubtargetFeature<"avx512dq", "HasDQI", "true",
                      "Enable AVX-512 Doubleword and Quadword Instructions",
                      [FeatureAVX512]>;
def FeatureBWI : SubtargetFeature<"avx512bw", "HasBWI", "true",
                      "Enable AVX-512 Byte and Word Instructions",
                      [FeatureAVX512]>;
def FeatureVLX : SubtargetFeature<"avx512vl", "HasVLX", "true",
                      "Enable AVX-512 Vector Length eXtensions",
                      [FeatureAVX512]>;
// VBMI builds on the byte/word extension rather than directly on AVX512F.
def FeatureVBMI : SubtargetFeature<"avx512vbmi", "HasVBMI", "true",
                      "Enable AVX-512 Vector Byte Manipulation Instructions",
                      [FeatureBWI]>;
// Help text corrected: "Multiply-Add", not "Multiple-Add".
def FeatureIFMA : SubtargetFeature<"avx512ifma", "HasIFMA", "true",
                      "Enable AVX-512 Integer Fused Multiply-Add",
                      [FeatureAVX512]>;
// Protection keys; implies nothing.
def FeaturePKU : SubtargetFeature<"pku", "HasPKU", "true",
                      "Enable protection keys">;
// Carry-less multiply; requires SSE2.
def FeaturePCLMUL : SubtargetFeature<"pclmul", "HasPCLMUL", "true",
                         "Enable packed carry-less multiplication instructions",
                         [FeatureSSE2]>;
// FMA4 requires both AVX and SSE4a. Help text corrected: "multiply-add", not
// "multiple-add".
def FeatureFMA4 : SubtargetFeature<"fma4", "HasFMA4", "true",
                                   "Enable four-operand fused multiply-add",
                                   [FeatureAVX, FeatureSSE4A]>;
// XOP implies FMA4 (and through it AVX and SSE4a).
def FeatureXOP : SubtargetFeature<"xop", "HasXOP", "true",
                                  "Enable XOP instructions",
                                  [FeatureFMA4]>;
def FeatureSSEUnalignedMem : SubtargetFeature<"sse-unaligned-mem",
                         "HasSSEUnalignedMem", "true",
                         "Allow unaligned memory operands with SSE instructions">;
// AES requires SSE2.
def FeatureAES : SubtargetFeature<"aes", "HasAES", "true",
                                  "Enable AES instructions",
                                  [FeatureSSE2]>;
// Assorted single-flag ISA extensions. All are independent of one another;
// only SHA carries an implied feature (SSE2).
def FeatureTBM : SubtargetFeature<
    "tbm", "HasTBM", "true",
    "Enable TBM instructions">;
def FeatureLWP : SubtargetFeature<
    "lwp", "HasLWP", "true",
    "Enable LWP instructions">;
def FeatureMOVBE : SubtargetFeature<
    "movbe", "HasMOVBE", "true",
    "Support MOVBE instruction">;
// Note the feature string is spelled "rdrnd".
def FeatureRDRAND : SubtargetFeature<
    "rdrnd", "HasRDRAND", "true",
    "Support RDRAND instruction">;
def FeatureFSGSBase : SubtargetFeature<
    "fsgsbase", "HasFSGSBase", "true",
    "Support FS/GS Base instructions">;
def FeatureLZCNT : SubtargetFeature<
    "lzcnt", "HasLZCNT", "true",
    "Support LZCNT instruction">;
def FeatureBMI : SubtargetFeature<
    "bmi", "HasBMI", "true",
    "Support BMI instructions">;
def FeatureBMI2 : SubtargetFeature<
    "bmi2", "HasBMI2", "true",
    "Support BMI2 instructions">;
def FeatureRTM : SubtargetFeature<
    "rtm", "HasRTM", "true",
    "Support RTM instructions">;
def FeatureADX : SubtargetFeature<
    "adx", "HasADX", "true",
    "Support ADX instructions">;
def FeatureSHA : SubtargetFeature<
    "sha", "HasSHA", "true",
    "Enable SHA instructions",
    [FeatureSSE2]>;
def FeaturePRFCHW : SubtargetFeature<
    "prfchw", "HasPRFCHW", "true",
    "Support PRFCHW instructions">;
def FeatureRDSEED : SubtargetFeature<
    "rdseed", "HasRDSEED", "true",
    "Support RDSEED instruction">;
// Note the feature string is spelled "sahf".
def FeatureLAHFSAHF : SubtargetFeature<
    "sahf", "HasLAHFSAHF", "true",
    "Support LAHF and SAHF instructions">;
def FeatureMWAITX : SubtargetFeature<
    "mwaitx", "HasMWAITX", "true",
    "Enable MONITORX/MWAITX timer functionality">;
def FeatureCLZERO : SubtargetFeature<
    "clzero", "HasCLZERO", "true",
    "Enable Cache Line Zero">;
def FeatureMPX : SubtargetFeature<
    "mpx", "HasMPX", "true",
    "Support MPX instructions">;
// Code-generation tuning flags.
def FeatureLEAForSP : SubtargetFeature<
    "lea-sp", "UseLeaForSP", "true",
    "Use LEA for adjusting the stack pointer">;
// The two slow-divide flags are exposed under the feature strings
// "idivl-to-divb" and "idivq-to-divl".
def FeatureSlowDivide32 : SubtargetFeature<
    "idivl-to-divb", "HasSlowDivide32", "true",
    "Use 8-bit divide for positive values less than 256">;
def FeatureSlowDivide64 : SubtargetFeature<
    "idivq-to-divl", "HasSlowDivide64", "true",
    "Use 32-bit divide for positive values less than 2^32">;
def FeaturePadShortFunctions : SubtargetFeature<
    "pad-short-functions", "PadShortFunctions", "true",
    "Pad short functions">;

// Further ISA-extension flags.
def FeatureSGX : SubtargetFeature<
    "sgx", "HasSGX", "true",
    "Enable Software Guard Extensions">;
def FeatureCLFLUSHOPT : SubtargetFeature<
    "clflushopt", "HasCLFLUSHOPT", "true",
    "Flush A Cache Line Optimized">;
def FeatureCLWB : SubtargetFeature<
    "clwb", "HasCLWB", "true",
    "Cache Line Write Back">;
// Some processors are slow on instructions that implicitly take two memory
// operands. In practice that means CALL, PUSH and POP with a memory operand
// should be avoided in favor of a MOV followed by a register CALL/PUSH/POP.
def FeatureSlowTwoMemOps : SubtargetFeature<
    "slow-two-mem-ops", "SlowTwoMemOps", "true",
    "Two memory operand instructions are slow">;

// LEA-related tuning flags.
def FeatureLEAUsesAG : SubtargetFeature<
    "lea-uses-ag", "LEAUsesAG", "true",
    "LEA instruction needs inputs at AG stage">;
def FeatureSlowLEA : SubtargetFeature<
    "slow-lea", "SlowLEA", "true",
    "LEA instruction with certain arguments is slow">;
def FeatureSlow3OpsLEA : SubtargetFeature<
    "slow-3ops-lea", "Slow3OpsLEA", "true",
    "LEA instruction with 3 ops or certain registers is slow">;

def FeatureSlowIncDec : SubtargetFeature<
    "slow-incdec", "SlowIncDec", "true",
    "INC and DEC instructions are slower than ADD and SUB">;
def FeatureSoftFloat : SubtargetFeature<
    "soft-float", "UseSoftFloat", "true",
    "Use software floating point features.">;
// Some X86 processors incur no performance hazard when only the lower part of
// a YMM or ZMM register is written and the upper part is left uncleared.
def FeatureFastPartialYMMorZMMWrite : SubtargetFeature<
    "fast-partial-ymm-or-zmm-write", "HasFastPartialYMMorZMMWrite", "true",
    "Partial writes to YMM/ZMM registers are fast">;

// Enable FeatureFastScalarFSQRT when scalar FSQRT has shorter latency than the
// equivalent NR code, and FeatureFastVectorFSQRT when vector FSQRT has higher
// throughput than the equivalent NR code.
// Rationale: throughput-bound code is likely to be vectorized, so for vector
// code the throughput of SQRT matters. Scalar code probably has some kind of
// dependency, so there reducing latency matters more.
def FeatureFastScalarFSQRT : SubtargetFeature<
    "fast-scalar-fsqrt", "HasFastScalarFSQRT", "true",
    "Scalar SQRT is fast (disable Newton-Raphson)">;
def FeatureFastVectorFSQRT : SubtargetFeature<
    "fast-vector-fsqrt", "HasFastVectorFSQRT", "true",
    "Vector SQRT is fast (disable Newton-Raphson)">;

// When lzcnt has latency/throughput equivalent to most simple integer ops, it
// can be used to replace test/set sequences.
def FeatureFastLZCNT : SubtargetFeature<
    "fast-lzcnt", "HasFastLZCNT", "true",
    "LZCNT instructions are as fast as most simple integer ops">;
David Greene8f6f72c2009-06-26 22:46:54 +0000269
Craig Topperd88389a2017-02-21 06:39:13 +0000270
// On Sandy Bridge and newer, SHLD with the same source on both inputs can
// implement a rotate, avoiding the partial flag update of the normal rotate
// instructions.
def FeatureFastSHLDRotate : SubtargetFeature<
    "fast-shld-rotate", "HasFastSHLDRotate", "true",
    "SHLD can be used as a faster rotate">;

// Ivy Bridge and newer have enhanced REP MOVSB and STOSB (aka "string
// operations"); see "REP String Enhancement" in the Intel Software Development
// Manual. In essence REP MOVSB then copies using the largest available size
// rather than byte by byte, making it at least as fast as REPMOVS{W,D,Q}.
def FeatureERMSB : SubtargetFeature<
    "ermsb", "HasERMSB", "true",
    "REP MOVS/STOS are fast">;

// On Sandy Bridge and newer, many instructions can be fused with a conditional
// branch and pass through the CPU as a single operation.
def FeatureMacroFusion : SubtargetFeature<
    "macrofusion", "HasMacroFusion", "true",
    "Various instructions can be fused with conditional branches">;
295
Evan Chengff1beda2006-10-06 09:17:41 +0000296//===----------------------------------------------------------------------===//
297// X86 processors supported.
298//===----------------------------------------------------------------------===//
299
Andrew Trick8523b162012-02-01 23:20:51 +0000300include "X86Schedule.td"
301
// Processor-family markers. Each one stores a family enumerator name in the
// X86ProcFamily subtarget attribute.
def ProcIntelAtom : SubtargetFeature<
    "atom", "X86ProcFamily", "IntelAtom",
    "Intel Atom processors">;
def ProcIntelSLM : SubtargetFeature<
    "slm", "X86ProcFamily", "IntelSLM",
    "Intel Silvermont processors">;
def ProcIntelGLM : SubtargetFeature<
    "glm", "X86ProcFamily", "IntelGLM",
    "Intel Goldmont processors">;
def ProcIntelHSW : SubtargetFeature<
    "haswell", "X86ProcFamily", "IntelHaswell",
    "Intel Haswell processors">;
def ProcIntelBDW : SubtargetFeature<
    "broadwell", "X86ProcFamily", "IntelBroadwell",
    "Intel Broadwell processors">;
def ProcIntelSKL : SubtargetFeature<
    "skylake", "X86ProcFamily", "IntelSkylake",
    "Intel Skylake processors">;
def ProcIntelKNL : SubtargetFeature<
    "knl", "X86ProcFamily", "IntelKNL",
    "Intel Knights Landing processors">;
def ProcIntelSKX : SubtargetFeature<
    "skx", "X86ProcFamily", "IntelSKX",
    "Intel Skylake Server processors">;
def ProcIntelCNL : SubtargetFeature<
    "cannonlake", "X86ProcFamily", "IntelCannonlake",
    "Intel Cannonlake processors">;
def ProcIntelICL : SubtargetFeature<
    "icelake", "X86ProcFamily", "IntelIcelake",
    "Intel Icelake processors">;
Andrew Trick8523b162012-02-01 23:20:51 +0000322
// Shorthand for a processor that uses GenericModel as its scheduling model.
//   Name     - processor name string.
//   Features - subtarget features enabled for that processor.
class Proc<string Name, list<SubtargetFeature> Features> :
    ProcessorModel<Name, GenericModel, Features>;
Andrew Trick8523b162012-02-01 23:20:51 +0000325
// Baseline processors: x87 plus slow unaligned 16-byte accesses, nothing else.
foreach P = ["generic", "i386", "i486", "i586", "pentium"] in {
  def : Proc<P, [FeatureX87, FeatureSlowUAMem16]>;
}

// Pentium MMX adds MMX to the baseline.
def : Proc<"pentium-mmx", [FeatureX87, FeatureSlowUAMem16, FeatureMMX]>;

// i686 / Pentium Pro add CMOV to the baseline.
def : Proc<"i686",       [FeatureX87, FeatureSlowUAMem16, FeatureCMOV]>;
def : Proc<"pentiumpro", [FeatureX87, FeatureSlowUAMem16, FeatureCMOV]>;

def : Proc<"pentium2", [
  FeatureX87,
  FeatureSlowUAMem16,
  FeatureMMX,
  FeatureCMOV,
  FeatureFXSR
]>;

// Pentium III variants share a single feature list.
def : Proc<"pentium3", [
  FeatureX87,
  FeatureSlowUAMem16,
  FeatureMMX,
  FeatureSSE1,
  FeatureFXSR
]>;
def : Proc<"pentium3m", [
  FeatureX87,
  FeatureSlowUAMem16,
  FeatureMMX,
  FeatureSSE1,
  FeatureFXSR
]>;
Mitch Bodarte60465d2016-04-27 22:52:35 +0000344
// SSE2 and SSE3 class CPUs get the PostRAScheduler enabled.
// The target is really pentium4, the current default processor for a vanilla
// 32-bit clang compilation when no architecture is specified. Doing so
// generally yields a nice performance increase on silvermont and is largely
// neutral on other contemporary large core processors.
// pentium-m, pentium4m, prescott and nocona are covered as well, purely as a
// preventative measure against performance surprises should clang's default
// cpu change slightly.

// pentium-m, pentium4 and pentium4m use identical settings.
foreach P = ["pentium-m", "pentium4", "pentium4m"] in {
  def : ProcessorModel<P, GenericPostRAModel, [
    FeatureX87,
    FeatureSlowUAMem16,
    FeatureMMX,
    FeatureSSE2,
    FeatureFXSR
  ]>;
}
Chandler Carruth32908d72014-05-07 17:37:03 +0000364
// Intel Quark: no subtarget features at all.
def : Proc<"lakemont", []>;

// Intel Core Duo (scheduled with SandyBridgeModel).
def : ProcessorModel<"yonah", SandyBridgeModel, [
  FeatureX87,
  FeatureSlowUAMem16,
  FeatureMMX,
  FeatureSSE3,
  FeatureFXSR
]>;

// NetBurst. nocona is prescott plus CMPXCHG16B.
def : ProcessorModel<"prescott", GenericPostRAModel, [
  FeatureX87,
  FeatureSlowUAMem16,
  FeatureMMX,
  FeatureSSE3,
  FeatureFXSR
]>;
def : ProcessorModel<"nocona", GenericPostRAModel,
                     [FeatureX87, FeatureSlowUAMem16, FeatureMMX, FeatureSSE3,
                      FeatureFXSR, FeatureCMPXCHG16B]>;
Jakob Stoklund Olesen1ac7e662013-03-26 22:19:12 +0000385
// Intel Core 2 Solo/Duo. core2 and penryn differ only in SSE level
// (SSSE3 vs. SSE4.1); both are scheduled with SandyBridgeModel.
def : ProcessorModel<"core2", SandyBridgeModel,
                     [FeatureX87, FeatureSlowUAMem16, FeatureMMX,
                      FeatureSSSE3, FeatureFXSR, FeatureCMPXCHG16B,
                      FeatureLAHFSAHF, FeatureMacroFusion]>;
def : ProcessorModel<"penryn", SandyBridgeModel,
                     [FeatureX87, FeatureSlowUAMem16, FeatureMMX,
                      FeatureSSE41, FeatureFXSR, FeatureCMPXCHG16B,
                      FeatureLAHFSAHF, FeatureMacroFusion]>;
Jakob Stoklund Olesen1ac7e662013-03-26 22:19:12 +0000407
// Atom CPUs.
// BonnellProc<Name> defines an Atom-family processor scheduled with AtomModel.
class BonnellProc<string Name> : ProcessorModel<Name, AtomModel,
    [ProcIntelAtom,
     FeatureX87, FeatureSlowUAMem16, FeatureMMX, FeatureSSSE3, FeatureFXSR,
     FeatureCMPXCHG16B, FeatureMOVBE,
     FeatureLEAForSP, FeatureSlowDivide32, FeatureSlowDivide64,
     FeatureSlowTwoMemOps, FeatureLEAUsesAG, FeaturePadShortFunctions,
     FeatureLAHFSAHF]>;

def : BonnellProc<"bonnell">;
// The generic "atom" name is pinned to the baseline.
def : BonnellProc<"atom">;
Jakob Stoklund Olesen1ac7e662013-03-26 22:19:12 +0000428
// SilvermontProc<Name> defines a Silvermont-family processor scheduled with
// SLMModel.
class SilvermontProc<string Name> : ProcessorModel<Name, SLMModel,
    [ProcIntelSLM,
     FeatureX87, FeatureMMX, FeatureSSE42, FeatureFXSR, FeatureCMPXCHG16B,
     FeatureMOVBE, FeaturePOPCNT, FeaturePCLMUL, FeatureAES,
     FeatureSlowDivide64, FeatureSlowTwoMemOps, FeaturePRFCHW,
     FeatureSlowLEA, FeatureSlowIncDec, FeatureSlowPMULLD,
     FeatureLAHFSAHF]>;

def : SilvermontProc<"silvermont">;
// "slm" is kept as a legacy alias.
def : SilvermontProc<"slm">;
450
// GoldmontProc<Name> defines a Goldmont-family processor. It is scheduled with
// the Silvermont model (SLMModel).
class GoldmontProc<string Name> : ProcessorModel<Name, SLMModel,
    [ProcIntelGLM,
     FeatureX87, FeatureMMX, FeatureSSE42, FeatureFXSR, FeatureCMPXCHG16B,
     FeatureMOVBE, FeaturePOPCNT, FeaturePCLMUL, FeatureAES, FeaturePRFCHW,
     FeatureSlowTwoMemOps, FeatureSlowLEA, FeatureSlowIncDec,
     FeatureLAHFSAHF, FeatureMPX, FeatureSHA, FeatureRDRAND, FeatureRDSEED,
     FeatureXSAVE, FeatureXSAVEOPT, FeatureXSAVEC, FeatureXSAVES,
     FeatureCLFLUSHOPT, FeatureFSGSBase]>;

def : GoldmontProc<"goldmont">;
479
// "Arrandale" along with corei3 and corei5.
// NehalemProc<Name> defines a Nehalem-class processor scheduled with
// SandyBridgeModel.
class NehalemProc<string Name> : ProcessorModel<Name, SandyBridgeModel,
    [FeatureX87, FeatureMMX, FeatureSSE42, FeatureFXSR, FeatureCMPXCHG16B,
     FeaturePOPCNT, FeatureLAHFSAHF, FeatureMacroFusion]>;

def : NehalemProc<"nehalem">;
def : NehalemProc<"corei7">;
Jakob Stoklund Olesen1ac7e662013-03-26 22:19:12 +0000493
// Westmere resembles nehalem but has some additional features (AES and PCLMUL
// in the list below). It is the corei3/i5/i7 path from nehalem to sandybridge.
class WestmereProc<string Name> : ProcessorModel<Name, SandyBridgeModel,
    [FeatureX87, FeatureMMX, FeatureSSE42, FeatureFXSR, FeatureCMPXCHG16B,
     FeaturePOPCNT, FeatureAES, FeaturePCLMUL, FeatureLAHFSAHF,
     FeatureMacroFusion]>;

def : WestmereProc<"westmere">;
509
// Builds a cumulative feature list for a processor generation.
//   Inherited   - features carried over from an earlier generation.
//   NewFeatures - features added by this generation.
// Value holds Inherited followed by NewFeatures.
class ProcessorFeatures<list<SubtargetFeature> Inherited,
                        list<SubtargetFeature> NewFeatures> {
  list<SubtargetFeature> Value =
      !listconcat(Inherited, NewFeatures);
}
514
// A ProcessorModel whose feature list is the concatenation of two lists.
//   Name          - processor name string.
//   Model         - scheduling model for the processor.
//   ProcFeatures  - first part of the feature list.
//   OtherFeatures - appended after ProcFeatures.
class ProcModel<string Name,
                SchedMachineModel Model,
                list<SubtargetFeature> ProcFeatures,
                list<SubtargetFeature> OtherFeatures>
    : ProcessorModel<Name, Model,
                     !listconcat(ProcFeatures, OtherFeatures)>;
519
// Sandy Bridge feature set; it inherits nothing (empty Inherited list).
// No SSE level is listed here: per the original note, llvm treats AVX as a
// reimplementation of SSE rather than a superset.
def SNBFeatures : ProcessorFeatures<[],
    [FeatureX87, FeatureMMX, FeatureAVX, FeatureFXSR, FeatureCMPXCHG16B,
     FeaturePOPCNT, FeatureAES, FeatureSlowDivide64, FeaturePCLMUL,
     FeatureXSAVE, FeatureXSAVEOPT, FeatureLAHFSAHF,
     FeatureSlow3OpsLEA, FeatureFastScalarFSQRT, FeatureFastSHLDRotate,
     FeatureSlowIncDec, FeatureMacroFusion]>;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000541
// Sandy Bridge: SNBFeatures plus FeatureSlowUAMem32. The latter is passed as
// a per-processor extra rather than placed in SNBFeatures, so generations
// that inherit SNBFeatures do not pick it up automatically.
class SandyBridgeProc<string Name>
    : ProcModel<Name, SandyBridgeModel, SNBFeatures.Value,
                [FeatureSlowUAMem32]>;
def : SandyBridgeProc<"sandybridge">;
def : SandyBridgeProc<"corei7-avx">; // Legacy alias.
Evan Chengff1beda2006-10-06 09:17:41 +0000548
// Ivy Bridge feature list: everything in SNBFeatures plus the three
// features below.
def IVBFeatures : ProcessorFeatures<SNBFeatures.Value, [
  FeatureRDRAND, FeatureF16C, FeatureFSGSBase
]>;
554
// Ivy Bridge: IVBFeatures plus FeatureSlowUAMem32, scheduled with the
// Sandy Bridge machine model.
class IvyBridgeProc<string Name>
    : ProcModel<Name, SandyBridgeModel, IVBFeatures.Value,
                [FeatureSlowUAMem32]>;
def : IvyBridgeProc<"ivybridge">;
def : IvyBridgeProc<"core-avx-i">; // Legacy alias.
Craig Topper3657fe42011-10-14 03:21:46 +0000561
// Haswell feature list: everything in IVBFeatures plus the features below.
def HSWFeatures : ProcessorFeatures<IVBFeatures.Value, [
  FeatureAVX2, FeatureBMI, FeatureBMI2, FeatureERMSB, FeatureFMA,
  FeatureLZCNT, FeatureMOVBE
]>;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000571
// Haswell: HSWFeatures plus the ProcIntelHSW marker, scheduled with the
// Haswell machine model.
class HaswellProc<string Name>
    : ProcModel<Name, HaswellModel, HSWFeatures.Value, [ProcIntelHSW]>;
def : HaswellProc<"haswell">;
def : HaswellProc<"core-avx2">; // Legacy alias.
578
// Broadwell feature list: everything in HSWFeatures plus ADX and RDSEED.
def BDWFeatures : ProcessorFeatures<HSWFeatures.Value, [
  FeatureADX, FeatureRDSEED
]>;
// Broadwell: BDWFeatures plus the ProcIntelBDW marker, scheduled with the
// Broadwell machine model.
class BroadwellProc<string Name>
    : ProcModel<Name, BroadwellModel, BDWFeatures.Value, [ProcIntelBDW]>;
def : BroadwellProc<"broadwell">;
588
// Skylake (client) feature list: everything in BDWFeatures plus the
// features below.
def SKLFeatures : ProcessorFeatures<BDWFeatures.Value, [
  FeatureMPX, FeatureRTM, FeatureXSAVEC, FeatureXSAVES, FeatureSGX,
  FeatureCLFLUSHOPT, FeatureFastVectorFSQRT
]>;
598
// Skylake client: SKLFeatures plus the ProcIntelSKL marker, scheduled with
// the Skylake client machine model.
class SkylakeClientProc<string Name>
    : ProcModel<Name, SkylakeClientModel, SKLFeatures.Value, [ProcIntelSKL]>;
def : SkylakeClientProc<"skylake">;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000604
// Knights Landing feature list. It branches off IVBFeatures (not the
// Haswell/Broadwell lists), so the features it shares with those lists are
// spelled out explicitly here.
def KNLFeatures : ProcessorFeatures<IVBFeatures.Value, [
  FeatureAVX512, FeatureERI, FeatureCDI, FeaturePFI, FeaturePREFETCHWT1,
  FeatureADX, FeatureRDSEED, FeatureMOVBE, FeatureLZCNT, FeatureBMI,
  FeatureBMI2, FeatureFMA
]>;
619
// Knights Landing: KNLFeatures plus the per-processor extras below.
// FIXME: define KNL model (the Haswell machine model is used until then).
class KnightsLandingProc<string Name>
    : ProcModel<Name, HaswellModel, KNLFeatures.Value, [
        ProcIntelKNL, FeatureSlowTwoMemOps, FeatureFastPartialYMMorZMMWrite
      ]>;
def : KnightsLandingProc<"knl">;
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000628
// Knights Mill: the same list as Knights Landing with FeatureVPOPCNTDQ
// appended; it also uses the Haswell machine model.
class KnightsMillProc<string Name>
    : ProcModel<Name, HaswellModel, KNLFeatures.Value, [
        ProcIntelKNL, FeatureSlowTwoMemOps, FeatureFastPartialYMMorZMMWrite,
        FeatureVPOPCNTDQ
      ]>;
def : KnightsMillProc<"knm">; // TODO Add AVX5124FMAPS/AVX5124VNNIW features
637
// Skylake server feature list: everything in SKLFeatures plus the
// features below.
def SKXFeatures : ProcessorFeatures<SKLFeatures.Value, [
  FeatureAVX512, FeatureCDI, FeatureDQI, FeatureBWI, FeatureVLX,
  FeaturePKU, FeatureCLWB
]>;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000647
// Skylake server: SKXFeatures plus the ProcIntelSKX marker, scheduled with
// the Skylake server machine model.
class SkylakeServerProc<string Name>
    : ProcModel<Name, SkylakeServerModel, SKXFeatures.Value, [ProcIntelSKX]>;
def : SkylakeServerProc<"skylake-avx512">;
def : SkylakeServerProc<"skx">; // Legacy alias.
654
// Cannon Lake feature list: everything in SKXFeatures plus VBMI, IFMA
// and SHA.
def CNLFeatures : ProcessorFeatures<SKXFeatures.Value, [
  FeatureVBMI, FeatureIFMA, FeatureSHA
]>;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000660
// Cannon Lake: CNLFeatures plus the ProcIntelCNL marker.
// CNLFeatures is derived from the Skylake server list, and Icelake (derived
// from CNLFeatures) is scheduled with SkylakeServerModel, so the same model
// is used here instead of the older HaswellModel to keep the chain
// consistent.
class CannonlakeProc<string Name>
    : ProcModel<Name, SkylakeServerModel, CNLFeatures.Value, [ProcIntelCNL]>;
def : CannonlakeProc<"cannonlake">;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000666
// Ice Lake feature list: currently identical to CNLFeatures.
// TODO: Insert features here.
def ICLFeatures : ProcessorFeatures<CNLFeatures.Value, []>;
670
// Ice Lake: ICLFeatures plus the ProcIntelICL marker, scheduled with the
// Skylake server machine model.
class IcelakeProc<string Name>
    : ProcModel<Name, SkylakeServerModel, ICLFeatures.Value, [ProcIntelICL]>;
def : IcelakeProc<"icelake">;
676
Chandler Carruthaf8924032014-12-09 10:58:36 +0000677// AMD CPUs.
Robert Khasanovbfa01312014-07-21 14:54:21 +0000678
// K6 family. "k6" lists MMX; "k6-2" and "k6-3" list 3DNow instead.
def : Proc<"k6", [FeatureX87, FeatureSlowUAMem16, FeatureMMX]>;
foreach P = ["k6-2", "k6-3"] in {
  def : Proc<P, [FeatureX87, FeatureSlowUAMem16, Feature3DNow]>;
}
Craig Topper38373222017-11-01 22:15:49 +0000682
// Original Athlon names; both share one feature list.
foreach P = ["athlon", "athlon-tbird"] in {
  def : Proc<P, [
    FeatureX87, FeatureSlowUAMem16, Feature3DNowA, FeatureSlowSHLD
  ]>;
}
686
// Athlon names that additionally list SSE1 and FXSR.
foreach P = ["athlon-4", "athlon-xp", "athlon-mp"] in {
  def : Proc<P, [
    FeatureX87, FeatureSlowUAMem16, FeatureSSE1, Feature3DNowA, FeatureFXSR,
    FeatureSlowSHLD
  ]>;
}
691
// K8 names: SSE2 level with Feature64Bit.
foreach P = ["k8", "opteron", "athlon64", "athlon-fx"] in {
  def : Proc<P, [
    FeatureX87, FeatureSlowUAMem16, FeatureSSE2, Feature3DNowA, FeatureFXSR,
    Feature64Bit, FeatureSlowSHLD
  ]>;
}
696
// K8 names with SSE3. These are SSE3 variants of the k8/opteron/athlon64
// entries, which list Feature64Bit, and this list already enables the
// 64-bit-only CMPXCHG16B; Feature64Bit is therefore listed here too so the
// two groups agree.
foreach P = ["k8-sse3", "opteron-sse3", "athlon64-sse3"] in {
  def : Proc<P, [FeatureX87, FeatureSlowUAMem16, FeatureSSE3, Feature3DNowA,
                 FeatureFXSR, FeatureCMPXCHG16B, FeatureSlowSHLD,
                 Feature64Bit]>;
}
701
// Family 10h names. Unlike the older AMD entries, this list does not
// include FeatureSlowUAMem16.
foreach P = ["amdfam10", "barcelona"] in {
  def : Proc<P, [
    FeatureX87, FeatureSSE4A, Feature3DNowA, FeatureFXSR, FeatureCMPXCHG16B,
    FeatureLZCNT, FeaturePOPCNT, FeatureSlowSHLD, FeatureLAHFSAHF
  ]>;
}
Sanjay Patel9e916dc2015-08-21 20:17:26 +0000707
// Bobcat (btver1). Declared with Proc, i.e. without a dedicated scheduling
// model argument.
def : Proc<"btver1", [
  FeatureX87, FeatureMMX, FeatureSSSE3, FeatureSSE4A, FeatureFXSR,
  FeatureCMPXCHG16B, FeaturePRFCHW, FeatureLZCNT, FeaturePOPCNT,
  FeatureSlowSHLD, FeatureLAHFSAHF
]>;
Sanjay Patel1191adf2014-09-09 20:07:07 +0000722
// Jaguar (btver2), scheduled with its own BtVer2Model.
def : ProcessorModel<"btver2", BtVer2Model, [
  FeatureX87, FeatureMMX, FeatureAVX, FeatureFXSR, FeatureSSE4A,
  FeatureCMPXCHG16B, FeaturePRFCHW, FeatureAES, FeaturePCLMUL, FeatureBMI,
  FeatureF16C, FeatureMOVBE, FeatureLZCNT, FeatureFastLZCNT, FeaturePOPCNT,
  FeatureXSAVE, FeatureXSAVEOPT, FeatureSlowSHLD, FeatureLAHFSAHF,
  FeatureFastPartialYMMorZMMWrite
]>;
Sanjay Patele57f3c02014-11-28 18:40:18 +0000746
// Bulldozer (bdver1). First of the four bdver entries; the later ones
// repeat this list with additions.
def : Proc<"bdver1", [
  FeatureX87, FeatureXOP, FeatureFMA4, FeatureCMPXCHG16B, FeatureAES,
  FeaturePRFCHW, FeaturePCLMUL, FeatureMMX, FeatureAVX, FeatureFXSR,
  FeatureSSE4A, FeatureLZCNT, FeaturePOPCNT, FeatureXSAVE, FeatureLWP,
  FeatureSlowSHLD, FeatureLAHFSAHF, FeatureMacroFusion
]>;
// Piledriver (bdver2). Compared with the bdver1 list this one also contains
// F16C, BMI, TBM and FMA.
def : Proc<"bdver2", [
  FeatureX87, FeatureXOP, FeatureFMA4, FeatureCMPXCHG16B, FeatureAES,
  FeaturePRFCHW, FeaturePCLMUL, FeatureMMX, FeatureAVX, FeatureFXSR,
  FeatureSSE4A, FeatureF16C, FeatureLZCNT, FeaturePOPCNT, FeatureXSAVE,
  FeatureBMI, FeatureTBM, FeatureLWP, FeatureFMA, FeatureSlowSHLD,
  FeatureLAHFSAHF, FeatureMacroFusion
]>;
Benjamin Kramerd114def2013-11-04 10:29:20 +0000793
// Steamroller (bdver3). Compared with the bdver2 list this one also
// contains XSAVEOPT and FSGSBase.
def : Proc<"bdver3", [
  FeatureX87, FeatureXOP, FeatureFMA4, FeatureCMPXCHG16B, FeatureAES,
  FeaturePRFCHW, FeaturePCLMUL, FeatureMMX, FeatureAVX, FeatureFXSR,
  FeatureSSE4A, FeatureF16C, FeatureLZCNT, FeaturePOPCNT, FeatureXSAVE,
  FeatureBMI, FeatureTBM, FeatureLWP, FeatureFMA, FeatureXSAVEOPT,
  FeatureSlowSHLD, FeatureFSGSBase, FeatureLAHFSAHF, FeatureMacroFusion
]>;
Benjamin Kramerd114def2013-11-04 10:29:20 +0000821
// Excavator (bdver4). This list names AVX2, BMI2 and MWAITX, none of which
// appear in the bdver3 list.
def : Proc<"bdver4", [
  FeatureX87, FeatureMMX, FeatureAVX2, FeatureFXSR, FeatureXOP, FeatureFMA4,
  FeatureCMPXCHG16B, FeatureAES, FeaturePRFCHW, FeaturePCLMUL, FeatureF16C,
  FeatureLZCNT, FeaturePOPCNT, FeatureXSAVE, FeatureBMI, FeatureBMI2,
  FeatureTBM, FeatureLWP, FeatureFMA, FeatureXSAVEOPT, FeatureSlowSHLD,
  FeatureFSGSBase, FeatureLAHFSAHF, FeatureMWAITX, FeatureMacroFusion
]>;
Benjamin Kramer60045732014-05-02 15:47:07 +0000850
// Znver1, scheduled with its own Znver1Model. The feature list is kept in
// the same (roughly alphabetical) order as before.
def : ProcessorModel<"znver1", Znver1Model, [
  FeatureADX, FeatureAES, FeatureAVX2, FeatureBMI, FeatureBMI2,
  FeatureCLFLUSHOPT, FeatureCLZERO, FeatureCMPXCHG16B, FeatureF16C,
  FeatureFMA, FeatureFSGSBase, FeatureFXSR, FeatureFastLZCNT,
  FeatureLAHFSAHF, FeatureLZCNT, FeatureMacroFusion, FeatureMMX,
  FeatureMOVBE, FeatureMWAITX, FeaturePCLMUL, FeaturePOPCNT, FeaturePRFCHW,
  FeatureRDRAND, FeatureRDSEED, FeatureSHA, FeatureSSE4A, FeatureSlowSHLD,
  FeatureX87, FeatureXSAVE, FeatureXSAVEC, FeatureXSAVEOPT, FeatureXSAVES
]>;
885
// Geode.
def : Proc<"geode", [
  FeatureX87, FeatureSlowUAMem16, Feature3DNowA
]>;
Evan Chengff1beda2006-10-06 09:17:41 +0000887
// WinChip and C3 names. "winchip2" and "c3" share one feature list.
def : Proc<"winchip-c6", [FeatureX87, FeatureSlowUAMem16, FeatureMMX]>;
foreach P = ["winchip2", "c3"] in {
  def : Proc<P, [FeatureX87, FeatureSlowUAMem16, Feature3DNow]>;
}
def : Proc<"c3-2", [
  FeatureX87, FeatureSlowUAMem16, FeatureMMX, FeatureSSE1, FeatureFXSR
]>;
Evan Chengff1beda2006-10-06 09:17:41 +0000893
// Generic 64-bit x86 processor model. It aims to be good for modern chips
// without enabling instruction set encodings past the basic SSE2 and 64-bit
// ones: it disables things that are slow on any mainstream, modern 64-bit
// x86 chip and enables features that are generally beneficial.
//
// The Sandy Bridge model is currently the default scheduling model because
// it is used across Nehalem, Westmere, Sandy Bridge, and Ivy Bridge, which
// covers a huge swath of x86 processors. If specific scheduling knobs need
// to be tuned differently for AMD chips, we might consider forming a common
// base for them.
def : ProcessorModel<"x86-64", SandyBridgeModel, [
  FeatureX87, FeatureMMX, FeatureSSE2, FeatureFXSR, Feature64Bit,
  FeatureSlow3OpsLEA, FeatureSlowIncDec, FeatureMacroFusion
]>;
Chandler Carruth32908d72014-05-07 17:37:03 +0000914
Evan Chengff1beda2006-10-06 09:17:41 +0000915//===----------------------------------------------------------------------===//
Chris Lattner5da8e802003-08-03 15:47:49 +0000916// Register File Description
917//===----------------------------------------------------------------------===//
918
919include "X86RegisterInfo.td"
Igor Bregerb4442f32017-02-10 07:05:56 +0000920include "X86RegisterBanks.td"
Chris Lattner5da8e802003-08-03 15:47:49 +0000921
Chris Lattnera8c3cff2003-08-03 18:19:37 +0000922//===----------------------------------------------------------------------===//
923// Instruction Descriptions
924//===----------------------------------------------------------------------===//
925
Chris Lattner59a4a912003-08-03 21:54:21 +0000926include "X86InstrInfo.td"
927
// Instruction-set record for X86; referenced as InstructionSet by the X86
// Target definition at the end of this file.
def X86InstrInfo : InstrInfo;
Chris Lattnera8c3cff2003-08-03 18:19:37 +0000929
Chris Lattner5d00a0b2007-02-26 18:17:14 +0000930//===----------------------------------------------------------------------===//
931// Calling Conventions
932//===----------------------------------------------------------------------===//
933
934include "X86CallingConv.td"
935
936
937//===----------------------------------------------------------------------===//
Jim Grosbach4cf25f52010-10-30 13:48:28 +0000938// Assembly Parser
Chris Lattner5d00a0b2007-02-26 18:17:14 +0000939//===----------------------------------------------------------------------===//
940
// AT&T-syntax assembly parser variant (variant number 0).
def ATTAsmParserVariant : AsmParserVariant {
  let Variant = 0;

  // Variant name.
  let Name = "att";

  // Discard comments in assembly strings.
  let CommentDelimiter = "#";

  // Recognize hard coded registers.
  let RegisterPrefix = "%";
}
953
// Intel-syntax assembly parser variant (variant number 1).
def IntelAsmParserVariant : AsmParserVariant {
  let Variant = 1;

  // Variant name.
  let Name = "intel";

  // Discard comments in assembly strings.
  let CommentDelimiter = ";";

  // Recognize hard coded registers; Intel syntax uses no register prefix.
  let RegisterPrefix = "";
}
966
Jim Grosbach4cf25f52010-10-30 13:48:28 +0000967//===----------------------------------------------------------------------===//
968// Assembly Printers
969//===----------------------------------------------------------------------===//
970
// The X86 target supports two different syntaxes for emitting machine code;
// the syntax is selected with the -x86-asm-syntax={att|intel} option.
// Each writer names its printer class and its variant number.
def ATTAsmWriter : AsmWriter {
  let AsmWriterClassName = "ATTInstPrinter";
  let Variant = 0;
}
def IntelAsmWriter : AsmWriter {
  let AsmWriterClassName = "IntelInstPrinter";
  let Variant = 1;
}
981
// Top-level target record: ties together the instruction set and the
// AT&T/Intel assembly parser variants and writers defined above.
def X86 : Target {
  // Information about the instructions...
  let InstructionSet = X86InstrInfo;

  // Both lists are ordered AT&T first, then Intel.
  let AssemblyParserVariants = [ATTAsmParserVariant, IntelAsmParserVariant];
  let AssemblyWriters = [ATTAsmWriter, IntelAsmWriter];
}