blob: 0d0ec76c7436a5be4a23204b1cad9a01ca0bc4ea [file] [log] [blame]
Jia Liub22310f2012-02-18 12:03:15 +00001//===-- X86.td - Target definition file for the Intel X86 --*- tablegen -*-===//
Michael J. Spencerb88784c2011-04-14 14:33:36 +00002//
John Criswell29265fe2003-10-21 15:17:13 +00003// The LLVM Compiler Infrastructure
4//
Chris Lattnerf3ebc3f2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Michael J. Spencerb88784c2011-04-14 14:33:36 +00007//
John Criswell29265fe2003-10-21 15:17:13 +00008//===----------------------------------------------------------------------===//
Chris Lattner5da8e802003-08-03 15:47:49 +00009//
Craig Topper271064e2011-10-11 06:44:02 +000010// This is a target description file for the Intel i386 architecture, referred
11// to here as the "X86" architecture.
Chris Lattner5da8e802003-08-03 15:47:49 +000012//
13//===----------------------------------------------------------------------===//
14
Chris Lattner25510802003-08-04 04:59:56 +000015// Get the target-independent interfaces which we are implementing...
Chris Lattner5da8e802003-08-03 15:47:49 +000016//
Evan Cheng977e7be2008-11-24 07:34:46 +000017include "llvm/Target/Target.td"
Chris Lattner5da8e802003-08-03 15:47:49 +000018
19//===----------------------------------------------------------------------===//
Anitha Boyapati426feb62012-08-16 03:50:04 +000020// X86 Subtarget state
Evan Cheng13bcc6c2011-07-07 21:06:52 +000021//
22
23def Mode64Bit : SubtargetFeature<"64bit-mode", "In64BitMode", "true",
24 "64-bit mode (x86_64)">;
Craig Topper3c80d622014-01-06 04:55:54 +000025def Mode32Bit : SubtargetFeature<"32bit-mode", "In32BitMode", "true",
26 "32-bit mode (80386)">;
27def Mode16Bit : SubtargetFeature<"16bit-mode", "In16BitMode", "true",
28 "16-bit mode (i8086)">;
Evan Cheng13bcc6c2011-07-07 21:06:52 +000029
30//===----------------------------------------------------------------------===//
Anitha Boyapati426feb62012-08-16 03:50:04 +000031// X86 Subtarget features
Bill Wendlinge6182262007-05-04 20:38:40 +000032//===----------------------------------------------------------------------===//
Chris Lattnercc8c5812009-09-02 05:53:04 +000033
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +000034def FeatureX87 : SubtargetFeature<"x87","HasX87", "true",
35 "Enable X87 float instructions">;
36
Craig Topper505f38a2018-01-10 22:07:16 +000037def FeatureNOPL : SubtargetFeature<"nopl", "HasNOPL", "true",
38 "Enable NOPL instruction">;
39
Chris Lattnercc8c5812009-09-02 05:53:04 +000040def FeatureCMOV : SubtargetFeature<"cmov","HasCMov", "true",
41 "Enable conditional move instructions">;
42
Benjamin Kramer2f489232010-12-04 20:32:23 +000043def FeaturePOPCNT : SubtargetFeature<"popcnt", "HasPOPCNT", "true",
44 "Support POPCNT instruction">;
45
Craig Topper09b65982015-10-16 06:03:09 +000046def FeatureFXSR : SubtargetFeature<"fxsr", "HasFXSR", "true",
47 "Support fxsave/fxrestore instructions">;
48
Amjad Aboud1db6d7a2015-10-12 11:47:46 +000049def FeatureXSAVE : SubtargetFeature<"xsave", "HasXSAVE", "true",
50 "Support xsave instructions">;
51
52def FeatureXSAVEOPT: SubtargetFeature<"xsaveopt", "HasXSAVEOPT", "true",
53 "Support xsaveopt instructions">;
54
55def FeatureXSAVEC : SubtargetFeature<"xsavec", "HasXSAVEC", "true",
56 "Support xsavec instructions">;
57
58def FeatureXSAVES : SubtargetFeature<"xsaves", "HasXSAVES", "true",
59 "Support xsaves instructions">;
60
Bill Wendlinge6182262007-05-04 20:38:40 +000061def FeatureSSE1 : SubtargetFeature<"sse", "X86SSELevel", "SSE1",
62 "Enable SSE instructions",
Chris Lattnercc8c5812009-09-02 05:53:04 +000063 // SSE codegen depends on cmovs, and all
Michael J. Spencerb88784c2011-04-14 14:33:36 +000064 // SSE1+ processors support them.
Eric Christopher11e59832015-10-08 20:10:06 +000065 [FeatureCMOV]>;
Bill Wendlinge6182262007-05-04 20:38:40 +000066def FeatureSSE2 : SubtargetFeature<"sse2", "X86SSELevel", "SSE2",
67 "Enable SSE2 instructions",
68 [FeatureSSE1]>;
69def FeatureSSE3 : SubtargetFeature<"sse3", "X86SSELevel", "SSE3",
70 "Enable SSE3 instructions",
71 [FeatureSSE2]>;
72def FeatureSSSE3 : SubtargetFeature<"ssse3", "X86SSELevel", "SSSE3",
73 "Enable SSSE3 instructions",
74 [FeatureSSE3]>;
Rafael Espindola94a2c562013-08-23 20:21:34 +000075def FeatureSSE41 : SubtargetFeature<"sse4.1", "X86SSELevel", "SSE41",
Nate Begemane14fdfa2008-02-03 07:18:54 +000076 "Enable SSE 4.1 instructions",
77 [FeatureSSSE3]>;
Rafael Espindola94a2c562013-08-23 20:21:34 +000078def FeatureSSE42 : SubtargetFeature<"sse4.2", "X86SSELevel", "SSE42",
Nate Begemane14fdfa2008-02-03 07:18:54 +000079 "Enable SSE 4.2 instructions",
Craig Topper7bd33052011-12-29 15:51:45 +000080 [FeatureSSE41]>;
Eric Christopher57a6e132015-11-14 03:04:00 +000081// The MMX subtarget feature is separate from the rest of the SSE features
82// because it's important (for odd compatibility reasons) to be able to
83// turn it off explicitly while allowing SSE+ to be on.
84def FeatureMMX : SubtargetFeature<"mmx","X863DNowLevel", "MMX",
85 "Enable MMX instructions">;
Bill Wendlinge6182262007-05-04 20:38:40 +000086def Feature3DNow : SubtargetFeature<"3dnow", "X863DNowLevel", "ThreeDNow",
Michael J. Spencer30088ba2011-04-15 00:32:41 +000087 "Enable 3DNow! instructions",
88 [FeatureMMX]>;
Bill Wendlinge6182262007-05-04 20:38:40 +000089def Feature3DNowA : SubtargetFeature<"3dnowa", "X863DNowLevel", "ThreeDNowA",
Bill Wendlingf985c492007-05-06 07:56:19 +000090 "Enable 3DNow! Athlon instructions",
91 [Feature3DNow]>;
Dan Gohman74037512009-02-03 00:04:43 +000092// All x86-64 hardware has SSE2, but we don't mark SSE2 as an implied
93// feature, because SSE2 can be disabled (e.g. for compiling OS kernels)
94// without disabling 64-bit mode.
Bill Wendlingf985c492007-05-06 07:56:19 +000095def Feature64Bit : SubtargetFeature<"64bit", "HasX86_64", "true",
Chris Lattner77f7dba2010-03-14 22:24:34 +000096 "Support 64-bit instructions",
97 [FeatureCMOV]>;
Nick Lewycky3be42b82013-10-05 20:11:44 +000098def FeatureCMPXCHG16B : SubtargetFeature<"cx16", "HasCmpxchg16b", "true",
Eli Friedman5e570422011-08-26 21:21:21 +000099 "64-bit with cmpxchg16b",
100 [Feature64Bit]>;
Ekaterina Romanovad5fa5542013-11-21 23:21:26 +0000101def FeatureSlowSHLD : SubtargetFeature<"slow-shld", "IsSHLDSlow", "true",
102 "SHLD instruction is slow">;
Zvi Rackover8bc7e4d2016-12-06 19:35:20 +0000103def FeatureSlowPMULLD : SubtargetFeature<"slow-pmulld", "IsPMULLDSlow", "true",
104 "PMULLD instruction is slow">;
Sanjay Patel30145672015-09-01 20:51:51 +0000105// FIXME: This should not apply to CPUs that do not have SSE.
106def FeatureSlowUAMem16 : SubtargetFeature<"slow-unaligned-mem-16",
107 "IsUAMem16Slow", "true",
108 "Slow unaligned 16-byte memory access">;
Sanjay Patel501890e2014-11-21 17:40:04 +0000109def FeatureSlowUAMem32 : SubtargetFeature<"slow-unaligned-mem-32",
Sanjay Patel9e916dc2015-08-21 20:17:26 +0000110 "IsUAMem32Slow", "true",
111 "Slow unaligned 32-byte memory access">;
Stefanus Du Toit96180b52009-05-26 21:04:35 +0000112def FeatureSSE4A : SubtargetFeature<"sse4a", "HasSSE4A", "true",
Craig Toppera5d1fc22011-12-30 07:16:00 +0000113 "Support SSE 4a instructions",
114 [FeatureSSE3]>;
Evan Chengff1beda2006-10-06 09:17:41 +0000115
Craig Topperf287a452012-01-09 09:02:13 +0000116def FeatureAVX : SubtargetFeature<"avx", "X86SSELevel", "AVX",
117 "Enable AVX instructions",
118 [FeatureSSE42]>;
119def FeatureAVX2 : SubtargetFeature<"avx2", "X86SSELevel", "AVX2",
Craig Topper228d9132011-10-30 19:57:21 +0000120 "Enable AVX2 instructions",
121 [FeatureAVX]>;
Craig Toppercb6c3862017-11-06 22:49:01 +0000122def FeatureFMA : SubtargetFeature<"fma", "HasFMA", "true",
123 "Enable three-operand fused multiple-add",
124 [FeatureAVX]>;
Craig Topper428a4e62017-11-06 22:49:04 +0000125def FeatureF16C : SubtargetFeature<"f16c", "HasF16C", "true",
126 "Support 16-bit floating point conversion instructions",
127 [FeatureAVX]>;
Craig Topper5c94bb82013-08-21 03:57:57 +0000128def FeatureAVX512 : SubtargetFeature<"avx512f", "X86SSELevel", "AVX512F",
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000129 "Enable AVX-512 instructions",
Craig Topper428a4e62017-11-06 22:49:04 +0000130 [FeatureAVX2, FeatureFMA, FeatureF16C]>;
Craig Topper5c94bb82013-08-21 03:57:57 +0000131def FeatureERI : SubtargetFeature<"avx512er", "HasERI", "true",
Elena Demikhovsky003e7d72013-07-28 08:28:38 +0000132 "Enable AVX-512 Exponential and Reciprocal Instructions",
133 [FeatureAVX512]>;
Craig Topper5c94bb82013-08-21 03:57:57 +0000134def FeatureCDI : SubtargetFeature<"avx512cd", "HasCDI", "true",
Elena Demikhovsky003e7d72013-07-28 08:28:38 +0000135 "Enable AVX-512 Conflict Detection Instructions",
136 [FeatureAVX512]>;
Oren Ben Simhon7bf27f02017-05-25 13:45:23 +0000137def FeatureVPOPCNTDQ : SubtargetFeature<"avx512vpopcntdq", "HasVPOPCNTDQ",
138 "true", "Enable AVX-512 Population Count Instructions",
139 [FeatureAVX512]>;
Craig Topper5c94bb82013-08-21 03:57:57 +0000140def FeaturePFI : SubtargetFeature<"avx512pf", "HasPFI", "true",
Elena Demikhovsky003e7d72013-07-28 08:28:38 +0000141 "Enable AVX-512 PreFetch Instructions",
142 [FeatureAVX512]>;
Craig Toppere2685982017-12-22 02:30:30 +0000143def FeaturePREFETCHWT1 : SubtargetFeature<"prefetchwt1", "HasPREFETCHWT1",
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000144 "true",
145 "Prefetch with Intent to Write and T1 Hint">;
Robert Khasanovbfa01312014-07-21 14:54:21 +0000146def FeatureDQI : SubtargetFeature<"avx512dq", "HasDQI", "true",
147 "Enable AVX-512 Doubleword and Quadword Instructions",
148 [FeatureAVX512]>;
149def FeatureBWI : SubtargetFeature<"avx512bw", "HasBWI", "true",
150 "Enable AVX-512 Byte and Word Instructions",
151 [FeatureAVX512]>;
152def FeatureVLX : SubtargetFeature<"avx512vl", "HasVLX", "true",
153 "Enable AVX-512 Vector Length eXtensions",
154 [FeatureAVX512]>;
Michael Zuckerman97b6a6922016-01-17 13:42:12 +0000155def FeatureVBMI : SubtargetFeature<"avx512vbmi", "HasVBMI", "true",
Craig Topper5c842be2016-11-09 04:50:48 +0000156 "Enable AVX-512 Vector Byte Manipulation Instructions",
157 [FeatureBWI]>;
Coby Tayree71e37cc2017-11-21 09:48:44 +0000158def FeatureVBMI2 : SubtargetFeature<"avx512vbmi2", "HasVBMI2", "true",
159 "Enable AVX-512 further Vector Byte Manipulation Instructions",
160 [FeatureBWI]>;
Craig Topper3bb3f732016-02-08 01:23:15 +0000161def FeatureIFMA : SubtargetFeature<"avx512ifma", "HasIFMA", "true",
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000162 "Enable AVX-512 Integer Fused Multiple-Add",
163 [FeatureAVX512]>;
Asaf Badouh5acf66f2015-12-15 13:35:29 +0000164def FeaturePKU : SubtargetFeature<"pku", "HasPKU", "true",
165 "Enable protection keys">;
Coby Tayree3880f2a2017-11-21 10:04:28 +0000166def FeatureVNNI : SubtargetFeature<"avx512vnni", "HasVNNI", "true",
167 "Enable AVX-512 Vector Neural Network Instructions",
168 [FeatureAVX512]>;
Coby Tayree5c7fe5d2017-11-21 10:32:42 +0000169def FeatureBITALG : SubtargetFeature<"avx512bitalg", "HasBITALG", "true",
170 "Enable AVX-512 Bit Algorithms",
171 [FeatureBWI]>;
Benjamin Kramera0396e42012-05-31 14:34:17 +0000172def FeaturePCLMUL : SubtargetFeature<"pclmul", "HasPCLMUL", "true",
173 "Enable packed carry-less multiplication instructions",
Craig Topper29dd1482012-05-01 05:28:32 +0000174 [FeatureSSE2]>;
Coby Tayreed8b17be2017-11-26 09:36:41 +0000175def FeatureGFNI : SubtargetFeature<"gfni", "HasGFNI", "true",
176 "Enable Galois Field Arithmetic Instructions",
177 [FeatureSSE2]>;
Coby Tayree7ca5e5872017-11-21 09:30:33 +0000178def FeatureVPCLMULQDQ : SubtargetFeature<"vpclmulqdq", "HasVPCLMULQDQ", "true",
179 "Enable vpclmulqdq instructions",
180 [FeatureAVX, FeaturePCLMUL]>;
David Greene8f6f72c2009-06-26 22:46:54 +0000181def FeatureFMA4 : SubtargetFeature<"fma4", "HasFMA4", "true",
Craig Toppera5d1fc22011-12-30 07:16:00 +0000182 "Enable four-operand fused multiple-add",
Craig Topperbae0e9e2012-05-01 06:54:48 +0000183 [FeatureAVX, FeatureSSE4A]>;
Craig Toppera5d1fc22011-12-30 07:16:00 +0000184def FeatureXOP : SubtargetFeature<"xop", "HasXOP", "true",
Craig Topper43518cc2012-05-01 05:41:41 +0000185 "Enable XOP instructions",
Anitha Boyapatiaf3e9832012-08-16 04:04:02 +0000186 [FeatureFMA4]>;
Sanjay Patelffd039b2015-02-03 17:13:04 +0000187def FeatureSSEUnalignedMem : SubtargetFeature<"sse-unaligned-mem",
188 "HasSSEUnalignedMem", "true",
189 "Allow unaligned memory operands with SSE instructions">;
Eric Christopher2ef63182010-04-02 21:54:27 +0000190def FeatureAES : SubtargetFeature<"aes", "HasAES", "true",
Craig Topper29dd1482012-05-01 05:28:32 +0000191 "Enable AES instructions",
192 [FeatureSSE2]>;
Coby Tayree2a1c02f2017-11-21 09:11:41 +0000193def FeatureVAES : SubtargetFeature<"vaes", "HasVAES", "true",
194 "Promote selected AES instructions to AVX512/AVX registers",
195 [FeatureAVX, FeatureAES]>;
Yunzhong Gaodd36e932013-09-24 18:21:52 +0000196def FeatureTBM : SubtargetFeature<"tbm", "HasTBM", "true",
197 "Enable TBM instructions">;
Simon Pilgrim99b925b2017-05-03 15:51:39 +0000198def FeatureLWP : SubtargetFeature<"lwp", "HasLWP", "true",
199 "Enable LWP instructions">;
Craig Topper786bdb92011-10-03 17:28:23 +0000200def FeatureMOVBE : SubtargetFeature<"movbe", "HasMOVBE", "true",
201 "Support MOVBE instruction">;
Rafael Espindola94a2c562013-08-23 20:21:34 +0000202def FeatureRDRAND : SubtargetFeature<"rdrnd", "HasRDRAND", "true",
Craig Topper786bdb92011-10-03 17:28:23 +0000203 "Support RDRAND instruction">;
Craig Topper228d9132011-10-30 19:57:21 +0000204def FeatureFSGSBase : SubtargetFeature<"fsgsbase", "HasFSGSBase", "true",
205 "Support FS/GS Base instructions">;
Craig Topper271064e2011-10-11 06:44:02 +0000206def FeatureLZCNT : SubtargetFeature<"lzcnt", "HasLZCNT", "true",
207 "Support LZCNT instruction">;
Craig Topper3657fe42011-10-14 03:21:46 +0000208def FeatureBMI : SubtargetFeature<"bmi", "HasBMI", "true",
209 "Support BMI instructions">;
Craig Topperaea148c2011-10-16 07:55:05 +0000210def FeatureBMI2 : SubtargetFeature<"bmi2", "HasBMI2", "true",
211 "Support BMI2 instructions">;
Michael Liao73cffdd2012-11-08 07:28:54 +0000212def FeatureRTM : SubtargetFeature<"rtm", "HasRTM", "true",
213 "Support RTM instructions">;
Kay Tiong Khoof809c642013-02-14 19:08:21 +0000214def FeatureADX : SubtargetFeature<"adx", "HasADX", "true",
215 "Support ADX instructions">;
Ben Langmuir16501752013-09-12 15:51:31 +0000216def FeatureSHA : SubtargetFeature<"sha", "HasSHA", "true",
217 "Enable SHA instructions",
218 [FeatureSSE2]>;
Oren Ben Simhonfa582b02017-11-26 13:02:45 +0000219def FeatureSHSTK : SubtargetFeature<"shstk", "HasSHSTK", "true",
220 "Support CET Shadow-Stack instructions">;
221def FeatureIBT : SubtargetFeature<"ibt", "HasIBT", "true",
222 "Support CET Indirect-Branch-Tracking instructions">;
Michael Liao5173ee02013-03-26 17:47:11 +0000223def FeaturePRFCHW : SubtargetFeature<"prfchw", "HasPRFCHW", "true",
224 "Support PRFCHW instructions">;
Michael Liaoa486a112013-03-28 23:41:26 +0000225def FeatureRDSEED : SubtargetFeature<"rdseed", "HasRDSEED", "true",
226 "Support RDSEED instruction">;
Hans Wennborg5000ce82015-12-04 23:00:33 +0000227def FeatureLAHFSAHF : SubtargetFeature<"sahf", "HasLAHFSAHF", "true",
228 "Support LAHF and SAHF instructions">;
Ashutosh Nema348af9c2016-05-18 11:59:12 +0000229def FeatureMWAITX : SubtargetFeature<"mwaitx", "HasMWAITX", "true",
230 "Enable MONITORX/MWAITX timer functionality">;
Craig Topper50f3d142017-02-09 04:27:34 +0000231def FeatureCLZERO : SubtargetFeature<"clzero", "HasCLZERO", "true",
232 "Enable Cache Line Zero">;
Elena Demikhovskyf7e641c2015-06-03 10:30:57 +0000233def FeatureMPX : SubtargetFeature<"mpx", "HasMPX", "true",
234 "Support MPX instructions">;
Sanjay Patel53d1d8b2015-10-12 15:24:01 +0000235def FeatureLEAForSP : SubtargetFeature<"lea-sp", "UseLeaForSP", "true",
Evan Cheng1b81fdd2012-02-07 22:50:41 +0000236 "Use LEA for adjusting the stack pointer">;
Alexey Volkovfd1731d2014-11-21 11:19:34 +0000237def FeatureSlowDivide32 : SubtargetFeature<"idivl-to-divb",
238 "HasSlowDivide32", "true",
239 "Use 8-bit divide for positive values less than 256">;
Nikolai Bozhenov6bdf92c2017-01-12 19:34:15 +0000240def FeatureSlowDivide64 : SubtargetFeature<"idivq-to-divl",
Alexey Volkovfd1731d2014-11-21 11:19:34 +0000241 "HasSlowDivide64", "true",
Nikolai Bozhenov6bdf92c2017-01-12 19:34:15 +0000242 "Use 32-bit divide for positive values less than 2^32">;
Preston Gurda01daac2013-01-08 18:27:24 +0000243def FeaturePadShortFunctions : SubtargetFeature<"pad-short-functions",
244 "PadShortFunctions", "true",
245 "Pad short functions">;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000246def FeatureSGX : SubtargetFeature<"sgx", "HasSGX", "true",
247 "Enable Software Guard Extensions">;
248def FeatureCLFLUSHOPT : SubtargetFeature<"clflushopt", "HasCLFLUSHOPT", "true",
249 "Flush A Cache Line Optimized">;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000250def FeatureCLWB : SubtargetFeature<"clwb", "HasCLWB", "true",
251 "Cache Line Write Back">;
Craig Topper84b26b92018-01-18 23:52:31 +0000252def FeatureRDPID : SubtargetFeature<"rdpid", "HasRDPID", "true",
253 "Support RDPID instructions">;
Craig Topper62c47a22017-08-29 05:14:27 +0000254// On some processors, instructions that implicitly take two memory operands are
255// slow. In practice, this means that CALL, PUSH, and POP with memory operands
256// should be avoided in favor of a MOV + register CALL/PUSH/POP.
257def FeatureSlowTwoMemOps : SubtargetFeature<"slow-two-mem-ops",
258 "SlowTwoMemOps", "true",
259 "Two memory operand instructions are slow">;
Preston Gurd8b7ab4b2013-04-25 20:29:37 +0000260def FeatureLEAUsesAG : SubtargetFeature<"lea-uses-ag", "LEAUsesAG", "true",
261 "LEA instruction needs inputs at AG stage">;
Alexey Volkov6226de62014-05-20 08:55:50 +0000262def FeatureSlowLEA : SubtargetFeature<"slow-lea", "SlowLEA", "true",
263 "LEA instruction with certain arguments is slow">;
Lama Saba2ea271b2017-05-18 08:11:50 +0000264def FeatureSlow3OpsLEA : SubtargetFeature<"slow-3ops-lea", "Slow3OpsLEA", "true",
265 "LEA instruction with 3 ops or certain registers is slow">;
Alexey Volkov5260dba2014-06-09 11:40:41 +0000266def FeatureSlowIncDec : SubtargetFeature<"slow-incdec", "SlowIncDec", "true",
267 "INC and DEC instructions are slower than ADD and SUB">;
Eric Christopher824f42f2015-05-12 01:26:05 +0000268def FeatureSoftFloat
269 : SubtargetFeature<"soft-float", "UseSoftFloat", "true",
270 "Use software floating point features.">;
Marina Yatsina77a21db2018-01-22 10:07:01 +0000271def FeaturePOPCNTFalseDeps : SubtargetFeature<"false-deps-popcnt",
272 "HasPOPCNTFalseDeps", "true",
273 "POPCNT has a false dependency on dest register">;
274def FeatureLZCNTFalseDeps : SubtargetFeature<"false-deps-lzcnt-tzcnt",
275 "HasLZCNTFalseDeps", "true",
276 "LZCNT/TZCNT have a false dependency on dest register">;
Simon Pilgrimfd5df632017-12-19 13:16:43 +0000277// On recent X86 (port bound) processors, its preferable to combine to a single shuffle
278// using a variable mask over multiple fixed shuffles.
279def FeatureFastVariableShuffle
280 : SubtargetFeature<"fast-variable-shuffle",
281 "HasFastVariableShuffle",
282 "true", "Shuffles with variable masks are fast">;
Amjad Aboud4f977512017-03-03 09:03:24 +0000283// On some X86 processors, there is no performance hazard to writing only the
284// lower parts of a YMM or ZMM register without clearing the upper part.
285def FeatureFastPartialYMMorZMMWrite
286 : SubtargetFeature<"fast-partial-ymm-or-zmm-write",
287 "HasFastPartialYMMorZMMWrite",
288 "true", "Partial writes to YMM/ZMM registers are fast">;
Nikolai Bozhenovf6795302016-08-04 12:47:28 +0000289// FeatureFastScalarFSQRT should be enabled if scalar FSQRT has shorter latency
290// than the corresponding NR code. FeatureFastVectorFSQRT should be enabled if
291// vector FSQRT has higher throughput than the corresponding NR code.
292// The idea is that throughput bound code is likely to be vectorized, so for
293// vectorized code we should care about the throughput of SQRT operations.
294// But if the code is scalar that probably means that the code has some kind of
295// dependency and we should care more about reducing the latency.
296def FeatureFastScalarFSQRT
297 : SubtargetFeature<"fast-scalar-fsqrt", "HasFastScalarFSQRT",
298 "true", "Scalar SQRT is fast (disable Newton-Raphson)">;
299def FeatureFastVectorFSQRT
300 : SubtargetFeature<"fast-vector-fsqrt", "HasFastVectorFSQRT",
301 "true", "Vector SQRT is fast (disable Newton-Raphson)">;
Pierre Gousseaub6d652a2016-10-14 16:41:38 +0000302// If lzcnt has equivalent latency/throughput to most simple integer ops, it can
303// be used to replace test/set sequences.
304def FeatureFastLZCNT
305 : SubtargetFeature<
306 "fast-lzcnt", "HasFastLZCNT", "true",
307 "LZCNT instructions are as fast as most simple integer ops">;
Simon Pilgrim02bdac52018-01-29 21:24:31 +0000308// If the target can efficiently decode NOPs upto 11-bytes in length.
309def FeatureFast11ByteNOP
310 : SubtargetFeature<
311 "fast-11bytenop", "HasFast11ByteNOP", "true",
312 "Target can quickly decode up to 11 byte NOPs">;
313// If the target can efficiently decode NOPs upto 15-bytes in length.
314def FeatureFast15ByteNOP
315 : SubtargetFeature<
316 "fast-15bytenop", "HasFast15ByteNOP", "true",
317 "Target can quickly decode up to 15 byte NOPs">;
Craig Topperd88389a2017-02-21 06:39:13 +0000318// Sandy Bridge and newer processors can use SHLD with the same source on both
319// inputs to implement rotate to avoid the partial flag update of the normal
320// rotate instructions.
321def FeatureFastSHLDRotate
322 : SubtargetFeature<
323 "fast-shld-rotate", "HasFastSHLDRotate", "true",
324 "SHLD can be used as a faster rotate">;
325
Clement Courbet203fc172017-04-21 09:20:50 +0000326// Ivy Bridge and newer processors have enhanced REP MOVSB and STOSB (aka
327// "string operations"). See "REP String Enhancement" in the Intel Software
Clement Courbet41b43332017-04-21 09:21:05 +0000328// Development Manual. This feature essentially means that REP MOVSB will copy
Clement Courbet203fc172017-04-21 09:20:50 +0000329// using the largest available size instead of copying bytes one by one, making
330// it at least as fast as REPMOVS{W,D,Q}.
331def FeatureERMSB
Clement Courbet1ce3b822017-04-21 09:20:39 +0000332 : SubtargetFeature<
Clement Courbet203fc172017-04-21 09:20:50 +0000333 "ermsb", "HasERMSB", "true",
Clement Courbet1ce3b822017-04-21 09:20:39 +0000334 "REP MOVS/STOS are fast">;
335
Craig Topper641e2af2017-08-30 04:34:48 +0000336// Sandy Bridge and newer processors have many instructions that can be
337// fused with conditional branches and pass through the CPU as a single
338// operation.
339def FeatureMacroFusion
340 : SubtargetFeature<"macrofusion", "HasMacroFusion", "true",
341 "Various instructions can be fused with conditional branches">;
342
Craig Topperea37e202017-11-25 18:09:37 +0000343// Gather is available since Haswell (AVX2 set). So technically, we can
344// generate Gathers on all AVX2 processors. But the overhead on HSW is high.
345// Skylake Client processor has faster Gathers than HSW and performance is
346// similar to Skylake Server (AVX-512).
347def FeatureHasFastGather
348 : SubtargetFeature<"fast-gather", "HasFastGather", "true",
349 "Indicates if gather is reasonably fast.">;
350
Craig Topper0d797a32018-01-20 00:26:08 +0000351def FeaturePrefer256Bit
352 : SubtargetFeature<"prefer-256-bit", "Prefer256Bit", "true",
353 "Prefer 256-bit AVX instructions">;
354
Chandler Carruthc58f2162018-01-22 22:05:25 +0000355// Enable mitigation of some aspects of speculative execution related
356// vulnerabilities by removing speculatable indirect branches. This disables
357// jump-table formation, rewrites explicit `indirectbr` instructions into
358// `switch` instructions, and uses a special construct called a "retpoline" to
359// prevent speculation of the remaining indirect branches (indirect calls and
360// tail calls).
361def FeatureRetpoline
362 : SubtargetFeature<"retpoline", "UseRetpoline", "true",
363 "Remove speculation of indirect branches from the "
364 "generated code, either by avoiding them entirely or "
365 "lowering them with a speculation blocking construct.">;
366
367// Rely on external thunks for the emitted retpoline calls. This allows users
368// to provide their own custom thunk definitions in highly specialized
369// environments such as a kernel that does boot-time hot patching.
370def FeatureRetpolineExternalThunk
371 : SubtargetFeature<
372 "retpoline-external-thunk", "UseRetpolineExternalThunk", "true",
373 "Enable retpoline, but with an externally provided thunk.",
374 [FeatureRetpoline]>;
375
Evan Chengff1beda2006-10-06 09:17:41 +0000376//===----------------------------------------------------------------------===//
Craig Topper57c28152017-12-10 17:42:36 +0000377// Register File Description
378//===----------------------------------------------------------------------===//
379
380include "X86RegisterInfo.td"
381include "X86RegisterBanks.td"
382
383//===----------------------------------------------------------------------===//
384// Instruction Descriptions
Evan Chengff1beda2006-10-06 09:17:41 +0000385//===----------------------------------------------------------------------===//
386
Andrew Trick8523b162012-02-01 23:20:51 +0000387include "X86Schedule.td"
Craig Topper57c28152017-12-10 17:42:36 +0000388include "X86InstrInfo.td"
389
390def X86InstrInfo : InstrInfo;
391
392//===----------------------------------------------------------------------===//
393// X86 processors supported.
394//===----------------------------------------------------------------------===//
395
396include "X86ScheduleAtom.td"
397include "X86SchedSandyBridge.td"
398include "X86SchedHaswell.td"
399include "X86SchedBroadwell.td"
400include "X86ScheduleSLM.td"
401include "X86ScheduleZnver1.td"
402include "X86ScheduleBtVer2.td"
403include "X86SchedSkylakeClient.td"
404include "X86SchedSkylakeServer.td"
Andrew Trick8523b162012-02-01 23:20:51 +0000405
406def ProcIntelAtom : SubtargetFeature<"atom", "X86ProcFamily", "IntelAtom",
407 "Intel Atom processors">;
Preston Gurd3fe264d2013-09-13 19:23:28 +0000408def ProcIntelSLM : SubtargetFeature<"slm", "X86ProcFamily", "IntelSLM",
409 "Intel Silvermont processors">;
Michael Zuckerman4bcb9c32017-06-29 10:00:33 +0000410def ProcIntelGLM : SubtargetFeature<"glm", "X86ProcFamily", "IntelGLM",
411 "Intel Goldmont processors">;
Mohammed Agabariae9aebf22017-09-13 09:00:27 +0000412def ProcIntelHSW : SubtargetFeature<"haswell", "X86ProcFamily",
413 "IntelHaswell", "Intel Haswell processors">;
414def ProcIntelBDW : SubtargetFeature<"broadwell", "X86ProcFamily",
415 "IntelBroadwell", "Intel Broadwell processors">;
416def ProcIntelSKL : SubtargetFeature<"skylake", "X86ProcFamily",
417 "IntelSkylake", "Intel Skylake processors">;
418def ProcIntelKNL : SubtargetFeature<"knl", "X86ProcFamily",
419 "IntelKNL", "Intel Knights Landing processors">;
420def ProcIntelSKX : SubtargetFeature<"skx", "X86ProcFamily",
421 "IntelSKX", "Intel Skylake Server processors">;
422def ProcIntelCNL : SubtargetFeature<"cannonlake", "X86ProcFamily",
423 "IntelCannonlake", "Intel Cannonlake processors">;
Gabor Buella213edc42018-04-10 18:59:13 +0000424def ProcIntelICL : SubtargetFeature<"icelake-client", "X86ProcFamily",
425 "IntelIcelakeClient", "Intel Icelake processors">;
426def ProcIntelICX : SubtargetFeature<"icelake-server", "X86ProcFamily",
427 "IntelIcelakeServer", "Intel Icelake Server processors">;
Andrew Trick8523b162012-02-01 23:20:51 +0000428
Evan Chengff1beda2006-10-06 09:17:41 +0000429class Proc<string Name, list<SubtargetFeature> Features>
Andrew Trick87255e32012-07-07 04:00:00 +0000430 : ProcessorModel<Name, GenericModel, Features>;
Andrew Trick8523b162012-02-01 23:20:51 +0000431
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000432def : Proc<"generic", [FeatureX87, FeatureSlowUAMem16]>;
433def : Proc<"i386", [FeatureX87, FeatureSlowUAMem16]>;
434def : Proc<"i486", [FeatureX87, FeatureSlowUAMem16]>;
435def : Proc<"i586", [FeatureX87, FeatureSlowUAMem16]>;
436def : Proc<"pentium", [FeatureX87, FeatureSlowUAMem16]>;
437def : Proc<"pentium-mmx", [FeatureX87, FeatureSlowUAMem16, FeatureMMX]>;
Craig Topper38373222017-11-01 22:15:49 +0000438
Craig Topper505f38a2018-01-10 22:07:16 +0000439def : Proc<"i686", [FeatureX87, FeatureSlowUAMem16, FeatureCMOV]>;
440def : Proc<"pentiumpro", [FeatureX87, FeatureSlowUAMem16, FeatureCMOV,
441 FeatureNOPL]>;
Craig Topper38373222017-11-01 22:15:49 +0000442
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000443def : Proc<"pentium2", [FeatureX87, FeatureSlowUAMem16, FeatureMMX,
Craig Topper505f38a2018-01-10 22:07:16 +0000444 FeatureCMOV, FeatureFXSR, FeatureNOPL]>;
Craig Topper38373222017-11-01 22:15:49 +0000445
446foreach P = ["pentium3", "pentium3m"] in {
447 def : Proc<P, [FeatureX87, FeatureSlowUAMem16, FeatureMMX, FeatureSSE1,
Craig Topper505f38a2018-01-10 22:07:16 +0000448 FeatureFXSR, FeatureNOPL]>;
Craig Topper38373222017-11-01 22:15:49 +0000449}
Mitch Bodarte60465d2016-04-27 22:52:35 +0000450
451// Enable the PostRAScheduler for SSE2 and SSE3 class cpus.
452// The intent is to enable it for pentium4 which is the current default
453// processor in a vanilla 32-bit clang compilation when no specific
454// architecture is specified. This generally gives a nice performance
455// increase on silvermont, with largely neutral behavior on other
456// contemporary large core processors.
457// pentium-m, pentium4m, prescott and nocona are included as a preventative
458// measure to avoid performance surprises, in case clang's default cpu
459// changes slightly.
460
461def : ProcessorModel<"pentium-m", GenericPostRAModel,
462 [FeatureX87, FeatureSlowUAMem16, FeatureMMX,
Craig Topper505f38a2018-01-10 22:07:16 +0000463 FeatureSSE2, FeatureFXSR, FeatureNOPL]>;
Mitch Bodarte60465d2016-04-27 22:52:35 +0000464
Craig Topper38373222017-11-01 22:15:49 +0000465foreach P = ["pentium4", "pentium4m"] in {
466 def : ProcessorModel<P, GenericPostRAModel,
467 [FeatureX87, FeatureSlowUAMem16, FeatureMMX,
Craig Topper505f38a2018-01-10 22:07:16 +0000468 FeatureSSE2, FeatureFXSR, FeatureNOPL]>;
Craig Topper38373222017-11-01 22:15:49 +0000469}
Chandler Carruth32908d72014-05-07 17:37:03 +0000470
Andrey Turetskiy958eb462016-04-01 10:16:15 +0000471// Intel Quark.
472def : Proc<"lakemont", []>;
473
Jakob Stoklund Olesen1ac7e662013-03-26 22:19:12 +0000474// Intel Core Duo.
Craig Topper09b65982015-10-16 06:03:09 +0000475def : ProcessorModel<"yonah", SandyBridgeModel,
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000476 [FeatureX87, FeatureSlowUAMem16, FeatureMMX, FeatureSSE3,
Craig Topper505f38a2018-01-10 22:07:16 +0000477 FeatureFXSR, FeatureNOPL]>;
Jakob Stoklund Olesen1ac7e662013-03-26 22:19:12 +0000478
479// NetBurst.
Mitch Bodarte60465d2016-04-27 22:52:35 +0000480def : ProcessorModel<"prescott", GenericPostRAModel,
481 [FeatureX87, FeatureSlowUAMem16, FeatureMMX, FeatureSSE3,
Craig Topper505f38a2018-01-10 22:07:16 +0000482 FeatureFXSR, FeatureNOPL]>;
Mitch Bodarte60465d2016-04-27 22:52:35 +0000483def : ProcessorModel<"nocona", GenericPostRAModel, [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000484 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000485 FeatureSlowUAMem16,
486 FeatureMMX,
487 FeatureSSE3,
Craig Topper09b65982015-10-16 06:03:09 +0000488 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000489 FeatureNOPL,
Craig Topper27381172017-10-15 16:57:33 +0000490 FeatureCMPXCHG16B
Eric Christopher11e59832015-10-08 20:10:06 +0000491]>;
Jakob Stoklund Olesen1ac7e662013-03-26 22:19:12 +0000492
493// Intel Core 2 Solo/Duo.
Eric Christopher11e59832015-10-08 20:10:06 +0000494def : ProcessorModel<"core2", SandyBridgeModel, [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000495 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000496 FeatureSlowUAMem16,
497 FeatureMMX,
498 FeatureSSSE3,
Craig Topper09b65982015-10-16 06:03:09 +0000499 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000500 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000501 FeatureCMPXCHG16B,
Craig Topper641e2af2017-08-30 04:34:48 +0000502 FeatureLAHFSAHF,
503 FeatureMacroFusion
Eric Christopher11e59832015-10-08 20:10:06 +0000504]>;
505def : ProcessorModel<"penryn", SandyBridgeModel, [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000506 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000507 FeatureSlowUAMem16,
508 FeatureMMX,
509 FeatureSSE41,
Craig Topper09b65982015-10-16 06:03:09 +0000510 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000511 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000512 FeatureCMPXCHG16B,
Craig Topper641e2af2017-08-30 04:34:48 +0000513 FeatureLAHFSAHF,
514 FeatureMacroFusion
Eric Christopher11e59832015-10-08 20:10:06 +0000515]>;
Jakob Stoklund Olesen1ac7e662013-03-26 22:19:12 +0000516
Chandler Carruthaf8924032014-12-09 10:58:36 +0000517// Atom CPUs.
518class BonnellProc<string Name> : ProcessorModel<Name, AtomModel, [
Eric Christopher11e59832015-10-08 20:10:06 +0000519 ProcIntelAtom,
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000520 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000521 FeatureSlowUAMem16,
522 FeatureMMX,
523 FeatureSSSE3,
Craig Topper09b65982015-10-16 06:03:09 +0000524 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000525 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000526 FeatureCMPXCHG16B,
527 FeatureMOVBE,
Sanjay Patel53d1d8b2015-10-12 15:24:01 +0000528 FeatureLEAForSP,
Eric Christopher11e59832015-10-08 20:10:06 +0000529 FeatureSlowDivide32,
530 FeatureSlowDivide64,
Craig Topper62c47a22017-08-29 05:14:27 +0000531 FeatureSlowTwoMemOps,
Eric Christopher11e59832015-10-08 20:10:06 +0000532 FeatureLEAUsesAG,
Hans Wennborg5000ce82015-12-04 23:00:33 +0000533 FeaturePadShortFunctions,
534 FeatureLAHFSAHF
Eric Christopher11e59832015-10-08 20:10:06 +0000535]>;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000536def : BonnellProc<"bonnell">;
537def : BonnellProc<"atom">; // Pin the generic name to the baseline.
Jakob Stoklund Olesen1ac7e662013-03-26 22:19:12 +0000538
Chandler Carruthaf8924032014-12-09 10:58:36 +0000539class SilvermontProc<string Name> : ProcessorModel<Name, SLMModel, [
Eric Christopher11e59832015-10-08 20:10:06 +0000540 ProcIntelSLM,
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000541 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000542 FeatureMMX,
543 FeatureSSE42,
Craig Topper09b65982015-10-16 06:03:09 +0000544 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000545 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000546 FeatureCMPXCHG16B,
547 FeatureMOVBE,
548 FeaturePOPCNT,
549 FeaturePCLMUL,
550 FeatureAES,
551 FeatureSlowDivide64,
Craig Topper62c47a22017-08-29 05:14:27 +0000552 FeatureSlowTwoMemOps,
Eric Christopher11e59832015-10-08 20:10:06 +0000553 FeaturePRFCHW,
554 FeatureSlowLEA,
555 FeatureSlowIncDec,
Zvi Rackover8bc7e4d2016-12-06 19:35:20 +0000556 FeatureSlowPMULLD,
Craig Topperb207dd62018-01-26 19:34:14 +0000557 FeatureRDRAND,
Hans Wennborg5000ce82015-12-04 23:00:33 +0000558 FeatureLAHFSAHF
Eric Christopher11e59832015-10-08 20:10:06 +0000559]>;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000560def : SilvermontProc<"silvermont">;
561def : SilvermontProc<"slm">; // Legacy alias.
562
Michael Zuckerman4bcb9c32017-06-29 10:00:33 +0000563class GoldmontProc<string Name> : ProcessorModel<Name, SLMModel, [
564 ProcIntelGLM,
565 FeatureX87,
566 FeatureMMX,
567 FeatureSSE42,
568 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000569 FeatureNOPL,
Michael Zuckerman4bcb9c32017-06-29 10:00:33 +0000570 FeatureCMPXCHG16B,
571 FeatureMOVBE,
572 FeaturePOPCNT,
573 FeaturePCLMUL,
574 FeatureAES,
575 FeaturePRFCHW,
Craig Topper62c47a22017-08-29 05:14:27 +0000576 FeatureSlowTwoMemOps,
Michael Zuckerman4bcb9c32017-06-29 10:00:33 +0000577 FeatureSlowLEA,
578 FeatureSlowIncDec,
Michael Zuckerman4bcb9c32017-06-29 10:00:33 +0000579 FeatureLAHFSAHF,
580 FeatureMPX,
581 FeatureSHA,
Craig Toppera4c5caf2017-07-04 05:33:19 +0000582 FeatureRDRAND,
Michael Zuckerman4bcb9c32017-06-29 10:00:33 +0000583 FeatureRDSEED,
584 FeatureXSAVE,
585 FeatureXSAVEOPT,
586 FeatureXSAVEC,
587 FeatureXSAVES,
Michael Zuckermanac1d20d2017-09-25 13:45:31 +0000588 FeatureCLFLUSHOPT,
589 FeatureFSGSBase
Michael Zuckerman4bcb9c32017-06-29 10:00:33 +0000590]>;
591def : GoldmontProc<"goldmont">;
592
Eric Christopher2ef63182010-04-02 21:54:27 +0000593// "Arrandale" along with corei3 and corei5
Craig Topper3611d9b2015-03-30 06:31:11 +0000594class NehalemProc<string Name> : ProcessorModel<Name, SandyBridgeModel, [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000595 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000596 FeatureMMX,
597 FeatureSSE42,
Craig Topper09b65982015-10-16 06:03:09 +0000598 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000599 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000600 FeatureCMPXCHG16B,
Hans Wennborg5000ce82015-12-04 23:00:33 +0000601 FeaturePOPCNT,
Craig Topper641e2af2017-08-30 04:34:48 +0000602 FeatureLAHFSAHF,
603 FeatureMacroFusion
Eric Christopher11e59832015-10-08 20:10:06 +0000604]>;
Craig Topper3611d9b2015-03-30 06:31:11 +0000605def : NehalemProc<"nehalem">;
606def : NehalemProc<"corei7">;
Jakob Stoklund Olesen1ac7e662013-03-26 22:19:12 +0000607
Eric Christopher2ef63182010-04-02 21:54:27 +0000608// Westmere is a similar machine to nehalem with some additional features.
609// Westmere is the corei3/i5/i7 path from nehalem to sandybridge
Chandler Carruthaf8924032014-12-09 10:58:36 +0000610class WestmereProc<string Name> : ProcessorModel<Name, SandyBridgeModel, [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000611 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000612 FeatureMMX,
613 FeatureSSE42,
Craig Topper09b65982015-10-16 06:03:09 +0000614 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000615 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000616 FeatureCMPXCHG16B,
Eric Christopher11e59832015-10-08 20:10:06 +0000617 FeaturePOPCNT,
618 FeatureAES,
Hans Wennborg5000ce82015-12-04 23:00:33 +0000619 FeaturePCLMUL,
Craig Topper641e2af2017-08-30 04:34:48 +0000620 FeatureLAHFSAHF,
621 FeatureMacroFusion
Eric Christopher11e59832015-10-08 20:10:06 +0000622]>;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000623def : WestmereProc<"westmere">;
624
Craig Topperf730a6b2016-02-13 21:35:37 +0000625class ProcessorFeatures<list<SubtargetFeature> Inherited,
626 list<SubtargetFeature> NewFeatures> {
627 list<SubtargetFeature> Value = !listconcat(Inherited, NewFeatures);
628}
629
630class ProcModel<string Name, SchedMachineModel Model,
631 list<SubtargetFeature> ProcFeatures,
632 list<SubtargetFeature> OtherFeatures> :
633 ProcessorModel<Name, Model, !listconcat(ProcFeatures, OtherFeatures)>;
634
Nate Begeman8b08f522010-12-10 00:26:57 +0000635// SSE is not listed here since llvm treats AVX as a reimplementation of SSE,
636// rather than a superset.
Craig Topperf730a6b2016-02-13 21:35:37 +0000637def SNBFeatures : ProcessorFeatures<[], [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000638 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000639 FeatureMMX,
640 FeatureAVX,
Craig Topper09b65982015-10-16 06:03:09 +0000641 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000642 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000643 FeatureCMPXCHG16B,
Eric Christopher11e59832015-10-08 20:10:06 +0000644 FeaturePOPCNT,
645 FeatureAES,
Nikolai Bozhenov6bdf92c2017-01-12 19:34:15 +0000646 FeatureSlowDivide64,
Craig Topper0ee35692015-10-14 05:37:38 +0000647 FeaturePCLMUL,
648 FeatureXSAVE,
Hans Wennborg5000ce82015-12-04 23:00:33 +0000649 FeatureXSAVEOPT,
Nikolai Bozhenovf6795302016-08-04 12:47:28 +0000650 FeatureLAHFSAHF,
Lama Saba2ea271b2017-05-18 08:11:50 +0000651 FeatureSlow3OpsLEA,
Craig Topperd88389a2017-02-21 06:39:13 +0000652 FeatureFastScalarFSQRT,
Craig Topper641e2af2017-08-30 04:34:48 +0000653 FeatureFastSHLDRotate,
Craig Topperef1f7162017-08-30 05:00:35 +0000654 FeatureSlowIncDec,
Craig Topper641e2af2017-08-30 04:34:48 +0000655 FeatureMacroFusion
Eric Christopher11e59832015-10-08 20:10:06 +0000656]>;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000657
Craig Topperf730a6b2016-02-13 21:35:37 +0000658class SandyBridgeProc<string Name> : ProcModel<Name, SandyBridgeModel,
659 SNBFeatures.Value, [
Marina Yatsina77a21db2018-01-22 10:07:01 +0000660 FeatureSlowUAMem32,
661 FeaturePOPCNTFalseDeps
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000662]>;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000663def : SandyBridgeProc<"sandybridge">;
664def : SandyBridgeProc<"corei7-avx">; // Legacy alias.
Evan Chengff1beda2006-10-06 09:17:41 +0000665
Craig Topperf730a6b2016-02-13 21:35:37 +0000666def IVBFeatures : ProcessorFeatures<SNBFeatures.Value, [
Eric Christopher11e59832015-10-08 20:10:06 +0000667 FeatureRDRAND,
668 FeatureF16C,
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000669 FeatureFSGSBase
670]>;
671
Craig Topperf730a6b2016-02-13 21:35:37 +0000672class IvyBridgeProc<string Name> : ProcModel<Name, SandyBridgeModel,
673 IVBFeatures.Value, [
Marina Yatsina77a21db2018-01-22 10:07:01 +0000674 FeatureSlowUAMem32,
675 FeaturePOPCNTFalseDeps
Eric Christopher11e59832015-10-08 20:10:06 +0000676]>;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000677def : IvyBridgeProc<"ivybridge">;
678def : IvyBridgeProc<"core-avx-i">; // Legacy alias.
Craig Topper3657fe42011-10-14 03:21:46 +0000679
Craig Topperf730a6b2016-02-13 21:35:37 +0000680def HSWFeatures : ProcessorFeatures<IVBFeatures.Value, [
Eric Christopher11e59832015-10-08 20:10:06 +0000681 FeatureAVX2,
Eric Christopher11e59832015-10-08 20:10:06 +0000682 FeatureBMI,
683 FeatureBMI2,
Clement Courbet203fc172017-04-21 09:20:50 +0000684 FeatureERMSB,
Eric Christopher11e59832015-10-08 20:10:06 +0000685 FeatureFMA,
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000686 FeatureLZCNT,
Simon Pilgrimfd5df632017-12-19 13:16:43 +0000687 FeatureMOVBE,
688 FeatureFastVariableShuffle
Eric Christopher11e59832015-10-08 20:10:06 +0000689]>;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000690
Craig Topperf730a6b2016-02-13 21:35:37 +0000691class HaswellProc<string Name> : ProcModel<Name, HaswellModel,
Mohammed Agabariae9aebf22017-09-13 09:00:27 +0000692 HSWFeatures.Value, [
Marina Yatsina77a21db2018-01-22 10:07:01 +0000693 ProcIntelHSW,
694 FeaturePOPCNTFalseDeps,
695 FeatureLZCNTFalseDeps
Craig Topper54541c42017-10-13 16:04:08 +0000696]>;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000697def : HaswellProc<"haswell">;
698def : HaswellProc<"core-avx2">; // Legacy alias.
699
Craig Topperf730a6b2016-02-13 21:35:37 +0000700def BDWFeatures : ProcessorFeatures<HSWFeatures.Value, [
Eric Christopher11e59832015-10-08 20:10:06 +0000701 FeatureADX,
Craig Topper67885f52017-12-22 02:41:12 +0000702 FeatureRDSEED,
703 FeaturePRFCHW
Eric Christopher11e59832015-10-08 20:10:06 +0000704]>;
Gadi Haber323f2e12017-10-24 20:19:47 +0000705class BroadwellProc<string Name> : ProcModel<Name, BroadwellModel,
Craig Topper54541c42017-10-13 16:04:08 +0000706 BDWFeatures.Value, [
Marina Yatsina77a21db2018-01-22 10:07:01 +0000707 ProcIntelBDW,
708 FeaturePOPCNTFalseDeps,
709 FeatureLZCNTFalseDeps
Craig Topper54541c42017-10-13 16:04:08 +0000710]>;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000711def : BroadwellProc<"broadwell">;
712
Craig Topperf730a6b2016-02-13 21:35:37 +0000713def SKLFeatures : ProcessorFeatures<BDWFeatures.Value, [
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000714 FeatureMPX,
Eric Christopher58297412017-03-29 07:40:44 +0000715 FeatureRTM,
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000716 FeatureXSAVEC,
717 FeatureXSAVES,
Nikolai Bozhenovf6795302016-08-04 12:47:28 +0000718 FeatureCLFLUSHOPT,
719 FeatureFastVectorFSQRT
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000720]>;
721
Gadi Haber6f8fbf42017-09-19 06:19:27 +0000722class SkylakeClientProc<string Name> : ProcModel<Name, SkylakeClientModel,
Mohammed Agabariae9aebf22017-09-13 09:00:27 +0000723 SKLFeatures.Value, [
Craig Topperea37e202017-11-25 18:09:37 +0000724 ProcIntelSKL,
Marina Yatsina77a21db2018-01-22 10:07:01 +0000725 FeatureHasFastGather,
Gabor Buella3eab22d2018-04-10 13:58:57 +0000726 FeaturePOPCNTFalseDeps,
727 FeatureSGX
Craig Topper5805fb32017-10-13 16:06:06 +0000728]>;
Sanjoy Dasaa63dc02016-02-21 17:12:03 +0000729def : SkylakeClientProc<"skylake">;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000730
Craig Topper5d692912017-10-13 18:10:17 +0000731def KNLFeatures : ProcessorFeatures<IVBFeatures.Value, [
Eric Christopher11e59832015-10-08 20:10:06 +0000732 FeatureAVX512,
733 FeatureERI,
734 FeatureCDI,
735 FeaturePFI,
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000736 FeaturePREFETCHWT1,
737 FeatureADX,
738 FeatureRDSEED,
Eric Christopher11e59832015-10-08 20:10:06 +0000739 FeatureMOVBE,
740 FeatureLZCNT,
741 FeatureBMI,
742 FeatureBMI2,
Craig Topper67885f52017-12-22 02:41:12 +0000743 FeatureFMA,
744 FeaturePRFCHW
Craig Topper5d692912017-10-13 18:10:17 +0000745]>;
746
747// FIXME: define KNL model
748class KnightsLandingProc<string Name> : ProcModel<Name, HaswellModel,
749 KNLFeatures.Value, [
750 ProcIntelKNL,
Craig Topper62c47a22017-08-29 05:14:27 +0000751 FeatureSlowTwoMemOps,
Craig Topperea37e202017-11-25 18:09:37 +0000752 FeatureFastPartialYMMorZMMWrite,
753 FeatureHasFastGather
Eric Christopher11e59832015-10-08 20:10:06 +0000754]>;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000755def : KnightsLandingProc<"knl">;
Elena Demikhovsky8cfb43f2013-07-24 11:02:47 +0000756
Craig Topper5d692912017-10-13 18:10:17 +0000757class KnightsMillProc<string Name> : ProcModel<Name, HaswellModel,
758 KNLFeatures.Value, [
759 ProcIntelKNL,
760 FeatureSlowTwoMemOps,
Craig Topper6fae2ee2017-10-25 17:10:32 +0000761 FeatureFastPartialYMMorZMMWrite,
Craig Topperea37e202017-11-25 18:09:37 +0000762 FeatureHasFastGather,
Craig Topper6fae2ee2017-10-25 17:10:32 +0000763 FeatureVPOPCNTDQ
Craig Topper5d692912017-10-13 18:10:17 +0000764]>;
765def : KnightsMillProc<"knm">; // TODO Add AVX5124FMAPS/AVX5124VNNIW features
766
Craig Topperf730a6b2016-02-13 21:35:37 +0000767def SKXFeatures : ProcessorFeatures<SKLFeatures.Value, [
Eric Christopher11e59832015-10-08 20:10:06 +0000768 FeatureAVX512,
769 FeatureCDI,
770 FeatureDQI,
771 FeatureBWI,
772 FeatureVLX,
Asaf Badouh5acf66f2015-12-15 13:35:29 +0000773 FeaturePKU,
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000774 FeatureCLWB
Eric Christopher11e59832015-10-08 20:10:06 +0000775]>;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000776
Gadi Haber684944b2017-10-08 12:52:54 +0000777class SkylakeServerProc<string Name> : ProcModel<Name, SkylakeServerModel,
Mohammed Agabariae9aebf22017-09-13 09:00:27 +0000778 SKXFeatures.Value, [
Craig Topperea37e202017-11-25 18:09:37 +0000779 ProcIntelSKX,
Craig Toppera8f87a32018-01-29 21:56:48 +0000780 FeatureHasFastGather,
781 FeaturePOPCNTFalseDeps
Craig Toppera1f9c9dd2017-10-15 16:41:15 +0000782]>;
Sanjoy Dasaa63dc02016-02-21 17:12:03 +0000783def : SkylakeServerProc<"skylake-avx512">;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000784def : SkylakeServerProc<"skx">; // Legacy alias.
785
Craig Topperd710ada2018-02-21 00:15:48 +0000786def CNLFeatures : ProcessorFeatures<SKLFeatures.Value, [
787 FeatureAVX512,
788 FeatureCDI,
789 FeatureDQI,
790 FeatureBWI,
791 FeatureVLX,
792 FeaturePKU,
Elena Demikhovsky9242ea82016-01-18 13:00:31 +0000793 FeatureVBMI,
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000794 FeatureIFMA,
Gabor Buella3eab22d2018-04-10 13:58:57 +0000795 FeatureSHA,
796 FeatureSGX
Elena Demikhovsky9242ea82016-01-18 13:00:31 +0000797]>;
Elena Demikhovsky29cde352016-01-24 10:41:28 +0000798
Craig Topper9a94dfc2017-11-19 01:25:30 +0000799class CannonlakeProc<string Name> : ProcModel<Name, SkylakeServerModel,
Mohammed Agabariae9aebf22017-09-13 09:00:27 +0000800 CNLFeatures.Value, [
Craig Topperea37e202017-11-25 18:09:37 +0000801 ProcIntelCNL,
802 FeatureHasFastGather
Craig Topper5805fb32017-10-13 16:06:06 +0000803]>;
Elena Demikhovsky9242ea82016-01-18 13:00:31 +0000804def : CannonlakeProc<"cannonlake">;
Chandler Carruthaf8924032014-12-09 10:58:36 +0000805
Craig Topper81037f32017-11-19 01:12:00 +0000806def ICLFeatures : ProcessorFeatures<CNLFeatures.Value, [
Craig Toppera8905702017-11-21 21:05:18 +0000807 FeatureBITALG,
808 FeatureVAES,
809 FeatureVBMI2,
810 FeatureVNNI,
811 FeatureVPCLMULQDQ,
Coby Tayreed8b17be2017-11-26 09:36:41 +0000812 FeatureVPOPCNTDQ,
Craig Topper55cfa892017-12-27 22:04:04 +0000813 FeatureGFNI,
Craig Topper84b26b92018-01-18 23:52:31 +0000814 FeatureCLWB,
815 FeatureRDPID
Craig Topper81037f32017-11-19 01:12:00 +0000816]>;
817
Gabor Buella213edc42018-04-10 18:59:13 +0000818class IcelakeClientProc<string Name> : ProcModel<Name, SkylakeServerModel,
819 ICLFeatures.Value, [
Craig Topperea37e202017-11-25 18:09:37 +0000820 ProcIntelICL,
821 FeatureHasFastGather
Craig Topper81037f32017-11-19 01:12:00 +0000822]>;
Gabor Buella213edc42018-04-10 18:59:13 +0000823def : IcelakeClientProc<"icelake-client">;
824
825class IcelakeServerProc<string Name> : ProcModel<Name, SkylakeServerModel,
826 ICLFeatures.Value, [
827 ProcIntelICX,
828 FeatureHasFastGather
829]>;
830def : IcelakeServerProc<"icelake-server">;
Craig Topper81037f32017-11-19 01:12:00 +0000831
Chandler Carruthaf8924032014-12-09 10:58:36 +0000832// AMD CPUs.
Robert Khasanovbfa01312014-07-21 14:54:21 +0000833
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000834def : Proc<"k6", [FeatureX87, FeatureSlowUAMem16, FeatureMMX]>;
835def : Proc<"k6-2", [FeatureX87, FeatureSlowUAMem16, Feature3DNow]>;
836def : Proc<"k6-3", [FeatureX87, FeatureSlowUAMem16, Feature3DNow]>;
Craig Topper38373222017-11-01 22:15:49 +0000837
838foreach P = ["athlon", "athlon-tbird"] in {
Craig Topper505f38a2018-01-10 22:07:16 +0000839 def : Proc<P, [FeatureX87, FeatureSlowUAMem16, Feature3DNowA,
840 FeatureNOPL, FeatureSlowSHLD]>;
Craig Topper38373222017-11-01 22:15:49 +0000841}
842
843foreach P = ["athlon-4", "athlon-xp", "athlon-mp"] in {
844 def : Proc<P, [FeatureX87, FeatureSlowUAMem16, FeatureSSE1,
Craig Topper505f38a2018-01-10 22:07:16 +0000845 Feature3DNowA, FeatureFXSR, FeatureNOPL, FeatureSlowSHLD]>;
Craig Topper38373222017-11-01 22:15:49 +0000846}
847
848foreach P = ["k8", "opteron", "athlon64", "athlon-fx"] in {
849 def : Proc<P, [FeatureX87, FeatureSlowUAMem16, FeatureSSE2, Feature3DNowA,
Craig Topper505f38a2018-01-10 22:07:16 +0000850 FeatureFXSR, FeatureNOPL, Feature64Bit, FeatureSlowSHLD]>;
Craig Topper38373222017-11-01 22:15:49 +0000851}
852
853foreach P = ["k8-sse3", "opteron-sse3", "athlon64-sse3"] in {
854 def : Proc<P, [FeatureX87, FeatureSlowUAMem16, FeatureSSE3, Feature3DNowA,
Craig Topper505f38a2018-01-10 22:07:16 +0000855 FeatureFXSR, FeatureNOPL, FeatureCMPXCHG16B, FeatureSlowSHLD]>;
Craig Topper38373222017-11-01 22:15:49 +0000856}
857
858foreach P = ["amdfam10", "barcelona"] in {
859 def : Proc<P, [FeatureX87, FeatureSSE4A, Feature3DNowA, FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000860 FeatureNOPL, FeatureCMPXCHG16B, FeatureLZCNT, FeaturePOPCNT,
Craig Topper38373222017-11-01 22:15:49 +0000861 FeatureSlowSHLD, FeatureLAHFSAHF]>;
862}
Sanjay Patel9e916dc2015-08-21 20:17:26 +0000863
Benjamin Kramer077ae1d2012-01-10 11:50:02 +0000864// Bobcat
Eric Christopher11e59832015-10-08 20:10:06 +0000865def : Proc<"btver1", [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000866 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000867 FeatureMMX,
868 FeatureSSSE3,
869 FeatureSSE4A,
Craig Topper09b65982015-10-16 06:03:09 +0000870 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000871 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000872 FeatureCMPXCHG16B,
873 FeaturePRFCHW,
874 FeatureLZCNT,
875 FeaturePOPCNT,
Hans Wennborg5000ce82015-12-04 23:00:33 +0000876 FeatureSlowSHLD,
Simon Pilgrim02bdac52018-01-29 21:24:31 +0000877 FeatureLAHFSAHF,
878 FeatureFast15ByteNOP
Eric Christopher11e59832015-10-08 20:10:06 +0000879]>;
Sanjay Patel1191adf2014-09-09 20:07:07 +0000880
Benjamin Kramerb44c4272013-05-03 10:20:08 +0000881// Jaguar
Eric Christopher11e59832015-10-08 20:10:06 +0000882def : ProcessorModel<"btver2", BtVer2Model, [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000883 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000884 FeatureMMX,
885 FeatureAVX,
Craig Topper09b65982015-10-16 06:03:09 +0000886 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000887 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000888 FeatureSSE4A,
889 FeatureCMPXCHG16B,
890 FeaturePRFCHW,
891 FeatureAES,
892 FeaturePCLMUL,
893 FeatureBMI,
894 FeatureF16C,
895 FeatureMOVBE,
896 FeatureLZCNT,
Pierre Gousseaub6d652a2016-10-14 16:41:38 +0000897 FeatureFastLZCNT,
Eric Christopher11e59832015-10-08 20:10:06 +0000898 FeaturePOPCNT,
Craig Topper0ee35692015-10-14 05:37:38 +0000899 FeatureXSAVE,
900 FeatureXSAVEOPT,
Hans Wennborg5000ce82015-12-04 23:00:33 +0000901 FeatureSlowSHLD,
Yunzhong Gao0de36ec2016-02-12 23:37:57 +0000902 FeatureLAHFSAHF,
Simon Pilgrim02bdac52018-01-29 21:24:31 +0000903 FeatureFast15ByteNOP,
Amjad Aboud4f977512017-03-03 09:03:24 +0000904 FeatureFastPartialYMMorZMMWrite
Eric Christopher11e59832015-10-08 20:10:06 +0000905]>;
Sanjay Patele57f3c02014-11-28 18:40:18 +0000906
Benjamin Kramer077ae1d2012-01-10 11:50:02 +0000907// Bulldozer
Eric Christopher11e59832015-10-08 20:10:06 +0000908def : Proc<"bdver1", [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000909 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000910 FeatureXOP,
911 FeatureFMA4,
912 FeatureCMPXCHG16B,
913 FeatureAES,
914 FeaturePRFCHW,
915 FeaturePCLMUL,
916 FeatureMMX,
917 FeatureAVX,
Craig Topper09b65982015-10-16 06:03:09 +0000918 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000919 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000920 FeatureSSE4A,
921 FeatureLZCNT,
922 FeaturePOPCNT,
Craig Topper0ee35692015-10-14 05:37:38 +0000923 FeatureXSAVE,
Simon Pilgrim99b925b2017-05-03 15:51:39 +0000924 FeatureLWP,
Hans Wennborg5000ce82015-12-04 23:00:33 +0000925 FeatureSlowSHLD,
Craig Topper641e2af2017-08-30 04:34:48 +0000926 FeatureLAHFSAHF,
Simon Pilgrim02bdac52018-01-29 21:24:31 +0000927 FeatureFast11ByteNOP,
Craig Topper641e2af2017-08-30 04:34:48 +0000928 FeatureMacroFusion
Eric Christopher11e59832015-10-08 20:10:06 +0000929]>;
Benjamin Kramerb44c4272013-05-03 10:20:08 +0000930// Piledriver
Eric Christopher11e59832015-10-08 20:10:06 +0000931def : Proc<"bdver2", [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000932 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000933 FeatureXOP,
934 FeatureFMA4,
935 FeatureCMPXCHG16B,
936 FeatureAES,
937 FeaturePRFCHW,
938 FeaturePCLMUL,
939 FeatureMMX,
940 FeatureAVX,
Craig Topper09b65982015-10-16 06:03:09 +0000941 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000942 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000943 FeatureSSE4A,
944 FeatureF16C,
945 FeatureLZCNT,
946 FeaturePOPCNT,
Craig Topper0ee35692015-10-14 05:37:38 +0000947 FeatureXSAVE,
Eric Christopher11e59832015-10-08 20:10:06 +0000948 FeatureBMI,
949 FeatureTBM,
Simon Pilgrim99b925b2017-05-03 15:51:39 +0000950 FeatureLWP,
Eric Christopher11e59832015-10-08 20:10:06 +0000951 FeatureFMA,
Hans Wennborg5000ce82015-12-04 23:00:33 +0000952 FeatureSlowSHLD,
Craig Topper641e2af2017-08-30 04:34:48 +0000953 FeatureLAHFSAHF,
Simon Pilgrim02bdac52018-01-29 21:24:31 +0000954 FeatureFast11ByteNOP,
Craig Topper641e2af2017-08-30 04:34:48 +0000955 FeatureMacroFusion
Eric Christopher11e59832015-10-08 20:10:06 +0000956]>;
Benjamin Kramerd114def2013-11-04 10:29:20 +0000957
958// Steamroller
Eric Christopher11e59832015-10-08 20:10:06 +0000959def : Proc<"bdver3", [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000960 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000961 FeatureXOP,
962 FeatureFMA4,
963 FeatureCMPXCHG16B,
964 FeatureAES,
965 FeaturePRFCHW,
966 FeaturePCLMUL,
967 FeatureMMX,
968 FeatureAVX,
Craig Topper09b65982015-10-16 06:03:09 +0000969 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000970 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000971 FeatureSSE4A,
972 FeatureF16C,
973 FeatureLZCNT,
974 FeaturePOPCNT,
Craig Topper0ee35692015-10-14 05:37:38 +0000975 FeatureXSAVE,
Eric Christopher11e59832015-10-08 20:10:06 +0000976 FeatureBMI,
977 FeatureTBM,
Simon Pilgrim99b925b2017-05-03 15:51:39 +0000978 FeatureLWP,
Eric Christopher11e59832015-10-08 20:10:06 +0000979 FeatureFMA,
Craig Topper0ee35692015-10-14 05:37:38 +0000980 FeatureXSAVEOPT,
Eric Christopher11e59832015-10-08 20:10:06 +0000981 FeatureSlowSHLD,
Hans Wennborg5000ce82015-12-04 23:00:33 +0000982 FeatureFSGSBase,
Craig Topper641e2af2017-08-30 04:34:48 +0000983 FeatureLAHFSAHF,
Simon Pilgrim02bdac52018-01-29 21:24:31 +0000984 FeatureFast11ByteNOP,
Craig Topper641e2af2017-08-30 04:34:48 +0000985 FeatureMacroFusion
Eric Christopher11e59832015-10-08 20:10:06 +0000986]>;
Benjamin Kramerd114def2013-11-04 10:29:20 +0000987
Benjamin Kramer60045732014-05-02 15:47:07 +0000988// Excavator
Eric Christopher11e59832015-10-08 20:10:06 +0000989def : Proc<"bdver4", [
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +0000990 FeatureX87,
Eric Christopher11e59832015-10-08 20:10:06 +0000991 FeatureMMX,
992 FeatureAVX2,
Craig Topper09b65982015-10-16 06:03:09 +0000993 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +0000994 FeatureNOPL,
Eric Christopher11e59832015-10-08 20:10:06 +0000995 FeatureXOP,
996 FeatureFMA4,
997 FeatureCMPXCHG16B,
998 FeatureAES,
999 FeaturePRFCHW,
1000 FeaturePCLMUL,
1001 FeatureF16C,
1002 FeatureLZCNT,
1003 FeaturePOPCNT,
Craig Topper0ee35692015-10-14 05:37:38 +00001004 FeatureXSAVE,
Eric Christopher11e59832015-10-08 20:10:06 +00001005 FeatureBMI,
1006 FeatureBMI2,
1007 FeatureTBM,
Simon Pilgrim99b925b2017-05-03 15:51:39 +00001008 FeatureLWP,
Eric Christopher11e59832015-10-08 20:10:06 +00001009 FeatureFMA,
Craig Topper0ee35692015-10-14 05:37:38 +00001010 FeatureXSAVEOPT,
Simon Pilgrim381a0ad2016-07-24 16:00:53 +00001011 FeatureSlowSHLD,
Hans Wennborg5000ce82015-12-04 23:00:33 +00001012 FeatureFSGSBase,
Ashutosh Nema348af9c2016-05-18 11:59:12 +00001013 FeatureLAHFSAHF,
Simon Pilgrim02bdac52018-01-29 21:24:31 +00001014 FeatureFast11ByteNOP,
Craig Topper641e2af2017-08-30 04:34:48 +00001015 FeatureMWAITX,
1016 FeatureMacroFusion
Eric Christopher11e59832015-10-08 20:10:06 +00001017]>;
Benjamin Kramer60045732014-05-02 15:47:07 +00001018
Craig Topper106b5b62017-07-19 02:45:14 +00001019// Znver1
1020def: ProcessorModel<"znver1", Znver1Model, [
Craig Topperd55b8312017-01-10 06:01:16 +00001021 FeatureADX,
1022 FeatureAES,
1023 FeatureAVX2,
1024 FeatureBMI,
1025 FeatureBMI2,
1026 FeatureCLFLUSHOPT,
Craig Topper50f3d142017-02-09 04:27:34 +00001027 FeatureCLZERO,
Craig Topperd55b8312017-01-10 06:01:16 +00001028 FeatureCMPXCHG16B,
1029 FeatureF16C,
1030 FeatureFMA,
1031 FeatureFSGSBase,
1032 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +00001033 FeatureNOPL,
Craig Topperd55b8312017-01-10 06:01:16 +00001034 FeatureFastLZCNT,
1035 FeatureLAHFSAHF,
1036 FeatureLZCNT,
Simon Pilgrim02bdac52018-01-29 21:24:31 +00001037 FeatureFast15ByteNOP,
Craig Topper641e2af2017-08-30 04:34:48 +00001038 FeatureMacroFusion,
Craig Topperd55b8312017-01-10 06:01:16 +00001039 FeatureMMX,
1040 FeatureMOVBE,
1041 FeatureMWAITX,
1042 FeaturePCLMUL,
1043 FeaturePOPCNT,
1044 FeaturePRFCHW,
1045 FeatureRDRAND,
1046 FeatureRDSEED,
1047 FeatureSHA,
Craig Topperd55b8312017-01-10 06:01:16 +00001048 FeatureSSE4A,
1049 FeatureSlowSHLD,
1050 FeatureX87,
1051 FeatureXSAVE,
1052 FeatureXSAVEC,
1053 FeatureXSAVEOPT,
1054 FeatureXSAVES]>;
1055
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +00001056def : Proc<"geode", [FeatureX87, FeatureSlowUAMem16, Feature3DNowA]>;
Evan Chengff1beda2006-10-06 09:17:41 +00001057
Andrey Turetskiy6a3d5612016-03-23 11:13:54 +00001058def : Proc<"winchip-c6", [FeatureX87, FeatureSlowUAMem16, FeatureMMX]>;
1059def : Proc<"winchip2", [FeatureX87, FeatureSlowUAMem16, Feature3DNow]>;
1060def : Proc<"c3", [FeatureX87, FeatureSlowUAMem16, Feature3DNow]>;
1061def : Proc<"c3-2", [FeatureX87, FeatureSlowUAMem16, FeatureMMX,
1062 FeatureSSE1, FeatureFXSR]>;
Evan Chengff1beda2006-10-06 09:17:41 +00001063
Chandler Carruth32908d72014-05-07 17:37:03 +00001064// We also provide a generic 64-bit specific x86 processor model which tries to
1065// be good for modern chips without enabling instruction set encodings past the
1066// basic SSE2 and 64-bit ones. It disables slow things from any mainstream and
1067// modern 64-bit x86 chip, and enables features that are generally beneficial.
Michael Liao5bf95782014-12-04 05:20:33 +00001068//
Chandler Carruth32908d72014-05-07 17:37:03 +00001069// We currently use the Sandy Bridge model as the default scheduling model as
1070// we use it across Nehalem, Westmere, Sandy Bridge, and Ivy Bridge which
1071// covers a huge swath of x86 processors. If there are specific scheduling
1072// knobs which need to be tuned differently for AMD chips, we might consider
1073// forming a common base for them.
Chandler Carruth98c51cb2017-08-21 08:45:22 +00001074def : ProcessorModel<"x86-64", SandyBridgeModel, [
1075 FeatureX87,
1076 FeatureMMX,
1077 FeatureSSE2,
1078 FeatureFXSR,
Craig Topper505f38a2018-01-10 22:07:16 +00001079 FeatureNOPL,
Chandler Carruth98c51cb2017-08-21 08:45:22 +00001080 Feature64Bit,
1081 FeatureSlow3OpsLEA,
Craig Topper641e2af2017-08-30 04:34:48 +00001082 FeatureSlowIncDec,
1083 FeatureMacroFusion
Chandler Carruth98c51cb2017-08-21 08:45:22 +00001084]>;
Chandler Carruth32908d72014-05-07 17:37:03 +00001085
Evan Chengff1beda2006-10-06 09:17:41 +00001086//===----------------------------------------------------------------------===//
Chris Lattner5d00a0b2007-02-26 18:17:14 +00001087// Calling Conventions
1088//===----------------------------------------------------------------------===//
1089
1090include "X86CallingConv.td"
1091
1092
1093//===----------------------------------------------------------------------===//
Jim Grosbach4cf25f52010-10-30 13:48:28 +00001094// Assembly Parser
Chris Lattner5d00a0b2007-02-26 18:17:14 +00001095//===----------------------------------------------------------------------===//
1096
Devang Patel85d684a2012-01-09 19:13:28 +00001097def ATTAsmParserVariant : AsmParserVariant {
Daniel Dunbar00331992009-07-29 00:02:19 +00001098 int Variant = 0;
Daniel Dunbare4318712009-08-11 20:59:47 +00001099
Chad Rosier9f7a2212013-04-18 22:35:36 +00001100 // Variant name.
1101 string Name = "att";
1102
Daniel Dunbare4318712009-08-11 20:59:47 +00001103 // Discard comments in assembly strings.
1104 string CommentDelimiter = "#";
1105
1106 // Recognize hard coded registers.
1107 string RegisterPrefix = "%";
Daniel Dunbar00331992009-07-29 00:02:19 +00001108}
1109
Devang Patel67bf992a2012-01-10 17:51:54 +00001110def IntelAsmParserVariant : AsmParserVariant {
1111 int Variant = 1;
1112
Chad Rosier9f7a2212013-04-18 22:35:36 +00001113 // Variant name.
1114 string Name = "intel";
1115
Devang Patel67bf992a2012-01-10 17:51:54 +00001116 // Discard comments in assembly strings.
1117 string CommentDelimiter = ";";
1118
1119 // Recognize hard coded registers.
1120 string RegisterPrefix = "";
1121}
1122
Jim Grosbach4cf25f52010-10-30 13:48:28 +00001123//===----------------------------------------------------------------------===//
1124// Assembly Printers
1125//===----------------------------------------------------------------------===//
1126
Chris Lattner56832602004-10-03 20:36:57 +00001127// The X86 target supports two different syntaxes for emitting machine code.
1128// This is controlled by the -x86-asm-syntax={att|intel}
1129def ATTAsmWriter : AsmWriter {
Chris Lattner1cbd3de2009-09-13 19:30:11 +00001130 string AsmWriterClassName = "ATTInstPrinter";
Chris Lattner56832602004-10-03 20:36:57 +00001131 int Variant = 0;
1132}
1133def IntelAsmWriter : AsmWriter {
Chris Lattner13306a12009-09-20 07:47:59 +00001134 string AsmWriterClassName = "IntelInstPrinter";
Chris Lattner56832602004-10-03 20:36:57 +00001135 int Variant = 1;
1136}
1137
Chris Lattnera8c3cff2003-08-03 18:19:37 +00001138def X86 : Target {
Chris Lattnera8c3cff2003-08-03 18:19:37 +00001139 // Information about the instructions...
Chris Lattner25510802003-08-04 04:59:56 +00001140 let InstructionSet = X86InstrInfo;
Devang Patel67bf992a2012-01-10 17:51:54 +00001141 let AssemblyParserVariants = [ATTAsmParserVariant, IntelAsmParserVariant];
Chris Lattner56832602004-10-03 20:36:57 +00001142 let AssemblyWriters = [ATTAsmWriter, IntelAsmWriter];
Geoff Berryf8bf2ec2018-02-23 18:25:08 +00001143 let AllowRegisterRenaming = 1;
Chris Lattnera8c3cff2003-08-03 18:19:37 +00001144}
Clement Courbetb4493792018-04-10 08:16:37 +00001145
1146//===----------------------------------------------------------------------===//
1147// Pfm Counters
1148//===----------------------------------------------------------------------===//
1149
1150include "X86PfmCounters.td"