blob: 22c671940737554c30d310accc29116f498230bd [file] [log] [blame]
Simon Pilgrima271c542017-05-03 15:42:29 +00001//===-- X86Schedule.td - X86 Scheduling Definitions --------*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
Simon Pilgrim963bf4d2018-04-13 14:24:06 +000010//===----------------------------------------------------------------------===//
Simon Pilgrima271c542017-05-03 15:42:29 +000011// InstrSchedModel annotations for out-of-order CPUs.
Simon Pilgrima271c542017-05-03 15:42:29 +000012
13// Instructions with folded loads need to read the memory operand immediately,
14// but other register operands don't have to be read until the load is ready.
15// These operands are marked with ReadAfterLd.
16def ReadAfterLd : SchedRead;
17
18// Instructions with both a load and a store folded are modeled as a folded
19// load + WriteRMW.
20def WriteRMW : SchedWrite;
21
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +000022// Helper to set SchedWrite ExePorts/Latency/ResourceCycles/NumMicroOps.
23multiclass X86WriteRes<SchedWrite SchedRW,
24 list<ProcResourceKind> ExePorts,
25 int Lat, list<int> Res, int UOps> {
26 def : WriteRes<SchedRW, ExePorts> {
27 let Latency = Lat;
28 let ResourceCycles = Res;
29 let NumMicroOps = UOps;
30 }
31}
32
Simon Pilgrima271c542017-05-03 15:42:29 +000033// Most instructions can fold loads, so almost every SchedWrite comes in two
34// variants: With and without a folded load.
35// An X86FoldableSchedWrite holds a reference to the corresponding SchedWrite
36// with a folded load.
37class X86FoldableSchedWrite : SchedWrite {
38 // The SchedWrite to use when a load is folded into the instruction.
39 SchedWrite Folded;
40}
41
42// Multiclass that produces a linked pair of SchedWrites.
43multiclass X86SchedWritePair {
44 // Register-Memory operation.
45 def Ld : SchedWrite;
46 // Register-Register operation.
47 def NAME : X86FoldableSchedWrite {
48 let Folded = !cast<SchedWrite>(NAME#"Ld");
49 }
50}
51
Simon Pilgrim3c354082018-04-30 18:18:38 +000052// Multiclass that wraps X86FoldableSchedWrite for each vector width.
53class X86SchedWriteWidths<X86FoldableSchedWrite sScl,
54 X86FoldableSchedWrite s128,
55 X86FoldableSchedWrite s256,
56 X86FoldableSchedWrite s512> {
57 X86FoldableSchedWrite Scl = sScl; // Scalar float/double operations.
58 X86FoldableSchedWrite MMX = sScl; // MMX operations.
59 X86FoldableSchedWrite XMM = s128; // XMM operations.
60 X86FoldableSchedWrite YMM = s256; // YMM operations.
61 X86FoldableSchedWrite ZMM = s512; // ZMM operations.
62}
63
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +000064// Multiclass that wraps X86SchedWriteWidths for each fp vector type.
65class X86SchedWriteSizes<X86SchedWriteWidths sPS,
66 X86SchedWriteWidths sPD> {
67 X86SchedWriteWidths PS = sPS;
68 X86SchedWriteWidths PD = sPD;
69}
70
Craig Topperb7baa352018-04-08 17:53:18 +000071// Loads, stores, and moves, not folded with other operations.
72def WriteLoad : SchedWrite;
73def WriteStore : SchedWrite;
74def WriteMove : SchedWrite;
75
Simon Pilgrima271c542017-05-03 15:42:29 +000076// Arithmetic.
77defm WriteALU : X86SchedWritePair; // Simple integer ALU op.
Craig Topperb7baa352018-04-08 17:53:18 +000078def WriteALURMW : WriteSequence<[WriteALULd, WriteStore]>;
Simon Pilgrima271c542017-05-03 15:42:29 +000079defm WriteIMul : X86SchedWritePair; // Integer multiplication.
80def WriteIMulH : SchedWrite; // Integer multiplication, high part.
81defm WriteIDiv : X86SchedWritePair; // Integer division.
82def WriteLEA : SchedWrite; // LEA instructions can't fold loads.
83
Simon Pilgrimf33d9052018-03-26 18:19:28 +000084defm WriteBitScan : X86SchedWritePair; // Bit scan forward/reverse.
85defm WritePOPCNT : X86SchedWritePair; // Bit population count.
86defm WriteLZCNT : X86SchedWritePair; // Leading zero count.
87defm WriteTZCNT : X86SchedWritePair; // Trailing zero count.
Craig Topperb7baa352018-04-08 17:53:18 +000088defm WriteCMOV : X86SchedWritePair; // Conditional move.
89def WriteSETCC : SchedWrite; // Set register based on condition code.
90def WriteSETCCStore : SchedWrite;
Simon Pilgrimf33d9052018-03-26 18:19:28 +000091
Simon Pilgrima271c542017-05-03 15:42:29 +000092// Integer shifts and rotates.
93defm WriteShift : X86SchedWritePair;
94
Craig Topper89310f52018-03-29 20:41:39 +000095// BMI1 BEXTR, BMI2 BZHI
96defm WriteBEXTR : X86SchedWritePair;
97defm WriteBZHI : X86SchedWritePair;
98
Simon Pilgrima271c542017-05-03 15:42:29 +000099// Idioms that clear a register, like xorps %xmm0, %xmm0.
100// These can often bypass execution ports completely.
101def WriteZero : SchedWrite;
102
103// Branches don't produce values, so they have no latency, but they still
104// consume resources. Indirect branches can fold loads.
105defm WriteJump : X86SchedWritePair;
106
107// Floating point. This covers both scalar and vector operations.
Simon Pilgrimfb7aa572018-03-15 14:45:30 +0000108def WriteFLoad : SchedWrite;
109def WriteFStore : SchedWrite;
110def WriteFMove : SchedWrite;
Simon Pilgrim86e3c2692018-04-17 07:22:44 +0000111defm WriteFAdd : X86SchedWritePair; // Floating point add/sub.
Simon Pilgrim5269167f2018-05-01 16:13:42 +0000112defm WriteFAddY : X86SchedWritePair; // Floating point add/sub (YMM/ZMM).
Simon Pilgrim86e3c2692018-04-17 07:22:44 +0000113defm WriteFCmp : X86SchedWritePair; // Floating point compare.
Simon Pilgrimc546f942018-05-01 16:50:16 +0000114defm WriteFCmpY : X86SchedWritePair; // Floating point compare (YMM/ZMM).
Simon Pilgrim86e3c2692018-04-17 07:22:44 +0000115defm WriteFCom : X86SchedWritePair; // Floating point compare to flags.
Simon Pilgrima271c542017-05-03 15:42:29 +0000116defm WriteFMul : X86SchedWritePair; // Floating point multiplication.
Simon Pilgrim21caf012018-05-01 18:22:53 +0000117defm WriteFMulY : X86SchedWritePair; // Floating point multiplication (YMM/ZMM).
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000118defm WriteFDiv : X86SchedWritePair; // Floating point division.
119defm WriteFDivX : X86SchedWritePair; // Floating point division (XMM).
120defm WriteFDivY : X86SchedWritePair; // Floating point division (YMM).
121defm WriteFDivZ : X86SchedWritePair; // Floating point division (ZMM).
122defm WriteFDiv64 : X86SchedWritePair; // Floating point division.
123defm WriteFDiv64X : X86SchedWritePair; // Floating point division (XMM).
124defm WriteFDiv64Y : X86SchedWritePair; // Floating point division (YMM).
125defm WriteFDiv64Z : X86SchedWritePair; // Floating point division (ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000126defm WriteFSqrt : X86SchedWritePair; // Floating point square root.
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000127defm WriteFSqrtX : X86SchedWritePair; // Floating point square root (XMM).
128defm WriteFSqrtY : X86SchedWritePair; // Floating point square root (YMM).
129defm WriteFSqrtZ : X86SchedWritePair; // Floating point square root (ZMM).
130defm WriteFSqrt64 : X86SchedWritePair; // Floating point double square root.
131defm WriteFSqrt64X : X86SchedWritePair; // Floating point double square root (XMM).
132defm WriteFSqrt64Y : X86SchedWritePair; // Floating point double square root (YMM).
133defm WriteFSqrt64Z : X86SchedWritePair; // Floating point double square root (ZMM).
134defm WriteFSqrt80 : X86SchedWritePair; // Floating point long double square root.
Simon Pilgrima271c542017-05-03 15:42:29 +0000135defm WriteFRcp : X86SchedWritePair; // Floating point reciprocal estimate.
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000136defm WriteFRcpX : X86SchedWritePair; // Floating point reciprocal estimate (XMM).
Simon Pilgrimc7088682018-05-01 18:06:07 +0000137defm WriteFRcpY : X86SchedWritePair; // Floating point reciprocal estimate (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000138defm WriteFRsqrt : X86SchedWritePair; // Floating point reciprocal square root estimate.
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000139defm WriteFRsqrtX: X86SchedWritePair; // Floating point reciprocal square root estimate (XMM).
Simon Pilgrimc7088682018-05-01 18:06:07 +0000140defm WriteFRsqrtY: X86SchedWritePair; // Floating point reciprocal square root estimate (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000141defm WriteFMA : X86SchedWritePair; // Fused Multiply Add.
Simon Pilgrim67cc2462018-05-04 15:20:18 +0000142defm WriteFMAX : X86SchedWritePair; // Fused Multiply Add (XMM).
Simon Pilgrimdbd1ae72018-04-25 13:07:58 +0000143defm WriteFMAY : X86SchedWritePair; // Fused Multiply Add (YMM/ZMM).
Simon Pilgrim542b20d2018-05-03 22:31:19 +0000144defm WriteDPPD : X86SchedWritePair; // Floating point double dot product.
145defm WriteDPPS : X86SchedWritePair; // Floating point single dot product.
146defm WriteDPPSY : X86SchedWritePair; // Floating point single dot product (YMM).
Simon Pilgrimb2aa89c2018-04-27 15:50:33 +0000147defm WriteFSign : X86SchedWritePair; // Floating point fabs/fchs.
Simon Pilgrimbe51b202018-05-04 12:59:24 +0000148defm WriteFRnd : X86SchedWritePair; // Floating point rounding.
149defm WriteFRndY : X86SchedWritePair; // Floating point rounding (YMM/ZMM).
Simon Pilgrimb2aa89c2018-04-27 15:50:33 +0000150defm WriteFLogic : X86SchedWritePair; // Floating point and/or/xor logicals.
151defm WriteFLogicY : X86SchedWritePair; // Floating point and/or/xor logicals (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000152defm WriteFShuffle : X86SchedWritePair; // Floating point vector shuffles.
Simon Pilgrimdd8eae12018-05-01 14:25:01 +0000153defm WriteFShuffleY : X86SchedWritePair; // Floating point vector shuffles (YMM/ZMM).
Simon Pilgrim89c8a102018-04-11 13:49:19 +0000154defm WriteFVarShuffle : X86SchedWritePair; // Floating point vector variable shuffles.
Simon Pilgrim8a937e02018-04-27 18:19:48 +0000155defm WriteFVarShuffleY : X86SchedWritePair; // Floating point vector variable shuffles (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000156defm WriteFBlend : X86SchedWritePair; // Floating point vector blends.
Simon Pilgrim8a937e02018-04-27 18:19:48 +0000157defm WriteFBlendY : X86SchedWritePair; // Floating point vector blends (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000158defm WriteFVarBlend : X86SchedWritePair; // Fp vector variable blends.
Simon Pilgrim8a937e02018-04-27 18:19:48 +0000159defm WriteFVarBlendY : X86SchedWritePair; // Fp vector variable blends (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000160
161// FMA Scheduling helper class.
162class FMASC { X86FoldableSchedWrite Sched = WriteFAdd; }
163
Andrew V. Tischenko8cb1d092017-06-08 16:44:13 +0000164// Horizontal Add/Sub (float and integer)
165defm WriteFHAdd : X86SchedWritePair;
Simon Pilgrimc3c767b2018-04-27 16:11:57 +0000166defm WriteFHAddY : X86SchedWritePair; // YMM/ZMM.
167defm WritePHAdd : X86SchedWritePair;
Simon Pilgrimf7dd6062018-05-03 13:27:10 +0000168defm WritePHAddY : X86SchedWritePair; // YMM/ZMM.
Andrew V. Tischenko8cb1d092017-06-08 16:44:13 +0000169
Simon Pilgrima271c542017-05-03 15:42:29 +0000170// Vector integer operations.
Simon Pilgrimfb7aa572018-03-15 14:45:30 +0000171def WriteVecLoad : SchedWrite;
172def WriteVecStore : SchedWrite;
173def WriteVecMove : SchedWrite;
Simon Pilgrima271c542017-05-03 15:42:29 +0000174defm WriteVecALU : X86SchedWritePair; // Vector integer ALU op, no logicals.
Simon Pilgrimf7dd6062018-05-03 13:27:10 +0000175defm WriteVecALUY : X86SchedWritePair; // Vector integer ALU op, no logicals (YMM/ZMM).
Simon Pilgrimd14d2e72018-04-20 21:16:05 +0000176defm WriteVecLogic : X86SchedWritePair; // Vector integer and/or/xor logicals.
Simon Pilgrim57f2b182018-05-01 12:39:17 +0000177defm WriteVecLogicY: X86SchedWritePair; // Vector integer and/or/xor logicals (YMM/ZMM).
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000178defm WriteVecShift : X86SchedWritePair; // Vector integer shifts (default).
179defm WriteVecShiftX : X86SchedWritePair; // Vector integer shifts (XMM).
180defm WriteVecShiftY : X86SchedWritePair; // Vector integer shifts (YMM/ZMM).
Simon Pilgrimd7ffbc52018-05-04 17:47:46 +0000181defm WriteVecShiftImm : X86SchedWritePair; // Vector integer immediate shifts (default).
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000182defm WriteVecShiftImmX: X86SchedWritePair; // Vector integer immediate shifts (XMM).
183defm WriteVecShiftImmY: X86SchedWritePair; // Vector integer immediate shifts (YMM/ZMM).
Simon Pilgrimd7ffbc52018-05-04 17:47:46 +0000184defm WriteVecIMul : X86SchedWritePair; // Vector integer multiply (default).
185defm WriteVecIMulX : X86SchedWritePair; // Vector integer multiply (XMM).
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000186defm WriteVecIMulY : X86SchedWritePair; // Vector integer multiply (YMM/ZMM).
187defm WritePMULLD : X86SchedWritePair; // Vector PMULLD.
188defm WritePMULLDY : X86SchedWritePair; // Vector PMULLD (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000189defm WriteShuffle : X86SchedWritePair; // Vector shuffles.
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000190defm WriteShuffleY : X86SchedWritePair; // Vector shuffles (YMM/ZMM).
Simon Pilgrim89c8a102018-04-11 13:49:19 +0000191defm WriteVarShuffle : X86SchedWritePair; // Vector variable shuffles.
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000192defm WriteVarShuffleY : X86SchedWritePair; // Vector variable shuffles (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000193defm WriteBlend : X86SchedWritePair; // Vector blends.
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000194defm WriteBlendY : X86SchedWritePair; // Vector blends (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000195defm WriteVarBlend : X86SchedWritePair; // Vector variable blends.
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000196defm WriteVarBlendY : X86SchedWritePair; // Vector variable blends (YMM/ZMM).
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000197defm WritePSADBW : X86SchedWritePair; // Vector PSADBW.
198defm WritePSADBWY : X86SchedWritePair; // Vector PSADBW (YMM/ZMM).
199defm WriteMPSAD : X86SchedWritePair; // Vector MPSAD.
200defm WriteMPSADY : X86SchedWritePair; // Vector MPSAD (YMM/ZMM).
Simon Pilgrim27bc83e2018-04-24 18:49:25 +0000201defm WritePHMINPOS : X86SchedWritePair; // Vector PHMINPOS.
Simon Pilgrima271c542017-05-03 15:42:29 +0000202
Simon Pilgrimf7d2a932018-04-24 13:21:41 +0000203// Vector insert/extract operations.
204defm WriteVecInsert : X86SchedWritePair; // Insert gpr to vector element.
205def WriteVecExtract : SchedWrite; // Extract vector element to gpr.
206def WriteVecExtractSt : SchedWrite; // Extract vector element and store.
207
Simon Pilgrima2f26782018-03-27 20:38:54 +0000208// MOVMSK operations.
Simon Pilgrimbf4c8c02018-05-04 14:54:33 +0000209def WriteFMOVMSK : SchedWrite;
210def WriteVecMOVMSK : SchedWrite;
211def WriteVecMOVMSKY : SchedWrite;
212def WriteMMXMOVMSK : SchedWrite;
Simon Pilgrima2f26782018-03-27 20:38:54 +0000213
Simon Pilgrima271c542017-05-03 15:42:29 +0000214// Conversion between integer and float.
215defm WriteCvtF2I : X86SchedWritePair; // Float -> Integer.
216defm WriteCvtI2F : X86SchedWritePair; // Integer -> Float.
217defm WriteCvtF2F : X86SchedWritePair; // Float -> Float size conversion.
Simon Pilgrimf0945aa2018-04-24 16:43:07 +0000218def WriteCvtF2FSt : SchedWrite; // // Float -> Float + store size conversion.
Simon Pilgrima271c542017-05-03 15:42:29 +0000219
Simon Pilgrim28e7bcb2018-03-26 21:06:14 +0000220// CRC32 instruction.
221defm WriteCRC32 : X86SchedWritePair;
222
Simon Pilgrima271c542017-05-03 15:42:29 +0000223// Strings instructions.
224// Packed Compare Implicit Length Strings, Return Mask
225defm WritePCmpIStrM : X86SchedWritePair;
226// Packed Compare Explicit Length Strings, Return Mask
227defm WritePCmpEStrM : X86SchedWritePair;
228// Packed Compare Implicit Length Strings, Return Index
229defm WritePCmpIStrI : X86SchedWritePair;
230// Packed Compare Explicit Length Strings, Return Index
231defm WritePCmpEStrI : X86SchedWritePair;
232
233// AES instructions.
234defm WriteAESDecEnc : X86SchedWritePair; // Decryption, encryption.
235defm WriteAESIMC : X86SchedWritePair; // InvMixColumn.
236defm WriteAESKeyGen : X86SchedWritePair; // Key Generation.
237
238// Carry-less multiplication instructions.
239defm WriteCLMul : X86SchedWritePair;
240
Simon Pilgrim0e51a122018-05-04 18:16:13 +0000241// EMMS/FEMMS
242def WriteEMMS : SchedWrite;
243
Craig Topper05242bf2018-04-21 18:07:36 +0000244// Load/store MXCSR
245def WriteLDMXCSR : SchedWrite;
246def WriteSTMXCSR : SchedWrite;
247
Simon Pilgrima271c542017-05-03 15:42:29 +0000248// Catch-all for expensive system instructions.
249def WriteSystem : SchedWrite;
250
251// AVX2.
252defm WriteFShuffle256 : X86SchedWritePair; // Fp 256-bit width vector shuffles.
Simon Pilgrim89c8a102018-04-11 13:49:19 +0000253defm WriteFVarShuffle256 : X86SchedWritePair; // Fp 256-bit width variable shuffles.
Simon Pilgrima271c542017-05-03 15:42:29 +0000254defm WriteShuffle256 : X86SchedWritePair; // 256-bit width vector shuffles.
Simon Pilgrim89c8a102018-04-11 13:49:19 +0000255defm WriteVarShuffle256 : X86SchedWritePair; // 256-bit width vector variable shuffles.
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000256defm WriteVarVecShift : X86SchedWritePair; // Variable vector shifts.
257defm WriteVarVecShiftY : X86SchedWritePair; // Variable vector shifts (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000258
259// Old microcoded instructions that nobody use.
260def WriteMicrocoded : SchedWrite;
261
262// Fence instructions.
263def WriteFence : SchedWrite;
264
265// Nop, not very useful expect it provides a model for nops!
266def WriteNop : SchedWrite;
267
Simon Pilgrim3c354082018-04-30 18:18:38 +0000268// Vector width wrappers.
269def SchedWriteFAdd
Simon Pilgrim5269167f2018-05-01 16:13:42 +0000270 : X86SchedWriteWidths<WriteFAdd, WriteFAdd, WriteFAddY, WriteFAddY>;
Simon Pilgrim342ac8c2018-05-03 09:11:32 +0000271def SchedWriteFHAdd
272 : X86SchedWriteWidths<WriteFHAdd, WriteFHAdd, WriteFHAddY, WriteFHAddY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000273def SchedWriteFCmp
Simon Pilgrimc546f942018-05-01 16:50:16 +0000274 : X86SchedWriteWidths<WriteFCmp, WriteFCmp, WriteFCmpY, WriteFCmpY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000275def SchedWriteFMul
Simon Pilgrim21caf012018-05-01 18:22:53 +0000276 : X86SchedWriteWidths<WriteFMul, WriteFMul, WriteFMulY, WriteFMulY>;
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000277def SchedWriteFMul64
278 : X86SchedWriteWidths<WriteFMul, WriteFMul, WriteFMulY, WriteFMulY>;
Simon Pilgrima1f1a3b2018-05-02 13:32:56 +0000279def SchedWriteFMA
Simon Pilgrim67cc2462018-05-04 15:20:18 +0000280 : X86SchedWriteWidths<WriteFMA, WriteFMAX, WriteFMAY, WriteFMAY>;
Simon Pilgrim542b20d2018-05-03 22:31:19 +0000281def SchedWriteDPPD
282 : X86SchedWriteWidths<WriteDPPD, WriteDPPD, WriteDPPD, WriteDPPD>;
283def SchedWriteDPPS
284 : X86SchedWriteWidths<WriteDPPS, WriteDPPS, WriteDPPSY, WriteDPPSY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000285def SchedWriteFDiv
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000286 : X86SchedWriteWidths<WriteFDiv, WriteFDivX, WriteFDivY, WriteFDivZ>;
287def SchedWriteFDiv64
288 : X86SchedWriteWidths<WriteFDiv64, WriteFDiv64X, WriteFDiv64Y, WriteFDiv64Z>;
Simon Pilgrimc7088682018-05-01 18:06:07 +0000289def SchedWriteFSqrt
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000290 : X86SchedWriteWidths<WriteFSqrt, WriteFSqrtX,
291 WriteFSqrtY, WriteFSqrtZ>;
292def SchedWriteFSqrt64
293 : X86SchedWriteWidths<WriteFSqrt64, WriteFSqrt64X,
294 WriteFSqrt64Y, WriteFSqrt64Z>;
Simon Pilgrim1b7a80d2018-05-01 15:57:17 +0000295def SchedWriteFRcp
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000296 : X86SchedWriteWidths<WriteFRcp, WriteFRcpX, WriteFRcpY, WriteFRcpY>;
Simon Pilgrim1b7a80d2018-05-01 15:57:17 +0000297def SchedWriteFRsqrt
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000298 : X86SchedWriteWidths<WriteFRsqrt, WriteFRsqrtX, WriteFRsqrtY, WriteFRsqrtY>;
Simon Pilgrimbe51b202018-05-04 12:59:24 +0000299def SchedWriteFRnd
300 : X86SchedWriteWidths<WriteFRnd, WriteFRnd, WriteFRndY, WriteFRndY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000301def SchedWriteFLogic
302 : X86SchedWriteWidths<WriteFLogic, WriteFLogic, WriteFLogicY, WriteFLogicY>;
303
304def SchedWriteFShuffle
305 : X86SchedWriteWidths<WriteFShuffle, WriteFShuffle,
Simon Pilgrimdd8eae12018-05-01 14:25:01 +0000306 WriteFShuffleY, WriteFShuffleY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000307def SchedWriteFVarShuffle
308 : X86SchedWriteWidths<WriteFVarShuffle, WriteFVarShuffle,
309 WriteFVarShuffleY, WriteFVarShuffleY>;
310def SchedWriteFBlend
311 : X86SchedWriteWidths<WriteFBlend, WriteFBlend, WriteFBlendY, WriteFBlendY>;
312def SchedWriteFVarBlend
313 : X86SchedWriteWidths<WriteFVarBlend, WriteFVarBlend,
314 WriteFVarBlendY, WriteFVarBlendY>;
315
316def SchedWriteVecALU
Simon Pilgrimf7dd6062018-05-03 13:27:10 +0000317 : X86SchedWriteWidths<WriteVecALU, WriteVecALU, WriteVecALUY, WriteVecALUY>;
Simon Pilgrim342ac8c2018-05-03 09:11:32 +0000318def SchedWritePHAdd
Simon Pilgrimf7dd6062018-05-03 13:27:10 +0000319 : X86SchedWriteWidths<WritePHAdd, WritePHAdd, WritePHAddY, WritePHAddY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000320def SchedWriteVecLogic
321 : X86SchedWriteWidths<WriteVecLogic, WriteVecLogic,
Simon Pilgrim57f2b182018-05-01 12:39:17 +0000322 WriteVecLogicY, WriteVecLogicY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000323def SchedWriteVecShift
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000324 : X86SchedWriteWidths<WriteVecShift, WriteVecShiftX,
325 WriteVecShiftY, WriteVecShiftY>;
326def SchedWriteVecShiftImm
Simon Pilgrimd7ffbc52018-05-04 17:47:46 +0000327 : X86SchedWriteWidths<WriteVecShiftImm, WriteVecShiftImmX,
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000328 WriteVecShiftImmY, WriteVecShiftImmY>;
Simon Pilgrime8671ef2018-05-02 12:27:54 +0000329def SchedWriteVarVecShift
330 : X86SchedWriteWidths<WriteVarVecShift, WriteVarVecShift,
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000331 WriteVarVecShiftY, WriteVarVecShiftY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000332def SchedWriteVecIMul
Simon Pilgrimd7ffbc52018-05-04 17:47:46 +0000333 : X86SchedWriteWidths<WriteVecIMul, WriteVecIMulX,
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000334 WriteVecIMulY, WriteVecIMulY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000335def SchedWritePMULLD
336 : X86SchedWriteWidths<WritePMULLD, WritePMULLD,
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000337 WritePMULLDY, WritePMULLDY>;
Simon Pilgrime8671ef2018-05-02 12:27:54 +0000338def SchedWriteMPSAD
339 : X86SchedWriteWidths<WriteMPSAD, WriteMPSAD,
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000340 WriteMPSADY, WriteMPSADY>;
Simon Pilgrime8671ef2018-05-02 12:27:54 +0000341def SchedWritePSADBW
342 : X86SchedWriteWidths<WritePSADBW, WritePSADBW,
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000343 WritePSADBWY, WritePSADBWY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000344
345def SchedWriteShuffle
346 : X86SchedWriteWidths<WriteShuffle, WriteShuffle,
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000347 WriteShuffleY, WriteShuffleY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000348def SchedWriteVarShuffle
349 : X86SchedWriteWidths<WriteVarShuffle, WriteVarShuffle,
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000350 WriteVarShuffleY, WriteVarShuffleY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000351def SchedWriteBlend
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000352 : X86SchedWriteWidths<WriteBlend, WriteBlend, WriteBlendY, WriteBlendY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000353def SchedWriteVarBlend
354 : X86SchedWriteWidths<WriteVarBlend, WriteVarBlend,
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000355 WriteVarBlendY, WriteVarBlendY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000356
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000357// Vector size wrappers.
358def SchedWriteFAddSizes
359 : X86SchedWriteSizes<SchedWriteFAdd, SchedWriteFAdd>;
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000360def SchedWriteFCmpSizes
361 : X86SchedWriteSizes<SchedWriteFCmp, SchedWriteFCmp>;
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000362def SchedWriteFMulSizes
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000363 : X86SchedWriteSizes<SchedWriteFMul, SchedWriteFMul64>;
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000364def SchedWriteFDivSizes
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000365 : X86SchedWriteSizes<SchedWriteFDiv, SchedWriteFDiv64>;
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000366def SchedWriteFSqrtSizes
367 : X86SchedWriteSizes<SchedWriteFSqrt, SchedWriteFSqrt64>;
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000368def SchedWriteFLogicSizes
369 : X86SchedWriteSizes<SchedWriteFLogic, SchedWriteFLogic>;
370def SchedWriteFShuffleSizes
371 : X86SchedWriteSizes<SchedWriteFShuffle, SchedWriteFShuffle>;
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000372
Simon Pilgrima271c542017-05-03 15:42:29 +0000373//===----------------------------------------------------------------------===//
Simon Pilgrim35935c02018-04-12 18:46:15 +0000374// Generic Processor Scheduler Models.
Simon Pilgrima271c542017-05-03 15:42:29 +0000375
376// IssueWidth is analogous to the number of decode units. Core and its
377// descendents, including Nehalem and SandyBridge have 4 decoders.
378// Resources beyond the decoder operate on micro-ops and are bufferred
379// so adjacent micro-ops don't directly compete.
380//
381// MicroOpBufferSize > 1 indicates that RAW dependencies can be
382// decoded in the same cycle. The value 32 is a reasonably arbitrary
383// number of in-flight instructions.
384//
385// HighLatency=10 is optimistic. X86InstrInfo::isHighLatencyDef
386// indicates high latency opcodes. Alternatively, InstrItinData
387// entries may be included here to define specific operand
388// latencies. Since these latencies are not used for pipeline hazards,
389// they do not need to be exact.
390//
Simon Pilgrime0c78682018-04-13 14:31:57 +0000391// The GenericX86Model contains no instruction schedules
Simon Pilgrima271c542017-05-03 15:42:29 +0000392// and disables PostRAScheduler.
393class GenericX86Model : SchedMachineModel {
394 let IssueWidth = 4;
395 let MicroOpBufferSize = 32;
396 let LoadLatency = 4;
397 let HighLatency = 10;
398 let PostRAScheduler = 0;
399 let CompleteModel = 0;
400}
401
402def GenericModel : GenericX86Model;
403
404// Define a model with the PostRAScheduler enabled.
405def GenericPostRAModel : GenericX86Model {
406 let PostRAScheduler = 1;
407}
408