blob: 4c004f02630b8dae9d2c679f93e1a3a46bd6a79a [file] [log] [blame]
Simon Pilgrima271c542017-05-03 15:42:29 +00001//===-- X86Schedule.td - X86 Scheduling Definitions --------*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
Simon Pilgrim963bf4d2018-04-13 14:24:06 +000010//===----------------------------------------------------------------------===//
Simon Pilgrima271c542017-05-03 15:42:29 +000011// InstrSchedModel annotations for out-of-order CPUs.
Simon Pilgrima271c542017-05-03 15:42:29 +000012
13// Instructions with folded loads need to read the memory operand immediately,
14// but other register operands don't have to be read until the load is ready.
15// These operands are marked with ReadAfterLd.
16def ReadAfterLd : SchedRead;
17
18// Instructions with both a load and a store folded are modeled as a folded
19// load + WriteRMW.
20def WriteRMW : SchedWrite;
21
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +000022// Helper to set SchedWrite ExePorts/Latency/ResourceCycles/NumMicroOps.
23multiclass X86WriteRes<SchedWrite SchedRW,
24 list<ProcResourceKind> ExePorts,
25 int Lat, list<int> Res, int UOps> {
26 def : WriteRes<SchedRW, ExePorts> {
27 let Latency = Lat;
28 let ResourceCycles = Res;
29 let NumMicroOps = UOps;
30 }
31}
32
Simon Pilgrima271c542017-05-03 15:42:29 +000033// Most instructions can fold loads, so almost every SchedWrite comes in two
34// variants: With and without a folded load.
35// An X86FoldableSchedWrite holds a reference to the corresponding SchedWrite
36// with a folded load.
37class X86FoldableSchedWrite : SchedWrite {
38 // The SchedWrite to use when a load is folded into the instruction.
39 SchedWrite Folded;
40}
41
42// Multiclass that produces a linked pair of SchedWrites.
43multiclass X86SchedWritePair {
44 // Register-Memory operation.
45 def Ld : SchedWrite;
46 // Register-Register operation.
47 def NAME : X86FoldableSchedWrite {
48 let Folded = !cast<SchedWrite>(NAME#"Ld");
49 }
50}
51
Simon Pilgrim3c354082018-04-30 18:18:38 +000052// Multiclass that wraps X86FoldableSchedWrite for each vector width.
53class X86SchedWriteWidths<X86FoldableSchedWrite sScl,
54 X86FoldableSchedWrite s128,
55 X86FoldableSchedWrite s256,
56 X86FoldableSchedWrite s512> {
57 X86FoldableSchedWrite Scl = sScl; // Scalar float/double operations.
58 X86FoldableSchedWrite MMX = sScl; // MMX operations.
59 X86FoldableSchedWrite XMM = s128; // XMM operations.
60 X86FoldableSchedWrite YMM = s256; // YMM operations.
61 X86FoldableSchedWrite ZMM = s512; // ZMM operations.
62}
63
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +000064// Multiclass that wraps X86SchedWriteWidths for each fp vector type.
65class X86SchedWriteSizes<X86SchedWriteWidths sPS,
66 X86SchedWriteWidths sPD> {
67 X86SchedWriteWidths PS = sPS;
68 X86SchedWriteWidths PD = sPD;
69}
70
Simon Pilgrimead11e42018-05-11 12:46:54 +000071// Multiclass that wraps move/load/store triple for a vector width.
72class X86SchedWriteMoveLS<SchedWrite MoveRR,
73 SchedWrite LoadRM,
74 SchedWrite StoreMR> {
75 SchedWrite RR = MoveRR;
76 SchedWrite RM = LoadRM;
77 SchedWrite MR = StoreMR;
78}
79
80// Multiclass that wraps X86SchedWriteMoveLS for each vector width.
81class X86SchedWriteMoveLSWidths<X86SchedWriteMoveLS sScl,
82 X86SchedWriteMoveLS s128,
83 X86SchedWriteMoveLS s256,
84 X86SchedWriteMoveLS s512> {
85 X86SchedWriteMoveLS Scl = sScl; // Scalar float/double operations.
86 X86SchedWriteMoveLS MMX = sScl; // MMX operations.
87 X86SchedWriteMoveLS XMM = s128; // XMM operations.
88 X86SchedWriteMoveLS YMM = s256; // YMM operations.
89 X86SchedWriteMoveLS ZMM = s512; // ZMM operations.
90}
91
Craig Topperb7baa352018-04-08 17:53:18 +000092// Loads, stores, and moves, not folded with other operations.
Simon Pilgrim215ce4a2018-05-14 18:37:19 +000093def WriteLoad : SchedWrite;
94def WriteStore : SchedWrite;
95def WriteStoreNT : SchedWrite;
96def WriteMove : SchedWrite;
Craig Topperb7baa352018-04-08 17:53:18 +000097
Simon Pilgrima271c542017-05-03 15:42:29 +000098// Arithmetic.
Simon Pilgrim2864b462018-05-08 14:55:16 +000099defm WriteALU : X86SchedWritePair; // Simple integer ALU op.
Simon Pilgrimead11e42018-05-11 12:46:54 +0000100def WriteALURMW : WriteSequence<[WriteALULd, WriteStore]>;
Simon Pilgrim2864b462018-05-08 14:55:16 +0000101defm WriteIMul : X86SchedWritePair; // Integer multiplication.
102defm WriteIMul64 : X86SchedWritePair; // Integer 64-bit multiplication.
103def WriteIMulH : SchedWrite; // Integer multiplication, high part.
104def WriteLEA : SchedWrite; // LEA instructions can't fold loads.
Simon Pilgrima271c542017-05-03 15:42:29 +0000105
Simon Pilgrim25805542018-05-08 13:51:45 +0000106// Integer division.
107defm WriteDiv8 : X86SchedWritePair;
108defm WriteDiv16 : X86SchedWritePair;
109defm WriteDiv32 : X86SchedWritePair;
110defm WriteDiv64 : X86SchedWritePair;
111defm WriteIDiv8 : X86SchedWritePair;
112defm WriteIDiv16 : X86SchedWritePair;
113defm WriteIDiv32 : X86SchedWritePair;
114defm WriteIDiv64 : X86SchedWritePair;
115
Simon Pilgrimf33d9052018-03-26 18:19:28 +0000116defm WriteBitScan : X86SchedWritePair; // Bit scan forward/reverse.
117defm WritePOPCNT : X86SchedWritePair; // Bit population count.
118defm WriteLZCNT : X86SchedWritePair; // Leading zero count.
119defm WriteTZCNT : X86SchedWritePair; // Trailing zero count.
Craig Topperb7baa352018-04-08 17:53:18 +0000120defm WriteCMOV : X86SchedWritePair; // Conditional move.
Simon Pilgrim6e160c12018-05-12 18:07:07 +0000121def WriteFCMOV : SchedWrite; // X87 conditional move.
Craig Topperb7baa352018-04-08 17:53:18 +0000122def WriteSETCC : SchedWrite; // Set register based on condition code.
123def WriteSETCCStore : SchedWrite;
Simon Pilgrimf33d9052018-03-26 18:19:28 +0000124
Simon Pilgrima271c542017-05-03 15:42:29 +0000125// Integer shifts and rotates.
126defm WriteShift : X86SchedWritePair;
127
Craig Topper89310f52018-03-29 20:41:39 +0000128// BMI1 BEXTR, BMI2 BZHI
129defm WriteBEXTR : X86SchedWritePair;
130defm WriteBZHI : X86SchedWritePair;
131
Simon Pilgrima271c542017-05-03 15:42:29 +0000132// Idioms that clear a register, like xorps %xmm0, %xmm0.
133// These can often bypass execution ports completely.
134def WriteZero : SchedWrite;
135
136// Branches don't produce values, so they have no latency, but they still
137// consume resources. Indirect branches can fold loads.
138defm WriteJump : X86SchedWritePair;
139
140// Floating point. This covers both scalar and vector operations.
Simon Pilgrimb0a3be02018-05-08 12:17:55 +0000141def WriteFLoad : SchedWrite;
Simon Pilgrim22dd72b2018-05-11 14:30:54 +0000142def WriteFLoadX : SchedWrite;
143def WriteFLoadY : SchedWrite;
Simon Pilgrimb0a3be02018-05-08 12:17:55 +0000144def WriteFMaskedLoad : SchedWrite;
145def WriteFMaskedLoadY : SchedWrite;
146def WriteFStore : SchedWrite;
Simon Pilgrim22dd72b2018-05-11 14:30:54 +0000147def WriteFStoreX : SchedWrite;
148def WriteFStoreY : SchedWrite;
Simon Pilgrim215ce4a2018-05-14 18:37:19 +0000149def WriteFStoreNT : SchedWrite;
150def WriteFStoreNTX : SchedWrite;
151def WriteFStoreNTY : SchedWrite;
Simon Pilgrimb0a3be02018-05-08 12:17:55 +0000152def WriteFMaskedStore : SchedWrite;
153def WriteFMaskedStoreY : SchedWrite;
154def WriteFMove : SchedWrite;
Simon Pilgrim22dd72b2018-05-11 14:30:54 +0000155def WriteFMoveX : SchedWrite;
156def WriteFMoveY : SchedWrite;
Simon Pilgrim1233e122018-05-07 20:52:53 +0000157
158defm WriteFAdd : X86SchedWritePair; // Floating point add/sub.
159defm WriteFAddX : X86SchedWritePair; // Floating point add/sub (XMM).
160defm WriteFAddY : X86SchedWritePair; // Floating point add/sub (YMM/ZMM).
161defm WriteFAdd64 : X86SchedWritePair; // Floating point double add/sub.
162defm WriteFAdd64X : X86SchedWritePair; // Floating point double add/sub (XMM).
163defm WriteFAdd64Y : X86SchedWritePair; // Floating point double add/sub (YMM/ZMM).
164defm WriteFCmp : X86SchedWritePair; // Floating point compare.
165defm WriteFCmpX : X86SchedWritePair; // Floating point compare (XMM).
166defm WriteFCmpY : X86SchedWritePair; // Floating point compare (YMM/ZMM).
167defm WriteFCmp64 : X86SchedWritePair; // Floating point double compare.
168defm WriteFCmp64X : X86SchedWritePair; // Floating point double compare (XMM).
169defm WriteFCmp64Y : X86SchedWritePair; // Floating point double compare (YMM/ZMM).
170defm WriteFCom : X86SchedWritePair; // Floating point compare to flags.
171defm WriteFMul : X86SchedWritePair; // Floating point multiplication.
172defm WriteFMulX : X86SchedWritePair; // Floating point multiplication (XMM).
173defm WriteFMulY : X86SchedWritePair; // Floating point multiplication (YMM/ZMM).
174defm WriteFMul64 : X86SchedWritePair; // Floating point double multiplication.
175defm WriteFMul64X : X86SchedWritePair; // Floating point double multiplication (XMM).
176defm WriteFMul64Y : X86SchedWritePair; // Floating point double multiplication (YMM/ZMM).
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000177defm WriteFDiv : X86SchedWritePair; // Floating point division.
178defm WriteFDivX : X86SchedWritePair; // Floating point division (XMM).
179defm WriteFDivY : X86SchedWritePair; // Floating point division (YMM).
180defm WriteFDivZ : X86SchedWritePair; // Floating point division (ZMM).
Simon Pilgrim1233e122018-05-07 20:52:53 +0000181defm WriteFDiv64 : X86SchedWritePair; // Floating point double division.
182defm WriteFDiv64X : X86SchedWritePair; // Floating point double division (XMM).
183defm WriteFDiv64Y : X86SchedWritePair; // Floating point double division (YMM).
184defm WriteFDiv64Z : X86SchedWritePair; // Floating point double division (ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000185defm WriteFSqrt : X86SchedWritePair; // Floating point square root.
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000186defm WriteFSqrtX : X86SchedWritePair; // Floating point square root (XMM).
187defm WriteFSqrtY : X86SchedWritePair; // Floating point square root (YMM).
188defm WriteFSqrtZ : X86SchedWritePair; // Floating point square root (ZMM).
189defm WriteFSqrt64 : X86SchedWritePair; // Floating point double square root.
190defm WriteFSqrt64X : X86SchedWritePair; // Floating point double square root (XMM).
191defm WriteFSqrt64Y : X86SchedWritePair; // Floating point double square root (YMM).
192defm WriteFSqrt64Z : X86SchedWritePair; // Floating point double square root (ZMM).
193defm WriteFSqrt80 : X86SchedWritePair; // Floating point long double square root.
Simon Pilgrima271c542017-05-03 15:42:29 +0000194defm WriteFRcp : X86SchedWritePair; // Floating point reciprocal estimate.
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000195defm WriteFRcpX : X86SchedWritePair; // Floating point reciprocal estimate (XMM).
Simon Pilgrimc7088682018-05-01 18:06:07 +0000196defm WriteFRcpY : X86SchedWritePair; // Floating point reciprocal estimate (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000197defm WriteFRsqrt : X86SchedWritePair; // Floating point reciprocal square root estimate.
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000198defm WriteFRsqrtX: X86SchedWritePair; // Floating point reciprocal square root estimate (XMM).
Simon Pilgrimc7088682018-05-01 18:06:07 +0000199defm WriteFRsqrtY: X86SchedWritePair; // Floating point reciprocal square root estimate (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000200defm WriteFMA : X86SchedWritePair; // Fused Multiply Add.
Simon Pilgrim67cc2462018-05-04 15:20:18 +0000201defm WriteFMAX : X86SchedWritePair; // Fused Multiply Add (XMM).
Simon Pilgrimdbd1ae72018-04-25 13:07:58 +0000202defm WriteFMAY : X86SchedWritePair; // Fused Multiply Add (YMM/ZMM).
Simon Pilgrim542b20d2018-05-03 22:31:19 +0000203defm WriteDPPD : X86SchedWritePair; // Floating point double dot product.
204defm WriteDPPS : X86SchedWritePair; // Floating point single dot product.
205defm WriteDPPSY : X86SchedWritePair; // Floating point single dot product (YMM).
Simon Pilgrimb2aa89c2018-04-27 15:50:33 +0000206defm WriteFSign : X86SchedWritePair; // Floating point fabs/fchs.
Simon Pilgrimbe51b202018-05-04 12:59:24 +0000207defm WriteFRnd : X86SchedWritePair; // Floating point rounding.
208defm WriteFRndY : X86SchedWritePair; // Floating point rounding (YMM/ZMM).
Simon Pilgrimb2aa89c2018-04-27 15:50:33 +0000209defm WriteFLogic : X86SchedWritePair; // Floating point and/or/xor logicals.
210defm WriteFLogicY : X86SchedWritePair; // Floating point and/or/xor logicals (YMM/ZMM).
Simon Pilgrim210286e2018-05-08 10:28:03 +0000211defm WriteFTest : X86SchedWritePair; // Floating point TEST instructions.
212defm WriteFTestY : X86SchedWritePair; // Floating point TEST instructions (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000213defm WriteFShuffle : X86SchedWritePair; // Floating point vector shuffles.
Simon Pilgrimdd8eae12018-05-01 14:25:01 +0000214defm WriteFShuffleY : X86SchedWritePair; // Floating point vector shuffles (YMM/ZMM).
Simon Pilgrim89c8a102018-04-11 13:49:19 +0000215defm WriteFVarShuffle : X86SchedWritePair; // Floating point vector variable shuffles.
Simon Pilgrim8a937e02018-04-27 18:19:48 +0000216defm WriteFVarShuffleY : X86SchedWritePair; // Floating point vector variable shuffles (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000217defm WriteFBlend : X86SchedWritePair; // Floating point vector blends.
Simon Pilgrim8a937e02018-04-27 18:19:48 +0000218defm WriteFBlendY : X86SchedWritePair; // Floating point vector blends (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000219defm WriteFVarBlend : X86SchedWritePair; // Fp vector variable blends.
Simon Pilgrim8a937e02018-04-27 18:19:48 +0000220defm WriteFVarBlendY : X86SchedWritePair; // Fp vector variable blends (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000221
222// FMA Scheduling helper class.
223class FMASC { X86FoldableSchedWrite Sched = WriteFAdd; }
224
Andrew V. Tischenko8cb1d092017-06-08 16:44:13 +0000225// Horizontal Add/Sub (float and integer)
226defm WriteFHAdd : X86SchedWritePair;
Simon Pilgrimc3c767b2018-04-27 16:11:57 +0000227defm WriteFHAddY : X86SchedWritePair; // YMM/ZMM.
228defm WritePHAdd : X86SchedWritePair;
Simon Pilgrim38ac0e92018-05-10 17:06:09 +0000229defm WritePHAddX : X86SchedWritePair; // XMM.
Simon Pilgrimf7dd6062018-05-03 13:27:10 +0000230defm WritePHAddY : X86SchedWritePair; // YMM/ZMM.
Andrew V. Tischenko8cb1d092017-06-08 16:44:13 +0000231
Simon Pilgrima271c542017-05-03 15:42:29 +0000232// Vector integer operations.
Simon Pilgrimb0a3be02018-05-08 12:17:55 +0000233def WriteVecLoad : SchedWrite;
Simon Pilgrim22dd72b2018-05-11 14:30:54 +0000234def WriteVecLoadX : SchedWrite;
235def WriteVecLoadY : SchedWrite;
Simon Pilgrim215ce4a2018-05-14 18:37:19 +0000236def WriteVecLoadNT : SchedWrite;
237def WriteVecLoadNTY : SchedWrite;
Simon Pilgrimb0a3be02018-05-08 12:17:55 +0000238def WriteVecMaskedLoad : SchedWrite;
239def WriteVecMaskedLoadY : SchedWrite;
240def WriteVecStore : SchedWrite;
Simon Pilgrim22dd72b2018-05-11 14:30:54 +0000241def WriteVecStoreX : SchedWrite;
242def WriteVecStoreY : SchedWrite;
Simon Pilgrim215ce4a2018-05-14 18:37:19 +0000243def WriteVecStoreNT : SchedWrite;
244def WriteVecStoreNTY : SchedWrite;
Simon Pilgrimb0a3be02018-05-08 12:17:55 +0000245def WriteVecMaskedStore : SchedWrite;
246def WriteVecMaskedStoreY : SchedWrite;
247def WriteVecMove : SchedWrite;
Simon Pilgrim22dd72b2018-05-11 14:30:54 +0000248def WriteVecMoveX : SchedWrite;
249def WriteVecMoveY : SchedWrite;
Simon Pilgrim210286e2018-05-08 10:28:03 +0000250
Simon Pilgrim38ac0e92018-05-10 17:06:09 +0000251defm WriteVecALU : X86SchedWritePair; // Vector integer ALU op, no logicals.
252defm WriteVecALUX : X86SchedWritePair; // Vector integer ALU op, no logicals (XMM).
253defm WriteVecALUY : X86SchedWritePair; // Vector integer ALU op, no logicals (YMM/ZMM).
254defm WriteVecLogic : X86SchedWritePair; // Vector integer and/or/xor logicals.
255defm WriteVecLogicX : X86SchedWritePair; // Vector integer and/or/xor logicals (XMM).
256defm WriteVecLogicY : X86SchedWritePair; // Vector integer and/or/xor logicals (YMM/ZMM).
Simon Pilgrim210286e2018-05-08 10:28:03 +0000257defm WriteVecTest : X86SchedWritePair; // Vector integer TEST instructions.
258defm WriteVecTestY : X86SchedWritePair; // Vector integer TEST instructions (YMM/ZMM).
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000259defm WriteVecShift : X86SchedWritePair; // Vector integer shifts (default).
260defm WriteVecShiftX : X86SchedWritePair; // Vector integer shifts (XMM).
261defm WriteVecShiftY : X86SchedWritePair; // Vector integer shifts (YMM/ZMM).
Simon Pilgrimd7ffbc52018-05-04 17:47:46 +0000262defm WriteVecShiftImm : X86SchedWritePair; // Vector integer immediate shifts (default).
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000263defm WriteVecShiftImmX: X86SchedWritePair; // Vector integer immediate shifts (XMM).
264defm WriteVecShiftImmY: X86SchedWritePair; // Vector integer immediate shifts (YMM/ZMM).
Simon Pilgrimd7ffbc52018-05-04 17:47:46 +0000265defm WriteVecIMul : X86SchedWritePair; // Vector integer multiply (default).
266defm WriteVecIMulX : X86SchedWritePair; // Vector integer multiply (XMM).
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000267defm WriteVecIMulY : X86SchedWritePair; // Vector integer multiply (YMM/ZMM).
268defm WritePMULLD : X86SchedWritePair; // Vector PMULLD.
269defm WritePMULLDY : X86SchedWritePair; // Vector PMULLD (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000270defm WriteShuffle : X86SchedWritePair; // Vector shuffles.
Simon Pilgrim38ac0e92018-05-10 17:06:09 +0000271defm WriteShuffleX : X86SchedWritePair; // Vector shuffles (XMM).
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000272defm WriteShuffleY : X86SchedWritePair; // Vector shuffles (YMM/ZMM).
Simon Pilgrim89c8a102018-04-11 13:49:19 +0000273defm WriteVarShuffle : X86SchedWritePair; // Vector variable shuffles.
Simon Pilgrim38ac0e92018-05-10 17:06:09 +0000274defm WriteVarShuffleX : X86SchedWritePair; // Vector variable shuffles (XMM).
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000275defm WriteVarShuffleY : X86SchedWritePair; // Vector variable shuffles (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000276defm WriteBlend : X86SchedWritePair; // Vector blends.
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000277defm WriteBlendY : X86SchedWritePair; // Vector blends (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000278defm WriteVarBlend : X86SchedWritePair; // Vector variable blends.
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000279defm WriteVarBlendY : X86SchedWritePair; // Vector variable blends (YMM/ZMM).
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000280defm WritePSADBW : X86SchedWritePair; // Vector PSADBW.
Simon Pilgrim38ac0e92018-05-10 17:06:09 +0000281defm WritePSADBWX : X86SchedWritePair; // Vector PSADBW (XMM).
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000282defm WritePSADBWY : X86SchedWritePair; // Vector PSADBW (YMM/ZMM).
283defm WriteMPSAD : X86SchedWritePair; // Vector MPSAD.
284defm WriteMPSADY : X86SchedWritePair; // Vector MPSAD (YMM/ZMM).
Simon Pilgrim27bc83e2018-04-24 18:49:25 +0000285defm WritePHMINPOS : X86SchedWritePair; // Vector PHMINPOS.
Simon Pilgrima271c542017-05-03 15:42:29 +0000286
Simon Pilgrimf7d2a932018-04-24 13:21:41 +0000287// Vector insert/extract operations.
288defm WriteVecInsert : X86SchedWritePair; // Insert gpr to vector element.
289def WriteVecExtract : SchedWrite; // Extract vector element to gpr.
290def WriteVecExtractSt : SchedWrite; // Extract vector element and store.
291
Simon Pilgrima2f26782018-03-27 20:38:54 +0000292// MOVMSK operations.
Simon Pilgrimbf4c8c02018-05-04 14:54:33 +0000293def WriteFMOVMSK : SchedWrite;
294def WriteVecMOVMSK : SchedWrite;
295def WriteVecMOVMSKY : SchedWrite;
296def WriteMMXMOVMSK : SchedWrite;
Simon Pilgrima2f26782018-03-27 20:38:54 +0000297
Simon Pilgrima271c542017-05-03 15:42:29 +0000298// Conversion between integer and float.
299defm WriteCvtF2I : X86SchedWritePair; // Float -> Integer.
300defm WriteCvtI2F : X86SchedWritePair; // Integer -> Float.
301defm WriteCvtF2F : X86SchedWritePair; // Float -> Float size conversion.
Simon Pilgrim891ebcd2018-05-15 14:12:32 +0000302
303defm WriteCvtPH2PS : X86SchedWritePair; // Half -> Float size conversion.
304defm WriteCvtPH2PSY : X86SchedWritePair; // Half -> Float size conversion (YMM/ZMM).
305
306def WriteCvtPS2PH : SchedWrite; // // Float -> Half size conversion.
307def WriteCvtPS2PHY : SchedWrite; // // Float -> Half size conversion (YMM/ZMM).
308def WriteCvtPS2PHSt : SchedWrite; // // Float -> Half + store size conversion.
309def WriteCvtPS2PHYSt : SchedWrite; // // Float -> Half + store size conversion (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000310
Simon Pilgrim28e7bcb2018-03-26 21:06:14 +0000311// CRC32 instruction.
312defm WriteCRC32 : X86SchedWritePair;
313
Simon Pilgrima271c542017-05-03 15:42:29 +0000314// Strings instructions.
315// Packed Compare Implicit Length Strings, Return Mask
316defm WritePCmpIStrM : X86SchedWritePair;
317// Packed Compare Explicit Length Strings, Return Mask
318defm WritePCmpEStrM : X86SchedWritePair;
319// Packed Compare Implicit Length Strings, Return Index
320defm WritePCmpIStrI : X86SchedWritePair;
321// Packed Compare Explicit Length Strings, Return Index
322defm WritePCmpEStrI : X86SchedWritePair;
323
324// AES instructions.
325defm WriteAESDecEnc : X86SchedWritePair; // Decryption, encryption.
326defm WriteAESIMC : X86SchedWritePair; // InvMixColumn.
327defm WriteAESKeyGen : X86SchedWritePair; // Key Generation.
328
329// Carry-less multiplication instructions.
330defm WriteCLMul : X86SchedWritePair;
331
Simon Pilgrim0e51a122018-05-04 18:16:13 +0000332// EMMS/FEMMS
333def WriteEMMS : SchedWrite;
334
Craig Topper05242bf2018-04-21 18:07:36 +0000335// Load/store MXCSR
336def WriteLDMXCSR : SchedWrite;
337def WriteSTMXCSR : SchedWrite;
338
Simon Pilgrima271c542017-05-03 15:42:29 +0000339// Catch-all for expensive system instructions.
340def WriteSystem : SchedWrite;
341
342// AVX2.
343defm WriteFShuffle256 : X86SchedWritePair; // Fp 256-bit width vector shuffles.
Simon Pilgrim89c8a102018-04-11 13:49:19 +0000344defm WriteFVarShuffle256 : X86SchedWritePair; // Fp 256-bit width variable shuffles.
Simon Pilgrima271c542017-05-03 15:42:29 +0000345defm WriteShuffle256 : X86SchedWritePair; // 256-bit width vector shuffles.
Simon Pilgrim89c8a102018-04-11 13:49:19 +0000346defm WriteVarShuffle256 : X86SchedWritePair; // 256-bit width vector variable shuffles.
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000347defm WriteVarVecShift : X86SchedWritePair; // Variable vector shifts.
348defm WriteVarVecShiftY : X86SchedWritePair; // Variable vector shifts (YMM/ZMM).
Simon Pilgrima271c542017-05-03 15:42:29 +0000349
350// Old microcoded instructions that nobody use.
351def WriteMicrocoded : SchedWrite;
352
353// Fence instructions.
354def WriteFence : SchedWrite;
355
356// Nop, not very useful expect it provides a model for nops!
357def WriteNop : SchedWrite;
358
Simon Pilgrimead11e42018-05-11 12:46:54 +0000359// Move/Load/Store wrappers.
360def WriteFMoveLS
361 : X86SchedWriteMoveLS<WriteFMove, WriteFLoad, WriteFStore>;
362def WriteFMoveLSX
Simon Pilgrim22dd72b2018-05-11 14:30:54 +0000363 : X86SchedWriteMoveLS<WriteFMoveX, WriteFLoadX, WriteFStoreX>;
Simon Pilgrimead11e42018-05-11 12:46:54 +0000364def WriteFMoveLSY
Simon Pilgrim22dd72b2018-05-11 14:30:54 +0000365 : X86SchedWriteMoveLS<WriteFMoveY, WriteFLoadY, WriteFStoreY>;
Simon Pilgrimead11e42018-05-11 12:46:54 +0000366def SchedWriteFMoveLS
367 : X86SchedWriteMoveLSWidths<WriteFMoveLS, WriteFMoveLSX,
368 WriteFMoveLSY, WriteFMoveLSY>;
369
Simon Pilgrim215ce4a2018-05-14 18:37:19 +0000370def WriteFMoveLSNT
371 : X86SchedWriteMoveLS<WriteFMove, WriteFLoad, WriteFStoreNT>;
372def WriteFMoveLSNTX
373 : X86SchedWriteMoveLS<WriteFMove, WriteFLoad, WriteFStoreNTX>;
374def WriteFMoveLSNTY
375 : X86SchedWriteMoveLS<WriteFMoveY, WriteFLoadY, WriteFStoreNTY>;
376def SchedWriteFMoveLSNT
377 : X86SchedWriteMoveLSWidths<WriteFMoveLSNT, WriteFMoveLSNTX,
378 WriteFMoveLSNTY, WriteFMoveLSNTY>;
379
Simon Pilgrimead11e42018-05-11 12:46:54 +0000380def WriteVecMoveLS
381 : X86SchedWriteMoveLS<WriteVecMove, WriteVecLoad, WriteVecStore>;
382def WriteVecMoveLSX
Simon Pilgrim22dd72b2018-05-11 14:30:54 +0000383 : X86SchedWriteMoveLS<WriteVecMoveX, WriteVecLoadX, WriteVecStoreX>;
Simon Pilgrimead11e42018-05-11 12:46:54 +0000384def WriteVecMoveLSY
Simon Pilgrim22dd72b2018-05-11 14:30:54 +0000385 : X86SchedWriteMoveLS<WriteVecMoveY, WriteVecLoadY, WriteVecStoreY>;
Simon Pilgrimead11e42018-05-11 12:46:54 +0000386def SchedWriteVecMoveLS
387 : X86SchedWriteMoveLSWidths<WriteVecMoveLS, WriteVecMoveLSX,
388 WriteVecMoveLSY, WriteVecMoveLSY>;
389
Simon Pilgrim215ce4a2018-05-14 18:37:19 +0000390def WriteVecMoveLSNT
391 : X86SchedWriteMoveLS<WriteVecMove, WriteVecLoadNT, WriteVecStoreNT>;
392def WriteVecMoveLSNTX
393 : X86SchedWriteMoveLS<WriteVecMoveX, WriteVecLoadNT, WriteVecStoreNT>;
394def WriteVecMoveLSNTY
395 : X86SchedWriteMoveLS<WriteVecMoveY, WriteVecLoadNTY, WriteVecStoreNTY>;
396def SchedWriteVecMoveLSNT
397 : X86SchedWriteMoveLSWidths<WriteVecMoveLSNT, WriteVecMoveLSNTX,
398 WriteVecMoveLSNTY, WriteVecMoveLSNTY>;
399
Simon Pilgrim3c354082018-04-30 18:18:38 +0000400// Vector width wrappers.
401def SchedWriteFAdd
Simon Pilgrim1233e122018-05-07 20:52:53 +0000402 : X86SchedWriteWidths<WriteFAdd, WriteFAddX, WriteFAddY, WriteFAddY>;
403def SchedWriteFAdd64
404 : X86SchedWriteWidths<WriteFAdd64, WriteFAdd64X, WriteFAdd64Y, WriteFAdd64Y>;
Simon Pilgrim342ac8c2018-05-03 09:11:32 +0000405def SchedWriteFHAdd
406 : X86SchedWriteWidths<WriteFHAdd, WriteFHAdd, WriteFHAddY, WriteFHAddY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000407def SchedWriteFCmp
Simon Pilgrim1233e122018-05-07 20:52:53 +0000408 : X86SchedWriteWidths<WriteFCmp, WriteFCmpX, WriteFCmpY, WriteFCmpY>;
409def SchedWriteFCmp64
410 : X86SchedWriteWidths<WriteFCmp64, WriteFCmp64X, WriteFCmp64Y, WriteFCmp64Y>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000411def SchedWriteFMul
Simon Pilgrim1233e122018-05-07 20:52:53 +0000412 : X86SchedWriteWidths<WriteFMul, WriteFMulX, WriteFMulY, WriteFMulY>;
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000413def SchedWriteFMul64
Simon Pilgrim1233e122018-05-07 20:52:53 +0000414 : X86SchedWriteWidths<WriteFMul64, WriteFMul64X, WriteFMul64Y, WriteFMul64Y>;
Simon Pilgrima1f1a3b2018-05-02 13:32:56 +0000415def SchedWriteFMA
Simon Pilgrim67cc2462018-05-04 15:20:18 +0000416 : X86SchedWriteWidths<WriteFMA, WriteFMAX, WriteFMAY, WriteFMAY>;
Simon Pilgrim542b20d2018-05-03 22:31:19 +0000417def SchedWriteDPPD
418 : X86SchedWriteWidths<WriteDPPD, WriteDPPD, WriteDPPD, WriteDPPD>;
419def SchedWriteDPPS
420 : X86SchedWriteWidths<WriteDPPS, WriteDPPS, WriteDPPSY, WriteDPPSY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000421def SchedWriteFDiv
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000422 : X86SchedWriteWidths<WriteFDiv, WriteFDivX, WriteFDivY, WriteFDivZ>;
423def SchedWriteFDiv64
424 : X86SchedWriteWidths<WriteFDiv64, WriteFDiv64X, WriteFDiv64Y, WriteFDiv64Z>;
Simon Pilgrimc7088682018-05-01 18:06:07 +0000425def SchedWriteFSqrt
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000426 : X86SchedWriteWidths<WriteFSqrt, WriteFSqrtX,
427 WriteFSqrtY, WriteFSqrtZ>;
428def SchedWriteFSqrt64
429 : X86SchedWriteWidths<WriteFSqrt64, WriteFSqrt64X,
430 WriteFSqrt64Y, WriteFSqrt64Z>;
Simon Pilgrim1b7a80d2018-05-01 15:57:17 +0000431def SchedWriteFRcp
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000432 : X86SchedWriteWidths<WriteFRcp, WriteFRcpX, WriteFRcpY, WriteFRcpY>;
Simon Pilgrim1b7a80d2018-05-01 15:57:17 +0000433def SchedWriteFRsqrt
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000434 : X86SchedWriteWidths<WriteFRsqrt, WriteFRsqrtX, WriteFRsqrtY, WriteFRsqrtY>;
Simon Pilgrimbe51b202018-05-04 12:59:24 +0000435def SchedWriteFRnd
436 : X86SchedWriteWidths<WriteFRnd, WriteFRnd, WriteFRndY, WriteFRndY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000437def SchedWriteFLogic
438 : X86SchedWriteWidths<WriteFLogic, WriteFLogic, WriteFLogicY, WriteFLogicY>;
Simon Pilgrim210286e2018-05-08 10:28:03 +0000439def SchedWriteFTest
440 : X86SchedWriteWidths<WriteFTest, WriteFTest, WriteFTestY, WriteFTestY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000441
442def SchedWriteFShuffle
443 : X86SchedWriteWidths<WriteFShuffle, WriteFShuffle,
Simon Pilgrimdd8eae12018-05-01 14:25:01 +0000444 WriteFShuffleY, WriteFShuffleY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000445def SchedWriteFVarShuffle
446 : X86SchedWriteWidths<WriteFVarShuffle, WriteFVarShuffle,
447 WriteFVarShuffleY, WriteFVarShuffleY>;
448def SchedWriteFBlend
449 : X86SchedWriteWidths<WriteFBlend, WriteFBlend, WriteFBlendY, WriteFBlendY>;
450def SchedWriteFVarBlend
451 : X86SchedWriteWidths<WriteFVarBlend, WriteFVarBlend,
452 WriteFVarBlendY, WriteFVarBlendY>;
453
454def SchedWriteVecALU
Simon Pilgrim38ac0e92018-05-10 17:06:09 +0000455 : X86SchedWriteWidths<WriteVecALU, WriteVecALUX, WriteVecALUY, WriteVecALUY>;
Simon Pilgrim342ac8c2018-05-03 09:11:32 +0000456def SchedWritePHAdd
Simon Pilgrim38ac0e92018-05-10 17:06:09 +0000457 : X86SchedWriteWidths<WritePHAdd, WritePHAddX, WritePHAddY, WritePHAddY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000458def SchedWriteVecLogic
Simon Pilgrim38ac0e92018-05-10 17:06:09 +0000459 : X86SchedWriteWidths<WriteVecLogic, WriteVecLogicX,
Simon Pilgrim57f2b182018-05-01 12:39:17 +0000460 WriteVecLogicY, WriteVecLogicY>;
Simon Pilgrim210286e2018-05-08 10:28:03 +0000461def SchedWriteVecTest
462 : X86SchedWriteWidths<WriteVecTest, WriteVecTest,
463 WriteVecTestY, WriteVecTestY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000464def SchedWriteVecShift
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000465 : X86SchedWriteWidths<WriteVecShift, WriteVecShiftX,
466 WriteVecShiftY, WriteVecShiftY>;
467def SchedWriteVecShiftImm
Simon Pilgrimd7ffbc52018-05-04 17:47:46 +0000468 : X86SchedWriteWidths<WriteVecShiftImm, WriteVecShiftImmX,
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000469 WriteVecShiftImmY, WriteVecShiftImmY>;
Simon Pilgrime8671ef2018-05-02 12:27:54 +0000470def SchedWriteVarVecShift
471 : X86SchedWriteWidths<WriteVarVecShift, WriteVarVecShift,
Simon Pilgrimf2d2ced2018-05-03 17:56:43 +0000472 WriteVarVecShiftY, WriteVarVecShiftY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000473def SchedWriteVecIMul
Simon Pilgrimd7ffbc52018-05-04 17:47:46 +0000474 : X86SchedWriteWidths<WriteVecIMul, WriteVecIMulX,
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000475 WriteVecIMulY, WriteVecIMulY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000476def SchedWritePMULLD
477 : X86SchedWriteWidths<WritePMULLD, WritePMULLD,
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000478 WritePMULLDY, WritePMULLDY>;
Simon Pilgrime8671ef2018-05-02 12:27:54 +0000479def SchedWriteMPSAD
480 : X86SchedWriteWidths<WriteMPSAD, WriteMPSAD,
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000481 WriteMPSADY, WriteMPSADY>;
Simon Pilgrime8671ef2018-05-02 12:27:54 +0000482def SchedWritePSADBW
Simon Pilgrim38ac0e92018-05-10 17:06:09 +0000483 : X86SchedWriteWidths<WritePSADBW, WritePSADBWX,
Simon Pilgrim93c878c2018-05-03 10:31:20 +0000484 WritePSADBWY, WritePSADBWY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000485
486def SchedWriteShuffle
Simon Pilgrim38ac0e92018-05-10 17:06:09 +0000487 : X86SchedWriteWidths<WriteShuffle, WriteShuffleX,
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000488 WriteShuffleY, WriteShuffleY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000489def SchedWriteVarShuffle
Simon Pilgrim38ac0e92018-05-10 17:06:09 +0000490 : X86SchedWriteWidths<WriteVarShuffle, WriteVarShuffleX,
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000491 WriteVarShuffleY, WriteVarShuffleY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000492def SchedWriteBlend
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000493 : X86SchedWriteWidths<WriteBlend, WriteBlend, WriteBlendY, WriteBlendY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000494def SchedWriteVarBlend
495 : X86SchedWriteWidths<WriteVarBlend, WriteVarBlend,
Simon Pilgrim6732f6e2018-05-02 18:48:23 +0000496 WriteVarBlendY, WriteVarBlendY>;
Simon Pilgrim3c354082018-04-30 18:18:38 +0000497
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000498// Vector size wrappers.
499def SchedWriteFAddSizes
Simon Pilgrim1233e122018-05-07 20:52:53 +0000500 : X86SchedWriteSizes<SchedWriteFAdd, SchedWriteFAdd64>;
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000501def SchedWriteFCmpSizes
Simon Pilgrim1233e122018-05-07 20:52:53 +0000502 : X86SchedWriteSizes<SchedWriteFCmp, SchedWriteFCmp64>;
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000503def SchedWriteFMulSizes
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000504 : X86SchedWriteSizes<SchedWriteFMul, SchedWriteFMul64>;
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000505def SchedWriteFDivSizes
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000506 : X86SchedWriteSizes<SchedWriteFDiv, SchedWriteFDiv64>;
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000507def SchedWriteFSqrtSizes
508 : X86SchedWriteSizes<SchedWriteFSqrt, SchedWriteFSqrt64>;
Simon Pilgrimac5d0a32018-05-07 16:15:46 +0000509def SchedWriteFLogicSizes
510 : X86SchedWriteSizes<SchedWriteFLogic, SchedWriteFLogic>;
511def SchedWriteFShuffleSizes
512 : X86SchedWriteSizes<SchedWriteFShuffle, SchedWriteFShuffle>;
Simon Pilgrimf3ae50f2018-05-07 11:50:44 +0000513
Simon Pilgrima271c542017-05-03 15:42:29 +0000514//===----------------------------------------------------------------------===//
Simon Pilgrim35935c02018-04-12 18:46:15 +0000515// Generic Processor Scheduler Models.
Simon Pilgrima271c542017-05-03 15:42:29 +0000516
517// IssueWidth is analogous to the number of decode units. Core and its
518// descendents, including Nehalem and SandyBridge have 4 decoders.
519// Resources beyond the decoder operate on micro-ops and are bufferred
520// so adjacent micro-ops don't directly compete.
521//
522// MicroOpBufferSize > 1 indicates that RAW dependencies can be
523// decoded in the same cycle. The value 32 is a reasonably arbitrary
524// number of in-flight instructions.
525//
526// HighLatency=10 is optimistic. X86InstrInfo::isHighLatencyDef
527// indicates high latency opcodes. Alternatively, InstrItinData
528// entries may be included here to define specific operand
529// latencies. Since these latencies are not used for pipeline hazards,
530// they do not need to be exact.
531//
Simon Pilgrime0c78682018-04-13 14:31:57 +0000532// The GenericX86Model contains no instruction schedules
Simon Pilgrima271c542017-05-03 15:42:29 +0000533// and disables PostRAScheduler.
534class GenericX86Model : SchedMachineModel {
535 let IssueWidth = 4;
536 let MicroOpBufferSize = 32;
537 let LoadLatency = 4;
538 let HighLatency = 10;
539 let PostRAScheduler = 0;
540 let CompleteModel = 0;
541}
542
543def GenericModel : GenericX86Model;
544
545// Define a model with the PostRAScheduler enabled.
546def GenericPostRAModel : GenericX86Model {
547 let PostRAScheduler = 1;
548}
549