blob: 85ca7a9b0adeec4819dabc70265be012f03e7c12 [file] [log] [blame]
Simon Pilgrima271c542017-05-03 15:42:29 +00001//===-- X86Schedule.td - X86 Scheduling Definitions --------*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10// InstrSchedModel annotations for out-of-order CPUs.
11//
12// These annotations are independent of the itinerary classes defined below.
13
14// Instructions with folded loads need to read the memory operand immediately,
15// but other register operands don't have to be read until the load is ready.
16// These operands are marked with ReadAfterLd.
17def ReadAfterLd : SchedRead;
18
19// Instructions with both a load and a store folded are modeled as a folded
20// load + WriteRMW.
21def WriteRMW : SchedWrite;
22
23// Most instructions can fold loads, so almost every SchedWrite comes in two
24// variants: With and without a folded load.
25// An X86FoldableSchedWrite holds a reference to the corresponding SchedWrite
26// with a folded load.
27class X86FoldableSchedWrite : SchedWrite {
28 // The SchedWrite to use when a load is folded into the instruction.
29 SchedWrite Folded;
30}
31
32// Multiclass that produces a linked pair of SchedWrites.
33multiclass X86SchedWritePair {
34 // Register-Memory operation.
35 def Ld : SchedWrite;
36 // Register-Register operation.
37 def NAME : X86FoldableSchedWrite {
38 let Folded = !cast<SchedWrite>(NAME#"Ld");
39 }
40}
41
42// Arithmetic.
43defm WriteALU : X86SchedWritePair; // Simple integer ALU op.
44defm WriteIMul : X86SchedWritePair; // Integer multiplication.
45def WriteIMulH : SchedWrite; // Integer multiplication, high part.
46defm WriteIDiv : X86SchedWritePair; // Integer division.
47def WriteLEA : SchedWrite; // LEA instructions can't fold loads.
48
Simon Pilgrimf33d9052018-03-26 18:19:28 +000049defm WriteBitScan : X86SchedWritePair; // Bit scan forward/reverse.
50defm WritePOPCNT : X86SchedWritePair; // Bit population count.
51defm WriteLZCNT : X86SchedWritePair; // Leading zero count.
52defm WriteTZCNT : X86SchedWritePair; // Trailing zero count.
53
Simon Pilgrima271c542017-05-03 15:42:29 +000054// Integer shifts and rotates.
55defm WriteShift : X86SchedWritePair;
56
57// Loads, stores, and moves, not folded with other operations.
58def WriteLoad : SchedWrite;
59def WriteStore : SchedWrite;
60def WriteMove : SchedWrite;
61
62// Idioms that clear a register, like xorps %xmm0, %xmm0.
63// These can often bypass execution ports completely.
64def WriteZero : SchedWrite;
65
66// Branches don't produce values, so they have no latency, but they still
67// consume resources. Indirect branches can fold loads.
68defm WriteJump : X86SchedWritePair;
69
70// Floating point. This covers both scalar and vector operations.
Simon Pilgrimfb7aa572018-03-15 14:45:30 +000071def WriteFLoad : SchedWrite;
72def WriteFStore : SchedWrite;
73def WriteFMove : SchedWrite;
Simon Pilgrima271c542017-05-03 15:42:29 +000074defm WriteFAdd : X86SchedWritePair; // Floating point add/sub/compare.
75defm WriteFMul : X86SchedWritePair; // Floating point multiplication.
76defm WriteFDiv : X86SchedWritePair; // Floating point division.
77defm WriteFSqrt : X86SchedWritePair; // Floating point square root.
78defm WriteFRcp : X86SchedWritePair; // Floating point reciprocal estimate.
79defm WriteFRsqrt : X86SchedWritePair; // Floating point reciprocal square root estimate.
80defm WriteFMA : X86SchedWritePair; // Fused Multiply Add.
81defm WriteFShuffle : X86SchedWritePair; // Floating point vector shuffles.
82defm WriteFBlend : X86SchedWritePair; // Floating point vector blends.
83defm WriteFVarBlend : X86SchedWritePair; // Fp vector variable blends.
84
85// FMA Scheduling helper class.
86class FMASC { X86FoldableSchedWrite Sched = WriteFAdd; }
87
Andrew V. Tischenko8cb1d092017-06-08 16:44:13 +000088// Horizontal Add/Sub (float and integer)
89defm WriteFHAdd : X86SchedWritePair;
90defm WritePHAdd : X86SchedWritePair;
91
Simon Pilgrima271c542017-05-03 15:42:29 +000092// Vector integer operations.
Simon Pilgrimfb7aa572018-03-15 14:45:30 +000093def WriteVecLoad : SchedWrite;
94def WriteVecStore : SchedWrite;
95def WriteVecMove : SchedWrite;
Simon Pilgrima271c542017-05-03 15:42:29 +000096defm WriteVecALU : X86SchedWritePair; // Vector integer ALU op, no logicals.
97defm WriteVecShift : X86SchedWritePair; // Vector integer shifts.
98defm WriteVecIMul : X86SchedWritePair; // Vector integer multiply.
99defm WriteShuffle : X86SchedWritePair; // Vector shuffles.
100defm WriteBlend : X86SchedWritePair; // Vector blends.
101defm WriteVarBlend : X86SchedWritePair; // Vector variable blends.
102defm WriteMPSAD : X86SchedWritePair; // Vector MPSAD.
103
104// Vector bitwise operations.
105// These are often used on both floating point and integer vectors.
106defm WriteVecLogic : X86SchedWritePair; // Vector and/or/xor.
107
108// Conversion between integer and float.
109defm WriteCvtF2I : X86SchedWritePair; // Float -> Integer.
110defm WriteCvtI2F : X86SchedWritePair; // Integer -> Float.
111defm WriteCvtF2F : X86SchedWritePair; // Float -> Float size conversion.
112
Simon Pilgrim28e7bcb2018-03-26 21:06:14 +0000113// CRC32 instruction.
114defm WriteCRC32 : X86SchedWritePair;
115
Simon Pilgrima271c542017-05-03 15:42:29 +0000116// Strings instructions.
117// Packed Compare Implicit Length Strings, Return Mask
118defm WritePCmpIStrM : X86SchedWritePair;
119// Packed Compare Explicit Length Strings, Return Mask
120defm WritePCmpEStrM : X86SchedWritePair;
121// Packed Compare Implicit Length Strings, Return Index
122defm WritePCmpIStrI : X86SchedWritePair;
123// Packed Compare Explicit Length Strings, Return Index
124defm WritePCmpEStrI : X86SchedWritePair;
125
126// AES instructions.
127defm WriteAESDecEnc : X86SchedWritePair; // Decryption, encryption.
128defm WriteAESIMC : X86SchedWritePair; // InvMixColumn.
129defm WriteAESKeyGen : X86SchedWritePair; // Key Generation.
130
131// Carry-less multiplication instructions.
132defm WriteCLMul : X86SchedWritePair;
133
134// Catch-all for expensive system instructions.
135def WriteSystem : SchedWrite;
136
137// AVX2.
138defm WriteFShuffle256 : X86SchedWritePair; // Fp 256-bit width vector shuffles.
139defm WriteShuffle256 : X86SchedWritePair; // 256-bit width vector shuffles.
140defm WriteVarVecShift : X86SchedWritePair; // Variable vector shifts.
141
142// Old microcoded instructions that nobody use.
143def WriteMicrocoded : SchedWrite;
144
145// Fence instructions.
146def WriteFence : SchedWrite;
147
148// Nop, not very useful expect it provides a model for nops!
149def WriteNop : SchedWrite;
150
151//===----------------------------------------------------------------------===//
152// Instruction Itinerary classes used for X86
153def IIC_ALU_MEM : InstrItinClass;
154def IIC_ALU_NONMEM : InstrItinClass;
155def IIC_LEA : InstrItinClass;
156def IIC_LEA_16 : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000157def IIC_MUL8_MEM : InstrItinClass;
158def IIC_MUL8_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000159def IIC_MUL16_MEM : InstrItinClass;
160def IIC_MUL16_REG : InstrItinClass;
161def IIC_MUL32_MEM : InstrItinClass;
162def IIC_MUL32_REG : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000163def IIC_MUL64_MEM : InstrItinClass;
164def IIC_MUL64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000165// imul by al, ax, eax, tax
Craig Topper5ccd8722018-03-19 16:38:33 +0000166def IIC_IMUL8_MEM : InstrItinClass;
167def IIC_IMUL8_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000168def IIC_IMUL16_MEM : InstrItinClass;
169def IIC_IMUL16_REG : InstrItinClass;
170def IIC_IMUL32_MEM : InstrItinClass;
171def IIC_IMUL32_REG : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000172def IIC_IMUL64_MEM : InstrItinClass;
173def IIC_IMUL64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000174// imul reg by reg|mem
175def IIC_IMUL16_RM : InstrItinClass;
176def IIC_IMUL16_RR : InstrItinClass;
177def IIC_IMUL32_RM : InstrItinClass;
178def IIC_IMUL32_RR : InstrItinClass;
179def IIC_IMUL64_RM : InstrItinClass;
180def IIC_IMUL64_RR : InstrItinClass;
181// imul reg = reg/mem * imm
182def IIC_IMUL16_RMI : InstrItinClass;
183def IIC_IMUL16_RRI : InstrItinClass;
184def IIC_IMUL32_RMI : InstrItinClass;
185def IIC_IMUL32_RRI : InstrItinClass;
186def IIC_IMUL64_RMI : InstrItinClass;
187def IIC_IMUL64_RRI : InstrItinClass;
188// div
189def IIC_DIV8_MEM : InstrItinClass;
190def IIC_DIV8_REG : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000191def IIC_DIV16_MEM : InstrItinClass;
192def IIC_DIV16_REG : InstrItinClass;
193def IIC_DIV32_MEM : InstrItinClass;
194def IIC_DIV32_REG : InstrItinClass;
195def IIC_DIV64_MEM : InstrItinClass;
196def IIC_DIV64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000197// idiv
Craig Topper5ccd8722018-03-19 16:38:33 +0000198def IIC_IDIV8_MEM : InstrItinClass;
199def IIC_IDIV8_REG : InstrItinClass;
200def IIC_IDIV16_MEM : InstrItinClass;
201def IIC_IDIV16_REG : InstrItinClass;
202def IIC_IDIV32_MEM : InstrItinClass;
203def IIC_IDIV32_REG : InstrItinClass;
204def IIC_IDIV64_MEM : InstrItinClass;
205def IIC_IDIV64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000206// neg/not/inc/dec
207def IIC_UNARY_REG : InstrItinClass;
208def IIC_UNARY_MEM : InstrItinClass;
209// add/sub/and/or/xor/sbc/cmp/test
210def IIC_BIN_MEM : InstrItinClass;
211def IIC_BIN_NONMEM : InstrItinClass;
212// adc/sbc
213def IIC_BIN_CARRY_MEM : InstrItinClass;
214def IIC_BIN_CARRY_NONMEM : InstrItinClass;
215// shift/rotate
216def IIC_SR : InstrItinClass;
217// shift double
218def IIC_SHD16_REG_IM : InstrItinClass;
219def IIC_SHD16_REG_CL : InstrItinClass;
220def IIC_SHD16_MEM_IM : InstrItinClass;
221def IIC_SHD16_MEM_CL : InstrItinClass;
222def IIC_SHD32_REG_IM : InstrItinClass;
223def IIC_SHD32_REG_CL : InstrItinClass;
224def IIC_SHD32_MEM_IM : InstrItinClass;
225def IIC_SHD32_MEM_CL : InstrItinClass;
226def IIC_SHD64_REG_IM : InstrItinClass;
227def IIC_SHD64_REG_CL : InstrItinClass;
228def IIC_SHD64_MEM_IM : InstrItinClass;
229def IIC_SHD64_MEM_CL : InstrItinClass;
230// cmov
231def IIC_CMOV16_RM : InstrItinClass;
232def IIC_CMOV16_RR : InstrItinClass;
233def IIC_CMOV32_RM : InstrItinClass;
234def IIC_CMOV32_RR : InstrItinClass;
235def IIC_CMOV64_RM : InstrItinClass;
236def IIC_CMOV64_RR : InstrItinClass;
237// set
238def IIC_SET_R : InstrItinClass;
239def IIC_SET_M : InstrItinClass;
240// jmp/jcc/jcxz
241def IIC_Jcc : InstrItinClass;
242def IIC_JCXZ : InstrItinClass;
243def IIC_JMP_REL : InstrItinClass;
244def IIC_JMP_REG : InstrItinClass;
245def IIC_JMP_MEM : InstrItinClass;
246def IIC_JMP_FAR_MEM : InstrItinClass;
247def IIC_JMP_FAR_PTR : InstrItinClass;
248// loop
249def IIC_LOOP : InstrItinClass;
250def IIC_LOOPE : InstrItinClass;
251def IIC_LOOPNE : InstrItinClass;
252// call
253def IIC_CALL_RI : InstrItinClass;
254def IIC_CALL_MEM : InstrItinClass;
255def IIC_CALL_FAR_MEM : InstrItinClass;
256def IIC_CALL_FAR_PTR : InstrItinClass;
257// ret
258def IIC_RET : InstrItinClass;
259def IIC_RET_IMM : InstrItinClass;
260//sign extension movs
261def IIC_MOVSX : InstrItinClass;
262def IIC_MOVSX_R16_R8 : InstrItinClass;
263def IIC_MOVSX_R16_M8 : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000264//zero extension movs
265def IIC_MOVZX : InstrItinClass;
266def IIC_MOVZX_R16_R8 : InstrItinClass;
267def IIC_MOVZX_R16_M8 : InstrItinClass;
268
269def IIC_REP_MOVS : InstrItinClass;
270def IIC_REP_STOS : InstrItinClass;
271
272// SSE scalar/parallel binary operations
273def IIC_SSE_ALU_F32S_RR : InstrItinClass;
274def IIC_SSE_ALU_F32S_RM : InstrItinClass;
275def IIC_SSE_ALU_F64S_RR : InstrItinClass;
276def IIC_SSE_ALU_F64S_RM : InstrItinClass;
277def IIC_SSE_MUL_F32S_RR : InstrItinClass;
278def IIC_SSE_MUL_F32S_RM : InstrItinClass;
279def IIC_SSE_MUL_F64S_RR : InstrItinClass;
280def IIC_SSE_MUL_F64S_RM : InstrItinClass;
281def IIC_SSE_DIV_F32S_RR : InstrItinClass;
282def IIC_SSE_DIV_F32S_RM : InstrItinClass;
283def IIC_SSE_DIV_F64S_RR : InstrItinClass;
284def IIC_SSE_DIV_F64S_RM : InstrItinClass;
285def IIC_SSE_ALU_F32P_RR : InstrItinClass;
286def IIC_SSE_ALU_F32P_RM : InstrItinClass;
287def IIC_SSE_ALU_F64P_RR : InstrItinClass;
288def IIC_SSE_ALU_F64P_RM : InstrItinClass;
289def IIC_SSE_MUL_F32P_RR : InstrItinClass;
290def IIC_SSE_MUL_F32P_RM : InstrItinClass;
291def IIC_SSE_MUL_F64P_RR : InstrItinClass;
292def IIC_SSE_MUL_F64P_RM : InstrItinClass;
293def IIC_SSE_DIV_F32P_RR : InstrItinClass;
294def IIC_SSE_DIV_F32P_RM : InstrItinClass;
295def IIC_SSE_DIV_F64P_RR : InstrItinClass;
296def IIC_SSE_DIV_F64P_RM : InstrItinClass;
297
298def IIC_SSE_COMIS_RR : InstrItinClass;
299def IIC_SSE_COMIS_RM : InstrItinClass;
300
301def IIC_SSE_HADDSUB_RR : InstrItinClass;
302def IIC_SSE_HADDSUB_RM : InstrItinClass;
303
304def IIC_SSE_BIT_P_RR : InstrItinClass;
305def IIC_SSE_BIT_P_RM : InstrItinClass;
306
307def IIC_SSE_INTALU_P_RR : InstrItinClass;
308def IIC_SSE_INTALU_P_RM : InstrItinClass;
309def IIC_SSE_INTALUQ_P_RR : InstrItinClass;
310def IIC_SSE_INTALUQ_P_RM : InstrItinClass;
311
312def IIC_SSE_INTMUL_P_RR : InstrItinClass;
313def IIC_SSE_INTMUL_P_RM : InstrItinClass;
314
315def IIC_SSE_INTSH_P_RR : InstrItinClass;
316def IIC_SSE_INTSH_P_RM : InstrItinClass;
317def IIC_SSE_INTSH_P_RI : InstrItinClass;
318
319def IIC_SSE_INTSHDQ_P_RI : InstrItinClass;
320
321def IIC_SSE_SHUFP : InstrItinClass;
322def IIC_SSE_PSHUF_RI : InstrItinClass;
323def IIC_SSE_PSHUF_MI : InstrItinClass;
324
Simon Pilgrim3f24ff62017-08-01 16:47:48 +0000325def IIC_SSE_PACK : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000326def IIC_SSE_UNPCK : InstrItinClass;
327
328def IIC_SSE_MOVMSK : InstrItinClass;
329def IIC_SSE_MASKMOV : InstrItinClass;
330
331def IIC_SSE_PEXTRW : InstrItinClass;
332def IIC_SSE_PINSRW : InstrItinClass;
333
334def IIC_SSE_PABS_RR : InstrItinClass;
335def IIC_SSE_PABS_RM : InstrItinClass;
336
337def IIC_SSE_SQRTPS_RR : InstrItinClass;
338def IIC_SSE_SQRTPS_RM : InstrItinClass;
339def IIC_SSE_SQRTSS_RR : InstrItinClass;
340def IIC_SSE_SQRTSS_RM : InstrItinClass;
341def IIC_SSE_SQRTPD_RR : InstrItinClass;
342def IIC_SSE_SQRTPD_RM : InstrItinClass;
343def IIC_SSE_SQRTSD_RR : InstrItinClass;
344def IIC_SSE_SQRTSD_RM : InstrItinClass;
345
346def IIC_SSE_RSQRTPS_RR : InstrItinClass;
347def IIC_SSE_RSQRTPS_RM : InstrItinClass;
348def IIC_SSE_RSQRTSS_RR : InstrItinClass;
349def IIC_SSE_RSQRTSS_RM : InstrItinClass;
350
351def IIC_SSE_RCPP_RR : InstrItinClass;
352def IIC_SSE_RCPP_RM : InstrItinClass;
353def IIC_SSE_RCPS_RR : InstrItinClass;
354def IIC_SSE_RCPS_RM : InstrItinClass;
355
356def IIC_SSE_MOV_S_RR : InstrItinClass;
357def IIC_SSE_MOV_S_RM : InstrItinClass;
358def IIC_SSE_MOV_S_MR : InstrItinClass;
359
360def IIC_SSE_MOVA_P_RR : InstrItinClass;
361def IIC_SSE_MOVA_P_RM : InstrItinClass;
362def IIC_SSE_MOVA_P_MR : InstrItinClass;
363
364def IIC_SSE_MOVU_P_RR : InstrItinClass;
365def IIC_SSE_MOVU_P_RM : InstrItinClass;
366def IIC_SSE_MOVU_P_MR : InstrItinClass;
367
368def IIC_SSE_MOVDQ : InstrItinClass;
369def IIC_SSE_MOVD_ToGP : InstrItinClass;
370def IIC_SSE_MOVQ_RR : InstrItinClass;
371
372def IIC_SSE_MOV_LH : InstrItinClass;
373
374def IIC_SSE_LDDQU : InstrItinClass;
375
376def IIC_SSE_MOVNT : InstrItinClass;
377
378def IIC_SSE_PHADDSUBD_RR : InstrItinClass;
379def IIC_SSE_PHADDSUBD_RM : InstrItinClass;
380def IIC_SSE_PHADDSUBSW_RR : InstrItinClass;
381def IIC_SSE_PHADDSUBSW_RM : InstrItinClass;
382def IIC_SSE_PHADDSUBW_RR : InstrItinClass;
383def IIC_SSE_PHADDSUBW_RM : InstrItinClass;
384def IIC_SSE_PSHUFB_RR : InstrItinClass;
385def IIC_SSE_PSHUFB_RM : InstrItinClass;
386def IIC_SSE_PSIGN_RR : InstrItinClass;
387def IIC_SSE_PSIGN_RM : InstrItinClass;
388
389def IIC_SSE_PMADD : InstrItinClass;
390def IIC_SSE_PMULHRSW : InstrItinClass;
391def IIC_SSE_PALIGNRR : InstrItinClass;
392def IIC_SSE_PALIGNRM : InstrItinClass;
393def IIC_SSE_MWAIT : InstrItinClass;
394def IIC_SSE_MONITOR : InstrItinClass;
395def IIC_SSE_MWAITX : InstrItinClass;
396def IIC_SSE_MONITORX : InstrItinClass;
397def IIC_SSE_CLZERO : InstrItinClass;
398
399def IIC_SSE_PREFETCH : InstrItinClass;
400def IIC_SSE_PAUSE : InstrItinClass;
401def IIC_SSE_LFENCE : InstrItinClass;
402def IIC_SSE_MFENCE : InstrItinClass;
403def IIC_SSE_SFENCE : InstrItinClass;
404def IIC_SSE_LDMXCSR : InstrItinClass;
405def IIC_SSE_STMXCSR : InstrItinClass;
406
407def IIC_SSE_CVT_PD_RR : InstrItinClass;
408def IIC_SSE_CVT_PD_RM : InstrItinClass;
409def IIC_SSE_CVT_PS_RR : InstrItinClass;
410def IIC_SSE_CVT_PS_RM : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000411def IIC_SSE_CVT_Scalar_RR : InstrItinClass;
412def IIC_SSE_CVT_Scalar_RM : InstrItinClass;
413def IIC_SSE_CVT_SS2SI32_RM : InstrItinClass;
414def IIC_SSE_CVT_SS2SI32_RR : InstrItinClass;
415def IIC_SSE_CVT_SS2SI64_RM : InstrItinClass;
416def IIC_SSE_CVT_SS2SI64_RR : InstrItinClass;
417def IIC_SSE_CVT_SD2SI_RM : InstrItinClass;
418def IIC_SSE_CVT_SD2SI_RR : InstrItinClass;
419
Simon Pilgrim91c159d2017-12-10 12:26:35 +0000420def IIC_AVX_ZERO : InstrItinClass;
421
Simon Pilgrima271c542017-05-03 15:42:29 +0000422// MMX
423def IIC_MMX_MOV_MM_RM : InstrItinClass;
424def IIC_MMX_MOV_REG_MM : InstrItinClass;
425def IIC_MMX_MOVQ_RM : InstrItinClass;
426def IIC_MMX_MOVQ_RR : InstrItinClass;
427
428def IIC_MMX_ALU_RM : InstrItinClass;
429def IIC_MMX_ALU_RR : InstrItinClass;
430def IIC_MMX_ALUQ_RM : InstrItinClass;
431def IIC_MMX_ALUQ_RR : InstrItinClass;
432def IIC_MMX_PHADDSUBW_RM : InstrItinClass;
433def IIC_MMX_PHADDSUBW_RR : InstrItinClass;
434def IIC_MMX_PHADDSUBD_RM : InstrItinClass;
435def IIC_MMX_PHADDSUBD_RR : InstrItinClass;
436def IIC_MMX_PMUL : InstrItinClass;
437def IIC_MMX_MISC_FUNC_MEM : InstrItinClass;
438def IIC_MMX_MISC_FUNC_REG : InstrItinClass;
439def IIC_MMX_PSADBW : InstrItinClass;
440def IIC_MMX_SHIFT_RI : InstrItinClass;
441def IIC_MMX_SHIFT_RM : InstrItinClass;
442def IIC_MMX_SHIFT_RR : InstrItinClass;
443def IIC_MMX_UNPCK_H_RM : InstrItinClass;
444def IIC_MMX_UNPCK_H_RR : InstrItinClass;
445def IIC_MMX_UNPCK_L : InstrItinClass;
446def IIC_MMX_PCK_RM : InstrItinClass;
447def IIC_MMX_PCK_RR : InstrItinClass;
448def IIC_MMX_PSHUF : InstrItinClass;
449def IIC_MMX_PEXTR : InstrItinClass;
450def IIC_MMX_PINSRW : InstrItinClass;
451def IIC_MMX_MASKMOV : InstrItinClass;
Simon Pilgrimf545bb6c2017-11-26 17:56:07 +0000452def IIC_MMX_MOVMSK : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000453def IIC_MMX_CVT_PD_RR : InstrItinClass;
454def IIC_MMX_CVT_PD_RM : InstrItinClass;
455def IIC_MMX_CVT_PS_RR : InstrItinClass;
456def IIC_MMX_CVT_PS_RM : InstrItinClass;
457
Simon Pilgrimfe6e92d2017-11-26 20:50:29 +0000458def IIC_3DNOW_FALU_RM : InstrItinClass;
459def IIC_3DNOW_FALU_RR : InstrItinClass;
460def IIC_3DNOW_FCVT_F2I_RM : InstrItinClass;
461def IIC_3DNOW_FCVT_F2I_RR : InstrItinClass;
462def IIC_3DNOW_FCVT_I2F_RM : InstrItinClass;
463def IIC_3DNOW_FCVT_I2F_RR : InstrItinClass;
464def IIC_3DNOW_MISC_FUNC_REG : InstrItinClass;
465def IIC_3DNOW_MISC_FUNC_MEM : InstrItinClass;
466
Simon Pilgrima271c542017-05-03 15:42:29 +0000467def IIC_CMPX_LOCK : InstrItinClass;
468def IIC_CMPX_LOCK_8 : InstrItinClass;
469def IIC_CMPX_LOCK_8B : InstrItinClass;
470def IIC_CMPX_LOCK_16B : InstrItinClass;
471
472def IIC_XADD_LOCK_MEM : InstrItinClass;
473def IIC_XADD_LOCK_MEM8 : InstrItinClass;
474
Simon Pilgrim65f805f2017-12-05 18:01:26 +0000475def IIC_FCMOV : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000476def IIC_FILD : InstrItinClass;
477def IIC_FLD : InstrItinClass;
478def IIC_FLD80 : InstrItinClass;
479def IIC_FST : InstrItinClass;
480def IIC_FST80 : InstrItinClass;
481def IIC_FIST : InstrItinClass;
482def IIC_FLDZ : InstrItinClass;
483def IIC_FUCOM : InstrItinClass;
484def IIC_FUCOMI : InstrItinClass;
485def IIC_FCOMI : InstrItinClass;
486def IIC_FNSTSW : InstrItinClass;
487def IIC_FNSTCW : InstrItinClass;
488def IIC_FLDCW : InstrItinClass;
489def IIC_FNINIT : InstrItinClass;
490def IIC_FFREE : InstrItinClass;
491def IIC_FNCLEX : InstrItinClass;
492def IIC_WAIT : InstrItinClass;
493def IIC_FXAM : InstrItinClass;
494def IIC_FNOP : InstrItinClass;
495def IIC_FLDL : InstrItinClass;
496def IIC_F2XM1 : InstrItinClass;
497def IIC_FYL2X : InstrItinClass;
498def IIC_FPTAN : InstrItinClass;
499def IIC_FPATAN : InstrItinClass;
500def IIC_FXTRACT : InstrItinClass;
501def IIC_FPREM1 : InstrItinClass;
502def IIC_FPSTP : InstrItinClass;
503def IIC_FPREM : InstrItinClass;
Simon Pilgrim0747a7e2017-11-28 15:03:42 +0000504def IIC_FSIGN : InstrItinClass;
505def IIC_FSQRT : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000506def IIC_FYL2XP1 : InstrItinClass;
507def IIC_FSINCOS : InstrItinClass;
508def IIC_FRNDINT : InstrItinClass;
509def IIC_FSCALE : InstrItinClass;
510def IIC_FCOMPP : InstrItinClass;
511def IIC_FXSAVE : InstrItinClass;
512def IIC_FXRSTOR : InstrItinClass;
513
514def IIC_FXCH : InstrItinClass;
515
516// System instructions
517def IIC_CPUID : InstrItinClass;
518def IIC_INT : InstrItinClass;
519def IIC_INT3 : InstrItinClass;
520def IIC_INVD : InstrItinClass;
521def IIC_INVLPG : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000522def IIC_INVPCID : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000523def IIC_IRET : InstrItinClass;
524def IIC_HLT : InstrItinClass;
525def IIC_LXS : InstrItinClass;
526def IIC_LTR : InstrItinClass;
Simon Pilgrim42fcda92017-12-08 19:03:42 +0000527def IIC_MPX : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000528def IIC_PKU : InstrItinClass;
529def IIC_PTWRITE : InstrItinClass;
530def IIC_RDPID : InstrItinClass;
Simon Pilgrim60411d92017-12-07 14:18:48 +0000531def IIC_RDRAND : InstrItinClass;
532def IIC_RDSEED : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000533def IIC_RDTSC : InstrItinClass;
Simon Pilgrimf00ea1b2017-12-13 14:22:04 +0000534def IIC_RDTSCP : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000535def IIC_RSM : InstrItinClass;
536def IIC_SIDT : InstrItinClass;
537def IIC_SGDT : InstrItinClass;
538def IIC_SLDT : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000539def IIC_SMAP : InstrItinClass;
540def IIC_SMX : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000541def IIC_STR : InstrItinClass;
Simon Pilgrim6b7cd862017-12-07 14:35:17 +0000542def IIC_SKINIT : InstrItinClass;
543def IIC_SVM : InstrItinClass;
Simon Pilgrima13271b2017-12-07 15:57:32 +0000544def IIC_VMX : InstrItinClass;
Simon Pilgrim6b7cd862017-12-07 14:35:17 +0000545def IIC_CLGI : InstrItinClass;
546def IIC_STGI : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000547def IIC_SWAPGS : InstrItinClass;
548def IIC_SYSCALL : InstrItinClass;
549def IIC_SYS_ENTER_EXIT : InstrItinClass;
550def IIC_IN_RR : InstrItinClass;
551def IIC_IN_RI : InstrItinClass;
552def IIC_OUT_RR : InstrItinClass;
553def IIC_OUT_IR : InstrItinClass;
554def IIC_INS : InstrItinClass;
Simon Pilgrim99b925b2017-05-03 15:51:39 +0000555def IIC_LWP : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000556def IIC_MOV_REG_DR : InstrItinClass;
557def IIC_MOV_DR_REG : InstrItinClass;
558def IIC_MOV_REG_CR : InstrItinClass;
559def IIC_MOV_CR_REG : InstrItinClass;
560def IIC_MOV_REG_SR : InstrItinClass;
561def IIC_MOV_MEM_SR : InstrItinClass;
562def IIC_MOV_SR_REG : InstrItinClass;
563def IIC_MOV_SR_MEM : InstrItinClass;
564def IIC_LAR_RM : InstrItinClass;
565def IIC_LAR_RR : InstrItinClass;
566def IIC_LSL_RM : InstrItinClass;
567def IIC_LSL_RR : InstrItinClass;
568def IIC_LGDT : InstrItinClass;
569def IIC_LIDT : InstrItinClass;
570def IIC_LLDT_REG : InstrItinClass;
571def IIC_LLDT_MEM : InstrItinClass;
572def IIC_PUSH_CS : InstrItinClass;
573def IIC_PUSH_SR : InstrItinClass;
574def IIC_POP_SR : InstrItinClass;
575def IIC_POP_SR_SS : InstrItinClass;
Simon Pilgrim7e636cc2017-12-09 20:42:27 +0000576def IIC_SEGMENT_BASE_R : InstrItinClass;
577def IIC_SEGMENT_BASE_W : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000578def IIC_VERR : InstrItinClass;
579def IIC_VERW_REG : InstrItinClass;
580def IIC_VERW_MEM : InstrItinClass;
581def IIC_WRMSR : InstrItinClass;
582def IIC_RDMSR : InstrItinClass;
583def IIC_RDPMC : InstrItinClass;
584def IIC_SMSW : InstrItinClass;
585def IIC_LMSW_REG : InstrItinClass;
586def IIC_LMSW_MEM : InstrItinClass;
587def IIC_ENTER : InstrItinClass;
588def IIC_LEAVE : InstrItinClass;
589def IIC_POP_MEM : InstrItinClass;
590def IIC_POP_REG16 : InstrItinClass;
591def IIC_POP_REG : InstrItinClass;
592def IIC_POP_F : InstrItinClass;
593def IIC_POP_FD : InstrItinClass;
594def IIC_POP_A : InstrItinClass;
595def IIC_PUSH_IMM : InstrItinClass;
596def IIC_PUSH_MEM : InstrItinClass;
597def IIC_PUSH_REG : InstrItinClass;
598def IIC_PUSH_F : InstrItinClass;
599def IIC_PUSH_A : InstrItinClass;
600def IIC_BSWAP : InstrItinClass;
601def IIC_BIT_SCAN_MEM : InstrItinClass;
602def IIC_BIT_SCAN_REG : InstrItinClass;
Simon Pilgrimf1d599a2017-12-07 15:24:14 +0000603def IIC_LZCNT_RR : InstrItinClass;
604def IIC_LZCNT_RM : InstrItinClass;
605def IIC_TZCNT_RR : InstrItinClass;
606def IIC_TZCNT_RM : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000607def IIC_MOVS : InstrItinClass;
608def IIC_STOS : InstrItinClass;
609def IIC_SCAS : InstrItinClass;
610def IIC_CMPS : InstrItinClass;
611def IIC_MOV : InstrItinClass;
612def IIC_MOV_MEM : InstrItinClass;
613def IIC_AHF : InstrItinClass;
614def IIC_BT_MI : InstrItinClass;
615def IIC_BT_MR : InstrItinClass;
616def IIC_BT_RI : InstrItinClass;
617def IIC_BT_RR : InstrItinClass;
618def IIC_BTX_MI : InstrItinClass;
619def IIC_BTX_MR : InstrItinClass;
620def IIC_BTX_RI : InstrItinClass;
621def IIC_BTX_RR : InstrItinClass;
622def IIC_XCHG_REG : InstrItinClass;
623def IIC_XCHG_MEM : InstrItinClass;
624def IIC_XADD_REG : InstrItinClass;
625def IIC_XADD_MEM : InstrItinClass;
626def IIC_CMPXCHG_MEM : InstrItinClass;
627def IIC_CMPXCHG_REG : InstrItinClass;
628def IIC_CMPXCHG_MEM8 : InstrItinClass;
629def IIC_CMPXCHG_REG8 : InstrItinClass;
630def IIC_CMPXCHG_8B : InstrItinClass;
631def IIC_CMPXCHG_16B : InstrItinClass;
632def IIC_LODS : InstrItinClass;
633def IIC_OUTS : InstrItinClass;
634def IIC_CLC : InstrItinClass;
635def IIC_CLD : InstrItinClass;
636def IIC_CLI : InstrItinClass;
637def IIC_CMC : InstrItinClass;
638def IIC_CLTS : InstrItinClass;
639def IIC_STC : InstrItinClass;
640def IIC_STI : InstrItinClass;
641def IIC_STD : InstrItinClass;
642def IIC_XLAT : InstrItinClass;
643def IIC_AAA : InstrItinClass;
644def IIC_AAD : InstrItinClass;
645def IIC_AAM : InstrItinClass;
646def IIC_AAS : InstrItinClass;
647def IIC_DAA : InstrItinClass;
648def IIC_DAS : InstrItinClass;
649def IIC_BOUND : InstrItinClass;
650def IIC_ARPL_REG : InstrItinClass;
651def IIC_ARPL_MEM : InstrItinClass;
652def IIC_MOVBE : InstrItinClass;
653def IIC_AES : InstrItinClass;
654def IIC_BLEND_MEM : InstrItinClass;
655def IIC_BLEND_NOMEM : InstrItinClass;
656def IIC_CBW : InstrItinClass;
657def IIC_CRC32_REG : InstrItinClass;
658def IIC_CRC32_MEM : InstrItinClass;
659def IIC_SSE_DPPD_RR : InstrItinClass;
660def IIC_SSE_DPPD_RM : InstrItinClass;
661def IIC_SSE_DPPS_RR : InstrItinClass;
662def IIC_SSE_DPPS_RM : InstrItinClass;
663def IIC_MMX_EMMS : InstrItinClass;
664def IIC_SSE_EXTRACTPS_RR : InstrItinClass;
665def IIC_SSE_EXTRACTPS_RM : InstrItinClass;
666def IIC_SSE_INSERTPS_RR : InstrItinClass;
667def IIC_SSE_INSERTPS_RM : InstrItinClass;
668def IIC_SSE_MPSADBW_RR : InstrItinClass;
669def IIC_SSE_MPSADBW_RM : InstrItinClass;
670def IIC_SSE_PMULLD_RR : InstrItinClass;
671def IIC_SSE_PMULLD_RM : InstrItinClass;
672def IIC_SSE_ROUNDPS_REG : InstrItinClass;
673def IIC_SSE_ROUNDPS_MEM : InstrItinClass;
674def IIC_SSE_ROUNDPD_REG : InstrItinClass;
675def IIC_SSE_ROUNDPD_MEM : InstrItinClass;
676def IIC_SSE_POPCNT_RR : InstrItinClass;
677def IIC_SSE_POPCNT_RM : InstrItinClass;
678def IIC_SSE_PCLMULQDQ_RR : InstrItinClass;
679def IIC_SSE_PCLMULQDQ_RM : InstrItinClass;
680
681def IIC_NOP : InstrItinClass;
682
683//===----------------------------------------------------------------------===//
684// Processor instruction itineraries.
685
686// IssueWidth is analogous to the number of decode units. Core and its
687// descendents, including Nehalem and SandyBridge have 4 decoders.
688// Resources beyond the decoder operate on micro-ops and are bufferred
689// so adjacent micro-ops don't directly compete.
690//
691// MicroOpBufferSize > 1 indicates that RAW dependencies can be
692// decoded in the same cycle. The value 32 is a reasonably arbitrary
693// number of in-flight instructions.
694//
695// HighLatency=10 is optimistic. X86InstrInfo::isHighLatencyDef
696// indicates high latency opcodes. Alternatively, InstrItinData
697// entries may be included here to define specific operand
698// latencies. Since these latencies are not used for pipeline hazards,
699// they do not need to be exact.
700//
701// The GenericX86Model contains no instruction itineraries
702// and disables PostRAScheduler.
703class GenericX86Model : SchedMachineModel {
704 let IssueWidth = 4;
705 let MicroOpBufferSize = 32;
706 let LoadLatency = 4;
707 let HighLatency = 10;
708 let PostRAScheduler = 0;
709 let CompleteModel = 0;
710}
711
712def GenericModel : GenericX86Model;
713
714// Define a model with the PostRAScheduler enabled.
715def GenericPostRAModel : GenericX86Model {
716 let PostRAScheduler = 1;
717}
718