blob: b994a57e27a32c290c7165641dd277f962fa7268 [file] [log] [blame]
Simon Pilgrima271c542017-05-03 15:42:29 +00001//===-- X86Schedule.td - X86 Scheduling Definitions --------*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10// InstrSchedModel annotations for out-of-order CPUs.
11//
12// These annotations are independent of the itinerary classes defined below.
13
14// Instructions with folded loads need to read the memory operand immediately,
15// but other register operands don't have to be read until the load is ready.
16// These operands are marked with ReadAfterLd.
17def ReadAfterLd : SchedRead;
18
19// Instructions with both a load and a store folded are modeled as a folded
20// load + WriteRMW.
21def WriteRMW : SchedWrite;
22
23// Most instructions can fold loads, so almost every SchedWrite comes in two
24// variants: With and without a folded load.
25// An X86FoldableSchedWrite holds a reference to the corresponding SchedWrite
26// with a folded load.
27class X86FoldableSchedWrite : SchedWrite {
28 // The SchedWrite to use when a load is folded into the instruction.
 // Declared without an initializer here; X86SchedWritePair assigns it with
 // a `let Folded = ...` on each record it defines.
29 SchedWrite Folded;
30}
31
32// Multiclass that produces a linked pair of SchedWrites.
33multiclass X86SchedWritePair {
34 // Register-Memory operation.
 // Record name is the defm name with an "Ld" suffix
 // (e.g. `defm WriteALU` produces WriteALULd).
35 def Ld : SchedWrite;
36 // Register-Register operation.
 // Record name is the defm name itself; its Folded field is resolved by
 // name to the "Ld" record defined just above.
37 def NAME : X86FoldableSchedWrite {
38 let Folded = !cast<SchedWrite>(NAME#"Ld");
39 }
40}
41
42// Arithmetic.
43defm WriteALU : X86SchedWritePair; // Simple integer ALU op.
44defm WriteIMul : X86SchedWritePair; // Integer multiplication.
45def WriteIMulH : SchedWrite; // Integer multiplication, high part.
46defm WriteIDiv : X86SchedWritePair; // Integer division.
47def WriteLEA : SchedWrite; // LEA instructions can't fold loads.
48
Simon Pilgrimf33d9052018-03-26 18:19:28 +000049defm WriteBitScan : X86SchedWritePair; // Bit scan forward/reverse.
50defm WritePOPCNT : X86SchedWritePair; // Bit population count.
51defm WriteLZCNT : X86SchedWritePair; // Leading zero count.
52defm WriteTZCNT : X86SchedWritePair; // Trailing zero count.
53
Simon Pilgrima271c542017-05-03 15:42:29 +000054// Integer shifts and rotates.
55defm WriteShift : X86SchedWritePair;
56
57// Loads, stores, and moves, not folded with other operations.
58def WriteLoad : SchedWrite;
59def WriteStore : SchedWrite;
60def WriteMove : SchedWrite;
61
62// Idioms that clear a register, like xorps %xmm0, %xmm0.
63// These can often bypass execution ports completely.
64def WriteZero : SchedWrite;
65
66// Branches don't produce values, so they have no latency, but they still
67// consume resources. Indirect branches can fold loads.
68defm WriteJump : X86SchedWritePair;
69
70// Floating point. This covers both scalar and vector operations.
Simon Pilgrimfb7aa572018-03-15 14:45:30 +000071def WriteFLoad : SchedWrite;
72def WriteFStore : SchedWrite;
73def WriteFMove : SchedWrite;
Simon Pilgrima271c542017-05-03 15:42:29 +000074defm WriteFAdd : X86SchedWritePair; // Floating point add/sub/compare.
75defm WriteFMul : X86SchedWritePair; // Floating point multiplication.
76defm WriteFDiv : X86SchedWritePair; // Floating point division.
77defm WriteFSqrt : X86SchedWritePair; // Floating point square root.
78defm WriteFRcp : X86SchedWritePair; // Floating point reciprocal estimate.
79defm WriteFRsqrt : X86SchedWritePair; // Floating point reciprocal square root estimate.
80defm WriteFMA : X86SchedWritePair; // Fused Multiply Add.
81defm WriteFShuffle : X86SchedWritePair; // Floating point vector shuffles.
82defm WriteFBlend : X86SchedWritePair; // Floating point vector blends.
83defm WriteFVarBlend : X86SchedWritePair; // Fp vector variable blends.
84
85// FMA Scheduling helper class.
// Carries a single field, Sched, an X86FoldableSchedWrite that defaults to
// WriteFAdd.
// NOTE(review): the default is WriteFAdd rather than WriteFMA (defined
// above) -- presumably users override Sched; confirm this is intentional.
86class FMASC { X86FoldableSchedWrite Sched = WriteFAdd; }
87
Andrew V. Tischenko8cb1d092017-06-08 16:44:13 +000088// Horizontal Add/Sub (float and integer)
89defm WriteFHAdd : X86SchedWritePair;
90defm WritePHAdd : X86SchedWritePair;
91
Simon Pilgrima271c542017-05-03 15:42:29 +000092// Vector integer operations.
Simon Pilgrimfb7aa572018-03-15 14:45:30 +000093def WriteVecLoad : SchedWrite;
94def WriteVecStore : SchedWrite;
95def WriteVecMove : SchedWrite;
Simon Pilgrima271c542017-05-03 15:42:29 +000096defm WriteVecALU : X86SchedWritePair; // Vector integer ALU op, no logicals.
97defm WriteVecShift : X86SchedWritePair; // Vector integer shifts.
98defm WriteVecIMul : X86SchedWritePair; // Vector integer multiply.
99defm WriteShuffle : X86SchedWritePair; // Vector shuffles.
100defm WriteBlend : X86SchedWritePair; // Vector blends.
101defm WriteVarBlend : X86SchedWritePair; // Vector variable blends.
102defm WriteMPSAD : X86SchedWritePair; // Vector MPSAD.
103
104// Vector bitwise operations.
105// These are often used on both floating point and integer vectors.
106defm WriteVecLogic : X86SchedWritePair; // Vector and/or/xor.
107
108// Conversion between integer and float.
109defm WriteCvtF2I : X86SchedWritePair; // Float -> Integer.
110defm WriteCvtI2F : X86SchedWritePair; // Integer -> Float.
111defm WriteCvtF2F : X86SchedWritePair; // Float -> Float size conversion.
112
113// String instructions.
114// Packed Compare Implicit Length Strings, Return Mask
115defm WritePCmpIStrM : X86SchedWritePair;
116// Packed Compare Explicit Length Strings, Return Mask
117defm WritePCmpEStrM : X86SchedWritePair;
118// Packed Compare Implicit Length Strings, Return Index
119defm WritePCmpIStrI : X86SchedWritePair;
120// Packed Compare Explicit Length Strings, Return Index
121defm WritePCmpEStrI : X86SchedWritePair;
122
123// AES instructions.
124defm WriteAESDecEnc : X86SchedWritePair; // Decryption, encryption.
125defm WriteAESIMC : X86SchedWritePair; // InvMixColumn.
126defm WriteAESKeyGen : X86SchedWritePair; // Key Generation.
127
128// Carry-less multiplication instructions.
129defm WriteCLMul : X86SchedWritePair;
130
131// Catch-all for expensive system instructions.
132def WriteSystem : SchedWrite;
133
134// AVX2.
135defm WriteFShuffle256 : X86SchedWritePair; // Fp 256-bit width vector shuffles.
136defm WriteShuffle256 : X86SchedWritePair; // 256-bit width vector shuffles.
137defm WriteVarVecShift : X86SchedWritePair; // Variable vector shifts.
138
139// Old microcoded instructions that nobody uses.
140def WriteMicrocoded : SchedWrite;
141
142// Fence instructions.
143def WriteFence : SchedWrite;
144
145// Nop, not very useful except that it provides a model for nops!
146def WriteNop : SchedWrite;
147
148//===----------------------------------------------------------------------===//
149// Instruction Itinerary classes used for X86
150def IIC_ALU_MEM : InstrItinClass;
151def IIC_ALU_NONMEM : InstrItinClass;
152def IIC_LEA : InstrItinClass;
153def IIC_LEA_16 : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000154def IIC_MUL8_MEM : InstrItinClass;
155def IIC_MUL8_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000156def IIC_MUL16_MEM : InstrItinClass;
157def IIC_MUL16_REG : InstrItinClass;
158def IIC_MUL32_MEM : InstrItinClass;
159def IIC_MUL32_REG : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000160def IIC_MUL64_MEM : InstrItinClass;
161def IIC_MUL64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000162// imul by al, ax, eax, rax
Craig Topper5ccd8722018-03-19 16:38:33 +0000163def IIC_IMUL8_MEM : InstrItinClass;
164def IIC_IMUL8_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000165def IIC_IMUL16_MEM : InstrItinClass;
166def IIC_IMUL16_REG : InstrItinClass;
167def IIC_IMUL32_MEM : InstrItinClass;
168def IIC_IMUL32_REG : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000169def IIC_IMUL64_MEM : InstrItinClass;
170def IIC_IMUL64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000171// imul reg by reg|mem
172def IIC_IMUL16_RM : InstrItinClass;
173def IIC_IMUL16_RR : InstrItinClass;
174def IIC_IMUL32_RM : InstrItinClass;
175def IIC_IMUL32_RR : InstrItinClass;
176def IIC_IMUL64_RM : InstrItinClass;
177def IIC_IMUL64_RR : InstrItinClass;
178// imul reg = reg/mem * imm
179def IIC_IMUL16_RMI : InstrItinClass;
180def IIC_IMUL16_RRI : InstrItinClass;
181def IIC_IMUL32_RMI : InstrItinClass;
182def IIC_IMUL32_RRI : InstrItinClass;
183def IIC_IMUL64_RMI : InstrItinClass;
184def IIC_IMUL64_RRI : InstrItinClass;
185// div
186def IIC_DIV8_MEM : InstrItinClass;
187def IIC_DIV8_REG : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000188def IIC_DIV16_MEM : InstrItinClass;
189def IIC_DIV16_REG : InstrItinClass;
190def IIC_DIV32_MEM : InstrItinClass;
191def IIC_DIV32_REG : InstrItinClass;
192def IIC_DIV64_MEM : InstrItinClass;
193def IIC_DIV64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000194// idiv
Craig Topper5ccd8722018-03-19 16:38:33 +0000195def IIC_IDIV8_MEM : InstrItinClass;
196def IIC_IDIV8_REG : InstrItinClass;
197def IIC_IDIV16_MEM : InstrItinClass;
198def IIC_IDIV16_REG : InstrItinClass;
199def IIC_IDIV32_MEM : InstrItinClass;
200def IIC_IDIV32_REG : InstrItinClass;
201def IIC_IDIV64_MEM : InstrItinClass;
202def IIC_IDIV64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000203// neg/not/inc/dec
204def IIC_UNARY_REG : InstrItinClass;
205def IIC_UNARY_MEM : InstrItinClass;
206// add/sub/and/or/xor/sbb/cmp/test
207def IIC_BIN_MEM : InstrItinClass;
208def IIC_BIN_NONMEM : InstrItinClass;
209// adc/sbb
210def IIC_BIN_CARRY_MEM : InstrItinClass;
211def IIC_BIN_CARRY_NONMEM : InstrItinClass;
212// shift/rotate
213def IIC_SR : InstrItinClass;
214// shift double
215def IIC_SHD16_REG_IM : InstrItinClass;
216def IIC_SHD16_REG_CL : InstrItinClass;
217def IIC_SHD16_MEM_IM : InstrItinClass;
218def IIC_SHD16_MEM_CL : InstrItinClass;
219def IIC_SHD32_REG_IM : InstrItinClass;
220def IIC_SHD32_REG_CL : InstrItinClass;
221def IIC_SHD32_MEM_IM : InstrItinClass;
222def IIC_SHD32_MEM_CL : InstrItinClass;
223def IIC_SHD64_REG_IM : InstrItinClass;
224def IIC_SHD64_REG_CL : InstrItinClass;
225def IIC_SHD64_MEM_IM : InstrItinClass;
226def IIC_SHD64_MEM_CL : InstrItinClass;
227// cmov
228def IIC_CMOV16_RM : InstrItinClass;
229def IIC_CMOV16_RR : InstrItinClass;
230def IIC_CMOV32_RM : InstrItinClass;
231def IIC_CMOV32_RR : InstrItinClass;
232def IIC_CMOV64_RM : InstrItinClass;
233def IIC_CMOV64_RR : InstrItinClass;
234// set
235def IIC_SET_R : InstrItinClass;
236def IIC_SET_M : InstrItinClass;
237// jmp/jcc/jcxz
238def IIC_Jcc : InstrItinClass;
239def IIC_JCXZ : InstrItinClass;
240def IIC_JMP_REL : InstrItinClass;
241def IIC_JMP_REG : InstrItinClass;
242def IIC_JMP_MEM : InstrItinClass;
243def IIC_JMP_FAR_MEM : InstrItinClass;
244def IIC_JMP_FAR_PTR : InstrItinClass;
245// loop
246def IIC_LOOP : InstrItinClass;
247def IIC_LOOPE : InstrItinClass;
248def IIC_LOOPNE : InstrItinClass;
249// call
250def IIC_CALL_RI : InstrItinClass;
251def IIC_CALL_MEM : InstrItinClass;
252def IIC_CALL_FAR_MEM : InstrItinClass;
253def IIC_CALL_FAR_PTR : InstrItinClass;
254// ret
255def IIC_RET : InstrItinClass;
256def IIC_RET_IMM : InstrItinClass;
257//sign extension movs
258def IIC_MOVSX : InstrItinClass;
259def IIC_MOVSX_R16_R8 : InstrItinClass;
260def IIC_MOVSX_R16_M8 : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000261//zero extension movs
262def IIC_MOVZX : InstrItinClass;
263def IIC_MOVZX_R16_R8 : InstrItinClass;
264def IIC_MOVZX_R16_M8 : InstrItinClass;
265
266def IIC_REP_MOVS : InstrItinClass;
267def IIC_REP_STOS : InstrItinClass;
268
269// SSE scalar/parallel binary operations
270def IIC_SSE_ALU_F32S_RR : InstrItinClass;
271def IIC_SSE_ALU_F32S_RM : InstrItinClass;
272def IIC_SSE_ALU_F64S_RR : InstrItinClass;
273def IIC_SSE_ALU_F64S_RM : InstrItinClass;
274def IIC_SSE_MUL_F32S_RR : InstrItinClass;
275def IIC_SSE_MUL_F32S_RM : InstrItinClass;
276def IIC_SSE_MUL_F64S_RR : InstrItinClass;
277def IIC_SSE_MUL_F64S_RM : InstrItinClass;
278def IIC_SSE_DIV_F32S_RR : InstrItinClass;
279def IIC_SSE_DIV_F32S_RM : InstrItinClass;
280def IIC_SSE_DIV_F64S_RR : InstrItinClass;
281def IIC_SSE_DIV_F64S_RM : InstrItinClass;
282def IIC_SSE_ALU_F32P_RR : InstrItinClass;
283def IIC_SSE_ALU_F32P_RM : InstrItinClass;
284def IIC_SSE_ALU_F64P_RR : InstrItinClass;
285def IIC_SSE_ALU_F64P_RM : InstrItinClass;
286def IIC_SSE_MUL_F32P_RR : InstrItinClass;
287def IIC_SSE_MUL_F32P_RM : InstrItinClass;
288def IIC_SSE_MUL_F64P_RR : InstrItinClass;
289def IIC_SSE_MUL_F64P_RM : InstrItinClass;
290def IIC_SSE_DIV_F32P_RR : InstrItinClass;
291def IIC_SSE_DIV_F32P_RM : InstrItinClass;
292def IIC_SSE_DIV_F64P_RR : InstrItinClass;
293def IIC_SSE_DIV_F64P_RM : InstrItinClass;
294
295def IIC_SSE_COMIS_RR : InstrItinClass;
296def IIC_SSE_COMIS_RM : InstrItinClass;
297
298def IIC_SSE_HADDSUB_RR : InstrItinClass;
299def IIC_SSE_HADDSUB_RM : InstrItinClass;
300
301def IIC_SSE_BIT_P_RR : InstrItinClass;
302def IIC_SSE_BIT_P_RM : InstrItinClass;
303
304def IIC_SSE_INTALU_P_RR : InstrItinClass;
305def IIC_SSE_INTALU_P_RM : InstrItinClass;
306def IIC_SSE_INTALUQ_P_RR : InstrItinClass;
307def IIC_SSE_INTALUQ_P_RM : InstrItinClass;
308
309def IIC_SSE_INTMUL_P_RR : InstrItinClass;
310def IIC_SSE_INTMUL_P_RM : InstrItinClass;
311
312def IIC_SSE_INTSH_P_RR : InstrItinClass;
313def IIC_SSE_INTSH_P_RM : InstrItinClass;
314def IIC_SSE_INTSH_P_RI : InstrItinClass;
315
316def IIC_SSE_INTSHDQ_P_RI : InstrItinClass;
317
318def IIC_SSE_SHUFP : InstrItinClass;
319def IIC_SSE_PSHUF_RI : InstrItinClass;
320def IIC_SSE_PSHUF_MI : InstrItinClass;
321
Simon Pilgrim3f24ff62017-08-01 16:47:48 +0000322def IIC_SSE_PACK : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000323def IIC_SSE_UNPCK : InstrItinClass;
324
325def IIC_SSE_MOVMSK : InstrItinClass;
326def IIC_SSE_MASKMOV : InstrItinClass;
327
328def IIC_SSE_PEXTRW : InstrItinClass;
329def IIC_SSE_PINSRW : InstrItinClass;
330
331def IIC_SSE_PABS_RR : InstrItinClass;
332def IIC_SSE_PABS_RM : InstrItinClass;
333
334def IIC_SSE_SQRTPS_RR : InstrItinClass;
335def IIC_SSE_SQRTPS_RM : InstrItinClass;
336def IIC_SSE_SQRTSS_RR : InstrItinClass;
337def IIC_SSE_SQRTSS_RM : InstrItinClass;
338def IIC_SSE_SQRTPD_RR : InstrItinClass;
339def IIC_SSE_SQRTPD_RM : InstrItinClass;
340def IIC_SSE_SQRTSD_RR : InstrItinClass;
341def IIC_SSE_SQRTSD_RM : InstrItinClass;
342
343def IIC_SSE_RSQRTPS_RR : InstrItinClass;
344def IIC_SSE_RSQRTPS_RM : InstrItinClass;
345def IIC_SSE_RSQRTSS_RR : InstrItinClass;
346def IIC_SSE_RSQRTSS_RM : InstrItinClass;
347
348def IIC_SSE_RCPP_RR : InstrItinClass;
349def IIC_SSE_RCPP_RM : InstrItinClass;
350def IIC_SSE_RCPS_RR : InstrItinClass;
351def IIC_SSE_RCPS_RM : InstrItinClass;
352
353def IIC_SSE_MOV_S_RR : InstrItinClass;
354def IIC_SSE_MOV_S_RM : InstrItinClass;
355def IIC_SSE_MOV_S_MR : InstrItinClass;
356
357def IIC_SSE_MOVA_P_RR : InstrItinClass;
358def IIC_SSE_MOVA_P_RM : InstrItinClass;
359def IIC_SSE_MOVA_P_MR : InstrItinClass;
360
361def IIC_SSE_MOVU_P_RR : InstrItinClass;
362def IIC_SSE_MOVU_P_RM : InstrItinClass;
363def IIC_SSE_MOVU_P_MR : InstrItinClass;
364
365def IIC_SSE_MOVDQ : InstrItinClass;
366def IIC_SSE_MOVD_ToGP : InstrItinClass;
367def IIC_SSE_MOVQ_RR : InstrItinClass;
368
369def IIC_SSE_MOV_LH : InstrItinClass;
370
371def IIC_SSE_LDDQU : InstrItinClass;
372
373def IIC_SSE_MOVNT : InstrItinClass;
374
375def IIC_SSE_PHADDSUBD_RR : InstrItinClass;
376def IIC_SSE_PHADDSUBD_RM : InstrItinClass;
377def IIC_SSE_PHADDSUBSW_RR : InstrItinClass;
378def IIC_SSE_PHADDSUBSW_RM : InstrItinClass;
379def IIC_SSE_PHADDSUBW_RR : InstrItinClass;
380def IIC_SSE_PHADDSUBW_RM : InstrItinClass;
381def IIC_SSE_PSHUFB_RR : InstrItinClass;
382def IIC_SSE_PSHUFB_RM : InstrItinClass;
383def IIC_SSE_PSIGN_RR : InstrItinClass;
384def IIC_SSE_PSIGN_RM : InstrItinClass;
385
386def IIC_SSE_PMADD : InstrItinClass;
387def IIC_SSE_PMULHRSW : InstrItinClass;
388def IIC_SSE_PALIGNRR : InstrItinClass;
389def IIC_SSE_PALIGNRM : InstrItinClass;
390def IIC_SSE_MWAIT : InstrItinClass;
391def IIC_SSE_MONITOR : InstrItinClass;
392def IIC_SSE_MWAITX : InstrItinClass;
393def IIC_SSE_MONITORX : InstrItinClass;
394def IIC_SSE_CLZERO : InstrItinClass;
395
396def IIC_SSE_PREFETCH : InstrItinClass;
397def IIC_SSE_PAUSE : InstrItinClass;
398def IIC_SSE_LFENCE : InstrItinClass;
399def IIC_SSE_MFENCE : InstrItinClass;
400def IIC_SSE_SFENCE : InstrItinClass;
401def IIC_SSE_LDMXCSR : InstrItinClass;
402def IIC_SSE_STMXCSR : InstrItinClass;
403
404def IIC_SSE_CVT_PD_RR : InstrItinClass;
405def IIC_SSE_CVT_PD_RM : InstrItinClass;
406def IIC_SSE_CVT_PS_RR : InstrItinClass;
407def IIC_SSE_CVT_PS_RM : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000408def IIC_SSE_CVT_Scalar_RR : InstrItinClass;
409def IIC_SSE_CVT_Scalar_RM : InstrItinClass;
410def IIC_SSE_CVT_SS2SI32_RM : InstrItinClass;
411def IIC_SSE_CVT_SS2SI32_RR : InstrItinClass;
412def IIC_SSE_CVT_SS2SI64_RM : InstrItinClass;
413def IIC_SSE_CVT_SS2SI64_RR : InstrItinClass;
414def IIC_SSE_CVT_SD2SI_RM : InstrItinClass;
415def IIC_SSE_CVT_SD2SI_RR : InstrItinClass;
416
Simon Pilgrim91c159d2017-12-10 12:26:35 +0000417def IIC_AVX_ZERO : InstrItinClass;
418
Simon Pilgrima271c542017-05-03 15:42:29 +0000419// MMX
420def IIC_MMX_MOV_MM_RM : InstrItinClass;
421def IIC_MMX_MOV_REG_MM : InstrItinClass;
422def IIC_MMX_MOVQ_RM : InstrItinClass;
423def IIC_MMX_MOVQ_RR : InstrItinClass;
424
425def IIC_MMX_ALU_RM : InstrItinClass;
426def IIC_MMX_ALU_RR : InstrItinClass;
427def IIC_MMX_ALUQ_RM : InstrItinClass;
428def IIC_MMX_ALUQ_RR : InstrItinClass;
429def IIC_MMX_PHADDSUBW_RM : InstrItinClass;
430def IIC_MMX_PHADDSUBW_RR : InstrItinClass;
431def IIC_MMX_PHADDSUBD_RM : InstrItinClass;
432def IIC_MMX_PHADDSUBD_RR : InstrItinClass;
433def IIC_MMX_PMUL : InstrItinClass;
434def IIC_MMX_MISC_FUNC_MEM : InstrItinClass;
435def IIC_MMX_MISC_FUNC_REG : InstrItinClass;
436def IIC_MMX_PSADBW : InstrItinClass;
437def IIC_MMX_SHIFT_RI : InstrItinClass;
438def IIC_MMX_SHIFT_RM : InstrItinClass;
439def IIC_MMX_SHIFT_RR : InstrItinClass;
440def IIC_MMX_UNPCK_H_RM : InstrItinClass;
441def IIC_MMX_UNPCK_H_RR : InstrItinClass;
442def IIC_MMX_UNPCK_L : InstrItinClass;
443def IIC_MMX_PCK_RM : InstrItinClass;
444def IIC_MMX_PCK_RR : InstrItinClass;
445def IIC_MMX_PSHUF : InstrItinClass;
446def IIC_MMX_PEXTR : InstrItinClass;
447def IIC_MMX_PINSRW : InstrItinClass;
448def IIC_MMX_MASKMOV : InstrItinClass;
Simon Pilgrimf545bb6c2017-11-26 17:56:07 +0000449def IIC_MMX_MOVMSK : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000450def IIC_MMX_CVT_PD_RR : InstrItinClass;
451def IIC_MMX_CVT_PD_RM : InstrItinClass;
452def IIC_MMX_CVT_PS_RR : InstrItinClass;
453def IIC_MMX_CVT_PS_RM : InstrItinClass;
454
Simon Pilgrimfe6e92d2017-11-26 20:50:29 +0000455def IIC_3DNOW_FALU_RM : InstrItinClass;
456def IIC_3DNOW_FALU_RR : InstrItinClass;
457def IIC_3DNOW_FCVT_F2I_RM : InstrItinClass;
458def IIC_3DNOW_FCVT_F2I_RR : InstrItinClass;
459def IIC_3DNOW_FCVT_I2F_RM : InstrItinClass;
460def IIC_3DNOW_FCVT_I2F_RR : InstrItinClass;
461def IIC_3DNOW_MISC_FUNC_REG : InstrItinClass;
462def IIC_3DNOW_MISC_FUNC_MEM : InstrItinClass;
463
Simon Pilgrima271c542017-05-03 15:42:29 +0000464def IIC_CMPX_LOCK : InstrItinClass;
465def IIC_CMPX_LOCK_8 : InstrItinClass;
466def IIC_CMPX_LOCK_8B : InstrItinClass;
467def IIC_CMPX_LOCK_16B : InstrItinClass;
468
469def IIC_XADD_LOCK_MEM : InstrItinClass;
470def IIC_XADD_LOCK_MEM8 : InstrItinClass;
471
Simon Pilgrim65f805f2017-12-05 18:01:26 +0000472def IIC_FCMOV : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000473def IIC_FILD : InstrItinClass;
474def IIC_FLD : InstrItinClass;
475def IIC_FLD80 : InstrItinClass;
476def IIC_FST : InstrItinClass;
477def IIC_FST80 : InstrItinClass;
478def IIC_FIST : InstrItinClass;
479def IIC_FLDZ : InstrItinClass;
480def IIC_FUCOM : InstrItinClass;
481def IIC_FUCOMI : InstrItinClass;
482def IIC_FCOMI : InstrItinClass;
483def IIC_FNSTSW : InstrItinClass;
484def IIC_FNSTCW : InstrItinClass;
485def IIC_FLDCW : InstrItinClass;
486def IIC_FNINIT : InstrItinClass;
487def IIC_FFREE : InstrItinClass;
488def IIC_FNCLEX : InstrItinClass;
489def IIC_WAIT : InstrItinClass;
490def IIC_FXAM : InstrItinClass;
491def IIC_FNOP : InstrItinClass;
492def IIC_FLDL : InstrItinClass;
493def IIC_F2XM1 : InstrItinClass;
494def IIC_FYL2X : InstrItinClass;
495def IIC_FPTAN : InstrItinClass;
496def IIC_FPATAN : InstrItinClass;
497def IIC_FXTRACT : InstrItinClass;
498def IIC_FPREM1 : InstrItinClass;
499def IIC_FPSTP : InstrItinClass;
500def IIC_FPREM : InstrItinClass;
Simon Pilgrim0747a7e2017-11-28 15:03:42 +0000501def IIC_FSIGN : InstrItinClass;
502def IIC_FSQRT : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000503def IIC_FYL2XP1 : InstrItinClass;
504def IIC_FSINCOS : InstrItinClass;
505def IIC_FRNDINT : InstrItinClass;
506def IIC_FSCALE : InstrItinClass;
507def IIC_FCOMPP : InstrItinClass;
508def IIC_FXSAVE : InstrItinClass;
509def IIC_FXRSTOR : InstrItinClass;
510
511def IIC_FXCH : InstrItinClass;
512
513// System instructions
514def IIC_CPUID : InstrItinClass;
515def IIC_INT : InstrItinClass;
516def IIC_INT3 : InstrItinClass;
517def IIC_INVD : InstrItinClass;
518def IIC_INVLPG : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000519def IIC_INVPCID : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000520def IIC_IRET : InstrItinClass;
521def IIC_HLT : InstrItinClass;
522def IIC_LXS : InstrItinClass;
523def IIC_LTR : InstrItinClass;
Simon Pilgrim42fcda92017-12-08 19:03:42 +0000524def IIC_MPX : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000525def IIC_PKU : InstrItinClass;
526def IIC_PTWRITE : InstrItinClass;
527def IIC_RDPID : InstrItinClass;
Simon Pilgrim60411d92017-12-07 14:18:48 +0000528def IIC_RDRAND : InstrItinClass;
529def IIC_RDSEED : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000530def IIC_RDTSC : InstrItinClass;
Simon Pilgrimf00ea1b2017-12-13 14:22:04 +0000531def IIC_RDTSCP : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000532def IIC_RSM : InstrItinClass;
533def IIC_SIDT : InstrItinClass;
534def IIC_SGDT : InstrItinClass;
535def IIC_SLDT : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000536def IIC_SMAP : InstrItinClass;
537def IIC_SMX : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000538def IIC_STR : InstrItinClass;
Simon Pilgrim6b7cd862017-12-07 14:35:17 +0000539def IIC_SKINIT : InstrItinClass;
540def IIC_SVM : InstrItinClass;
Simon Pilgrima13271b2017-12-07 15:57:32 +0000541def IIC_VMX : InstrItinClass;
Simon Pilgrim6b7cd862017-12-07 14:35:17 +0000542def IIC_CLGI : InstrItinClass;
543def IIC_STGI : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000544def IIC_SWAPGS : InstrItinClass;
545def IIC_SYSCALL : InstrItinClass;
546def IIC_SYS_ENTER_EXIT : InstrItinClass;
547def IIC_IN_RR : InstrItinClass;
548def IIC_IN_RI : InstrItinClass;
549def IIC_OUT_RR : InstrItinClass;
550def IIC_OUT_IR : InstrItinClass;
551def IIC_INS : InstrItinClass;
Simon Pilgrim99b925b2017-05-03 15:51:39 +0000552def IIC_LWP : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000553def IIC_MOV_REG_DR : InstrItinClass;
554def IIC_MOV_DR_REG : InstrItinClass;
555def IIC_MOV_REG_CR : InstrItinClass;
556def IIC_MOV_CR_REG : InstrItinClass;
557def IIC_MOV_REG_SR : InstrItinClass;
558def IIC_MOV_MEM_SR : InstrItinClass;
559def IIC_MOV_SR_REG : InstrItinClass;
560def IIC_MOV_SR_MEM : InstrItinClass;
561def IIC_LAR_RM : InstrItinClass;
562def IIC_LAR_RR : InstrItinClass;
563def IIC_LSL_RM : InstrItinClass;
564def IIC_LSL_RR : InstrItinClass;
565def IIC_LGDT : InstrItinClass;
566def IIC_LIDT : InstrItinClass;
567def IIC_LLDT_REG : InstrItinClass;
568def IIC_LLDT_MEM : InstrItinClass;
569def IIC_PUSH_CS : InstrItinClass;
570def IIC_PUSH_SR : InstrItinClass;
571def IIC_POP_SR : InstrItinClass;
572def IIC_POP_SR_SS : InstrItinClass;
Simon Pilgrim7e636cc2017-12-09 20:42:27 +0000573def IIC_SEGMENT_BASE_R : InstrItinClass;
574def IIC_SEGMENT_BASE_W : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000575def IIC_VERR : InstrItinClass;
576def IIC_VERW_REG : InstrItinClass;
577def IIC_VERW_MEM : InstrItinClass;
578def IIC_WRMSR : InstrItinClass;
579def IIC_RDMSR : InstrItinClass;
580def IIC_RDPMC : InstrItinClass;
581def IIC_SMSW : InstrItinClass;
582def IIC_LMSW_REG : InstrItinClass;
583def IIC_LMSW_MEM : InstrItinClass;
584def IIC_ENTER : InstrItinClass;
585def IIC_LEAVE : InstrItinClass;
586def IIC_POP_MEM : InstrItinClass;
587def IIC_POP_REG16 : InstrItinClass;
588def IIC_POP_REG : InstrItinClass;
589def IIC_POP_F : InstrItinClass;
590def IIC_POP_FD : InstrItinClass;
591def IIC_POP_A : InstrItinClass;
592def IIC_PUSH_IMM : InstrItinClass;
593def IIC_PUSH_MEM : InstrItinClass;
594def IIC_PUSH_REG : InstrItinClass;
595def IIC_PUSH_F : InstrItinClass;
596def IIC_PUSH_A : InstrItinClass;
597def IIC_BSWAP : InstrItinClass;
598def IIC_BIT_SCAN_MEM : InstrItinClass;
599def IIC_BIT_SCAN_REG : InstrItinClass;
Simon Pilgrimf1d599a2017-12-07 15:24:14 +0000600def IIC_LZCNT_RR : InstrItinClass;
601def IIC_LZCNT_RM : InstrItinClass;
602def IIC_TZCNT_RR : InstrItinClass;
603def IIC_TZCNT_RM : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000604def IIC_MOVS : InstrItinClass;
605def IIC_STOS : InstrItinClass;
606def IIC_SCAS : InstrItinClass;
607def IIC_CMPS : InstrItinClass;
608def IIC_MOV : InstrItinClass;
609def IIC_MOV_MEM : InstrItinClass;
610def IIC_AHF : InstrItinClass;
611def IIC_BT_MI : InstrItinClass;
612def IIC_BT_MR : InstrItinClass;
613def IIC_BT_RI : InstrItinClass;
614def IIC_BT_RR : InstrItinClass;
615def IIC_BTX_MI : InstrItinClass;
616def IIC_BTX_MR : InstrItinClass;
617def IIC_BTX_RI : InstrItinClass;
618def IIC_BTX_RR : InstrItinClass;
619def IIC_XCHG_REG : InstrItinClass;
620def IIC_XCHG_MEM : InstrItinClass;
621def IIC_XADD_REG : InstrItinClass;
622def IIC_XADD_MEM : InstrItinClass;
623def IIC_CMPXCHG_MEM : InstrItinClass;
624def IIC_CMPXCHG_REG : InstrItinClass;
625def IIC_CMPXCHG_MEM8 : InstrItinClass;
626def IIC_CMPXCHG_REG8 : InstrItinClass;
627def IIC_CMPXCHG_8B : InstrItinClass;
628def IIC_CMPXCHG_16B : InstrItinClass;
629def IIC_LODS : InstrItinClass;
630def IIC_OUTS : InstrItinClass;
631def IIC_CLC : InstrItinClass;
632def IIC_CLD : InstrItinClass;
633def IIC_CLI : InstrItinClass;
634def IIC_CMC : InstrItinClass;
635def IIC_CLTS : InstrItinClass;
636def IIC_STC : InstrItinClass;
637def IIC_STI : InstrItinClass;
638def IIC_STD : InstrItinClass;
639def IIC_XLAT : InstrItinClass;
640def IIC_AAA : InstrItinClass;
641def IIC_AAD : InstrItinClass;
642def IIC_AAM : InstrItinClass;
643def IIC_AAS : InstrItinClass;
644def IIC_DAA : InstrItinClass;
645def IIC_DAS : InstrItinClass;
646def IIC_BOUND : InstrItinClass;
647def IIC_ARPL_REG : InstrItinClass;
648def IIC_ARPL_MEM : InstrItinClass;
649def IIC_MOVBE : InstrItinClass;
650def IIC_AES : InstrItinClass;
651def IIC_BLEND_MEM : InstrItinClass;
652def IIC_BLEND_NOMEM : InstrItinClass;
653def IIC_CBW : InstrItinClass;
654def IIC_CRC32_REG : InstrItinClass;
655def IIC_CRC32_MEM : InstrItinClass;
656def IIC_SSE_DPPD_RR : InstrItinClass;
657def IIC_SSE_DPPD_RM : InstrItinClass;
658def IIC_SSE_DPPS_RR : InstrItinClass;
659def IIC_SSE_DPPS_RM : InstrItinClass;
660def IIC_MMX_EMMS : InstrItinClass;
661def IIC_SSE_EXTRACTPS_RR : InstrItinClass;
662def IIC_SSE_EXTRACTPS_RM : InstrItinClass;
663def IIC_SSE_INSERTPS_RR : InstrItinClass;
664def IIC_SSE_INSERTPS_RM : InstrItinClass;
665def IIC_SSE_MPSADBW_RR : InstrItinClass;
666def IIC_SSE_MPSADBW_RM : InstrItinClass;
667def IIC_SSE_PMULLD_RR : InstrItinClass;
668def IIC_SSE_PMULLD_RM : InstrItinClass;
669def IIC_SSE_ROUNDPS_REG : InstrItinClass;
670def IIC_SSE_ROUNDPS_MEM : InstrItinClass;
671def IIC_SSE_ROUNDPD_REG : InstrItinClass;
672def IIC_SSE_ROUNDPD_MEM : InstrItinClass;
673def IIC_SSE_POPCNT_RR : InstrItinClass;
674def IIC_SSE_POPCNT_RM : InstrItinClass;
675def IIC_SSE_PCLMULQDQ_RR : InstrItinClass;
676def IIC_SSE_PCLMULQDQ_RM : InstrItinClass;
677
678def IIC_NOP : InstrItinClass;
679
680//===----------------------------------------------------------------------===//
681// Processor instruction itineraries.
682
683// IssueWidth is analogous to the number of decode units. Core and its
684// descendants, including Nehalem and SandyBridge, have 4 decoders.
685// Resources beyond the decoder operate on micro-ops and are buffered
686// so adjacent micro-ops don't directly compete.
687//
688// MicroOpBufferSize > 1 indicates that RAW dependencies can be
689// decoded in the same cycle. The value 32 is a reasonably arbitrary
690// number of in-flight instructions.
691//
692// HighLatency=10 is optimistic. X86InstrInfo::isHighLatencyDef
693// indicates high latency opcodes. Alternatively, InstrItinData
694// entries may be included here to define specific operand
695// latencies. Since these latencies are not used for pipeline hazards,
696// they do not need to be exact.
697//
698// The GenericX86Model contains no instruction itineraries
699// and disables PostRAScheduler.
700class GenericX86Model : SchedMachineModel {
701 let IssueWidth = 4; // Analogous to the number of decode units.
702 let MicroOpBufferSize = 32; // Reasonably arbitrary count of in-flight instructions.
703 let LoadLatency = 4;
704 let HighLatency = 10; // Optimistic; these latencies need not be exact.
705 let PostRAScheduler = 0; // Disabled in the base model.
706 let CompleteModel = 0; // NOTE(review): presumably marks the model as not covering every instruction -- confirm.
707}
708
// GenericX86Model instantiated as-is, with no field overrides.
709def GenericModel : GenericX86Model;
710
711// Define a model with the PostRAScheduler enabled.
// Only PostRAScheduler is overridden; every other field keeps the value set
// in GenericX86Model.
712def GenericPostRAModel : GenericX86Model {
713 let PostRAScheduler = 1;
714}
715