blob: 9a87b2d598e4870427aed417cc54fabac1349059 [file] [log] [blame]
Simon Pilgrima271c542017-05-03 15:42:29 +00001//===-- X86Schedule.td - X86 Scheduling Definitions --------*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10// InstrSchedModel annotations for out-of-order CPUs.
11//
12// These annotations are independent of the itinerary classes defined below.
13
14// Instructions with folded loads need to read the memory operand immediately,
15// but other register operands don't have to be read until the load is ready.
16// These operands are marked with ReadAfterLd.
17def ReadAfterLd : SchedRead;
18
19// Instructions with both a load and a store folded are modeled as a folded
20// load + WriteRMW.
21def WriteRMW : SchedWrite;
22
23// Most instructions can fold loads, so almost every SchedWrite comes in two
24// variants: With and without a folded load.
25// An X86FoldableSchedWrite holds a reference to the corresponding SchedWrite
26// with a folded load.
27class X86FoldableSchedWrite : SchedWrite {
28 // The SchedWrite to use when a load is folded into the instruction.
29 SchedWrite Folded;
30}
31
32// Multiclass that produces a linked pair of SchedWrites.
33multiclass X86SchedWritePair {
34 // Register-Memory operation.
35 def Ld : SchedWrite;
36 // Register-Register operation.
37 def NAME : X86FoldableSchedWrite {
38 let Folded = !cast<SchedWrite>(NAME#"Ld");
39 }
40}
41
42// Arithmetic.
43defm WriteALU : X86SchedWritePair; // Simple integer ALU op.
44defm WriteIMul : X86SchedWritePair; // Integer multiplication.
45def WriteIMulH : SchedWrite; // Integer multiplication, high part.
46defm WriteIDiv : X86SchedWritePair; // Integer division.
47def WriteLEA : SchedWrite; // LEA instructions can't fold loads.
48
49// Integer shifts and rotates.
50defm WriteShift : X86SchedWritePair;
51
52// Loads, stores, and moves, not folded with other operations.
53def WriteLoad : SchedWrite;
54def WriteStore : SchedWrite;
55def WriteMove : SchedWrite;
56
57// Idioms that clear a register, like xorps %xmm0, %xmm0.
58// These can often bypass execution ports completely.
59def WriteZero : SchedWrite;
60
61// Branches don't produce values, so they have no latency, but they still
62// consume resources. Indirect branches can fold loads.
63defm WriteJump : X86SchedWritePair;
64
65// Floating point. This covers both scalar and vector operations.
Simon Pilgrimfb7aa572018-03-15 14:45:30 +000066def WriteFLoad : SchedWrite;
67def WriteFStore : SchedWrite;
68def WriteFMove : SchedWrite;
Simon Pilgrima271c542017-05-03 15:42:29 +000069defm WriteFAdd : X86SchedWritePair; // Floating point add/sub/compare.
70defm WriteFMul : X86SchedWritePair; // Floating point multiplication.
71defm WriteFDiv : X86SchedWritePair; // Floating point division.
72defm WriteFSqrt : X86SchedWritePair; // Floating point square root.
73defm WriteFRcp : X86SchedWritePair; // Floating point reciprocal estimate.
74defm WriteFRsqrt : X86SchedWritePair; // Floating point reciprocal square root estimate.
75defm WriteFMA : X86SchedWritePair; // Fused Multiply Add.
76defm WriteFShuffle : X86SchedWritePair; // Floating point vector shuffles.
77defm WriteFBlend : X86SchedWritePair; // Floating point vector blends.
78defm WriteFVarBlend : X86SchedWritePair; // Fp vector variable blends.
79
80// FMA Scheduling helper class.
81class FMASC { X86FoldableSchedWrite Sched = WriteFAdd; }
82
Andrew V. Tischenko8cb1d092017-06-08 16:44:13 +000083// Horizontal Add/Sub (float and integer)
84defm WriteFHAdd : X86SchedWritePair;
85defm WritePHAdd : X86SchedWritePair;
86
Simon Pilgrima271c542017-05-03 15:42:29 +000087// Vector integer operations.
Simon Pilgrimfb7aa572018-03-15 14:45:30 +000088def WriteVecLoad : SchedWrite;
89def WriteVecStore : SchedWrite;
90def WriteVecMove : SchedWrite;
Simon Pilgrima271c542017-05-03 15:42:29 +000091defm WriteVecALU : X86SchedWritePair; // Vector integer ALU op, no logicals.
92defm WriteVecShift : X86SchedWritePair; // Vector integer shifts.
93defm WriteVecIMul : X86SchedWritePair; // Vector integer multiply.
94defm WriteShuffle : X86SchedWritePair; // Vector shuffles.
95defm WriteBlend : X86SchedWritePair; // Vector blends.
96defm WriteVarBlend : X86SchedWritePair; // Vector variable blends.
97defm WriteMPSAD : X86SchedWritePair; // Vector MPSAD.
98
99// Vector bitwise operations.
100// These are often used on both floating point and integer vectors.
101defm WriteVecLogic : X86SchedWritePair; // Vector and/or/xor.
102
103// Conversion between integer and float.
104defm WriteCvtF2I : X86SchedWritePair; // Float -> Integer.
105defm WriteCvtI2F : X86SchedWritePair; // Integer -> Float.
106defm WriteCvtF2F : X86SchedWritePair; // Float -> Float size conversion.
107
108// Strings instructions.
109// Packed Compare Implicit Length Strings, Return Mask
110defm WritePCmpIStrM : X86SchedWritePair;
111// Packed Compare Explicit Length Strings, Return Mask
112defm WritePCmpEStrM : X86SchedWritePair;
113// Packed Compare Implicit Length Strings, Return Index
114defm WritePCmpIStrI : X86SchedWritePair;
115// Packed Compare Explicit Length Strings, Return Index
116defm WritePCmpEStrI : X86SchedWritePair;
117
118// AES instructions.
119defm WriteAESDecEnc : X86SchedWritePair; // Decryption, encryption.
120defm WriteAESIMC : X86SchedWritePair; // InvMixColumn.
121defm WriteAESKeyGen : X86SchedWritePair; // Key Generation.
122
123// Carry-less multiplication instructions.
124defm WriteCLMul : X86SchedWritePair;
125
126// Catch-all for expensive system instructions.
127def WriteSystem : SchedWrite;
128
129// AVX2.
130defm WriteFShuffle256 : X86SchedWritePair; // Fp 256-bit width vector shuffles.
131defm WriteShuffle256 : X86SchedWritePair; // 256-bit width vector shuffles.
132defm WriteVarVecShift : X86SchedWritePair; // Variable vector shifts.
133
134// Old microcoded instructions that nobody use.
135def WriteMicrocoded : SchedWrite;
136
137// Fence instructions.
138def WriteFence : SchedWrite;
139
140// Nop, not very useful expect it provides a model for nops!
141def WriteNop : SchedWrite;
142
143//===----------------------------------------------------------------------===//
144// Instruction Itinerary classes used for X86
145def IIC_ALU_MEM : InstrItinClass;
146def IIC_ALU_NONMEM : InstrItinClass;
147def IIC_LEA : InstrItinClass;
148def IIC_LEA_16 : InstrItinClass;
149def IIC_MUL8 : InstrItinClass;
150def IIC_MUL16_MEM : InstrItinClass;
151def IIC_MUL16_REG : InstrItinClass;
152def IIC_MUL32_MEM : InstrItinClass;
153def IIC_MUL32_REG : InstrItinClass;
154def IIC_MUL64 : InstrItinClass;
155// imul by al, ax, eax, tax
156def IIC_IMUL8 : InstrItinClass;
157def IIC_IMUL16_MEM : InstrItinClass;
158def IIC_IMUL16_REG : InstrItinClass;
159def IIC_IMUL32_MEM : InstrItinClass;
160def IIC_IMUL32_REG : InstrItinClass;
161def IIC_IMUL64 : InstrItinClass;
162// imul reg by reg|mem
163def IIC_IMUL16_RM : InstrItinClass;
164def IIC_IMUL16_RR : InstrItinClass;
165def IIC_IMUL32_RM : InstrItinClass;
166def IIC_IMUL32_RR : InstrItinClass;
167def IIC_IMUL64_RM : InstrItinClass;
168def IIC_IMUL64_RR : InstrItinClass;
169// imul reg = reg/mem * imm
170def IIC_IMUL16_RMI : InstrItinClass;
171def IIC_IMUL16_RRI : InstrItinClass;
172def IIC_IMUL32_RMI : InstrItinClass;
173def IIC_IMUL32_RRI : InstrItinClass;
174def IIC_IMUL64_RMI : InstrItinClass;
175def IIC_IMUL64_RRI : InstrItinClass;
176// div
177def IIC_DIV8_MEM : InstrItinClass;
178def IIC_DIV8_REG : InstrItinClass;
179def IIC_DIV16 : InstrItinClass;
180def IIC_DIV32 : InstrItinClass;
181def IIC_DIV64 : InstrItinClass;
182// idiv
183def IIC_IDIV8 : InstrItinClass;
184def IIC_IDIV16 : InstrItinClass;
185def IIC_IDIV32 : InstrItinClass;
186def IIC_IDIV64 : InstrItinClass;
187// neg/not/inc/dec
188def IIC_UNARY_REG : InstrItinClass;
189def IIC_UNARY_MEM : InstrItinClass;
190// add/sub/and/or/xor/sbc/cmp/test
191def IIC_BIN_MEM : InstrItinClass;
192def IIC_BIN_NONMEM : InstrItinClass;
193// adc/sbc
194def IIC_BIN_CARRY_MEM : InstrItinClass;
195def IIC_BIN_CARRY_NONMEM : InstrItinClass;
196// shift/rotate
197def IIC_SR : InstrItinClass;
198// shift double
199def IIC_SHD16_REG_IM : InstrItinClass;
200def IIC_SHD16_REG_CL : InstrItinClass;
201def IIC_SHD16_MEM_IM : InstrItinClass;
202def IIC_SHD16_MEM_CL : InstrItinClass;
203def IIC_SHD32_REG_IM : InstrItinClass;
204def IIC_SHD32_REG_CL : InstrItinClass;
205def IIC_SHD32_MEM_IM : InstrItinClass;
206def IIC_SHD32_MEM_CL : InstrItinClass;
207def IIC_SHD64_REG_IM : InstrItinClass;
208def IIC_SHD64_REG_CL : InstrItinClass;
209def IIC_SHD64_MEM_IM : InstrItinClass;
210def IIC_SHD64_MEM_CL : InstrItinClass;
211// cmov
212def IIC_CMOV16_RM : InstrItinClass;
213def IIC_CMOV16_RR : InstrItinClass;
214def IIC_CMOV32_RM : InstrItinClass;
215def IIC_CMOV32_RR : InstrItinClass;
216def IIC_CMOV64_RM : InstrItinClass;
217def IIC_CMOV64_RR : InstrItinClass;
218// set
219def IIC_SET_R : InstrItinClass;
220def IIC_SET_M : InstrItinClass;
221// jmp/jcc/jcxz
222def IIC_Jcc : InstrItinClass;
223def IIC_JCXZ : InstrItinClass;
224def IIC_JMP_REL : InstrItinClass;
225def IIC_JMP_REG : InstrItinClass;
226def IIC_JMP_MEM : InstrItinClass;
227def IIC_JMP_FAR_MEM : InstrItinClass;
228def IIC_JMP_FAR_PTR : InstrItinClass;
229// loop
230def IIC_LOOP : InstrItinClass;
231def IIC_LOOPE : InstrItinClass;
232def IIC_LOOPNE : InstrItinClass;
233// call
234def IIC_CALL_RI : InstrItinClass;
235def IIC_CALL_MEM : InstrItinClass;
236def IIC_CALL_FAR_MEM : InstrItinClass;
237def IIC_CALL_FAR_PTR : InstrItinClass;
238// ret
239def IIC_RET : InstrItinClass;
240def IIC_RET_IMM : InstrItinClass;
241//sign extension movs
242def IIC_MOVSX : InstrItinClass;
243def IIC_MOVSX_R16_R8 : InstrItinClass;
244def IIC_MOVSX_R16_M8 : InstrItinClass;
245def IIC_MOVSX_R16_R16 : InstrItinClass;
246def IIC_MOVSX_R32_R32 : InstrItinClass;
247//zero extension movs
248def IIC_MOVZX : InstrItinClass;
249def IIC_MOVZX_R16_R8 : InstrItinClass;
250def IIC_MOVZX_R16_M8 : InstrItinClass;
251
252def IIC_REP_MOVS : InstrItinClass;
253def IIC_REP_STOS : InstrItinClass;
254
255// SSE scalar/parallel binary operations
256def IIC_SSE_ALU_F32S_RR : InstrItinClass;
257def IIC_SSE_ALU_F32S_RM : InstrItinClass;
258def IIC_SSE_ALU_F64S_RR : InstrItinClass;
259def IIC_SSE_ALU_F64S_RM : InstrItinClass;
260def IIC_SSE_MUL_F32S_RR : InstrItinClass;
261def IIC_SSE_MUL_F32S_RM : InstrItinClass;
262def IIC_SSE_MUL_F64S_RR : InstrItinClass;
263def IIC_SSE_MUL_F64S_RM : InstrItinClass;
264def IIC_SSE_DIV_F32S_RR : InstrItinClass;
265def IIC_SSE_DIV_F32S_RM : InstrItinClass;
266def IIC_SSE_DIV_F64S_RR : InstrItinClass;
267def IIC_SSE_DIV_F64S_RM : InstrItinClass;
268def IIC_SSE_ALU_F32P_RR : InstrItinClass;
269def IIC_SSE_ALU_F32P_RM : InstrItinClass;
270def IIC_SSE_ALU_F64P_RR : InstrItinClass;
271def IIC_SSE_ALU_F64P_RM : InstrItinClass;
272def IIC_SSE_MUL_F32P_RR : InstrItinClass;
273def IIC_SSE_MUL_F32P_RM : InstrItinClass;
274def IIC_SSE_MUL_F64P_RR : InstrItinClass;
275def IIC_SSE_MUL_F64P_RM : InstrItinClass;
276def IIC_SSE_DIV_F32P_RR : InstrItinClass;
277def IIC_SSE_DIV_F32P_RM : InstrItinClass;
278def IIC_SSE_DIV_F64P_RR : InstrItinClass;
279def IIC_SSE_DIV_F64P_RM : InstrItinClass;
280
281def IIC_SSE_COMIS_RR : InstrItinClass;
282def IIC_SSE_COMIS_RM : InstrItinClass;
283
284def IIC_SSE_HADDSUB_RR : InstrItinClass;
285def IIC_SSE_HADDSUB_RM : InstrItinClass;
286
287def IIC_SSE_BIT_P_RR : InstrItinClass;
288def IIC_SSE_BIT_P_RM : InstrItinClass;
289
290def IIC_SSE_INTALU_P_RR : InstrItinClass;
291def IIC_SSE_INTALU_P_RM : InstrItinClass;
292def IIC_SSE_INTALUQ_P_RR : InstrItinClass;
293def IIC_SSE_INTALUQ_P_RM : InstrItinClass;
294
295def IIC_SSE_INTMUL_P_RR : InstrItinClass;
296def IIC_SSE_INTMUL_P_RM : InstrItinClass;
297
298def IIC_SSE_INTSH_P_RR : InstrItinClass;
299def IIC_SSE_INTSH_P_RM : InstrItinClass;
300def IIC_SSE_INTSH_P_RI : InstrItinClass;
301
302def IIC_SSE_INTSHDQ_P_RI : InstrItinClass;
303
304def IIC_SSE_SHUFP : InstrItinClass;
305def IIC_SSE_PSHUF_RI : InstrItinClass;
306def IIC_SSE_PSHUF_MI : InstrItinClass;
307
Simon Pilgrim3f24ff62017-08-01 16:47:48 +0000308def IIC_SSE_PACK : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000309def IIC_SSE_UNPCK : InstrItinClass;
310
311def IIC_SSE_MOVMSK : InstrItinClass;
312def IIC_SSE_MASKMOV : InstrItinClass;
313
314def IIC_SSE_PEXTRW : InstrItinClass;
315def IIC_SSE_PINSRW : InstrItinClass;
316
317def IIC_SSE_PABS_RR : InstrItinClass;
318def IIC_SSE_PABS_RM : InstrItinClass;
319
320def IIC_SSE_SQRTPS_RR : InstrItinClass;
321def IIC_SSE_SQRTPS_RM : InstrItinClass;
322def IIC_SSE_SQRTSS_RR : InstrItinClass;
323def IIC_SSE_SQRTSS_RM : InstrItinClass;
324def IIC_SSE_SQRTPD_RR : InstrItinClass;
325def IIC_SSE_SQRTPD_RM : InstrItinClass;
326def IIC_SSE_SQRTSD_RR : InstrItinClass;
327def IIC_SSE_SQRTSD_RM : InstrItinClass;
328
329def IIC_SSE_RSQRTPS_RR : InstrItinClass;
330def IIC_SSE_RSQRTPS_RM : InstrItinClass;
331def IIC_SSE_RSQRTSS_RR : InstrItinClass;
332def IIC_SSE_RSQRTSS_RM : InstrItinClass;
333
334def IIC_SSE_RCPP_RR : InstrItinClass;
335def IIC_SSE_RCPP_RM : InstrItinClass;
336def IIC_SSE_RCPS_RR : InstrItinClass;
337def IIC_SSE_RCPS_RM : InstrItinClass;
338
339def IIC_SSE_MOV_S_RR : InstrItinClass;
340def IIC_SSE_MOV_S_RM : InstrItinClass;
341def IIC_SSE_MOV_S_MR : InstrItinClass;
342
343def IIC_SSE_MOVA_P_RR : InstrItinClass;
344def IIC_SSE_MOVA_P_RM : InstrItinClass;
345def IIC_SSE_MOVA_P_MR : InstrItinClass;
346
347def IIC_SSE_MOVU_P_RR : InstrItinClass;
348def IIC_SSE_MOVU_P_RM : InstrItinClass;
349def IIC_SSE_MOVU_P_MR : InstrItinClass;
350
351def IIC_SSE_MOVDQ : InstrItinClass;
352def IIC_SSE_MOVD_ToGP : InstrItinClass;
353def IIC_SSE_MOVQ_RR : InstrItinClass;
354
355def IIC_SSE_MOV_LH : InstrItinClass;
356
357def IIC_SSE_LDDQU : InstrItinClass;
358
359def IIC_SSE_MOVNT : InstrItinClass;
360
361def IIC_SSE_PHADDSUBD_RR : InstrItinClass;
362def IIC_SSE_PHADDSUBD_RM : InstrItinClass;
363def IIC_SSE_PHADDSUBSW_RR : InstrItinClass;
364def IIC_SSE_PHADDSUBSW_RM : InstrItinClass;
365def IIC_SSE_PHADDSUBW_RR : InstrItinClass;
366def IIC_SSE_PHADDSUBW_RM : InstrItinClass;
367def IIC_SSE_PSHUFB_RR : InstrItinClass;
368def IIC_SSE_PSHUFB_RM : InstrItinClass;
369def IIC_SSE_PSIGN_RR : InstrItinClass;
370def IIC_SSE_PSIGN_RM : InstrItinClass;
371
372def IIC_SSE_PMADD : InstrItinClass;
373def IIC_SSE_PMULHRSW : InstrItinClass;
374def IIC_SSE_PALIGNRR : InstrItinClass;
375def IIC_SSE_PALIGNRM : InstrItinClass;
376def IIC_SSE_MWAIT : InstrItinClass;
377def IIC_SSE_MONITOR : InstrItinClass;
378def IIC_SSE_MWAITX : InstrItinClass;
379def IIC_SSE_MONITORX : InstrItinClass;
380def IIC_SSE_CLZERO : InstrItinClass;
381
382def IIC_SSE_PREFETCH : InstrItinClass;
383def IIC_SSE_PAUSE : InstrItinClass;
384def IIC_SSE_LFENCE : InstrItinClass;
385def IIC_SSE_MFENCE : InstrItinClass;
386def IIC_SSE_SFENCE : InstrItinClass;
387def IIC_SSE_LDMXCSR : InstrItinClass;
388def IIC_SSE_STMXCSR : InstrItinClass;
389
390def IIC_SSE_CVT_PD_RR : InstrItinClass;
391def IIC_SSE_CVT_PD_RM : InstrItinClass;
392def IIC_SSE_CVT_PS_RR : InstrItinClass;
393def IIC_SSE_CVT_PS_RM : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000394def IIC_SSE_CVT_Scalar_RR : InstrItinClass;
395def IIC_SSE_CVT_Scalar_RM : InstrItinClass;
396def IIC_SSE_CVT_SS2SI32_RM : InstrItinClass;
397def IIC_SSE_CVT_SS2SI32_RR : InstrItinClass;
398def IIC_SSE_CVT_SS2SI64_RM : InstrItinClass;
399def IIC_SSE_CVT_SS2SI64_RR : InstrItinClass;
400def IIC_SSE_CVT_SD2SI_RM : InstrItinClass;
401def IIC_SSE_CVT_SD2SI_RR : InstrItinClass;
402
Simon Pilgrim91c159d2017-12-10 12:26:35 +0000403def IIC_AVX_ZERO : InstrItinClass;
404
Simon Pilgrima271c542017-05-03 15:42:29 +0000405// MMX
406def IIC_MMX_MOV_MM_RM : InstrItinClass;
407def IIC_MMX_MOV_REG_MM : InstrItinClass;
408def IIC_MMX_MOVQ_RM : InstrItinClass;
409def IIC_MMX_MOVQ_RR : InstrItinClass;
410
411def IIC_MMX_ALU_RM : InstrItinClass;
412def IIC_MMX_ALU_RR : InstrItinClass;
413def IIC_MMX_ALUQ_RM : InstrItinClass;
414def IIC_MMX_ALUQ_RR : InstrItinClass;
415def IIC_MMX_PHADDSUBW_RM : InstrItinClass;
416def IIC_MMX_PHADDSUBW_RR : InstrItinClass;
417def IIC_MMX_PHADDSUBD_RM : InstrItinClass;
418def IIC_MMX_PHADDSUBD_RR : InstrItinClass;
419def IIC_MMX_PMUL : InstrItinClass;
420def IIC_MMX_MISC_FUNC_MEM : InstrItinClass;
421def IIC_MMX_MISC_FUNC_REG : InstrItinClass;
422def IIC_MMX_PSADBW : InstrItinClass;
423def IIC_MMX_SHIFT_RI : InstrItinClass;
424def IIC_MMX_SHIFT_RM : InstrItinClass;
425def IIC_MMX_SHIFT_RR : InstrItinClass;
426def IIC_MMX_UNPCK_H_RM : InstrItinClass;
427def IIC_MMX_UNPCK_H_RR : InstrItinClass;
428def IIC_MMX_UNPCK_L : InstrItinClass;
429def IIC_MMX_PCK_RM : InstrItinClass;
430def IIC_MMX_PCK_RR : InstrItinClass;
431def IIC_MMX_PSHUF : InstrItinClass;
432def IIC_MMX_PEXTR : InstrItinClass;
433def IIC_MMX_PINSRW : InstrItinClass;
434def IIC_MMX_MASKMOV : InstrItinClass;
Simon Pilgrimf545bb6c2017-11-26 17:56:07 +0000435def IIC_MMX_MOVMSK : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000436def IIC_MMX_CVT_PD_RR : InstrItinClass;
437def IIC_MMX_CVT_PD_RM : InstrItinClass;
438def IIC_MMX_CVT_PS_RR : InstrItinClass;
439def IIC_MMX_CVT_PS_RM : InstrItinClass;
440
Simon Pilgrimfe6e92d2017-11-26 20:50:29 +0000441def IIC_3DNOW_FALU_RM : InstrItinClass;
442def IIC_3DNOW_FALU_RR : InstrItinClass;
443def IIC_3DNOW_FCVT_F2I_RM : InstrItinClass;
444def IIC_3DNOW_FCVT_F2I_RR : InstrItinClass;
445def IIC_3DNOW_FCVT_I2F_RM : InstrItinClass;
446def IIC_3DNOW_FCVT_I2F_RR : InstrItinClass;
447def IIC_3DNOW_MISC_FUNC_REG : InstrItinClass;
448def IIC_3DNOW_MISC_FUNC_MEM : InstrItinClass;
449
Simon Pilgrima271c542017-05-03 15:42:29 +0000450def IIC_CMPX_LOCK : InstrItinClass;
451def IIC_CMPX_LOCK_8 : InstrItinClass;
452def IIC_CMPX_LOCK_8B : InstrItinClass;
453def IIC_CMPX_LOCK_16B : InstrItinClass;
454
455def IIC_XADD_LOCK_MEM : InstrItinClass;
456def IIC_XADD_LOCK_MEM8 : InstrItinClass;
457
Simon Pilgrim65f805f2017-12-05 18:01:26 +0000458def IIC_FCMOV : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000459def IIC_FILD : InstrItinClass;
460def IIC_FLD : InstrItinClass;
461def IIC_FLD80 : InstrItinClass;
462def IIC_FST : InstrItinClass;
463def IIC_FST80 : InstrItinClass;
464def IIC_FIST : InstrItinClass;
465def IIC_FLDZ : InstrItinClass;
466def IIC_FUCOM : InstrItinClass;
467def IIC_FUCOMI : InstrItinClass;
468def IIC_FCOMI : InstrItinClass;
469def IIC_FNSTSW : InstrItinClass;
470def IIC_FNSTCW : InstrItinClass;
471def IIC_FLDCW : InstrItinClass;
472def IIC_FNINIT : InstrItinClass;
473def IIC_FFREE : InstrItinClass;
474def IIC_FNCLEX : InstrItinClass;
475def IIC_WAIT : InstrItinClass;
476def IIC_FXAM : InstrItinClass;
477def IIC_FNOP : InstrItinClass;
478def IIC_FLDL : InstrItinClass;
479def IIC_F2XM1 : InstrItinClass;
480def IIC_FYL2X : InstrItinClass;
481def IIC_FPTAN : InstrItinClass;
482def IIC_FPATAN : InstrItinClass;
483def IIC_FXTRACT : InstrItinClass;
484def IIC_FPREM1 : InstrItinClass;
485def IIC_FPSTP : InstrItinClass;
486def IIC_FPREM : InstrItinClass;
Simon Pilgrim0747a7e2017-11-28 15:03:42 +0000487def IIC_FSIGN : InstrItinClass;
488def IIC_FSQRT : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000489def IIC_FYL2XP1 : InstrItinClass;
490def IIC_FSINCOS : InstrItinClass;
491def IIC_FRNDINT : InstrItinClass;
492def IIC_FSCALE : InstrItinClass;
493def IIC_FCOMPP : InstrItinClass;
494def IIC_FXSAVE : InstrItinClass;
495def IIC_FXRSTOR : InstrItinClass;
496
497def IIC_FXCH : InstrItinClass;
498
499// System instructions
500def IIC_CPUID : InstrItinClass;
501def IIC_INT : InstrItinClass;
502def IIC_INT3 : InstrItinClass;
503def IIC_INVD : InstrItinClass;
504def IIC_INVLPG : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000505def IIC_INVPCID : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000506def IIC_IRET : InstrItinClass;
507def IIC_HLT : InstrItinClass;
508def IIC_LXS : InstrItinClass;
509def IIC_LTR : InstrItinClass;
Simon Pilgrim42fcda92017-12-08 19:03:42 +0000510def IIC_MPX : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000511def IIC_PKU : InstrItinClass;
512def IIC_PTWRITE : InstrItinClass;
513def IIC_RDPID : InstrItinClass;
Simon Pilgrim60411d92017-12-07 14:18:48 +0000514def IIC_RDRAND : InstrItinClass;
515def IIC_RDSEED : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000516def IIC_RDTSC : InstrItinClass;
Simon Pilgrimf00ea1b2017-12-13 14:22:04 +0000517def IIC_RDTSCP : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000518def IIC_RSM : InstrItinClass;
519def IIC_SIDT : InstrItinClass;
520def IIC_SGDT : InstrItinClass;
521def IIC_SLDT : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000522def IIC_SMAP : InstrItinClass;
523def IIC_SMX : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000524def IIC_STR : InstrItinClass;
Simon Pilgrim6b7cd862017-12-07 14:35:17 +0000525def IIC_SKINIT : InstrItinClass;
526def IIC_SVM : InstrItinClass;
Simon Pilgrima13271b2017-12-07 15:57:32 +0000527def IIC_VMX : InstrItinClass;
Simon Pilgrim6b7cd862017-12-07 14:35:17 +0000528def IIC_CLGI : InstrItinClass;
529def IIC_STGI : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000530def IIC_SWAPGS : InstrItinClass;
531def IIC_SYSCALL : InstrItinClass;
532def IIC_SYS_ENTER_EXIT : InstrItinClass;
533def IIC_IN_RR : InstrItinClass;
534def IIC_IN_RI : InstrItinClass;
535def IIC_OUT_RR : InstrItinClass;
536def IIC_OUT_IR : InstrItinClass;
537def IIC_INS : InstrItinClass;
Simon Pilgrim99b925b2017-05-03 15:51:39 +0000538def IIC_LWP : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000539def IIC_MOV_REG_DR : InstrItinClass;
540def IIC_MOV_DR_REG : InstrItinClass;
541def IIC_MOV_REG_CR : InstrItinClass;
542def IIC_MOV_CR_REG : InstrItinClass;
543def IIC_MOV_REG_SR : InstrItinClass;
544def IIC_MOV_MEM_SR : InstrItinClass;
545def IIC_MOV_SR_REG : InstrItinClass;
546def IIC_MOV_SR_MEM : InstrItinClass;
547def IIC_LAR_RM : InstrItinClass;
548def IIC_LAR_RR : InstrItinClass;
549def IIC_LSL_RM : InstrItinClass;
550def IIC_LSL_RR : InstrItinClass;
551def IIC_LGDT : InstrItinClass;
552def IIC_LIDT : InstrItinClass;
553def IIC_LLDT_REG : InstrItinClass;
554def IIC_LLDT_MEM : InstrItinClass;
555def IIC_PUSH_CS : InstrItinClass;
556def IIC_PUSH_SR : InstrItinClass;
557def IIC_POP_SR : InstrItinClass;
558def IIC_POP_SR_SS : InstrItinClass;
Simon Pilgrim7e636cc2017-12-09 20:42:27 +0000559def IIC_SEGMENT_BASE_R : InstrItinClass;
560def IIC_SEGMENT_BASE_W : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000561def IIC_VERR : InstrItinClass;
562def IIC_VERW_REG : InstrItinClass;
563def IIC_VERW_MEM : InstrItinClass;
564def IIC_WRMSR : InstrItinClass;
565def IIC_RDMSR : InstrItinClass;
566def IIC_RDPMC : InstrItinClass;
567def IIC_SMSW : InstrItinClass;
568def IIC_LMSW_REG : InstrItinClass;
569def IIC_LMSW_MEM : InstrItinClass;
570def IIC_ENTER : InstrItinClass;
571def IIC_LEAVE : InstrItinClass;
572def IIC_POP_MEM : InstrItinClass;
573def IIC_POP_REG16 : InstrItinClass;
574def IIC_POP_REG : InstrItinClass;
575def IIC_POP_F : InstrItinClass;
576def IIC_POP_FD : InstrItinClass;
577def IIC_POP_A : InstrItinClass;
578def IIC_PUSH_IMM : InstrItinClass;
579def IIC_PUSH_MEM : InstrItinClass;
580def IIC_PUSH_REG : InstrItinClass;
581def IIC_PUSH_F : InstrItinClass;
582def IIC_PUSH_A : InstrItinClass;
583def IIC_BSWAP : InstrItinClass;
584def IIC_BIT_SCAN_MEM : InstrItinClass;
585def IIC_BIT_SCAN_REG : InstrItinClass;
Simon Pilgrimf1d599a2017-12-07 15:24:14 +0000586def IIC_LZCNT_RR : InstrItinClass;
587def IIC_LZCNT_RM : InstrItinClass;
588def IIC_TZCNT_RR : InstrItinClass;
589def IIC_TZCNT_RM : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000590def IIC_MOVS : InstrItinClass;
591def IIC_STOS : InstrItinClass;
592def IIC_SCAS : InstrItinClass;
593def IIC_CMPS : InstrItinClass;
594def IIC_MOV : InstrItinClass;
595def IIC_MOV_MEM : InstrItinClass;
596def IIC_AHF : InstrItinClass;
597def IIC_BT_MI : InstrItinClass;
598def IIC_BT_MR : InstrItinClass;
599def IIC_BT_RI : InstrItinClass;
600def IIC_BT_RR : InstrItinClass;
601def IIC_BTX_MI : InstrItinClass;
602def IIC_BTX_MR : InstrItinClass;
603def IIC_BTX_RI : InstrItinClass;
604def IIC_BTX_RR : InstrItinClass;
605def IIC_XCHG_REG : InstrItinClass;
606def IIC_XCHG_MEM : InstrItinClass;
607def IIC_XADD_REG : InstrItinClass;
608def IIC_XADD_MEM : InstrItinClass;
609def IIC_CMPXCHG_MEM : InstrItinClass;
610def IIC_CMPXCHG_REG : InstrItinClass;
611def IIC_CMPXCHG_MEM8 : InstrItinClass;
612def IIC_CMPXCHG_REG8 : InstrItinClass;
613def IIC_CMPXCHG_8B : InstrItinClass;
614def IIC_CMPXCHG_16B : InstrItinClass;
615def IIC_LODS : InstrItinClass;
616def IIC_OUTS : InstrItinClass;
617def IIC_CLC : InstrItinClass;
618def IIC_CLD : InstrItinClass;
619def IIC_CLI : InstrItinClass;
620def IIC_CMC : InstrItinClass;
621def IIC_CLTS : InstrItinClass;
622def IIC_STC : InstrItinClass;
623def IIC_STI : InstrItinClass;
624def IIC_STD : InstrItinClass;
625def IIC_XLAT : InstrItinClass;
626def IIC_AAA : InstrItinClass;
627def IIC_AAD : InstrItinClass;
628def IIC_AAM : InstrItinClass;
629def IIC_AAS : InstrItinClass;
630def IIC_DAA : InstrItinClass;
631def IIC_DAS : InstrItinClass;
632def IIC_BOUND : InstrItinClass;
633def IIC_ARPL_REG : InstrItinClass;
634def IIC_ARPL_MEM : InstrItinClass;
635def IIC_MOVBE : InstrItinClass;
636def IIC_AES : InstrItinClass;
637def IIC_BLEND_MEM : InstrItinClass;
638def IIC_BLEND_NOMEM : InstrItinClass;
639def IIC_CBW : InstrItinClass;
640def IIC_CRC32_REG : InstrItinClass;
641def IIC_CRC32_MEM : InstrItinClass;
642def IIC_SSE_DPPD_RR : InstrItinClass;
643def IIC_SSE_DPPD_RM : InstrItinClass;
644def IIC_SSE_DPPS_RR : InstrItinClass;
645def IIC_SSE_DPPS_RM : InstrItinClass;
646def IIC_MMX_EMMS : InstrItinClass;
647def IIC_SSE_EXTRACTPS_RR : InstrItinClass;
648def IIC_SSE_EXTRACTPS_RM : InstrItinClass;
649def IIC_SSE_INSERTPS_RR : InstrItinClass;
650def IIC_SSE_INSERTPS_RM : InstrItinClass;
651def IIC_SSE_MPSADBW_RR : InstrItinClass;
652def IIC_SSE_MPSADBW_RM : InstrItinClass;
653def IIC_SSE_PMULLD_RR : InstrItinClass;
654def IIC_SSE_PMULLD_RM : InstrItinClass;
655def IIC_SSE_ROUNDPS_REG : InstrItinClass;
656def IIC_SSE_ROUNDPS_MEM : InstrItinClass;
657def IIC_SSE_ROUNDPD_REG : InstrItinClass;
658def IIC_SSE_ROUNDPD_MEM : InstrItinClass;
659def IIC_SSE_POPCNT_RR : InstrItinClass;
660def IIC_SSE_POPCNT_RM : InstrItinClass;
661def IIC_SSE_PCLMULQDQ_RR : InstrItinClass;
662def IIC_SSE_PCLMULQDQ_RM : InstrItinClass;
663
664def IIC_NOP : InstrItinClass;
665
666//===----------------------------------------------------------------------===//
667// Processor instruction itineraries.
668
669// IssueWidth is analogous to the number of decode units. Core and its
670// descendents, including Nehalem and SandyBridge have 4 decoders.
671// Resources beyond the decoder operate on micro-ops and are bufferred
672// so adjacent micro-ops don't directly compete.
673//
674// MicroOpBufferSize > 1 indicates that RAW dependencies can be
675// decoded in the same cycle. The value 32 is a reasonably arbitrary
676// number of in-flight instructions.
677//
678// HighLatency=10 is optimistic. X86InstrInfo::isHighLatencyDef
679// indicates high latency opcodes. Alternatively, InstrItinData
680// entries may be included here to define specific operand
681// latencies. Since these latencies are not used for pipeline hazards,
682// they do not need to be exact.
683//
684// The GenericX86Model contains no instruction itineraries
685// and disables PostRAScheduler.
686class GenericX86Model : SchedMachineModel {
687 let IssueWidth = 4;
688 let MicroOpBufferSize = 32;
689 let LoadLatency = 4;
690 let HighLatency = 10;
691 let PostRAScheduler = 0;
692 let CompleteModel = 0;
693}
694
695def GenericModel : GenericX86Model;
696
697// Define a model with the PostRAScheduler enabled.
698def GenericPostRAModel : GenericX86Model {
699 let PostRAScheduler = 1;
700}
701