blob: 8dc2eac74ba41e72f76b8af9006f8f99d45efd6a [file] [log] [blame]
Simon Pilgrima271c542017-05-03 15:42:29 +00001//===-- X86Schedule.td - X86 Scheduling Definitions --------*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10// InstrSchedModel annotations for out-of-order CPUs.
11//
12// These annotations are independent of the itinerary classes defined below.
13
14// Instructions with folded loads need to read the memory operand immediately,
15// but other register operands don't have to be read until the load is ready.
16// These operands are marked with ReadAfterLd.
17def ReadAfterLd : SchedRead;
18
19// Instructions with both a load and a store folded are modeled as a folded
20// load + WriteRMW.
21def WriteRMW : SchedWrite;
22
23// Most instructions can fold loads, so almost every SchedWrite comes in two
24// variants: With and without a folded load.
25// An X86FoldableSchedWrite holds a reference to the corresponding SchedWrite
26// with a folded load.
27class X86FoldableSchedWrite : SchedWrite {
28 // The SchedWrite to use when a load is folded into the instruction.
 // Declared without a default value here; the X86SchedWritePair multiclass
 // assigns it to the matching "<name>Ld" record.
29 SchedWrite Folded;
30}
31
32// Multiclass that produces a linked pair of SchedWrites.
33multiclass X86SchedWritePair {
34 // Register-Memory operation.
 // Instantiated as "<defm name>Ld" (e.g. `defm WriteALU` yields WriteALULd).
35 def Ld : SchedWrite;
36 // Register-Register operation.
 // Instantiated under the defm name itself. Its Folded field is resolved by
 // looking up, by name, the "Ld" record defined just above, which links the
 // two halves of the pair.
37 def NAME : X86FoldableSchedWrite {
38 let Folded = !cast<SchedWrite>(NAME#"Ld");
39 }
40}
41
42// Arithmetic.
43defm WriteALU : X86SchedWritePair; // Simple integer ALU op.
Craig Topperf0d04262018-04-06 16:16:48 +000044def WriteALURMW : WriteSequence<[WriteALULd, WriteRMW]>;
Simon Pilgrima271c542017-05-03 15:42:29 +000045defm WriteIMul : X86SchedWritePair; // Integer multiplication.
46def WriteIMulH : SchedWrite; // Integer multiplication, high part.
47defm WriteIDiv : X86SchedWritePair; // Integer division.
48def WriteLEA : SchedWrite; // LEA instructions can't fold loads.
49
Simon Pilgrimf33d9052018-03-26 18:19:28 +000050defm WriteBitScan : X86SchedWritePair; // Bit scan forward/reverse.
51defm WritePOPCNT : X86SchedWritePair; // Bit population count.
52defm WriteLZCNT : X86SchedWritePair; // Leading zero count.
53defm WriteTZCNT : X86SchedWritePair; // Trailing zero count.
54
Simon Pilgrima271c542017-05-03 15:42:29 +000055// Integer shifts and rotates.
56defm WriteShift : X86SchedWritePair;
57
Craig Topper89310f52018-03-29 20:41:39 +000058// BMI1 BEXTR, BMI2 BZHI
59defm WriteBEXTR : X86SchedWritePair;
60defm WriteBZHI : X86SchedWritePair;
61
Simon Pilgrima271c542017-05-03 15:42:29 +000062// Loads, stores, and moves, not folded with other operations.
63def WriteLoad : SchedWrite;
64def WriteStore : SchedWrite;
65def WriteMove : SchedWrite;
66
67// Idioms that clear a register, like xorps %xmm0, %xmm0.
68// These can often bypass execution ports completely.
69def WriteZero : SchedWrite;
70
71// Branches don't produce values, so they have no latency, but they still
72// consume resources. Indirect branches can fold loads.
73defm WriteJump : X86SchedWritePair;
74
75// Floating point. This covers both scalar and vector operations.
Simon Pilgrimfb7aa572018-03-15 14:45:30 +000076def WriteFLoad : SchedWrite;
77def WriteFStore : SchedWrite;
78def WriteFMove : SchedWrite;
Simon Pilgrima271c542017-05-03 15:42:29 +000079defm WriteFAdd : X86SchedWritePair; // Floating point add/sub/compare.
80defm WriteFMul : X86SchedWritePair; // Floating point multiplication.
81defm WriteFDiv : X86SchedWritePair; // Floating point division.
82defm WriteFSqrt : X86SchedWritePair; // Floating point square root.
83defm WriteFRcp : X86SchedWritePair; // Floating point reciprocal estimate.
84defm WriteFRsqrt : X86SchedWritePair; // Floating point reciprocal square root estimate.
85defm WriteFMA : X86SchedWritePair; // Fused Multiply Add.
86defm WriteFShuffle : X86SchedWritePair; // Floating point vector shuffles.
87defm WriteFBlend : X86SchedWritePair; // Floating point vector blends.
88defm WriteFVarBlend : X86SchedWritePair; // Fp vector variable blends.
89
90// FMA Scheduling helper class.
// Carries a single X86FoldableSchedWrite field, Sched, whose default value is
// WriteFAdd. NOTE(review): presumably the FMA instruction definitions that
// use this class override Sched (e.g. with WriteFMA) -- confirm against the
// users of this class.
91class FMASC { X86FoldableSchedWrite Sched = WriteFAdd; }
92
Andrew V. Tischenko8cb1d092017-06-08 16:44:13 +000093// Horizontal Add/Sub (float and integer)
94defm WriteFHAdd : X86SchedWritePair;
95defm WritePHAdd : X86SchedWritePair;
96
Simon Pilgrima271c542017-05-03 15:42:29 +000097// Vector integer operations.
Simon Pilgrimfb7aa572018-03-15 14:45:30 +000098def WriteVecLoad : SchedWrite;
99def WriteVecStore : SchedWrite;
100def WriteVecMove : SchedWrite;
Simon Pilgrima271c542017-05-03 15:42:29 +0000101defm WriteVecALU : X86SchedWritePair; // Vector integer ALU op, no logicals.
102defm WriteVecShift : X86SchedWritePair; // Vector integer shifts.
103defm WriteVecIMul : X86SchedWritePair; // Vector integer multiply.
Craig Topper13a0f832018-03-31 04:54:32 +0000104defm WritePMULLD : X86SchedWritePair; // PMULLD
Simon Pilgrima271c542017-05-03 15:42:29 +0000105defm WriteShuffle : X86SchedWritePair; // Vector shuffles.
106defm WriteBlend : X86SchedWritePair; // Vector blends.
107defm WriteVarBlend : X86SchedWritePair; // Vector variable blends.
108defm WriteMPSAD : X86SchedWritePair; // Vector MPSAD.
109
110// Vector bitwise operations.
111// These are often used on both floating point and integer vectors.
112defm WriteVecLogic : X86SchedWritePair; // Vector and/or/xor.
113
Simon Pilgrima2f26782018-03-27 20:38:54 +0000114// MOVMSK operations.
115def WriteFMOVMSK : SchedWrite;
116def WriteVecMOVMSK : SchedWrite;
117def WriteMMXMOVMSK : SchedWrite;
118
Simon Pilgrima271c542017-05-03 15:42:29 +0000119// Conversion between integer and float.
120defm WriteCvtF2I : X86SchedWritePair; // Float -> Integer.
121defm WriteCvtI2F : X86SchedWritePair; // Integer -> Float.
122defm WriteCvtF2F : X86SchedWritePair; // Float -> Float size conversion.
123
Simon Pilgrim28e7bcb2018-03-26 21:06:14 +0000124// CRC32 instruction.
125defm WriteCRC32 : X86SchedWritePair;
126
Simon Pilgrima271c542017-05-03 15:42:29 +0000127// String instructions.
128// Packed Compare Implicit Length Strings, Return Mask
129defm WritePCmpIStrM : X86SchedWritePair;
130// Packed Compare Explicit Length Strings, Return Mask
131defm WritePCmpEStrM : X86SchedWritePair;
132// Packed Compare Implicit Length Strings, Return Index
133defm WritePCmpIStrI : X86SchedWritePair;
134// Packed Compare Explicit Length Strings, Return Index
135defm WritePCmpEStrI : X86SchedWritePair;
136
137// AES instructions.
138defm WriteAESDecEnc : X86SchedWritePair; // Decryption, encryption.
139defm WriteAESIMC : X86SchedWritePair; // InvMixColumn.
140defm WriteAESKeyGen : X86SchedWritePair; // Key Generation.
141
142// Carry-less multiplication instructions.
143defm WriteCLMul : X86SchedWritePair;
144
145// Catch-all for expensive system instructions.
146def WriteSystem : SchedWrite;
147
148// AVX2.
149defm WriteFShuffle256 : X86SchedWritePair; // Fp 256-bit width vector shuffles.
150defm WriteShuffle256 : X86SchedWritePair; // 256-bit width vector shuffles.
151defm WriteVarVecShift : X86SchedWritePair; // Variable vector shifts.
152
153// Old microcoded instructions that nobody uses.
154def WriteMicrocoded : SchedWrite;
155
156// Fence instructions.
157def WriteFence : SchedWrite;
158
159// Nop, not very useful except that it provides a model for nops!
160def WriteNop : SchedWrite;
161
162//===----------------------------------------------------------------------===//
163// Instruction Itinerary classes used for X86
164def IIC_ALU_MEM : InstrItinClass;
165def IIC_ALU_NONMEM : InstrItinClass;
166def IIC_LEA : InstrItinClass;
167def IIC_LEA_16 : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000168def IIC_MUL8_MEM : InstrItinClass;
169def IIC_MUL8_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000170def IIC_MUL16_MEM : InstrItinClass;
171def IIC_MUL16_REG : InstrItinClass;
172def IIC_MUL32_MEM : InstrItinClass;
173def IIC_MUL32_REG : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000174def IIC_MUL64_MEM : InstrItinClass;
175def IIC_MUL64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000176// imul by al, ax, eax, rax
Craig Topper5ccd8722018-03-19 16:38:33 +0000177def IIC_IMUL8_MEM : InstrItinClass;
178def IIC_IMUL8_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000179def IIC_IMUL16_MEM : InstrItinClass;
180def IIC_IMUL16_REG : InstrItinClass;
181def IIC_IMUL32_MEM : InstrItinClass;
182def IIC_IMUL32_REG : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000183def IIC_IMUL64_MEM : InstrItinClass;
184def IIC_IMUL64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000185// imul reg by reg|mem
186def IIC_IMUL16_RM : InstrItinClass;
187def IIC_IMUL16_RR : InstrItinClass;
188def IIC_IMUL32_RM : InstrItinClass;
189def IIC_IMUL32_RR : InstrItinClass;
190def IIC_IMUL64_RM : InstrItinClass;
191def IIC_IMUL64_RR : InstrItinClass;
192// imul reg = reg/mem * imm
193def IIC_IMUL16_RMI : InstrItinClass;
194def IIC_IMUL16_RRI : InstrItinClass;
195def IIC_IMUL32_RMI : InstrItinClass;
196def IIC_IMUL32_RRI : InstrItinClass;
197def IIC_IMUL64_RMI : InstrItinClass;
198def IIC_IMUL64_RRI : InstrItinClass;
199// div
200def IIC_DIV8_MEM : InstrItinClass;
201def IIC_DIV8_REG : InstrItinClass;
Craig Topper5ccd8722018-03-19 16:38:33 +0000202def IIC_DIV16_MEM : InstrItinClass;
203def IIC_DIV16_REG : InstrItinClass;
204def IIC_DIV32_MEM : InstrItinClass;
205def IIC_DIV32_REG : InstrItinClass;
206def IIC_DIV64_MEM : InstrItinClass;
207def IIC_DIV64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000208// idiv
Craig Topper5ccd8722018-03-19 16:38:33 +0000209def IIC_IDIV8_MEM : InstrItinClass;
210def IIC_IDIV8_REG : InstrItinClass;
211def IIC_IDIV16_MEM : InstrItinClass;
212def IIC_IDIV16_REG : InstrItinClass;
213def IIC_IDIV32_MEM : InstrItinClass;
214def IIC_IDIV32_REG : InstrItinClass;
215def IIC_IDIV64_MEM : InstrItinClass;
216def IIC_IDIV64_REG : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000217// neg/not/inc/dec
218def IIC_UNARY_REG : InstrItinClass;
219def IIC_UNARY_MEM : InstrItinClass;
220// add/sub/and/or/xor/sbb/cmp/test
221def IIC_BIN_MEM : InstrItinClass;
222def IIC_BIN_NONMEM : InstrItinClass;
223// adc/sbb
224def IIC_BIN_CARRY_MEM : InstrItinClass;
225def IIC_BIN_CARRY_NONMEM : InstrItinClass;
226// shift/rotate
227def IIC_SR : InstrItinClass;
228// shift double
229def IIC_SHD16_REG_IM : InstrItinClass;
230def IIC_SHD16_REG_CL : InstrItinClass;
231def IIC_SHD16_MEM_IM : InstrItinClass;
232def IIC_SHD16_MEM_CL : InstrItinClass;
233def IIC_SHD32_REG_IM : InstrItinClass;
234def IIC_SHD32_REG_CL : InstrItinClass;
235def IIC_SHD32_MEM_IM : InstrItinClass;
236def IIC_SHD32_MEM_CL : InstrItinClass;
237def IIC_SHD64_REG_IM : InstrItinClass;
238def IIC_SHD64_REG_CL : InstrItinClass;
239def IIC_SHD64_MEM_IM : InstrItinClass;
240def IIC_SHD64_MEM_CL : InstrItinClass;
241// cmov
242def IIC_CMOV16_RM : InstrItinClass;
243def IIC_CMOV16_RR : InstrItinClass;
244def IIC_CMOV32_RM : InstrItinClass;
245def IIC_CMOV32_RR : InstrItinClass;
246def IIC_CMOV64_RM : InstrItinClass;
247def IIC_CMOV64_RR : InstrItinClass;
248// set
249def IIC_SET_R : InstrItinClass;
250def IIC_SET_M : InstrItinClass;
251// jmp/jcc/jcxz
252def IIC_Jcc : InstrItinClass;
253def IIC_JCXZ : InstrItinClass;
254def IIC_JMP_REL : InstrItinClass;
255def IIC_JMP_REG : InstrItinClass;
256def IIC_JMP_MEM : InstrItinClass;
257def IIC_JMP_FAR_MEM : InstrItinClass;
258def IIC_JMP_FAR_PTR : InstrItinClass;
259// loop
260def IIC_LOOP : InstrItinClass;
261def IIC_LOOPE : InstrItinClass;
262def IIC_LOOPNE : InstrItinClass;
263// call
264def IIC_CALL_RI : InstrItinClass;
265def IIC_CALL_MEM : InstrItinClass;
266def IIC_CALL_FAR_MEM : InstrItinClass;
267def IIC_CALL_FAR_PTR : InstrItinClass;
268// ret
269def IIC_RET : InstrItinClass;
270def IIC_RET_IMM : InstrItinClass;
271//sign extension movs
272def IIC_MOVSX : InstrItinClass;
273def IIC_MOVSX_R16_R8 : InstrItinClass;
274def IIC_MOVSX_R16_M8 : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000275//zero extension movs
276def IIC_MOVZX : InstrItinClass;
277def IIC_MOVZX_R16_R8 : InstrItinClass;
278def IIC_MOVZX_R16_M8 : InstrItinClass;
279
280def IIC_REP_MOVS : InstrItinClass;
281def IIC_REP_STOS : InstrItinClass;
282
283// SSE scalar/parallel binary operations
284def IIC_SSE_ALU_F32S_RR : InstrItinClass;
285def IIC_SSE_ALU_F32S_RM : InstrItinClass;
286def IIC_SSE_ALU_F64S_RR : InstrItinClass;
287def IIC_SSE_ALU_F64S_RM : InstrItinClass;
288def IIC_SSE_MUL_F32S_RR : InstrItinClass;
289def IIC_SSE_MUL_F32S_RM : InstrItinClass;
290def IIC_SSE_MUL_F64S_RR : InstrItinClass;
291def IIC_SSE_MUL_F64S_RM : InstrItinClass;
292def IIC_SSE_DIV_F32S_RR : InstrItinClass;
293def IIC_SSE_DIV_F32S_RM : InstrItinClass;
294def IIC_SSE_DIV_F64S_RR : InstrItinClass;
295def IIC_SSE_DIV_F64S_RM : InstrItinClass;
296def IIC_SSE_ALU_F32P_RR : InstrItinClass;
297def IIC_SSE_ALU_F32P_RM : InstrItinClass;
298def IIC_SSE_ALU_F64P_RR : InstrItinClass;
299def IIC_SSE_ALU_F64P_RM : InstrItinClass;
300def IIC_SSE_MUL_F32P_RR : InstrItinClass;
301def IIC_SSE_MUL_F32P_RM : InstrItinClass;
302def IIC_SSE_MUL_F64P_RR : InstrItinClass;
303def IIC_SSE_MUL_F64P_RM : InstrItinClass;
304def IIC_SSE_DIV_F32P_RR : InstrItinClass;
305def IIC_SSE_DIV_F32P_RM : InstrItinClass;
306def IIC_SSE_DIV_F64P_RR : InstrItinClass;
307def IIC_SSE_DIV_F64P_RM : InstrItinClass;
308
309def IIC_SSE_COMIS_RR : InstrItinClass;
310def IIC_SSE_COMIS_RM : InstrItinClass;
311
312def IIC_SSE_HADDSUB_RR : InstrItinClass;
313def IIC_SSE_HADDSUB_RM : InstrItinClass;
314
315def IIC_SSE_BIT_P_RR : InstrItinClass;
316def IIC_SSE_BIT_P_RM : InstrItinClass;
317
318def IIC_SSE_INTALU_P_RR : InstrItinClass;
319def IIC_SSE_INTALU_P_RM : InstrItinClass;
320def IIC_SSE_INTALUQ_P_RR : InstrItinClass;
321def IIC_SSE_INTALUQ_P_RM : InstrItinClass;
322
323def IIC_SSE_INTMUL_P_RR : InstrItinClass;
324def IIC_SSE_INTMUL_P_RM : InstrItinClass;
325
326def IIC_SSE_INTSH_P_RR : InstrItinClass;
327def IIC_SSE_INTSH_P_RM : InstrItinClass;
328def IIC_SSE_INTSH_P_RI : InstrItinClass;
329
330def IIC_SSE_INTSHDQ_P_RI : InstrItinClass;
331
332def IIC_SSE_SHUFP : InstrItinClass;
333def IIC_SSE_PSHUF_RI : InstrItinClass;
334def IIC_SSE_PSHUF_MI : InstrItinClass;
335
Simon Pilgrim3f24ff62017-08-01 16:47:48 +0000336def IIC_SSE_PACK : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000337def IIC_SSE_UNPCK : InstrItinClass;
338
339def IIC_SSE_MOVMSK : InstrItinClass;
340def IIC_SSE_MASKMOV : InstrItinClass;
341
342def IIC_SSE_PEXTRW : InstrItinClass;
343def IIC_SSE_PINSRW : InstrItinClass;
344
345def IIC_SSE_PABS_RR : InstrItinClass;
346def IIC_SSE_PABS_RM : InstrItinClass;
347
348def IIC_SSE_SQRTPS_RR : InstrItinClass;
349def IIC_SSE_SQRTPS_RM : InstrItinClass;
350def IIC_SSE_SQRTSS_RR : InstrItinClass;
351def IIC_SSE_SQRTSS_RM : InstrItinClass;
352def IIC_SSE_SQRTPD_RR : InstrItinClass;
353def IIC_SSE_SQRTPD_RM : InstrItinClass;
354def IIC_SSE_SQRTSD_RR : InstrItinClass;
355def IIC_SSE_SQRTSD_RM : InstrItinClass;
356
357def IIC_SSE_RSQRTPS_RR : InstrItinClass;
358def IIC_SSE_RSQRTPS_RM : InstrItinClass;
359def IIC_SSE_RSQRTSS_RR : InstrItinClass;
360def IIC_SSE_RSQRTSS_RM : InstrItinClass;
361
362def IIC_SSE_RCPP_RR : InstrItinClass;
363def IIC_SSE_RCPP_RM : InstrItinClass;
364def IIC_SSE_RCPS_RR : InstrItinClass;
365def IIC_SSE_RCPS_RM : InstrItinClass;
366
367def IIC_SSE_MOV_S_RR : InstrItinClass;
368def IIC_SSE_MOV_S_RM : InstrItinClass;
369def IIC_SSE_MOV_S_MR : InstrItinClass;
370
371def IIC_SSE_MOVA_P_RR : InstrItinClass;
372def IIC_SSE_MOVA_P_RM : InstrItinClass;
373def IIC_SSE_MOVA_P_MR : InstrItinClass;
374
375def IIC_SSE_MOVU_P_RR : InstrItinClass;
376def IIC_SSE_MOVU_P_RM : InstrItinClass;
377def IIC_SSE_MOVU_P_MR : InstrItinClass;
378
379def IIC_SSE_MOVDQ : InstrItinClass;
380def IIC_SSE_MOVD_ToGP : InstrItinClass;
381def IIC_SSE_MOVQ_RR : InstrItinClass;
382
383def IIC_SSE_MOV_LH : InstrItinClass;
384
385def IIC_SSE_LDDQU : InstrItinClass;
386
387def IIC_SSE_MOVNT : InstrItinClass;
388
389def IIC_SSE_PHADDSUBD_RR : InstrItinClass;
390def IIC_SSE_PHADDSUBD_RM : InstrItinClass;
391def IIC_SSE_PHADDSUBSW_RR : InstrItinClass;
392def IIC_SSE_PHADDSUBSW_RM : InstrItinClass;
393def IIC_SSE_PHADDSUBW_RR : InstrItinClass;
394def IIC_SSE_PHADDSUBW_RM : InstrItinClass;
395def IIC_SSE_PSHUFB_RR : InstrItinClass;
396def IIC_SSE_PSHUFB_RM : InstrItinClass;
397def IIC_SSE_PSIGN_RR : InstrItinClass;
398def IIC_SSE_PSIGN_RM : InstrItinClass;
399
400def IIC_SSE_PMADD : InstrItinClass;
401def IIC_SSE_PMULHRSW : InstrItinClass;
402def IIC_SSE_PALIGNRR : InstrItinClass;
403def IIC_SSE_PALIGNRM : InstrItinClass;
404def IIC_SSE_MWAIT : InstrItinClass;
405def IIC_SSE_MONITOR : InstrItinClass;
406def IIC_SSE_MWAITX : InstrItinClass;
407def IIC_SSE_MONITORX : InstrItinClass;
408def IIC_SSE_CLZERO : InstrItinClass;
409
410def IIC_SSE_PREFETCH : InstrItinClass;
411def IIC_SSE_PAUSE : InstrItinClass;
412def IIC_SSE_LFENCE : InstrItinClass;
413def IIC_SSE_MFENCE : InstrItinClass;
414def IIC_SSE_SFENCE : InstrItinClass;
415def IIC_SSE_LDMXCSR : InstrItinClass;
416def IIC_SSE_STMXCSR : InstrItinClass;
417
418def IIC_SSE_CVT_PD_RR : InstrItinClass;
419def IIC_SSE_CVT_PD_RM : InstrItinClass;
420def IIC_SSE_CVT_PS_RR : InstrItinClass;
421def IIC_SSE_CVT_PS_RM : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000422def IIC_SSE_CVT_Scalar_RR : InstrItinClass;
423def IIC_SSE_CVT_Scalar_RM : InstrItinClass;
424def IIC_SSE_CVT_SS2SI32_RM : InstrItinClass;
425def IIC_SSE_CVT_SS2SI32_RR : InstrItinClass;
426def IIC_SSE_CVT_SS2SI64_RM : InstrItinClass;
427def IIC_SSE_CVT_SS2SI64_RR : InstrItinClass;
428def IIC_SSE_CVT_SD2SI_RM : InstrItinClass;
429def IIC_SSE_CVT_SD2SI_RR : InstrItinClass;
430
Simon Pilgrim91c159d2017-12-10 12:26:35 +0000431def IIC_AVX_ZERO : InstrItinClass;
432
Simon Pilgrima271c542017-05-03 15:42:29 +0000433// MMX
434def IIC_MMX_MOV_MM_RM : InstrItinClass;
435def IIC_MMX_MOV_REG_MM : InstrItinClass;
436def IIC_MMX_MOVQ_RM : InstrItinClass;
437def IIC_MMX_MOVQ_RR : InstrItinClass;
438
439def IIC_MMX_ALU_RM : InstrItinClass;
440def IIC_MMX_ALU_RR : InstrItinClass;
441def IIC_MMX_ALUQ_RM : InstrItinClass;
442def IIC_MMX_ALUQ_RR : InstrItinClass;
443def IIC_MMX_PHADDSUBW_RM : InstrItinClass;
444def IIC_MMX_PHADDSUBW_RR : InstrItinClass;
445def IIC_MMX_PHADDSUBD_RM : InstrItinClass;
446def IIC_MMX_PHADDSUBD_RR : InstrItinClass;
447def IIC_MMX_PMUL : InstrItinClass;
448def IIC_MMX_MISC_FUNC_MEM : InstrItinClass;
449def IIC_MMX_MISC_FUNC_REG : InstrItinClass;
450def IIC_MMX_PSADBW : InstrItinClass;
451def IIC_MMX_SHIFT_RI : InstrItinClass;
452def IIC_MMX_SHIFT_RM : InstrItinClass;
453def IIC_MMX_SHIFT_RR : InstrItinClass;
454def IIC_MMX_UNPCK_H_RM : InstrItinClass;
455def IIC_MMX_UNPCK_H_RR : InstrItinClass;
456def IIC_MMX_UNPCK_L : InstrItinClass;
457def IIC_MMX_PCK_RM : InstrItinClass;
458def IIC_MMX_PCK_RR : InstrItinClass;
459def IIC_MMX_PSHUF : InstrItinClass;
460def IIC_MMX_PEXTR : InstrItinClass;
461def IIC_MMX_PINSRW : InstrItinClass;
462def IIC_MMX_MASKMOV : InstrItinClass;
Simon Pilgrimf545bb6c2017-11-26 17:56:07 +0000463def IIC_MMX_MOVMSK : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000464def IIC_MMX_CVT_PD_RR : InstrItinClass;
465def IIC_MMX_CVT_PD_RM : InstrItinClass;
466def IIC_MMX_CVT_PS_RR : InstrItinClass;
467def IIC_MMX_CVT_PS_RM : InstrItinClass;
468
Simon Pilgrimfe6e92d2017-11-26 20:50:29 +0000469def IIC_3DNOW_FALU_RM : InstrItinClass;
470def IIC_3DNOW_FALU_RR : InstrItinClass;
471def IIC_3DNOW_FCVT_F2I_RM : InstrItinClass;
472def IIC_3DNOW_FCVT_F2I_RR : InstrItinClass;
473def IIC_3DNOW_FCVT_I2F_RM : InstrItinClass;
474def IIC_3DNOW_FCVT_I2F_RR : InstrItinClass;
475def IIC_3DNOW_MISC_FUNC_REG : InstrItinClass;
476def IIC_3DNOW_MISC_FUNC_MEM : InstrItinClass;
477
Simon Pilgrima271c542017-05-03 15:42:29 +0000478def IIC_CMPX_LOCK : InstrItinClass;
479def IIC_CMPX_LOCK_8 : InstrItinClass;
480def IIC_CMPX_LOCK_8B : InstrItinClass;
481def IIC_CMPX_LOCK_16B : InstrItinClass;
482
483def IIC_XADD_LOCK_MEM : InstrItinClass;
484def IIC_XADD_LOCK_MEM8 : InstrItinClass;
485
Simon Pilgrim65f805f2017-12-05 18:01:26 +0000486def IIC_FCMOV : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000487def IIC_FILD : InstrItinClass;
488def IIC_FLD : InstrItinClass;
489def IIC_FLD80 : InstrItinClass;
490def IIC_FST : InstrItinClass;
491def IIC_FST80 : InstrItinClass;
492def IIC_FIST : InstrItinClass;
493def IIC_FLDZ : InstrItinClass;
494def IIC_FUCOM : InstrItinClass;
495def IIC_FUCOMI : InstrItinClass;
496def IIC_FCOMI : InstrItinClass;
497def IIC_FNSTSW : InstrItinClass;
498def IIC_FNSTCW : InstrItinClass;
499def IIC_FLDCW : InstrItinClass;
500def IIC_FNINIT : InstrItinClass;
501def IIC_FFREE : InstrItinClass;
502def IIC_FNCLEX : InstrItinClass;
503def IIC_WAIT : InstrItinClass;
504def IIC_FXAM : InstrItinClass;
505def IIC_FNOP : InstrItinClass;
506def IIC_FLDL : InstrItinClass;
507def IIC_F2XM1 : InstrItinClass;
508def IIC_FYL2X : InstrItinClass;
509def IIC_FPTAN : InstrItinClass;
510def IIC_FPATAN : InstrItinClass;
511def IIC_FXTRACT : InstrItinClass;
512def IIC_FPREM1 : InstrItinClass;
513def IIC_FPSTP : InstrItinClass;
514def IIC_FPREM : InstrItinClass;
Simon Pilgrim0747a7e2017-11-28 15:03:42 +0000515def IIC_FSIGN : InstrItinClass;
516def IIC_FSQRT : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000517def IIC_FYL2XP1 : InstrItinClass;
518def IIC_FSINCOS : InstrItinClass;
519def IIC_FRNDINT : InstrItinClass;
520def IIC_FSCALE : InstrItinClass;
521def IIC_FCOMPP : InstrItinClass;
522def IIC_FXSAVE : InstrItinClass;
523def IIC_FXRSTOR : InstrItinClass;
524
525def IIC_FXCH : InstrItinClass;
526
527// System instructions
528def IIC_CPUID : InstrItinClass;
529def IIC_INT : InstrItinClass;
530def IIC_INT3 : InstrItinClass;
531def IIC_INVD : InstrItinClass;
532def IIC_INVLPG : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000533def IIC_INVPCID : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000534def IIC_IRET : InstrItinClass;
535def IIC_HLT : InstrItinClass;
536def IIC_LXS : InstrItinClass;
537def IIC_LTR : InstrItinClass;
Simon Pilgrim42fcda92017-12-08 19:03:42 +0000538def IIC_MPX : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000539def IIC_PKU : InstrItinClass;
540def IIC_PTWRITE : InstrItinClass;
541def IIC_RDPID : InstrItinClass;
Simon Pilgrim60411d92017-12-07 14:18:48 +0000542def IIC_RDRAND : InstrItinClass;
543def IIC_RDSEED : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000544def IIC_RDTSC : InstrItinClass;
Simon Pilgrimf00ea1b2017-12-13 14:22:04 +0000545def IIC_RDTSCP : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000546def IIC_RSM : InstrItinClass;
547def IIC_SIDT : InstrItinClass;
548def IIC_SGDT : InstrItinClass;
549def IIC_SLDT : InstrItinClass;
Simon Pilgrim1ddcae62017-12-08 15:48:37 +0000550def IIC_SMAP : InstrItinClass;
551def IIC_SMX : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000552def IIC_STR : InstrItinClass;
Simon Pilgrim6b7cd862017-12-07 14:35:17 +0000553def IIC_SKINIT : InstrItinClass;
554def IIC_SVM : InstrItinClass;
Simon Pilgrima13271b2017-12-07 15:57:32 +0000555def IIC_VMX : InstrItinClass;
Simon Pilgrim6b7cd862017-12-07 14:35:17 +0000556def IIC_CLGI : InstrItinClass;
557def IIC_STGI : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000558def IIC_SWAPGS : InstrItinClass;
559def IIC_SYSCALL : InstrItinClass;
560def IIC_SYS_ENTER_EXIT : InstrItinClass;
561def IIC_IN_RR : InstrItinClass;
562def IIC_IN_RI : InstrItinClass;
563def IIC_OUT_RR : InstrItinClass;
564def IIC_OUT_IR : InstrItinClass;
565def IIC_INS : InstrItinClass;
Simon Pilgrim99b925b2017-05-03 15:51:39 +0000566def IIC_LWP : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000567def IIC_MOV_REG_DR : InstrItinClass;
568def IIC_MOV_DR_REG : InstrItinClass;
569def IIC_MOV_REG_CR : InstrItinClass;
570def IIC_MOV_CR_REG : InstrItinClass;
571def IIC_MOV_REG_SR : InstrItinClass;
572def IIC_MOV_MEM_SR : InstrItinClass;
573def IIC_MOV_SR_REG : InstrItinClass;
574def IIC_MOV_SR_MEM : InstrItinClass;
575def IIC_LAR_RM : InstrItinClass;
576def IIC_LAR_RR : InstrItinClass;
577def IIC_LSL_RM : InstrItinClass;
578def IIC_LSL_RR : InstrItinClass;
579def IIC_LGDT : InstrItinClass;
580def IIC_LIDT : InstrItinClass;
581def IIC_LLDT_REG : InstrItinClass;
582def IIC_LLDT_MEM : InstrItinClass;
583def IIC_PUSH_CS : InstrItinClass;
584def IIC_PUSH_SR : InstrItinClass;
585def IIC_POP_SR : InstrItinClass;
586def IIC_POP_SR_SS : InstrItinClass;
Simon Pilgrim7e636cc2017-12-09 20:42:27 +0000587def IIC_SEGMENT_BASE_R : InstrItinClass;
588def IIC_SEGMENT_BASE_W : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000589def IIC_VERR : InstrItinClass;
590def IIC_VERW_REG : InstrItinClass;
591def IIC_VERW_MEM : InstrItinClass;
592def IIC_WRMSR : InstrItinClass;
593def IIC_RDMSR : InstrItinClass;
594def IIC_RDPMC : InstrItinClass;
595def IIC_SMSW : InstrItinClass;
596def IIC_LMSW_REG : InstrItinClass;
597def IIC_LMSW_MEM : InstrItinClass;
598def IIC_ENTER : InstrItinClass;
599def IIC_LEAVE : InstrItinClass;
600def IIC_POP_MEM : InstrItinClass;
601def IIC_POP_REG16 : InstrItinClass;
602def IIC_POP_REG : InstrItinClass;
603def IIC_POP_F : InstrItinClass;
604def IIC_POP_FD : InstrItinClass;
605def IIC_POP_A : InstrItinClass;
606def IIC_PUSH_IMM : InstrItinClass;
607def IIC_PUSH_MEM : InstrItinClass;
608def IIC_PUSH_REG : InstrItinClass;
609def IIC_PUSH_F : InstrItinClass;
610def IIC_PUSH_A : InstrItinClass;
611def IIC_BSWAP : InstrItinClass;
612def IIC_BIT_SCAN_MEM : InstrItinClass;
613def IIC_BIT_SCAN_REG : InstrItinClass;
Simon Pilgrimf1d599a2017-12-07 15:24:14 +0000614def IIC_LZCNT_RR : InstrItinClass;
615def IIC_LZCNT_RM : InstrItinClass;
616def IIC_TZCNT_RR : InstrItinClass;
617def IIC_TZCNT_RM : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000618def IIC_MOVS : InstrItinClass;
619def IIC_STOS : InstrItinClass;
620def IIC_SCAS : InstrItinClass;
621def IIC_CMPS : InstrItinClass;
622def IIC_MOV : InstrItinClass;
623def IIC_MOV_MEM : InstrItinClass;
624def IIC_AHF : InstrItinClass;
625def IIC_BT_MI : InstrItinClass;
626def IIC_BT_MR : InstrItinClass;
627def IIC_BT_RI : InstrItinClass;
628def IIC_BT_RR : InstrItinClass;
629def IIC_BTX_MI : InstrItinClass;
630def IIC_BTX_MR : InstrItinClass;
631def IIC_BTX_RI : InstrItinClass;
632def IIC_BTX_RR : InstrItinClass;
633def IIC_XCHG_REG : InstrItinClass;
634def IIC_XCHG_MEM : InstrItinClass;
635def IIC_XADD_REG : InstrItinClass;
636def IIC_XADD_MEM : InstrItinClass;
637def IIC_CMPXCHG_MEM : InstrItinClass;
638def IIC_CMPXCHG_REG : InstrItinClass;
639def IIC_CMPXCHG_MEM8 : InstrItinClass;
640def IIC_CMPXCHG_REG8 : InstrItinClass;
641def IIC_CMPXCHG_8B : InstrItinClass;
642def IIC_CMPXCHG_16B : InstrItinClass;
643def IIC_LODS : InstrItinClass;
644def IIC_OUTS : InstrItinClass;
Craig Topper22d25a02018-04-06 16:16:43 +0000645def IIC_CLC_CMC_STC : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000646def IIC_CLD : InstrItinClass;
647def IIC_CLI : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000648def IIC_CLTS : InstrItinClass;
Simon Pilgrima271c542017-05-03 15:42:29 +0000649def IIC_STI : InstrItinClass;
650def IIC_STD : InstrItinClass;
651def IIC_XLAT : InstrItinClass;
652def IIC_AAA : InstrItinClass;
653def IIC_AAD : InstrItinClass;
654def IIC_AAM : InstrItinClass;
655def IIC_AAS : InstrItinClass;
656def IIC_DAA : InstrItinClass;
657def IIC_DAS : InstrItinClass;
658def IIC_BOUND : InstrItinClass;
659def IIC_ARPL_REG : InstrItinClass;
660def IIC_ARPL_MEM : InstrItinClass;
661def IIC_MOVBE : InstrItinClass;
662def IIC_AES : InstrItinClass;
663def IIC_BLEND_MEM : InstrItinClass;
664def IIC_BLEND_NOMEM : InstrItinClass;
665def IIC_CBW : InstrItinClass;
666def IIC_CRC32_REG : InstrItinClass;
667def IIC_CRC32_MEM : InstrItinClass;
668def IIC_SSE_DPPD_RR : InstrItinClass;
669def IIC_SSE_DPPD_RM : InstrItinClass;
670def IIC_SSE_DPPS_RR : InstrItinClass;
671def IIC_SSE_DPPS_RM : InstrItinClass;
672def IIC_MMX_EMMS : InstrItinClass;
673def IIC_SSE_EXTRACTPS_RR : InstrItinClass;
674def IIC_SSE_EXTRACTPS_RM : InstrItinClass;
675def IIC_SSE_INSERTPS_RR : InstrItinClass;
676def IIC_SSE_INSERTPS_RM : InstrItinClass;
677def IIC_SSE_MPSADBW_RR : InstrItinClass;
678def IIC_SSE_MPSADBW_RM : InstrItinClass;
679def IIC_SSE_PMULLD_RR : InstrItinClass;
680def IIC_SSE_PMULLD_RM : InstrItinClass;
681def IIC_SSE_ROUNDPS_REG : InstrItinClass;
682def IIC_SSE_ROUNDPS_MEM : InstrItinClass;
683def IIC_SSE_ROUNDPD_REG : InstrItinClass;
684def IIC_SSE_ROUNDPD_MEM : InstrItinClass;
685def IIC_SSE_POPCNT_RR : InstrItinClass;
686def IIC_SSE_POPCNT_RM : InstrItinClass;
687def IIC_SSE_PCLMULQDQ_RR : InstrItinClass;
688def IIC_SSE_PCLMULQDQ_RM : InstrItinClass;
689
690def IIC_NOP : InstrItinClass;
691
692//===----------------------------------------------------------------------===//
693// Processor instruction itineraries.
694
695// IssueWidth is analogous to the number of decode units. Core and its
696// descendants, including Nehalem and SandyBridge, have 4 decoders.
697// Resources beyond the decoder operate on micro-ops and are buffered
698// so adjacent micro-ops don't directly compete.
699//
700// MicroOpBufferSize > 1 indicates that RAW dependencies can be
701// decoded in the same cycle. The value 32 is a reasonably arbitrary
702// number of in-flight instructions.
703//
704// HighLatency=10 is optimistic. X86InstrInfo::isHighLatencyDef
705// indicates high latency opcodes. Alternatively, InstrItinData
706// entries may be included here to define specific operand
707// latencies. Since these latencies are not used for pipeline hazards,
708// they do not need to be exact.
709//
710// The GenericX86Model contains no instruction itineraries
711// and disables PostRAScheduler.
712class GenericX86Model : SchedMachineModel {
 // Analogous to the number of decode units (4 on Core and its descendants).
713 let IssueWidth = 4;
 // > 1 means RAW dependencies can be decoded in the same cycle; 32 is a
 // reasonably arbitrary number of in-flight instructions.
714 let MicroOpBufferSize = 32;
 // NOTE(review): not explained in the header comment; presumably the default
 // latency, in cycles, of a load -- confirm against SchedMachineModel.
715 let LoadLatency = 4;
 // Optimistic value; these latencies are not used for pipeline hazards, so
 // they do not need to be exact.
716 let HighLatency = 10;
 // The base model disables the post-RA scheduler; derived models may
 // override this.
717 let PostRAScheduler = 0;
 // NOTE(review): presumably marks the model as not covering every
 // instruction -- confirm against SchedMachineModel.
718 let CompleteModel = 0;
719}
720
// Baseline generic model: GenericX86Model with no overrides, so
// PostRAScheduler keeps its value of 0.
721def GenericModel : GenericX86Model;
722
723// Define a model with the PostRAScheduler enabled.
// Identical to GenericX86Model except that PostRAScheduler is overridden to 1.
724def GenericPostRAModel : GenericX86Model {
725 let PostRAScheduler = 1;
726}
727