blob: 528c4ec7378194972aef5e8bec58033e00f72be9 [file] [log] [blame]
Jia Liub22310f2012-02-18 12:03:15 +00001//===-- ARMSchedule.td - ARM Scheduling Definitions --------*- tablegen -*-===//
2//
Evan Cheng4e712de2009-06-19 01:51:50 +00003// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Jia Liub22310f2012-02-18 12:03:15 +00007//
Evan Cheng4e712de2009-06-19 01:51:50 +00008//===----------------------------------------------------------------------===//
Arnold Schwaighoferfb1dddc2013-03-26 02:01:39 +00009//===----------------------------------------------------------------------===//
10// Instruction scheduling annotations for out-of-order CPUs.
11// These annotations are independent of the itinerary class defined below.
12// Here we define the subtarget independent read/write per-operand resources.
13// The subtarget schedule definitions will then map these to the subtarget's
14// resource usages.
15// For example:
16// The instruction cycle timings table might contain an entry for an operation
17// like the following:
18// Rd <- ADD Rn, Rm, <shift> Rs
19// Uops | Latency from register | Uops - resource requirements - latency
20// 2 | Rn: 1 Rm: 4 Rs: 4 | uop T0, Rm, Rs - P01 - 3
21// | | uopc Rd, Rn, T0 - P01 - 1
22// This is telling us that the result will be available in destination register
23// Rd after a minimum of three cycles after the result in Rm and Rs is available
24// and one cycle after the result in Rn is available. The micro-ops can execute
25// on resource P01.
26// To model this, we need to express that we need to dispatch two micro-ops,
27// that the resource P01 is needed and that the latency to Rn is different than
28// the latency to Rm and Rs. The scheduler can decrease Rn's producer latency by
29// two.
30// We will do this by assigning (abstract) resources to register defs/uses.
31// ARMSchedule.td:
32// def WriteALUsr : SchedWrite;
33// def ReadAdvanceALUsr : ScheRead;
34//
35// ARMInstrInfo.td:
36// def ADDrs : I<>, Sched<[WriteALUsr, ReadAdvanceALUsr, ReadDefault,
37// ReadDefault]> { ...}
38// ReadAdvance read resources allow us to define "pipeline by-passes" or
39// shorter latencies to certain registers as needed in the example above.
40// The "ReadDefault" can be omitted.
41// Next, the subtarget td file assigns resources to the abstract resources
42// defined here.
43// ARMScheduleSubtarget.td:
44// // Resources.
45// def P01 : ProcResource<3>; // ALU unit (3 of it).
46// ...
47// // Resource usages.
48// def : WriteRes<WriteALUsr, [P01, P01]> {
49// Latency = 4; // Latency of 4.
50// NumMicroOps = 2; // Dispatch 2 micro-ops.
51// // The two instances of resource P01 are occupied for one cycle. It is one
52// // cycle because these resources happen to be pipelined.
53// ResourceCycles = [1, 1];
54// }
55// def : ReadAdvance<ReadAdvanceALUsr, 3>;
56
57// Basic ALU operation.
58def WriteALU : SchedWrite;
Arnold Schwaighofer6793aeb2013-04-01 13:07:05 +000059def ReadALU : SchedRead;
Arnold Schwaighoferfb1dddc2013-03-26 02:01:39 +000060
61// Basic ALU with shifts.
62def WriteALUsi : SchedWrite; // Shift by immediate.
63def WriteALUsr : SchedWrite; // Shift by register.
64def WriteALUSsr : SchedWrite; // Shift by register (flag setting).
Arnold Schwaighofer6793aeb2013-04-01 13:07:05 +000065def ReadALUsr : SchedRead; // Some operands are read later.
66
Arnold Schwaighoferfb6b9f42013-04-05 05:01:06 +000067// Compares.
68def WriteCMP : SchedWrite;
69def WriteCMPsi : SchedWrite;
70def WriteCMPsr : SchedWrite;
71
Arnold Schwaighofer2773f1d2013-06-05 16:06:11 +000072// Division.
73def WriteDiv : SchedWrite;
74
75// Loads.
76def WriteLd : SchedWrite;
77def WritePreLd : SchedWrite;
78
79// Branches.
80def WriteBr : SchedWrite;
81def WriteBrL : SchedWrite;
82def WriteBrTbl : SchedWrite;
83
84// Fixpoint conversions.
85def WriteCvtFP : SchedWrite;
86
Arnold Schwaighofereac54472013-06-06 20:26:18 +000087// Noop.
88def WriteNoop : SchedWrite;
89
Arnold Schwaighofer6793aeb2013-04-01 13:07:05 +000090// Define TII for use in SchedVariant Predicates.
91def : PredicateProlog<[{
92 const ARMBaseInstrInfo *TII =
93 static_cast<const ARMBaseInstrInfo*>(SchedModel->getInstrInfo());
94 (void)TII;
95}]>;
Evan Cheng4e712de2009-06-19 01:51:50 +000096
Arnold Schwaighofer5dde1f32013-04-05 04:42:00 +000097def IsPredicatedPred : SchedPredicate<[{TII->isPredicated(MI)}]>;
98
Evan Cheng4e712de2009-06-19 01:51:50 +000099//===----------------------------------------------------------------------===//
Evan Cheng4e712de2009-06-19 01:51:50 +0000100// Instruction Itinerary classes used for ARM
101//
David Goodwina7c2dfb2009-08-19 18:00:44 +0000102def IIC_iALUx : InstrItinClass;
103def IIC_iALUi : InstrItinClass;
104def IIC_iALUr : InstrItinClass;
105def IIC_iALUsi : InstrItinClass;
Evan Cheng4a010fd2010-09-29 22:42:35 +0000106def IIC_iALUsir : InstrItinClass;
David Goodwina7c2dfb2009-08-19 18:00:44 +0000107def IIC_iALUsr : InstrItinClass;
Evan Chengc35d7bb2010-09-29 00:27:46 +0000108def IIC_iBITi : InstrItinClass;
109def IIC_iBITr : InstrItinClass;
110def IIC_iBITsi : InstrItinClass;
111def IIC_iBITsr : InstrItinClass;
David Goodwina7c2dfb2009-08-19 18:00:44 +0000112def IIC_iUNAr : InstrItinClass;
113def IIC_iUNAsi : InstrItinClass;
Evan Cheng62d626c2010-09-25 00:49:35 +0000114def IIC_iEXTr : InstrItinClass;
115def IIC_iEXTAr : InstrItinClass;
Evan Chengc35d7bb2010-09-29 00:27:46 +0000116def IIC_iEXTAsr : InstrItinClass;
David Goodwina7c2dfb2009-08-19 18:00:44 +0000117def IIC_iCMPi : InstrItinClass;
118def IIC_iCMPr : InstrItinClass;
119def IIC_iCMPsi : InstrItinClass;
120def IIC_iCMPsr : InstrItinClass;
Evan Cheng2259d672010-09-29 00:49:25 +0000121def IIC_iTSTi : InstrItinClass;
122def IIC_iTSTr : InstrItinClass;
123def IIC_iTSTsi : InstrItinClass;
124def IIC_iTSTsr : InstrItinClass;
David Goodwina7c2dfb2009-08-19 18:00:44 +0000125def IIC_iMOVi : InstrItinClass;
126def IIC_iMOVr : InstrItinClass;
127def IIC_iMOVsi : InstrItinClass;
128def IIC_iMOVsr : InstrItinClass;
Evan Cheng2259d672010-09-29 00:49:25 +0000129def IIC_iMOVix2 : InstrItinClass;
Evan Chengb8b0ad82011-01-20 08:34:58 +0000130def IIC_iMOVix2addpc : InstrItinClass;
131def IIC_iMOVix2ld : InstrItinClass;
Evan Cheng2259d672010-09-29 00:49:25 +0000132def IIC_iMVNi : InstrItinClass;
133def IIC_iMVNr : InstrItinClass;
134def IIC_iMVNsi : InstrItinClass;
135def IIC_iMVNsr : InstrItinClass;
David Goodwina7c2dfb2009-08-19 18:00:44 +0000136def IIC_iCMOVi : InstrItinClass;
137def IIC_iCMOVr : InstrItinClass;
138def IIC_iCMOVsi : InstrItinClass;
139def IIC_iCMOVsr : InstrItinClass;
Evan Cheng79ff5232010-11-13 05:14:20 +0000140def IIC_iCMOVix2 : InstrItinClass;
David Goodwina7c2dfb2009-08-19 18:00:44 +0000141def IIC_iMUL16 : InstrItinClass;
142def IIC_iMAC16 : InstrItinClass;
143def IIC_iMUL32 : InstrItinClass;
144def IIC_iMAC32 : InstrItinClass;
145def IIC_iMUL64 : InstrItinClass;
146def IIC_iMAC64 : InstrItinClass;
Bob Wilsone8a549c2012-09-29 21:43:49 +0000147def IIC_iDIV : InstrItinClass;
Evan Cheng2fb20b12010-09-30 01:08:25 +0000148def IIC_iLoad_i : InstrItinClass;
149def IIC_iLoad_r : InstrItinClass;
150def IIC_iLoad_si : InstrItinClass;
151def IIC_iLoad_iu : InstrItinClass;
152def IIC_iLoad_ru : InstrItinClass;
153def IIC_iLoad_siu : InstrItinClass;
154def IIC_iLoad_bh_i : InstrItinClass;
155def IIC_iLoad_bh_r : InstrItinClass;
156def IIC_iLoad_bh_si : InstrItinClass;
157def IIC_iLoad_bh_iu : InstrItinClass;
158def IIC_iLoad_bh_ru : InstrItinClass;
159def IIC_iLoad_bh_siu : InstrItinClass;
160def IIC_iLoad_d_i : InstrItinClass;
161def IIC_iLoad_d_r : InstrItinClass;
162def IIC_iLoad_d_ru : InstrItinClass;
Andrew Trickf161e392012-07-02 18:10:42 +0000163def IIC_iLoad_m : InstrItinClass;
164def IIC_iLoad_mu : InstrItinClass;
165def IIC_iLoad_mBr : InstrItinClass;
166def IIC_iPop : InstrItinClass;
167def IIC_iPop_Br : InstrItinClass;
Evan Chenge37da032010-09-24 22:41:41 +0000168def IIC_iLoadiALU : InstrItinClass;
Evan Cheng2fb20b12010-09-30 01:08:25 +0000169def IIC_iStore_i : InstrItinClass;
170def IIC_iStore_r : InstrItinClass;
171def IIC_iStore_si : InstrItinClass;
172def IIC_iStore_iu : InstrItinClass;
173def IIC_iStore_ru : InstrItinClass;
174def IIC_iStore_siu : InstrItinClass;
175def IIC_iStore_bh_i : InstrItinClass;
176def IIC_iStore_bh_r : InstrItinClass;
177def IIC_iStore_bh_si : InstrItinClass;
178def IIC_iStore_bh_iu : InstrItinClass;
179def IIC_iStore_bh_ru : InstrItinClass;
180def IIC_iStore_bh_siu : InstrItinClass;
181def IIC_iStore_d_i : InstrItinClass;
182def IIC_iStore_d_r : InstrItinClass;
183def IIC_iStore_d_ru : InstrItinClass;
Andrew Trickf161e392012-07-02 18:10:42 +0000184def IIC_iStore_m : InstrItinClass;
185def IIC_iStore_mu : InstrItinClass;
Evan Cheng8740ee32010-11-03 06:34:55 +0000186def IIC_Preload : InstrItinClass;
David Goodwinafcaf792009-09-23 21:38:08 +0000187def IIC_Br : InstrItinClass;
David Goodwin50902732009-09-21 20:52:17 +0000188def IIC_fpSTAT : InstrItinClass;
David Goodwin50902732009-09-21 20:52:17 +0000189def IIC_fpUNA32 : InstrItinClass;
190def IIC_fpUNA64 : InstrItinClass;
191def IIC_fpCMP32 : InstrItinClass;
192def IIC_fpCMP64 : InstrItinClass;
193def IIC_fpCVTSD : InstrItinClass;
194def IIC_fpCVTDS : InstrItinClass;
Anton Korobeynikov4c1da0f2010-04-07 18:19:46 +0000195def IIC_fpCVTSH : InstrItinClass;
196def IIC_fpCVTHS : InstrItinClass;
David Goodwin50902732009-09-21 20:52:17 +0000197def IIC_fpCVTIS : InstrItinClass;
198def IIC_fpCVTID : InstrItinClass;
199def IIC_fpCVTSI : InstrItinClass;
200def IIC_fpCVTDI : InstrItinClass;
Anton Korobeynikov20637052010-04-07 18:20:02 +0000201def IIC_fpMOVIS : InstrItinClass;
202def IIC_fpMOVID : InstrItinClass;
203def IIC_fpMOVSI : InstrItinClass;
204def IIC_fpMOVDI : InstrItinClass;
David Goodwin50902732009-09-21 20:52:17 +0000205def IIC_fpALU32 : InstrItinClass;
206def IIC_fpALU64 : InstrItinClass;
207def IIC_fpMUL32 : InstrItinClass;
208def IIC_fpMUL64 : InstrItinClass;
209def IIC_fpMAC32 : InstrItinClass;
210def IIC_fpMAC64 : InstrItinClass;
Anton Korobeynikov5482b9f2012-01-22 12:07:33 +0000211def IIC_fpFMAC32 : InstrItinClass;
212def IIC_fpFMAC64 : InstrItinClass;
David Goodwin50902732009-09-21 20:52:17 +0000213def IIC_fpDIV32 : InstrItinClass;
214def IIC_fpDIV64 : InstrItinClass;
215def IIC_fpSQRT32 : InstrItinClass;
216def IIC_fpSQRT64 : InstrItinClass;
217def IIC_fpLoad32 : InstrItinClass;
218def IIC_fpLoad64 : InstrItinClass;
Andrew Trickf161e392012-07-02 18:10:42 +0000219def IIC_fpLoad_m : InstrItinClass;
220def IIC_fpLoad_mu : InstrItinClass;
David Goodwin50902732009-09-21 20:52:17 +0000221def IIC_fpStore32 : InstrItinClass;
222def IIC_fpStore64 : InstrItinClass;
Andrew Trickf161e392012-07-02 18:10:42 +0000223def IIC_fpStore_m : InstrItinClass;
224def IIC_fpStore_mu : InstrItinClass;
David Goodwinafcaf792009-09-23 21:38:08 +0000225def IIC_VLD1 : InstrItinClass;
Evan Cheng05f13e92010-10-09 01:03:04 +0000226def IIC_VLD1x2 : InstrItinClass;
227def IIC_VLD1x3 : InstrItinClass;
228def IIC_VLD1x4 : InstrItinClass;
229def IIC_VLD1u : InstrItinClass;
230def IIC_VLD1x2u : InstrItinClass;
231def IIC_VLD1x3u : InstrItinClass;
232def IIC_VLD1x4u : InstrItinClass;
Bob Wilsondc449902010-11-01 22:04:05 +0000233def IIC_VLD1ln : InstrItinClass;
234def IIC_VLD1lnu : InstrItinClass;
Bob Wilsonc92eea02010-11-27 06:35:16 +0000235def IIC_VLD1dup : InstrItinClass;
236def IIC_VLD1dupu : InstrItinClass;
David Goodwinafcaf792009-09-23 21:38:08 +0000237def IIC_VLD2 : InstrItinClass;
Evan Cheng05f13e92010-10-09 01:03:04 +0000238def IIC_VLD2x2 : InstrItinClass;
239def IIC_VLD2u : InstrItinClass;
240def IIC_VLD2x2u : InstrItinClass;
241def IIC_VLD2ln : InstrItinClass;
242def IIC_VLD2lnu : InstrItinClass;
Bob Wilson2d790df2010-11-28 06:51:26 +0000243def IIC_VLD2dup : InstrItinClass;
244def IIC_VLD2dupu : InstrItinClass;
David Goodwinafcaf792009-09-23 21:38:08 +0000245def IIC_VLD3 : InstrItinClass;
Evan Chenga7624002010-10-09 01:45:34 +0000246def IIC_VLD3ln : InstrItinClass;
247def IIC_VLD3u : InstrItinClass;
248def IIC_VLD3lnu : InstrItinClass;
Bob Wilson77ab1652010-11-29 19:35:29 +0000249def IIC_VLD3dup : InstrItinClass;
250def IIC_VLD3dupu : InstrItinClass;
David Goodwinafcaf792009-09-23 21:38:08 +0000251def IIC_VLD4 : InstrItinClass;
Evan Chengd7a404d2010-10-09 04:07:58 +0000252def IIC_VLD4ln : InstrItinClass;
253def IIC_VLD4u : InstrItinClass;
254def IIC_VLD4lnu : InstrItinClass;
Bob Wilson431ac4ef2010-11-30 00:00:35 +0000255def IIC_VLD4dup : InstrItinClass;
256def IIC_VLD4dupu : InstrItinClass;
Evan Cheng94ad0082010-10-11 22:03:18 +0000257def IIC_VST1 : InstrItinClass;
258def IIC_VST1x2 : InstrItinClass;
259def IIC_VST1x3 : InstrItinClass;
260def IIC_VST1x4 : InstrItinClass;
261def IIC_VST1u : InstrItinClass;
262def IIC_VST1x2u : InstrItinClass;
263def IIC_VST1x3u : InstrItinClass;
264def IIC_VST1x4u : InstrItinClass;
Bob Wilsond80b29d2010-11-02 21:18:25 +0000265def IIC_VST1ln : InstrItinClass;
266def IIC_VST1lnu : InstrItinClass;
Evan Cheng94ad0082010-10-11 22:03:18 +0000267def IIC_VST2 : InstrItinClass;
268def IIC_VST2x2 : InstrItinClass;
269def IIC_VST2u : InstrItinClass;
270def IIC_VST2x2u : InstrItinClass;
271def IIC_VST2ln : InstrItinClass;
272def IIC_VST2lnu : InstrItinClass;
273def IIC_VST3 : InstrItinClass;
274def IIC_VST3u : InstrItinClass;
275def IIC_VST3ln : InstrItinClass;
276def IIC_VST3lnu : InstrItinClass;
277def IIC_VST4 : InstrItinClass;
278def IIC_VST4u : InstrItinClass;
279def IIC_VST4ln : InstrItinClass;
280def IIC_VST4lnu : InstrItinClass;
David Goodwinafcaf792009-09-23 21:38:08 +0000281def IIC_VUNAD : InstrItinClass;
282def IIC_VUNAQ : InstrItinClass;
283def IIC_VBIND : InstrItinClass;
284def IIC_VBINQ : InstrItinClass;
Evan Chenge790afc2010-10-11 23:41:41 +0000285def IIC_VPBIND : InstrItinClass;
286def IIC_VFMULD : InstrItinClass;
287def IIC_VFMULQ : InstrItinClass;
Evan Cheng2a5d7642010-10-01 20:50:58 +0000288def IIC_VMOV : InstrItinClass;
David Goodwinbea68482009-09-25 18:38:29 +0000289def IIC_VMOVImm : InstrItinClass;
David Goodwinafcaf792009-09-23 21:38:08 +0000290def IIC_VMOVD : InstrItinClass;
291def IIC_VMOVQ : InstrItinClass;
David Goodwinbea68482009-09-25 18:38:29 +0000292def IIC_VMOVIS : InstrItinClass;
293def IIC_VMOVID : InstrItinClass;
294def IIC_VMOVISL : InstrItinClass;
295def IIC_VMOVSI : InstrItinClass;
296def IIC_VMOVDI : InstrItinClass;
Evan Cheng2a5d7642010-10-01 20:50:58 +0000297def IIC_VMOVN : InstrItinClass;
David Goodwinafcaf792009-09-23 21:38:08 +0000298def IIC_VPERMD : InstrItinClass;
299def IIC_VPERMQ : InstrItinClass;
300def IIC_VPERMQ3 : InstrItinClass;
David Goodwinbea68482009-09-25 18:38:29 +0000301def IIC_VMACD : InstrItinClass;
302def IIC_VMACQ : InstrItinClass;
Anton Korobeynikov5482b9f2012-01-22 12:07:33 +0000303def IIC_VFMACD : InstrItinClass;
304def IIC_VFMACQ : InstrItinClass;
David Goodwinbea68482009-09-25 18:38:29 +0000305def IIC_VRECSD : InstrItinClass;
306def IIC_VRECSQ : InstrItinClass;
David Goodwinafcaf792009-09-23 21:38:08 +0000307def IIC_VCNTiD : InstrItinClass;
308def IIC_VCNTiQ : InstrItinClass;
309def IIC_VUNAiD : InstrItinClass;
310def IIC_VUNAiQ : InstrItinClass;
311def IIC_VQUNAiD : InstrItinClass;
312def IIC_VQUNAiQ : InstrItinClass;
313def IIC_VBINiD : InstrItinClass;
314def IIC_VBINiQ : InstrItinClass;
315def IIC_VSUBiD : InstrItinClass;
316def IIC_VSUBiQ : InstrItinClass;
317def IIC_VBINi4D : InstrItinClass;
318def IIC_VBINi4Q : InstrItinClass;
Anton Korobeynikov7d4fad52010-04-07 18:20:13 +0000319def IIC_VSUBi4D : InstrItinClass;
320def IIC_VSUBi4Q : InstrItinClass;
Anton Korobeynikova248bec2010-04-07 18:20:42 +0000321def IIC_VABAD : InstrItinClass;
322def IIC_VABAQ : InstrItinClass;
David Goodwinbea68482009-09-25 18:38:29 +0000323def IIC_VSHLiD : InstrItinClass;
324def IIC_VSHLiQ : InstrItinClass;
325def IIC_VSHLi4D : InstrItinClass;
326def IIC_VSHLi4Q : InstrItinClass;
327def IIC_VPALiD : InstrItinClass;
328def IIC_VPALiQ : InstrItinClass;
David Goodwinafcaf792009-09-23 21:38:08 +0000329def IIC_VMULi16D : InstrItinClass;
330def IIC_VMULi32D : InstrItinClass;
331def IIC_VMULi16Q : InstrItinClass;
332def IIC_VMULi32Q : InstrItinClass;
David Goodwinbea68482009-09-25 18:38:29 +0000333def IIC_VMACi16D : InstrItinClass;
334def IIC_VMACi32D : InstrItinClass;
335def IIC_VMACi16Q : InstrItinClass;
336def IIC_VMACi32Q : InstrItinClass;
337def IIC_VEXTD : InstrItinClass;
338def IIC_VEXTQ : InstrItinClass;
339def IIC_VTB1 : InstrItinClass;
340def IIC_VTB2 : InstrItinClass;
341def IIC_VTB3 : InstrItinClass;
342def IIC_VTB4 : InstrItinClass;
343def IIC_VTBX1 : InstrItinClass;
344def IIC_VTBX2 : InstrItinClass;
345def IIC_VTBX3 : InstrItinClass;
346def IIC_VTBX4 : InstrItinClass;
Evan Cheng4e712de2009-06-19 01:51:50 +0000347
348//===----------------------------------------------------------------------===//
349// Processor instruction itineraries.
350
Evan Cheng4e712de2009-06-19 01:51:50 +0000351include "ARMScheduleV6.td"
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000352include "ARMScheduleA8.td"
353include "ARMScheduleA9.td"
Bob Wilsone8a549c2012-09-29 21:43:49 +0000354include "ARMScheduleSwift.td"