blob: 1deb846f2d153d01dc2a0103b64fade3ed9af869 [file] [log] [blame]
Anton Korobeynikov090323a2010-04-07 18:22:11 +00001//=- ARMScheduleA9.td - ARM Cortex-A9 Scheduling Definitions -*- tablegen -*-=//
Jim Grosbach7ea5fc02010-06-28 04:27:01 +00002//
Anton Korobeynikov090323a2010-04-07 18:22:11 +00003// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Jim Grosbach7ea5fc02010-06-28 04:27:01 +00007//
Anton Korobeynikov090323a2010-04-07 18:22:11 +00008//===----------------------------------------------------------------------===//
9//
10// This file defines the itinerary class data for the ARM Cortex A9 processors.
11//
12//===----------------------------------------------------------------------===//
13
14//
15// Ad-hoc scheduling information derived from pretty vague "Cortex-A9 Technical
16// Reference Manual".
17//
Anton Korobeynikov7d62e332010-04-18 20:31:01 +000018// Functional units
Anton Korobeynikov7d62e332010-04-18 20:31:01 +000019def A9_Pipe0 : FuncUnit; // pipeline 0
20def A9_Pipe1 : FuncUnit; // pipeline 1
21def A9_LSPipe : FuncUnit; // LS pipe
22def A9_NPipe : FuncUnit; // NEON ALU/MUL pipe
23def A9_DRegsVFP: FuncUnit; // FP register set, VFP side
24def A9_DRegsN : FuncUnit; // FP register set, NEON side
25
26// Dual issue pipeline represented by A9_Pipe0 | A9_Pipe1
Anton Korobeynikov090323a2010-04-07 18:22:11 +000027//
Anton Korobeynikov7d62e332010-04-18 20:31:01 +000028def CortexA9Itineraries : ProcessorItineraries<
Evan Cheng0097dd02010-09-28 23:50:49 +000029 [A9_NPipe, A9_DRegsN, A9_DRegsVFP, A9_LSPipe, A9_Pipe0, A9_Pipe1], [], [
Anton Korobeynikov94d7fd82010-05-29 19:25:17 +000030 // Two fully-pipelined integer ALU pipelines
31 // FIXME: There are no operand latencies for these instructions at all!
32 //
33 // Move instructions, unconditional
Jim Grosbach7ea5fc02010-06-28 04:27:01 +000034 InstrItinData<IIC_iMOVi , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [1]>,
Evan Cheng1d35ad62010-09-24 22:03:46 +000035 InstrItinData<IIC_iMOVix2 , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>,
Evan Chenge37da032010-09-24 22:41:41 +000036 InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [2]>,
Jim Grosbach7ea5fc02010-06-28 04:27:01 +000037 InstrItinData<IIC_iMOVr , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [1, 1]>,
38 InstrItinData<IIC_iMOVsi , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [1, 1]>,
39 InstrItinData<IIC_iMOVsr , [InstrStage<2, [A9_Pipe0, A9_Pipe1]>], [2, 2, 1]>,
Anton Korobeynikov94d7fd82010-05-29 19:25:17 +000040 //
41 // No operand cycles
42 InstrItinData<IIC_iALUx , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>]>,
43 //
44 // Binary Instructions that produce a result
Jim Grosbach7ea5fc02010-06-28 04:27:01 +000045 InstrItinData<IIC_iALUi , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [2, 2]>,
46 InstrItinData<IIC_iALUr , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [2, 2, 2]>,
47 InstrItinData<IIC_iALUsi, [InstrStage<2, [A9_Pipe0, A9_Pipe1]>], [2, 2, 1]>,
48 InstrItinData<IIC_iALUsr,[InstrStage<3, [A9_Pipe0, A9_Pipe1]>], [2, 2, 1, 1]>,
Anton Korobeynikov94d7fd82010-05-29 19:25:17 +000049 //
50 // Unary Instructions that produce a result
Jim Grosbach7ea5fc02010-06-28 04:27:01 +000051 InstrItinData<IIC_iUNAr , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [2, 2]>,
52 InstrItinData<IIC_iUNAsi , [InstrStage<2, [A9_Pipe0, A9_Pipe1]>], [2, 1]>,
Anton Korobeynikov94d7fd82010-05-29 19:25:17 +000053 //
Evan Cheng62d626c2010-09-25 00:49:35 +000054 // Zero and sign extension instructions
55 InstrItinData<IIC_iEXTr , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [2, 1]>,
Evan Cheng48cc2162010-09-25 01:09:28 +000056 InstrItinData<IIC_iEXTAr, [InstrStage<2, [A9_Pipe0, A9_Pipe1]>], [3, 1, 1]>,
Evan Cheng62d626c2010-09-25 00:49:35 +000057 //
Anton Korobeynikov94d7fd82010-05-29 19:25:17 +000058 // Compare instructions
Jim Grosbach7ea5fc02010-06-28 04:27:01 +000059 InstrItinData<IIC_iCMPi , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [2]>,
60 InstrItinData<IIC_iCMPr , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [2, 2]>,
61 InstrItinData<IIC_iCMPsi , [InstrStage<2, [A9_Pipe0, A9_Pipe1]>], [2, 1]>,
62 InstrItinData<IIC_iCMPsr , [InstrStage<3, [A9_Pipe0, A9_Pipe1]>], [2, 1, 1]>,
Anton Korobeynikov94d7fd82010-05-29 19:25:17 +000063 //
64 // Move instructions, conditional
Jim Grosbach7ea5fc02010-06-28 04:27:01 +000065 InstrItinData<IIC_iCMOVi , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [2]>,
66 InstrItinData<IIC_iCMOVr , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [2, 1]>,
67 InstrItinData<IIC_iCMOVsi , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [2, 1]>,
68 InstrItinData<IIC_iCMOVsr , [InstrStage<2, [A9_Pipe0, A9_Pipe1]>], [2, 1, 1]>,
Anton Korobeynikov94d7fd82010-05-29 19:25:17 +000069
70 // Integer multiply pipeline
71 //
72 InstrItinData<IIC_iMUL16 , [InstrStage<1, [A9_Pipe1], 0>,
73 InstrStage<2, [A9_Pipe0]>], [4, 1, 1]>,
74 InstrItinData<IIC_iMAC16 , [InstrStage<1, [A9_Pipe1], 0>,
75 InstrStage<2, [A9_Pipe0]>], [4, 1, 1, 2]>,
76 InstrItinData<IIC_iMUL32 , [InstrStage<1, [A9_Pipe1], 0>,
77 InstrStage<2, [A9_Pipe0]>], [4, 1, 1]>,
78 InstrItinData<IIC_iMAC32 , [InstrStage<1, [A9_Pipe1], 0>,
79 InstrStage<2, [A9_Pipe0]>], [4, 1, 1, 2]>,
80 InstrItinData<IIC_iMUL64 , [InstrStage<2, [A9_Pipe1], 0>,
81 InstrStage<3, [A9_Pipe0]>], [4, 5, 1, 1]>,
82 InstrItinData<IIC_iMAC64 , [InstrStage<2, [A9_Pipe1], 0>,
83 InstrStage<3, [A9_Pipe0]>], [4, 5, 1, 1]>,
Anton Korobeynikov2a21aef2010-05-29 19:25:34 +000084 // Integer load pipeline
85 // FIXME: The timings are some rough approximations
86 //
87 // Immediate offset
88 InstrItinData<IIC_iLoadi , [InstrStage<1, [A9_Pipe1]>,
89 InstrStage<1, [A9_LSPipe]>], [3, 1]>,
90 //
91 // Register offset
92 InstrItinData<IIC_iLoadr , [InstrStage<1, [A9_Pipe1]>,
93 InstrStage<1, [A9_LSPipe]>], [3, 1, 1]>,
94 //
95 // Scaled register offset
96 InstrItinData<IIC_iLoadsi , [InstrStage<1, [A9_Pipe1]>,
97 InstrStage<2, [A9_LSPipe]>], [4, 1, 1]>,
98 //
99 // Immediate offset with update
100 InstrItinData<IIC_iLoadiu , [InstrStage<1, [A9_Pipe1]>,
101 InstrStage<2, [A9_LSPipe]>], [3, 2, 1]>,
102 //
103 // Register offset with update
104 InstrItinData<IIC_iLoadru , [InstrStage<1, [A9_Pipe1]>,
105 InstrStage<2, [A9_LSPipe]>], [3, 2, 1, 1]>,
106 //
107 // Scaled register offset with update
108 InstrItinData<IIC_iLoadsiu , [InstrStage<1, [A9_Pipe1]>,
109 InstrStage<2, [A9_LSPipe]>], [4, 3, 1, 1]>,
110 //
111 // Load multiple
112 InstrItinData<IIC_iLoadm , [InstrStage<1, [A9_Pipe1]>,
113 InstrStage<1, [A9_LSPipe]>]>,
Anton Korobeynikov94d7fd82010-05-29 19:25:17 +0000114
Evan Cheng722cd122010-09-08 22:57:08 +0000115 //
116 // Load multiple plus branch
117 InstrItinData<IIC_iLoadmBr , [InstrStage<1, [A9_Pipe1]>,
118 InstrStage<1, [A9_LSPipe]>,
119 InstrStage<1, [A9_Pipe0, A9_Pipe1]>]>,
120
Evan Chenge37da032010-09-24 22:41:41 +0000121 //
122 // iLoadi + iALUr for t2LDRpci_pic.
123 InstrItinData<IIC_iLoadiALU, [InstrStage<1, [A9_Pipe1]>,
124 InstrStage<1, [A9_LSPipe]>,
125 InstrStage<1, [A9_Pipe0, A9_Pipe1]>], [4, 1]>,
126
Anton Korobeynikov2a21aef2010-05-29 19:25:34 +0000127 // Integer store pipeline
128 ///
129 // Immediate offset
130 InstrItinData<IIC_iStorei , [InstrStage<1, [A9_Pipe1]>,
131 InstrStage<1, [A9_LSPipe]>], [3, 1]>,
132 //
133 // Register offset
134 InstrItinData<IIC_iStorer , [InstrStage<1, [ A9_Pipe1]>,
135 InstrStage<1, [A9_LSPipe]>], [3, 1, 1]>,
136 //
137 // Scaled register offset
138 InstrItinData<IIC_iStoresi , [InstrStage<1, [A9_Pipe1]>,
139 InstrStage<2, [A9_LSPipe]>], [3, 1, 1]>,
140 //
141 // Immediate offset with update
142 InstrItinData<IIC_iStoreiu , [InstrStage<1, [A9_Pipe1]>,
143 InstrStage<1, [A9_LSPipe]>], [2, 3, 1]>,
144 //
145 // Register offset with update
146 InstrItinData<IIC_iStoreru , [InstrStage<1, [A9_Pipe1]>,
147 InstrStage<1, [A9_LSPipe]>], [2, 3, 1, 1]>,
148 //
149 // Scaled register offset with update
150 InstrItinData<IIC_iStoresiu, [InstrStage<1, [A9_Pipe1]>,
151 InstrStage<2, [A9_LSPipe]>], [3, 3, 1, 1]>,
152 //
153 // Store multiple
154 InstrItinData<IIC_iStorem , [InstrStage<1, [A9_Pipe1]>,
155 InstrStage<1, [A9_LSPipe]>]>,
Anton Korobeynikov94d7fd82010-05-29 19:25:17 +0000156 // Branch
157 //
158 // no delay slots, so the latency of a branch is unimportant
159 InstrItinData<IIC_Br , [InstrStage<1, [A9_Pipe0, A9_Pipe1]>]>,
160
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000161 // VFP and NEON shares the same register file. This means that every VFP
162 // instruction should wait for full completion of the consecutive NEON
163 // instruction and vice-versa. We model this behavior with two artificial FUs:
164 // DRegsVFP and DRegsVFP.
165 //
166 // Every VFP instruction:
167 // - Acquires DRegsVFP resource for 1 cycle
168 // - Reserves DRegsN resource for the whole duration (including time to
169 // register file writeback!).
170 // Every NEON instruction does the same but with FUs swapped.
171 //
Jim Grosbach7ea5fc02010-06-28 04:27:01 +0000172 // Since the reserved FU cannot be acquired, this models precisely
173 // "cross-domain" stalls.
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000174
175 // VFP
176 // Issue through integer pipeline, and execute in NEON unit.
177
178 // FP Special Register to Integer Register File Move
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000179 InstrItinData<IIC_fpSTAT , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
180 InstrStage<2, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000181 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000182 InstrStage<1, [A9_NPipe]>]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000183 //
184 // Single-precision FP Unary
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000185 InstrItinData<IIC_fpUNA32 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000186 // Extra latency cycles since wbck is 2 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000187 InstrStage<3, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000188 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000189 InstrStage<1, [A9_NPipe]>], [1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000190 //
191 // Double-precision FP Unary
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000192 InstrItinData<IIC_fpUNA64 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000193 // Extra latency cycles since wbck is 2 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000194 InstrStage<3, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000195 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000196 InstrStage<1, [A9_NPipe]>], [1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000197
198 //
199 // Single-precision FP Compare
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000200 InstrItinData<IIC_fpCMP32 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000201 // Extra latency cycles since wbck is 4 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000202 InstrStage<5, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000203 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000204 InstrStage<1, [A9_NPipe]>], [1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000205 //
206 // Double-precision FP Compare
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000207 InstrItinData<IIC_fpCMP64 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000208 // Extra latency cycles since wbck is 4 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000209 InstrStage<5, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000210 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000211 InstrStage<1, [A9_NPipe]>], [1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000212 //
213 // Single to Double FP Convert
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000214 InstrItinData<IIC_fpCVTSD , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
215 InstrStage<5, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000216 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000217 InstrStage<1, [A9_NPipe]>], [4, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000218 //
219 // Double to Single FP Convert
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000220 InstrItinData<IIC_fpCVTDS , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
221 InstrStage<5, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000222 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000223 InstrStage<1, [A9_NPipe]>], [4, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000224
225 //
226 // Single to Half FP Convert
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000227 InstrItinData<IIC_fpCVTSH , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
228 InstrStage<5, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000229 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000230 InstrStage<1, [A9_NPipe]>], [4, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000231 //
232 // Half to Single FP Convert
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000233 InstrItinData<IIC_fpCVTHS , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
234 InstrStage<3, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000235 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000236 InstrStage<1, [A9_NPipe]>], [2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000237
238 //
239 // Single-Precision FP to Integer Convert
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000240 InstrItinData<IIC_fpCVTSI , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
241 InstrStage<5, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000242 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000243 InstrStage<1, [A9_NPipe]>], [4, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000244 //
245 // Double-Precision FP to Integer Convert
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000246 InstrItinData<IIC_fpCVTDI , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
247 InstrStage<5, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000248 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000249 InstrStage<1, [A9_NPipe]>], [4, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000250 //
251 // Integer to Single-Precision FP Convert
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000252 InstrItinData<IIC_fpCVTIS , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
253 InstrStage<5, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000254 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000255 InstrStage<1, [A9_NPipe]>], [4, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000256 //
257 // Integer to Double-Precision FP Convert
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000258 InstrItinData<IIC_fpCVTID , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
259 InstrStage<5, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000260 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000261 InstrStage<1, [A9_NPipe]>], [4, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000262 //
263 // Single-precision FP ALU
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000264 InstrItinData<IIC_fpALU32 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
265 InstrStage<5, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000266 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000267 InstrStage<1, [A9_NPipe]>], [4, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000268 //
269 // Double-precision FP ALU
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000270 InstrItinData<IIC_fpALU64 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
271 InstrStage<5, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000272 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000273 InstrStage<1, [A9_NPipe]>], [4, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000274 //
275 // Single-precision FP Multiply
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000276 InstrItinData<IIC_fpMUL32 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
277 InstrStage<6, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000278 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000279 InstrStage<1, [A9_NPipe]>], [5, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000280 //
281 // Double-precision FP Multiply
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000282 InstrItinData<IIC_fpMUL64 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
283 InstrStage<7, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000284 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000285 InstrStage<2, [A9_NPipe]>], [6, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000286 //
287 // Single-precision FP MAC
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000288 InstrItinData<IIC_fpMAC32 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
289 InstrStage<9, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000290 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000291 InstrStage<1, [A9_NPipe]>], [8, 0, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000292 //
293 // Double-precision FP MAC
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000294 InstrItinData<IIC_fpMAC64 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
295 InstrStage<10, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000296 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000297 InstrStage<2, [A9_NPipe]>], [9, 0, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000298 //
299 // Single-precision FP DIV
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000300 InstrItinData<IIC_fpDIV32 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
301 InstrStage<16, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000302 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000303 InstrStage<10, [A9_NPipe]>], [15, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000304 //
305 // Double-precision FP DIV
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000306 InstrItinData<IIC_fpDIV64 , [InstrStage<1, [A9_DRegsVFP], 0, Required>,
307 InstrStage<26, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000308 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000309 InstrStage<20, [A9_NPipe]>], [25, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000310 //
311 // Single-precision FP SQRT
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000312 InstrItinData<IIC_fpSQRT32, [InstrStage<1, [A9_DRegsVFP], 0, Required>,
313 InstrStage<18, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000314 InstrStage<1, [A9_Pipe1]>,
315 InstrStage<13, [A9_NPipe]>], [17, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000316 //
317 // Double-precision FP SQRT
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000318 InstrItinData<IIC_fpSQRT64, [InstrStage<1, [A9_DRegsVFP], 0, Required>,
319 InstrStage<33, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000320 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000321 InstrStage<28, [A9_NPipe]>], [32, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000322
323 //
324 // Integer to Single-precision Move
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000325 InstrItinData<IIC_fpMOVIS, [InstrStage<1, [A9_DRegsVFP], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000326 // Extra 1 latency cycle since wbck is 2 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000327 InstrStage<3, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000328 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000329 InstrStage<1, [A9_NPipe]>], [1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000330 //
331 // Integer to Double-precision Move
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000332 InstrItinData<IIC_fpMOVID, [InstrStage<1, [A9_DRegsVFP], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000333 // Extra 1 latency cycle since wbck is 2 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000334 InstrStage<3, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000335 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000336 InstrStage<1, [A9_NPipe]>], [1, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000337 //
338 // Single-precision to Integer Move
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000339 InstrItinData<IIC_fpMOVSI, [InstrStage<1, [A9_DRegsVFP], 0, Required>,
340 InstrStage<2, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000341 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000342 InstrStage<1, [A9_NPipe]>], [1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000343 //
344 // Double-precision to Integer Move
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000345 InstrItinData<IIC_fpMOVDI, [InstrStage<1, [A9_DRegsVFP], 0, Required>,
346 InstrStage<2, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000347 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000348 InstrStage<1, [A9_NPipe]>], [1, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000349 //
350 // Single-precision FP Load
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000351 InstrItinData<IIC_fpLoad32, [InstrStage<1, [A9_DRegsVFP], 0, Required>,
352 InstrStage<2, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikova09d9542010-05-29 19:25:39 +0000353 InstrStage<1, [A9_Pipe1], 0>,
354 InstrStage<1, [A9_LSPipe]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000355 InstrStage<1, [A9_NPipe]>]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000356 //
357 // Double-precision FP Load
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000358 InstrItinData<IIC_fpLoad64, [InstrStage<1, [A9_DRegsVFP], 0, Required>,
359 InstrStage<2, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikova09d9542010-05-29 19:25:39 +0000360 InstrStage<1, [A9_Pipe1], 0>,
361 InstrStage<1, [A9_LSPipe]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000362 InstrStage<1, [A9_NPipe]>]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000363 //
364 // FP Load Multiple
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000365 InstrItinData<IIC_fpLoadm, [InstrStage<1, [A9_DRegsVFP], 0, Required>,
366 InstrStage<2, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikova09d9542010-05-29 19:25:39 +0000367 InstrStage<1, [A9_Pipe1], 0>,
368 InstrStage<1, [A9_LSPipe]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000369 InstrStage<1, [A9_NPipe]>]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000370 //
371 // Single-precision FP Store
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000372 InstrItinData<IIC_fpStore32,[InstrStage<1, [A9_DRegsVFP], 0, Required>,
373 InstrStage<2, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikova09d9542010-05-29 19:25:39 +0000374 InstrStage<1, [A9_Pipe1], 0>,
375 InstrStage<1, [A9_LSPipe]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000376 InstrStage<1, [A9_NPipe]>]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000377 //
378 // Double-precision FP Store
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000379 InstrItinData<IIC_fpStore64,[InstrStage<1, [A9_DRegsVFP], 0, Required>,
380 InstrStage<2, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikova09d9542010-05-29 19:25:39 +0000381 InstrStage<1, [A9_Pipe1], 0>,
382 InstrStage<1, [A9_LSPipe]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000383 InstrStage<1, [A9_NPipe]>]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000384 //
385 // FP Store Multiple
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000386 InstrItinData<IIC_fpStorem, [InstrStage<1, [A9_DRegsVFP], 0, Required>,
387 InstrStage<2, [A9_DRegsN], 0, Reserved>,
Anton Korobeynikova09d9542010-05-29 19:25:39 +0000388 InstrStage<1, [A9_Pipe1], 0>,
389 InstrStage<1, [A9_LSPipe]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000390 InstrStage<1, [A9_NPipe]>]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000391 // NEON
392 // Issue through integer pipeline, and execute in NEON unit.
Jim Grosbach7ea5fc02010-06-28 04:27:01 +0000393 // FIXME: Neon pipeline and LdSt unit are multiplexed.
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000394 // Add some syntactic sugar to model this!
395 // VLD1
396 // FIXME: We don't model this instruction properly
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000397 InstrItinData<IIC_VLD1, [InstrStage<1, [A9_DRegsN], 0, Required>,
398 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikova09d9542010-05-29 19:25:39 +0000399 InstrStage<1, [A9_Pipe1], 0>,
400 InstrStage<1, [A9_LSPipe]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000401 InstrStage<1, [A9_NPipe]>]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000402 //
403 // VLD2
404 // FIXME: We don't model this instruction properly
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000405 InstrItinData<IIC_VLD2, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000406 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000407 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikova09d9542010-05-29 19:25:39 +0000408 InstrStage<1, [A9_Pipe1], 0>,
409 InstrStage<1, [A9_LSPipe]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000410 InstrStage<1, [A9_NPipe]>], [2, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000411 //
412 // VLD3
413 // FIXME: We don't model this instruction properly
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000414 InstrItinData<IIC_VLD3, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000415 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000416 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikova09d9542010-05-29 19:25:39 +0000417 InstrStage<1, [A9_Pipe1], 0>,
418 InstrStage<1, [A9_LSPipe]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000419 InstrStage<1, [A9_NPipe]>], [2, 2, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000420 //
421 // VLD4
422 // FIXME: We don't model this instruction properly
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000423 InstrItinData<IIC_VLD4, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000424 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000425 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikova09d9542010-05-29 19:25:39 +0000426 InstrStage<1, [A9_Pipe1], 0>,
427 InstrStage<1, [A9_LSPipe]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000428 InstrStage<1, [A9_NPipe]>], [2, 2, 2, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000429 //
430 // VST
431 // FIXME: We don't model this instruction properly
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000432 InstrItinData<IIC_VST, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000433 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000434 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikova09d9542010-05-29 19:25:39 +0000435 InstrStage<1, [A9_Pipe1], 0>,
436 InstrStage<1, [A9_LSPipe]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000437 InstrStage<1, [A9_NPipe]>]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000438 //
439 // Double-register Integer Unary
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000440 InstrItinData<IIC_VUNAiD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000441 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000442 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000443 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000444 InstrStage<1, [A9_NPipe]>], [4, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000445 //
446 // Quad-register Integer Unary
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000447 InstrItinData<IIC_VUNAiQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000448 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000449 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000450 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000451 InstrStage<1, [A9_NPipe]>], [4, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000452 //
453 // Double-register Integer Q-Unary
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000454 InstrItinData<IIC_VQUNAiD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000455 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000456 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000457 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000458 InstrStage<1, [A9_NPipe]>], [4, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000459 //
460 // Quad-register Integer CountQ-Unary
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000461 InstrItinData<IIC_VQUNAiQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000462 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000463 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000464 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000465 InstrStage<1, [A9_NPipe]>], [4, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000466 //
467 // Double-register Integer Binary
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000468 InstrItinData<IIC_VBINiD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000469 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000470 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000471 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000472 InstrStage<1, [A9_NPipe]>], [3, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000473 //
474 // Quad-register Integer Binary
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000475 InstrItinData<IIC_VBINiQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000476 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000477 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000478 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000479 InstrStage<1, [A9_NPipe]>], [3, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000480 //
481 // Double-register Integer Subtract
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000482 InstrItinData<IIC_VSUBiD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000483 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000484 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000485 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000486 InstrStage<1, [A9_NPipe]>], [3, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000487 //
488 // Quad-register Integer Subtract
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000489 InstrItinData<IIC_VSUBiQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000490 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000491 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000492 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000493 InstrStage<1, [A9_NPipe]>], [3, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000494 //
495 // Double-register Integer Shift
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000496 InstrItinData<IIC_VSHLiD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000497 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000498 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000499 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000500 InstrStage<1, [A9_NPipe]>], [3, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000501 //
502 // Quad-register Integer Shift
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000503 InstrItinData<IIC_VSHLiQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000504 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000505 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000506 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000507 InstrStage<1, [A9_NPipe]>], [3, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000508 //
509 // Double-register Integer Shift (4 cycle)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000510 InstrItinData<IIC_VSHLi4D, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000511 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000512 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000513 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000514 InstrStage<1, [A9_NPipe]>], [4, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000515 //
516 // Quad-register Integer Shift (4 cycle)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000517 InstrItinData<IIC_VSHLi4Q, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000518 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000519 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000520 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000521 InstrStage<1, [A9_NPipe]>], [4, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000522 //
523 // Double-register Integer Binary (4 cycle)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000524 InstrItinData<IIC_VBINi4D, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000525 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000526 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000527 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000528 InstrStage<1, [A9_NPipe]>], [4, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000529 //
530 // Quad-register Integer Binary (4 cycle)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000531 InstrItinData<IIC_VBINi4Q, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000532 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000533 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000534 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000535 InstrStage<1, [A9_NPipe]>], [4, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000536 //
537 // Double-register Integer Subtract (4 cycle)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000538 InstrItinData<IIC_VSUBiD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000539 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000540 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000541 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000542 InstrStage<1, [A9_NPipe]>], [4, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000543 //
544 // Quad-register Integer Subtract (4 cycle)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000545 InstrItinData<IIC_VSUBiQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000546 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000547 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000548 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000549 InstrStage<1, [A9_NPipe]>], [4, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000550
551 //
552 // Double-register Integer Count
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000553 InstrItinData<IIC_VCNTiD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000554 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000555 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000556 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000557 InstrStage<1, [A9_NPipe]>], [3, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000558 //
559 // Quad-register Integer Count
560 // Result written in N3, but that is relative to the last cycle of multicycle,
561 // so we use 4 for those cases
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000562 InstrItinData<IIC_VCNTiQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000563 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000564 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000565 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000566 InstrStage<2, [A9_NPipe]>], [4, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000567 //
568 // Double-register Absolute Difference and Accumulate
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000569 InstrItinData<IIC_VABAD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000570 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000571 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000572 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000573 InstrStage<1, [A9_NPipe]>], [6, 3, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000574 //
575 // Quad-register Absolute Difference and Accumulate
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000576 InstrItinData<IIC_VABAQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000577 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000578 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000579 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000580 InstrStage<2, [A9_NPipe]>], [6, 3, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000581 //
582 // Double-register Integer Pair Add Long
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000583 InstrItinData<IIC_VPALiD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000584 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000585 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000586 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000587 InstrStage<1, [A9_NPipe]>], [6, 3, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000588 //
589 // Quad-register Integer Pair Add Long
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000590 InstrItinData<IIC_VPALiQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000591 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000592 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000593 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000594 InstrStage<2, [A9_NPipe]>], [6, 3, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000595
596 //
597 // Double-register Integer Multiply (.8, .16)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000598 InstrItinData<IIC_VMULi16D, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000599 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000600 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000601 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000602 InstrStage<1, [A9_NPipe]>], [6, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000603 //
604 // Quad-register Integer Multiply (.8, .16)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000605 InstrItinData<IIC_VMULi16Q, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000606 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000607 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000608 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000609 InstrStage<2, [A9_NPipe]>], [7, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000610
611 //
612 // Double-register Integer Multiply (.32)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000613 InstrItinData<IIC_VMULi32D, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000614 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000615 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000616 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000617 InstrStage<2, [A9_NPipe]>], [7, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000618 //
619 // Quad-register Integer Multiply (.32)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000620 InstrItinData<IIC_VMULi32Q, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000621 // Extra latency cycles since wbck is 9 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000622 InstrStage<10, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000623 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000624 InstrStage<4, [A9_NPipe]>], [9, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000625 //
626 // Double-register Integer Multiply-Accumulate (.8, .16)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000627 InstrItinData<IIC_VMACi16D, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000628 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000629 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000630 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000631 InstrStage<1, [A9_NPipe]>], [6, 3, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000632 //
633 // Double-register Integer Multiply-Accumulate (.32)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000634 InstrItinData<IIC_VMACi32D, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000635 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000636 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000637 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000638 InstrStage<2, [A9_NPipe]>], [7, 3, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000639 //
640 // Quad-register Integer Multiply-Accumulate (.8, .16)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000641 InstrItinData<IIC_VMACi16Q, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000642 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000643 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000644 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000645 InstrStage<2, [A9_NPipe]>], [7, 3, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000646 //
647 // Quad-register Integer Multiply-Accumulate (.32)
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000648 InstrItinData<IIC_VMACi32Q, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000649 // Extra latency cycles since wbck is 9 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000650 InstrStage<10, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000651 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000652 InstrStage<4, [A9_NPipe]>], [9, 3, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000653 //
654 // Move Immediate
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000655 InstrItinData<IIC_VMOVImm, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000656 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000657 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000658 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000659 InstrStage<1, [A9_NPipe]>], [3]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000660 //
661 // Double-register Permute Move
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000662 InstrItinData<IIC_VMOVD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000663 // FIXME: all latencies are arbitrary, no information is available
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000664 InstrStage<3, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000665 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000666 InstrStage<1, [A9_LSPipe]>], [2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000667 //
668 // Quad-register Permute Move
669 // Result written in N2, but that is relative to the last cycle of multicycle,
670 // so we use 3 for those cases
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000671 InstrItinData<IIC_VMOVQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000672 // FIXME: all latencies are arbitrary, no information is available
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000673 InstrStage<4, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000674 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000675 InstrStage<2, [A9_NPipe]>], [3, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000676 //
677 // Integer to Single-precision Move
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000678 InstrItinData<IIC_VMOVIS , [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000679 // FIXME: all latencies are arbitrary, no information is available
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000680 InstrStage<3, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000681 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000682 InstrStage<1, [A9_NPipe]>], [2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000683 //
684 // Integer to Double-precision Move
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000685 InstrItinData<IIC_VMOVID , [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000686 // FIXME: all latencies are arbitrary, no information is available
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000687 InstrStage<3, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000688 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000689 InstrStage<1, [A9_NPipe]>], [2, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000690 //
691 // Single-precision to Integer Move
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000692 InstrItinData<IIC_VMOVSI , [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000693 // FIXME: all latencies are arbitrary, no information is available
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000694 InstrStage<3, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000695 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000696 InstrStage<1, [A9_NPipe]>], [2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000697 //
698 // Double-precision to Integer Move
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000699 InstrItinData<IIC_VMOVDI , [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000700 // FIXME: all latencies are arbitrary, no information is available
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000701 InstrStage<3, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000702 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000703 InstrStage<1, [A9_NPipe]>], [2, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000704 //
705 // Integer to Lane Move
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000706 InstrItinData<IIC_VMOVISL , [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000707 // FIXME: all latencies are arbitrary, no information is available
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000708 InstrStage<4, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000709 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000710 InstrStage<2, [A9_NPipe]>], [3, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000711
712 //
713 // Double-register FP Unary
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000714 InstrItinData<IIC_VUNAD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000715 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000716 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000717 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000718 InstrStage<1, [A9_NPipe]>], [5, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000719 //
720 // Quad-register FP Unary
721 // Result written in N5, but that is relative to the last cycle of multicycle,
722 // so we use 6 for those cases
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000723 InstrItinData<IIC_VUNAQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000724 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000725 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000726 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000727 InstrStage<2, [A9_NPipe]>], [6, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000728 //
729 // Double-register FP Binary
730 // FIXME: We're using this itin for many instructions and [2, 2] here is too
731 // optimistic.
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000732 InstrItinData<IIC_VBIND, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000733 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000734 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000735 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000736 InstrStage<1, [A9_NPipe]>], [5, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000737 //
738 // Quad-register FP Binary
739 // Result written in N5, but that is relative to the last cycle of multicycle,
740 // so we use 6 for those cases
741 // FIXME: We're using this itin for many instructions and [2, 2] here is too
742 // optimistic.
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000743 InstrItinData<IIC_VBINQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000744 // Extra latency cycles since wbck is 8 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000745 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000746 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000747 InstrStage<2, [A9_NPipe]>], [6, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000748 //
749 // Double-register FP Multiple-Accumulate
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000750 InstrItinData<IIC_VMACD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000751 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000752 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000753 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000754 InstrStage<2, [A9_NPipe]>], [6, 3, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000755 //
756 // Quad-register FP Multiple-Accumulate
757 // Result written in N9, but that is relative to the last cycle of multicycle,
758 // so we use 10 for those cases
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000759 InstrItinData<IIC_VMACQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000760 // Extra latency cycles since wbck is 9 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000761 InstrStage<10, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000762 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000763 InstrStage<4, [A9_NPipe]>], [8, 4, 2, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000764 //
765 // Double-register Reciprical Step
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000766 InstrItinData<IIC_VRECSD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000767 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000768 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000769 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000770 InstrStage<2, [A9_NPipe]>], [6, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000771 //
772 // Quad-register Reciprical Step
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000773 InstrItinData<IIC_VRECSQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000774 // Extra latency cycles since wbck is 9 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000775 InstrStage<10, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000776 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000777 InstrStage<4, [A9_NPipe]>], [8, 2, 2]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000778 //
779 // Double-register Permute
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000780 InstrItinData<IIC_VPERMD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000781 // Extra latency cycles since wbck is 6 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000782 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000783 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000784 InstrStage<1, [A9_NPipe]>], [2, 2, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000785 //
786 // Quad-register Permute
787 // Result written in N2, but that is relative to the last cycle of multicycle,
788 // so we use 3 for those cases
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000789 InstrItinData<IIC_VPERMQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000790 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000791 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000792 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000793 InstrStage<2, [A9_NPipe]>], [3, 3, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000794 //
795 // Quad-register Permute (3 cycle issue)
796 // Result written in N2, but that is relative to the last cycle of multicycle,
797 // so we use 4 for those cases
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000798 InstrItinData<IIC_VPERMQ3, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000799 // Extra latency cycles since wbck is 8 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000800 InstrStage<9, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000801 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000802 InstrStage<3, [A9_LSPipe]>], [4, 4, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000803
804 //
805 // Double-register VEXT
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000806 InstrItinData<IIC_VEXTD, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000807 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000808 InstrStage<7, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000809 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000810 InstrStage<1, [A9_NPipe]>], [2, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000811 //
812 // Quad-register VEXT
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000813 InstrItinData<IIC_VEXTQ, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000814 // Extra latency cycles since wbck is 9 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000815 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000816 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000817 InstrStage<2, [A9_NPipe]>], [3, 1, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000818 //
819 // VTB
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000820 InstrItinData<IIC_VTB1, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000821 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000822 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000823 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000824 InstrStage<2, [A9_NPipe]>], [3, 2, 1]>,
825 InstrItinData<IIC_VTB2, [InstrStage<2, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000826 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000827 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000828 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000829 InstrStage<2, [A9_NPipe]>], [3, 2, 2, 1]>,
830 InstrItinData<IIC_VTB3, [InstrStage<2, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000831 // Extra latency cycles since wbck is 8 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000832 InstrStage<9, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000833 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000834 InstrStage<3, [A9_NPipe]>], [4, 2, 2, 3, 1]>,
835 InstrItinData<IIC_VTB4, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000836 // Extra latency cycles since wbck is 8 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000837 InstrStage<9, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000838 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000839 InstrStage<3, [A9_NPipe]>], [4, 2, 2, 3, 3, 1]>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000840 //
841 // VTBX
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000842 InstrItinData<IIC_VTBX1, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000843 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000844 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000845 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000846 InstrStage<2, [A9_NPipe]>], [3, 1, 2, 1]>,
847 InstrItinData<IIC_VTBX2, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000848 // Extra latency cycles since wbck is 7 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000849 InstrStage<8, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000850 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000851 InstrStage<2, [A9_NPipe]>], [3, 1, 2, 2, 1]>,
852 InstrItinData<IIC_VTBX3, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000853 // Extra latency cycles since wbck is 8 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000854 InstrStage<9, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000855 InstrStage<1, [A9_Pipe1]>,
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000856 InstrStage<3, [A9_NPipe]>], [4, 1, 2, 2, 3, 1]>,
857 InstrItinData<IIC_VTBX4, [InstrStage<1, [A9_DRegsN], 0, Required>,
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000858 // Extra latency cycles since wbck is 8 cycles
Anton Korobeynikov7d62e332010-04-18 20:31:01 +0000859 InstrStage<9, [A9_DRegsVFP], 0, Reserved>,
Anton Korobeynikovd4c7cce2010-05-29 19:25:29 +0000860 InstrStage<1, [A9_Pipe1]>,
Jim Grosbach7ea5fc02010-06-28 04:27:01 +0000861 InstrStage<2, [A9_NPipe]>], [4, 1, 2, 2, 3, 3, 1]>
Anton Korobeynikov090323a2010-04-07 18:22:11 +0000862]>;