blob: 16db02ed27579f64813fde3e17c7393ebaee7aed [file] [log] [blame]
Tim Northover00ed9962014-03-29 10:18:08 +00001//===- ARM64InstrFormats.td - ARM64 Instruction Formats ------*- tblgen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10//===----------------------------------------------------------------------===//
11// Describe ARM64 instructions format here
12//
13
14// Format specifies the encoding used by the instruction. This is part of the
15// ad-hoc solution used to emit machine instruction encodings by our machine
16// code emitter.
17class Format<bits<2> val> {
18 bits<2> Value = val;
19}
20
21def PseudoFrm : Format<0>;
22def NormalFrm : Format<1>; // Do we need any others?
23
24// ARM64 Instruction Format
25class ARM64Inst<Format f, string cstr> : Instruction {
26 field bits<32> Inst; // Instruction encoding.
27 // Mask of bits that cause an encoding to be UNPREDICTABLE.
28 // If a bit is set, then if the corresponding bit in the
29 // target encoding differs from its value in the "Inst" field,
30 // the instruction is UNPREDICTABLE (SoftFail in abstract parlance).
31 field bits<32> Unpredictable = 0;
32 // SoftFail is the generic name for this field, but we alias it so
33 // as to make it more obvious what it means in ARM-land.
34 field bits<32> SoftFail = Unpredictable;
35 let Namespace = "ARM64";
36 Format F = f;
37 bits<2> Form = F.Value;
38 let Pattern = [];
39 let Constraints = cstr;
40}
41
42// Pseudo instructions (don't have encoding information)
43class Pseudo<dag oops, dag iops, list<dag> pattern, string cstr = "">
44 : ARM64Inst<PseudoFrm, cstr> {
45 dag OutOperandList = oops;
46 dag InOperandList = iops;
47 let Pattern = pattern;
48 let isCodeGenOnly = 1;
49}
50
51// Real instructions (have encoding information)
52class EncodedI<string cstr, list<dag> pattern> : ARM64Inst<NormalFrm, cstr> {
53 let Pattern = pattern;
54 let Size = 4;
55}
56
57// Normal instructions
58class I<dag oops, dag iops, string asm, string operands, string cstr,
59 list<dag> pattern>
60 : EncodedI<cstr, pattern> {
61 dag OutOperandList = oops;
62 dag InOperandList = iops;
63 let AsmString = !strconcat(asm, operands);
64}
65
66class TriOpFrag<dag res> : PatFrag<(ops node:$LHS, node:$MHS, node:$RHS), res>;
67class BinOpFrag<dag res> : PatFrag<(ops node:$LHS, node:$RHS), res>;
68class UnOpFrag<dag res> : PatFrag<(ops node:$LHS), res>;
69
70// Helper fragment for an extract of the high portion of a 128-bit vector.
71def extract_high_v16i8 :
72 UnOpFrag<(extract_subvector (v16i8 node:$LHS), (i64 8))>;
73def extract_high_v8i16 :
74 UnOpFrag<(extract_subvector (v8i16 node:$LHS), (i64 4))>;
75def extract_high_v4i32 :
76 UnOpFrag<(extract_subvector (v4i32 node:$LHS), (i64 2))>;
77def extract_high_v2i64 :
78 UnOpFrag<(extract_subvector (v2i64 node:$LHS), (i64 1))>;
79
80//===----------------------------------------------------------------------===//
81// Asm Operand Classes.
82//
83
84// Shifter operand for arithmetic shifted encodings.
85def ShifterOperand : AsmOperandClass {
86 let Name = "Shifter";
87}
88
89// Shifter operand for mov immediate encodings.
90def MovImm32ShifterOperand : AsmOperandClass {
91 let SuperClasses = [ShifterOperand];
92 let Name = "MovImm32Shifter";
93}
94def MovImm64ShifterOperand : AsmOperandClass {
95 let SuperClasses = [ShifterOperand];
96 let Name = "MovImm64Shifter";
97}
98
99// Shifter operand for arithmetic register shifted encodings.
100def ArithmeticShifterOperand : AsmOperandClass {
101 let SuperClasses = [ShifterOperand];
102 let Name = "ArithmeticShifter";
103}
104
105// Shifter operand for arithmetic shifted encodings for ADD/SUB instructions.
106def AddSubShifterOperand : AsmOperandClass {
107 let SuperClasses = [ArithmeticShifterOperand];
108 let Name = "AddSubShifter";
109}
110
111// Shifter operand for logical vector 128/64-bit shifted encodings.
112def LogicalVecShifterOperand : AsmOperandClass {
113 let SuperClasses = [ShifterOperand];
114 let Name = "LogicalVecShifter";
115}
116def LogicalVecHalfWordShifterOperand : AsmOperandClass {
117 let SuperClasses = [LogicalVecShifterOperand];
118 let Name = "LogicalVecHalfWordShifter";
119}
120
121// The "MSL" shifter on the vector MOVI instruction.
122def MoveVecShifterOperand : AsmOperandClass {
123 let SuperClasses = [ShifterOperand];
124 let Name = "MoveVecShifter";
125}
126
127// Extend operand for arithmetic encodings.
128def ExtendOperand : AsmOperandClass { let Name = "Extend"; }
129def ExtendOperand64 : AsmOperandClass {
130 let SuperClasses = [ExtendOperand];
131 let Name = "Extend64";
132}
133// 'extend' that's a lsl of a 64-bit register.
134def ExtendOperandLSL64 : AsmOperandClass {
135 let SuperClasses = [ExtendOperand];
136 let Name = "ExtendLSL64";
137}
138
139// 8-bit floating-point immediate encodings.
140def FPImmOperand : AsmOperandClass {
141 let Name = "FPImm";
142 let ParserMethod = "tryParseFPImm";
143}
144
145// 8-bit immediate for AdvSIMD where 64-bit values of the form:
146// aaaaaaaa bbbbbbbb cccccccc dddddddd eeeeeeee ffffffff gggggggg hhhhhhhh
147// are encoded as the eight bit value 'abcdefgh'.
148def SIMDImmType10Operand : AsmOperandClass { let Name = "SIMDImmType10"; }
149
150
151//===----------------------------------------------------------------------===//
152// Operand Definitions.
153//
154
155// ADR[P] instruction labels.
156def AdrpOperand : AsmOperandClass {
157 let Name = "AdrpLabel";
158 let ParserMethod = "tryParseAdrpLabel";
159}
160def adrplabel : Operand<i64> {
161 let EncoderMethod = "getAdrLabelOpValue";
162 let PrintMethod = "printAdrpLabel";
163 let ParserMatchClass = AdrpOperand;
164}
165
166def AdrOperand : AsmOperandClass {
167 let Name = "AdrLabel";
168 let ParserMethod = "tryParseAdrLabel";
169}
170def adrlabel : Operand<i64> {
171 let EncoderMethod = "getAdrLabelOpValue";
172 let ParserMatchClass = AdrOperand;
173}
174
175// simm9 predicate - True if the immediate is in the range [-256, 255].
176def SImm9Operand : AsmOperandClass {
177 let Name = "SImm9";
178 let DiagnosticType = "InvalidMemoryIndexedSImm9";
179}
180def simm9 : Operand<i64>, ImmLeaf<i64, [{ return Imm >= -256 && Imm < 256; }]> {
181 let ParserMatchClass = SImm9Operand;
182}
183
184// simm7s4 predicate - True if the immediate is a multiple of 4 in the range
185// [-256, 252].
186def SImm7s4Operand : AsmOperandClass {
187 let Name = "SImm7s4";
188 let DiagnosticType = "InvalidMemoryIndexed32SImm7";
189}
190def simm7s4 : Operand<i32> {
191 let ParserMatchClass = SImm7s4Operand;
192 let PrintMethod = "printImmScale4";
193}
194
195// simm7s8 predicate - True if the immediate is a multiple of 8 in the range
196// [-512, 504].
197def SImm7s8Operand : AsmOperandClass {
198 let Name = "SImm7s8";
199 let DiagnosticType = "InvalidMemoryIndexed64SImm7";
200}
201def simm7s8 : Operand<i32> {
202 let ParserMatchClass = SImm7s8Operand;
203 let PrintMethod = "printImmScale8";
204}
205
206// simm7s16 predicate - True if the immediate is a multiple of 16 in the range
207// [-1024, 1008].
208def SImm7s16Operand : AsmOperandClass {
209 let Name = "SImm7s16";
210 let DiagnosticType = "InvalidMemoryIndexed64SImm7";
211}
212def simm7s16 : Operand<i32> {
213 let ParserMatchClass = SImm7s16Operand;
214 let PrintMethod = "printImmScale16";
215}
216
217// imm0_65535 predicate - True if the immediate is in the range [0,65535].
218def Imm0_65535Operand : AsmOperandClass { let Name = "Imm0_65535"; }
219def imm0_65535 : Operand<i32>, ImmLeaf<i32, [{
220 return ((uint32_t)Imm) < 65536;
221}]> {
222 let ParserMatchClass = Imm0_65535Operand;
223}
224
225def Imm1_8Operand : AsmOperandClass {
226 let Name = "Imm1_8";
227 let DiagnosticType = "InvalidImm1_8";
228}
229def Imm1_16Operand : AsmOperandClass {
230 let Name = "Imm1_16";
231 let DiagnosticType = "InvalidImm1_16";
232}
233def Imm1_32Operand : AsmOperandClass {
234 let Name = "Imm1_32";
235 let DiagnosticType = "InvalidImm1_32";
236}
237def Imm1_64Operand : AsmOperandClass {
238 let Name = "Imm1_64";
239 let DiagnosticType = "InvalidImm1_64";
240}
241
242def MovZSymbolG3AsmOperand : AsmOperandClass {
243 let Name = "MovZSymbolG3";
244 let RenderMethod = "addImmOperands";
245}
246
247def movz_symbol_g3 : Operand<i32> {
248 let ParserMatchClass = MovZSymbolG3AsmOperand;
249}
250
251def MovZSymbolG2AsmOperand : AsmOperandClass {
252 let Name = "MovZSymbolG2";
253 let RenderMethod = "addImmOperands";
254}
255
256def movz_symbol_g2 : Operand<i32> {
257 let ParserMatchClass = MovZSymbolG2AsmOperand;
258}
259
260def MovZSymbolG1AsmOperand : AsmOperandClass {
261 let Name = "MovZSymbolG1";
262 let RenderMethod = "addImmOperands";
263}
264
265def movz_symbol_g1 : Operand<i32> {
266 let ParserMatchClass = MovZSymbolG1AsmOperand;
267}
268
269def MovZSymbolG0AsmOperand : AsmOperandClass {
270 let Name = "MovZSymbolG0";
271 let RenderMethod = "addImmOperands";
272}
273
274def movz_symbol_g0 : Operand<i32> {
275 let ParserMatchClass = MovZSymbolG0AsmOperand;
276}
277
278def MovKSymbolG2AsmOperand : AsmOperandClass {
279 let Name = "MovKSymbolG2";
280 let RenderMethod = "addImmOperands";
281}
282
283def movk_symbol_g2 : Operand<i32> {
284 let ParserMatchClass = MovKSymbolG2AsmOperand;
285}
286
287def MovKSymbolG1AsmOperand : AsmOperandClass {
288 let Name = "MovKSymbolG1";
289 let RenderMethod = "addImmOperands";
290}
291
292def movk_symbol_g1 : Operand<i32> {
293 let ParserMatchClass = MovKSymbolG1AsmOperand;
294}
295
296def MovKSymbolG0AsmOperand : AsmOperandClass {
297 let Name = "MovKSymbolG0";
298 let RenderMethod = "addImmOperands";
299}
300
301def movk_symbol_g0 : Operand<i32> {
302 let ParserMatchClass = MovKSymbolG0AsmOperand;
303}
304
305def fixedpoint32 : Operand<i32> {
306 let EncoderMethod = "getFixedPointScaleOpValue";
307 let DecoderMethod = "DecodeFixedPointScaleImm";
308 let ParserMatchClass = Imm1_32Operand;
309}
310def fixedpoint64 : Operand<i64> {
311 let EncoderMethod = "getFixedPointScaleOpValue";
312 let DecoderMethod = "DecodeFixedPointScaleImm";
313 let ParserMatchClass = Imm1_64Operand;
314}
315
316def vecshiftR8 : Operand<i32>, ImmLeaf<i32, [{
317 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 9);
318}]> {
319 let EncoderMethod = "getVecShiftR8OpValue";
320 let DecoderMethod = "DecodeVecShiftR8Imm";
321 let ParserMatchClass = Imm1_8Operand;
322}
323def vecshiftR16 : Operand<i32>, ImmLeaf<i32, [{
324 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 17);
325}]> {
326 let EncoderMethod = "getVecShiftR16OpValue";
327 let DecoderMethod = "DecodeVecShiftR16Imm";
328 let ParserMatchClass = Imm1_16Operand;
329}
330def vecshiftR16Narrow : Operand<i32>, ImmLeaf<i32, [{
331 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 9);
332}]> {
333 let EncoderMethod = "getVecShiftR16OpValue";
334 let DecoderMethod = "DecodeVecShiftR16ImmNarrow";
335 let ParserMatchClass = Imm1_8Operand;
336}
337def vecshiftR32 : Operand<i32>, ImmLeaf<i32, [{
338 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 33);
339}]> {
340 let EncoderMethod = "getVecShiftR32OpValue";
341 let DecoderMethod = "DecodeVecShiftR32Imm";
342 let ParserMatchClass = Imm1_32Operand;
343}
344def vecshiftR32Narrow : Operand<i32>, ImmLeaf<i32, [{
345 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 17);
346}]> {
347 let EncoderMethod = "getVecShiftR32OpValue";
348 let DecoderMethod = "DecodeVecShiftR32ImmNarrow";
349 let ParserMatchClass = Imm1_16Operand;
350}
351def vecshiftR64 : Operand<i32>, ImmLeaf<i32, [{
352 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 65);
353}]> {
354 let EncoderMethod = "getVecShiftR64OpValue";
355 let DecoderMethod = "DecodeVecShiftR64Imm";
356 let ParserMatchClass = Imm1_64Operand;
357}
358def vecshiftR64Narrow : Operand<i32>, ImmLeaf<i32, [{
359 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 33);
360}]> {
361 let EncoderMethod = "getVecShiftR64OpValue";
362 let DecoderMethod = "DecodeVecShiftR64ImmNarrow";
363 let ParserMatchClass = Imm1_32Operand;
364}
365
366def Imm0_7Operand : AsmOperandClass { let Name = "Imm0_7"; }
367def Imm0_15Operand : AsmOperandClass { let Name = "Imm0_15"; }
368def Imm0_31Operand : AsmOperandClass { let Name = "Imm0_31"; }
369def Imm0_63Operand : AsmOperandClass { let Name = "Imm0_63"; }
370
371def vecshiftL8 : Operand<i32>, ImmLeaf<i32, [{
372 return (((uint32_t)Imm) < 8);
373}]> {
374 let EncoderMethod = "getVecShiftL8OpValue";
375 let DecoderMethod = "DecodeVecShiftL8Imm";
376 let ParserMatchClass = Imm0_7Operand;
377}
378def vecshiftL16 : Operand<i32>, ImmLeaf<i32, [{
379 return (((uint32_t)Imm) < 16);
380}]> {
381 let EncoderMethod = "getVecShiftL16OpValue";
382 let DecoderMethod = "DecodeVecShiftL16Imm";
383 let ParserMatchClass = Imm0_15Operand;
384}
385def vecshiftL32 : Operand<i32>, ImmLeaf<i32, [{
386 return (((uint32_t)Imm) < 32);
387}]> {
388 let EncoderMethod = "getVecShiftL32OpValue";
389 let DecoderMethod = "DecodeVecShiftL32Imm";
390 let ParserMatchClass = Imm0_31Operand;
391}
392def vecshiftL64 : Operand<i32>, ImmLeaf<i32, [{
393 return (((uint32_t)Imm) < 64);
394}]> {
395 let EncoderMethod = "getVecShiftL64OpValue";
396 let DecoderMethod = "DecodeVecShiftL64Imm";
397 let ParserMatchClass = Imm0_63Operand;
398}
399
400
401// Crazy immediate formats used by 32-bit and 64-bit logical immediate
402// instructions for splatting repeating bit patterns across the immediate.
403def logical_imm32_XFORM : SDNodeXForm<imm, [{
404 uint64_t enc = ARM64_AM::encodeLogicalImmediate(N->getZExtValue(), 32);
405 return CurDAG->getTargetConstant(enc, MVT::i32);
406}]>;
407def logical_imm64_XFORM : SDNodeXForm<imm, [{
408 uint64_t enc = ARM64_AM::encodeLogicalImmediate(N->getZExtValue(), 64);
409 return CurDAG->getTargetConstant(enc, MVT::i32);
410}]>;
411
412def LogicalImm32Operand : AsmOperandClass { let Name = "LogicalImm32"; }
413def LogicalImm64Operand : AsmOperandClass { let Name = "LogicalImm64"; }
414def logical_imm32 : Operand<i32>, PatLeaf<(imm), [{
415 return ARM64_AM::isLogicalImmediate(N->getZExtValue(), 32);
416}], logical_imm32_XFORM> {
417 let PrintMethod = "printLogicalImm32";
418 let ParserMatchClass = LogicalImm32Operand;
419}
420def logical_imm64 : Operand<i64>, PatLeaf<(imm), [{
421 return ARM64_AM::isLogicalImmediate(N->getZExtValue(), 64);
422}], logical_imm64_XFORM> {
423 let PrintMethod = "printLogicalImm64";
424 let ParserMatchClass = LogicalImm64Operand;
425}
426
427// imm0_255 predicate - True if the immediate is in the range [0,255].
428def Imm0_255Operand : AsmOperandClass { let Name = "Imm0_255"; }
429def imm0_255 : Operand<i32>, ImmLeaf<i32, [{
430 return ((uint32_t)Imm) < 256;
431}]> {
432 let ParserMatchClass = Imm0_255Operand;
433}
434
435// imm0_127 predicate - True if the immediate is in the range [0,127]
436def Imm0_127Operand : AsmOperandClass { let Name = "Imm0_127"; }
437def imm0_127 : Operand<i32>, ImmLeaf<i32, [{
438 return ((uint32_t)Imm) < 128;
439}]> {
440 let ParserMatchClass = Imm0_127Operand;
441}
442
Tim Northover2ad88d32014-04-03 09:26:16 +0000443// NOTE: These imm0_N operands have to be of type i64 because i64 is the size
444// for all shift-amounts.
445
Tim Northover00ed9962014-03-29 10:18:08 +0000446// imm0_63 predicate - True if the immediate is in the range [0,63]
Tim Northover00ed9962014-03-29 10:18:08 +0000447def imm0_63 : Operand<i64>, ImmLeaf<i64, [{
448 return ((uint64_t)Imm) < 64;
449}]> {
450 let ParserMatchClass = Imm0_63Operand;
451}
452
Tim Northover2ad88d32014-04-03 09:26:16 +0000453// imm0_31 predicate - True if the immediate is in the range [0,31]
454def imm0_31 : Operand<i64>, ImmLeaf<i64, [{
Tim Northover00ed9962014-03-29 10:18:08 +0000455 return ((uint64_t)Imm) < 32;
456}]> {
457 let ParserMatchClass = Imm0_31Operand;
458}
459
Tim Northover2ad88d32014-04-03 09:26:16 +0000460// imm0_15 predicate - True if the immediate is in the range [0,15]
461def imm0_15 : Operand<i64>, ImmLeaf<i64, [{
Tim Northover00ed9962014-03-29 10:18:08 +0000462 return ((uint64_t)Imm) < 16;
463}]> {
464 let ParserMatchClass = Imm0_15Operand;
465}
466
Tim Northover00ed9962014-03-29 10:18:08 +0000467// imm0_7 predicate - True if the immediate is in the range [0,7]
Tim Northover2ad88d32014-04-03 09:26:16 +0000468def imm0_7 : Operand<i64>, ImmLeaf<i64, [{
469 return ((uint64_t)Imm) < 8;
Tim Northover00ed9962014-03-29 10:18:08 +0000470}]> {
471 let ParserMatchClass = Imm0_7Operand;
472}
473
474// An arithmetic shifter operand:
475// {7-6} - shift type: 00 = lsl, 01 = lsr, 10 = asr
476// {5-0} - imm6
477def arith_shift : Operand<i32> {
478 let PrintMethod = "printShifter";
479 let ParserMatchClass = ArithmeticShifterOperand;
480}
481
482class arith_shifted_reg<ValueType Ty, RegisterClass regclass>
483 : Operand<Ty>,
484 ComplexPattern<Ty, 2, "SelectArithShiftedRegister", []> {
485 let PrintMethod = "printShiftedRegister";
486 let MIOperandInfo = (ops regclass, arith_shift);
487}
488
489def arith_shifted_reg32 : arith_shifted_reg<i32, GPR32>;
490def arith_shifted_reg64 : arith_shifted_reg<i64, GPR64>;
491
492// An arithmetic shifter operand:
493// {7-6} - shift type: 00 = lsl, 01 = lsr, 10 = asr, 11 = ror
494// {5-0} - imm6
495def logical_shift : Operand<i32> {
496 let PrintMethod = "printShifter";
497 let ParserMatchClass = ShifterOperand;
498}
499
500class logical_shifted_reg<ValueType Ty, RegisterClass regclass>
501 : Operand<Ty>,
502 ComplexPattern<Ty, 2, "SelectLogicalShiftedRegister", []> {
503 let PrintMethod = "printShiftedRegister";
504 let MIOperandInfo = (ops regclass, logical_shift);
505}
506
507def logical_shifted_reg32 : logical_shifted_reg<i32, GPR32>;
508def logical_shifted_reg64 : logical_shifted_reg<i64, GPR64>;
509
510// A logical vector shifter operand:
511// {7-6} - shift type: 00 = lsl
512// {5-0} - imm6: #0, #8, #16, or #24
513def logical_vec_shift : Operand<i32> {
514 let PrintMethod = "printShifter";
515 let EncoderMethod = "getVecShifterOpValue";
516 let ParserMatchClass = LogicalVecShifterOperand;
517}
518
519// A logical vector half-word shifter operand:
520// {7-6} - shift type: 00 = lsl
521// {5-0} - imm6: #0 or #8
522def logical_vec_hw_shift : Operand<i32> {
523 let PrintMethod = "printShifter";
524 let EncoderMethod = "getVecShifterOpValue";
525 let ParserMatchClass = LogicalVecHalfWordShifterOperand;
526}
527
528// A vector move shifter operand:
529// {0} - imm1: #8 or #16
530def move_vec_shift : Operand<i32> {
531 let PrintMethod = "printShifter";
532 let EncoderMethod = "getMoveVecShifterOpValue";
533 let ParserMatchClass = MoveVecShifterOperand;
534}
535
536// An ADD/SUB immediate shifter operand:
537// {7-6} - shift type: 00 = lsl
538// {5-0} - imm6: #0 or #12
539def addsub_shift : Operand<i32> {
540 let ParserMatchClass = AddSubShifterOperand;
541}
542
543class addsub_shifted_imm<ValueType Ty>
544 : Operand<Ty>, ComplexPattern<Ty, 2, "SelectArithImmed", [imm]> {
545 let PrintMethod = "printAddSubImm";
546 let EncoderMethod = "getAddSubImmOpValue";
547 let MIOperandInfo = (ops i32imm, addsub_shift);
548}
549
550def addsub_shifted_imm32 : addsub_shifted_imm<i32>;
551def addsub_shifted_imm64 : addsub_shifted_imm<i64>;
552
553class neg_addsub_shifted_imm<ValueType Ty>
554 : Operand<Ty>, ComplexPattern<Ty, 2, "SelectNegArithImmed", [imm]> {
555 let PrintMethod = "printAddSubImm";
556 let EncoderMethod = "getAddSubImmOpValue";
557 let MIOperandInfo = (ops i32imm, addsub_shift);
558}
559
560def neg_addsub_shifted_imm32 : neg_addsub_shifted_imm<i32>;
561def neg_addsub_shifted_imm64 : neg_addsub_shifted_imm<i64>;
562
563// An extend operand:
564// {5-3} - extend type
565// {2-0} - imm3
566def arith_extend : Operand<i32> {
567 let PrintMethod = "printExtend";
568 let ParserMatchClass = ExtendOperand;
569}
570def arith_extend64 : Operand<i32> {
571 let PrintMethod = "printExtend";
572 let ParserMatchClass = ExtendOperand64;
573}
574
575// 'extend' that's a lsl of a 64-bit register.
576def arith_extendlsl64 : Operand<i32> {
577 let PrintMethod = "printExtend";
578 let ParserMatchClass = ExtendOperandLSL64;
579}
580
581class arith_extended_reg32<ValueType Ty> : Operand<Ty>,
582 ComplexPattern<Ty, 2, "SelectArithExtendedRegister", []> {
583 let PrintMethod = "printExtendedRegister";
584 let MIOperandInfo = (ops GPR32, arith_extend);
585}
586
587class arith_extended_reg32to64<ValueType Ty> : Operand<Ty>,
588 ComplexPattern<Ty, 2, "SelectArithExtendedRegister", []> {
589 let PrintMethod = "printExtendedRegister";
590 let MIOperandInfo = (ops GPR32, arith_extend64);
591}
592
593// Floating-point immediate.
594def fpimm32 : Operand<f32>,
595 PatLeaf<(f32 fpimm), [{
596 return ARM64_AM::getFP32Imm(N->getValueAPF()) != -1;
597 }], SDNodeXForm<fpimm, [{
598 APFloat InVal = N->getValueAPF();
599 uint32_t enc = ARM64_AM::getFP32Imm(InVal);
600 return CurDAG->getTargetConstant(enc, MVT::i32);
601 }]>> {
602 let ParserMatchClass = FPImmOperand;
603 let PrintMethod = "printFPImmOperand";
604}
605def fpimm64 : Operand<f64>,
606 PatLeaf<(f64 fpimm), [{
607 return ARM64_AM::getFP64Imm(N->getValueAPF()) != -1;
608 }], SDNodeXForm<fpimm, [{
609 APFloat InVal = N->getValueAPF();
610 uint32_t enc = ARM64_AM::getFP64Imm(InVal);
611 return CurDAG->getTargetConstant(enc, MVT::i32);
612 }]>> {
613 let ParserMatchClass = FPImmOperand;
614 let PrintMethod = "printFPImmOperand";
615}
616
617def fpimm8 : Operand<i32> {
618 let ParserMatchClass = FPImmOperand;
619 let PrintMethod = "printFPImmOperand";
620}
621
622def fpimm0 : PatLeaf<(fpimm), [{
623 return N->isExactlyValue(+0.0);
624}]>;
625
626// 8-bit immediate for AdvSIMD where 64-bit values of the form:
627// aaaaaaaa bbbbbbbb cccccccc dddddddd eeeeeeee ffffffff gggggggg hhhhhhhh
628// are encoded as the eight bit value 'abcdefgh'.
629def simdimmtype10 : Operand<i32>,
630 PatLeaf<(f64 fpimm), [{
631 return ARM64_AM::isAdvSIMDModImmType10(N->getValueAPF()
632 .bitcastToAPInt()
633 .getZExtValue());
634 }], SDNodeXForm<fpimm, [{
635 APFloat InVal = N->getValueAPF();
636 uint32_t enc = ARM64_AM::encodeAdvSIMDModImmType10(N->getValueAPF()
637 .bitcastToAPInt()
638 .getZExtValue());
639 return CurDAG->getTargetConstant(enc, MVT::i32);
640 }]>> {
641 let ParserMatchClass = SIMDImmType10Operand;
642 let PrintMethod = "printSIMDType10Operand";
643}
644
645
646//---
647// Sytem management
648//---
649
650// Base encoding for system instruction operands.
651let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
652class BaseSystemI<bit L, dag oops, dag iops, string asm, string operands>
653 : I<oops, iops, asm, operands, "", []> {
654 let Inst{31-22} = 0b1101010100;
655 let Inst{21} = L;
656}
657
658// System instructions which do not have an Rt register.
659class SimpleSystemI<bit L, dag iops, string asm, string operands>
660 : BaseSystemI<L, (outs), iops, asm, operands> {
661 let Inst{4-0} = 0b11111;
662}
663
664// System instructions which have an Rt register.
665class RtSystemI<bit L, dag oops, dag iops, string asm, string operands>
666 : BaseSystemI<L, oops, iops, asm, operands>,
667 Sched<[WriteSys]> {
668 bits<5> Rt;
669 let Inst{4-0} = Rt;
670}
671
672// Hint instructions that take both a CRm and a 3-bit immediate.
673class HintI<string mnemonic>
674 : SimpleSystemI<0, (ins imm0_127:$imm), mnemonic#" $imm", "">,
675 Sched<[WriteHint]> {
676 bits <7> imm;
677 let Inst{20-12} = 0b000110010;
678 let Inst{11-5} = imm;
679}
680
681// System instructions taking a single literal operand which encodes into
682// CRm. op2 differentiates the opcodes.
683def BarrierAsmOperand : AsmOperandClass {
684 let Name = "Barrier";
685 let ParserMethod = "tryParseBarrierOperand";
686}
687def barrier_op : Operand<i32> {
688 let PrintMethod = "printBarrierOption";
689 let ParserMatchClass = BarrierAsmOperand;
690}
691class CRmSystemI<Operand crmtype, bits<3> opc, string asm>
692 : SimpleSystemI<0, (ins crmtype:$CRm), asm, "\t$CRm">,
693 Sched<[WriteBarrier]> {
694 bits<4> CRm;
695 let Inst{20-12} = 0b000110011;
696 let Inst{11-8} = CRm;
697 let Inst{7-5} = opc;
698}
699
Bradley Smith08c391c2014-04-09 14:42:36 +0000700// MRS/MSR system instructions. These have different operand classes because
701// a different subset of registers can be accessed through each instruction.
702def MRSSystemRegisterOperand : AsmOperandClass {
703 let Name = "MRSSystemRegister";
Bradley Smithe8b41662014-04-09 14:43:06 +0000704 let ParserMethod = "tryParseSysReg";
Tim Northover00ed9962014-03-29 10:18:08 +0000705}
706// concatenation of 1, op0, op1, CRn, CRm, op2. 16-bit immediate.
Bradley Smith08c391c2014-04-09 14:42:36 +0000707def mrs_sysreg_op : Operand<i32> {
708 let ParserMatchClass = MRSSystemRegisterOperand;
709 let DecoderMethod = "DecodeMRSSystemRegister";
710 let PrintMethod = "printMRSSystemRegister";
Tim Northover00ed9962014-03-29 10:18:08 +0000711}
712
Bradley Smith08c391c2014-04-09 14:42:36 +0000713def MSRSystemRegisterOperand : AsmOperandClass {
714 let Name = "MSRSystemRegister";
Bradley Smithe8b41662014-04-09 14:43:06 +0000715 let ParserMethod = "tryParseSysReg";
Bradley Smith08c391c2014-04-09 14:42:36 +0000716}
717def msr_sysreg_op : Operand<i32> {
718 let ParserMatchClass = MSRSystemRegisterOperand;
719 let DecoderMethod = "DecodeMSRSystemRegister";
720 let PrintMethod = "printMSRSystemRegister";
721}
722
723class MRSI : RtSystemI<1, (outs GPR64:$Rt), (ins mrs_sysreg_op:$systemreg),
Tim Northover00ed9962014-03-29 10:18:08 +0000724 "mrs", "\t$Rt, $systemreg"> {
725 bits<15> systemreg;
726 let Inst{20} = 1;
727 let Inst{19-5} = systemreg;
728}
729
730// FIXME: Some of these def CPSR, others don't. Best way to model that?
731// Explicitly modeling each of the system register as a register class
732// would do it, but feels like overkill at this point.
Bradley Smith08c391c2014-04-09 14:42:36 +0000733class MSRI : RtSystemI<0, (outs), (ins msr_sysreg_op:$systemreg, GPR64:$Rt),
Tim Northover00ed9962014-03-29 10:18:08 +0000734 "msr", "\t$systemreg, $Rt"> {
735 bits<15> systemreg;
736 let Inst{20} = 1;
737 let Inst{19-5} = systemreg;
738}
739
740def SystemCPSRFieldOperand : AsmOperandClass {
741 let Name = "SystemCPSRField";
Bradley Smithe8b41662014-04-09 14:43:06 +0000742 let ParserMethod = "tryParseSysReg";
Tim Northover00ed9962014-03-29 10:18:08 +0000743}
744def cpsrfield_op : Operand<i32> {
745 let ParserMatchClass = SystemCPSRFieldOperand;
746 let PrintMethod = "printSystemCPSRField";
747}
748
749let Defs = [CPSR] in
750class MSRcpsrI : SimpleSystemI<0, (ins cpsrfield_op:$cpsr_field, imm0_15:$imm),
751 "msr", "\t$cpsr_field, $imm">,
752 Sched<[WriteSys]> {
753 bits<6> cpsrfield;
754 bits<4> imm;
755 let Inst{20-19} = 0b00;
756 let Inst{18-16} = cpsrfield{5-3};
757 let Inst{15-12} = 0b0100;
758 let Inst{11-8} = imm;
759 let Inst{7-5} = cpsrfield{2-0};
760
761 let DecoderMethod = "DecodeSystemCPSRInstruction";
762}
763
764// SYS and SYSL generic system instructions.
765def SysCRAsmOperand : AsmOperandClass {
766 let Name = "SysCR";
767 let ParserMethod = "tryParseSysCROperand";
768}
769
770def sys_cr_op : Operand<i32> {
771 let PrintMethod = "printSysCROperand";
772 let ParserMatchClass = SysCRAsmOperand;
773}
774
775class SystemI<bit L, string asm>
776 : SimpleSystemI<L,
777 (ins imm0_7:$op1, sys_cr_op:$Cn, sys_cr_op:$Cm, imm0_7:$op2),
778 asm, "\t$op1, $Cn, $Cm, $op2">,
779 Sched<[WriteSys]> {
780 bits<3> op1;
781 bits<4> Cn;
782 bits<4> Cm;
783 bits<3> op2;
784 let Inst{20-19} = 0b01;
785 let Inst{18-16} = op1;
786 let Inst{15-12} = Cn;
787 let Inst{11-8} = Cm;
788 let Inst{7-5} = op2;
789}
790
791class SystemXtI<bit L, string asm>
792 : RtSystemI<L, (outs),
793 (ins imm0_7:$op1, sys_cr_op:$Cn, sys_cr_op:$Cm, imm0_7:$op2, GPR64:$Rt),
794 asm, "\t$op1, $Cn, $Cm, $op2, $Rt"> {
795 bits<3> op1;
796 bits<4> Cn;
797 bits<4> Cm;
798 bits<3> op2;
799 let Inst{20-19} = 0b01;
800 let Inst{18-16} = op1;
801 let Inst{15-12} = Cn;
802 let Inst{11-8} = Cm;
803 let Inst{7-5} = op2;
804}
805
806class SystemLXtI<bit L, string asm>
807 : RtSystemI<L, (outs),
808 (ins GPR64:$Rt, imm0_7:$op1, sys_cr_op:$Cn, sys_cr_op:$Cm, imm0_7:$op2),
809 asm, "\t$Rt, $op1, $Cn, $Cm, $op2"> {
810 bits<3> op1;
811 bits<4> Cn;
812 bits<4> Cm;
813 bits<3> op2;
814 let Inst{20-19} = 0b01;
815 let Inst{18-16} = op1;
816 let Inst{15-12} = Cn;
817 let Inst{11-8} = Cm;
818 let Inst{7-5} = op2;
819}
820
821
822// Branch (register) instructions:
823//
824// case opc of
825// 0001 blr
826// 0000 br
827// 0101 dret
828// 0100 eret
829// 0010 ret
830// otherwise UNDEFINED
831class BaseBranchReg<bits<4> opc, dag oops, dag iops, string asm,
832 string operands, list<dag> pattern>
833 : I<oops, iops, asm, operands, "", pattern>, Sched<[WriteBrReg]> {
834 let Inst{31-25} = 0b1101011;
835 let Inst{24-21} = opc;
836 let Inst{20-16} = 0b11111;
837 let Inst{15-10} = 0b000000;
838 let Inst{4-0} = 0b00000;
839}
840
841class BranchReg<bits<4> opc, string asm, list<dag> pattern>
842 : BaseBranchReg<opc, (outs), (ins GPR64:$Rn), asm, "\t$Rn", pattern> {
843 bits<5> Rn;
844 let Inst{9-5} = Rn;
845}
846
847let mayLoad = 0, mayStore = 0, hasSideEffects = 1, isReturn = 1 in
848class SpecialReturn<bits<4> opc, string asm>
849 : BaseBranchReg<opc, (outs), (ins), asm, "", []> {
850 let Inst{9-5} = 0b11111;
851}
852
853//---
854// Conditional branch instruction.
855//---
856// Branch condition code.
857// 4-bit immediate. Pretty-printed as .<cc>
858def dotCcode : Operand<i32> {
859 let PrintMethod = "printDotCondCode";
860}
861
862// Conditional branch target. 19-bit immediate. The low two bits of the target
863// offset are implied zero and so are not part of the immediate.
864def BranchTarget19Operand : AsmOperandClass {
865 let Name = "BranchTarget19";
866}
867def am_brcond : Operand<OtherVT> {
868 let EncoderMethod = "getCondBranchTargetOpValue";
869 let DecoderMethod = "DecodeCondBranchTarget";
870 let PrintMethod = "printAlignedBranchTarget";
871 let ParserMatchClass = BranchTarget19Operand;
872}
873
874class BranchCond : I<(outs), (ins dotCcode:$cond, am_brcond:$target),
875 "b", "$cond\t$target", "",
876 [(ARM64brcond bb:$target, imm:$cond, CPSR)]>,
877 Sched<[WriteBr]> {
878 let isBranch = 1;
879 let isTerminator = 1;
880 let Uses = [CPSR];
881
882 bits<4> cond;
883 bits<19> target;
884 let Inst{31-24} = 0b01010100;
885 let Inst{23-5} = target;
886 let Inst{4} = 0;
887 let Inst{3-0} = cond;
888}
889
890//---
891// Compare-and-branch instructions.
892//---
893class BaseCmpBranch<RegisterClass regtype, bit op, string asm, SDNode node>
894 : I<(outs), (ins regtype:$Rt, am_brcond:$target),
895 asm, "\t$Rt, $target", "",
896 [(node regtype:$Rt, bb:$target)]>,
897 Sched<[WriteBr]> {
898 let isBranch = 1;
899 let isTerminator = 1;
900
901 bits<5> Rt;
902 bits<19> target;
903 let Inst{30-25} = 0b011010;
904 let Inst{24} = op;
905 let Inst{23-5} = target;
906 let Inst{4-0} = Rt;
907}
908
909multiclass CmpBranch<bit op, string asm, SDNode node> {
910 def W : BaseCmpBranch<GPR32, op, asm, node> {
911 let Inst{31} = 0;
912 }
913 def X : BaseCmpBranch<GPR64, op, asm, node> {
914 let Inst{31} = 1;
915 }
916}
917
918//---
919// Test-bit-and-branch instructions.
920//---
921// Test-and-branch target. 14-bit sign-extended immediate. The low two bits of
922// the target offset are implied zero and so are not part of the immediate.
923def BranchTarget14Operand : AsmOperandClass {
924 let Name = "BranchTarget14";
925}
926def am_tbrcond : Operand<OtherVT> {
927 let EncoderMethod = "getTestBranchTargetOpValue";
928 let PrintMethod = "printAlignedBranchTarget";
929 let ParserMatchClass = BranchTarget14Operand;
930}
931
932class TestBranch<bit op, string asm, SDNode node>
933 : I<(outs), (ins GPR64:$Rt, imm0_63:$bit_off, am_tbrcond:$target),
934 asm, "\t$Rt, $bit_off, $target", "",
935 [(node GPR64:$Rt, imm0_63:$bit_off, bb:$target)]>,
936 Sched<[WriteBr]> {
937 let isBranch = 1;
938 let isTerminator = 1;
939
940 bits<5> Rt;
941 bits<6> bit_off;
942 bits<14> target;
943
944 let Inst{31} = bit_off{5};
945 let Inst{30-25} = 0b011011;
946 let Inst{24} = op;
947 let Inst{23-19} = bit_off{4-0};
948 let Inst{18-5} = target;
949 let Inst{4-0} = Rt;
950
951 let DecoderMethod = "DecodeTestAndBranch";
952}
953
954//---
955// Unconditional branch (immediate) instructions.
956//---
957def BranchTarget26Operand : AsmOperandClass {
958 let Name = "BranchTarget26";
959}
960def am_b_target : Operand<OtherVT> {
961 let EncoderMethod = "getBranchTargetOpValue";
962 let PrintMethod = "printAlignedBranchTarget";
963 let ParserMatchClass = BranchTarget26Operand;
964}
965def am_bl_target : Operand<i64> {
966 let EncoderMethod = "getBranchTargetOpValue";
967 let PrintMethod = "printAlignedBranchTarget";
968 let ParserMatchClass = BranchTarget26Operand;
969}
970
971class BImm<bit op, dag iops, string asm, list<dag> pattern>
972 : I<(outs), iops, asm, "\t$addr", "", pattern>, Sched<[WriteBr]> {
973 bits<26> addr;
974 let Inst{31} = op;
975 let Inst{30-26} = 0b00101;
976 let Inst{25-0} = addr;
977
978 let DecoderMethod = "DecodeUnconditionalBranch";
979}
980
981class BranchImm<bit op, string asm, list<dag> pattern>
982 : BImm<op, (ins am_b_target:$addr), asm, pattern>;
983class CallImm<bit op, string asm, list<dag> pattern>
984 : BImm<op, (ins am_bl_target:$addr), asm, pattern>;
985
986//---
987// Basic one-operand data processing instructions.
988//---
989
990let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
991class BaseOneOperandData<bits<3> opc, RegisterClass regtype, string asm,
992 SDPatternOperator node>
993 : I<(outs regtype:$Rd), (ins regtype:$Rn), asm, "\t$Rd, $Rn", "",
994 [(set regtype:$Rd, (node regtype:$Rn))]>,
995 Sched<[WriteI]> {
996 bits<5> Rd;
997 bits<5> Rn;
998
999 let Inst{30-13} = 0b101101011000000000;
1000 let Inst{12-10} = opc;
1001 let Inst{9-5} = Rn;
1002 let Inst{4-0} = Rd;
1003}
1004
1005let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1006multiclass OneOperandData<bits<3> opc, string asm,
1007 SDPatternOperator node = null_frag> {
1008 def Wr : BaseOneOperandData<opc, GPR32, asm, node> {
1009 let Inst{31} = 0;
1010 }
1011
1012 def Xr : BaseOneOperandData<opc, GPR64, asm, node> {
1013 let Inst{31} = 1;
1014 }
1015}
1016
1017class OneWRegData<bits<3> opc, string asm, SDPatternOperator node>
1018 : BaseOneOperandData<opc, GPR32, asm, node> {
1019 let Inst{31} = 0;
1020}
1021
1022class OneXRegData<bits<3> opc, string asm, SDPatternOperator node>
1023 : BaseOneOperandData<opc, GPR64, asm, node> {
1024 let Inst{31} = 1;
1025}
1026
1027//---
1028// Basic two-operand data processing instructions.
1029//---
1030class BaseBaseAddSubCarry<bit isSub, RegisterClass regtype, string asm,
1031 list<dag> pattern>
1032 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm),
1033 asm, "\t$Rd, $Rn, $Rm", "", pattern>,
1034 Sched<[WriteI]> {
1035 let Uses = [CPSR];
1036 bits<5> Rd;
1037 bits<5> Rn;
1038 bits<5> Rm;
1039 let Inst{30} = isSub;
1040 let Inst{28-21} = 0b11010000;
1041 let Inst{20-16} = Rm;
1042 let Inst{15-10} = 0;
1043 let Inst{9-5} = Rn;
1044 let Inst{4-0} = Rd;
1045}
1046
1047class BaseAddSubCarry<bit isSub, RegisterClass regtype, string asm,
1048 SDNode OpNode>
1049 : BaseBaseAddSubCarry<isSub, regtype, asm,
1050 [(set regtype:$Rd, (OpNode regtype:$Rn, regtype:$Rm, CPSR))]>;
1051
1052class BaseAddSubCarrySetFlags<bit isSub, RegisterClass regtype, string asm,
1053 SDNode OpNode>
1054 : BaseBaseAddSubCarry<isSub, regtype, asm,
1055 [(set regtype:$Rd, (OpNode regtype:$Rn, regtype:$Rm, CPSR)),
1056 (implicit CPSR)]> {
1057 let Defs = [CPSR];
1058}
1059
1060multiclass AddSubCarry<bit isSub, string asm, string asm_setflags,
1061 SDNode OpNode, SDNode OpNode_setflags> {
1062 def Wr : BaseAddSubCarry<isSub, GPR32, asm, OpNode> {
1063 let Inst{31} = 0;
1064 let Inst{29} = 0;
1065 }
1066 def Xr : BaseAddSubCarry<isSub, GPR64, asm, OpNode> {
1067 let Inst{31} = 1;
1068 let Inst{29} = 0;
1069 }
1070
1071 // Sets flags.
1072 def SWr : BaseAddSubCarrySetFlags<isSub, GPR32, asm_setflags,
1073 OpNode_setflags> {
1074 let Inst{31} = 0;
1075 let Inst{29} = 1;
1076 }
1077 def SXr : BaseAddSubCarrySetFlags<isSub, GPR64, asm_setflags,
1078 OpNode_setflags> {
1079 let Inst{31} = 1;
1080 let Inst{29} = 1;
1081 }
1082}
1083
1084class BaseTwoOperand<bits<4> opc, RegisterClass regtype, string asm,
1085 SDPatternOperator OpNode>
1086 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm),
1087 asm, "\t$Rd, $Rn, $Rm", "",
1088 [(set regtype:$Rd, (OpNode regtype:$Rn, regtype:$Rm))]> {
1089 bits<5> Rd;
1090 bits<5> Rn;
1091 bits<5> Rm;
1092 let Inst{30-21} = 0b0011010110;
1093 let Inst{20-16} = Rm;
1094 let Inst{15-14} = 0b00;
1095 let Inst{13-10} = opc;
1096 let Inst{9-5} = Rn;
1097 let Inst{4-0} = Rd;
1098}
1099
1100class BaseDiv<bit isSigned, RegisterClass regtype, string asm,
1101 SDPatternOperator OpNode>
1102 : BaseTwoOperand<{0,0,1,?}, regtype, asm, OpNode> {
1103 let Inst{10} = isSigned;
1104}
1105
1106multiclass Div<bit isSigned, string asm, SDPatternOperator OpNode> {
1107 def Wr : BaseDiv<isSigned, GPR32, asm, OpNode>,
1108 Sched<[WriteID32]> {
1109 let Inst{31} = 0;
1110 }
1111 def Xr : BaseDiv<isSigned, GPR64, asm, OpNode>,
1112 Sched<[WriteID64]> {
1113 let Inst{31} = 1;
1114 }
1115}
1116
Tim Northover2ad88d32014-04-03 09:26:16 +00001117class BaseShift<bits<2> shift_type, RegisterClass regtype, string asm,
1118 SDPatternOperator OpNode = null_frag>
Tim Northover00ed9962014-03-29 10:18:08 +00001119 : BaseTwoOperand<{1,0,?,?}, regtype, asm, OpNode>,
1120 Sched<[WriteIS]> {
1121 let Inst{11-10} = shift_type;
1122}
1123
1124multiclass Shift<bits<2> shift_type, string asm, SDNode OpNode> {
Tim Northover2ad88d32014-04-03 09:26:16 +00001125 def Wr : BaseShift<shift_type, GPR32, asm> {
Tim Northover00ed9962014-03-29 10:18:08 +00001126 let Inst{31} = 0;
1127 }
1128
1129 def Xr : BaseShift<shift_type, GPR64, asm, OpNode> {
1130 let Inst{31} = 1;
1131 }
Tim Northover2ad88d32014-04-03 09:26:16 +00001132
1133 def : Pat<(i32 (OpNode GPR32:$Rn, i64:$Rm)),
1134 (!cast<Instruction>(NAME # "Wr") GPR32:$Rn,
1135 (EXTRACT_SUBREG i64:$Rm, sub_32))>;
1136
1137 def : Pat<(i32 (OpNode GPR32:$Rn, (i64 (zext GPR32:$Rm)))),
1138 (!cast<Instruction>(NAME # "Wr") GPR32:$Rn, GPR32:$Rm)>;
1139
1140 def : Pat<(i32 (OpNode GPR32:$Rn, (i64 (anyext GPR32:$Rm)))),
1141 (!cast<Instruction>(NAME # "Wr") GPR32:$Rn, GPR32:$Rm)>;
1142
1143 def : Pat<(i32 (OpNode GPR32:$Rn, (i64 (sext GPR32:$Rm)))),
1144 (!cast<Instruction>(NAME # "Wr") GPR32:$Rn, GPR32:$Rm)>;
Tim Northover00ed9962014-03-29 10:18:08 +00001145}
1146
1147class ShiftAlias<string asm, Instruction inst, RegisterClass regtype>
1148 : InstAlias<asm#" $dst, $src1, $src2",
1149 (inst regtype:$dst, regtype:$src1, regtype:$src2)>;
1150
1151class BaseMulAccum<bit isSub, bits<3> opc, RegisterClass multype,
1152 RegisterClass addtype, string asm,
1153 list<dag> pattern>
1154 : I<(outs addtype:$Rd), (ins multype:$Rn, multype:$Rm, addtype:$Ra),
1155 asm, "\t$Rd, $Rn, $Rm, $Ra", "", pattern> {
1156 bits<5> Rd;
1157 bits<5> Rn;
1158 bits<5> Rm;
1159 bits<5> Ra;
1160 let Inst{30-24} = 0b0011011;
1161 let Inst{23-21} = opc;
1162 let Inst{20-16} = Rm;
1163 let Inst{15} = isSub;
1164 let Inst{14-10} = Ra;
1165 let Inst{9-5} = Rn;
1166 let Inst{4-0} = Rd;
1167}
1168
1169multiclass MulAccum<bit isSub, string asm, SDNode AccNode> {
1170 def Wrrr : BaseMulAccum<isSub, 0b000, GPR32, GPR32, asm,
1171 [(set GPR32:$Rd, (AccNode GPR32:$Ra, (mul GPR32:$Rn, GPR32:$Rm)))]>,
1172 Sched<[WriteIM32]> {
1173 let Inst{31} = 0;
1174 }
1175
1176 def Xrrr : BaseMulAccum<isSub, 0b000, GPR64, GPR64, asm,
1177 [(set GPR64:$Rd, (AccNode GPR64:$Ra, (mul GPR64:$Rn, GPR64:$Rm)))]>,
1178 Sched<[WriteIM64]> {
1179 let Inst{31} = 1;
1180 }
1181}
1182
1183class WideMulAccum<bit isSub, bits<3> opc, string asm,
1184 SDNode AccNode, SDNode ExtNode>
1185 : BaseMulAccum<isSub, opc, GPR32, GPR64, asm,
1186 [(set GPR64:$Rd, (AccNode GPR64:$Ra,
1187 (mul (ExtNode GPR32:$Rn), (ExtNode GPR32:$Rm))))]>,
1188 Sched<[WriteIM32]> {
1189 let Inst{31} = 1;
1190}
1191
1192class MulHi<bits<3> opc, string asm, SDNode OpNode>
1193 : I<(outs GPR64:$Rd), (ins GPR64:$Rn, GPR64:$Rm),
1194 asm, "\t$Rd, $Rn, $Rm", "",
1195 [(set GPR64:$Rd, (OpNode GPR64:$Rn, GPR64:$Rm))]>,
1196 Sched<[WriteIM64]> {
1197 bits<5> Rd;
1198 bits<5> Rn;
1199 bits<5> Rm;
1200 let Inst{31-24} = 0b10011011;
1201 let Inst{23-21} = opc;
1202 let Inst{20-16} = Rm;
1203 let Inst{15-10} = 0b011111;
1204 let Inst{9-5} = Rn;
1205 let Inst{4-0} = Rd;
1206}
1207
1208class MulAccumWAlias<string asm, Instruction inst>
1209 : InstAlias<asm#" $dst, $src1, $src2",
1210 (inst GPR32:$dst, GPR32:$src1, GPR32:$src2, WZR)>;
1211class MulAccumXAlias<string asm, Instruction inst>
1212 : InstAlias<asm#" $dst, $src1, $src2",
1213 (inst GPR64:$dst, GPR64:$src1, GPR64:$src2, XZR)>;
1214class WideMulAccumAlias<string asm, Instruction inst>
1215 : InstAlias<asm#" $dst, $src1, $src2",
1216 (inst GPR64:$dst, GPR32:$src1, GPR32:$src2, XZR)>;
1217
1218class BaseCRC32<bit sf, bits<2> sz, bit C, RegisterClass StreamReg,
1219 SDPatternOperator OpNode, string asm>
1220 : I<(outs GPR32:$Rd), (ins GPR32:$Rn, StreamReg:$Rm),
1221 asm, "\t$Rd, $Rn, $Rm", "",
1222 [(set GPR32:$Rd, (OpNode GPR32:$Rn, StreamReg:$Rm))]>,
1223 Sched<[WriteISReg]> {
1224 bits<5> Rd;
1225 bits<5> Rn;
1226 bits<5> Rm;
1227
1228 let Inst{31} = sf;
1229 let Inst{30-21} = 0b0011010110;
1230 let Inst{20-16} = Rm;
1231 let Inst{15-13} = 0b010;
1232 let Inst{12} = C;
1233 let Inst{11-10} = sz;
1234 let Inst{9-5} = Rn;
1235 let Inst{4-0} = Rd;
1236}
1237
1238//---
1239// Address generation.
1240//---
1241
1242class ADRI<bit page, string asm, Operand adr, list<dag> pattern>
1243 : I<(outs GPR64:$Xd), (ins adr:$label), asm, "\t$Xd, $label", "",
1244 pattern>,
1245 Sched<[WriteI]> {
1246 bits<5> Xd;
1247 bits<21> label;
1248 let Inst{31} = page;
1249 let Inst{30-29} = label{1-0};
1250 let Inst{28-24} = 0b10000;
1251 let Inst{23-5} = label{20-2};
1252 let Inst{4-0} = Xd;
1253
1254 let DecoderMethod = "DecodeAdrInstruction";
1255}
1256
1257//---
1258// Move immediate.
1259//---
1260
1261def movimm32_imm : Operand<i32> {
1262 let ParserMatchClass = Imm0_65535Operand;
1263 let EncoderMethod = "getMoveWideImmOpValue";
1264}
1265def movimm32_shift : Operand<i32> {
1266 let PrintMethod = "printShifter";
1267 let ParserMatchClass = MovImm32ShifterOperand;
1268}
1269def movimm64_shift : Operand<i32> {
1270 let PrintMethod = "printShifter";
1271 let ParserMatchClass = MovImm64ShifterOperand;
1272}
1273let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1274class BaseMoveImmediate<bits<2> opc, RegisterClass regtype, Operand shifter,
1275 string asm>
1276 : I<(outs regtype:$Rd), (ins movimm32_imm:$imm, shifter:$shift),
1277 asm, "\t$Rd, $imm$shift", "", []>,
1278 Sched<[WriteImm]> {
1279 bits<5> Rd;
1280 bits<16> imm;
1281 bits<6> shift;
1282 let Inst{30-29} = opc;
1283 let Inst{28-23} = 0b100101;
1284 let Inst{22-21} = shift{5-4};
1285 let Inst{20-5} = imm;
1286 let Inst{4-0} = Rd;
1287
1288 let DecoderMethod = "DecodeMoveImmInstruction";
1289}
1290
1291multiclass MoveImmediate<bits<2> opc, string asm> {
1292 def Wi : BaseMoveImmediate<opc, GPR32, movimm32_shift, asm> {
1293 let Inst{31} = 0;
1294 }
1295
1296 def Xi : BaseMoveImmediate<opc, GPR64, movimm64_shift, asm> {
1297 let Inst{31} = 1;
1298 }
1299}
1300
1301let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1302class BaseInsertImmediate<bits<2> opc, RegisterClass regtype, Operand shifter,
1303 string asm>
1304 : I<(outs regtype:$Rd),
1305 (ins regtype:$src, movimm32_imm:$imm, shifter:$shift),
1306 asm, "\t$Rd, $imm$shift", "$src = $Rd", []>,
1307 Sched<[WriteI]> {
1308 bits<5> Rd;
1309 bits<16> imm;
1310 bits<6> shift;
1311 let Inst{30-29} = opc;
1312 let Inst{28-23} = 0b100101;
1313 let Inst{22-21} = shift{5-4};
1314 let Inst{20-5} = imm;
1315 let Inst{4-0} = Rd;
1316
1317 let DecoderMethod = "DecodeMoveImmInstruction";
1318}
1319
1320multiclass InsertImmediate<bits<2> opc, string asm> {
1321 def Wi : BaseInsertImmediate<opc, GPR32, movimm32_shift, asm> {
1322 let Inst{31} = 0;
1323 }
1324
1325 def Xi : BaseInsertImmediate<opc, GPR64, movimm64_shift, asm> {
1326 let Inst{31} = 1;
1327 }
1328}
1329
1330//---
1331// Add/Subtract
1332//---
1333
1334class BaseAddSubImm<bit isSub, bit setFlags, RegisterClass dstRegtype,
1335 RegisterClass srcRegtype, addsub_shifted_imm immtype,
1336 string asm, SDPatternOperator OpNode>
1337 : I<(outs dstRegtype:$Rd), (ins srcRegtype:$Rn, immtype:$imm),
1338 asm, "\t$Rd, $Rn, $imm", "",
1339 [(set dstRegtype:$Rd, (OpNode srcRegtype:$Rn, immtype:$imm))]>,
1340 Sched<[WriteI]> {
1341 bits<5> Rd;
1342 bits<5> Rn;
1343 bits<14> imm;
1344 let Inst{30} = isSub;
1345 let Inst{29} = setFlags;
1346 let Inst{28-24} = 0b10001;
1347 let Inst{23-22} = imm{13-12}; // '00' => lsl #0, '01' => lsl #12
1348 let Inst{21-10} = imm{11-0};
1349 let Inst{9-5} = Rn;
1350 let Inst{4-0} = Rd;
1351 let DecoderMethod = "DecodeBaseAddSubImm";
1352}
1353
1354class BaseAddSubRegPseudo<RegisterClass regtype,
1355 SDPatternOperator OpNode>
1356 : Pseudo<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm),
1357 [(set regtype:$Rd, (OpNode regtype:$Rn, regtype:$Rm))]>,
1358 Sched<[WriteI]>;
1359
1360class BaseAddSubSReg<bit isSub, bit setFlags, RegisterClass regtype,
1361 arith_shifted_reg shifted_regtype, string asm,
1362 SDPatternOperator OpNode>
1363 : I<(outs regtype:$Rd), (ins regtype:$Rn, shifted_regtype:$Rm),
1364 asm, "\t$Rd, $Rn, $Rm", "",
1365 [(set regtype:$Rd, (OpNode regtype:$Rn, shifted_regtype:$Rm))]>,
1366 Sched<[WriteISReg]> {
1367 // The operands are in order to match the 'addr' MI operands, so we
1368 // don't need an encoder method and by-name matching. Just use the default
1369 // in-order handling. Since we're using by-order, make sure the names
1370 // do not match.
1371 bits<5> dst;
1372 bits<5> src1;
1373 bits<5> src2;
1374 bits<8> shift;
1375 let Inst{30} = isSub;
1376 let Inst{29} = setFlags;
1377 let Inst{28-24} = 0b01011;
1378 let Inst{23-22} = shift{7-6};
1379 let Inst{21} = 0;
1380 let Inst{20-16} = src2;
1381 let Inst{15-10} = shift{5-0};
1382 let Inst{9-5} = src1;
1383 let Inst{4-0} = dst;
1384
1385 let DecoderMethod = "DecodeThreeAddrSRegInstruction";
1386}
1387
1388class BaseAddSubEReg<bit isSub, bit setFlags, RegisterClass dstRegtype,
1389 RegisterClass src1Regtype, Operand src2Regtype,
1390 string asm, SDPatternOperator OpNode>
1391 : I<(outs dstRegtype:$R1),
1392 (ins src1Regtype:$R2, src2Regtype:$R3),
1393 asm, "\t$R1, $R2, $R3", "",
1394 [(set dstRegtype:$R1, (OpNode src1Regtype:$R2, src2Regtype:$R3))]>,
1395 Sched<[WriteIEReg]> {
1396 bits<5> Rd;
1397 bits<5> Rn;
1398 bits<5> Rm;
1399 bits<6> ext;
1400 let Inst{30} = isSub;
1401 let Inst{29} = setFlags;
1402 let Inst{28-24} = 0b01011;
1403 let Inst{23-21} = 0b001;
1404 let Inst{20-16} = Rm;
1405 let Inst{15-13} = ext{5-3};
1406 let Inst{12-10} = ext{2-0};
1407 let Inst{9-5} = Rn;
1408 let Inst{4-0} = Rd;
1409
1410 let DecoderMethod = "DecodeAddSubERegInstruction";
1411}
1412
1413let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1414class BaseAddSubEReg64<bit isSub, bit setFlags, RegisterClass dstRegtype,
1415 RegisterClass src1Regtype, RegisterClass src2Regtype,
1416 Operand ext_op, string asm>
1417 : I<(outs dstRegtype:$Rd),
1418 (ins src1Regtype:$Rn, src2Regtype:$Rm, ext_op:$ext),
1419 asm, "\t$Rd, $Rn, $Rm$ext", "", []>,
1420 Sched<[WriteIEReg]> {
1421 bits<5> Rd;
1422 bits<5> Rn;
1423 bits<5> Rm;
1424 bits<6> ext;
1425 let Inst{30} = isSub;
1426 let Inst{29} = setFlags;
1427 let Inst{28-24} = 0b01011;
1428 let Inst{23-21} = 0b001;
1429 let Inst{20-16} = Rm;
1430 let Inst{15} = ext{5};
1431 let Inst{12-10} = ext{2-0};
1432 let Inst{9-5} = Rn;
1433 let Inst{4-0} = Rd;
1434
1435 let DecoderMethod = "DecodeAddSubERegInstruction";
1436}
1437
1438// Aliases for register+register add/subtract.
1439class AddSubRegAlias<string asm, Instruction inst, RegisterClass dstRegtype,
1440 RegisterClass src1Regtype, RegisterClass src2Regtype,
1441 int shiftExt>
1442 : InstAlias<asm#" $dst, $src1, $src2",
1443 (inst dstRegtype:$dst, src1Regtype:$src1, src2Regtype:$src2,
1444 shiftExt)>;
1445
1446multiclass AddSub<bit isSub, string mnemonic,
1447 SDPatternOperator OpNode = null_frag> {
1448 let hasSideEffects = 0 in {
1449 // Add/Subtract immediate
1450 def Wri : BaseAddSubImm<isSub, 0, GPR32sp, GPR32sp, addsub_shifted_imm32,
1451 mnemonic, OpNode> {
1452 let Inst{31} = 0;
1453 }
1454 def Xri : BaseAddSubImm<isSub, 0, GPR64sp, GPR64sp, addsub_shifted_imm64,
1455 mnemonic, OpNode> {
1456 let Inst{31} = 1;
1457 }
1458
1459 // Add/Subtract register - Only used for CodeGen
1460 def Wrr : BaseAddSubRegPseudo<GPR32, OpNode>;
1461 def Xrr : BaseAddSubRegPseudo<GPR64, OpNode>;
1462
1463 // Add/Subtract shifted register
1464 def Wrs : BaseAddSubSReg<isSub, 0, GPR32, arith_shifted_reg32, mnemonic,
1465 OpNode> {
1466 let Inst{31} = 0;
1467 }
1468 def Xrs : BaseAddSubSReg<isSub, 0, GPR64, arith_shifted_reg64, mnemonic,
1469 OpNode> {
1470 let Inst{31} = 1;
1471 }
1472 }
1473
1474 // Add/Subtract extended register
1475 let AddedComplexity = 1, hasSideEffects = 0 in {
1476 def Wrx : BaseAddSubEReg<isSub, 0, GPR32sp, GPR32sp,
1477 arith_extended_reg32<i32>, mnemonic, OpNode> {
1478 let Inst{31} = 0;
1479 }
1480 def Xrx : BaseAddSubEReg<isSub, 0, GPR64sp, GPR64sp,
1481 arith_extended_reg32to64<i64>, mnemonic, OpNode> {
1482 let Inst{31} = 1;
1483 }
1484 }
1485
1486 def Xrx64 : BaseAddSubEReg64<isSub, 0, GPR64sp, GPR64sp, GPR64,
1487 arith_extendlsl64, mnemonic> {
1488 // UXTX and SXTX only.
1489 let Inst{14-13} = 0b11;
1490 let Inst{31} = 1;
1491 }
1492
1493 // Register/register aliases with no shift when SP is not used.
1494 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Wrs"),
1495 GPR32, GPR32, GPR32, 0>;
1496 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Xrs"),
1497 GPR64, GPR64, GPR64, 0>;
1498
1499 // Register/register aliases with no shift when either the destination or
1500 // first source register is SP. This relies on the shifted register aliases
1501 // above matching first in the case when SP is not used.
1502 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Wrx"),
1503 GPR32sp, GPR32sp, GPR32, 16>; // UXTW #0
1504 def : AddSubRegAlias<mnemonic,
1505 !cast<Instruction>(NAME#"Xrx64"),
1506 GPR64sp, GPR64sp, GPR64, 24>; // UXTX #0
1507}
1508
1509multiclass AddSubS<bit isSub, string mnemonic, SDNode OpNode> {
1510 let isCompare = 1, Defs = [CPSR] in {
1511 // Add/Subtract immediate
1512 def Wri : BaseAddSubImm<isSub, 1, GPR32, GPR32sp, addsub_shifted_imm32,
1513 mnemonic, OpNode> {
1514 let Inst{31} = 0;
1515 }
1516 def Xri : BaseAddSubImm<isSub, 1, GPR64, GPR64sp, addsub_shifted_imm64,
1517 mnemonic, OpNode> {
1518 let Inst{31} = 1;
1519 }
1520
1521 // Add/Subtract register
1522 def Wrr : BaseAddSubRegPseudo<GPR32, OpNode>;
1523 def Xrr : BaseAddSubRegPseudo<GPR64, OpNode>;
1524
1525 // Add/Subtract shifted register
1526 def Wrs : BaseAddSubSReg<isSub, 1, GPR32, arith_shifted_reg32, mnemonic,
1527 OpNode> {
1528 let Inst{31} = 0;
1529 }
1530 def Xrs : BaseAddSubSReg<isSub, 1, GPR64, arith_shifted_reg64, mnemonic,
1531 OpNode> {
1532 let Inst{31} = 1;
1533 }
1534
1535 // Add/Subtract extended register
1536 let AddedComplexity = 1 in {
1537 def Wrx : BaseAddSubEReg<isSub, 1, GPR32, GPR32sp,
1538 arith_extended_reg32<i32>, mnemonic, OpNode> {
1539 let Inst{31} = 0;
1540 }
1541 def Xrx : BaseAddSubEReg<isSub, 1, GPR64, GPR64sp,
1542 arith_extended_reg32<i64>, mnemonic, OpNode> {
1543 let Inst{31} = 1;
1544 }
1545 }
1546
1547 def Xrx64 : BaseAddSubEReg64<isSub, 1, GPR64, GPR64sp, GPR64,
1548 arith_extendlsl64, mnemonic> {
1549 // UXTX and SXTX only.
1550 let Inst{14-13} = 0b11;
1551 let Inst{31} = 1;
1552 }
1553 } // Defs = [CPSR]
1554
1555 // Register/register aliases with no shift when SP is not used.
1556 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Wrs"),
1557 GPR32, GPR32, GPR32, 0>;
1558 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Xrs"),
1559 GPR64, GPR64, GPR64, 0>;
1560
1561 // Register/register aliases with no shift when the first source register
1562 // is SP. This relies on the shifted register aliases above matching first
1563 // in the case when SP is not used.
1564 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Wrx"),
1565 GPR32, GPR32sp, GPR32, 16>; // UXTW #0
1566 def : AddSubRegAlias<mnemonic,
1567 !cast<Instruction>(NAME#"Xrx64"),
1568 GPR64, GPR64sp, GPR64, 24>; // UXTX #0
1569}
1570
1571//---
1572// Extract
1573//---
1574def SDTA64EXTR : SDTypeProfile<1, 3, [SDTCisSameAs<0, 1>, SDTCisSameAs<0, 2>,
Tim Northover2ad88d32014-04-03 09:26:16 +00001575 SDTCisPtrTy<3>]>;
Tim Northover00ed9962014-03-29 10:18:08 +00001576def ARM64Extr : SDNode<"ARM64ISD::EXTR", SDTA64EXTR>;
1577
1578class BaseExtractImm<RegisterClass regtype, Operand imm_type, string asm,
1579 list<dag> patterns>
1580 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, imm_type:$imm),
1581 asm, "\t$Rd, $Rn, $Rm, $imm", "", patterns>,
1582 Sched<[WriteExtr, ReadExtrHi]> {
1583 bits<5> Rd;
1584 bits<5> Rn;
1585 bits<5> Rm;
1586 bits<6> imm;
1587
1588 let Inst{30-23} = 0b00100111;
1589 let Inst{21} = 0;
1590 let Inst{20-16} = Rm;
1591 let Inst{15-10} = imm;
1592 let Inst{9-5} = Rn;
1593 let Inst{4-0} = Rd;
1594}
1595
1596multiclass ExtractImm<string asm> {
1597 def Wrri : BaseExtractImm<GPR32, imm0_31, asm,
1598 [(set GPR32:$Rd,
1599 (ARM64Extr GPR32:$Rn, GPR32:$Rm, imm0_31:$imm))]> {
1600 let Inst{31} = 0;
1601 let Inst{22} = 0;
1602 }
1603 def Xrri : BaseExtractImm<GPR64, imm0_63, asm,
1604 [(set GPR64:$Rd,
1605 (ARM64Extr GPR64:$Rn, GPR64:$Rm, imm0_63:$imm))]> {
1606
1607 let Inst{31} = 1;
1608 let Inst{22} = 1;
1609 }
1610}
1611
1612//---
1613// Bitfield
1614//---
1615
1616let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1617class BaseBitfieldImm<bits<2> opc,
1618 RegisterClass regtype, Operand imm_type, string asm>
1619 : I<(outs regtype:$Rd), (ins regtype:$Rn, imm_type:$immr, imm_type:$imms),
1620 asm, "\t$Rd, $Rn, $immr, $imms", "", []>,
1621 Sched<[WriteIS]> {
1622 bits<5> Rd;
1623 bits<5> Rn;
1624 bits<6> immr;
1625 bits<6> imms;
1626
1627 let Inst{30-29} = opc;
1628 let Inst{28-23} = 0b100110;
1629 let Inst{21-16} = immr;
1630 let Inst{15-10} = imms;
1631 let Inst{9-5} = Rn;
1632 let Inst{4-0} = Rd;
1633}
1634
1635multiclass BitfieldImm<bits<2> opc, string asm> {
1636 def Wri : BaseBitfieldImm<opc, GPR32, imm0_31, asm> {
1637 let Inst{31} = 0;
1638 let Inst{22} = 0;
1639 }
1640 def Xri : BaseBitfieldImm<opc, GPR64, imm0_63, asm> {
1641 let Inst{31} = 1;
1642 let Inst{22} = 1;
1643 }
1644}
1645
1646let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1647class BaseBitfieldImmWith2RegArgs<bits<2> opc,
1648 RegisterClass regtype, Operand imm_type, string asm>
1649 : I<(outs regtype:$Rd), (ins regtype:$src, regtype:$Rn, imm_type:$immr,
1650 imm_type:$imms),
1651 asm, "\t$Rd, $Rn, $immr, $imms", "$src = $Rd", []>,
1652 Sched<[WriteIS]> {
1653 bits<5> Rd;
1654 bits<5> Rn;
1655 bits<6> immr;
1656 bits<6> imms;
1657
1658 let Inst{30-29} = opc;
1659 let Inst{28-23} = 0b100110;
1660 let Inst{21-16} = immr;
1661 let Inst{15-10} = imms;
1662 let Inst{9-5} = Rn;
1663 let Inst{4-0} = Rd;
1664}
1665
1666multiclass BitfieldImmWith2RegArgs<bits<2> opc, string asm> {
1667 def Wri : BaseBitfieldImmWith2RegArgs<opc, GPR32, imm0_31, asm> {
1668 let Inst{31} = 0;
1669 let Inst{22} = 0;
1670 }
1671 def Xri : BaseBitfieldImmWith2RegArgs<opc, GPR64, imm0_63, asm> {
1672 let Inst{31} = 1;
1673 let Inst{22} = 1;
1674 }
1675}
1676
1677//---
1678// Logical
1679//---
1680
1681// Logical (immediate)
1682class BaseLogicalImm<bits<2> opc, RegisterClass dregtype,
1683 RegisterClass sregtype, Operand imm_type, string asm,
1684 list<dag> pattern>
1685 : I<(outs dregtype:$Rd), (ins sregtype:$Rn, imm_type:$imm),
1686 asm, "\t$Rd, $Rn, $imm", "", pattern>,
1687 Sched<[WriteI]> {
1688 bits<5> Rd;
1689 bits<5> Rn;
1690 bits<13> imm;
1691 let Inst{30-29} = opc;
1692 let Inst{28-23} = 0b100100;
1693 let Inst{22} = imm{12};
1694 let Inst{21-16} = imm{11-6};
1695 let Inst{15-10} = imm{5-0};
1696 let Inst{9-5} = Rn;
1697 let Inst{4-0} = Rd;
1698
1699 let DecoderMethod = "DecodeLogicalImmInstruction";
1700}
1701
1702// Logical (shifted register)
1703class BaseLogicalSReg<bits<2> opc, bit N, RegisterClass regtype,
1704 logical_shifted_reg shifted_regtype, string asm,
1705 list<dag> pattern>
1706 : I<(outs regtype:$Rd), (ins regtype:$Rn, shifted_regtype:$Rm),
1707 asm, "\t$Rd, $Rn, $Rm", "", pattern>,
1708 Sched<[WriteISReg]> {
1709 // The operands are in order to match the 'addr' MI operands, so we
1710 // don't need an encoder method and by-name matching. Just use the default
1711 // in-order handling. Since we're using by-order, make sure the names
1712 // do not match.
1713 bits<5> dst;
1714 bits<5> src1;
1715 bits<5> src2;
1716 bits<8> shift;
1717 let Inst{30-29} = opc;
1718 let Inst{28-24} = 0b01010;
1719 let Inst{23-22} = shift{7-6};
1720 let Inst{21} = N;
1721 let Inst{20-16} = src2;
1722 let Inst{15-10} = shift{5-0};
1723 let Inst{9-5} = src1;
1724 let Inst{4-0} = dst;
1725
1726 let DecoderMethod = "DecodeThreeAddrSRegInstruction";
1727}
1728
1729// Aliases for register+register logical instructions.
1730class LogicalRegAlias<string asm, Instruction inst, RegisterClass regtype>
1731 : InstAlias<asm#" $dst, $src1, $src2",
1732 (inst regtype:$dst, regtype:$src1, regtype:$src2, 0)>;
1733
1734let AddedComplexity = 6 in
1735multiclass LogicalImm<bits<2> opc, string mnemonic, SDNode OpNode> {
1736 def Wri : BaseLogicalImm<opc, GPR32sp, GPR32, logical_imm32, mnemonic,
1737 [(set GPR32sp:$Rd, (OpNode GPR32:$Rn,
1738 logical_imm32:$imm))]> {
1739 let Inst{31} = 0;
1740 let Inst{22} = 0; // 64-bit version has an additional bit of immediate.
1741 }
1742 def Xri : BaseLogicalImm<opc, GPR64sp, GPR64, logical_imm64, mnemonic,
1743 [(set GPR64sp:$Rd, (OpNode GPR64:$Rn,
1744 logical_imm64:$imm))]> {
1745 let Inst{31} = 1;
1746 }
1747}
1748
1749multiclass LogicalImmS<bits<2> opc, string mnemonic, SDNode OpNode> {
1750 let isCompare = 1, Defs = [CPSR] in {
1751 def Wri : BaseLogicalImm<opc, GPR32, GPR32, logical_imm32, mnemonic,
1752 [(set GPR32:$Rd, (OpNode GPR32:$Rn, logical_imm32:$imm))]> {
1753 let Inst{31} = 0;
1754 let Inst{22} = 0; // 64-bit version has an additional bit of immediate.
1755 }
1756 def Xri : BaseLogicalImm<opc, GPR64, GPR64, logical_imm64, mnemonic,
1757 [(set GPR64:$Rd, (OpNode GPR64:$Rn, logical_imm64:$imm))]> {
1758 let Inst{31} = 1;
1759 }
1760 } // end Defs = [CPSR]
1761}
1762
1763class BaseLogicalRegPseudo<RegisterClass regtype, SDPatternOperator OpNode>
1764 : Pseudo<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm),
1765 [(set regtype:$Rd, (OpNode regtype:$Rn, regtype:$Rm))]>,
1766 Sched<[WriteI]>;
1767
1768// Split from LogicalImm as not all instructions have both.
1769multiclass LogicalReg<bits<2> opc, bit N, string mnemonic,
1770 SDPatternOperator OpNode> {
1771 def Wrr : BaseLogicalRegPseudo<GPR32, OpNode>;
1772 def Xrr : BaseLogicalRegPseudo<GPR64, OpNode>;
1773
1774 def Wrs : BaseLogicalSReg<opc, N, GPR32, logical_shifted_reg32, mnemonic,
1775 [(set GPR32:$Rd, (OpNode GPR32:$Rn,
1776 logical_shifted_reg32:$Rm))]> {
1777 let Inst{31} = 0;
1778 }
1779 def Xrs : BaseLogicalSReg<opc, N, GPR64, logical_shifted_reg64, mnemonic,
1780 [(set GPR64:$Rd, (OpNode GPR64:$Rn,
1781 logical_shifted_reg64:$Rm))]> {
1782 let Inst{31} = 1;
1783 }
1784
1785 def : LogicalRegAlias<mnemonic,
1786 !cast<Instruction>(NAME#"Wrs"), GPR32>;
1787 def : LogicalRegAlias<mnemonic,
1788 !cast<Instruction>(NAME#"Xrs"), GPR64>;
1789}
1790
1791// Split from LogicalReg to allow setting CPSR Defs
1792multiclass LogicalRegS<bits<2> opc, bit N, string mnemonic> {
1793 let Defs = [CPSR], mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
1794 def Wrs : BaseLogicalSReg<opc, N, GPR32, logical_shifted_reg32, mnemonic, []>{
1795 let Inst{31} = 0;
1796 }
1797 def Xrs : BaseLogicalSReg<opc, N, GPR64, logical_shifted_reg64, mnemonic, []>{
1798 let Inst{31} = 1;
1799 }
1800 } // Defs = [CPSR]
1801
1802 def : LogicalRegAlias<mnemonic,
1803 !cast<Instruction>(NAME#"Wrs"), GPR32>;
1804 def : LogicalRegAlias<mnemonic,
1805 !cast<Instruction>(NAME#"Xrs"), GPR64>;
1806}
1807
1808//---
1809// Conditionally set flags
1810//---
1811
1812// Condition code.
1813// 4-bit immediate. Pretty-printed as <cc>
1814def ccode : Operand<i32> {
1815 let PrintMethod = "printCondCode";
1816}
1817
1818let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1819class BaseCondSetFlagsImm<bit op, RegisterClass regtype, string asm>
1820 : I<(outs), (ins regtype:$Rn, imm0_31:$imm, imm0_15:$nzcv, ccode:$cond),
1821 asm, "\t$Rn, $imm, $nzcv, $cond", "", []>,
1822 Sched<[WriteI]> {
1823 let Uses = [CPSR];
1824 let Defs = [CPSR];
1825
1826 bits<5> Rn;
1827 bits<5> imm;
1828 bits<4> nzcv;
1829 bits<4> cond;
1830
1831 let Inst{30} = op;
1832 let Inst{29-21} = 0b111010010;
1833 let Inst{20-16} = imm;
1834 let Inst{15-12} = cond;
1835 let Inst{11-10} = 0b10;
1836 let Inst{9-5} = Rn;
1837 let Inst{4} = 0b0;
1838 let Inst{3-0} = nzcv;
1839}
1840
1841multiclass CondSetFlagsImm<bit op, string asm> {
1842 def Wi : BaseCondSetFlagsImm<op, GPR32, asm> {
1843 let Inst{31} = 0;
1844 }
1845 def Xi : BaseCondSetFlagsImm<op, GPR64, asm> {
1846 let Inst{31} = 1;
1847 }
1848}
1849
1850let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1851class BaseCondSetFlagsReg<bit op, RegisterClass regtype, string asm>
1852 : I<(outs), (ins regtype:$Rn, regtype:$Rm, imm0_15:$nzcv, ccode:$cond),
1853 asm, "\t$Rn, $Rm, $nzcv, $cond", "", []>,
1854 Sched<[WriteI]> {
1855 let Uses = [CPSR];
1856 let Defs = [CPSR];
1857
1858 bits<5> Rn;
1859 bits<5> Rm;
1860 bits<4> nzcv;
1861 bits<4> cond;
1862
1863 let Inst{30} = op;
1864 let Inst{29-21} = 0b111010010;
1865 let Inst{20-16} = Rm;
1866 let Inst{15-12} = cond;
1867 let Inst{11-10} = 0b00;
1868 let Inst{9-5} = Rn;
1869 let Inst{4} = 0b0;
1870 let Inst{3-0} = nzcv;
1871}
1872
1873multiclass CondSetFlagsReg<bit op, string asm> {
1874 def Wr : BaseCondSetFlagsReg<op, GPR32, asm> {
1875 let Inst{31} = 0;
1876 }
1877 def Xr : BaseCondSetFlagsReg<op, GPR64, asm> {
1878 let Inst{31} = 1;
1879 }
1880}
1881
1882//---
1883// Conditional select
1884//---
1885
1886class BaseCondSelect<bit op, bits<2> op2, RegisterClass regtype, string asm>
1887 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, ccode:$cond),
1888 asm, "\t$Rd, $Rn, $Rm, $cond", "",
1889 [(set regtype:$Rd,
1890 (ARM64csel regtype:$Rn, regtype:$Rm, (i32 imm:$cond), CPSR))]>,
1891 Sched<[WriteI]> {
1892 let Uses = [CPSR];
1893
1894 bits<5> Rd;
1895 bits<5> Rn;
1896 bits<5> Rm;
1897 bits<4> cond;
1898
1899 let Inst{30} = op;
1900 let Inst{29-21} = 0b011010100;
1901 let Inst{20-16} = Rm;
1902 let Inst{15-12} = cond;
1903 let Inst{11-10} = op2;
1904 let Inst{9-5} = Rn;
1905 let Inst{4-0} = Rd;
1906}
1907
1908multiclass CondSelect<bit op, bits<2> op2, string asm> {
1909 def Wr : BaseCondSelect<op, op2, GPR32, asm> {
1910 let Inst{31} = 0;
1911 }
1912 def Xr : BaseCondSelect<op, op2, GPR64, asm> {
1913 let Inst{31} = 1;
1914 }
1915}
1916
1917class BaseCondSelectOp<bit op, bits<2> op2, RegisterClass regtype, string asm,
1918 PatFrag frag>
1919 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, ccode:$cond),
1920 asm, "\t$Rd, $Rn, $Rm, $cond", "",
1921 [(set regtype:$Rd,
1922 (ARM64csel regtype:$Rn, (frag regtype:$Rm),
1923 (i32 imm:$cond), CPSR))]>,
1924 Sched<[WriteI]> {
1925 let Uses = [CPSR];
1926
1927 bits<5> Rd;
1928 bits<5> Rn;
1929 bits<5> Rm;
1930 bits<4> cond;
1931
1932 let Inst{30} = op;
1933 let Inst{29-21} = 0b011010100;
1934 let Inst{20-16} = Rm;
1935 let Inst{15-12} = cond;
1936 let Inst{11-10} = op2;
1937 let Inst{9-5} = Rn;
1938 let Inst{4-0} = Rd;
1939}
1940
1941multiclass CondSelectOp<bit op, bits<2> op2, string asm, PatFrag frag> {
1942 def Wr : BaseCondSelectOp<op, op2, GPR32, asm, frag> {
1943 let Inst{31} = 0;
1944 }
1945 def Xr : BaseCondSelectOp<op, op2, GPR64, asm, frag> {
1946 let Inst{31} = 1;
1947 }
1948}
1949
1950//---
1951// Special Mask Value
1952//---
1953def maski8_or_more : Operand<i32>,
1954 ImmLeaf<i32, [{ return (Imm & 0xff) == 0xff; }]> {
1955}
1956def maski16_or_more : Operand<i32>,
1957 ImmLeaf<i32, [{ return (Imm & 0xffff) == 0xffff; }]> {
1958}
1959
1960
1961//---
1962// Load/store
1963//---
1964
1965// (unsigned immediate)
1966// Indexed for 8-bit registers. offset is in range [0,4095].
1967def MemoryIndexed8Operand : AsmOperandClass {
1968 let Name = "MemoryIndexed8";
1969 let DiagnosticType = "InvalidMemoryIndexed8";
1970}
1971def am_indexed8 : Operand<i64>,
1972 ComplexPattern<i64, 2, "SelectAddrModeIndexed8", []> {
1973 let PrintMethod = "printAMIndexed8";
1974 let EncoderMethod
1975 = "getAMIndexed8OpValue<ARM64::fixup_arm64_ldst_imm12_scale1>";
1976 let ParserMatchClass = MemoryIndexed8Operand;
1977 let MIOperandInfo = (ops GPR64sp:$base, i64imm:$offset);
1978}
1979
1980// Indexed for 16-bit registers. offset is multiple of 2 in range [0,8190],
1981// stored as immval/2 (the 12-bit literal that encodes directly into the insn).
1982def MemoryIndexed16Operand : AsmOperandClass {
1983 let Name = "MemoryIndexed16";
1984 let DiagnosticType = "InvalidMemoryIndexed16";
1985}
1986def am_indexed16 : Operand<i64>,
1987 ComplexPattern<i64, 2, "SelectAddrModeIndexed16", []> {
1988 let PrintMethod = "printAMIndexed16";
1989 let EncoderMethod
1990 = "getAMIndexed8OpValue<ARM64::fixup_arm64_ldst_imm12_scale2>";
1991 let ParserMatchClass = MemoryIndexed16Operand;
1992 let MIOperandInfo = (ops GPR64sp:$base, i64imm:$offset);
1993}
1994
1995// Indexed for 32-bit registers. offset is multiple of 4 in range [0,16380],
1996// stored as immval/4 (the 12-bit literal that encodes directly into the insn).
1997def MemoryIndexed32Operand : AsmOperandClass {
1998 let Name = "MemoryIndexed32";
1999 let DiagnosticType = "InvalidMemoryIndexed32";
2000}
2001def am_indexed32 : Operand<i64>,
2002 ComplexPattern<i64, 2, "SelectAddrModeIndexed32", []> {
2003 let PrintMethod = "printAMIndexed32";
2004 let EncoderMethod
2005 = "getAMIndexed8OpValue<ARM64::fixup_arm64_ldst_imm12_scale4>";
2006 let ParserMatchClass = MemoryIndexed32Operand;
2007 let MIOperandInfo = (ops GPR64sp:$base, i64imm:$offset);
2008}
2009
2010// Indexed for 64-bit registers. offset is multiple of 8 in range [0,32760],
2011// stored as immval/8 (the 12-bit literal that encodes directly into the insn).
2012def MemoryIndexed64Operand : AsmOperandClass {
2013 let Name = "MemoryIndexed64";
2014 let DiagnosticType = "InvalidMemoryIndexed64";
2015}
2016def am_indexed64 : Operand<i64>,
2017 ComplexPattern<i64, 2, "SelectAddrModeIndexed64", []> {
2018 let PrintMethod = "printAMIndexed64";
2019 let EncoderMethod
2020 = "getAMIndexed8OpValue<ARM64::fixup_arm64_ldst_imm12_scale8>";
2021 let ParserMatchClass = MemoryIndexed64Operand;
2022 let MIOperandInfo = (ops GPR64sp:$base, i64imm:$offset);
2023}
2024
2025// Indexed for 128-bit registers. offset is multiple of 16 in range [0,65520],
2026// stored as immval/16 (the 12-bit literal that encodes directly into the insn).
2027def MemoryIndexed128Operand : AsmOperandClass {
2028 let Name = "MemoryIndexed128";
2029 let DiagnosticType = "InvalidMemoryIndexed128";
2030}
2031def am_indexed128 : Operand<i64>,
2032 ComplexPattern<i64, 2, "SelectAddrModeIndexed128", []> {
2033 let PrintMethod = "printAMIndexed128";
2034 let EncoderMethod
2035 = "getAMIndexed8OpValue<ARM64::fixup_arm64_ldst_imm12_scale16>";
2036 let ParserMatchClass = MemoryIndexed128Operand;
2037 let MIOperandInfo = (ops GPR64sp:$base, i64imm:$offset);
2038}
2039
2040// No offset.
2041def MemoryNoIndexOperand : AsmOperandClass { let Name = "MemoryNoIndex"; }
2042def am_noindex : Operand<i64>,
2043 ComplexPattern<i64, 1, "SelectAddrModeNoIndex", []> {
2044 let PrintMethod = "printAMNoIndex";
2045 let ParserMatchClass = MemoryNoIndexOperand;
2046 let MIOperandInfo = (ops GPR64sp:$base);
2047}
2048
2049class BaseLoadStoreUI<bits<2> sz, bit V, bits<2> opc, dag oops, dag iops,
2050 string asm, list<dag> pattern>
2051 : I<oops, iops, asm, "\t$Rt, $addr", "", pattern> {
2052 bits<5> dst;
2053
2054 bits<17> addr;
2055 bits<5> base = addr{4-0};
2056 bits<12> offset = addr{16-5};
2057
2058 let Inst{31-30} = sz;
2059 let Inst{29-27} = 0b111;
2060 let Inst{26} = V;
2061 let Inst{25-24} = 0b01;
2062 let Inst{23-22} = opc;
2063 let Inst{21-10} = offset;
2064 let Inst{9-5} = base;
2065 let Inst{4-0} = dst;
2066
2067 let DecoderMethod = "DecodeUnsignedLdStInstruction";
2068}
2069
2070let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
2071class LoadUI<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2072 Operand indextype, string asm, list<dag> pattern>
2073 : BaseLoadStoreUI<sz, V, opc,
2074 (outs regtype:$Rt), (ins indextype:$addr), asm, pattern>,
2075 Sched<[WriteLD]>;
2076
2077let mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
2078class StoreUI<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2079 Operand indextype, string asm, list<dag> pattern>
2080 : BaseLoadStoreUI<sz, V, opc,
2081 (outs), (ins regtype:$Rt, indextype:$addr), asm, pattern>,
2082 Sched<[WriteST]>;
2083
2084def PrefetchOperand : AsmOperandClass {
2085 let Name = "Prefetch";
2086 let ParserMethod = "tryParsePrefetch";
2087}
2088def prfop : Operand<i32> {
2089 let PrintMethod = "printPrefetchOp";
2090 let ParserMatchClass = PrefetchOperand;
2091}
2092
2093let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
2094class PrefetchUI<bits<2> sz, bit V, bits<2> opc, string asm, list<dag> pat>
2095 : BaseLoadStoreUI<sz, V, opc,
2096 (outs), (ins prfop:$Rt, am_indexed64:$addr), asm, pat>,
2097 Sched<[WriteLD]>;
2098
2099//---
2100// Load literal
2101//---
2102
2103let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
2104class LoadLiteral<bits<2> opc, bit V, RegisterClass regtype, string asm>
2105 : I<(outs regtype:$Rt), (ins am_brcond:$label),
2106 asm, "\t$Rt, $label", "", []>,
2107 Sched<[WriteLD]> {
2108 bits<5> Rt;
2109 bits<19> label;
2110 let Inst{31-30} = opc;
2111 let Inst{29-27} = 0b011;
2112 let Inst{26} = V;
2113 let Inst{25-24} = 0b00;
2114 let Inst{23-5} = label;
2115 let Inst{4-0} = Rt;
2116}
2117
2118let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
2119class PrefetchLiteral<bits<2> opc, bit V, string asm, list<dag> pat>
2120 : I<(outs), (ins prfop:$Rt, am_brcond:$label),
2121 asm, "\t$Rt, $label", "", pat>,
2122 Sched<[WriteLD]> {
2123 bits<5> Rt;
2124 bits<19> label;
2125 let Inst{31-30} = opc;
2126 let Inst{29-27} = 0b011;
2127 let Inst{26} = V;
2128 let Inst{25-24} = 0b00;
2129 let Inst{23-5} = label;
2130 let Inst{4-0} = Rt;
2131}
2132
2133//---
2134// Load/store register offset
2135//---
2136
2137class MemROAsmOperand<int sz> : AsmOperandClass {
2138 let Name = "MemoryRegisterOffset"#sz;
2139}
2140
2141def MemROAsmOperand8 : MemROAsmOperand<8>;
2142def MemROAsmOperand16 : MemROAsmOperand<16>;
2143def MemROAsmOperand32 : MemROAsmOperand<32>;
2144def MemROAsmOperand64 : MemROAsmOperand<64>;
2145def MemROAsmOperand128 : MemROAsmOperand<128>;
2146
2147class ro_indexed<int sz> : Operand<i64> { // ComplexPattern<...>
2148 let PrintMethod = "printMemoryRegOffset"#sz;
2149 let MIOperandInfo = (ops GPR64sp:$base, GPR64:$offset, i32imm:$extend);
2150}
2151
2152def ro_indexed8 : ro_indexed<8>, ComplexPattern<i64, 3, "SelectAddrModeRO8", []> {
2153 let ParserMatchClass = MemROAsmOperand8;
2154}
2155
2156def ro_indexed16 : ro_indexed<16>, ComplexPattern<i64, 3, "SelectAddrModeRO16", []> {
2157 let ParserMatchClass = MemROAsmOperand16;
2158}
2159
2160def ro_indexed32 : ro_indexed<32>, ComplexPattern<i64, 3, "SelectAddrModeRO32", []> {
2161 let ParserMatchClass = MemROAsmOperand32;
2162}
2163
2164def ro_indexed64 : ro_indexed<64>, ComplexPattern<i64, 3, "SelectAddrModeRO64", []> {
2165 let ParserMatchClass = MemROAsmOperand64;
2166}
2167
2168def ro_indexed128 : ro_indexed<128>, ComplexPattern<i64, 3, "SelectAddrModeRO128", []> {
2169 let ParserMatchClass = MemROAsmOperand128;
2170}
2171
2172class LoadStore8RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2173 string asm, dag ins, dag outs, list<dag> pat>
2174 : I<ins, outs, asm, "\t$Rt, $addr", "", pat> {
2175 // The operands are in order to match the 'addr' MI operands, so we
2176 // don't need an encoder method and by-name matching. Just use the default
2177 // in-order handling. Since we're using by-order, make sure the names
2178 // do not match.
2179 bits<5> dst;
2180 bits<5> base;
2181 bits<5> offset;
2182 bits<4> extend;
2183 let Inst{31-30} = sz;
2184 let Inst{29-27} = 0b111;
2185 let Inst{26} = V;
2186 let Inst{25-24} = 0b00;
2187 let Inst{23-22} = opc;
2188 let Inst{21} = 1;
2189 let Inst{20-16} = offset;
2190 let Inst{15-13} = extend{3-1};
2191
2192 let Inst{12} = extend{0};
2193 let Inst{11-10} = 0b10;
2194 let Inst{9-5} = base;
2195 let Inst{4-0} = dst;
2196
2197 let DecoderMethod = "DecodeRegOffsetLdStInstruction";
2198}
2199
2200class Load8RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2201 string asm, list<dag> pat>
2202 : LoadStore8RO<sz, V, opc, regtype, asm,
2203 (outs regtype:$Rt), (ins ro_indexed8:$addr), pat>,
2204 Sched<[WriteLDIdx, ReadAdrBase]>;
2205
2206class Store8RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2207 string asm, list<dag> pat>
2208 : LoadStore8RO<sz, V, opc, regtype, asm,
2209 (outs), (ins regtype:$Rt, ro_indexed8:$addr), pat>,
2210 Sched<[WriteSTIdx, ReadAdrBase]>;
2211
2212class LoadStore16RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2213 string asm, dag ins, dag outs, list<dag> pat>
2214 : I<ins, outs, asm, "\t$Rt, $addr", "", pat> {
2215 // The operands are in order to match the 'addr' MI operands, so we
2216 // don't need an encoder method and by-name matching. Just use the default
2217 // in-order handling. Since we're using by-order, make sure the names
2218 // do not match.
2219 bits<5> dst;
2220 bits<5> base;
2221 bits<5> offset;
2222 bits<4> extend;
2223 let Inst{31-30} = sz;
2224 let Inst{29-27} = 0b111;
2225 let Inst{26} = V;
2226 let Inst{25-24} = 0b00;
2227 let Inst{23-22} = opc;
2228 let Inst{21} = 1;
2229 let Inst{20-16} = offset;
2230 let Inst{15-13} = extend{3-1};
2231
2232 let Inst{12} = extend{0};
2233 let Inst{11-10} = 0b10;
2234 let Inst{9-5} = base;
2235 let Inst{4-0} = dst;
2236
2237 let DecoderMethod = "DecodeRegOffsetLdStInstruction";
2238}
2239
2240class Load16RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2241 string asm, list<dag> pat>
2242 : LoadStore16RO<sz, V, opc, regtype, asm,
2243 (outs regtype:$Rt), (ins ro_indexed16:$addr), pat>,
2244 Sched<[WriteLDIdx, ReadAdrBase]>;
2245
2246class Store16RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2247 string asm, list<dag> pat>
2248 : LoadStore16RO<sz, V, opc, regtype, asm,
2249 (outs), (ins regtype:$Rt, ro_indexed16:$addr), pat>,
2250 Sched<[WriteSTIdx, ReadAdrBase]>;
2251
2252class LoadStore32RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2253 string asm, dag ins, dag outs, list<dag> pat>
2254 : I<ins, outs, asm, "\t$Rt, $addr", "", pat> {
2255 // The operands are in order to match the 'addr' MI operands, so we
2256 // don't need an encoder method and by-name matching. Just use the default
2257 // in-order handling. Since we're using by-order, make sure the names
2258 // do not match.
2259 bits<5> dst;
2260 bits<5> base;
2261 bits<5> offset;
2262 bits<4> extend;
2263 let Inst{31-30} = sz;
2264 let Inst{29-27} = 0b111;
2265 let Inst{26} = V;
2266 let Inst{25-24} = 0b00;
2267 let Inst{23-22} = opc;
2268 let Inst{21} = 1;
2269 let Inst{20-16} = offset;
2270 let Inst{15-13} = extend{3-1};
2271
2272 let Inst{12} = extend{0};
2273 let Inst{11-10} = 0b10;
2274 let Inst{9-5} = base;
2275 let Inst{4-0} = dst;
2276
2277 let DecoderMethod = "DecodeRegOffsetLdStInstruction";
2278}
2279
2280class Load32RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2281 string asm, list<dag> pat>
2282 : LoadStore32RO<sz, V, opc, regtype, asm,
2283 (outs regtype:$Rt), (ins ro_indexed32:$addr), pat>,
2284 Sched<[WriteLDIdx, ReadAdrBase]>;
2285
2286class Store32RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2287 string asm, list<dag> pat>
2288 : LoadStore32RO<sz, V, opc, regtype, asm,
2289 (outs), (ins regtype:$Rt, ro_indexed32:$addr), pat>,
2290 Sched<[WriteSTIdx, ReadAdrBase]>;
2291
2292class LoadStore64RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2293 string asm, dag ins, dag outs, list<dag> pat>
2294 : I<ins, outs, asm, "\t$Rt, $addr", "", pat> {
2295 // The operands are in order to match the 'addr' MI operands, so we
2296 // don't need an encoder method and by-name matching. Just use the default
2297 // in-order handling. Since we're using by-order, make sure the names
2298 // do not match.
2299 bits<5> dst;
2300 bits<5> base;
2301 bits<5> offset;
2302 bits<4> extend;
2303 let Inst{31-30} = sz;
2304 let Inst{29-27} = 0b111;
2305 let Inst{26} = V;
2306 let Inst{25-24} = 0b00;
2307 let Inst{23-22} = opc;
2308 let Inst{21} = 1;
2309 let Inst{20-16} = offset;
2310 let Inst{15-13} = extend{3-1};
2311
2312 let Inst{12} = extend{0};
2313 let Inst{11-10} = 0b10;
2314 let Inst{9-5} = base;
2315 let Inst{4-0} = dst;
2316
2317 let DecoderMethod = "DecodeRegOffsetLdStInstruction";
2318}
2319
2320let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
2321class Load64RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2322 string asm, list<dag> pat>
2323 : LoadStore64RO<sz, V, opc, regtype, asm,
2324 (outs regtype:$Rt), (ins ro_indexed64:$addr), pat>,
2325 Sched<[WriteLDIdx, ReadAdrBase]>;
2326
2327let mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
2328class Store64RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2329 string asm, list<dag> pat>
2330 : LoadStore64RO<sz, V, opc, regtype, asm,
2331 (outs), (ins regtype:$Rt, ro_indexed64:$addr), pat>,
2332 Sched<[WriteSTIdx, ReadAdrBase]>;
2333
2334
2335class LoadStore128RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2336 string asm, dag ins, dag outs, list<dag> pat>
2337 : I<ins, outs, asm, "\t$Rt, $addr", "", pat> {
2338 // The operands are in order to match the 'addr' MI operands, so we
2339 // don't need an encoder method and by-name matching. Just use the default
2340 // in-order handling. Since we're using by-order, make sure the names
2341 // do not match.
2342 bits<5> dst;
2343 bits<5> base;
2344 bits<5> offset;
2345 bits<4> extend;
2346 let Inst{31-30} = sz;
2347 let Inst{29-27} = 0b111;
2348 let Inst{26} = V;
2349 let Inst{25-24} = 0b00;
2350 let Inst{23-22} = opc;
2351 let Inst{21} = 1;
2352 let Inst{20-16} = offset;
2353 let Inst{15-13} = extend{3-1};
2354
2355 let Inst{12} = extend{0};
2356 let Inst{11-10} = 0b10;
2357 let Inst{9-5} = base;
2358 let Inst{4-0} = dst;
2359
2360 let DecoderMethod = "DecodeRegOffsetLdStInstruction";
2361}
2362
2363let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
2364class Load128RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2365 string asm, list<dag> pat>
2366 : LoadStore128RO<sz, V, opc, regtype, asm,
2367 (outs regtype:$Rt), (ins ro_indexed128:$addr), pat>,
2368 Sched<[WriteLDIdx, ReadAdrBase]>;
2369
2370let mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
2371class Store128RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2372 string asm, list<dag> pat>
2373 : LoadStore128RO<sz, V, opc, regtype, asm,
2374 (outs), (ins regtype:$Rt, ro_indexed128:$addr), pat>,
2375 Sched<[WriteSTIdx, ReadAdrBase]>;
2376
2377let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
2378class PrefetchRO<bits<2> sz, bit V, bits<2> opc, string asm, list<dag> pat>
2379 : I<(outs), (ins prfop:$Rt, ro_indexed64:$addr), asm,
2380 "\t$Rt, $addr", "", pat>,
2381 Sched<[WriteLD]> {
2382 // The operands are in order to match the 'addr' MI operands, so we
2383 // don't need an encoder method and by-name matching. Just use the default
2384 // in-order handling. Since we're using by-order, make sure the names
2385 // do not match.
2386 bits<5> dst;
2387 bits<5> base;
2388 bits<5> offset;
2389 bits<4> extend;
2390 let Inst{31-30} = sz;
2391 let Inst{29-27} = 0b111;
2392 let Inst{26} = V;
2393 let Inst{25-24} = 0b00;
2394 let Inst{23-22} = opc;
2395 let Inst{21} = 1;
2396 let Inst{20-16} = offset;
2397 let Inst{15-13} = extend{3-1};
2398
2399 let Inst{12} = extend{0};
2400 let Inst{11-10} = 0b10;
2401 let Inst{9-5} = base;
2402 let Inst{4-0} = dst;
2403
2404 let DecoderMethod = "DecodeRegOffsetLdStInstruction";
2405}
2406
2407//---
2408// Load/store unscaled immediate
2409//---
2410
2411def MemoryUnscaledOperand : AsmOperandClass {
2412 let Name = "MemoryUnscaled";
2413 let DiagnosticType = "InvalidMemoryIndexedSImm9";
2414}
2415class am_unscaled_operand : Operand<i64> {
2416 let PrintMethod = "printAMUnscaled";
2417 let ParserMatchClass = MemoryUnscaledOperand;
2418 let MIOperandInfo = (ops GPR64sp:$base, i64imm:$offset);
2419}
2420def am_unscaled : am_unscaled_operand;
2421def am_unscaled8 : am_unscaled_operand,
2422 ComplexPattern<i64, 2, "SelectAddrModeUnscaled8", []>;
2423def am_unscaled16 : am_unscaled_operand,
2424 ComplexPattern<i64, 2, "SelectAddrModeUnscaled16", []>;
2425def am_unscaled32 : am_unscaled_operand,
2426 ComplexPattern<i64, 2, "SelectAddrModeUnscaled32", []>;
2427def am_unscaled64 : am_unscaled_operand,
2428 ComplexPattern<i64, 2, "SelectAddrModeUnscaled64", []>;
2429def am_unscaled128 : am_unscaled_operand,
2430 ComplexPattern<i64, 2, "SelectAddrModeUnscaled128", []>;
2431
2432class BaseLoadStoreUnscale<bits<2> sz, bit V, bits<2> opc, dag oops, dag iops,
2433 string asm, list<dag> pattern>
2434 : I<oops, iops, asm, "\t$Rt, $addr", "", pattern> {
2435 // The operands are in order to match the 'addr' MI operands, so we
2436 // don't need an encoder method and by-name matching. Just use the default
2437 // in-order handling. Since we're using by-order, make sure the names
2438 // do not match.
2439 bits<5> dst;
2440 bits<5> base;
2441 bits<9> offset;
2442 let Inst{31-30} = sz;
2443 let Inst{29-27} = 0b111;
2444 let Inst{26} = V;
2445 let Inst{25-24} = 0b00;
2446 let Inst{23-22} = opc;
2447 let Inst{21} = 0;
2448 let Inst{20-12} = offset;
2449 let Inst{11-10} = 0b00;
2450 let Inst{9-5} = base;
2451 let Inst{4-0} = dst;
2452
2453 let DecoderMethod = "DecodeSignedLdStInstruction";
2454}
2455
2456let AddedComplexity = 1 in // try this before LoadUI
2457class LoadUnscaled<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2458 Operand amtype, string asm, list<dag> pattern>
2459 : BaseLoadStoreUnscale<sz, V, opc, (outs regtype:$Rt),
2460 (ins amtype:$addr), asm, pattern>,
2461 Sched<[WriteLD]>;
2462
2463let AddedComplexity = 1 in // try this before StoreUI
2464class StoreUnscaled<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2465 Operand amtype, string asm, list<dag> pattern>
2466 : BaseLoadStoreUnscale<sz, V, opc, (outs),
2467 (ins regtype:$Rt, amtype:$addr), asm, pattern>,
2468 Sched<[WriteST]>;
2469
2470let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
2471class PrefetchUnscaled<bits<2> sz, bit V, bits<2> opc, string asm, list<dag> pat>
2472 : BaseLoadStoreUnscale<sz, V, opc, (outs),
2473 (ins prfop:$Rt, am_unscaled:$addr), asm, pat>,
2474 Sched<[WriteLD]>;
2475
2476//---
2477// Load/store unscaled immediate, unprivileged
2478//---
2479
2480class BaseLoadStoreUnprivileged<bits<2> sz, bit V, bits<2> opc,
2481 dag oops, dag iops, string asm>
2482 : I<oops, iops, asm, "\t$Rt, $addr", "", []> {
2483 // The operands are in order to match the 'addr' MI operands, so we
2484 // don't need an encoder method and by-name matching. Just use the default
2485 // in-order handling. Since we're using by-order, make sure the names
2486 // do not match.
2487 bits<5> dst;
2488 bits<5> base;
2489 bits<9> offset;
2490 let Inst{31-30} = sz;
2491 let Inst{29-27} = 0b111;
2492 let Inst{26} = V;
2493 let Inst{25-24} = 0b00;
2494 let Inst{23-22} = opc;
2495 let Inst{21} = 0;
2496 let Inst{20-12} = offset;
2497 let Inst{11-10} = 0b10;
2498 let Inst{9-5} = base;
2499 let Inst{4-0} = dst;
2500
2501 let DecoderMethod = "DecodeSignedLdStInstruction";
2502}
2503
2504let mayStore = 0, mayLoad = 1, hasSideEffects = 0 in {
2505class LoadUnprivileged<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2506 string asm>
2507 : BaseLoadStoreUnprivileged<sz, V, opc,
2508 (outs regtype:$Rt), (ins am_unscaled:$addr), asm>,
2509 Sched<[WriteLD]>;
2510}
2511
2512let mayStore = 1, mayLoad = 0, hasSideEffects = 0 in {
2513class StoreUnprivileged<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2514 string asm>
2515 : BaseLoadStoreUnprivileged<sz, V, opc,
2516 (outs), (ins regtype:$Rt, am_unscaled:$addr), asm>,
2517 Sched<[WriteST]>;
2518}
2519
2520//---
2521// Load/store pre-indexed
2522//---
2523
2524class BaseLoadStorePreIdx<bits<2> sz, bit V, bits<2> opc, dag oops, dag iops,
2525 string asm, string cstr>
2526 : I<oops, iops, asm, "\t$Rt, $addr!", cstr, []> {
2527 // The operands are in order to match the 'addr' MI operands, so we
2528 // don't need an encoder method and by-name matching. Just use the default
2529 // in-order handling.
2530 bits<5> dst;
2531 bits<5> base;
2532 bits<9> offset;
2533 let Inst{31-30} = sz;
2534 let Inst{29-27} = 0b111;
2535 let Inst{26} = V;
2536 let Inst{25-24} = 0;
2537 let Inst{23-22} = opc;
2538 let Inst{21} = 0;
2539 let Inst{20-12} = offset;
2540 let Inst{11-10} = 0b11;
2541 let Inst{9-5} = base;
2542 let Inst{4-0} = dst;
2543
2544 let DecoderMethod = "DecodeSignedLdStInstruction";
2545}
2546
2547let hasSideEffects = 0 in {
2548let mayStore = 0, mayLoad = 1 in
2549// FIXME: Modeling the write-back of these instructions for isel is tricky.
2550// we need the complex addressing mode for the memory reference, but
2551// we also need the write-back specified as a tied operand to the
2552// base register. That combination does not play nicely with
2553// the asm matcher and friends.
2554class LoadPreIdx<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2555 string asm>
2556 : BaseLoadStorePreIdx<sz, V, opc,
2557 (outs regtype:$Rt/*, GPR64sp:$wback*/),
2558 (ins am_unscaled:$addr), asm, ""/*"$addr.base = $wback"*/>,
2559 Sched<[WriteLD, WriteAdr]>;
2560
2561let mayStore = 1, mayLoad = 0 in
2562class StorePreIdx<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2563 string asm>
2564 : BaseLoadStorePreIdx<sz, V, opc,
2565 (outs/* GPR64sp:$wback*/),
2566 (ins regtype:$Rt, am_unscaled:$addr),
2567 asm, ""/*"$addr.base = $wback"*/>,
2568 Sched<[WriteAdr, WriteST]>;
2569} // hasSideEffects = 0
2570
2571// ISel pseudo-instructions which have the tied operands. When the MC lowering
2572// logic finally gets smart enough to strip off tied operands that are just
2573// for isel convenience, we can get rid of these pseudos and just reference
2574// the real instructions directly.
2575//
2576// Ironically, also because of the writeback operands, we can't put the
2577// matcher pattern directly on the instruction, but need to define it
2578// separately.
2579//
2580// Loads aren't matched with patterns here at all, but rather in C++
2581// custom lowering.
2582let mayStore = 0, mayLoad = 1, hasSideEffects = 0 in {
2583class LoadPreIdxPseudo<RegisterClass regtype>
2584 : Pseudo<(outs regtype:$Rt, GPR64sp:$wback),
2585 (ins am_noindex:$addr, simm9:$offset), [],
2586 "$addr.base = $wback,@earlyclobber $wback">,
2587 Sched<[WriteLD, WriteAdr]>;
2588class LoadPostIdxPseudo<RegisterClass regtype>
2589 : Pseudo<(outs regtype:$Rt, GPR64sp:$wback),
2590 (ins am_noindex:$addr, simm9:$offset), [],
2591 "$addr.base = $wback,@earlyclobber $wback">,
2592 Sched<[WriteLD, WriteI]>;
2593}
2594multiclass StorePreIdxPseudo<RegisterClass regtype, ValueType Ty,
2595 SDPatternOperator OpNode> {
2596 let mayStore = 1, mayLoad = 0, hasSideEffects = 0 in
2597 def _isel: Pseudo<(outs GPR64sp:$wback),
2598 (ins regtype:$Rt, am_noindex:$addr, simm9:$offset), [],
2599 "$addr.base = $wback,@earlyclobber $wback">,
2600 Sched<[WriteAdr, WriteST]>;
2601
2602 def : Pat<(OpNode (Ty regtype:$Rt), am_noindex:$addr, simm9:$offset),
2603 (!cast<Instruction>(NAME#_isel) regtype:$Rt, am_noindex:$addr,
2604 simm9:$offset)>;
2605}
2606
2607//---
2608// Load/store post-indexed
2609//---
2610
2611// (pre-index) load/stores.
2612class BaseLoadStorePostIdx<bits<2> sz, bit V, bits<2> opc, dag oops, dag iops,
2613 string asm, string cstr>
2614 : I<oops, iops, asm, "\t$Rt, $addr, $idx", cstr, []> {
2615 // The operands are in order to match the 'addr' MI operands, so we
2616 // don't need an encoder method and by-name matching. Just use the default
2617 // in-order handling.
2618 bits<5> dst;
2619 bits<5> base;
2620 bits<9> offset;
2621 let Inst{31-30} = sz;
2622 let Inst{29-27} = 0b111;
2623 let Inst{26} = V;
2624 let Inst{25-24} = 0b00;
2625 let Inst{23-22} = opc;
2626 let Inst{21} = 0b0;
2627 let Inst{20-12} = offset;
2628 let Inst{11-10} = 0b01;
2629 let Inst{9-5} = base;
2630 let Inst{4-0} = dst;
2631
2632 let DecoderMethod = "DecodeSignedLdStInstruction";
2633}
2634
2635let hasSideEffects = 0 in {
2636let mayStore = 0, mayLoad = 1 in
2637// FIXME: Modeling the write-back of these instructions for isel is tricky.
2638// we need the complex addressing mode for the memory reference, but
2639// we also need the write-back specified as a tied operand to the
2640// base register. That combination does not play nicely with
2641// the asm matcher and friends.
2642class LoadPostIdx<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2643 string asm>
2644 : BaseLoadStorePostIdx<sz, V, opc,
2645 (outs regtype:$Rt/*, GPR64sp:$wback*/),
2646 (ins am_noindex:$addr, simm9:$idx),
2647 asm, ""/*"$addr.base = $wback"*/>,
2648 Sched<[WriteLD, WriteI]>;
2649
2650let mayStore = 1, mayLoad = 0 in
2651class StorePostIdx<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2652 string asm>
2653 : BaseLoadStorePostIdx<sz, V, opc,
2654 (outs/* GPR64sp:$wback*/),
2655 (ins regtype:$Rt, am_noindex:$addr, simm9:$idx),
2656 asm, ""/*"$addr.base = $wback"*/>,
2657 Sched<[WriteAdr, WriteST, ReadAdrBase]>;
2658} // hasSideEffects = 0
2659
2660// ISel pseudo-instructions which have the tied operands. When the MC lowering
2661// logic finally gets smart enough to strip off tied operands that are just
2662// for isel convenience, we can get rid of these pseudos and just reference
2663// the real instructions directly.
2664//
2665// Ironically, also because of the writeback operands, we can't put the
2666// matcher pattern directly on the instruction, but need to define it
2667// separately.
2668multiclass StorePostIdxPseudo<RegisterClass regtype, ValueType Ty,
2669 SDPatternOperator OpNode, Instruction Insn> {
2670 let mayStore = 1, mayLoad = 0, hasSideEffects = 0 in
2671 def _isel: Pseudo<(outs GPR64sp:$wback),
2672 (ins regtype:$Rt, am_noindex:$addr, simm9:$idx), [],
2673 "$addr.base = $wback,@earlyclobber $wback">,
2674 PseudoInstExpansion<(Insn regtype:$Rt, am_noindex:$addr, simm9:$idx)>,
2675 Sched<[WriteAdr, WriteST, ReadAdrBase]>;
2676
2677 def : Pat<(OpNode (Ty regtype:$Rt), am_noindex:$addr, simm9:$idx),
2678 (!cast<Instruction>(NAME#_isel) regtype:$Rt, am_noindex:$addr,
2679 simm9:$idx)>;
2680}
2681
2682//---
2683// Load/store pair
2684//---
2685
2686// (indexed, offset)
2687
2688class BaseLoadStorePairOffset<bits<2> opc, bit V, bit L, dag oops, dag iops,
2689 string asm>
2690 : I<oops, iops, asm, "\t$Rt, $Rt2, $addr", "", []> {
2691 // The operands are in order to match the 'addr' MI operands, so we
2692 // don't need an encoder method and by-name matching. Just use the default
2693 // in-order handling. Since we're using by-order, make sure the names
2694 // do not match.
2695 bits<5> dst;
2696 bits<5> dst2;
2697 bits<5> base;
2698 bits<7> offset;
2699 let Inst{31-30} = opc;
2700 let Inst{29-27} = 0b101;
2701 let Inst{26} = V;
2702 let Inst{25-23} = 0b010;
2703 let Inst{22} = L;
2704 let Inst{21-15} = offset;
2705 let Inst{14-10} = dst2;
2706 let Inst{9-5} = base;
2707 let Inst{4-0} = dst;
2708
2709 let DecoderMethod = "DecodePairLdStInstruction";
2710}
2711
2712let hasSideEffects = 0 in {
2713let mayStore = 0, mayLoad = 1 in
2714class LoadPairOffset<bits<2> opc, bit V, RegisterClass regtype,
2715 Operand indextype, string asm>
2716 : BaseLoadStorePairOffset<opc, V, 1,
2717 (outs regtype:$Rt, regtype:$Rt2),
2718 (ins indextype:$addr), asm>,
2719 Sched<[WriteLD, WriteLDHi]>;
2720
2721let mayLoad = 0, mayStore = 1 in
2722class StorePairOffset<bits<2> opc, bit V, RegisterClass regtype,
2723 Operand indextype, string asm>
2724 : BaseLoadStorePairOffset<opc, V, 0, (outs),
2725 (ins regtype:$Rt, regtype:$Rt2, indextype:$addr),
2726 asm>,
2727 Sched<[WriteSTP]>;
2728} // hasSideEffects = 0
2729
2730// (pre-indexed)
2731
2732def MemoryIndexed32SImm7 : AsmOperandClass {
2733 let Name = "MemoryIndexed32SImm7";
2734 let DiagnosticType = "InvalidMemoryIndexed32SImm7";
2735}
2736def am_indexed32simm7 : Operand<i32> { // ComplexPattern<...>
2737 let PrintMethod = "printAMIndexed32";
2738 let ParserMatchClass = MemoryIndexed32SImm7;
2739 let MIOperandInfo = (ops GPR64sp:$base, i32imm:$offset);
2740}
2741
2742def MemoryIndexed64SImm7 : AsmOperandClass {
2743 let Name = "MemoryIndexed64SImm7";
2744 let DiagnosticType = "InvalidMemoryIndexed64SImm7";
2745}
2746def am_indexed64simm7 : Operand<i32> { // ComplexPattern<...>
2747 let PrintMethod = "printAMIndexed64";
2748 let ParserMatchClass = MemoryIndexed64SImm7;
2749 let MIOperandInfo = (ops GPR64sp:$base, i32imm:$offset);
2750}
2751
2752def MemoryIndexed128SImm7 : AsmOperandClass {
2753 let Name = "MemoryIndexed128SImm7";
2754 let DiagnosticType = "InvalidMemoryIndexed128SImm7";
2755}
2756def am_indexed128simm7 : Operand<i32> { // ComplexPattern<...>
2757 let PrintMethod = "printAMIndexed128";
2758 let ParserMatchClass = MemoryIndexed128SImm7;
2759 let MIOperandInfo = (ops GPR64sp:$base, i32imm:$offset);
2760}
2761
2762class BaseLoadStorePairPreIdx<bits<2> opc, bit V, bit L, dag oops, dag iops,
2763 string asm>
2764 : I<oops, iops, asm, "\t$Rt, $Rt2, $addr!", "", []> {
2765 // The operands are in order to match the 'addr' MI operands, so we
2766 // don't need an encoder method and by-name matching. Just use the default
2767 // in-order handling. Since we're using by-order, make sure the names
2768 // do not match.
2769 bits<5> dst;
2770 bits<5> dst2;
2771 bits<5> base;
2772 bits<7> offset;
2773 let Inst{31-30} = opc;
2774 let Inst{29-27} = 0b101;
2775 let Inst{26} = V;
2776 let Inst{25-23} = 0b011;
2777 let Inst{22} = L;
2778 let Inst{21-15} = offset;
2779 let Inst{14-10} = dst2;
2780 let Inst{9-5} = base;
2781 let Inst{4-0} = dst;
2782
2783 let DecoderMethod = "DecodePairLdStInstruction";
2784}
2785
2786let hasSideEffects = 0 in {
2787let mayStore = 0, mayLoad = 1 in
2788class LoadPairPreIdx<bits<2> opc, bit V, RegisterClass regtype,
2789 Operand addrmode, string asm>
2790 : BaseLoadStorePairPreIdx<opc, V, 1,
2791 (outs regtype:$Rt, regtype:$Rt2),
2792 (ins addrmode:$addr), asm>,
2793 Sched<[WriteLD, WriteLDHi, WriteAdr]>;
2794
2795let mayStore = 1, mayLoad = 0 in
2796class StorePairPreIdx<bits<2> opc, bit V, RegisterClass regtype,
2797 Operand addrmode, string asm>
2798 : BaseLoadStorePairPreIdx<opc, V, 0, (outs),
2799 (ins regtype:$Rt, regtype:$Rt2, addrmode:$addr),
2800 asm>,
2801 Sched<[WriteAdr, WriteSTP]>;
2802} // hasSideEffects = 0
2803
2804// (post-indexed)
2805
2806class BaseLoadStorePairPostIdx<bits<2> opc, bit V, bit L, dag oops, dag iops,
2807 string asm>
2808 : I<oops, iops, asm, "\t$Rt, $Rt2, $addr, $idx", "", []> {
2809 // The operands are in order to match the 'addr' MI operands, so we
2810 // don't need an encoder method and by-name matching. Just use the default
2811 // in-order handling. Since we're using by-order, make sure the names
2812 // do not match.
2813 bits<5> dst;
2814 bits<5> dst2;
2815 bits<5> base;
2816 bits<7> offset;
2817 let Inst{31-30} = opc;
2818 let Inst{29-27} = 0b101;
2819 let Inst{26} = V;
2820 let Inst{25-23} = 0b001;
2821 let Inst{22} = L;
2822 let Inst{21-15} = offset;
2823 let Inst{14-10} = dst2;
2824 let Inst{9-5} = base;
2825 let Inst{4-0} = dst;
2826
2827 let DecoderMethod = "DecodePairLdStInstruction";
2828}
2829
2830let hasSideEffects = 0 in {
2831let mayStore = 0, mayLoad = 1 in
2832class LoadPairPostIdx<bits<2> opc, bit V, RegisterClass regtype,
2833 Operand idxtype, string asm>
2834 : BaseLoadStorePairPostIdx<opc, V, 1,
2835 (outs regtype:$Rt, regtype:$Rt2),
2836 (ins am_noindex:$addr, idxtype:$idx), asm>,
2837 Sched<[WriteLD, WriteLDHi, WriteAdr]>;
2838
2839let mayStore = 1, mayLoad = 0 in
2840class StorePairPostIdx<bits<2> opc, bit V, RegisterClass regtype,
2841 Operand idxtype, string asm>
2842 : BaseLoadStorePairPostIdx<opc, V, 0, (outs),
2843 (ins regtype:$Rt, regtype:$Rt2,
2844 am_noindex:$addr, idxtype:$idx),
2845 asm>,
2846 Sched<[WriteAdr, WriteSTP]>;
2847} // hasSideEffects = 0
2848
2849// (no-allocate)
2850
2851class BaseLoadStorePairNoAlloc<bits<2> opc, bit V, bit L, dag oops, dag iops,
2852 string asm>
2853 : I<oops, iops, asm, "\t$Rt, $Rt2, $addr", "", []> {
2854 // The operands are in order to match the 'addr' MI operands, so we
2855 // don't need an encoder method and by-name matching. Just use the default
2856 // in-order handling. Since we're using by-order, make sure the names
2857 // do not match.
2858 bits<5> dst;
2859 bits<5> dst2;
2860 bits<5> base;
2861 bits<7> offset;
2862 let Inst{31-30} = opc;
2863 let Inst{29-27} = 0b101;
2864 let Inst{26} = V;
2865 let Inst{25-23} = 0b000;
2866 let Inst{22} = L;
2867 let Inst{21-15} = offset;
2868 let Inst{14-10} = dst2;
2869 let Inst{9-5} = base;
2870 let Inst{4-0} = dst;
2871
2872 let DecoderMethod = "DecodePairLdStInstruction";
2873}
2874
2875let hasSideEffects = 0 in {
2876let mayStore = 0, mayLoad = 1 in
2877class LoadPairNoAlloc<bits<2> opc, bit V, RegisterClass regtype,
2878 Operand indextype, string asm>
2879 : BaseLoadStorePairNoAlloc<opc, V, 1,
2880 (outs regtype:$Rt, regtype:$Rt2),
2881 (ins indextype:$addr), asm>,
2882 Sched<[WriteLD, WriteLDHi]>;
2883
2884let mayStore = 1, mayLoad = 0 in
2885class StorePairNoAlloc<bits<2> opc, bit V, RegisterClass regtype,
2886 Operand indextype, string asm>
2887 : BaseLoadStorePairNoAlloc<opc, V, 0, (outs),
2888 (ins regtype:$Rt, regtype:$Rt2, indextype:$addr),
2889 asm>,
2890 Sched<[WriteSTP]>;
2891} // hasSideEffects = 0
2892
2893//---
2894// Load/store exclusive
2895//---
2896
2897// True exclusive operations write to and/or read from the system's exclusive
2898// monitors, which as far as a compiler is concerned can be modelled as a
2899// random shared memory address. Hence LoadExclusive mayStore.
Bradley Smithbc35b1f2014-04-09 14:43:01 +00002900//
2901// Since these instructions have the undefined register bits set to 1 in
2902// their canonical form, we need a post encoder method to set those bits
2903// to 1 when encoding these instructions. We do this using the
2904// fixLoadStoreExclusive function. This function has template parameters:
2905//
2906// fixLoadStoreExclusive<int hasRs, int hasRt2>
2907//
2908// hasRs indicates that the instruction uses the Rs field, so we won't set
2909// it to 1 (and the same for Rt2). We don't need template parameters for
2910// the other register fields since Rt and Rn are always used.
2911//
Tim Northover00ed9962014-03-29 10:18:08 +00002912let hasSideEffects = 1, mayLoad = 1, mayStore = 1 in
2913class BaseLoadStoreExclusive<bits<2> sz, bit o2, bit L, bit o1, bit o0,
2914 dag oops, dag iops, string asm, string operands>
2915 : I<oops, iops, asm, operands, "", []> {
2916 let Inst{31-30} = sz;
2917 let Inst{29-24} = 0b001000;
2918 let Inst{23} = o2;
2919 let Inst{22} = L;
2920 let Inst{21} = o1;
2921 let Inst{15} = o0;
2922
2923 let DecoderMethod = "DecodeExclusiveLdStInstruction";
2924}
2925
2926// Neither Rs nor Rt2 operands.
2927class LoadStoreExclusiveSimple<bits<2> sz, bit o2, bit L, bit o1, bit o0,
2928 dag oops, dag iops, string asm, string operands>
2929 : BaseLoadStoreExclusive<sz, o2, L, o1, o0, oops, iops, asm, operands> {
2930 bits<5> reg;
2931 bits<5> base;
Tim Northover00ed9962014-03-29 10:18:08 +00002932 let Inst{9-5} = base;
2933 let Inst{4-0} = reg;
Bradley Smithbc35b1f2014-04-09 14:43:01 +00002934
2935 let PostEncoderMethod = "fixLoadStoreExclusive<0,0>";
Tim Northover00ed9962014-03-29 10:18:08 +00002936}
2937
2938// Simple load acquires don't set the exclusive monitor
2939let mayLoad = 1, mayStore = 0 in
2940class LoadAcquire<bits<2> sz, bit o2, bit L, bit o1, bit o0,
2941 RegisterClass regtype, string asm>
2942 : LoadStoreExclusiveSimple<sz, o2, L, o1, o0, (outs regtype:$Rt),
2943 (ins am_noindex:$addr), asm, "\t$Rt, $addr">,
2944 Sched<[WriteLD]>;
2945
2946class LoadExclusive<bits<2> sz, bit o2, bit L, bit o1, bit o0,
2947 RegisterClass regtype, string asm>
2948 : LoadStoreExclusiveSimple<sz, o2, L, o1, o0, (outs regtype:$Rt),
2949 (ins am_noindex:$addr), asm, "\t$Rt, $addr">,
2950 Sched<[WriteLD]>;
2951
2952class LoadExclusivePair<bits<2> sz, bit o2, bit L, bit o1, bit o0,
2953 RegisterClass regtype, string asm>
2954 : BaseLoadStoreExclusive<sz, o2, L, o1, o0,
2955 (outs regtype:$Rt, regtype:$Rt2),
2956 (ins am_noindex:$addr), asm,
2957 "\t$Rt, $Rt2, $addr">,
2958 Sched<[WriteLD, WriteLDHi]> {
2959 bits<5> dst1;
2960 bits<5> dst2;
2961 bits<5> base;
Tim Northover00ed9962014-03-29 10:18:08 +00002962 let Inst{14-10} = dst2;
2963 let Inst{9-5} = base;
2964 let Inst{4-0} = dst1;
Bradley Smithbc35b1f2014-04-09 14:43:01 +00002965
2966 let PostEncoderMethod = "fixLoadStoreExclusive<0,1>";
Tim Northover00ed9962014-03-29 10:18:08 +00002967}
2968
2969// Simple store release operations do not check the exclusive monitor.
2970let mayLoad = 0, mayStore = 1 in
2971class StoreRelease<bits<2> sz, bit o2, bit L, bit o1, bit o0,
2972 RegisterClass regtype, string asm>
2973 : LoadStoreExclusiveSimple<sz, o2, L, o1, o0, (outs),
2974 (ins regtype:$Rt, am_noindex:$addr),
2975 asm, "\t$Rt, $addr">,
2976 Sched<[WriteST]>;
2977
2978let mayLoad = 1, mayStore = 1 in
2979class StoreExclusive<bits<2> sz, bit o2, bit L, bit o1, bit o0,
2980 RegisterClass regtype, string asm>
2981 : BaseLoadStoreExclusive<sz, o2, L, o1, o0, (outs GPR32:$Ws),
2982 (ins regtype:$Rt, am_noindex:$addr),
2983 asm, "\t$Ws, $Rt, $addr">,
2984 Sched<[WriteSTX]> {
2985 bits<5> status;
2986 bits<5> reg;
2987 bits<5> base;
2988 let Inst{20-16} = status;
Tim Northover00ed9962014-03-29 10:18:08 +00002989 let Inst{9-5} = base;
2990 let Inst{4-0} = reg;
2991
2992 let Constraints = "@earlyclobber $Ws";
Bradley Smithbc35b1f2014-04-09 14:43:01 +00002993 let PostEncoderMethod = "fixLoadStoreExclusive<1,0>";
Tim Northover00ed9962014-03-29 10:18:08 +00002994}
2995
2996class StoreExclusivePair<bits<2> sz, bit o2, bit L, bit o1, bit o0,
2997 RegisterClass regtype, string asm>
2998 : BaseLoadStoreExclusive<sz, o2, L, o1, o0,
2999 (outs GPR32:$Ws),
3000 (ins regtype:$Rt, regtype:$Rt2, am_noindex:$addr),
3001 asm, "\t$Ws, $Rt, $Rt2, $addr">,
3002 Sched<[WriteSTX]> {
3003 bits<5> status;
3004 bits<5> dst1;
3005 bits<5> dst2;
3006 bits<5> base;
3007 let Inst{20-16} = status;
3008 let Inst{14-10} = dst2;
3009 let Inst{9-5} = base;
3010 let Inst{4-0} = dst1;
3011
3012 let Constraints = "@earlyclobber $Ws";
3013}
3014
3015//---
3016// Exception generation
3017//---
3018
3019let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
3020class ExceptionGeneration<bits<3> op1, bits<2> ll, string asm>
3021 : I<(outs), (ins imm0_65535:$imm), asm, "\t$imm", "", []>,
3022 Sched<[WriteSys]> {
3023 bits<16> imm;
3024 let Inst{31-24} = 0b11010100;
3025 let Inst{23-21} = op1;
3026 let Inst{20-5} = imm;
3027 let Inst{4-2} = 0b000;
3028 let Inst{1-0} = ll;
3029}
3030
3031//---
3032// Floating point to integer conversion
3033//---
3034
3035class BaseFPToIntegerUnscaled<bits<2> type, bits<2> rmode, bits<3> opcode,
3036 RegisterClass srcType, RegisterClass dstType,
3037 string asm, list<dag> pattern>
3038 : I<(outs dstType:$Rd), (ins srcType:$Rn),
3039 asm, "\t$Rd, $Rn", "", pattern>,
3040 Sched<[WriteFCvt]> {
3041 bits<5> Rd;
3042 bits<5> Rn;
3043 let Inst{30} = 0;
3044 let Inst{28-24} = 0b11110;
3045 let Inst{23-22} = type;
3046 let Inst{21} = 1;
3047 let Inst{20-19} = rmode;
3048 let Inst{18-16} = opcode;
3049 let Inst{15-10} = 0;
3050 let Inst{9-5} = Rn;
3051 let Inst{4-0} = Rd;
3052}
3053
3054let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3055class BaseFPToInteger<bits<2> type, bits<2> rmode, bits<3> opcode,
3056 RegisterClass srcType, RegisterClass dstType,
3057 Operand immType, string asm>
3058 : I<(outs dstType:$Rd), (ins srcType:$Rn, immType:$scale),
3059 asm, "\t$Rd, $Rn, $scale", "", []>,
3060 Sched<[WriteFCvt]> {
3061 bits<5> Rd;
3062 bits<5> Rn;
3063 bits<6> scale;
3064 let Inst{30} = 0;
3065 let Inst{28-24} = 0b11110;
3066 let Inst{23-22} = type;
3067 let Inst{21} = 0;
3068 let Inst{20-19} = rmode;
3069 let Inst{18-16} = opcode;
3070 let Inst{15-10} = scale;
3071 let Inst{9-5} = Rn;
3072 let Inst{4-0} = Rd;
3073}
3074
3075multiclass FPToInteger<bits<2> rmode, bits<3> opcode, string asm, SDPatternOperator OpN> {
3076 // Unscaled single-precision to 32-bit
3077 def UWSr : BaseFPToIntegerUnscaled<0b00, rmode, opcode, FPR32, GPR32, asm,
3078 [(set GPR32:$Rd, (OpN FPR32:$Rn))]> {
3079 let Inst{31} = 0; // 32-bit GPR flag
3080 }
3081
3082 // Unscaled single-precision to 64-bit
3083 def UXSr : BaseFPToIntegerUnscaled<0b00, rmode, opcode, FPR32, GPR64, asm,
3084 [(set GPR64:$Rd, (OpN FPR32:$Rn))]> {
3085 let Inst{31} = 1; // 64-bit GPR flag
3086 }
3087
3088 // Unscaled double-precision to 32-bit
3089 def UWDr : BaseFPToIntegerUnscaled<0b01, rmode, opcode, FPR64, GPR32, asm,
3090 [(set GPR32:$Rd, (OpN (f64 FPR64:$Rn)))]> {
3091 let Inst{31} = 0; // 32-bit GPR flag
3092 }
3093
3094 // Unscaled double-precision to 64-bit
3095 def UXDr : BaseFPToIntegerUnscaled<0b01, rmode, opcode, FPR64, GPR64, asm,
3096 [(set GPR64:$Rd, (OpN (f64 FPR64:$Rn)))]> {
3097 let Inst{31} = 1; // 64-bit GPR flag
3098 }
3099
3100 // Scaled single-precision to 32-bit
3101 def SWSri : BaseFPToInteger<0b00, rmode, opcode, FPR32, GPR32,
3102 fixedpoint32, asm> {
3103 let Inst{31} = 0; // 32-bit GPR flag
3104 }
3105
3106 // Scaled single-precision to 64-bit
3107 def SXSri : BaseFPToInteger<0b00, rmode, opcode, FPR32, GPR64,
3108 fixedpoint64, asm> {
3109 let Inst{31} = 1; // 64-bit GPR flag
3110 }
3111
3112 // Scaled double-precision to 32-bit
3113 def SWDri : BaseFPToInteger<0b01, rmode, opcode, FPR64, GPR32,
3114 fixedpoint32, asm> {
3115 let Inst{31} = 0; // 32-bit GPR flag
3116 }
3117
3118 // Scaled double-precision to 64-bit
3119 def SXDri : BaseFPToInteger<0b01, rmode, opcode, FPR64, GPR64,
3120 fixedpoint64, asm> {
3121 let Inst{31} = 1; // 64-bit GPR flag
3122 }
3123}
3124
3125//---
3126// Integer to floating point conversion
3127//---
3128
3129let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
3130class BaseIntegerToFP<bit isUnsigned,
3131 RegisterClass srcType, RegisterClass dstType,
3132 Operand immType, string asm>
3133 : I<(outs dstType:$Rd), (ins srcType:$Rn, immType:$scale),
3134 asm, "\t$Rd, $Rn, $scale", "", []>,
3135 Sched<[WriteFCvt]> {
3136 bits<5> Rd;
3137 bits<5> Rn;
3138 bits<6> scale;
3139 let Inst{30-23} = 0b00111100;
3140 let Inst{21-17} = 0b00001;
3141 let Inst{16} = isUnsigned;
3142 let Inst{15-10} = scale;
3143 let Inst{9-5} = Rn;
3144 let Inst{4-0} = Rd;
3145}
3146
3147class BaseIntegerToFPUnscaled<bit isUnsigned,
3148 RegisterClass srcType, RegisterClass dstType,
3149 ValueType dvt, string asm, SDNode node>
3150 : I<(outs dstType:$Rd), (ins srcType:$Rn),
3151 asm, "\t$Rd, $Rn", "", [(set (dvt dstType:$Rd), (node srcType:$Rn))]>,
3152 Sched<[WriteFCvt]> {
3153 bits<5> Rd;
3154 bits<5> Rn;
3155 bits<6> scale;
3156 let Inst{30-23} = 0b00111100;
3157 let Inst{21-17} = 0b10001;
3158 let Inst{16} = isUnsigned;
3159 let Inst{15-10} = 0b000000;
3160 let Inst{9-5} = Rn;
3161 let Inst{4-0} = Rd;
3162}
3163
3164multiclass IntegerToFP<bit isUnsigned, string asm, SDNode node> {
3165 // Unscaled
3166 def UWSri: BaseIntegerToFPUnscaled<isUnsigned, GPR32, FPR32, f32, asm, node> {
3167 let Inst{31} = 0; // 32-bit GPR flag
3168 let Inst{22} = 0; // 32-bit FPR flag
3169 }
3170
3171 def UWDri: BaseIntegerToFPUnscaled<isUnsigned, GPR32, FPR64, f64, asm, node> {
3172 let Inst{31} = 0; // 32-bit GPR flag
3173 let Inst{22} = 1; // 64-bit FPR flag
3174 }
3175
3176 def UXSri: BaseIntegerToFPUnscaled<isUnsigned, GPR64, FPR32, f32, asm, node> {
3177 let Inst{31} = 1; // 64-bit GPR flag
3178 let Inst{22} = 0; // 32-bit FPR flag
3179 }
3180
3181 def UXDri: BaseIntegerToFPUnscaled<isUnsigned, GPR64, FPR64, f64, asm, node> {
3182 let Inst{31} = 1; // 64-bit GPR flag
3183 let Inst{22} = 1; // 64-bit FPR flag
3184 }
3185
3186 // Scaled
3187 def SWSri: BaseIntegerToFP<isUnsigned, GPR32, FPR32, fixedpoint32, asm> {
3188 let Inst{31} = 0; // 32-bit GPR flag
3189 let Inst{22} = 0; // 32-bit FPR flag
3190 }
3191
3192 def SWDri: BaseIntegerToFP<isUnsigned, GPR32, FPR64, fixedpoint32, asm> {
3193 let Inst{31} = 0; // 32-bit GPR flag
3194 let Inst{22} = 1; // 64-bit FPR flag
3195 }
3196
3197 def SXSri: BaseIntegerToFP<isUnsigned, GPR64, FPR32, fixedpoint64, asm> {
3198 let Inst{31} = 1; // 64-bit GPR flag
3199 let Inst{22} = 0; // 32-bit FPR flag
3200 }
3201
3202 def SXDri: BaseIntegerToFP<isUnsigned, GPR64, FPR64, fixedpoint64, asm> {
3203 let Inst{31} = 1; // 64-bit GPR flag
3204 let Inst{22} = 1; // 64-bit FPR flag
3205 }
3206}
3207
3208//---
3209// Unscaled integer <-> floating point conversion (i.e. FMOV)
3210//---
3211
3212let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3213class BaseUnscaledConversion<bits<2> rmode, bits<3> opcode,
3214 RegisterClass srcType, RegisterClass dstType,
3215 string asm>
3216 : I<(outs dstType:$Rd), (ins srcType:$Rn), asm, "\t$Rd, $Rn", "",
3217 // We use COPY_TO_REGCLASS for these bitconvert operations.
3218 // copyPhysReg() expands the resultant COPY instructions after
3219 // regalloc is done. This gives greater freedom for the allocator
3220 // and related passes (coalescing, copy propagation, et. al.) to
3221 // be more effective.
3222 [/*(set (dvt dstType:$Rd), (bitconvert (svt srcType:$Rn)))*/]>,
3223 Sched<[WriteFCopy]> {
3224 bits<5> Rd;
3225 bits<5> Rn;
3226 let Inst{30-23} = 0b00111100;
3227 let Inst{21} = 1;
3228 let Inst{20-19} = rmode;
3229 let Inst{18-16} = opcode;
3230 let Inst{15-10} = 0b000000;
3231 let Inst{9-5} = Rn;
3232 let Inst{4-0} = Rd;
3233}
3234
3235let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3236class BaseUnscaledConversionToHigh<bits<2> rmode, bits<3> opcode,
3237 RegisterClass srcType, RegisterOperand dstType, string asm>
3238 : I<(outs dstType:$Rd), (ins srcType:$Rn), asm, "\t$Rd[1], $Rn", "", []>,
3239 Sched<[WriteFCopy]> {
3240 bits<5> Rd;
3241 bits<5> Rn;
3242 let Inst{30-23} = 0b00111101;
3243 let Inst{21} = 1;
3244 let Inst{20-19} = rmode;
3245 let Inst{18-16} = opcode;
3246 let Inst{15-10} = 0b000000;
3247 let Inst{9-5} = Rn;
3248 let Inst{4-0} = Rd;
3249}
3250
3251let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3252class BaseUnscaledConversionFromHigh<bits<2> rmode, bits<3> opcode,
3253 RegisterOperand srcType, RegisterClass dstType, string asm>
3254 : I<(outs dstType:$Rd), (ins srcType:$Rn), asm, "\t$Rd, $Rn[1]", "", []>,
3255 Sched<[WriteFCopy]> {
3256 bits<5> Rd;
3257 bits<5> Rn;
3258 let Inst{30-23} = 0b00111101;
3259 let Inst{21} = 1;
3260 let Inst{20-19} = rmode;
3261 let Inst{18-16} = opcode;
3262 let Inst{15-10} = 0b000000;
3263 let Inst{9-5} = Rn;
3264 let Inst{4-0} = Rd;
3265}
3266
3267
3268
3269multiclass UnscaledConversion<string asm> {
3270 def WSr : BaseUnscaledConversion<0b00, 0b111, GPR32, FPR32, asm> {
3271 let Inst{31} = 0; // 32-bit GPR flag
3272 let Inst{22} = 0; // 32-bit FPR flag
3273 }
3274
3275 def XDr : BaseUnscaledConversion<0b00, 0b111, GPR64, FPR64, asm> {
3276 let Inst{31} = 1; // 64-bit GPR flag
3277 let Inst{22} = 1; // 64-bit FPR flag
3278 }
3279
3280 def SWr : BaseUnscaledConversion<0b00, 0b110, FPR32, GPR32, asm> {
3281 let Inst{31} = 0; // 32-bit GPR flag
3282 let Inst{22} = 0; // 32-bit FPR flag
3283 }
3284
3285 def DXr : BaseUnscaledConversion<0b00, 0b110, FPR64, GPR64, asm> {
3286 let Inst{31} = 1; // 64-bit GPR flag
3287 let Inst{22} = 1; // 64-bit FPR flag
3288 }
3289
3290 def XDHighr : BaseUnscaledConversionToHigh<0b01, 0b111, GPR64, V128,
3291 asm#".d"> {
3292 let Inst{31} = 1;
3293 let Inst{22} = 0;
3294 }
3295
3296 def DXHighr : BaseUnscaledConversionFromHigh<0b01, 0b110, V128, GPR64,
3297 asm#".d"> {
3298 let Inst{31} = 1;
3299 let Inst{22} = 0;
3300 }
3301
3302 def : InstAlias<asm#"$Vd.d[1], $Rn",
3303 (!cast<Instruction>(NAME#XDHighr) V128:$Vd, GPR64:$Rn), 0>;
3304 def : InstAlias<asm#"$Rd, $Vn.d[1]",
3305 (!cast<Instruction>(NAME#DXHighr) GPR64:$Rd, V128:$Vn), 0>;
3306}
3307
3308//---
3309// Floating point conversion
3310//---
3311
3312class BaseFPConversion<bits<2> type, bits<2> opcode, RegisterClass dstType,
3313 RegisterClass srcType, string asm, list<dag> pattern>
3314 : I<(outs dstType:$Rd), (ins srcType:$Rn), asm, "\t$Rd, $Rn", "", pattern>,
3315 Sched<[WriteFCvt]> {
3316 bits<5> Rd;
3317 bits<5> Rn;
3318 let Inst{31-24} = 0b00011110;
3319 let Inst{23-22} = type;
3320 let Inst{21-17} = 0b10001;
3321 let Inst{16-15} = opcode;
3322 let Inst{14-10} = 0b10000;
3323 let Inst{9-5} = Rn;
3324 let Inst{4-0} = Rd;
3325}
3326
3327multiclass FPConversion<string asm> {
3328 // Double-precision to Half-precision
3329 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3330 def HDr : BaseFPConversion<0b01, 0b11, FPR16, FPR64, asm, []>;
3331
3332 // Double-precision to Single-precision
3333 def SDr : BaseFPConversion<0b01, 0b00, FPR32, FPR64, asm,
3334 [(set FPR32:$Rd, (fround FPR64:$Rn))]>;
3335
3336 // Half-precision to Double-precision
3337 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3338 def DHr : BaseFPConversion<0b11, 0b01, FPR64, FPR16, asm, []>;
3339
3340 // Half-precision to Single-precision
3341 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3342 def SHr : BaseFPConversion<0b11, 0b00, FPR32, FPR16, asm, []>;
3343
3344 // Single-precision to Double-precision
3345 def DSr : BaseFPConversion<0b00, 0b01, FPR64, FPR32, asm,
3346 [(set FPR64:$Rd, (fextend FPR32:$Rn))]>;
3347
3348 // Single-precision to Half-precision
3349 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3350 def HSr : BaseFPConversion<0b00, 0b11, FPR16, FPR32, asm, []>;
3351}
3352
3353//---
3354// Single operand floating point data processing
3355//---
3356
3357let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3358class BaseSingleOperandFPData<bits<4> opcode, RegisterClass regtype,
3359 ValueType vt, string asm, SDPatternOperator node>
3360 : I<(outs regtype:$Rd), (ins regtype:$Rn), asm, "\t$Rd, $Rn", "",
3361 [(set (vt regtype:$Rd), (node (vt regtype:$Rn)))]>,
3362 Sched<[WriteF]> {
3363 bits<5> Rd;
3364 bits<5> Rn;
3365 let Inst{31-23} = 0b000111100;
3366 let Inst{21-19} = 0b100;
3367 let Inst{18-15} = opcode;
3368 let Inst{14-10} = 0b10000;
3369 let Inst{9-5} = Rn;
3370 let Inst{4-0} = Rd;
3371}
3372
3373multiclass SingleOperandFPData<bits<4> opcode, string asm,
3374 SDPatternOperator node = null_frag> {
3375 def Sr : BaseSingleOperandFPData<opcode, FPR32, f32, asm, node> {
3376 let Inst{22} = 0; // 32-bit size flag
3377 }
3378
3379 def Dr : BaseSingleOperandFPData<opcode, FPR64, f64, asm, node> {
3380 let Inst{22} = 1; // 64-bit size flag
3381 }
3382}
3383
3384//---
3385// Two operand floating point data processing
3386//---
3387
3388let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3389class BaseTwoOperandFPData<bits<4> opcode, RegisterClass regtype,
3390 string asm, list<dag> pat>
3391 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm),
3392 asm, "\t$Rd, $Rn, $Rm", "", pat>,
3393 Sched<[WriteF]> {
3394 bits<5> Rd;
3395 bits<5> Rn;
3396 bits<5> Rm;
3397 let Inst{31-23} = 0b000111100;
3398 let Inst{21} = 1;
3399 let Inst{20-16} = Rm;
3400 let Inst{15-12} = opcode;
3401 let Inst{11-10} = 0b10;
3402 let Inst{9-5} = Rn;
3403 let Inst{4-0} = Rd;
3404}
3405
3406multiclass TwoOperandFPData<bits<4> opcode, string asm,
3407 SDPatternOperator node = null_frag> {
3408 def Srr : BaseTwoOperandFPData<opcode, FPR32, asm,
3409 [(set (f32 FPR32:$Rd),
3410 (node (f32 FPR32:$Rn), (f32 FPR32:$Rm)))]> {
3411 let Inst{22} = 0; // 32-bit size flag
3412 }
3413
3414 def Drr : BaseTwoOperandFPData<opcode, FPR64, asm,
3415 [(set (f64 FPR64:$Rd),
3416 (node (f64 FPR64:$Rn), (f64 FPR64:$Rm)))]> {
3417 let Inst{22} = 1; // 64-bit size flag
3418 }
3419}
3420
3421multiclass TwoOperandFPDataNeg<bits<4> opcode, string asm, SDNode node> {
3422 def Srr : BaseTwoOperandFPData<opcode, FPR32, asm,
3423 [(set FPR32:$Rd, (fneg (node FPR32:$Rn, (f32 FPR32:$Rm))))]> {
3424 let Inst{22} = 0; // 32-bit size flag
3425 }
3426
3427 def Drr : BaseTwoOperandFPData<opcode, FPR64, asm,
3428 [(set FPR64:$Rd, (fneg (node FPR64:$Rn, (f64 FPR64:$Rm))))]> {
3429 let Inst{22} = 1; // 64-bit size flag
3430 }
3431}
3432
3433
3434//---
3435// Three operand floating point data processing
3436//---
3437
3438class BaseThreeOperandFPData<bit isNegated, bit isSub,
3439 RegisterClass regtype, string asm, list<dag> pat>
3440 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, regtype: $Ra),
3441 asm, "\t$Rd, $Rn, $Rm, $Ra", "", pat>,
3442 Sched<[WriteFMul]> {
3443 bits<5> Rd;
3444 bits<5> Rn;
3445 bits<5> Rm;
3446 bits<5> Ra;
3447 let Inst{31-23} = 0b000111110;
3448 let Inst{21} = isNegated;
3449 let Inst{20-16} = Rm;
3450 let Inst{15} = isSub;
3451 let Inst{14-10} = Ra;
3452 let Inst{9-5} = Rn;
3453 let Inst{4-0} = Rd;
3454}
3455
3456multiclass ThreeOperandFPData<bit isNegated, bit isSub,string asm,
3457 SDPatternOperator node> {
3458 def Srrr : BaseThreeOperandFPData<isNegated, isSub, FPR32, asm,
3459 [(set FPR32:$Rd,
3460 (node (f32 FPR32:$Rn), (f32 FPR32:$Rm), (f32 FPR32:$Ra)))]> {
3461 let Inst{22} = 0; // 32-bit size flag
3462 }
3463
3464 def Drrr : BaseThreeOperandFPData<isNegated, isSub, FPR64, asm,
3465 [(set FPR64:$Rd,
3466 (node (f64 FPR64:$Rn), (f64 FPR64:$Rm), (f64 FPR64:$Ra)))]> {
3467 let Inst{22} = 1; // 64-bit size flag
3468 }
3469}
3470
3471//---
3472// Floating point data comparisons
3473//---
3474
3475let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3476class BaseOneOperandFPComparison<bit signalAllNans,
3477 RegisterClass regtype, string asm,
3478 list<dag> pat>
3479 : I<(outs), (ins regtype:$Rn), asm, "\t$Rn, #0.0", "", pat>,
3480 Sched<[WriteFCmp]> {
3481 bits<5> Rn;
3482 let Inst{31-23} = 0b000111100;
3483 let Inst{21} = 1;
3484
3485 let Inst{20-16} = 0b00000;
3486 let Inst{15-10} = 0b001000;
3487 let Inst{9-5} = Rn;
3488 let Inst{4} = signalAllNans;
3489 let Inst{3-0} = 0b1000;
3490}
3491
3492let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3493class BaseTwoOperandFPComparison<bit signalAllNans, RegisterClass regtype,
3494 string asm, list<dag> pat>
3495 : I<(outs), (ins regtype:$Rn, regtype:$Rm), asm, "\t$Rn, $Rm", "", pat>,
3496 Sched<[WriteFCmp]> {
3497 bits<5> Rm;
3498 bits<5> Rn;
3499 let Inst{31-23} = 0b000111100;
3500 let Inst{21} = 1;
3501 let Inst{20-16} = Rm;
3502 let Inst{15-10} = 0b001000;
3503 let Inst{9-5} = Rn;
3504 let Inst{4} = signalAllNans;
3505 let Inst{3-0} = 0b0000;
3506}
3507
3508multiclass FPComparison<bit signalAllNans, string asm,
3509 SDPatternOperator OpNode = null_frag> {
3510 let Defs = [CPSR] in {
3511 def Srr : BaseTwoOperandFPComparison<signalAllNans, FPR32, asm,
3512 [(OpNode FPR32:$Rn, (f32 FPR32:$Rm)), (implicit CPSR)]> {
3513 let Inst{22} = 0;
3514 }
3515
3516 def Sri : BaseOneOperandFPComparison<signalAllNans, FPR32, asm,
3517 [(OpNode (f32 FPR32:$Rn), fpimm0), (implicit CPSR)]> {
3518 let Inst{22} = 0;
3519 }
3520
3521 def Drr : BaseTwoOperandFPComparison<signalAllNans, FPR64, asm,
3522 [(OpNode FPR64:$Rn, (f64 FPR64:$Rm)), (implicit CPSR)]> {
3523 let Inst{22} = 1;
3524 }
3525
3526 def Dri : BaseOneOperandFPComparison<signalAllNans, FPR64, asm,
3527 [(OpNode (f64 FPR64:$Rn), fpimm0), (implicit CPSR)]> {
3528 let Inst{22} = 1;
3529 }
3530 } // Defs = [CPSR]
3531}
3532
3533//---
3534// Floating point conditional comparisons
3535//---
3536
3537let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3538class BaseFPCondComparison<bit signalAllNans,
3539 RegisterClass regtype, string asm>
3540 : I<(outs), (ins regtype:$Rn, regtype:$Rm, imm0_15:$nzcv, ccode:$cond),
3541 asm, "\t$Rn, $Rm, $nzcv, $cond", "", []>,
3542 Sched<[WriteFCmp]> {
3543 bits<5> Rn;
3544 bits<5> Rm;
3545 bits<4> nzcv;
3546 bits<4> cond;
3547
3548 let Inst{31-23} = 0b000111100;
3549 let Inst{21} = 1;
3550 let Inst{20-16} = Rm;
3551 let Inst{15-12} = cond;
3552 let Inst{11-10} = 0b01;
3553 let Inst{9-5} = Rn;
3554 let Inst{4} = signalAllNans;
3555 let Inst{3-0} = nzcv;
3556}
3557
3558multiclass FPCondComparison<bit signalAllNans, string asm> {
3559 let Defs = [CPSR], Uses = [CPSR] in {
3560 def Srr : BaseFPCondComparison<signalAllNans, FPR32, asm> {
3561 let Inst{22} = 0;
3562 }
3563
3564 def Drr : BaseFPCondComparison<signalAllNans, FPR64, asm> {
3565 let Inst{22} = 1;
3566 }
3567 } // Defs = [CPSR], Uses = [CPSR]
3568}
3569
3570//---
3571// Floating point conditional select
3572//---
3573
3574class BaseFPCondSelect<RegisterClass regtype, ValueType vt, string asm>
3575 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, ccode:$cond),
3576 asm, "\t$Rd, $Rn, $Rm, $cond", "",
3577 [(set regtype:$Rd,
3578 (ARM64csel (vt regtype:$Rn), regtype:$Rm,
3579 (i32 imm:$cond), CPSR))]>,
3580 Sched<[WriteF]> {
3581 bits<5> Rd;
3582 bits<5> Rn;
3583 bits<5> Rm;
3584 bits<4> cond;
3585
3586 let Inst{31-23} = 0b000111100;
3587 let Inst{21} = 1;
3588 let Inst{20-16} = Rm;
3589 let Inst{15-12} = cond;
3590 let Inst{11-10} = 0b11;
3591 let Inst{9-5} = Rn;
3592 let Inst{4-0} = Rd;
3593}
3594
3595multiclass FPCondSelect<string asm> {
3596 let Uses = [CPSR] in {
3597 def Srrr : BaseFPCondSelect<FPR32, f32, asm> {
3598 let Inst{22} = 0;
3599 }
3600
3601 def Drrr : BaseFPCondSelect<FPR64, f64, asm> {
3602 let Inst{22} = 1;
3603 }
3604 } // Uses = [CPSR]
3605}
3606
3607//---
3608// Floating move immediate
3609//---
3610
3611class BaseFPMoveImmediate<RegisterClass regtype, Operand fpimmtype, string asm>
3612 : I<(outs regtype:$Rd), (ins fpimmtype:$imm), asm, "\t$Rd, $imm", "",
3613 [(set regtype:$Rd, fpimmtype:$imm)]>,
3614 Sched<[WriteFImm]> {
3615 bits<5> Rd;
3616 bits<8> imm;
3617 let Inst{31-23} = 0b000111100;
3618 let Inst{21} = 1;
3619 let Inst{20-13} = imm;
3620 let Inst{12-5} = 0b10000000;
3621 let Inst{4-0} = Rd;
3622}
3623
3624multiclass FPMoveImmediate<string asm> {
3625 def Si : BaseFPMoveImmediate<FPR32, fpimm32, asm> {
3626 let Inst{22} = 0;
3627 }
3628
3629 def Di : BaseFPMoveImmediate<FPR64, fpimm64, asm> {
3630 let Inst{22} = 1;
3631 }
3632}
3633
3634//----------------------------------------------------------------------------
3635// AdvSIMD
3636//----------------------------------------------------------------------------
3637
3638def VectorIndexBOperand : AsmOperandClass { let Name = "VectorIndexB"; }
3639def VectorIndexHOperand : AsmOperandClass { let Name = "VectorIndexH"; }
3640def VectorIndexSOperand : AsmOperandClass { let Name = "VectorIndexS"; }
3641def VectorIndexDOperand : AsmOperandClass { let Name = "VectorIndexD"; }
3642def VectorIndexB : Operand<i64>, ImmLeaf<i64, [{
3643 return ((uint64_t)Imm) < 16;
3644}]> {
3645 let ParserMatchClass = VectorIndexBOperand;
3646 let PrintMethod = "printVectorIndex";
3647 let MIOperandInfo = (ops i64imm);
3648}
3649def VectorIndexH : Operand<i64>, ImmLeaf<i64, [{
3650 return ((uint64_t)Imm) < 8;
3651}]> {
3652 let ParserMatchClass = VectorIndexHOperand;
3653 let PrintMethod = "printVectorIndex";
3654 let MIOperandInfo = (ops i64imm);
3655}
3656def VectorIndexS : Operand<i64>, ImmLeaf<i64, [{
3657 return ((uint64_t)Imm) < 4;
3658}]> {
3659 let ParserMatchClass = VectorIndexSOperand;
3660 let PrintMethod = "printVectorIndex";
3661 let MIOperandInfo = (ops i64imm);
3662}
3663def VectorIndexD : Operand<i64>, ImmLeaf<i64, [{
3664 return ((uint64_t)Imm) < 2;
3665}]> {
3666 let ParserMatchClass = VectorIndexDOperand;
3667 let PrintMethod = "printVectorIndex";
3668 let MIOperandInfo = (ops i64imm);
3669}
3670
3671//----------------------------------------------------------------------------
3672// AdvSIMD three register vector instructions
3673//----------------------------------------------------------------------------
3674
3675let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3676class BaseSIMDThreeSameVector<bit Q, bit U, bits<2> size, bits<5> opcode,
3677 RegisterOperand regtype, string asm, string kind,
3678 list<dag> pattern>
3679 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm), asm,
3680 "{\t$Rd" # kind # ", $Rn" # kind # ", $Rm" # kind #
3681 "|" # kind # "\t$Rd, $Rn, $Rm|}", "", pattern>,
3682 Sched<[WriteV]> {
3683 bits<5> Rd;
3684 bits<5> Rn;
3685 bits<5> Rm;
3686 let Inst{31} = 0;
3687 let Inst{30} = Q;
3688 let Inst{29} = U;
3689 let Inst{28-24} = 0b01110;
3690 let Inst{23-22} = size;
3691 let Inst{21} = 1;
3692 let Inst{20-16} = Rm;
3693 let Inst{15-11} = opcode;
3694 let Inst{10} = 1;
3695 let Inst{9-5} = Rn;
3696 let Inst{4-0} = Rd;
3697}
3698
3699let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3700class BaseSIMDThreeSameVectorTied<bit Q, bit U, bits<2> size, bits<5> opcode,
3701 RegisterOperand regtype, string asm, string kind,
3702 list<dag> pattern>
3703 : I<(outs regtype:$dst), (ins regtype:$Rd, regtype:$Rn, regtype:$Rm), asm,
3704 "{\t$Rd" # kind # ", $Rn" # kind # ", $Rm" # kind #
3705 "|" # kind # "\t$Rd, $Rn, $Rm}", "$Rd = $dst", pattern>,
3706 Sched<[WriteV]> {
3707 bits<5> Rd;
3708 bits<5> Rn;
3709 bits<5> Rm;
3710 let Inst{31} = 0;
3711 let Inst{30} = Q;
3712 let Inst{29} = U;
3713 let Inst{28-24} = 0b01110;
3714 let Inst{23-22} = size;
3715 let Inst{21} = 1;
3716 let Inst{20-16} = Rm;
3717 let Inst{15-11} = opcode;
3718 let Inst{10} = 1;
3719 let Inst{9-5} = Rn;
3720 let Inst{4-0} = Rd;
3721}
3722
3723// All operand sizes distinguished in the encoding.
3724multiclass SIMDThreeSameVector<bit U, bits<5> opc, string asm,
3725 SDPatternOperator OpNode> {
3726 def v8i8 : BaseSIMDThreeSameVector<0, U, 0b00, opc, V64,
3727 asm, ".8b",
3728 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
3729 def v16i8 : BaseSIMDThreeSameVector<1, U, 0b00, opc, V128,
3730 asm, ".16b",
3731 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn), (v16i8 V128:$Rm)))]>;
3732 def v4i16 : BaseSIMDThreeSameVector<0, U, 0b01, opc, V64,
3733 asm, ".4h",
3734 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
3735 def v8i16 : BaseSIMDThreeSameVector<1, U, 0b01, opc, V128,
3736 asm, ".8h",
3737 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn), (v8i16 V128:$Rm)))]>;
3738 def v2i32 : BaseSIMDThreeSameVector<0, U, 0b10, opc, V64,
3739 asm, ".2s",
3740 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
3741 def v4i32 : BaseSIMDThreeSameVector<1, U, 0b10, opc, V128,
3742 asm, ".4s",
3743 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn), (v4i32 V128:$Rm)))]>;
3744 def v2i64 : BaseSIMDThreeSameVector<1, U, 0b11, opc, V128,
3745 asm, ".2d",
3746 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn), (v2i64 V128:$Rm)))]>;
3747}
3748
3749// As above, but D sized elements unsupported.
3750multiclass SIMDThreeSameVectorBHS<bit U, bits<5> opc, string asm,
3751 SDPatternOperator OpNode> {
3752 def v8i8 : BaseSIMDThreeSameVector<0, U, 0b00, opc, V64,
3753 asm, ".8b",
3754 [(set V64:$Rd, (v8i8 (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm))))]>;
3755 def v16i8 : BaseSIMDThreeSameVector<1, U, 0b00, opc, V128,
3756 asm, ".16b",
3757 [(set V128:$Rd, (v16i8 (OpNode (v16i8 V128:$Rn), (v16i8 V128:$Rm))))]>;
3758 def v4i16 : BaseSIMDThreeSameVector<0, U, 0b01, opc, V64,
3759 asm, ".4h",
3760 [(set V64:$Rd, (v4i16 (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm))))]>;
3761 def v8i16 : BaseSIMDThreeSameVector<1, U, 0b01, opc, V128,
3762 asm, ".8h",
3763 [(set V128:$Rd, (v8i16 (OpNode (v8i16 V128:$Rn), (v8i16 V128:$Rm))))]>;
3764 def v2i32 : BaseSIMDThreeSameVector<0, U, 0b10, opc, V64,
3765 asm, ".2s",
3766 [(set V64:$Rd, (v2i32 (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm))))]>;
3767 def v4i32 : BaseSIMDThreeSameVector<1, U, 0b10, opc, V128,
3768 asm, ".4s",
3769 [(set V128:$Rd, (v4i32 (OpNode (v4i32 V128:$Rn), (v4i32 V128:$Rm))))]>;
3770}
3771
3772multiclass SIMDThreeSameVectorBHSTied<bit U, bits<5> opc, string asm,
3773 SDPatternOperator OpNode> {
3774 def v8i8 : BaseSIMDThreeSameVectorTied<0, U, 0b00, opc, V64,
3775 asm, ".8b",
3776 [(set (v8i8 V64:$dst),
3777 (OpNode (v8i8 V64:$Rd), (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
3778 def v16i8 : BaseSIMDThreeSameVectorTied<1, U, 0b00, opc, V128,
3779 asm, ".16b",
3780 [(set (v16i8 V128:$dst),
3781 (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn), (v16i8 V128:$Rm)))]>;
3782 def v4i16 : BaseSIMDThreeSameVectorTied<0, U, 0b01, opc, V64,
3783 asm, ".4h",
3784 [(set (v4i16 V64:$dst),
3785 (OpNode (v4i16 V64:$Rd), (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
3786 def v8i16 : BaseSIMDThreeSameVectorTied<1, U, 0b01, opc, V128,
3787 asm, ".8h",
3788 [(set (v8i16 V128:$dst),
3789 (OpNode (v8i16 V128:$Rd), (v8i16 V128:$Rn), (v8i16 V128:$Rm)))]>;
3790 def v2i32 : BaseSIMDThreeSameVectorTied<0, U, 0b10, opc, V64,
3791 asm, ".2s",
3792 [(set (v2i32 V64:$dst),
3793 (OpNode (v2i32 V64:$Rd), (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
3794 def v4i32 : BaseSIMDThreeSameVectorTied<1, U, 0b10, opc, V128,
3795 asm, ".4s",
3796 [(set (v4i32 V128:$dst),
3797 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn), (v4i32 V128:$Rm)))]>;
3798}
3799
3800// As above, but only B sized elements supported.
3801multiclass SIMDThreeSameVectorB<bit U, bits<5> opc, string asm,
3802 SDPatternOperator OpNode> {
3803 def v8i8 : BaseSIMDThreeSameVector<0, U, 0b00, opc, V64,
3804 asm, ".8b",
3805 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
3806 def v16i8 : BaseSIMDThreeSameVector<1, U, 0b00, opc, V128,
3807 asm, ".16b",
3808 [(set (v16i8 V128:$Rd),
3809 (OpNode (v16i8 V128:$Rn), (v16i8 V128:$Rm)))]>;
3810}
3811
3812// As above, but only S and D sized floating point elements supported.
3813multiclass SIMDThreeSameVectorFP<bit U, bit S, bits<5> opc,
3814 string asm, SDPatternOperator OpNode> {
3815 def v2f32 : BaseSIMDThreeSameVector<0, U, {S,0}, opc, V64,
3816 asm, ".2s",
3817 [(set (v2f32 V64:$Rd), (OpNode (v2f32 V64:$Rn), (v2f32 V64:$Rm)))]>;
3818 def v4f32 : BaseSIMDThreeSameVector<1, U, {S,0}, opc, V128,
3819 asm, ".4s",
3820 [(set (v4f32 V128:$Rd), (OpNode (v4f32 V128:$Rn), (v4f32 V128:$Rm)))]>;
3821 def v2f64 : BaseSIMDThreeSameVector<1, U, {S,1}, opc, V128,
3822 asm, ".2d",
3823 [(set (v2f64 V128:$Rd), (OpNode (v2f64 V128:$Rn), (v2f64 V128:$Rm)))]>;
3824}
3825
3826multiclass SIMDThreeSameVectorFPCmp<bit U, bit S, bits<5> opc,
3827 string asm,
3828 SDPatternOperator OpNode> {
3829 def v2f32 : BaseSIMDThreeSameVector<0, U, {S,0}, opc, V64,
3830 asm, ".2s",
3831 [(set (v2i32 V64:$Rd), (OpNode (v2f32 V64:$Rn), (v2f32 V64:$Rm)))]>;
3832 def v4f32 : BaseSIMDThreeSameVector<1, U, {S,0}, opc, V128,
3833 asm, ".4s",
3834 [(set (v4i32 V128:$Rd), (OpNode (v4f32 V128:$Rn), (v4f32 V128:$Rm)))]>;
3835 def v2f64 : BaseSIMDThreeSameVector<1, U, {S,1}, opc, V128,
3836 asm, ".2d",
3837 [(set (v2i64 V128:$Rd), (OpNode (v2f64 V128:$Rn), (v2f64 V128:$Rm)))]>;
3838}
3839
3840multiclass SIMDThreeSameVectorFPTied<bit U, bit S, bits<5> opc,
3841 string asm, SDPatternOperator OpNode> {
3842 def v2f32 : BaseSIMDThreeSameVectorTied<0, U, {S,0}, opc, V64,
3843 asm, ".2s",
3844 [(set (v2f32 V64:$dst),
3845 (OpNode (v2f32 V64:$Rd), (v2f32 V64:$Rn), (v2f32 V64:$Rm)))]>;
3846 def v4f32 : BaseSIMDThreeSameVectorTied<1, U, {S,0}, opc, V128,
3847 asm, ".4s",
3848 [(set (v4f32 V128:$dst),
3849 (OpNode (v4f32 V128:$Rd), (v4f32 V128:$Rn), (v4f32 V128:$Rm)))]>;
3850 def v2f64 : BaseSIMDThreeSameVectorTied<1, U, {S,1}, opc, V128,
3851 asm, ".2d",
3852 [(set (v2f64 V128:$dst),
3853 (OpNode (v2f64 V128:$Rd), (v2f64 V128:$Rn), (v2f64 V128:$Rm)))]>;
3854}
3855
3856// As above, but D and B sized elements unsupported.
3857multiclass SIMDThreeSameVectorHS<bit U, bits<5> opc, string asm,
3858 SDPatternOperator OpNode> {
3859 def v4i16 : BaseSIMDThreeSameVector<0, U, 0b01, opc, V64,
3860 asm, ".4h",
3861 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
3862 def v8i16 : BaseSIMDThreeSameVector<1, U, 0b01, opc, V128,
3863 asm, ".8h",
3864 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn), (v8i16 V128:$Rm)))]>;
3865 def v2i32 : BaseSIMDThreeSameVector<0, U, 0b10, opc, V64,
3866 asm, ".2s",
3867 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
3868 def v4i32 : BaseSIMDThreeSameVector<1, U, 0b10, opc, V128,
3869 asm, ".4s",
3870 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn), (v4i32 V128:$Rm)))]>;
3871}
3872
3873// Logical three vector ops share opcode bits, and only use B sized elements.
3874multiclass SIMDLogicalThreeVector<bit U, bits<2> size, string asm,
3875 SDPatternOperator OpNode = null_frag> {
3876 def v8i8 : BaseSIMDThreeSameVector<0, U, size, 0b00011, V64,
3877 asm, ".8b",
3878 [(set (v8i8 V64:$Rd), (OpNode V64:$Rn, V64:$Rm))]>;
3879 def v16i8 : BaseSIMDThreeSameVector<1, U, size, 0b00011, V128,
3880 asm, ".16b",
3881 [(set (v16i8 V128:$Rd), (OpNode V128:$Rn, V128:$Rm))]>;
3882
3883 def : Pat<(v4i16 (OpNode V64:$LHS, V64:$RHS)),
3884 (!cast<Instruction>(NAME#"v8i8") V64:$LHS, V64:$RHS)>;
3885 def : Pat<(v2i32 (OpNode V64:$LHS, V64:$RHS)),
3886 (!cast<Instruction>(NAME#"v8i8") V64:$LHS, V64:$RHS)>;
3887 def : Pat<(v1i64 (OpNode V64:$LHS, V64:$RHS)),
3888 (!cast<Instruction>(NAME#"v8i8") V64:$LHS, V64:$RHS)>;
3889
3890 def : Pat<(v8i16 (OpNode V128:$LHS, V128:$RHS)),
3891 (!cast<Instruction>(NAME#"v16i8") V128:$LHS, V128:$RHS)>;
3892 def : Pat<(v4i32 (OpNode V128:$LHS, V128:$RHS)),
3893 (!cast<Instruction>(NAME#"v16i8") V128:$LHS, V128:$RHS)>;
3894 def : Pat<(v2i64 (OpNode V128:$LHS, V128:$RHS)),
3895 (!cast<Instruction>(NAME#"v16i8") V128:$LHS, V128:$RHS)>;
3896}
3897
3898multiclass SIMDLogicalThreeVectorTied<bit U, bits<2> size,
3899 string asm, SDPatternOperator OpNode> {
3900 def v8i8 : BaseSIMDThreeSameVectorTied<0, U, size, 0b00011, V64,
3901 asm, ".8b",
3902 [(set (v8i8 V64:$dst),
3903 (OpNode (v8i8 V64:$Rd), (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
3904 def v16i8 : BaseSIMDThreeSameVectorTied<1, U, size, 0b00011, V128,
3905 asm, ".16b",
3906 [(set (v16i8 V128:$dst),
3907 (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn),
3908 (v16i8 V128:$Rm)))]>;
3909
3910 def : Pat<(v4i16 (OpNode (v4i16 V64:$LHS), (v4i16 V64:$MHS),
3911 (v4i16 V64:$RHS))),
3912 (!cast<Instruction>(NAME#"v8i8")
3913 V64:$LHS, V64:$MHS, V64:$RHS)>;
3914 def : Pat<(v2i32 (OpNode (v2i32 V64:$LHS), (v2i32 V64:$MHS),
3915 (v2i32 V64:$RHS))),
3916 (!cast<Instruction>(NAME#"v8i8")
3917 V64:$LHS, V64:$MHS, V64:$RHS)>;
3918 def : Pat<(v1i64 (OpNode (v1i64 V64:$LHS), (v1i64 V64:$MHS),
3919 (v1i64 V64:$RHS))),
3920 (!cast<Instruction>(NAME#"v8i8")
3921 V64:$LHS, V64:$MHS, V64:$RHS)>;
3922
3923 def : Pat<(v8i16 (OpNode (v8i16 V128:$LHS), (v8i16 V128:$MHS),
3924 (v8i16 V128:$RHS))),
3925 (!cast<Instruction>(NAME#"v16i8")
3926 V128:$LHS, V128:$MHS, V128:$RHS)>;
3927 def : Pat<(v4i32 (OpNode (v4i32 V128:$LHS), (v4i32 V128:$MHS),
3928 (v4i32 V128:$RHS))),
3929 (!cast<Instruction>(NAME#"v16i8")
3930 V128:$LHS, V128:$MHS, V128:$RHS)>;
3931 def : Pat<(v2i64 (OpNode (v2i64 V128:$LHS), (v2i64 V128:$MHS),
3932 (v2i64 V128:$RHS))),
3933 (!cast<Instruction>(NAME#"v16i8")
3934 V128:$LHS, V128:$MHS, V128:$RHS)>;
3935}
3936
3937
3938//----------------------------------------------------------------------------
3939// AdvSIMD two register vector instructions.
3940//----------------------------------------------------------------------------
3941
3942let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3943class BaseSIMDTwoSameVector<bit Q, bit U, bits<2> size, bits<5> opcode,
3944 RegisterOperand regtype, string asm, string dstkind,
3945 string srckind, list<dag> pattern>
3946 : I<(outs regtype:$Rd), (ins regtype:$Rn), asm,
3947 "{\t$Rd" # dstkind # ", $Rn" # srckind #
3948 "|" # dstkind # "\t$Rd, $Rn}", "", pattern>,
3949 Sched<[WriteV]> {
3950 bits<5> Rd;
3951 bits<5> Rn;
3952 let Inst{31} = 0;
3953 let Inst{30} = Q;
3954 let Inst{29} = U;
3955 let Inst{28-24} = 0b01110;
3956 let Inst{23-22} = size;
3957 let Inst{21-17} = 0b10000;
3958 let Inst{16-12} = opcode;
3959 let Inst{11-10} = 0b10;
3960 let Inst{9-5} = Rn;
3961 let Inst{4-0} = Rd;
3962}
3963
3964let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3965class BaseSIMDTwoSameVectorTied<bit Q, bit U, bits<2> size, bits<5> opcode,
3966 RegisterOperand regtype, string asm, string dstkind,
3967 string srckind, list<dag> pattern>
3968 : I<(outs regtype:$dst), (ins regtype:$Rd, regtype:$Rn), asm,
3969 "{\t$Rd" # dstkind # ", $Rn" # srckind #
3970 "|" # dstkind # "\t$Rd, $Rn}", "$Rd = $dst", pattern>,
3971 Sched<[WriteV]> {
3972 bits<5> Rd;
3973 bits<5> Rn;
3974 let Inst{31} = 0;
3975 let Inst{30} = Q;
3976 let Inst{29} = U;
3977 let Inst{28-24} = 0b01110;
3978 let Inst{23-22} = size;
3979 let Inst{21-17} = 0b10000;
3980 let Inst{16-12} = opcode;
3981 let Inst{11-10} = 0b10;
3982 let Inst{9-5} = Rn;
3983 let Inst{4-0} = Rd;
3984}
3985
3986// Supports B, H, and S element sizes.
3987multiclass SIMDTwoVectorBHS<bit U, bits<5> opc, string asm,
3988 SDPatternOperator OpNode> {
3989 def v8i8 : BaseSIMDTwoSameVector<0, U, 0b00, opc, V64,
3990 asm, ".8b", ".8b",
3991 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn)))]>;
3992 def v16i8 : BaseSIMDTwoSameVector<1, U, 0b00, opc, V128,
3993 asm, ".16b", ".16b",
3994 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn)))]>;
3995 def v4i16 : BaseSIMDTwoSameVector<0, U, 0b01, opc, V64,
3996 asm, ".4h", ".4h",
3997 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn)))]>;
3998 def v8i16 : BaseSIMDTwoSameVector<1, U, 0b01, opc, V128,
3999 asm, ".8h", ".8h",
4000 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn)))]>;
4001 def v2i32 : BaseSIMDTwoSameVector<0, U, 0b10, opc, V64,
4002 asm, ".2s", ".2s",
4003 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn)))]>;
4004 def v4i32 : BaseSIMDTwoSameVector<1, U, 0b10, opc, V128,
4005 asm, ".4s", ".4s",
4006 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4007}
4008
4009class BaseSIMDVectorLShiftLongBySize<bit Q, bits<2> size,
4010 RegisterOperand regtype, string asm, string dstkind,
4011 string srckind, string amount>
4012 : I<(outs V128:$Rd), (ins regtype:$Rn), asm,
4013 "{\t$Rd" # dstkind # ", $Rn" # srckind # ", #" # amount #
4014 "|" # dstkind # "\t$Rd, $Rn, #" # amount # "}", "", []>,
4015 Sched<[WriteV]> {
4016 bits<5> Rd;
4017 bits<5> Rn;
4018 let Inst{31} = 0;
4019 let Inst{30} = Q;
4020 let Inst{29-24} = 0b101110;
4021 let Inst{23-22} = size;
4022 let Inst{21-10} = 0b100001001110;
4023 let Inst{9-5} = Rn;
4024 let Inst{4-0} = Rd;
4025}
4026
4027multiclass SIMDVectorLShiftLongBySizeBHS {
4028 let neverHasSideEffects = 1 in {
4029 def v8i8 : BaseSIMDVectorLShiftLongBySize<0, 0b00, V64,
4030 "shll", ".8h", ".8b", "8">;
4031 def v16i8 : BaseSIMDVectorLShiftLongBySize<1, 0b00, V128,
4032 "shll2", ".8h", ".16b", "8">;
4033 def v4i16 : BaseSIMDVectorLShiftLongBySize<0, 0b01, V64,
4034 "shll", ".4s", ".4h", "16">;
4035 def v8i16 : BaseSIMDVectorLShiftLongBySize<1, 0b01, V128,
4036 "shll2", ".4s", ".8h", "16">;
4037 def v2i32 : BaseSIMDVectorLShiftLongBySize<0, 0b10, V64,
4038 "shll", ".2d", ".2s", "32">;
4039 def v4i32 : BaseSIMDVectorLShiftLongBySize<1, 0b10, V128,
4040 "shll2", ".2d", ".4s", "32">;
4041 }
4042}
4043
4044// Supports all element sizes.
4045multiclass SIMDLongTwoVector<bit U, bits<5> opc, string asm,
4046 SDPatternOperator OpNode> {
4047 def v8i8_v4i16 : BaseSIMDTwoSameVector<0, U, 0b00, opc, V64,
4048 asm, ".4h", ".8b",
4049 [(set (v4i16 V64:$Rd), (OpNode (v8i8 V64:$Rn)))]>;
4050 def v16i8_v8i16 : BaseSIMDTwoSameVector<1, U, 0b00, opc, V128,
4051 asm, ".8h", ".16b",
4052 [(set (v8i16 V128:$Rd), (OpNode (v16i8 V128:$Rn)))]>;
4053 def v4i16_v2i32 : BaseSIMDTwoSameVector<0, U, 0b01, opc, V64,
4054 asm, ".2s", ".4h",
4055 [(set (v2i32 V64:$Rd), (OpNode (v4i16 V64:$Rn)))]>;
4056 def v8i16_v4i32 : BaseSIMDTwoSameVector<1, U, 0b01, opc, V128,
4057 asm, ".4s", ".8h",
4058 [(set (v4i32 V128:$Rd), (OpNode (v8i16 V128:$Rn)))]>;
4059 def v2i32_v1i64 : BaseSIMDTwoSameVector<0, U, 0b10, opc, V64,
4060 asm, ".1d", ".2s",
4061 [(set (v1i64 V64:$Rd), (OpNode (v2i32 V64:$Rn)))]>;
4062 def v4i32_v2i64 : BaseSIMDTwoSameVector<1, U, 0b10, opc, V128,
4063 asm, ".2d", ".4s",
4064 [(set (v2i64 V128:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4065}
4066
4067multiclass SIMDLongTwoVectorTied<bit U, bits<5> opc, string asm,
4068 SDPatternOperator OpNode> {
4069 def v8i8_v4i16 : BaseSIMDTwoSameVectorTied<0, U, 0b00, opc, V64,
4070 asm, ".4h", ".8b",
4071 [(set (v4i16 V64:$dst), (OpNode (v4i16 V64:$Rd),
4072 (v8i8 V64:$Rn)))]>;
4073 def v16i8_v8i16 : BaseSIMDTwoSameVectorTied<1, U, 0b00, opc, V128,
4074 asm, ".8h", ".16b",
4075 [(set (v8i16 V128:$dst), (OpNode (v8i16 V128:$Rd),
4076 (v16i8 V128:$Rn)))]>;
4077 def v4i16_v2i32 : BaseSIMDTwoSameVectorTied<0, U, 0b01, opc, V64,
4078 asm, ".2s", ".4h",
4079 [(set (v2i32 V64:$dst), (OpNode (v2i32 V64:$Rd),
4080 (v4i16 V64:$Rn)))]>;
4081 def v8i16_v4i32 : BaseSIMDTwoSameVectorTied<1, U, 0b01, opc, V128,
4082 asm, ".4s", ".8h",
4083 [(set (v4i32 V128:$dst), (OpNode (v4i32 V128:$Rd),
4084 (v8i16 V128:$Rn)))]>;
4085 def v2i32_v1i64 : BaseSIMDTwoSameVectorTied<0, U, 0b10, opc, V64,
4086 asm, ".1d", ".2s",
4087 [(set (v1i64 V64:$dst), (OpNode (v1i64 V64:$Rd),
4088 (v2i32 V64:$Rn)))]>;
4089 def v4i32_v2i64 : BaseSIMDTwoSameVectorTied<1, U, 0b10, opc, V128,
4090 asm, ".2d", ".4s",
4091 [(set (v2i64 V128:$dst), (OpNode (v2i64 V128:$Rd),
4092 (v4i32 V128:$Rn)))]>;
4093}
4094
4095// Supports all element sizes, except 1xD.
4096multiclass SIMDTwoVectorBHSDTied<bit U, bits<5> opc, string asm,
4097 SDPatternOperator OpNode> {
4098 def v8i8 : BaseSIMDTwoSameVectorTied<0, U, 0b00, opc, V64,
4099 asm, ".8b", ".8b",
4100 [(set (v8i8 V64:$dst), (OpNode (v8i8 V64:$Rd), (v8i8 V64:$Rn)))]>;
4101 def v16i8 : BaseSIMDTwoSameVectorTied<1, U, 0b00, opc, V128,
4102 asm, ".16b", ".16b",
4103 [(set (v16i8 V128:$dst), (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn)))]>;
4104 def v4i16 : BaseSIMDTwoSameVectorTied<0, U, 0b01, opc, V64,
4105 asm, ".4h", ".4h",
4106 [(set (v4i16 V64:$dst), (OpNode (v4i16 V64:$Rd), (v4i16 V64:$Rn)))]>;
4107 def v8i16 : BaseSIMDTwoSameVectorTied<1, U, 0b01, opc, V128,
4108 asm, ".8h", ".8h",
4109 [(set (v8i16 V128:$dst), (OpNode (v8i16 V128:$Rd), (v8i16 V128:$Rn)))]>;
4110 def v2i32 : BaseSIMDTwoSameVectorTied<0, U, 0b10, opc, V64,
4111 asm, ".2s", ".2s",
4112 [(set (v2i32 V64:$dst), (OpNode (v2i32 V64:$Rd), (v2i32 V64:$Rn)))]>;
4113 def v4i32 : BaseSIMDTwoSameVectorTied<1, U, 0b10, opc, V128,
4114 asm, ".4s", ".4s",
4115 [(set (v4i32 V128:$dst), (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn)))]>;
4116 def v2i64 : BaseSIMDTwoSameVectorTied<1, U, 0b11, opc, V128,
4117 asm, ".2d", ".2d",
4118 [(set (v2i64 V128:$dst), (OpNode (v2i64 V128:$Rd), (v2i64 V128:$Rn)))]>;
4119}
4120
4121multiclass SIMDTwoVectorBHSD<bit U, bits<5> opc, string asm,
4122 SDPatternOperator OpNode = null_frag> {
4123 def v8i8 : BaseSIMDTwoSameVector<0, U, 0b00, opc, V64,
4124 asm, ".8b", ".8b",
4125 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn)))]>;
4126 def v16i8 : BaseSIMDTwoSameVector<1, U, 0b00, opc, V128,
4127 asm, ".16b", ".16b",
4128 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn)))]>;
4129 def v4i16 : BaseSIMDTwoSameVector<0, U, 0b01, opc, V64,
4130 asm, ".4h", ".4h",
4131 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn)))]>;
4132 def v8i16 : BaseSIMDTwoSameVector<1, U, 0b01, opc, V128,
4133 asm, ".8h", ".8h",
4134 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn)))]>;
4135 def v2i32 : BaseSIMDTwoSameVector<0, U, 0b10, opc, V64,
4136 asm, ".2s", ".2s",
4137 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn)))]>;
4138 def v4i32 : BaseSIMDTwoSameVector<1, U, 0b10, opc, V128,
4139 asm, ".4s", ".4s",
4140 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4141 def v2i64 : BaseSIMDTwoSameVector<1, U, 0b11, opc, V128,
4142 asm, ".2d", ".2d",
4143 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn)))]>;
4144}
4145
4146
4147// Supports only B element sizes.
4148multiclass SIMDTwoVectorB<bit U, bits<2> size, bits<5> opc, string asm,
4149 SDPatternOperator OpNode> {
4150 def v8i8 : BaseSIMDTwoSameVector<0, U, size, opc, V64,
4151 asm, ".8b", ".8b",
4152 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn)))]>;
4153 def v16i8 : BaseSIMDTwoSameVector<1, U, size, opc, V128,
4154 asm, ".16b", ".16b",
4155 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn)))]>;
4156
4157}
4158
4159// Supports only B and H element sizes.
4160multiclass SIMDTwoVectorBH<bit U, bits<5> opc, string asm,
4161 SDPatternOperator OpNode> {
4162 def v8i8 : BaseSIMDTwoSameVector<0, U, 0b00, opc, V64,
4163 asm, ".8b", ".8b",
4164 [(set (v8i8 V64:$Rd), (OpNode V64:$Rn))]>;
4165 def v16i8 : BaseSIMDTwoSameVector<1, U, 0b00, opc, V128,
4166 asm, ".16b", ".16b",
4167 [(set (v16i8 V128:$Rd), (OpNode V128:$Rn))]>;
4168 def v4i16 : BaseSIMDTwoSameVector<0, U, 0b01, opc, V64,
4169 asm, ".4h", ".4h",
4170 [(set (v4i16 V64:$Rd), (OpNode V64:$Rn))]>;
4171 def v8i16 : BaseSIMDTwoSameVector<1, U, 0b01, opc, V128,
4172 asm, ".8h", ".8h",
4173 [(set (v8i16 V128:$Rd), (OpNode V128:$Rn))]>;
4174}
4175
4176// Supports only S and D element sizes, uses high bit of the size field
4177// as an extra opcode bit.
4178multiclass SIMDTwoVectorFP<bit U, bit S, bits<5> opc, string asm,
4179 SDPatternOperator OpNode> {
4180 def v2f32 : BaseSIMDTwoSameVector<0, U, {S,0}, opc, V64,
4181 asm, ".2s", ".2s",
4182 [(set (v2f32 V64:$Rd), (OpNode (v2f32 V64:$Rn)))]>;
4183 def v4f32 : BaseSIMDTwoSameVector<1, U, {S,0}, opc, V128,
4184 asm, ".4s", ".4s",
4185 [(set (v4f32 V128:$Rd), (OpNode (v4f32 V128:$Rn)))]>;
4186 def v2f64 : BaseSIMDTwoSameVector<1, U, {S,1}, opc, V128,
4187 asm, ".2d", ".2d",
4188 [(set (v2f64 V128:$Rd), (OpNode (v2f64 V128:$Rn)))]>;
4189}
4190
4191// Supports only S element size.
4192multiclass SIMDTwoVectorS<bit U, bit S, bits<5> opc, string asm,
4193 SDPatternOperator OpNode> {
4194 def v2i32 : BaseSIMDTwoSameVector<0, U, {S,0}, opc, V64,
4195 asm, ".2s", ".2s",
4196 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn)))]>;
4197 def v4i32 : BaseSIMDTwoSameVector<1, U, {S,0}, opc, V128,
4198 asm, ".4s", ".4s",
4199 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4200}
4201
4202
4203multiclass SIMDTwoVectorFPToInt<bit U, bit S, bits<5> opc, string asm,
4204 SDPatternOperator OpNode> {
4205 def v2f32 : BaseSIMDTwoSameVector<0, U, {S,0}, opc, V64,
4206 asm, ".2s", ".2s",
4207 [(set (v2i32 V64:$Rd), (OpNode (v2f32 V64:$Rn)))]>;
4208 def v4f32 : BaseSIMDTwoSameVector<1, U, {S,0}, opc, V128,
4209 asm, ".4s", ".4s",
4210 [(set (v4i32 V128:$Rd), (OpNode (v4f32 V128:$Rn)))]>;
4211 def v2f64 : BaseSIMDTwoSameVector<1, U, {S,1}, opc, V128,
4212 asm, ".2d", ".2d",
4213 [(set (v2i64 V128:$Rd), (OpNode (v2f64 V128:$Rn)))]>;
4214}
4215
4216multiclass SIMDTwoVectorIntToFP<bit U, bit S, bits<5> opc, string asm,
4217 SDPatternOperator OpNode> {
4218 def v2f32 : BaseSIMDTwoSameVector<0, U, {S,0}, opc, V64,
4219 asm, ".2s", ".2s",
4220 [(set (v2f32 V64:$Rd), (OpNode (v2i32 V64:$Rn)))]>;
4221 def v4f32 : BaseSIMDTwoSameVector<1, U, {S,0}, opc, V128,
4222 asm, ".4s", ".4s",
4223 [(set (v4f32 V128:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4224 def v2f64 : BaseSIMDTwoSameVector<1, U, {S,1}, opc, V128,
4225 asm, ".2d", ".2d",
4226 [(set (v2f64 V128:$Rd), (OpNode (v2i64 V128:$Rn)))]>;
4227}
4228
4229
4230class BaseSIMDMixedTwoVector<bit Q, bit U, bits<2> size, bits<5> opcode,
4231 RegisterOperand inreg, RegisterOperand outreg,
4232 string asm, string outkind, string inkind,
4233 list<dag> pattern>
4234 : I<(outs outreg:$Rd), (ins inreg:$Rn), asm,
4235 "{\t$Rd" # outkind # ", $Rn" # inkind #
4236 "|" # outkind # "\t$Rd, $Rn}", "", pattern>,
4237 Sched<[WriteV]> {
4238 bits<5> Rd;
4239 bits<5> Rn;
4240 let Inst{31} = 0;
4241 let Inst{30} = Q;
4242 let Inst{29} = U;
4243 let Inst{28-24} = 0b01110;
4244 let Inst{23-22} = size;
4245 let Inst{21-17} = 0b10000;
4246 let Inst{16-12} = opcode;
4247 let Inst{11-10} = 0b10;
4248 let Inst{9-5} = Rn;
4249 let Inst{4-0} = Rd;
4250}
4251
4252class BaseSIMDMixedTwoVectorTied<bit Q, bit U, bits<2> size, bits<5> opcode,
4253 RegisterOperand inreg, RegisterOperand outreg,
4254 string asm, string outkind, string inkind,
4255 list<dag> pattern>
4256 : I<(outs outreg:$dst), (ins outreg:$Rd, inreg:$Rn), asm,
4257 "{\t$Rd" # outkind # ", $Rn" # inkind #
4258 "|" # outkind # "\t$Rd, $Rn}", "$Rd = $dst", pattern>,
4259 Sched<[WriteV]> {
4260 bits<5> Rd;
4261 bits<5> Rn;
4262 let Inst{31} = 0;
4263 let Inst{30} = Q;
4264 let Inst{29} = U;
4265 let Inst{28-24} = 0b01110;
4266 let Inst{23-22} = size;
4267 let Inst{21-17} = 0b10000;
4268 let Inst{16-12} = opcode;
4269 let Inst{11-10} = 0b10;
4270 let Inst{9-5} = Rn;
4271 let Inst{4-0} = Rd;
4272}
4273
4274multiclass SIMDMixedTwoVector<bit U, bits<5> opc, string asm,
4275 SDPatternOperator OpNode> {
4276 def v8i8 : BaseSIMDMixedTwoVector<0, U, 0b00, opc, V128, V64,
4277 asm, ".8b", ".8h",
4278 [(set (v8i8 V64:$Rd), (OpNode (v8i16 V128:$Rn)))]>;
4279 def v16i8 : BaseSIMDMixedTwoVectorTied<1, U, 0b00, opc, V128, V128,
4280 asm#"2", ".16b", ".8h", []>;
4281 def v4i16 : BaseSIMDMixedTwoVector<0, U, 0b01, opc, V128, V64,
4282 asm, ".4h", ".4s",
4283 [(set (v4i16 V64:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4284 def v8i16 : BaseSIMDMixedTwoVectorTied<1, U, 0b01, opc, V128, V128,
4285 asm#"2", ".8h", ".4s", []>;
4286 def v2i32 : BaseSIMDMixedTwoVector<0, U, 0b10, opc, V128, V64,
4287 asm, ".2s", ".2d",
4288 [(set (v2i32 V64:$Rd), (OpNode (v2i64 V128:$Rn)))]>;
4289 def v4i32 : BaseSIMDMixedTwoVectorTied<1, U, 0b10, opc, V128, V128,
4290 asm#"2", ".4s", ".2d", []>;
4291
4292 def : Pat<(concat_vectors (v8i8 V64:$Rd), (OpNode (v8i16 V128:$Rn))),
4293 (!cast<Instruction>(NAME # "v16i8")
4294 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub), V128:$Rn)>;
4295 def : Pat<(concat_vectors (v4i16 V64:$Rd), (OpNode (v4i32 V128:$Rn))),
4296 (!cast<Instruction>(NAME # "v8i16")
4297 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub), V128:$Rn)>;
4298 def : Pat<(concat_vectors (v2i32 V64:$Rd), (OpNode (v2i64 V128:$Rn))),
4299 (!cast<Instruction>(NAME # "v4i32")
4300 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub), V128:$Rn)>;
4301}
4302
4303class BaseSIMDCmpTwoVector<bit Q, bit U, bits<2> size, bits<5> opcode,
4304 RegisterOperand regtype, string asm, string kind,
4305 ValueType dty, ValueType sty, SDNode OpNode>
4306 : I<(outs regtype:$Rd), (ins regtype:$Rn), asm,
4307 "{\t$Rd" # kind # ", $Rn" # kind # ", #0" #
4308 "|" # kind # "\t$Rd, $Rn, #0}", "",
4309 [(set (dty regtype:$Rd), (OpNode (sty regtype:$Rn)))]>,
4310 Sched<[WriteV]> {
4311 bits<5> Rd;
4312 bits<5> Rn;
4313 let Inst{31} = 0;
4314 let Inst{30} = Q;
4315 let Inst{29} = U;
4316 let Inst{28-24} = 0b01110;
4317 let Inst{23-22} = size;
4318 let Inst{21-17} = 0b10000;
4319 let Inst{16-12} = opcode;
4320 let Inst{11-10} = 0b10;
4321 let Inst{9-5} = Rn;
4322 let Inst{4-0} = Rd;
4323}
4324
4325// Comparisons support all element sizes, except 1xD.
4326multiclass SIMDCmpTwoVector<bit U, bits<5> opc, string asm,
4327 SDNode OpNode> {
4328 def v8i8rz : BaseSIMDCmpTwoVector<0, U, 0b00, opc, V64,
4329 asm, ".8b",
4330 v8i8, v8i8, OpNode>;
4331 def v16i8rz : BaseSIMDCmpTwoVector<1, U, 0b00, opc, V128,
4332 asm, ".16b",
4333 v16i8, v16i8, OpNode>;
4334 def v4i16rz : BaseSIMDCmpTwoVector<0, U, 0b01, opc, V64,
4335 asm, ".4h",
4336 v4i16, v4i16, OpNode>;
4337 def v8i16rz : BaseSIMDCmpTwoVector<1, U, 0b01, opc, V128,
4338 asm, ".8h",
4339 v8i16, v8i16, OpNode>;
4340 def v2i32rz : BaseSIMDCmpTwoVector<0, U, 0b10, opc, V64,
4341 asm, ".2s",
4342 v2i32, v2i32, OpNode>;
4343 def v4i32rz : BaseSIMDCmpTwoVector<1, U, 0b10, opc, V128,
4344 asm, ".4s",
4345 v4i32, v4i32, OpNode>;
4346 def v2i64rz : BaseSIMDCmpTwoVector<1, U, 0b11, opc, V128,
4347 asm, ".2d",
4348 v2i64, v2i64, OpNode>;
4349}
4350
4351// FP Comparisons support only S and D element sizes.
4352multiclass SIMDFPCmpTwoVector<bit U, bit S, bits<5> opc,
4353 string asm, SDNode OpNode> {
4354 def v2i32rz : BaseSIMDCmpTwoVector<0, U, {S,0}, opc, V64,
4355 asm, ".2s",
4356 v2i32, v2f32, OpNode>;
4357 def v4i32rz : BaseSIMDCmpTwoVector<1, U, {S,0}, opc, V128,
4358 asm, ".4s",
4359 v4i32, v4f32, OpNode>;
4360 def v2i64rz : BaseSIMDCmpTwoVector<1, U, {S,1}, opc, V128,
4361 asm, ".2d",
4362 v2i64, v2f64, OpNode>;
4363}
4364
4365let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
4366class BaseSIMDFPCvtTwoVector<bit Q, bit U, bits<2> size, bits<5> opcode,
4367 RegisterOperand outtype, RegisterOperand intype,
4368 string asm, string VdTy, string VnTy,
4369 list<dag> pattern>
4370 : I<(outs outtype:$Rd), (ins intype:$Rn), asm,
4371 !strconcat("\t$Rd", VdTy, ", $Rn", VnTy), "", pattern>,
4372 Sched<[WriteV]> {
4373 bits<5> Rd;
4374 bits<5> Rn;
4375 let Inst{31} = 0;
4376 let Inst{30} = Q;
4377 let Inst{29} = U;
4378 let Inst{28-24} = 0b01110;
4379 let Inst{23-22} = size;
4380 let Inst{21-17} = 0b10000;
4381 let Inst{16-12} = opcode;
4382 let Inst{11-10} = 0b10;
4383 let Inst{9-5} = Rn;
4384 let Inst{4-0} = Rd;
4385}
4386
4387class BaseSIMDFPCvtTwoVectorTied<bit Q, bit U, bits<2> size, bits<5> opcode,
4388 RegisterOperand outtype, RegisterOperand intype,
4389 string asm, string VdTy, string VnTy,
4390 list<dag> pattern>
4391 : I<(outs outtype:$dst), (ins outtype:$Rd, intype:$Rn), asm,
4392 !strconcat("\t$Rd", VdTy, ", $Rn", VnTy), "$Rd = $dst", pattern>,
4393 Sched<[WriteV]> {
4394 bits<5> Rd;
4395 bits<5> Rn;
4396 let Inst{31} = 0;
4397 let Inst{30} = Q;
4398 let Inst{29} = U;
4399 let Inst{28-24} = 0b01110;
4400 let Inst{23-22} = size;
4401 let Inst{21-17} = 0b10000;
4402 let Inst{16-12} = opcode;
4403 let Inst{11-10} = 0b10;
4404 let Inst{9-5} = Rn;
4405 let Inst{4-0} = Rd;
4406}
4407
4408multiclass SIMDFPWidenTwoVector<bit U, bit S, bits<5> opc, string asm> {
4409 def v4i16 : BaseSIMDFPCvtTwoVector<0, U, {S,0}, opc, V128, V64,
4410 asm, ".4s", ".4h", []>;
4411 def v8i16 : BaseSIMDFPCvtTwoVector<1, U, {S,0}, opc, V128, V128,
4412 asm#"2", ".4s", ".8h", []>;
4413 def v2i32 : BaseSIMDFPCvtTwoVector<0, U, {S,1}, opc, V128, V64,
4414 asm, ".2d", ".2s", []>;
4415 def v4i32 : BaseSIMDFPCvtTwoVector<1, U, {S,1}, opc, V128, V128,
4416 asm#"2", ".2d", ".4s", []>;
4417}
4418
4419multiclass SIMDFPNarrowTwoVector<bit U, bit S, bits<5> opc, string asm> {
4420 def v4i16 : BaseSIMDFPCvtTwoVector<0, U, {S,0}, opc, V64, V128,
4421 asm, ".4h", ".4s", []>;
4422 def v8i16 : BaseSIMDFPCvtTwoVectorTied<1, U, {S,0}, opc, V128, V128,
4423 asm#"2", ".8h", ".4s", []>;
4424 def v2i32 : BaseSIMDFPCvtTwoVector<0, U, {S,1}, opc, V64, V128,
4425 asm, ".2s", ".2d", []>;
4426 def v4i32 : BaseSIMDFPCvtTwoVectorTied<1, U, {S,1}, opc, V128, V128,
4427 asm#"2", ".4s", ".2d", []>;
4428}
4429
4430multiclass SIMDFPInexactCvtTwoVector<bit U, bit S, bits<5> opc, string asm,
4431 Intrinsic OpNode> {
4432 def v2f32 : BaseSIMDFPCvtTwoVector<0, U, {S,1}, opc, V64, V128,
4433 asm, ".2s", ".2d",
4434 [(set (v2f32 V64:$Rd), (OpNode (v2f64 V128:$Rn)))]>;
4435 def v4f32 : BaseSIMDFPCvtTwoVectorTied<1, U, {S,1}, opc, V128, V128,
4436 asm#"2", ".4s", ".2d", []>;
4437
4438 def : Pat<(concat_vectors (v2f32 V64:$Rd), (OpNode (v2f64 V128:$Rn))),
4439 (!cast<Instruction>(NAME # "v4f32")
4440 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub), V128:$Rn)>;
4441}
4442
4443//----------------------------------------------------------------------------
4444// AdvSIMD three register different-size vector instructions.
4445//----------------------------------------------------------------------------
4446
4447let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
4448class BaseSIMDDifferentThreeVector<bit U, bits<3> size, bits<4> opcode,
4449 RegisterOperand outtype, RegisterOperand intype1,
4450 RegisterOperand intype2, string asm,
4451 string outkind, string inkind1, string inkind2,
4452 list<dag> pattern>
4453 : I<(outs outtype:$Rd), (ins intype1:$Rn, intype2:$Rm), asm,
4454 "{\t$Rd" # outkind # ", $Rn" # inkind1 # ", $Rm" # inkind2 #
4455 "|" # outkind # "\t$Rd, $Rn, $Rm}", "", pattern>,
4456 Sched<[WriteV]> {
4457 bits<5> Rd;
4458 bits<5> Rn;
4459 bits<5> Rm;
4460 let Inst{31} = 0;
4461 let Inst{30} = size{0};
4462 let Inst{29} = U;
4463 let Inst{28-24} = 0b01110;
4464 let Inst{23-22} = size{2-1};
4465 let Inst{21} = 1;
4466 let Inst{20-16} = Rm;
4467 let Inst{15-12} = opcode;
4468 let Inst{11-10} = 0b00;
4469 let Inst{9-5} = Rn;
4470 let Inst{4-0} = Rd;
4471}
4472
4473let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
4474class BaseSIMDDifferentThreeVectorTied<bit U, bits<3> size, bits<4> opcode,
4475 RegisterOperand outtype, RegisterOperand intype1,
4476 RegisterOperand intype2, string asm,
4477 string outkind, string inkind1, string inkind2,
4478 list<dag> pattern>
4479 : I<(outs outtype:$dst), (ins outtype:$Rd, intype1:$Rn, intype2:$Rm), asm,
4480 "{\t$Rd" # outkind # ", $Rn" # inkind1 # ", $Rm" # inkind2 #
4481 "|" # outkind # "\t$Rd, $Rn, $Rm}", "$Rd = $dst", pattern>,
4482 Sched<[WriteV]> {
4483 bits<5> Rd;
4484 bits<5> Rn;
4485 bits<5> Rm;
4486 let Inst{31} = 0;
4487 let Inst{30} = size{0};
4488 let Inst{29} = U;
4489 let Inst{28-24} = 0b01110;
4490 let Inst{23-22} = size{2-1};
4491 let Inst{21} = 1;
4492 let Inst{20-16} = Rm;
4493 let Inst{15-12} = opcode;
4494 let Inst{11-10} = 0b00;
4495 let Inst{9-5} = Rn;
4496 let Inst{4-0} = Rd;
4497}
4498
4499// FIXME: TableGen doesn't know how to deal with expanded types that also
4500// change the element count (in this case, placing the results in
4501// the high elements of the result register rather than the low
4502// elements). Until that's fixed, we can't code-gen those.
4503multiclass SIMDNarrowThreeVectorBHS<bit U, bits<4> opc, string asm,
4504 Intrinsic IntOp> {
4505 def v8i16_v8i8 : BaseSIMDDifferentThreeVector<U, 0b000, opc,
4506 V64, V128, V128,
4507 asm, ".8b", ".8h", ".8h",
4508 [(set (v8i8 V64:$Rd), (IntOp (v8i16 V128:$Rn), (v8i16 V128:$Rm)))]>;
4509 def v8i16_v16i8 : BaseSIMDDifferentThreeVectorTied<U, 0b001, opc,
4510 V128, V128, V128,
4511 asm#"2", ".16b", ".8h", ".8h",
4512 []>;
4513 def v4i32_v4i16 : BaseSIMDDifferentThreeVector<U, 0b010, opc,
4514 V64, V128, V128,
4515 asm, ".4h", ".4s", ".4s",
4516 [(set (v4i16 V64:$Rd), (IntOp (v4i32 V128:$Rn), (v4i32 V128:$Rm)))]>;
4517 def v4i32_v8i16 : BaseSIMDDifferentThreeVectorTied<U, 0b011, opc,
4518 V128, V128, V128,
4519 asm#"2", ".8h", ".4s", ".4s",
4520 []>;
4521 def v2i64_v2i32 : BaseSIMDDifferentThreeVector<U, 0b100, opc,
4522 V64, V128, V128,
4523 asm, ".2s", ".2d", ".2d",
4524 [(set (v2i32 V64:$Rd), (IntOp (v2i64 V128:$Rn), (v2i64 V128:$Rm)))]>;
4525 def v2i64_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b101, opc,
4526 V128, V128, V128,
4527 asm#"2", ".4s", ".2d", ".2d",
4528 []>;
4529
4530
4531 // Patterns for the '2' variants involve INSERT_SUBREG, which you can't put in
4532 // a version attached to an instruction.
4533 def : Pat<(concat_vectors (v8i8 V64:$Rd), (IntOp (v8i16 V128:$Rn),
4534 (v8i16 V128:$Rm))),
4535 (!cast<Instruction>(NAME # "v8i16_v16i8")
4536 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
4537 V128:$Rn, V128:$Rm)>;
4538 def : Pat<(concat_vectors (v4i16 V64:$Rd), (IntOp (v4i32 V128:$Rn),
4539 (v4i32 V128:$Rm))),
4540 (!cast<Instruction>(NAME # "v4i32_v8i16")
4541 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
4542 V128:$Rn, V128:$Rm)>;
4543 def : Pat<(concat_vectors (v2i32 V64:$Rd), (IntOp (v2i64 V128:$Rn),
4544 (v2i64 V128:$Rm))),
4545 (!cast<Instruction>(NAME # "v2i64_v4i32")
4546 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
4547 V128:$Rn, V128:$Rm)>;
4548}
4549
4550multiclass SIMDDifferentThreeVectorBD<bit U, bits<4> opc, string asm,
4551 Intrinsic IntOp> {
4552 def v8i8 : BaseSIMDDifferentThreeVector<U, 0b000, opc,
4553 V128, V64, V64,
4554 asm, ".8h", ".8b", ".8b",
4555 [(set (v8i16 V128:$Rd), (IntOp (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
4556 def v16i8 : BaseSIMDDifferentThreeVector<U, 0b001, opc,
4557 V128, V128, V128,
4558 asm#"2", ".8h", ".16b", ".16b", []>;
4559 def v1i64 : BaseSIMDDifferentThreeVector<U, 0b110, opc,
4560 V128, V64, V64,
4561 asm, ".1q", ".1d", ".1d", []>;
4562 def v2i64 : BaseSIMDDifferentThreeVector<U, 0b111, opc,
4563 V128, V128, V128,
4564 asm#"2", ".1q", ".2d", ".2d", []>;
4565
4566 def : Pat<(v8i16 (IntOp (v8i8 (extract_high_v16i8 V128:$Rn)),
4567 (v8i8 (extract_high_v16i8 V128:$Rm)))),
4568 (!cast<Instruction>(NAME#"v16i8") V128:$Rn, V128:$Rm)>;
4569}
4570
4571multiclass SIMDLongThreeVectorHS<bit U, bits<4> opc, string asm,
4572 SDPatternOperator OpNode> {
4573 def v4i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b010, opc,
4574 V128, V64, V64,
4575 asm, ".4s", ".4h", ".4h",
4576 [(set (v4i32 V128:$Rd), (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
4577 def v8i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b011, opc,
4578 V128, V128, V128,
4579 asm#"2", ".4s", ".8h", ".8h",
4580 [(set (v4i32 V128:$Rd), (OpNode (extract_high_v8i16 V128:$Rn),
4581 (extract_high_v8i16 V128:$Rm)))]>;
4582 def v2i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b100, opc,
4583 V128, V64, V64,
4584 asm, ".2d", ".2s", ".2s",
4585 [(set (v2i64 V128:$Rd), (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
4586 def v4i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b101, opc,
4587 V128, V128, V128,
4588 asm#"2", ".2d", ".4s", ".4s",
4589 [(set (v2i64 V128:$Rd), (OpNode (extract_high_v4i32 V128:$Rn),
4590 (extract_high_v4i32 V128:$Rm)))]>;
4591}
4592
4593multiclass SIMDLongThreeVectorBHSabdl<bit U, bits<4> opc, string asm,
4594 SDPatternOperator OpNode = null_frag> {
4595 def v8i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b000, opc,
4596 V128, V64, V64,
4597 asm, ".8h", ".8b", ".8b",
4598 [(set (v8i16 V128:$Rd),
4599 (zext (v8i8 (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm)))))]>;
4600 def v16i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b001, opc,
4601 V128, V128, V128,
4602 asm#"2", ".8h", ".16b", ".16b",
4603 [(set (v8i16 V128:$Rd),
4604 (zext (v8i8 (OpNode (extract_high_v16i8 V128:$Rn),
4605 (extract_high_v16i8 V128:$Rm)))))]>;
4606 def v4i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b010, opc,
4607 V128, V64, V64,
4608 asm, ".4s", ".4h", ".4h",
4609 [(set (v4i32 V128:$Rd),
4610 (zext (v4i16 (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm)))))]>;
4611 def v8i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b011, opc,
4612 V128, V128, V128,
4613 asm#"2", ".4s", ".8h", ".8h",
4614 [(set (v4i32 V128:$Rd),
4615 (zext (v4i16 (OpNode (extract_high_v8i16 V128:$Rn),
4616 (extract_high_v8i16 V128:$Rm)))))]>;
4617 def v2i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b100, opc,
4618 V128, V64, V64,
4619 asm, ".2d", ".2s", ".2s",
4620 [(set (v2i64 V128:$Rd),
4621 (zext (v2i32 (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm)))))]>;
4622 def v4i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b101, opc,
4623 V128, V128, V128,
4624 asm#"2", ".2d", ".4s", ".4s",
4625 [(set (v2i64 V128:$Rd),
4626 (zext (v2i32 (OpNode (extract_high_v4i32 V128:$Rn),
4627 (extract_high_v4i32 V128:$Rm)))))]>;
4628}
4629
4630multiclass SIMDLongThreeVectorTiedBHSabal<bit U, bits<4> opc,
4631 string asm,
4632 SDPatternOperator OpNode> {
4633 def v8i8_v8i16 : BaseSIMDDifferentThreeVectorTied<U, 0b000, opc,
4634 V128, V64, V64,
4635 asm, ".8h", ".8b", ".8b",
4636 [(set (v8i16 V128:$dst),
4637 (add (v8i16 V128:$Rd),
4638 (zext (v8i8 (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm))))))]>;
4639 def v16i8_v8i16 : BaseSIMDDifferentThreeVectorTied<U, 0b001, opc,
4640 V128, V128, V128,
4641 asm#"2", ".8h", ".16b", ".16b",
4642 [(set (v8i16 V128:$dst),
4643 (add (v8i16 V128:$Rd),
4644 (zext (v8i8 (OpNode (extract_high_v16i8 V128:$Rn),
4645 (extract_high_v16i8 V128:$Rm))))))]>;
4646 def v4i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b010, opc,
4647 V128, V64, V64,
4648 asm, ".4s", ".4h", ".4h",
4649 [(set (v4i32 V128:$dst),
4650 (add (v4i32 V128:$Rd),
4651 (zext (v4i16 (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm))))))]>;
4652 def v8i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b011, opc,
4653 V128, V128, V128,
4654 asm#"2", ".4s", ".8h", ".8h",
4655 [(set (v4i32 V128:$dst),
4656 (add (v4i32 V128:$Rd),
4657 (zext (v4i16 (OpNode (extract_high_v8i16 V128:$Rn),
4658 (extract_high_v8i16 V128:$Rm))))))]>;
4659 def v2i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b100, opc,
4660 V128, V64, V64,
4661 asm, ".2d", ".2s", ".2s",
4662 [(set (v2i64 V128:$dst),
4663 (add (v2i64 V128:$Rd),
4664 (zext (v2i32 (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm))))))]>;
4665 def v4i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b101, opc,
4666 V128, V128, V128,
4667 asm#"2", ".2d", ".4s", ".4s",
4668 [(set (v2i64 V128:$dst),
4669 (add (v2i64 V128:$Rd),
4670 (zext (v2i32 (OpNode (extract_high_v4i32 V128:$Rn),
4671 (extract_high_v4i32 V128:$Rm))))))]>;
4672}
4673
4674multiclass SIMDLongThreeVectorBHS<bit U, bits<4> opc, string asm,
4675 SDPatternOperator OpNode = null_frag> {
4676 def v8i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b000, opc,
4677 V128, V64, V64,
4678 asm, ".8h", ".8b", ".8b",
4679 [(set (v8i16 V128:$Rd), (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
4680 def v16i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b001, opc,
4681 V128, V128, V128,
4682 asm#"2", ".8h", ".16b", ".16b",
4683 [(set (v8i16 V128:$Rd), (OpNode (extract_high_v16i8 V128:$Rn),
4684 (extract_high_v16i8 V128:$Rm)))]>;
4685 def v4i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b010, opc,
4686 V128, V64, V64,
4687 asm, ".4s", ".4h", ".4h",
4688 [(set (v4i32 V128:$Rd), (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
4689 def v8i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b011, opc,
4690 V128, V128, V128,
4691 asm#"2", ".4s", ".8h", ".8h",
4692 [(set (v4i32 V128:$Rd), (OpNode (extract_high_v8i16 V128:$Rn),
4693 (extract_high_v8i16 V128:$Rm)))]>;
4694 def v2i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b100, opc,
4695 V128, V64, V64,
4696 asm, ".2d", ".2s", ".2s",
4697 [(set (v2i64 V128:$Rd), (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
4698 def v4i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b101, opc,
4699 V128, V128, V128,
4700 asm#"2", ".2d", ".4s", ".4s",
4701 [(set (v2i64 V128:$Rd), (OpNode (extract_high_v4i32 V128:$Rn),
4702 (extract_high_v4i32 V128:$Rm)))]>;
4703}
4704
4705multiclass SIMDLongThreeVectorTiedBHS<bit U, bits<4> opc,
4706 string asm,
4707 SDPatternOperator OpNode> {
4708 def v8i8_v8i16 : BaseSIMDDifferentThreeVectorTied<U, 0b000, opc,
4709 V128, V64, V64,
4710 asm, ".8h", ".8b", ".8b",
4711 [(set (v8i16 V128:$dst),
4712 (OpNode (v8i16 V128:$Rd), (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
4713 def v16i8_v8i16 : BaseSIMDDifferentThreeVectorTied<U, 0b001, opc,
4714 V128, V128, V128,
4715 asm#"2", ".8h", ".16b", ".16b",
4716 [(set (v8i16 V128:$dst),
4717 (OpNode (v8i16 V128:$Rd),
4718 (extract_high_v16i8 V128:$Rn),
4719 (extract_high_v16i8 V128:$Rm)))]>;
4720 def v4i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b010, opc,
4721 V128, V64, V64,
4722 asm, ".4s", ".4h", ".4h",
4723 [(set (v4i32 V128:$dst),
4724 (OpNode (v4i32 V128:$Rd), (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
4725 def v8i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b011, opc,
4726 V128, V128, V128,
4727 asm#"2", ".4s", ".8h", ".8h",
4728 [(set (v4i32 V128:$dst),
4729 (OpNode (v4i32 V128:$Rd),
4730 (extract_high_v8i16 V128:$Rn),
4731 (extract_high_v8i16 V128:$Rm)))]>;
4732 def v2i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b100, opc,
4733 V128, V64, V64,
4734 asm, ".2d", ".2s", ".2s",
4735 [(set (v2i64 V128:$dst),
4736 (OpNode (v2i64 V128:$Rd), (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
4737 def v4i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b101, opc,
4738 V128, V128, V128,
4739 asm#"2", ".2d", ".4s", ".4s",
4740 [(set (v2i64 V128:$dst),
4741 (OpNode (v2i64 V128:$Rd),
4742 (extract_high_v4i32 V128:$Rn),
4743 (extract_high_v4i32 V128:$Rm)))]>;
4744}
4745
4746multiclass SIMDLongThreeVectorSQDMLXTiedHS<bit U, bits<4> opc, string asm,
4747 SDPatternOperator Accum> {
4748 def v4i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b010, opc,
4749 V128, V64, V64,
4750 asm, ".4s", ".4h", ".4h",
4751 [(set (v4i32 V128:$dst),
4752 (Accum (v4i32 V128:$Rd),
4753 (v4i32 (int_arm64_neon_sqdmull (v4i16 V64:$Rn),
4754 (v4i16 V64:$Rm)))))]>;
4755 def v8i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b011, opc,
4756 V128, V128, V128,
4757 asm#"2", ".4s", ".8h", ".8h",
4758 [(set (v4i32 V128:$dst),
4759 (Accum (v4i32 V128:$Rd),
4760 (v4i32 (int_arm64_neon_sqdmull (extract_high_v8i16 V128:$Rn),
4761 (extract_high_v8i16 V128:$Rm)))))]>;
4762 def v2i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b100, opc,
4763 V128, V64, V64,
4764 asm, ".2d", ".2s", ".2s",
4765 [(set (v2i64 V128:$dst),
4766 (Accum (v2i64 V128:$Rd),
4767 (v2i64 (int_arm64_neon_sqdmull (v2i32 V64:$Rn),
4768 (v2i32 V64:$Rm)))))]>;
4769 def v4i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b101, opc,
4770 V128, V128, V128,
4771 asm#"2", ".2d", ".4s", ".4s",
4772 [(set (v2i64 V128:$dst),
4773 (Accum (v2i64 V128:$Rd),
4774 (v2i64 (int_arm64_neon_sqdmull (extract_high_v4i32 V128:$Rn),
4775 (extract_high_v4i32 V128:$Rm)))))]>;
4776}
4777
4778multiclass SIMDWideThreeVectorBHS<bit U, bits<4> opc, string asm,
4779 SDPatternOperator OpNode> {
4780 def v8i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b000, opc,
4781 V128, V128, V64,
4782 asm, ".8h", ".8h", ".8b",
4783 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn), (v8i8 V64:$Rm)))]>;
4784 def v16i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b001, opc,
4785 V128, V128, V128,
4786 asm#"2", ".8h", ".8h", ".16b",
4787 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn),
4788 (extract_high_v16i8 V128:$Rm)))]>;
4789 def v4i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b010, opc,
4790 V128, V128, V64,
4791 asm, ".4s", ".4s", ".4h",
4792 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn), (v4i16 V64:$Rm)))]>;
4793 def v8i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b011, opc,
4794 V128, V128, V128,
4795 asm#"2", ".4s", ".4s", ".8h",
4796 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn),
4797 (extract_high_v8i16 V128:$Rm)))]>;
4798 def v2i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b100, opc,
4799 V128, V128, V64,
4800 asm, ".2d", ".2d", ".2s",
4801 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn), (v2i32 V64:$Rm)))]>;
4802 def v4i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b101, opc,
4803 V128, V128, V128,
4804 asm#"2", ".2d", ".2d", ".4s",
4805 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn),
4806 (extract_high_v4i32 V128:$Rm)))]>;
4807}
4808
4809//----------------------------------------------------------------------------
4810// AdvSIMD bitwise extract from vector
4811//----------------------------------------------------------------------------
4812
4813class BaseSIMDBitwiseExtract<bit size, RegisterOperand regtype, ValueType vty,
4814 string asm, string kind>
4815 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, i32imm:$imm), asm,
4816 "{\t$Rd" # kind # ", $Rn" # kind # ", $Rm" # kind # ", $imm" #
4817 "|" # kind # "\t$Rd, $Rn, $Rm, $imm}", "",
4818 [(set (vty regtype:$Rd),
4819 (ARM64ext regtype:$Rn, regtype:$Rm, (i32 imm:$imm)))]>,
4820 Sched<[WriteV]> {
4821 bits<5> Rd;
4822 bits<5> Rn;
4823 bits<5> Rm;
4824 bits<4> imm;
4825 let Inst{31} = 0;
4826 let Inst{30} = size;
4827 let Inst{29-21} = 0b101110000;
4828 let Inst{20-16} = Rm;
4829 let Inst{15} = 0;
4830 let Inst{14-11} = imm;
4831 let Inst{10} = 0;
4832 let Inst{9-5} = Rn;
4833 let Inst{4-0} = Rd;
4834}
4835
4836
4837multiclass SIMDBitwiseExtract<string asm> {
4838 def v8i8 : BaseSIMDBitwiseExtract<0, V64, v8i8, asm, ".8b">;
4839 def v16i8 : BaseSIMDBitwiseExtract<1, V128, v16i8, asm, ".16b">;
4840}
4841
4842//----------------------------------------------------------------------------
4843// AdvSIMD zip vector
4844//----------------------------------------------------------------------------
4845
4846class BaseSIMDZipVector<bits<3> size, bits<3> opc, RegisterOperand regtype,
4847 string asm, string kind, SDNode OpNode, ValueType valty>
4848 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm), asm,
4849 "{\t$Rd" # kind # ", $Rn" # kind # ", $Rm" # kind #
4850 "|" # kind # "\t$Rd, $Rn, $Rm}", "",
4851 [(set (valty regtype:$Rd), (OpNode regtype:$Rn, regtype:$Rm))]>,
4852 Sched<[WriteV]> {
4853 bits<5> Rd;
4854 bits<5> Rn;
4855 bits<5> Rm;
4856 let Inst{31} = 0;
4857 let Inst{30} = size{0};
4858 let Inst{29-24} = 0b001110;
4859 let Inst{23-22} = size{2-1};
4860 let Inst{21} = 0;
4861 let Inst{20-16} = Rm;
4862 let Inst{15} = 0;
4863 let Inst{14-12} = opc;
4864 let Inst{11-10} = 0b10;
4865 let Inst{9-5} = Rn;
4866 let Inst{4-0} = Rd;
4867}
4868
4869multiclass SIMDZipVector<bits<3>opc, string asm,
4870 SDNode OpNode> {
4871 def v8i8 : BaseSIMDZipVector<0b000, opc, V64,
4872 asm, ".8b", OpNode, v8i8>;
4873 def v16i8 : BaseSIMDZipVector<0b001, opc, V128,
4874 asm, ".16b", OpNode, v16i8>;
4875 def v4i16 : BaseSIMDZipVector<0b010, opc, V64,
4876 asm, ".4h", OpNode, v4i16>;
4877 def v8i16 : BaseSIMDZipVector<0b011, opc, V128,
4878 asm, ".8h", OpNode, v8i16>;
4879 def v2i32 : BaseSIMDZipVector<0b100, opc, V64,
4880 asm, ".2s", OpNode, v2i32>;
4881 def v4i32 : BaseSIMDZipVector<0b101, opc, V128,
4882 asm, ".4s", OpNode, v4i32>;
4883 def v2i64 : BaseSIMDZipVector<0b111, opc, V128,
4884 asm, ".2d", OpNode, v2i64>;
4885
4886 def : Pat<(v2f32 (OpNode V64:$Rn, V64:$Rm)),
4887 (!cast<Instruction>(NAME#"v2i32") V64:$Rn, V64:$Rm)>;
4888 def : Pat<(v4f32 (OpNode V128:$Rn, V128:$Rm)),
4889 (!cast<Instruction>(NAME#"v4i32") V128:$Rn, V128:$Rm)>;
4890 def : Pat<(v2f64 (OpNode V128:$Rn, V128:$Rm)),
4891 (!cast<Instruction>(NAME#"v2i64") V128:$Rn, V128:$Rm)>;
4892}
4893
4894//----------------------------------------------------------------------------
4895// AdvSIMD three register scalar instructions
4896//----------------------------------------------------------------------------
4897
4898let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
4899class BaseSIMDThreeScalar<bit U, bits<2> size, bits<5> opcode,
4900 RegisterClass regtype, string asm,
4901 list<dag> pattern>
4902 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm), asm,
4903 "\t$Rd, $Rn, $Rm", "", pattern>,
4904 Sched<[WriteV]> {
4905 bits<5> Rd;
4906 bits<5> Rn;
4907 bits<5> Rm;
4908 let Inst{31-30} = 0b01;
4909 let Inst{29} = U;
4910 let Inst{28-24} = 0b11110;
4911 let Inst{23-22} = size;
4912 let Inst{21} = 1;
4913 let Inst{20-16} = Rm;
4914 let Inst{15-11} = opcode;
4915 let Inst{10} = 1;
4916 let Inst{9-5} = Rn;
4917 let Inst{4-0} = Rd;
4918}
4919
4920multiclass SIMDThreeScalarD<bit U, bits<5> opc, string asm,
4921 SDPatternOperator OpNode> {
4922 def v1i64 : BaseSIMDThreeScalar<U, 0b11, opc, FPR64, asm,
4923 [(set (v1i64 FPR64:$Rd), (OpNode (v1i64 FPR64:$Rn), (v1i64 FPR64:$Rm)))]>;
4924}
4925
4926multiclass SIMDThreeScalarBHSD<bit U, bits<5> opc, string asm,
4927 SDPatternOperator OpNode> {
4928 def v1i64 : BaseSIMDThreeScalar<U, 0b11, opc, FPR64, asm,
4929 [(set (v1i64 FPR64:$Rd), (OpNode (v1i64 FPR64:$Rn), (v1i64 FPR64:$Rm)))]>;
4930 def v1i32 : BaseSIMDThreeScalar<U, 0b10, opc, FPR32, asm, []>;
4931 def v1i16 : BaseSIMDThreeScalar<U, 0b01, opc, FPR16, asm, []>;
4932 def v1i8 : BaseSIMDThreeScalar<U, 0b00, opc, FPR8 , asm, []>;
4933
4934 def : Pat<(i64 (OpNode (i64 FPR64:$Rn), (i64 FPR64:$Rm))),
4935 (!cast<Instruction>(NAME#"v1i64") FPR64:$Rn, FPR64:$Rm)>;
4936 def : Pat<(i32 (OpNode (i32 FPR32:$Rn), (i32 FPR32:$Rm))),
4937 (!cast<Instruction>(NAME#"v1i32") FPR32:$Rn, FPR32:$Rm)>;
4938}
4939
4940multiclass SIMDThreeScalarHS<bit U, bits<5> opc, string asm,
4941 SDPatternOperator OpNode> {
4942 def v1i32 : BaseSIMDThreeScalar<U, 0b10, opc, FPR32, asm,
4943 [(set FPR32:$Rd, (OpNode FPR32:$Rn, FPR32:$Rm))]>;
4944 def v1i16 : BaseSIMDThreeScalar<U, 0b01, opc, FPR16, asm, []>;
4945}
4946
4947multiclass SIMDThreeScalarSD<bit U, bit S, bits<5> opc, string asm,
4948 SDPatternOperator OpNode = null_frag> {
4949 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
4950 def #NAME#64 : BaseSIMDThreeScalar<U, {S,1}, opc, FPR64, asm,
4951 [(set (f64 FPR64:$Rd), (OpNode (f64 FPR64:$Rn), (f64 FPR64:$Rm)))]>;
4952 def #NAME#32 : BaseSIMDThreeScalar<U, {S,0}, opc, FPR32, asm,
4953 [(set FPR32:$Rd, (OpNode FPR32:$Rn, FPR32:$Rm))]>;
4954 }
4955
4956 def : Pat<(v1f64 (OpNode (v1f64 FPR64:$Rn), (v1f64 FPR64:$Rm))),
4957 (!cast<Instruction>(NAME # "64") FPR64:$Rn, FPR64:$Rm)>;
4958}
4959
4960multiclass SIMDThreeScalarFPCmp<bit U, bit S, bits<5> opc, string asm,
4961 SDPatternOperator OpNode = null_frag> {
4962 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
4963 def #NAME#64 : BaseSIMDThreeScalar<U, {S,1}, opc, FPR64, asm,
4964 [(set (i64 FPR64:$Rd), (OpNode (f64 FPR64:$Rn), (f64 FPR64:$Rm)))]>;
4965 def #NAME#32 : BaseSIMDThreeScalar<U, {S,0}, opc, FPR32, asm,
4966 [(set (i32 FPR32:$Rd), (OpNode (f32 FPR32:$Rn), (f32 FPR32:$Rm)))]>;
4967 }
4968
4969 def : Pat<(v1i64 (OpNode (v1f64 FPR64:$Rn), (v1f64 FPR64:$Rm))),
4970 (!cast<Instruction>(NAME # "64") FPR64:$Rn, FPR64:$Rm)>;
4971}
4972
4973class BaseSIMDThreeScalarMixed<bit U, bits<2> size, bits<5> opcode,
4974 dag oops, dag iops, string asm, string cstr, list<dag> pat>
4975 : I<oops, iops, asm,
4976 "\t$Rd, $Rn, $Rm", cstr, pat>,
4977 Sched<[WriteV]> {
4978 bits<5> Rd;
4979 bits<5> Rn;
4980 bits<5> Rm;
4981 let Inst{31-30} = 0b01;
4982 let Inst{29} = U;
4983 let Inst{28-24} = 0b11110;
4984 let Inst{23-22} = size;
4985 let Inst{21} = 1;
4986 let Inst{20-16} = Rm;
4987 let Inst{15-11} = opcode;
4988 let Inst{10} = 0;
4989 let Inst{9-5} = Rn;
4990 let Inst{4-0} = Rd;
4991}
4992
4993let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
4994multiclass SIMDThreeScalarMixedHS<bit U, bits<5> opc, string asm,
4995 SDPatternOperator OpNode = null_frag> {
4996 def i16 : BaseSIMDThreeScalarMixed<U, 0b01, opc,
4997 (outs FPR32:$Rd),
4998 (ins FPR16:$Rn, FPR16:$Rm), asm, "", []>;
4999 def i32 : BaseSIMDThreeScalarMixed<U, 0b10, opc,
5000 (outs FPR64:$Rd),
5001 (ins FPR32:$Rn, FPR32:$Rm), asm, "",
5002 [(set (i64 FPR64:$Rd), (OpNode (i32 FPR32:$Rn), (i32 FPR32:$Rm)))]>;
5003}
5004
5005let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5006multiclass SIMDThreeScalarMixedTiedHS<bit U, bits<5> opc, string asm,
5007 SDPatternOperator OpNode = null_frag> {
5008 def i16 : BaseSIMDThreeScalarMixed<U, 0b01, opc,
5009 (outs FPR32:$dst),
5010 (ins FPR32:$Rd, FPR16:$Rn, FPR16:$Rm),
5011 asm, "$Rd = $dst", []>;
5012 def i32 : BaseSIMDThreeScalarMixed<U, 0b10, opc,
5013 (outs FPR64:$dst),
5014 (ins FPR64:$Rd, FPR32:$Rn, FPR32:$Rm),
5015 asm, "$Rd = $dst",
5016 [(set (i64 FPR64:$dst),
5017 (OpNode (i64 FPR64:$Rd), (i32 FPR32:$Rn), (i32 FPR32:$Rm)))]>;
5018}
5019
5020//----------------------------------------------------------------------------
5021// AdvSIMD two register scalar instructions
5022//----------------------------------------------------------------------------
5023
5024let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5025class BaseSIMDTwoScalar<bit U, bits<2> size, bits<5> opcode,
5026 RegisterClass regtype, RegisterClass regtype2,
5027 string asm, list<dag> pat>
5028 : I<(outs regtype:$Rd), (ins regtype2:$Rn), asm,
5029 "\t$Rd, $Rn", "", pat>,
5030 Sched<[WriteV]> {
5031 bits<5> Rd;
5032 bits<5> Rn;
5033 let Inst{31-30} = 0b01;
5034 let Inst{29} = U;
5035 let Inst{28-24} = 0b11110;
5036 let Inst{23-22} = size;
5037 let Inst{21-17} = 0b10000;
5038 let Inst{16-12} = opcode;
5039 let Inst{11-10} = 0b10;
5040 let Inst{9-5} = Rn;
5041 let Inst{4-0} = Rd;
5042}
5043
5044let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5045class BaseSIMDTwoScalarTied<bit U, bits<2> size, bits<5> opcode,
5046 RegisterClass regtype, RegisterClass regtype2,
5047 string asm, list<dag> pat>
5048 : I<(outs regtype:$dst), (ins regtype:$Rd, regtype2:$Rn), asm,
5049 "\t$Rd, $Rn", "$Rd = $dst", pat>,
5050 Sched<[WriteV]> {
5051 bits<5> Rd;
5052 bits<5> Rn;
5053 let Inst{31-30} = 0b01;
5054 let Inst{29} = U;
5055 let Inst{28-24} = 0b11110;
5056 let Inst{23-22} = size;
5057 let Inst{21-17} = 0b10000;
5058 let Inst{16-12} = opcode;
5059 let Inst{11-10} = 0b10;
5060 let Inst{9-5} = Rn;
5061 let Inst{4-0} = Rd;
5062}
5063
5064
5065let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5066class BaseSIMDCmpTwoScalar<bit U, bits<2> size, bits<5> opcode,
5067 RegisterClass regtype, string asm>
5068 : I<(outs regtype:$Rd), (ins regtype:$Rn), asm,
5069 "\t$Rd, $Rn, #0", "", []>,
5070 Sched<[WriteV]> {
5071 bits<5> Rd;
5072 bits<5> Rn;
5073 let Inst{31-30} = 0b01;
5074 let Inst{29} = U;
5075 let Inst{28-24} = 0b11110;
5076 let Inst{23-22} = size;
5077 let Inst{21-17} = 0b10000;
5078 let Inst{16-12} = opcode;
5079 let Inst{11-10} = 0b10;
5080 let Inst{9-5} = Rn;
5081 let Inst{4-0} = Rd;
5082}
5083
5084class SIMDInexactCvtTwoScalar<bits<5> opcode, string asm>
5085 : I<(outs FPR32:$Rd), (ins FPR64:$Rn), asm, "\t$Rd, $Rn", "",
5086 [(set (f32 FPR32:$Rd), (int_arm64_sisd_fcvtxn (f64 FPR64:$Rn)))]>,
5087 Sched<[WriteV]> {
5088 bits<5> Rd;
5089 bits<5> Rn;
5090 let Inst{31-17} = 0b011111100110000;
5091 let Inst{16-12} = opcode;
5092 let Inst{11-10} = 0b10;
5093 let Inst{9-5} = Rn;
5094 let Inst{4-0} = Rd;
5095}
5096
5097multiclass SIMDCmpTwoScalarD<bit U, bits<5> opc, string asm,
5098 SDPatternOperator OpNode> {
5099 def v1i64rz : BaseSIMDCmpTwoScalar<U, 0b11, opc, FPR64, asm>;
5100
5101 def : Pat<(v1i64 (OpNode FPR64:$Rn)),
5102 (!cast<Instruction>(NAME # v1i64rz) FPR64:$Rn)>;
5103}
5104
5105multiclass SIMDCmpTwoScalarSD<bit U, bit S, bits<5> opc, string asm,
5106 SDPatternOperator OpNode> {
5107 def v1i64rz : BaseSIMDCmpTwoScalar<U, {S,1}, opc, FPR64, asm>;
5108 def v1i32rz : BaseSIMDCmpTwoScalar<U, {S,0}, opc, FPR32, asm>;
5109
5110 def : Pat<(v1i64 (OpNode (v1f64 FPR64:$Rn))),
5111 (!cast<Instruction>(NAME # v1i64rz) FPR64:$Rn)>;
5112}
5113
5114multiclass SIMDTwoScalarD<bit U, bits<5> opc, string asm,
5115 SDPatternOperator OpNode = null_frag> {
5116 def v1i64 : BaseSIMDTwoScalar<U, 0b11, opc, FPR64, FPR64, asm,
5117 [(set (v1i64 FPR64:$Rd), (OpNode (v1i64 FPR64:$Rn)))]>;
Tim Northoverf4810362014-03-31 15:46:17 +00005118
5119 def : Pat<(i64 (OpNode (i64 FPR64:$Rn))),
5120 (!cast<Instruction>(NAME # "v1i64") FPR64:$Rn)>;
Tim Northover00ed9962014-03-29 10:18:08 +00005121}
5122
5123multiclass SIMDTwoScalarSD<bit U, bit S, bits<5> opc, string asm> {
5124 def v1i64 : BaseSIMDTwoScalar<U, {S,1}, opc, FPR64, FPR64, asm,[]>;
5125 def v1i32 : BaseSIMDTwoScalar<U, {S,0}, opc, FPR32, FPR32, asm,[]>;
5126}
5127
5128multiclass SIMDTwoScalarCVTSD<bit U, bit S, bits<5> opc, string asm,
5129 SDPatternOperator OpNode> {
5130 def v1i64 : BaseSIMDTwoScalar<U, {S,1}, opc, FPR64, FPR64, asm,
5131 [(set FPR64:$Rd, (OpNode (f64 FPR64:$Rn)))]>;
5132 def v1i32 : BaseSIMDTwoScalar<U, {S,0}, opc, FPR32, FPR32, asm,
5133 [(set FPR32:$Rd, (OpNode (f32 FPR32:$Rn)))]>;
5134}
5135
5136multiclass SIMDTwoScalarBHSD<bit U, bits<5> opc, string asm,
5137 SDPatternOperator OpNode = null_frag> {
5138 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
5139 def v1i64 : BaseSIMDTwoScalar<U, 0b11, opc, FPR64, FPR64, asm,
5140 [(set (i64 FPR64:$Rd), (OpNode (i64 FPR64:$Rn)))]>;
5141 def v1i32 : BaseSIMDTwoScalar<U, 0b10, opc, FPR32, FPR32, asm,
5142 [(set (i32 FPR32:$Rd), (OpNode (i32 FPR32:$Rn)))]>;
5143 def v1i16 : BaseSIMDTwoScalar<U, 0b01, opc, FPR16, FPR16, asm, []>;
5144 def v1i8 : BaseSIMDTwoScalar<U, 0b00, opc, FPR8 , FPR8 , asm, []>;
5145 }
5146
5147 def : Pat<(v1i64 (OpNode (v1i64 FPR64:$Rn))),
5148 (!cast<Instruction>(NAME # v1i64) FPR64:$Rn)>;
5149}
5150
Tim Northover00ed9962014-03-29 10:18:08 +00005151multiclass SIMDTwoScalarBHSDTied<bit U, bits<5> opc, string asm,
5152 Intrinsic OpNode> {
Tim Northover903814c2014-03-31 15:46:26 +00005153 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
5154 def v1i64 : BaseSIMDTwoScalarTied<U, 0b11, opc, FPR64, FPR64, asm,
5155 [(set (i64 FPR64:$dst), (OpNode (i64 FPR64:$Rd), (i64 FPR64:$Rn)))]>;
5156 def v1i32 : BaseSIMDTwoScalarTied<U, 0b10, opc, FPR32, FPR32, asm,
5157 [(set (i32 FPR32:$dst), (OpNode (i32 FPR32:$Rd), (i32 FPR32:$Rn)))]>;
5158 def v1i16 : BaseSIMDTwoScalarTied<U, 0b01, opc, FPR16, FPR16, asm, []>;
5159 def v1i8 : BaseSIMDTwoScalarTied<U, 0b00, opc, FPR8 , FPR8 , asm, []>;
5160 }
5161
5162 def : Pat<(v1i64 (OpNode (v1i64 FPR64:$Rd), (v1i64 FPR64:$Rn))),
5163 (!cast<Instruction>(NAME # v1i64) FPR64:$Rd, FPR64:$Rn)>;
Tim Northover00ed9962014-03-29 10:18:08 +00005164}
5165
5166
5167
5168let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5169multiclass SIMDTwoScalarMixedBHS<bit U, bits<5> opc, string asm,
5170 SDPatternOperator OpNode = null_frag> {
5171 def v1i32 : BaseSIMDTwoScalar<U, 0b10, opc, FPR32, FPR64, asm,
5172 [(set (i32 FPR32:$Rd), (OpNode (i64 FPR64:$Rn)))]>;
5173 def v1i16 : BaseSIMDTwoScalar<U, 0b01, opc, FPR16, FPR32, asm, []>;
5174 def v1i8 : BaseSIMDTwoScalar<U, 0b00, opc, FPR8 , FPR16, asm, []>;
5175}
5176
5177//----------------------------------------------------------------------------
5178// AdvSIMD scalar pairwise instructions
5179//----------------------------------------------------------------------------
5180
5181let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5182class BaseSIMDPairwiseScalar<bit U, bits<2> size, bits<5> opcode,
5183 RegisterOperand regtype, RegisterOperand vectype,
5184 string asm, string kind>
5185 : I<(outs regtype:$Rd), (ins vectype:$Rn), asm,
5186 "{\t$Rd, $Rn" # kind # "|" # kind # "\t$Rd, $Rn}", "", []>,
5187 Sched<[WriteV]> {
5188 bits<5> Rd;
5189 bits<5> Rn;
5190 let Inst{31-30} = 0b01;
5191 let Inst{29} = U;
5192 let Inst{28-24} = 0b11110;
5193 let Inst{23-22} = size;
5194 let Inst{21-17} = 0b11000;
5195 let Inst{16-12} = opcode;
5196 let Inst{11-10} = 0b10;
5197 let Inst{9-5} = Rn;
5198 let Inst{4-0} = Rd;
5199}
5200
5201multiclass SIMDPairwiseScalarD<bit U, bits<5> opc, string asm> {
5202 def v2i64p : BaseSIMDPairwiseScalar<U, 0b11, opc, FPR64Op, V128,
5203 asm, ".2d">;
5204}
5205
5206multiclass SIMDPairwiseScalarSD<bit U, bit S, bits<5> opc, string asm> {
5207 def v2i32p : BaseSIMDPairwiseScalar<U, {S,0}, opc, FPR32Op, V64,
5208 asm, ".2s">;
5209 def v2i64p : BaseSIMDPairwiseScalar<U, {S,1}, opc, FPR64Op, V128,
5210 asm, ".2d">;
5211}
5212
5213//----------------------------------------------------------------------------
5214// AdvSIMD across lanes instructions
5215//----------------------------------------------------------------------------
5216
5217let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5218class BaseSIMDAcrossLanes<bit Q, bit U, bits<2> size, bits<5> opcode,
5219 RegisterClass regtype, RegisterOperand vectype,
5220 string asm, string kind, list<dag> pattern>
5221 : I<(outs regtype:$Rd), (ins vectype:$Rn), asm,
5222 "{\t$Rd, $Rn" # kind # "|" # kind # "\t$Rd, $Rn}", "", pattern>,
5223 Sched<[WriteV]> {
5224 bits<5> Rd;
5225 bits<5> Rn;
5226 let Inst{31} = 0;
5227 let Inst{30} = Q;
5228 let Inst{29} = U;
5229 let Inst{28-24} = 0b01110;
5230 let Inst{23-22} = size;
5231 let Inst{21-17} = 0b11000;
5232 let Inst{16-12} = opcode;
5233 let Inst{11-10} = 0b10;
5234 let Inst{9-5} = Rn;
5235 let Inst{4-0} = Rd;
5236}
5237
5238multiclass SIMDAcrossLanesBHS<bit U, bits<5> opcode,
5239 string asm> {
5240 def v8i8v : BaseSIMDAcrossLanes<0, U, 0b00, opcode, FPR8, V64,
5241 asm, ".8b", []>;
5242 def v16i8v : BaseSIMDAcrossLanes<1, U, 0b00, opcode, FPR8, V128,
5243 asm, ".16b", []>;
5244 def v4i16v : BaseSIMDAcrossLanes<0, U, 0b01, opcode, FPR16, V64,
5245 asm, ".4h", []>;
5246 def v8i16v : BaseSIMDAcrossLanes<1, U, 0b01, opcode, FPR16, V128,
5247 asm, ".8h", []>;
5248 def v4i32v : BaseSIMDAcrossLanes<1, U, 0b10, opcode, FPR32, V128,
5249 asm, ".4s", []>;
5250}
5251
5252multiclass SIMDAcrossLanesHSD<bit U, bits<5> opcode, string asm> {
5253 def v8i8v : BaseSIMDAcrossLanes<0, U, 0b00, opcode, FPR16, V64,
5254 asm, ".8b", []>;
5255 def v16i8v : BaseSIMDAcrossLanes<1, U, 0b00, opcode, FPR16, V128,
5256 asm, ".16b", []>;
5257 def v4i16v : BaseSIMDAcrossLanes<0, U, 0b01, opcode, FPR32, V64,
5258 asm, ".4h", []>;
5259 def v8i16v : BaseSIMDAcrossLanes<1, U, 0b01, opcode, FPR32, V128,
5260 asm, ".8h", []>;
5261 def v4i32v : BaseSIMDAcrossLanes<1, U, 0b10, opcode, FPR64, V128,
5262 asm, ".4s", []>;
5263}
5264
5265multiclass SIMDAcrossLanesS<bits<5> opcode, bit sz1, string asm,
5266 Intrinsic intOp> {
5267 def v4i32v : BaseSIMDAcrossLanes<1, 1, {sz1, 0}, opcode, FPR32, V128,
5268 asm, ".4s",
5269 [(set FPR32:$Rd, (intOp (v4f32 V128:$Rn)))]>;
5270}
5271
5272//----------------------------------------------------------------------------
5273// AdvSIMD INS/DUP instructions
5274//----------------------------------------------------------------------------
5275
5276// FIXME: There has got to be a better way to factor these. ugh.
5277
5278class BaseSIMDInsDup<bit Q, bit op, dag outs, dag ins, string asm,
5279 string operands, string constraints, list<dag> pattern>
5280 : I<outs, ins, asm, operands, constraints, pattern>,
5281 Sched<[WriteV]> {
5282 bits<5> Rd;
5283 bits<5> Rn;
5284 let Inst{31} = 0;
5285 let Inst{30} = Q;
5286 let Inst{29} = op;
5287 let Inst{28-21} = 0b01110000;
5288 let Inst{15} = 0;
5289 let Inst{10} = 1;
5290 let Inst{9-5} = Rn;
5291 let Inst{4-0} = Rd;
5292}
5293
5294class SIMDDupFromMain<bit Q, bits<5> imm5, string size, ValueType vectype,
5295 RegisterOperand vecreg, RegisterClass regtype>
5296 : BaseSIMDInsDup<Q, 0, (outs vecreg:$Rd), (ins regtype:$Rn), "dup",
5297 "{\t$Rd" # size # ", $Rn" #
5298 "|" # size # "\t$Rd, $Rn}", "",
5299 [(set (vectype vecreg:$Rd), (ARM64dup regtype:$Rn))]> {
5300 let Inst{20-16} = imm5;
5301 let Inst{14-11} = 0b0001;
5302}
5303
5304class SIMDDupFromElement<bit Q, string dstkind, string srckind,
5305 ValueType vectype, ValueType insreg,
5306 RegisterOperand vecreg, Operand idxtype,
5307 ValueType elttype, SDNode OpNode>
5308 : BaseSIMDInsDup<Q, 0, (outs vecreg:$Rd), (ins V128:$Rn, idxtype:$idx), "dup",
5309 "{\t$Rd" # dstkind # ", $Rn" # srckind # "$idx" #
5310 "|" # dstkind # "\t$Rd, $Rn$idx}", "",
5311 [(set (vectype vecreg:$Rd),
5312 (OpNode (insreg V128:$Rn), idxtype:$idx))]> {
5313 let Inst{14-11} = 0b0000;
5314}
5315
5316class SIMDDup64FromElement
5317 : SIMDDupFromElement<1, ".2d", ".d", v2i64, v2i64, V128,
5318 VectorIndexD, i64, ARM64duplane64> {
5319 bits<1> idx;
5320 let Inst{20} = idx;
5321 let Inst{19-16} = 0b1000;
5322}
5323
5324class SIMDDup32FromElement<bit Q, string size, ValueType vectype,
5325 RegisterOperand vecreg>
5326 : SIMDDupFromElement<Q, size, ".s", vectype, v4i32, vecreg,
5327 VectorIndexS, i64, ARM64duplane32> {
5328 bits<2> idx;
5329 let Inst{20-19} = idx;
5330 let Inst{18-16} = 0b100;
5331}
5332
5333class SIMDDup16FromElement<bit Q, string size, ValueType vectype,
5334 RegisterOperand vecreg>
5335 : SIMDDupFromElement<Q, size, ".h", vectype, v8i16, vecreg,
5336 VectorIndexH, i64, ARM64duplane16> {
5337 bits<3> idx;
5338 let Inst{20-18} = idx;
5339 let Inst{17-16} = 0b10;
5340}
5341
5342class SIMDDup8FromElement<bit Q, string size, ValueType vectype,
5343 RegisterOperand vecreg>
5344 : SIMDDupFromElement<Q, size, ".b", vectype, v16i8, vecreg,
5345 VectorIndexB, i64, ARM64duplane8> {
5346 bits<4> idx;
5347 let Inst{20-17} = idx;
5348 let Inst{16} = 1;
5349}
5350
5351class BaseSIMDMov<bit Q, string size, bits<4> imm4, RegisterClass regtype,
5352 Operand idxtype, string asm, list<dag> pattern>
5353 : BaseSIMDInsDup<Q, 0, (outs regtype:$Rd), (ins V128:$Rn, idxtype:$idx), asm,
5354 "{\t$Rd, $Rn" # size # "$idx" #
5355 "|" # size # "\t$Rd, $Rn$idx}", "", pattern> {
5356 let Inst{14-11} = imm4;
5357}
5358
5359class SIMDSMov<bit Q, string size, RegisterClass regtype,
5360 Operand idxtype>
5361 : BaseSIMDMov<Q, size, 0b0101, regtype, idxtype, "smov", []>;
5362class SIMDUMov<bit Q, string size, ValueType vectype, RegisterClass regtype,
5363 Operand idxtype>
5364 : BaseSIMDMov<Q, size, 0b0111, regtype, idxtype, "umov",
5365 [(set regtype:$Rd, (vector_extract (vectype V128:$Rn), idxtype:$idx))]>;
5366
5367class SIMDMovAlias<string asm, string size, Instruction inst,
5368 RegisterClass regtype, Operand idxtype>
5369 : InstAlias<asm#"{\t$dst, $src"#size#"$idx" #
5370 "|" # size # "\t$dst, $src$idx}",
5371 (inst regtype:$dst, V128:$src, idxtype:$idx)>;
5372
5373multiclass SMov {
5374 def vi8to32 : SIMDSMov<0, ".b", GPR32, VectorIndexB> {
5375 bits<4> idx;
5376 let Inst{20-17} = idx;
5377 let Inst{16} = 1;
5378 }
5379 def vi8to64 : SIMDSMov<1, ".b", GPR64, VectorIndexB> {
5380 bits<4> idx;
5381 let Inst{20-17} = idx;
5382 let Inst{16} = 1;
5383 }
5384 def vi16to32 : SIMDSMov<0, ".h", GPR32, VectorIndexH> {
5385 bits<3> idx;
5386 let Inst{20-18} = idx;
5387 let Inst{17-16} = 0b10;
5388 }
5389 def vi16to64 : SIMDSMov<1, ".h", GPR64, VectorIndexH> {
5390 bits<3> idx;
5391 let Inst{20-18} = idx;
5392 let Inst{17-16} = 0b10;
5393 }
5394 def vi32to64 : SIMDSMov<1, ".s", GPR64, VectorIndexS> {
5395 bits<2> idx;
5396 let Inst{20-19} = idx;
5397 let Inst{18-16} = 0b100;
5398 }
5399}
5400
5401multiclass UMov {
5402 def vi8 : SIMDUMov<0, ".b", v16i8, GPR32, VectorIndexB> {
5403 bits<4> idx;
5404 let Inst{20-17} = idx;
5405 let Inst{16} = 1;
5406 }
5407 def vi16 : SIMDUMov<0, ".h", v8i16, GPR32, VectorIndexH> {
5408 bits<3> idx;
5409 let Inst{20-18} = idx;
5410 let Inst{17-16} = 0b10;
5411 }
5412 def vi32 : SIMDUMov<0, ".s", v4i32, GPR32, VectorIndexS> {
5413 bits<2> idx;
5414 let Inst{20-19} = idx;
5415 let Inst{18-16} = 0b100;
5416 }
5417 def vi64 : SIMDUMov<1, ".d", v2i64, GPR64, VectorIndexD> {
5418 bits<1> idx;
5419 let Inst{20} = idx;
5420 let Inst{19-16} = 0b1000;
5421 }
5422 def : SIMDMovAlias<"mov", ".s",
5423 !cast<Instruction>(NAME#"vi32"),
5424 GPR32, VectorIndexS>;
5425 def : SIMDMovAlias<"mov", ".d",
5426 !cast<Instruction>(NAME#"vi64"),
5427 GPR64, VectorIndexD>;
5428}
5429
5430class SIMDInsFromMain<string size, ValueType vectype,
5431 RegisterClass regtype, Operand idxtype>
5432 : BaseSIMDInsDup<1, 0, (outs V128:$dst),
5433 (ins V128:$Rd, idxtype:$idx, regtype:$Rn), "ins",
5434 "{\t$Rd" # size # "$idx, $Rn" #
5435 "|" # size # "\t$Rd$idx, $Rn}",
5436 "$Rd = $dst",
5437 [(set V128:$dst,
5438 (vector_insert (vectype V128:$Rd), regtype:$Rn, idxtype:$idx))]> {
5439 let Inst{14-11} = 0b0011;
5440}
5441
5442class SIMDInsFromElement<string size, ValueType vectype,
5443 ValueType elttype, Operand idxtype>
5444 : BaseSIMDInsDup<1, 1, (outs V128:$dst),
5445 (ins V128:$Rd, idxtype:$idx, V128:$Rn, idxtype:$idx2), "ins",
5446 "{\t$Rd" # size # "$idx, $Rn" # size # "$idx2" #
5447 "|" # size # "\t$Rd$idx, $Rn$idx2}",
5448 "$Rd = $dst",
5449 [(set V128:$dst,
5450 (vector_insert
5451 (vectype V128:$Rd),
5452 (elttype (vector_extract (vectype V128:$Rn), idxtype:$idx2)),
5453 idxtype:$idx))]>;
5454
5455class SIMDInsMainMovAlias<string size, Instruction inst,
5456 RegisterClass regtype, Operand idxtype>
5457 : InstAlias<"mov" # "{\t$dst" # size # "$idx, $src" #
5458 "|" # size #"\t$dst$idx, $src}",
5459 (inst V128:$dst, idxtype:$idx, regtype:$src)>;
5460class SIMDInsElementMovAlias<string size, Instruction inst,
5461 Operand idxtype>
5462 : InstAlias<"mov" # "{\t$dst" # size # "$idx, $src" # size # "$idx2" #
5463 # "|" # size #" $dst$idx, $src$idx2}",
5464 (inst V128:$dst, idxtype:$idx, V128:$src, idxtype:$idx2)>;
5465
5466
5467multiclass SIMDIns {
5468 def vi8gpr : SIMDInsFromMain<".b", v16i8, GPR32, VectorIndexB> {
5469 bits<4> idx;
5470 let Inst{20-17} = idx;
5471 let Inst{16} = 1;
5472 }
5473 def vi16gpr : SIMDInsFromMain<".h", v8i16, GPR32, VectorIndexH> {
5474 bits<3> idx;
5475 let Inst{20-18} = idx;
5476 let Inst{17-16} = 0b10;
5477 }
5478 def vi32gpr : SIMDInsFromMain<".s", v4i32, GPR32, VectorIndexS> {
5479 bits<2> idx;
5480 let Inst{20-19} = idx;
5481 let Inst{18-16} = 0b100;
5482 }
5483 def vi64gpr : SIMDInsFromMain<".d", v2i64, GPR64, VectorIndexD> {
5484 bits<1> idx;
5485 let Inst{20} = idx;
5486 let Inst{19-16} = 0b1000;
5487 }
5488
5489 def vi8lane : SIMDInsFromElement<".b", v16i8, i32, VectorIndexB> {
5490 bits<4> idx;
5491 bits<4> idx2;
5492 let Inst{20-17} = idx;
5493 let Inst{16} = 1;
5494 let Inst{14-11} = idx2;
5495 }
5496 def vi16lane : SIMDInsFromElement<".h", v8i16, i32, VectorIndexH> {
5497 bits<3> idx;
5498 bits<3> idx2;
5499 let Inst{20-18} = idx;
5500 let Inst{17-16} = 0b10;
5501 let Inst{14-12} = idx2;
5502 let Inst{11} = 0;
5503 }
5504 def vi32lane : SIMDInsFromElement<".s", v4i32, i32, VectorIndexS> {
5505 bits<2> idx;
5506 bits<2> idx2;
5507 let Inst{20-19} = idx;
5508 let Inst{18-16} = 0b100;
5509 let Inst{14-13} = idx2;
5510 let Inst{12-11} = 0;
5511 }
5512 def vi64lane : SIMDInsFromElement<".d", v2i64, i64, VectorIndexD> {
5513 bits<1> idx;
5514 bits<1> idx2;
5515 let Inst{20} = idx;
5516 let Inst{19-16} = 0b1000;
5517 let Inst{14} = idx2;
5518 let Inst{13-11} = 0;
5519 }
5520
5521 // For all forms of the INS instruction, the "mov" mnemonic is the
5522 // preferred alias. Why they didn't just call the instruction "mov" in
5523 // the first place is a very good question indeed...
5524 def : SIMDInsMainMovAlias<".b", !cast<Instruction>(NAME#"vi8gpr"),
5525 GPR32, VectorIndexB>;
5526 def : SIMDInsMainMovAlias<".h", !cast<Instruction>(NAME#"vi16gpr"),
5527 GPR32, VectorIndexH>;
5528 def : SIMDInsMainMovAlias<".s", !cast<Instruction>(NAME#"vi32gpr"),
5529 GPR32, VectorIndexS>;
5530 def : SIMDInsMainMovAlias<".d", !cast<Instruction>(NAME#"vi64gpr"),
5531 GPR64, VectorIndexD>;
5532
5533 def : SIMDInsElementMovAlias<".b", !cast<Instruction>(NAME#"vi8lane"),
5534 VectorIndexB>;
5535 def : SIMDInsElementMovAlias<".h", !cast<Instruction>(NAME#"vi16lane"),
5536 VectorIndexH>;
5537 def : SIMDInsElementMovAlias<".s", !cast<Instruction>(NAME#"vi32lane"),
5538 VectorIndexS>;
5539 def : SIMDInsElementMovAlias<".d", !cast<Instruction>(NAME#"vi64lane"),
5540 VectorIndexD>;
5541}
5542
5543//----------------------------------------------------------------------------
5544// AdvSIMD TBL/TBX
5545//----------------------------------------------------------------------------
5546
5547let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
5548class BaseSIMDTableLookup<bit Q, bits<2> len, bit op, RegisterOperand vectype,
5549 RegisterOperand listtype, string asm, string kind>
5550 : I<(outs vectype:$Vd), (ins listtype:$Vn, vectype:$Vm), asm,
5551 "\t$Vd" # kind # ", $Vn, $Vm" # kind, "", []>,
5552 Sched<[WriteV]> {
5553 bits<5> Vd;
5554 bits<5> Vn;
5555 bits<5> Vm;
5556 let Inst{31} = 0;
5557 let Inst{30} = Q;
5558 let Inst{29-21} = 0b001110000;
5559 let Inst{20-16} = Vm;
5560 let Inst{15} = 0;
5561 let Inst{14-13} = len;
5562 let Inst{12} = op;
5563 let Inst{11-10} = 0b00;
5564 let Inst{9-5} = Vn;
5565 let Inst{4-0} = Vd;
5566}
5567
5568let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
5569class BaseSIMDTableLookupTied<bit Q, bits<2> len, bit op, RegisterOperand vectype,
5570 RegisterOperand listtype, string asm, string kind>
5571 : I<(outs vectype:$dst), (ins vectype:$Vd, listtype:$Vn, vectype:$Vm), asm,
5572 "\t$Vd" # kind # ", $Vn, $Vm" # kind, "$Vd = $dst", []>,
5573 Sched<[WriteV]> {
5574 bits<5> Vd;
5575 bits<5> Vn;
5576 bits<5> Vm;
5577 let Inst{31} = 0;
5578 let Inst{30} = Q;
5579 let Inst{29-21} = 0b001110000;
5580 let Inst{20-16} = Vm;
5581 let Inst{15} = 0;
5582 let Inst{14-13} = len;
5583 let Inst{12} = op;
5584 let Inst{11-10} = 0b00;
5585 let Inst{9-5} = Vn;
5586 let Inst{4-0} = Vd;
5587}
5588
5589class SIMDTableLookupAlias<string asm, Instruction inst,
5590 RegisterOperand vectype, RegisterOperand listtype>
5591 : InstAlias<!strconcat(asm, "\t$dst, $lst, $index"),
5592 (inst vectype:$dst, listtype:$lst, vectype:$index), 0>;
5593
5594multiclass SIMDTableLookup<bit op, string asm> {
5595 def v8i8One : BaseSIMDTableLookup<0, 0b00, op, V64, VecListOne16b,
5596 asm, ".8b">;
5597 def v8i8Two : BaseSIMDTableLookup<0, 0b01, op, V64, VecListTwo16b,
5598 asm, ".8b">;
5599 def v8i8Three : BaseSIMDTableLookup<0, 0b10, op, V64, VecListThree16b,
5600 asm, ".8b">;
5601 def v8i8Four : BaseSIMDTableLookup<0, 0b11, op, V64, VecListFour16b,
5602 asm, ".8b">;
5603 def v16i8One : BaseSIMDTableLookup<1, 0b00, op, V128, VecListOne16b,
5604 asm, ".16b">;
5605 def v16i8Two : BaseSIMDTableLookup<1, 0b01, op, V128, VecListTwo16b,
5606 asm, ".16b">;
5607 def v16i8Three: BaseSIMDTableLookup<1, 0b10, op, V128, VecListThree16b,
5608 asm, ".16b">;
5609 def v16i8Four : BaseSIMDTableLookup<1, 0b11, op, V128, VecListFour16b,
5610 asm, ".16b">;
5611
5612 def : SIMDTableLookupAlias<asm # ".8b",
5613 !cast<Instruction>(NAME#"v8i8One"),
5614 V64, VecListOne128>;
5615 def : SIMDTableLookupAlias<asm # ".8b",
5616 !cast<Instruction>(NAME#"v8i8Two"),
5617 V64, VecListTwo128>;
5618 def : SIMDTableLookupAlias<asm # ".8b",
5619 !cast<Instruction>(NAME#"v8i8Three"),
5620 V64, VecListThree128>;
5621 def : SIMDTableLookupAlias<asm # ".8b",
5622 !cast<Instruction>(NAME#"v8i8Four"),
5623 V64, VecListFour128>;
5624 def : SIMDTableLookupAlias<asm # ".16b",
5625 !cast<Instruction>(NAME#"v16i8One"),
5626 V128, VecListOne128>;
5627 def : SIMDTableLookupAlias<asm # ".16b",
5628 !cast<Instruction>(NAME#"v16i8Two"),
5629 V128, VecListTwo128>;
5630 def : SIMDTableLookupAlias<asm # ".16b",
5631 !cast<Instruction>(NAME#"v16i8Three"),
5632 V128, VecListThree128>;
5633 def : SIMDTableLookupAlias<asm # ".16b",
5634 !cast<Instruction>(NAME#"v16i8Four"),
5635 V128, VecListFour128>;
5636}
5637
5638multiclass SIMDTableLookupTied<bit op, string asm> {
5639 def v8i8One : BaseSIMDTableLookupTied<0, 0b00, op, V64, VecListOne16b,
5640 asm, ".8b">;
5641 def v8i8Two : BaseSIMDTableLookupTied<0, 0b01, op, V64, VecListTwo16b,
5642 asm, ".8b">;
5643 def v8i8Three : BaseSIMDTableLookupTied<0, 0b10, op, V64, VecListThree16b,
5644 asm, ".8b">;
5645 def v8i8Four : BaseSIMDTableLookupTied<0, 0b11, op, V64, VecListFour16b,
5646 asm, ".8b">;
5647 def v16i8One : BaseSIMDTableLookupTied<1, 0b00, op, V128, VecListOne16b,
5648 asm, ".16b">;
5649 def v16i8Two : BaseSIMDTableLookupTied<1, 0b01, op, V128, VecListTwo16b,
5650 asm, ".16b">;
5651 def v16i8Three: BaseSIMDTableLookupTied<1, 0b10, op, V128, VecListThree16b,
5652 asm, ".16b">;
5653 def v16i8Four : BaseSIMDTableLookupTied<1, 0b11, op, V128, VecListFour16b,
5654 asm, ".16b">;
5655
5656 def : SIMDTableLookupAlias<asm # ".8b",
5657 !cast<Instruction>(NAME#"v8i8One"),
5658 V64, VecListOne128>;
5659 def : SIMDTableLookupAlias<asm # ".8b",
5660 !cast<Instruction>(NAME#"v8i8Two"),
5661 V64, VecListTwo128>;
5662 def : SIMDTableLookupAlias<asm # ".8b",
5663 !cast<Instruction>(NAME#"v8i8Three"),
5664 V64, VecListThree128>;
5665 def : SIMDTableLookupAlias<asm # ".8b",
5666 !cast<Instruction>(NAME#"v8i8Four"),
5667 V64, VecListFour128>;
5668 def : SIMDTableLookupAlias<asm # ".16b",
5669 !cast<Instruction>(NAME#"v16i8One"),
5670 V128, VecListOne128>;
5671 def : SIMDTableLookupAlias<asm # ".16b",
5672 !cast<Instruction>(NAME#"v16i8Two"),
5673 V128, VecListTwo128>;
5674 def : SIMDTableLookupAlias<asm # ".16b",
5675 !cast<Instruction>(NAME#"v16i8Three"),
5676 V128, VecListThree128>;
5677 def : SIMDTableLookupAlias<asm # ".16b",
5678 !cast<Instruction>(NAME#"v16i8Four"),
5679 V128, VecListFour128>;
5680}
5681
5682
5683//----------------------------------------------------------------------------
5684// AdvSIMD scalar CPY
5685//----------------------------------------------------------------------------
5686let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5687class BaseSIMDScalarCPY<RegisterClass regtype, RegisterOperand vectype,
5688 string kind, Operand idxtype>
5689 : I<(outs regtype:$dst), (ins vectype:$src, idxtype:$idx), "mov",
5690 "{\t$dst, $src" # kind # "$idx" #
5691 "|\t$dst, $src$idx}", "", []>,
5692 Sched<[WriteV]> {
5693 bits<5> dst;
5694 bits<5> src;
5695 let Inst{31-21} = 0b01011110000;
5696 let Inst{15-10} = 0b000001;
5697 let Inst{9-5} = src;
5698 let Inst{4-0} = dst;
5699}
5700
5701class SIMDScalarCPYAlias<string asm, string size, Instruction inst,
5702 RegisterClass regtype, RegisterOperand vectype, Operand idxtype>
5703 : InstAlias<asm # "{\t$dst, $src" # size # "$index" #
5704 # "|\t$dst, $src$index}",
5705 (inst regtype:$dst, vectype:$src, idxtype:$index)>;
5706
5707
5708multiclass SIMDScalarCPY<string asm> {
5709 def i8 : BaseSIMDScalarCPY<FPR8, V128, ".b", VectorIndexB> {
5710 bits<4> idx;
5711 let Inst{20-17} = idx;
5712 let Inst{16} = 1;
5713 }
5714 def i16 : BaseSIMDScalarCPY<FPR16, V128, ".h", VectorIndexH> {
5715 bits<3> idx;
5716 let Inst{20-18} = idx;
5717 let Inst{17-16} = 0b10;
5718 }
5719 def i32 : BaseSIMDScalarCPY<FPR32, V128, ".s", VectorIndexS> {
5720 bits<2> idx;
5721 let Inst{20-19} = idx;
5722 let Inst{18-16} = 0b100;
5723 }
5724 def i64 : BaseSIMDScalarCPY<FPR64, V128, ".d", VectorIndexD> {
5725 bits<1> idx;
5726 let Inst{20} = idx;
5727 let Inst{19-16} = 0b1000;
5728 }
5729
5730 // 'DUP' mnemonic aliases.
5731 def : SIMDScalarCPYAlias<"dup", ".b",
5732 !cast<Instruction>(NAME#"i8"),
5733 FPR8, V128, VectorIndexB>;
5734 def : SIMDScalarCPYAlias<"dup", ".h",
5735 !cast<Instruction>(NAME#"i16"),
5736 FPR16, V128, VectorIndexH>;
5737 def : SIMDScalarCPYAlias<"dup", ".s",
5738 !cast<Instruction>(NAME#"i32"),
5739 FPR32, V128, VectorIndexS>;
5740 def : SIMDScalarCPYAlias<"dup", ".d",
5741 !cast<Instruction>(NAME#"i64"),
5742 FPR64, V128, VectorIndexD>;
5743}
5744
5745//----------------------------------------------------------------------------
5746// AdvSIMD modified immediate instructions
5747//----------------------------------------------------------------------------
5748
5749class BaseSIMDModifiedImm<bit Q, bit op, dag oops, dag iops,
5750 string asm, string op_string,
5751 string cstr, list<dag> pattern>
5752 : I<oops, iops, asm, op_string, cstr, pattern>,
5753 Sched<[WriteV]> {
5754 bits<5> Rd;
5755 bits<8> imm8;
5756 let Inst{31} = 0;
5757 let Inst{30} = Q;
5758 let Inst{29} = op;
5759 let Inst{28-19} = 0b0111100000;
5760 let Inst{18-16} = imm8{7-5};
5761 let Inst{11-10} = 0b01;
5762 let Inst{9-5} = imm8{4-0};
5763 let Inst{4-0} = Rd;
5764}
5765
5766class BaseSIMDModifiedImmVector<bit Q, bit op, RegisterOperand vectype,
5767 Operand immtype, dag opt_shift_iop,
5768 string opt_shift, string asm, string kind,
5769 list<dag> pattern>
5770 : BaseSIMDModifiedImm<Q, op, (outs vectype:$Rd),
5771 !con((ins immtype:$imm8), opt_shift_iop), asm,
5772 "{\t$Rd" # kind # ", $imm8" # opt_shift #
5773 "|" # kind # "\t$Rd, $imm8" # opt_shift # "}",
5774 "", pattern> {
5775 let DecoderMethod = "DecodeModImmInstruction";
5776}
5777
5778class BaseSIMDModifiedImmVectorTied<bit Q, bit op, RegisterOperand vectype,
5779 Operand immtype, dag opt_shift_iop,
5780 string opt_shift, string asm, string kind,
5781 list<dag> pattern>
5782 : BaseSIMDModifiedImm<Q, op, (outs vectype:$dst),
5783 !con((ins vectype:$Rd, immtype:$imm8), opt_shift_iop),
5784 asm, "{\t$Rd" # kind # ", $imm8" # opt_shift #
5785 "|" # kind # "\t$Rd, $imm8" # opt_shift # "}",
5786 "$Rd = $dst", pattern> {
5787 let DecoderMethod = "DecodeModImmTiedInstruction";
5788}
5789
5790class BaseSIMDModifiedImmVectorShift<bit Q, bit op, bits<2> b15_b12,
5791 RegisterOperand vectype, string asm,
5792 string kind, list<dag> pattern>
5793 : BaseSIMDModifiedImmVector<Q, op, vectype, imm0_255,
5794 (ins logical_vec_shift:$shift),
5795 "$shift", asm, kind, pattern> {
5796 bits<2> shift;
5797 let Inst{15} = b15_b12{1};
5798 let Inst{14-13} = shift;
5799 let Inst{12} = b15_b12{0};
5800}
5801
5802class BaseSIMDModifiedImmVectorShiftTied<bit Q, bit op, bits<2> b15_b12,
5803 RegisterOperand vectype, string asm,
5804 string kind, list<dag> pattern>
5805 : BaseSIMDModifiedImmVectorTied<Q, op, vectype, imm0_255,
5806 (ins logical_vec_shift:$shift),
5807 "$shift", asm, kind, pattern> {
5808 bits<2> shift;
5809 let Inst{15} = b15_b12{1};
5810 let Inst{14-13} = shift;
5811 let Inst{12} = b15_b12{0};
5812}
5813
5814
5815class BaseSIMDModifiedImmVectorShiftHalf<bit Q, bit op, bits<2> b15_b12,
5816 RegisterOperand vectype, string asm,
5817 string kind, list<dag> pattern>
5818 : BaseSIMDModifiedImmVector<Q, op, vectype, imm0_255,
5819 (ins logical_vec_hw_shift:$shift),
5820 "$shift", asm, kind, pattern> {
5821 bits<2> shift;
5822 let Inst{15} = b15_b12{1};
5823 let Inst{14} = 0;
5824 let Inst{13} = shift{0};
5825 let Inst{12} = b15_b12{0};
5826}
5827
5828class BaseSIMDModifiedImmVectorShiftHalfTied<bit Q, bit op, bits<2> b15_b12,
5829 RegisterOperand vectype, string asm,
5830 string kind, list<dag> pattern>
5831 : BaseSIMDModifiedImmVectorTied<Q, op, vectype, imm0_255,
5832 (ins logical_vec_hw_shift:$shift),
5833 "$shift", asm, kind, pattern> {
5834 bits<2> shift;
5835 let Inst{15} = b15_b12{1};
5836 let Inst{14} = 0;
5837 let Inst{13} = shift{0};
5838 let Inst{12} = b15_b12{0};
5839}
5840
5841multiclass SIMDModifiedImmVectorShift<bit op, bits<2> hw_cmode, bits<2> w_cmode,
5842 string asm> {
5843 def v4i16 : BaseSIMDModifiedImmVectorShiftHalf<0, op, hw_cmode, V64,
5844 asm, ".4h", []>;
5845 def v8i16 : BaseSIMDModifiedImmVectorShiftHalf<1, op, hw_cmode, V128,
5846 asm, ".8h", []>;
5847
5848 def v2i32 : BaseSIMDModifiedImmVectorShift<0, op, w_cmode, V64,
5849 asm, ".2s", []>;
5850 def v4i32 : BaseSIMDModifiedImmVectorShift<1, op, w_cmode, V128,
5851 asm, ".4s", []>;
5852}
5853
5854multiclass SIMDModifiedImmVectorShiftTied<bit op, bits<2> hw_cmode,
5855 bits<2> w_cmode, string asm,
5856 SDNode OpNode> {
5857 def v4i16 : BaseSIMDModifiedImmVectorShiftHalfTied<0, op, hw_cmode, V64,
5858 asm, ".4h",
5859 [(set (v4i16 V64:$dst), (OpNode V64:$Rd,
5860 imm0_255:$imm8,
5861 (i32 imm:$shift)))]>;
5862 def v8i16 : BaseSIMDModifiedImmVectorShiftHalfTied<1, op, hw_cmode, V128,
5863 asm, ".8h",
5864 [(set (v8i16 V128:$dst), (OpNode V128:$Rd,
5865 imm0_255:$imm8,
5866 (i32 imm:$shift)))]>;
5867
5868 def v2i32 : BaseSIMDModifiedImmVectorShiftTied<0, op, w_cmode, V64,
5869 asm, ".2s",
5870 [(set (v2i32 V64:$dst), (OpNode V64:$Rd,
5871 imm0_255:$imm8,
5872 (i32 imm:$shift)))]>;
5873 def v4i32 : BaseSIMDModifiedImmVectorShiftTied<1, op, w_cmode, V128,
5874 asm, ".4s",
5875 [(set (v4i32 V128:$dst), (OpNode V128:$Rd,
5876 imm0_255:$imm8,
5877 (i32 imm:$shift)))]>;
5878}
5879
5880class SIMDModifiedImmMoveMSL<bit Q, bit op, bits<4> cmode,
5881 RegisterOperand vectype, string asm,
5882 string kind, list<dag> pattern>
5883 : BaseSIMDModifiedImmVector<Q, op, vectype, imm0_255,
5884 (ins move_vec_shift:$shift),
5885 "$shift", asm, kind, pattern> {
5886 bits<1> shift;
5887 let Inst{15-13} = cmode{3-1};
5888 let Inst{12} = shift;
5889}
5890
5891class SIMDModifiedImmVectorNoShift<bit Q, bit op, bits<4> cmode,
5892 RegisterOperand vectype,
5893 Operand imm_type, string asm,
5894 string kind, list<dag> pattern>
5895 : BaseSIMDModifiedImmVector<Q, op, vectype, imm_type, (ins), "",
5896 asm, kind, pattern> {
5897 let Inst{15-12} = cmode;
5898}
5899
5900class SIMDModifiedImmScalarNoShift<bit Q, bit op, bits<4> cmode, string asm,
5901 list<dag> pattern>
5902 : BaseSIMDModifiedImm<Q, op, (outs FPR64:$Rd), (ins simdimmtype10:$imm8), asm,
5903 "\t$Rd, $imm8", "", pattern> {
5904 let Inst{15-12} = cmode;
5905 let DecoderMethod = "DecodeModImmInstruction";
5906}
5907
5908//----------------------------------------------------------------------------
5909// AdvSIMD indexed element
5910//----------------------------------------------------------------------------
5911
5912let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5913class BaseSIMDIndexed<bit Q, bit U, bit Scalar, bits<2> size, bits<4> opc,
5914 RegisterOperand dst_reg, RegisterOperand lhs_reg,
5915 RegisterOperand rhs_reg, Operand vec_idx, string asm,
5916 string apple_kind, string dst_kind, string lhs_kind,
5917 string rhs_kind, list<dag> pattern>
5918 : I<(outs dst_reg:$Rd), (ins lhs_reg:$Rn, rhs_reg:$Rm, vec_idx:$idx),
5919 asm,
5920 "{\t$Rd" # dst_kind # ", $Rn" # lhs_kind # ", $Rm" # rhs_kind # "$idx" #
5921 "|" # apple_kind # "\t$Rd, $Rn, $Rm$idx}", "", pattern>,
5922 Sched<[WriteV]> {
5923 bits<5> Rd;
5924 bits<5> Rn;
5925 bits<5> Rm;
5926
5927 let Inst{31} = 0;
5928 let Inst{30} = Q;
5929 let Inst{29} = U;
5930 let Inst{28} = Scalar;
5931 let Inst{27-24} = 0b1111;
5932 let Inst{23-22} = size;
5933 // Bit 21 must be set by the derived class.
5934 let Inst{20-16} = Rm;
5935 let Inst{15-12} = opc;
5936 // Bit 11 must be set by the derived class.
5937 let Inst{10} = 0;
5938 let Inst{9-5} = Rn;
5939 let Inst{4-0} = Rd;
5940}
5941
5942let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5943class BaseSIMDIndexedTied<bit Q, bit U, bit Scalar, bits<2> size, bits<4> opc,
5944 RegisterOperand dst_reg, RegisterOperand lhs_reg,
5945 RegisterOperand rhs_reg, Operand vec_idx, string asm,
5946 string apple_kind, string dst_kind, string lhs_kind,
5947 string rhs_kind, list<dag> pattern>
5948 : I<(outs dst_reg:$dst),
5949 (ins dst_reg:$Rd, lhs_reg:$Rn, rhs_reg:$Rm, vec_idx:$idx), asm,
5950 "{\t$Rd" # dst_kind # ", $Rn" # lhs_kind # ", $Rm" # rhs_kind # "$idx" #
5951 "|" # apple_kind # "\t$Rd, $Rn, $Rm$idx}", "$Rd = $dst", pattern>,
5952 Sched<[WriteV]> {
5953 bits<5> Rd;
5954 bits<5> Rn;
5955 bits<5> Rm;
5956
5957 let Inst{31} = 0;
5958 let Inst{30} = Q;
5959 let Inst{29} = U;
5960 let Inst{28} = Scalar;
5961 let Inst{27-24} = 0b1111;
5962 let Inst{23-22} = size;
5963 // Bit 21 must be set by the derived class.
5964 let Inst{20-16} = Rm;
5965 let Inst{15-12} = opc;
5966 // Bit 11 must be set by the derived class.
5967 let Inst{10} = 0;
5968 let Inst{9-5} = Rn;
5969 let Inst{4-0} = Rd;
5970}
5971
5972multiclass SIMDFPIndexedSD<bit U, bits<4> opc, string asm,
5973 SDPatternOperator OpNode> {
5974 def v2i32_indexed : BaseSIMDIndexed<0, U, 0, 0b10, opc,
5975 V64, V64,
5976 V128, VectorIndexS,
5977 asm, ".2s", ".2s", ".2s", ".s",
5978 [(set (v2f32 V64:$Rd),
5979 (OpNode (v2f32 V64:$Rn),
5980 (v2f32 (ARM64duplane32 (v4f32 V128:$Rm), VectorIndexS:$idx))))]> {
5981 bits<2> idx;
5982 let Inst{11} = idx{1};
5983 let Inst{21} = idx{0};
5984 }
5985
5986 def v4i32_indexed : BaseSIMDIndexed<1, U, 0, 0b10, opc,
5987 V128, V128,
5988 V128, VectorIndexS,
5989 asm, ".4s", ".4s", ".4s", ".s",
5990 [(set (v4f32 V128:$Rd),
5991 (OpNode (v4f32 V128:$Rn),
5992 (v4f32 (ARM64duplane32 (v4f32 V128:$Rm), VectorIndexS:$idx))))]> {
5993 bits<2> idx;
5994 let Inst{11} = idx{1};
5995 let Inst{21} = idx{0};
5996 }
5997
5998 def v2i64_indexed : BaseSIMDIndexed<1, U, 0, 0b11, opc,
5999 V128, V128,
6000 V128, VectorIndexD,
6001 asm, ".2d", ".2d", ".2d", ".d",
6002 [(set (v2f64 V128:$Rd),
6003 (OpNode (v2f64 V128:$Rn),
6004 (v2f64 (ARM64duplane64 (v2f64 V128:$Rm), VectorIndexD:$idx))))]> {
6005 bits<1> idx;
6006 let Inst{11} = idx{0};
6007 let Inst{21} = 0;
6008 }
6009
6010 def v1i32_indexed : BaseSIMDIndexed<1, U, 1, 0b10, opc,
6011 FPR32Op, FPR32Op, V128, VectorIndexS,
6012 asm, ".s", "", "", ".s",
6013 [(set (f32 FPR32Op:$Rd),
6014 (OpNode (f32 FPR32Op:$Rn),
6015 (f32 (vector_extract (v4f32 V128:$Rm),
6016 VectorIndexS:$idx))))]> {
6017 bits<2> idx;
6018 let Inst{11} = idx{1};
6019 let Inst{21} = idx{0};
6020 }
6021
6022 def v1i64_indexed : BaseSIMDIndexed<1, U, 1, 0b11, opc,
6023 FPR64Op, FPR64Op, V128, VectorIndexD,
6024 asm, ".d", "", "", ".d",
6025 [(set (f64 FPR64Op:$Rd),
6026 (OpNode (f64 FPR64Op:$Rn),
6027 (f64 (vector_extract (v2f64 V128:$Rm),
6028 VectorIndexD:$idx))))]> {
6029 bits<1> idx;
6030 let Inst{11} = idx{0};
6031 let Inst{21} = 0;
6032 }
6033}
6034
6035multiclass SIMDFPIndexedSDTiedPatterns<string INST, SDPatternOperator OpNode> {
6036 // 2 variants for the .2s version: DUPLANE from 128-bit and DUP scalar.
6037 def : Pat<(v2f32 (OpNode (v2f32 V64:$Rd), (v2f32 V64:$Rn),
6038 (ARM64duplane32 (v4f32 V128:$Rm),
6039 VectorIndexS:$idx))),
6040 (!cast<Instruction>(INST # v2i32_indexed)
6041 V64:$Rd, V64:$Rn, V128:$Rm, VectorIndexS:$idx)>;
6042 def : Pat<(v2f32 (OpNode (v2f32 V64:$Rd), (v2f32 V64:$Rn),
6043 (ARM64dup (f32 FPR32Op:$Rm)))),
6044 (!cast<Instruction>(INST # "v2i32_indexed") V64:$Rd, V64:$Rn,
6045 (SUBREG_TO_REG (i32 0), FPR32Op:$Rm, ssub), (i64 0))>;
6046
6047
6048 // 2 variants for the .4s version: DUPLANE from 128-bit and DUP scalar.
6049 def : Pat<(v4f32 (OpNode (v4f32 V128:$Rd), (v4f32 V128:$Rn),
6050 (ARM64duplane32 (v4f32 V128:$Rm),
6051 VectorIndexS:$idx))),
6052 (!cast<Instruction>(INST # "v4i32_indexed")
6053 V128:$Rd, V128:$Rn, V128:$Rm, VectorIndexS:$idx)>;
6054 def : Pat<(v4f32 (OpNode (v4f32 V128:$Rd), (v4f32 V128:$Rn),
6055 (ARM64dup (f32 FPR32Op:$Rm)))),
6056 (!cast<Instruction>(INST # "v4i32_indexed") V128:$Rd, V128:$Rn,
6057 (SUBREG_TO_REG (i32 0), FPR32Op:$Rm, ssub), (i64 0))>;
6058
6059 // 2 variants for the .2d version: DUPLANE from 128-bit and DUP scalar.
6060 def : Pat<(v2f64 (OpNode (v2f64 V128:$Rd), (v2f64 V128:$Rn),
6061 (ARM64duplane64 (v2f64 V128:$Rm),
6062 VectorIndexD:$idx))),
6063 (!cast<Instruction>(INST # "v2i64_indexed")
6064 V128:$Rd, V128:$Rn, V128:$Rm, VectorIndexS:$idx)>;
6065 def : Pat<(v2f64 (OpNode (v2f64 V128:$Rd), (v2f64 V128:$Rn),
6066 (ARM64dup (f64 FPR64Op:$Rm)))),
6067 (!cast<Instruction>(INST # "v2i64_indexed") V128:$Rd, V128:$Rn,
6068 (SUBREG_TO_REG (i32 0), FPR64Op:$Rm, dsub), (i64 0))>;
6069
6070 // 2 variants for 32-bit scalar version: extract from .2s or from .4s
6071 def : Pat<(f32 (OpNode (f32 FPR32:$Rd), (f32 FPR32:$Rn),
6072 (vector_extract (v4f32 V128:$Rm), VectorIndexS:$idx))),
6073 (!cast<Instruction>(INST # "v1i32_indexed") FPR32:$Rd, FPR32:$Rn,
6074 V128:$Rm, VectorIndexS:$idx)>;
6075 def : Pat<(f32 (OpNode (f32 FPR32:$Rd), (f32 FPR32:$Rn),
6076 (vector_extract (v2f32 V64:$Rm), VectorIndexS:$idx))),
6077 (!cast<Instruction>(INST # "v1i32_indexed") FPR32:$Rd, FPR32:$Rn,
6078 (SUBREG_TO_REG (i32 0), V64:$Rm, dsub), VectorIndexS:$idx)>;
6079
6080 // 1 variant for 64-bit scalar version: extract from .1d or from .2d
6081 def : Pat<(f64 (OpNode (f64 FPR64:$Rd), (f64 FPR64:$Rn),
6082 (vector_extract (v2f64 V128:$Rm), VectorIndexD:$idx))),
6083 (!cast<Instruction>(INST # "v1i64_indexed") FPR64:$Rd, FPR64:$Rn,
6084 V128:$Rm, VectorIndexD:$idx)>;
6085}
6086
6087multiclass SIMDFPIndexedSDTied<bit U, bits<4> opc, string asm> {
6088 def v2i32_indexed : BaseSIMDIndexedTied<0, U, 0, 0b10, opc, V64, V64,
6089 V128, VectorIndexS,
6090 asm, ".2s", ".2s", ".2s", ".s", []> {
6091 bits<2> idx;
6092 let Inst{11} = idx{1};
6093 let Inst{21} = idx{0};
6094 }
6095
6096 def v4i32_indexed : BaseSIMDIndexedTied<1, U, 0, 0b10, opc,
6097 V128, V128,
6098 V128, VectorIndexS,
6099 asm, ".4s", ".4s", ".4s", ".s", []> {
6100 bits<2> idx;
6101 let Inst{11} = idx{1};
6102 let Inst{21} = idx{0};
6103 }
6104
6105 def v2i64_indexed : BaseSIMDIndexedTied<1, U, 0, 0b11, opc,
6106 V128, V128,
6107 V128, VectorIndexD,
6108 asm, ".2d", ".2d", ".2d", ".d", []> {
6109 bits<1> idx;
6110 let Inst{11} = idx{0};
6111 let Inst{21} = 0;
6112 }
6113
6114
6115 def v1i32_indexed : BaseSIMDIndexedTied<1, U, 1, 0b10, opc,
6116 FPR32Op, FPR32Op, V128, VectorIndexS,
6117 asm, ".s", "", "", ".s", []> {
6118 bits<2> idx;
6119 let Inst{11} = idx{1};
6120 let Inst{21} = idx{0};
6121 }
6122
6123 def v1i64_indexed : BaseSIMDIndexedTied<1, U, 1, 0b11, opc,
6124 FPR64Op, FPR64Op, V128, VectorIndexD,
6125 asm, ".d", "", "", ".d", []> {
6126 bits<1> idx;
6127 let Inst{11} = idx{0};
6128 let Inst{21} = 0;
6129 }
6130}
6131
6132multiclass SIMDIndexedHS<bit U, bits<4> opc, string asm,
6133 SDPatternOperator OpNode> {
6134 def v4i16_indexed : BaseSIMDIndexed<0, U, 0, 0b01, opc, V64, V64,
6135 V128_lo, VectorIndexH,
6136 asm, ".4h", ".4h", ".4h", ".h",
6137 [(set (v4i16 V64:$Rd),
6138 (OpNode (v4i16 V64:$Rn),
6139 (v4i16 (ARM64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6140 bits<3> idx;
6141 let Inst{11} = idx{2};
6142 let Inst{21} = idx{1};
6143 let Inst{20} = idx{0};
6144 }
6145
6146 def v8i16_indexed : BaseSIMDIndexed<1, U, 0, 0b01, opc,
6147 V128, V128,
6148 V128_lo, VectorIndexH,
6149 asm, ".8h", ".8h", ".8h", ".h",
6150 [(set (v8i16 V128:$Rd),
6151 (OpNode (v8i16 V128:$Rn),
6152 (v8i16 (ARM64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6153 bits<3> idx;
6154 let Inst{11} = idx{2};
6155 let Inst{21} = idx{1};
6156 let Inst{20} = idx{0};
6157 }
6158
6159 def v2i32_indexed : BaseSIMDIndexed<0, U, 0, 0b10, opc,
6160 V64, V64,
6161 V128, VectorIndexS,
6162 asm, ".2s", ".2s", ".2s", ".s",
6163 [(set (v2i32 V64:$Rd),
6164 (OpNode (v2i32 V64:$Rn),
6165 (v2i32 (ARM64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6166 bits<2> idx;
6167 let Inst{11} = idx{1};
6168 let Inst{21} = idx{0};
6169 }
6170
6171 def v4i32_indexed : BaseSIMDIndexed<1, U, 0, 0b10, opc,
6172 V128, V128,
6173 V128, VectorIndexS,
6174 asm, ".4s", ".4s", ".4s", ".s",
6175 [(set (v4i32 V128:$Rd),
6176 (OpNode (v4i32 V128:$Rn),
6177 (v4i32 (ARM64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6178 bits<2> idx;
6179 let Inst{11} = idx{1};
6180 let Inst{21} = idx{0};
6181 }
6182
6183 def v1i16_indexed : BaseSIMDIndexed<1, U, 1, 0b01, opc,
6184 FPR16Op, FPR16Op, V128_lo, VectorIndexH,
6185 asm, ".h", "", "", ".h", []> {
6186 bits<3> idx;
6187 let Inst{11} = idx{2};
6188 let Inst{21} = idx{1};
6189 let Inst{20} = idx{0};
6190 }
6191
6192 def v1i32_indexed : BaseSIMDIndexed<1, U, 1, 0b10, opc,
6193 FPR32Op, FPR32Op, V128, VectorIndexS,
6194 asm, ".s", "", "", ".s",
6195 [(set (i32 FPR32Op:$Rd),
6196 (OpNode FPR32Op:$Rn,
6197 (i32 (vector_extract (v4i32 V128:$Rm),
6198 VectorIndexS:$idx))))]> {
6199 bits<2> idx;
6200 let Inst{11} = idx{1};
6201 let Inst{21} = idx{0};
6202 }
6203}
6204
6205multiclass SIMDVectorIndexedHS<bit U, bits<4> opc, string asm,
6206 SDPatternOperator OpNode> {
6207 def v4i16_indexed : BaseSIMDIndexed<0, U, 0, 0b01, opc,
6208 V64, V64,
6209 V128_lo, VectorIndexH,
6210 asm, ".4h", ".4h", ".4h", ".h",
6211 [(set (v4i16 V64:$Rd),
6212 (OpNode (v4i16 V64:$Rn),
6213 (v4i16 (ARM64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6214 bits<3> idx;
6215 let Inst{11} = idx{2};
6216 let Inst{21} = idx{1};
6217 let Inst{20} = idx{0};
6218 }
6219
6220 def v8i16_indexed : BaseSIMDIndexed<1, U, 0, 0b01, opc,
6221 V128, V128,
6222 V128_lo, VectorIndexH,
6223 asm, ".8h", ".8h", ".8h", ".h",
6224 [(set (v8i16 V128:$Rd),
6225 (OpNode (v8i16 V128:$Rn),
6226 (v8i16 (ARM64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6227 bits<3> idx;
6228 let Inst{11} = idx{2};
6229 let Inst{21} = idx{1};
6230 let Inst{20} = idx{0};
6231 }
6232
6233 def v2i32_indexed : BaseSIMDIndexed<0, U, 0, 0b10, opc,
6234 V64, V64,
6235 V128, VectorIndexS,
6236 asm, ".2s", ".2s", ".2s", ".s",
6237 [(set (v2i32 V64:$Rd),
6238 (OpNode (v2i32 V64:$Rn),
6239 (v2i32 (ARM64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6240 bits<2> idx;
6241 let Inst{11} = idx{1};
6242 let Inst{21} = idx{0};
6243 }
6244
6245 def v4i32_indexed : BaseSIMDIndexed<1, U, 0, 0b10, opc,
6246 V128, V128,
6247 V128, VectorIndexS,
6248 asm, ".4s", ".4s", ".4s", ".s",
6249 [(set (v4i32 V128:$Rd),
6250 (OpNode (v4i32 V128:$Rn),
6251 (v4i32 (ARM64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6252 bits<2> idx;
6253 let Inst{11} = idx{1};
6254 let Inst{21} = idx{0};
6255 }
6256}
6257
6258multiclass SIMDVectorIndexedHSTied<bit U, bits<4> opc, string asm,
6259 SDPatternOperator OpNode> {
6260 def v4i16_indexed : BaseSIMDIndexedTied<0, U, 0, 0b01, opc, V64, V64,
6261 V128_lo, VectorIndexH,
6262 asm, ".4h", ".4h", ".4h", ".h",
6263 [(set (v4i16 V64:$dst),
6264 (OpNode (v4i16 V64:$Rd),(v4i16 V64:$Rn),
6265 (v4i16 (ARM64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6266 bits<3> idx;
6267 let Inst{11} = idx{2};
6268 let Inst{21} = idx{1};
6269 let Inst{20} = idx{0};
6270 }
6271
6272 def v8i16_indexed : BaseSIMDIndexedTied<1, U, 0, 0b01, opc,
6273 V128, V128,
6274 V128_lo, VectorIndexH,
6275 asm, ".8h", ".8h", ".8h", ".h",
6276 [(set (v8i16 V128:$dst),
6277 (OpNode (v8i16 V128:$Rd), (v8i16 V128:$Rn),
6278 (v8i16 (ARM64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6279 bits<3> idx;
6280 let Inst{11} = idx{2};
6281 let Inst{21} = idx{1};
6282 let Inst{20} = idx{0};
6283 }
6284
6285 def v2i32_indexed : BaseSIMDIndexedTied<0, U, 0, 0b10, opc,
6286 V64, V64,
6287 V128, VectorIndexS,
6288 asm, ".2s", ".2s", ".2s", ".s",
6289 [(set (v2i32 V64:$dst),
6290 (OpNode (v2i32 V64:$Rd), (v2i32 V64:$Rn),
6291 (v2i32 (ARM64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6292 bits<2> idx;
6293 let Inst{11} = idx{1};
6294 let Inst{21} = idx{0};
6295 }
6296
6297 def v4i32_indexed : BaseSIMDIndexedTied<1, U, 0, 0b10, opc,
6298 V128, V128,
6299 V128, VectorIndexS,
6300 asm, ".4s", ".4s", ".4s", ".s",
6301 [(set (v4i32 V128:$dst),
6302 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn),
6303 (v4i32 (ARM64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6304 bits<2> idx;
6305 let Inst{11} = idx{1};
6306 let Inst{21} = idx{0};
6307 }
6308}
6309
6310multiclass SIMDIndexedLongSD<bit U, bits<4> opc, string asm,
6311 SDPatternOperator OpNode> {
6312 def v4i16_indexed : BaseSIMDIndexed<0, U, 0, 0b01, opc,
6313 V128, V64,
6314 V128_lo, VectorIndexH,
6315 asm, ".4s", ".4s", ".4h", ".h",
6316 [(set (v4i32 V128:$Rd),
6317 (OpNode (v4i16 V64:$Rn),
6318 (v4i16 (ARM64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6319 bits<3> idx;
6320 let Inst{11} = idx{2};
6321 let Inst{21} = idx{1};
6322 let Inst{20} = idx{0};
6323 }
6324
6325 def v8i16_indexed : BaseSIMDIndexed<1, U, 0, 0b01, opc,
6326 V128, V128,
6327 V128_lo, VectorIndexH,
6328 asm#"2", ".4s", ".4s", ".8h", ".h",
6329 [(set (v4i32 V128:$Rd),
6330 (OpNode (extract_high_v8i16 V128:$Rn),
6331 (extract_high_v8i16 (ARM64duplane16 (v8i16 V128_lo:$Rm),
6332 VectorIndexH:$idx))))]> {
6333
6334 bits<3> idx;
6335 let Inst{11} = idx{2};
6336 let Inst{21} = idx{1};
6337 let Inst{20} = idx{0};
6338 }
6339
6340 def v2i32_indexed : BaseSIMDIndexed<0, U, 0, 0b10, opc,
6341 V128, V64,
6342 V128, VectorIndexS,
6343 asm, ".2d", ".2d", ".2s", ".s",
6344 [(set (v2i64 V128:$Rd),
6345 (OpNode (v2i32 V64:$Rn),
6346 (v2i32 (ARM64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6347 bits<2> idx;
6348 let Inst{11} = idx{1};
6349 let Inst{21} = idx{0};
6350 }
6351
6352 def v4i32_indexed : BaseSIMDIndexed<1, U, 0, 0b10, opc,
6353 V128, V128,
6354 V128, VectorIndexS,
6355 asm#"2", ".2d", ".2d", ".4s", ".s",
6356 [(set (v2i64 V128:$Rd),
6357 (OpNode (extract_high_v4i32 V128:$Rn),
6358 (extract_high_v4i32 (ARM64duplane32 (v4i32 V128:$Rm),
6359 VectorIndexS:$idx))))]> {
6360 bits<2> idx;
6361 let Inst{11} = idx{1};
6362 let Inst{21} = idx{0};
6363 }
6364
6365 def v1i32_indexed : BaseSIMDIndexed<1, U, 1, 0b01, opc,
6366 FPR32Op, FPR16Op, V128_lo, VectorIndexH,
6367 asm, ".h", "", "", ".h", []> {
6368 bits<3> idx;
6369 let Inst{11} = idx{2};
6370 let Inst{21} = idx{1};
6371 let Inst{20} = idx{0};
6372 }
6373
6374 def v1i64_indexed : BaseSIMDIndexed<1, U, 1, 0b10, opc,
6375 FPR64Op, FPR32Op, V128, VectorIndexS,
6376 asm, ".s", "", "", ".s", []> {
6377 bits<2> idx;
6378 let Inst{11} = idx{1};
6379 let Inst{21} = idx{0};
6380 }
6381}
6382
6383multiclass SIMDIndexedLongSQDMLXSDTied<bit U, bits<4> opc, string asm,
6384 SDPatternOperator Accum> {
6385 def v4i16_indexed : BaseSIMDIndexedTied<0, U, 0, 0b01, opc,
6386 V128, V64,
6387 V128_lo, VectorIndexH,
6388 asm, ".4s", ".4s", ".4h", ".h",
6389 [(set (v4i32 V128:$dst),
6390 (Accum (v4i32 V128:$Rd),
6391 (v4i32 (int_arm64_neon_sqdmull
6392 (v4i16 V64:$Rn),
6393 (v4i16 (ARM64duplane16 (v8i16 V128_lo:$Rm),
6394 VectorIndexH:$idx))))))]> {
6395 bits<3> idx;
6396 let Inst{11} = idx{2};
6397 let Inst{21} = idx{1};
6398 let Inst{20} = idx{0};
6399 }
6400
6401 // FIXME: it would be nice to use the scalar (v1i32) instruction here, but an
6402 // intermediate EXTRACT_SUBREG would be untyped.
6403 def : Pat<(i32 (Accum (i32 FPR32Op:$Rd),
6404 (i32 (vector_extract (v4i32
6405 (int_arm64_neon_sqdmull (v4i16 V64:$Rn),
6406 (v4i16 (ARM64duplane16 (v8i16 V128_lo:$Rm),
6407 VectorIndexH:$idx)))),
6408 (i64 0))))),
6409 (EXTRACT_SUBREG
6410 (!cast<Instruction>(NAME # v4i16_indexed)
6411 (SUBREG_TO_REG (i32 0), FPR32Op:$Rd, ssub), V64:$Rn,
6412 V128_lo:$Rm, VectorIndexH:$idx),
6413 ssub)>;
6414
6415 def v8i16_indexed : BaseSIMDIndexedTied<1, U, 0, 0b01, opc,
6416 V128, V128,
6417 V128_lo, VectorIndexH,
6418 asm#"2", ".4s", ".4s", ".8h", ".h",
6419 [(set (v4i32 V128:$dst),
6420 (Accum (v4i32 V128:$Rd),
6421 (v4i32 (int_arm64_neon_sqdmull
6422 (extract_high_v8i16 V128:$Rn),
6423 (extract_high_v8i16
6424 (ARM64duplane16 (v8i16 V128_lo:$Rm),
6425 VectorIndexH:$idx))))))]> {
6426 bits<3> idx;
6427 let Inst{11} = idx{2};
6428 let Inst{21} = idx{1};
6429 let Inst{20} = idx{0};
6430 }
6431
6432 def v2i32_indexed : BaseSIMDIndexedTied<0, U, 0, 0b10, opc,
6433 V128, V64,
6434 V128, VectorIndexS,
6435 asm, ".2d", ".2d", ".2s", ".s",
6436 [(set (v2i64 V128:$dst),
6437 (Accum (v2i64 V128:$Rd),
6438 (v2i64 (int_arm64_neon_sqdmull
6439 (v2i32 V64:$Rn),
6440 (v2i32 (ARM64duplane32 (v4i32 V128:$Rm),
6441 VectorIndexS:$idx))))))]> {
6442 bits<2> idx;
6443 let Inst{11} = idx{1};
6444 let Inst{21} = idx{0};
6445 }
6446
6447 def v4i32_indexed : BaseSIMDIndexedTied<1, U, 0, 0b10, opc,
6448 V128, V128,
6449 V128, VectorIndexS,
6450 asm#"2", ".2d", ".2d", ".4s", ".s",
6451 [(set (v2i64 V128:$dst),
6452 (Accum (v2i64 V128:$Rd),
6453 (v2i64 (int_arm64_neon_sqdmull
6454 (extract_high_v4i32 V128:$Rn),
6455 (extract_high_v4i32
6456 (ARM64duplane32 (v4i32 V128:$Rm),
6457 VectorIndexS:$idx))))))]> {
6458 bits<2> idx;
6459 let Inst{11} = idx{1};
6460 let Inst{21} = idx{0};
6461 }
6462
6463 def v1i32_indexed : BaseSIMDIndexedTied<1, U, 1, 0b01, opc,
6464 FPR32Op, FPR16Op, V128_lo, VectorIndexH,
6465 asm, ".h", "", "", ".h", []> {
6466 bits<3> idx;
6467 let Inst{11} = idx{2};
6468 let Inst{21} = idx{1};
6469 let Inst{20} = idx{0};
6470 }
6471
6472
6473 def v1i64_indexed : BaseSIMDIndexedTied<1, U, 1, 0b10, opc,
6474 FPR64Op, FPR32Op, V128, VectorIndexS,
6475 asm, ".s", "", "", ".s",
6476 [(set (i64 FPR64Op:$dst),
6477 (Accum (i64 FPR64Op:$Rd),
6478 (i64 (int_arm64_neon_sqdmulls_scalar
6479 (i32 FPR32Op:$Rn),
6480 (i32 (vector_extract (v4i32 V128:$Rm),
6481 VectorIndexS:$idx))))))]> {
6482
6483 bits<2> idx;
6484 let Inst{11} = idx{1};
6485 let Inst{21} = idx{0};
6486 }
6487}
6488
6489multiclass SIMDVectorIndexedLongSD<bit U, bits<4> opc, string asm,
6490 SDPatternOperator OpNode> {
6491 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
6492 def v4i16_indexed : BaseSIMDIndexed<0, U, 0, 0b01, opc,
6493 V128, V64,
6494 V128_lo, VectorIndexH,
6495 asm, ".4s", ".4s", ".4h", ".h",
6496 [(set (v4i32 V128:$Rd),
6497 (OpNode (v4i16 V64:$Rn),
6498 (v4i16 (ARM64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6499 bits<3> idx;
6500 let Inst{11} = idx{2};
6501 let Inst{21} = idx{1};
6502 let Inst{20} = idx{0};
6503 }
6504
6505 def v8i16_indexed : BaseSIMDIndexed<1, U, 0, 0b01, opc,
6506 V128, V128,
6507 V128_lo, VectorIndexH,
6508 asm#"2", ".4s", ".4s", ".8h", ".h",
6509 [(set (v4i32 V128:$Rd),
6510 (OpNode (extract_high_v8i16 V128:$Rn),
6511 (extract_high_v8i16 (ARM64duplane16 (v8i16 V128_lo:$Rm),
6512 VectorIndexH:$idx))))]> {
6513
6514 bits<3> idx;
6515 let Inst{11} = idx{2};
6516 let Inst{21} = idx{1};
6517 let Inst{20} = idx{0};
6518 }
6519
6520 def v2i32_indexed : BaseSIMDIndexed<0, U, 0, 0b10, opc,
6521 V128, V64,
6522 V128, VectorIndexS,
6523 asm, ".2d", ".2d", ".2s", ".s",
6524 [(set (v2i64 V128:$Rd),
6525 (OpNode (v2i32 V64:$Rn),
6526 (v2i32 (ARM64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6527 bits<2> idx;
6528 let Inst{11} = idx{1};
6529 let Inst{21} = idx{0};
6530 }
6531
6532 def v4i32_indexed : BaseSIMDIndexed<1, U, 0, 0b10, opc,
6533 V128, V128,
6534 V128, VectorIndexS,
6535 asm#"2", ".2d", ".2d", ".4s", ".s",
6536 [(set (v2i64 V128:$Rd),
6537 (OpNode (extract_high_v4i32 V128:$Rn),
6538 (extract_high_v4i32 (ARM64duplane32 (v4i32 V128:$Rm),
6539 VectorIndexS:$idx))))]> {
6540 bits<2> idx;
6541 let Inst{11} = idx{1};
6542 let Inst{21} = idx{0};
6543 }
6544 }
6545}
6546
6547multiclass SIMDVectorIndexedLongSDTied<bit U, bits<4> opc, string asm,
6548 SDPatternOperator OpNode> {
6549 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
6550 def v4i16_indexed : BaseSIMDIndexedTied<0, U, 0, 0b01, opc,
6551 V128, V64,
6552 V128_lo, VectorIndexH,
6553 asm, ".4s", ".4s", ".4h", ".h",
6554 [(set (v4i32 V128:$dst),
6555 (OpNode (v4i32 V128:$Rd), (v4i16 V64:$Rn),
6556 (v4i16 (ARM64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6557 bits<3> idx;
6558 let Inst{11} = idx{2};
6559 let Inst{21} = idx{1};
6560 let Inst{20} = idx{0};
6561 }
6562
6563 def v8i16_indexed : BaseSIMDIndexedTied<1, U, 0, 0b01, opc,
6564 V128, V128,
6565 V128_lo, VectorIndexH,
6566 asm#"2", ".4s", ".4s", ".8h", ".h",
6567 [(set (v4i32 V128:$dst),
6568 (OpNode (v4i32 V128:$Rd),
6569 (extract_high_v8i16 V128:$Rn),
6570 (extract_high_v8i16 (ARM64duplane16 (v8i16 V128_lo:$Rm),
6571 VectorIndexH:$idx))))]> {
6572 bits<3> idx;
6573 let Inst{11} = idx{2};
6574 let Inst{21} = idx{1};
6575 let Inst{20} = idx{0};
6576 }
6577
6578 def v2i32_indexed : BaseSIMDIndexedTied<0, U, 0, 0b10, opc,
6579 V128, V64,
6580 V128, VectorIndexS,
6581 asm, ".2d", ".2d", ".2s", ".s",
6582 [(set (v2i64 V128:$dst),
6583 (OpNode (v2i64 V128:$Rd), (v2i32 V64:$Rn),
6584 (v2i32 (ARM64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6585 bits<2> idx;
6586 let Inst{11} = idx{1};
6587 let Inst{21} = idx{0};
6588 }
6589
6590 def v4i32_indexed : BaseSIMDIndexedTied<1, U, 0, 0b10, opc,
6591 V128, V128,
6592 V128, VectorIndexS,
6593 asm#"2", ".2d", ".2d", ".4s", ".s",
6594 [(set (v2i64 V128:$dst),
6595 (OpNode (v2i64 V128:$Rd),
6596 (extract_high_v4i32 V128:$Rn),
6597 (extract_high_v4i32 (ARM64duplane32 (v4i32 V128:$Rm),
6598 VectorIndexS:$idx))))]> {
6599 bits<2> idx;
6600 let Inst{11} = idx{1};
6601 let Inst{21} = idx{0};
6602 }
6603 }
6604}
6605
6606//----------------------------------------------------------------------------
6607// AdvSIMD scalar shift by immediate
6608//----------------------------------------------------------------------------
6609
6610let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
6611class BaseSIMDScalarShift<bit U, bits<5> opc, bits<7> fixed_imm,
6612 RegisterClass regtype1, RegisterClass regtype2,
6613 Operand immtype, string asm, list<dag> pattern>
6614 : I<(outs regtype1:$Rd), (ins regtype2:$Rn, immtype:$imm),
6615 asm, "\t$Rd, $Rn, $imm", "", pattern>,
6616 Sched<[WriteV]> {
6617 bits<5> Rd;
6618 bits<5> Rn;
6619 bits<7> imm;
6620 let Inst{31-30} = 0b01;
6621 let Inst{29} = U;
6622 let Inst{28-23} = 0b111110;
6623 let Inst{22-16} = fixed_imm;
6624 let Inst{15-11} = opc;
6625 let Inst{10} = 1;
6626 let Inst{9-5} = Rn;
6627 let Inst{4-0} = Rd;
6628}
6629
6630let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
6631class BaseSIMDScalarShiftTied<bit U, bits<5> opc, bits<7> fixed_imm,
6632 RegisterClass regtype1, RegisterClass regtype2,
6633 Operand immtype, string asm, list<dag> pattern>
6634 : I<(outs regtype1:$dst), (ins regtype1:$Rd, regtype2:$Rn, immtype:$imm),
6635 asm, "\t$Rd, $Rn, $imm", "$Rd = $dst", pattern>,
6636 Sched<[WriteV]> {
6637 bits<5> Rd;
6638 bits<5> Rn;
6639 bits<7> imm;
6640 let Inst{31-30} = 0b01;
6641 let Inst{29} = U;
6642 let Inst{28-23} = 0b111110;
6643 let Inst{22-16} = fixed_imm;
6644 let Inst{15-11} = opc;
6645 let Inst{10} = 1;
6646 let Inst{9-5} = Rn;
6647 let Inst{4-0} = Rd;
6648}
6649
6650
6651multiclass SIMDScalarRShiftSD<bit U, bits<5> opc, string asm> {
6652 def s : BaseSIMDScalarShift<U, opc, {0,1,?,?,?,?,?},
6653 FPR32, FPR32, vecshiftR32, asm, []> {
6654 let Inst{20-16} = imm{4-0};
6655 }
6656
6657 def d : BaseSIMDScalarShift<U, opc, {1,?,?,?,?,?,?},
6658 FPR64, FPR64, vecshiftR64, asm, []> {
6659 let Inst{21-16} = imm{5-0};
6660 }
6661}
6662
6663multiclass SIMDScalarRShiftD<bit U, bits<5> opc, string asm,
6664 SDPatternOperator OpNode> {
6665 def d : BaseSIMDScalarShift<U, opc, {1,?,?,?,?,?,?},
6666 FPR64, FPR64, vecshiftR64, asm,
Tim Northover5081cd02014-03-31 15:46:46 +00006667 [(set (i64 FPR64:$Rd),
6668 (OpNode (i64 FPR64:$Rn), (i32 vecshiftR64:$imm)))]> {
Tim Northover00ed9962014-03-29 10:18:08 +00006669 let Inst{21-16} = imm{5-0};
6670 }
Tim Northover5081cd02014-03-31 15:46:46 +00006671
6672 def : Pat<(v1i64 (OpNode (v1i64 FPR64:$Rn), (i32 vecshiftR64:$imm))),
6673 (!cast<Instruction>(NAME # "d") FPR64:$Rn, vecshiftR64:$imm)>;
Tim Northover00ed9962014-03-29 10:18:08 +00006674}
6675
Tim Northover00ed9962014-03-29 10:18:08 +00006676multiclass SIMDScalarRShiftDTied<bit U, bits<5> opc, string asm,
6677 SDPatternOperator OpNode = null_frag> {
6678 def d : BaseSIMDScalarShiftTied<U, opc, {1,?,?,?,?,?,?},
6679 FPR64, FPR64, vecshiftR64, asm,
Tim Northover5081cd02014-03-31 15:46:46 +00006680 [(set (i64 FPR64:$dst), (OpNode (i64 FPR64:$Rd), (i64 FPR64:$Rn),
6681 (i32 vecshiftR64:$imm)))]> {
Tim Northover00ed9962014-03-29 10:18:08 +00006682 let Inst{21-16} = imm{5-0};
6683 }
Tim Northover5081cd02014-03-31 15:46:46 +00006684
6685 def : Pat<(v1i64 (OpNode (v1i64 FPR64:$Rd), (v1i64 FPR64:$Rn),
6686 (i32 vecshiftR64:$imm))),
6687 (!cast<Instruction>(NAME # "d") FPR64:$Rd, FPR64:$Rn,
6688 vecshiftR64:$imm)>;
Tim Northover00ed9962014-03-29 10:18:08 +00006689}
6690
6691multiclass SIMDScalarLShiftD<bit U, bits<5> opc, string asm,
6692 SDPatternOperator OpNode> {
6693 def d : BaseSIMDScalarShift<U, opc, {1,?,?,?,?,?,?},
6694 FPR64, FPR64, vecshiftL64, asm,
6695 [(set (v1i64 FPR64:$Rd),
6696 (OpNode (v1i64 FPR64:$Rn), (i32 vecshiftL64:$imm)))]> {
6697 let Inst{21-16} = imm{5-0};
6698 }
6699}
6700
6701let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
6702multiclass SIMDScalarLShiftDTied<bit U, bits<5> opc, string asm> {
6703 def d : BaseSIMDScalarShiftTied<U, opc, {1,?,?,?,?,?,?},
6704 FPR64, FPR64, vecshiftL64, asm, []> {
6705 let Inst{21-16} = imm{5-0};
6706 }
6707}
6708
6709let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
6710multiclass SIMDScalarRShiftBHS<bit U, bits<5> opc, string asm,
6711 SDPatternOperator OpNode = null_frag> {
6712 def b : BaseSIMDScalarShift<U, opc, {0,0,0,1,?,?,?},
6713 FPR8, FPR16, vecshiftR8, asm, []> {
6714 let Inst{18-16} = imm{2-0};
6715 }
6716
6717 def h : BaseSIMDScalarShift<U, opc, {0,0,1,?,?,?,?},
6718 FPR16, FPR32, vecshiftR16, asm, []> {
6719 let Inst{19-16} = imm{3-0};
6720 }
6721
6722 def s : BaseSIMDScalarShift<U, opc, {0,1,?,?,?,?,?},
6723 FPR32, FPR64, vecshiftR32, asm,
6724 [(set (i32 FPR32:$Rd), (OpNode (i64 FPR64:$Rn), vecshiftR32:$imm))]> {
6725 let Inst{20-16} = imm{4-0};
6726 }
6727}
6728
6729multiclass SIMDScalarLShiftBHSD<bit U, bits<5> opc, string asm,
6730 SDPatternOperator OpNode> {
6731 def b : BaseSIMDScalarShift<U, opc, {0,0,0,1,?,?,?},
6732 FPR8, FPR8, vecshiftL8, asm, []> {
6733 let Inst{18-16} = imm{2-0};
6734 }
6735
6736 def h : BaseSIMDScalarShift<U, opc, {0,0,1,?,?,?,?},
6737 FPR16, FPR16, vecshiftL16, asm, []> {
6738 let Inst{19-16} = imm{3-0};
6739 }
6740
6741 def s : BaseSIMDScalarShift<U, opc, {0,1,?,?,?,?,?},
6742 FPR32, FPR32, vecshiftL32, asm,
6743 [(set (i32 FPR32:$Rd), (OpNode (i32 FPR32:$Rn), (i32 vecshiftL32:$imm)))]> {
6744 let Inst{20-16} = imm{4-0};
6745 }
6746
6747 def d : BaseSIMDScalarShift<U, opc, {1,?,?,?,?,?,?},
6748 FPR64, FPR64, vecshiftL64, asm,
6749 [(set (v1i64 FPR64:$Rd), (OpNode (v1i64 FPR64:$Rn),
6750 (i32 vecshiftL64:$imm)))]> {
6751 let Inst{21-16} = imm{5-0};
6752 }
6753}
6754
6755multiclass SIMDScalarRShiftBHSD<bit U, bits<5> opc, string asm> {
6756 def b : BaseSIMDScalarShift<U, opc, {0,0,0,1,?,?,?},
6757 FPR8, FPR8, vecshiftR8, asm, []> {
6758 let Inst{18-16} = imm{2-0};
6759 }
6760
6761 def h : BaseSIMDScalarShift<U, opc, {0,0,1,?,?,?,?},
6762 FPR16, FPR16, vecshiftR16, asm, []> {
6763 let Inst{19-16} = imm{3-0};
6764 }
6765
6766 def s : BaseSIMDScalarShift<U, opc, {0,1,?,?,?,?,?},
6767 FPR32, FPR32, vecshiftR32, asm, []> {
6768 let Inst{20-16} = imm{4-0};
6769 }
6770
6771 def d : BaseSIMDScalarShift<U, opc, {1,?,?,?,?,?,?},
6772 FPR64, FPR64, vecshiftR64, asm, []> {
6773 let Inst{21-16} = imm{5-0};
6774 }
6775}
6776
6777//----------------------------------------------------------------------------
6778// AdvSIMD vector x indexed element
6779//----------------------------------------------------------------------------
6780
6781let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
6782class BaseSIMDVectorShift<bit Q, bit U, bits<5> opc, bits<7> fixed_imm,
6783 RegisterOperand dst_reg, RegisterOperand src_reg,
6784 Operand immtype,
6785 string asm, string dst_kind, string src_kind,
6786 list<dag> pattern>
6787 : I<(outs dst_reg:$Rd), (ins src_reg:$Rn, immtype:$imm),
6788 asm, "{\t$Rd" # dst_kind # ", $Rn" # src_kind # ", $imm" #
6789 "|" # dst_kind # "\t$Rd, $Rn, $imm}", "", pattern>,
6790 Sched<[WriteV]> {
6791 bits<5> Rd;
6792 bits<5> Rn;
6793 let Inst{31} = 0;
6794 let Inst{30} = Q;
6795 let Inst{29} = U;
6796 let Inst{28-23} = 0b011110;
6797 let Inst{22-16} = fixed_imm;
6798 let Inst{15-11} = opc;
6799 let Inst{10} = 1;
6800 let Inst{9-5} = Rn;
6801 let Inst{4-0} = Rd;
6802}
6803
6804let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
6805class BaseSIMDVectorShiftTied<bit Q, bit U, bits<5> opc, bits<7> fixed_imm,
6806 RegisterOperand vectype1, RegisterOperand vectype2,
6807 Operand immtype,
6808 string asm, string dst_kind, string src_kind,
6809 list<dag> pattern>
6810 : I<(outs vectype1:$dst), (ins vectype1:$Rd, vectype2:$Rn, immtype:$imm),
6811 asm, "{\t$Rd" # dst_kind # ", $Rn" # src_kind # ", $imm" #
6812 "|" # dst_kind # "\t$Rd, $Rn, $imm}", "$Rd = $dst", pattern>,
6813 Sched<[WriteV]> {
6814 bits<5> Rd;
6815 bits<5> Rn;
6816 let Inst{31} = 0;
6817 let Inst{30} = Q;
6818 let Inst{29} = U;
6819 let Inst{28-23} = 0b011110;
6820 let Inst{22-16} = fixed_imm;
6821 let Inst{15-11} = opc;
6822 let Inst{10} = 1;
6823 let Inst{9-5} = Rn;
6824 let Inst{4-0} = Rd;
6825}
6826
6827multiclass SIMDVectorRShiftSD<bit U, bits<5> opc, string asm,
6828 Intrinsic OpNode> {
6829 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
6830 V64, V64, vecshiftR32,
6831 asm, ".2s", ".2s",
6832 [(set (v2i32 V64:$Rd), (OpNode (v2f32 V64:$Rn), (i32 imm:$imm)))]> {
6833 bits<5> imm;
6834 let Inst{20-16} = imm;
6835 }
6836
6837 def v4i32_shift : BaseSIMDVectorShift<1, U, opc, {0,1,?,?,?,?,?},
6838 V128, V128, vecshiftR32,
6839 asm, ".4s", ".4s",
6840 [(set (v4i32 V128:$Rd), (OpNode (v4f32 V128:$Rn), (i32 imm:$imm)))]> {
6841 bits<5> imm;
6842 let Inst{20-16} = imm;
6843 }
6844
6845 def v2i64_shift : BaseSIMDVectorShift<1, U, opc, {1,?,?,?,?,?,?},
6846 V128, V128, vecshiftR64,
6847 asm, ".2d", ".2d",
6848 [(set (v2i64 V128:$Rd), (OpNode (v2f64 V128:$Rn), (i32 imm:$imm)))]> {
6849 bits<6> imm;
6850 let Inst{21-16} = imm;
6851 }
6852}
6853
6854multiclass SIMDVectorRShiftSDToFP<bit U, bits<5> opc, string asm,
6855 Intrinsic OpNode> {
6856 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
6857 V64, V64, vecshiftR32,
6858 asm, ".2s", ".2s",
6859 [(set (v2f32 V64:$Rd), (OpNode (v2i32 V64:$Rn), (i32 imm:$imm)))]> {
6860 bits<5> imm;
6861 let Inst{20-16} = imm;
6862 }
6863
6864 def v4i32_shift : BaseSIMDVectorShift<1, U, opc, {0,1,?,?,?,?,?},
6865 V128, V128, vecshiftR32,
6866 asm, ".4s", ".4s",
6867 [(set (v4f32 V128:$Rd), (OpNode (v4i32 V128:$Rn), (i32 imm:$imm)))]> {
6868 bits<5> imm;
6869 let Inst{20-16} = imm;
6870 }
6871
6872 def v2i64_shift : BaseSIMDVectorShift<1, U, opc, {1,?,?,?,?,?,?},
6873 V128, V128, vecshiftR64,
6874 asm, ".2d", ".2d",
6875 [(set (v2f64 V128:$Rd), (OpNode (v2i64 V128:$Rn), (i32 imm:$imm)))]> {
6876 bits<6> imm;
6877 let Inst{21-16} = imm;
6878 }
6879}
6880
6881multiclass SIMDVectorRShiftNarrowBHS<bit U, bits<5> opc, string asm,
6882 SDPatternOperator OpNode> {
6883 def v8i8_shift : BaseSIMDVectorShift<0, U, opc, {0,0,0,1,?,?,?},
6884 V64, V128, vecshiftR16Narrow,
6885 asm, ".8b", ".8h",
6886 [(set (v8i8 V64:$Rd), (OpNode (v8i16 V128:$Rn), vecshiftR16Narrow:$imm))]> {
6887 bits<3> imm;
6888 let Inst{18-16} = imm;
6889 }
6890
6891 def v16i8_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,0,1,?,?,?},
6892 V128, V128, vecshiftR16Narrow,
6893 asm#"2", ".16b", ".8h", []> {
6894 bits<3> imm;
6895 let Inst{18-16} = imm;
6896 let hasSideEffects = 0;
6897 }
6898
6899 def v4i16_shift : BaseSIMDVectorShift<0, U, opc, {0,0,1,?,?,?,?},
6900 V64, V128, vecshiftR32Narrow,
6901 asm, ".4h", ".4s",
6902 [(set (v4i16 V64:$Rd), (OpNode (v4i32 V128:$Rn), vecshiftR32Narrow:$imm))]> {
6903 bits<4> imm;
6904 let Inst{19-16} = imm;
6905 }
6906
6907 def v8i16_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,1,?,?,?,?},
6908 V128, V128, vecshiftR32Narrow,
6909 asm#"2", ".8h", ".4s", []> {
6910 bits<4> imm;
6911 let Inst{19-16} = imm;
6912 let hasSideEffects = 0;
6913 }
6914
6915 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
6916 V64, V128, vecshiftR64Narrow,
6917 asm, ".2s", ".2d",
6918 [(set (v2i32 V64:$Rd), (OpNode (v2i64 V128:$Rn), vecshiftR64Narrow:$imm))]> {
6919 bits<5> imm;
6920 let Inst{20-16} = imm;
6921 }
6922
6923 def v4i32_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,1,?,?,?,?,?},
6924 V128, V128, vecshiftR64Narrow,
6925 asm#"2", ".4s", ".2d", []> {
6926 bits<5> imm;
6927 let Inst{20-16} = imm;
6928 let hasSideEffects = 0;
6929 }
6930
6931 // TableGen doesn't like patters w/ INSERT_SUBREG on the instructions
6932 // themselves, so put them here instead.
6933
6934 // Patterns involving what's effectively an insert high and a normal
6935 // intrinsic, represented by CONCAT_VECTORS.
6936 def : Pat<(concat_vectors (v8i8 V64:$Rd),(OpNode (v8i16 V128:$Rn),
6937 vecshiftR16Narrow:$imm)),
6938 (!cast<Instruction>(NAME # "v16i8_shift")
6939 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
6940 V128:$Rn, vecshiftR16Narrow:$imm)>;
6941 def : Pat<(concat_vectors (v4i16 V64:$Rd), (OpNode (v4i32 V128:$Rn),
6942 vecshiftR32Narrow:$imm)),
6943 (!cast<Instruction>(NAME # "v8i16_shift")
6944 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
6945 V128:$Rn, vecshiftR32Narrow:$imm)>;
6946 def : Pat<(concat_vectors (v2i32 V64:$Rd), (OpNode (v2i64 V128:$Rn),
6947 vecshiftR64Narrow:$imm)),
6948 (!cast<Instruction>(NAME # "v4i32_shift")
6949 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
6950 V128:$Rn, vecshiftR64Narrow:$imm)>;
6951}
6952
6953multiclass SIMDVectorLShiftBHSD<bit U, bits<5> opc, string asm,
6954 SDPatternOperator OpNode> {
6955 def v8i8_shift : BaseSIMDVectorShift<0, U, opc, {0,0,0,1,?,?,?},
6956 V64, V64, vecshiftL8,
6957 asm, ".8b", ".8b",
6958 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn),
6959 (i32 vecshiftL8:$imm)))]> {
6960 bits<3> imm;
6961 let Inst{18-16} = imm;
6962 }
6963
6964 def v16i8_shift : BaseSIMDVectorShift<1, U, opc, {0,0,0,1,?,?,?},
6965 V128, V128, vecshiftL8,
6966 asm, ".16b", ".16b",
6967 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn),
6968 (i32 vecshiftL8:$imm)))]> {
6969 bits<3> imm;
6970 let Inst{18-16} = imm;
6971 }
6972
6973 def v4i16_shift : BaseSIMDVectorShift<0, U, opc, {0,0,1,?,?,?,?},
6974 V64, V64, vecshiftL16,
6975 asm, ".4h", ".4h",
6976 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn),
6977 (i32 vecshiftL16:$imm)))]> {
6978 bits<4> imm;
6979 let Inst{19-16} = imm;
6980 }
6981
6982 def v8i16_shift : BaseSIMDVectorShift<1, U, opc, {0,0,1,?,?,?,?},
6983 V128, V128, vecshiftL16,
6984 asm, ".8h", ".8h",
6985 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn),
6986 (i32 vecshiftL16:$imm)))]> {
6987 bits<4> imm;
6988 let Inst{19-16} = imm;
6989 }
6990
6991 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
6992 V64, V64, vecshiftL32,
6993 asm, ".2s", ".2s",
6994 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn),
6995 (i32 vecshiftL32:$imm)))]> {
6996 bits<5> imm;
6997 let Inst{20-16} = imm;
6998 }
6999
7000 def v4i32_shift : BaseSIMDVectorShift<1, U, opc, {0,1,?,?,?,?,?},
7001 V128, V128, vecshiftL32,
7002 asm, ".4s", ".4s",
7003 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn),
7004 (i32 vecshiftL32:$imm)))]> {
7005 bits<5> imm;
7006 let Inst{20-16} = imm;
7007 }
7008
7009 def v2i64_shift : BaseSIMDVectorShift<1, U, opc, {1,?,?,?,?,?,?},
7010 V128, V128, vecshiftL64,
7011 asm, ".2d", ".2d",
7012 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn),
7013 (i32 vecshiftL64:$imm)))]> {
7014 bits<6> imm;
7015 let Inst{21-16} = imm;
7016 }
7017}
7018
7019multiclass SIMDVectorRShiftBHSD<bit U, bits<5> opc, string asm,
7020 SDPatternOperator OpNode> {
7021 def v8i8_shift : BaseSIMDVectorShift<0, U, opc, {0,0,0,1,?,?,?},
7022 V64, V64, vecshiftR8,
7023 asm, ".8b", ".8b",
7024 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn),
7025 (i32 vecshiftR8:$imm)))]> {
7026 bits<3> imm;
7027 let Inst{18-16} = imm;
7028 }
7029
7030 def v16i8_shift : BaseSIMDVectorShift<1, U, opc, {0,0,0,1,?,?,?},
7031 V128, V128, vecshiftR8,
7032 asm, ".16b", ".16b",
7033 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn),
7034 (i32 vecshiftR8:$imm)))]> {
7035 bits<3> imm;
7036 let Inst{18-16} = imm;
7037 }
7038
7039 def v4i16_shift : BaseSIMDVectorShift<0, U, opc, {0,0,1,?,?,?,?},
7040 V64, V64, vecshiftR16,
7041 asm, ".4h", ".4h",
7042 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn),
7043 (i32 vecshiftR16:$imm)))]> {
7044 bits<4> imm;
7045 let Inst{19-16} = imm;
7046 }
7047
7048 def v8i16_shift : BaseSIMDVectorShift<1, U, opc, {0,0,1,?,?,?,?},
7049 V128, V128, vecshiftR16,
7050 asm, ".8h", ".8h",
7051 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn),
7052 (i32 vecshiftR16:$imm)))]> {
7053 bits<4> imm;
7054 let Inst{19-16} = imm;
7055 }
7056
7057 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
7058 V64, V64, vecshiftR32,
7059 asm, ".2s", ".2s",
7060 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn),
7061 (i32 vecshiftR32:$imm)))]> {
7062 bits<5> imm;
7063 let Inst{20-16} = imm;
7064 }
7065
7066 def v4i32_shift : BaseSIMDVectorShift<1, U, opc, {0,1,?,?,?,?,?},
7067 V128, V128, vecshiftR32,
7068 asm, ".4s", ".4s",
7069 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn),
7070 (i32 vecshiftR32:$imm)))]> {
7071 bits<5> imm;
7072 let Inst{20-16} = imm;
7073 }
7074
7075 def v2i64_shift : BaseSIMDVectorShift<1, U, opc, {1,?,?,?,?,?,?},
7076 V128, V128, vecshiftR64,
7077 asm, ".2d", ".2d",
7078 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn),
7079 (i32 vecshiftR64:$imm)))]> {
7080 bits<6> imm;
7081 let Inst{21-16} = imm;
7082 }
7083}
7084
7085let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
7086multiclass SIMDVectorRShiftBHSDTied<bit U, bits<5> opc, string asm,
7087 SDPatternOperator OpNode = null_frag> {
7088 def v8i8_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,0,0,1,?,?,?},
7089 V64, V64, vecshiftR8, asm, ".8b", ".8b",
7090 [(set (v8i8 V64:$dst),
7091 (OpNode (v8i8 V64:$Rd), (v8i8 V64:$Rn),
7092 (i32 vecshiftR8:$imm)))]> {
7093 bits<3> imm;
7094 let Inst{18-16} = imm;
7095 }
7096
7097 def v16i8_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,0,1,?,?,?},
7098 V128, V128, vecshiftR8, asm, ".16b", ".16b",
7099 [(set (v16i8 V128:$dst),
7100 (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn),
7101 (i32 vecshiftR8:$imm)))]> {
7102 bits<3> imm;
7103 let Inst{18-16} = imm;
7104 }
7105
7106 def v4i16_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,0,1,?,?,?,?},
7107 V64, V64, vecshiftR16, asm, ".4h", ".4h",
7108 [(set (v4i16 V64:$dst),
7109 (OpNode (v4i16 V64:$Rd), (v4i16 V64:$Rn),
7110 (i32 vecshiftR16:$imm)))]> {
7111 bits<4> imm;
7112 let Inst{19-16} = imm;
7113 }
7114
7115 def v8i16_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,1,?,?,?,?},
7116 V128, V128, vecshiftR16, asm, ".8h", ".8h",
7117 [(set (v8i16 V128:$dst),
7118 (OpNode (v8i16 V128:$Rd), (v8i16 V128:$Rn),
7119 (i32 vecshiftR16:$imm)))]> {
7120 bits<4> imm;
7121 let Inst{19-16} = imm;
7122 }
7123
7124 def v2i32_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,1,?,?,?,?,?},
7125 V64, V64, vecshiftR32, asm, ".2s", ".2s",
7126 [(set (v2i32 V64:$dst),
7127 (OpNode (v2i32 V64:$Rd), (v2i32 V64:$Rn),
7128 (i32 vecshiftR32:$imm)))]> {
7129 bits<5> imm;
7130 let Inst{20-16} = imm;
7131 }
7132
7133 def v4i32_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,1,?,?,?,?,?},
7134 V128, V128, vecshiftR32, asm, ".4s", ".4s",
7135 [(set (v4i32 V128:$dst),
7136 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn),
7137 (i32 vecshiftR32:$imm)))]> {
7138 bits<5> imm;
7139 let Inst{20-16} = imm;
7140 }
7141
7142 def v2i64_shift : BaseSIMDVectorShiftTied<1, U, opc, {1,?,?,?,?,?,?},
7143 V128, V128, vecshiftR64,
7144 asm, ".2d", ".2d", [(set (v2i64 V128:$dst),
7145 (OpNode (v2i64 V128:$Rd), (v2i64 V128:$Rn),
7146 (i32 vecshiftR64:$imm)))]> {
7147 bits<6> imm;
7148 let Inst{21-16} = imm;
7149 }
7150}
7151
7152multiclass SIMDVectorLShiftBHSDTied<bit U, bits<5> opc, string asm,
7153 SDPatternOperator OpNode = null_frag> {
7154 def v8i8_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,0,0,1,?,?,?},
7155 V64, V64, vecshiftL8,
7156 asm, ".8b", ".8b",
7157 [(set (v8i8 V64:$dst),
7158 (OpNode (v8i8 V64:$Rd), (v8i8 V64:$Rn),
7159 (i32 vecshiftL8:$imm)))]> {
7160 bits<3> imm;
7161 let Inst{18-16} = imm;
7162 }
7163
7164 def v16i8_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,0,1,?,?,?},
7165 V128, V128, vecshiftL8,
7166 asm, ".16b", ".16b",
7167 [(set (v16i8 V128:$dst),
7168 (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn),
7169 (i32 vecshiftL8:$imm)))]> {
7170 bits<3> imm;
7171 let Inst{18-16} = imm;
7172 }
7173
7174 def v4i16_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,0,1,?,?,?,?},
7175 V64, V64, vecshiftL16,
7176 asm, ".4h", ".4h",
7177 [(set (v4i16 V64:$dst),
7178 (OpNode (v4i16 V64:$Rd), (v4i16 V64:$Rn),
7179 (i32 vecshiftL16:$imm)))]> {
7180 bits<4> imm;
7181 let Inst{19-16} = imm;
7182 }
7183
7184 def v8i16_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,1,?,?,?,?},
7185 V128, V128, vecshiftL16,
7186 asm, ".8h", ".8h",
7187 [(set (v8i16 V128:$dst),
7188 (OpNode (v8i16 V128:$Rd), (v8i16 V128:$Rn),
7189 (i32 vecshiftL16:$imm)))]> {
7190 bits<4> imm;
7191 let Inst{19-16} = imm;
7192 }
7193
7194 def v2i32_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,1,?,?,?,?,?},
7195 V64, V64, vecshiftL32,
7196 asm, ".2s", ".2s",
7197 [(set (v2i32 V64:$dst),
7198 (OpNode (v2i32 V64:$Rd), (v2i32 V64:$Rn),
7199 (i32 vecshiftL32:$imm)))]> {
7200 bits<5> imm;
7201 let Inst{20-16} = imm;
7202 }
7203
7204 def v4i32_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,1,?,?,?,?,?},
7205 V128, V128, vecshiftL32,
7206 asm, ".4s", ".4s",
7207 [(set (v4i32 V128:$dst),
7208 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn),
7209 (i32 vecshiftL32:$imm)))]> {
7210 bits<5> imm;
7211 let Inst{20-16} = imm;
7212 }
7213
7214 def v2i64_shift : BaseSIMDVectorShiftTied<1, U, opc, {1,?,?,?,?,?,?},
7215 V128, V128, vecshiftL64,
7216 asm, ".2d", ".2d",
7217 [(set (v2i64 V128:$dst),
7218 (OpNode (v2i64 V128:$Rd), (v2i64 V128:$Rn),
7219 (i32 vecshiftL64:$imm)))]> {
7220 bits<6> imm;
7221 let Inst{21-16} = imm;
7222 }
7223}
7224
7225multiclass SIMDVectorLShiftLongBHSD<bit U, bits<5> opc, string asm,
7226 SDPatternOperator OpNode> {
7227 def v8i8_shift : BaseSIMDVectorShift<0, U, opc, {0,0,0,1,?,?,?},
7228 V128, V64, vecshiftL8, asm, ".8h", ".8b",
7229 [(set (v8i16 V128:$Rd), (OpNode (v8i8 V64:$Rn), vecshiftL8:$imm))]> {
7230 bits<3> imm;
7231 let Inst{18-16} = imm;
7232 }
7233
7234 def v16i8_shift : BaseSIMDVectorShift<1, U, opc, {0,0,0,1,?,?,?},
7235 V128, V128, vecshiftL8,
7236 asm#"2", ".8h", ".16b",
7237 [(set (v8i16 V128:$Rd),
7238 (OpNode (extract_high_v16i8 V128:$Rn), vecshiftL8:$imm))]> {
7239 bits<3> imm;
7240 let Inst{18-16} = imm;
7241 }
7242
7243 def v4i16_shift : BaseSIMDVectorShift<0, U, opc, {0,0,1,?,?,?,?},
7244 V128, V64, vecshiftL16, asm, ".4s", ".4h",
7245 [(set (v4i32 V128:$Rd), (OpNode (v4i16 V64:$Rn), vecshiftL16:$imm))]> {
7246 bits<4> imm;
7247 let Inst{19-16} = imm;
7248 }
7249
7250 def v8i16_shift : BaseSIMDVectorShift<1, U, opc, {0,0,1,?,?,?,?},
7251 V128, V128, vecshiftL16,
7252 asm#"2", ".4s", ".8h",
7253 [(set (v4i32 V128:$Rd),
7254 (OpNode (extract_high_v8i16 V128:$Rn), vecshiftL16:$imm))]> {
7255
7256 bits<4> imm;
7257 let Inst{19-16} = imm;
7258 }
7259
7260 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
7261 V128, V64, vecshiftL32, asm, ".2d", ".2s",
7262 [(set (v2i64 V128:$Rd), (OpNode (v2i32 V64:$Rn), vecshiftL32:$imm))]> {
7263 bits<5> imm;
7264 let Inst{20-16} = imm;
7265 }
7266
7267 def v4i32_shift : BaseSIMDVectorShift<1, U, opc, {0,1,?,?,?,?,?},
7268 V128, V128, vecshiftL32,
7269 asm#"2", ".2d", ".4s",
7270 [(set (v2i64 V128:$Rd),
7271 (OpNode (extract_high_v4i32 V128:$Rn), vecshiftL32:$imm))]> {
7272 bits<5> imm;
7273 let Inst{20-16} = imm;
7274 }
7275}
7276
7277
7278//---
7279// Vector load/store
7280//---
7281// SIMD ldX/stX no-index memory references don't allow the optional
7282// ", #0" constant and handle post-indexing explicitly, so we use
7283// a more specialized parse method for them. Otherwise, it's the same as
7284// the general am_noindex handling.
7285def MemorySIMDNoIndexOperand : AsmOperandClass {
7286 let Name = "MemorySIMDNoIndex";
7287 let ParserMethod = "tryParseNoIndexMemory";
7288}
7289def am_simdnoindex : Operand<i64>,
7290 ComplexPattern<i64, 1, "SelectAddrModeNoIndex", []> {
7291 let PrintMethod = "printAMNoIndex";
7292 let ParserMatchClass = MemorySIMDNoIndexOperand;
7293 let MIOperandInfo = (ops GPR64sp:$base);
7294 let DecoderMethod = "DecodeGPR64spRegisterClass";
7295}
7296
7297class BaseSIMDLdSt<bit Q, bit L, bits<4> opcode, bits<2> size,
7298 string asm, dag oops, dag iops, list<dag> pattern>
7299 : I<oops, iops, asm, "\t$Vt, $vaddr", "", pattern> {
7300 bits<5> Vt;
7301 bits<5> vaddr;
7302 let Inst{31} = 0;
7303 let Inst{30} = Q;
7304 let Inst{29-23} = 0b0011000;
7305 let Inst{22} = L;
7306 let Inst{21-16} = 0b000000;
7307 let Inst{15-12} = opcode;
7308 let Inst{11-10} = size;
7309 let Inst{9-5} = vaddr;
7310 let Inst{4-0} = Vt;
7311}
7312
7313class BaseSIMDLdStPost<bit Q, bit L, bits<4> opcode, bits<2> size,
7314 string asm, dag oops, dag iops>
7315 : I<oops, iops, asm, "\t$Vt, $vaddr, $Xm", "", []> {
7316 bits<5> Vt;
7317 bits<5> vaddr;
7318 bits<5> Xm;
7319 let Inst{31} = 0;
7320 let Inst{30} = Q;
7321 let Inst{29-23} = 0b0011001;
7322 let Inst{22} = L;
7323 let Inst{21} = 0;
7324 let Inst{20-16} = Xm;
7325 let Inst{15-12} = opcode;
7326 let Inst{11-10} = size;
7327 let Inst{9-5} = vaddr;
7328 let Inst{4-0} = Vt;
7329 let DecoderMethod = "DecodeSIMDLdStPost";
7330}
7331
7332// The immediate form of AdvSIMD post-indexed addressing is encoded with
7333// register post-index addressing from the zero register.
7334multiclass SIMDLdStAliases<string asm, string layout, string Count,
7335 int Offset, int Size> {
7336 // E.g. "ld1 { v0.8b, v1.8b }, [x1], #16"
7337 // "ld1\t$Vt, $vaddr, #16"
7338 // may get mapped to
7339 // (LD1Twov8b_POST VecListTwo8b:$Vt, am_simdnoindex:$vaddr, XZR)
7340 def : InstAlias<asm # "\t$Vt, $vaddr, #" # Offset,
7341 (!cast<Instruction>(NAME # Count # "v" # layout # "_POST")
7342 !cast<RegisterOperand>("VecList" # Count # layout):$Vt,
7343 am_simdnoindex:$vaddr, XZR), 1>;
7344
7345 // E.g. "ld1.8b { v0, v1 }, [x1], #16"
7346 // "ld1.8b\t$Vt, $vaddr, #16"
7347 // may get mapped to
7348 // (LD1Twov8b_POST VecListTwo64:$Vt, am_simdnoindex:$vaddr, XZR)
7349 def : InstAlias<asm # "." # layout # "\t$Vt, $vaddr, #" # Offset,
7350 (!cast<Instruction>(NAME # Count # "v" # layout # "_POST")
7351 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
7352 am_simdnoindex:$vaddr, XZR), 0>;
7353
7354 // E.g. "ld1.8b { v0, v1 }, [x1]"
7355 // "ld1\t$Vt, $vaddr"
7356 // may get mapped to
7357 // (LD1Twov8b VecListTwo64:$Vt, am_simdnoindex:$vaddr)
7358 def : InstAlias<asm # "." # layout # "\t$Vt, $vaddr",
7359 (!cast<Instruction>(NAME # Count # "v" # layout)
7360 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
7361 am_simdnoindex:$vaddr), 0>;
7362
7363 // E.g. "ld1.8b { v0, v1 }, [x1], x2"
7364 // "ld1\t$Vt, $vaddr, $Xm"
7365 // may get mapped to
7366 // (LD1Twov8b_POST VecListTwo64:$Vt, am_simdnoindex:$vaddr, GPR64pi8:$Xm)
7367 def : InstAlias<asm # "." # layout # "\t$Vt, $vaddr, $Xm",
7368 (!cast<Instruction>(NAME # Count # "v" # layout # "_POST")
7369 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
7370 am_simdnoindex:$vaddr,
7371 !cast<RegisterOperand>("GPR64pi" # Offset):$Xm), 0>;
7372}
7373
7374multiclass BaseSIMDLdN<string Count, string asm, string veclist, int Offset128,
7375 int Offset64, bits<4> opcode> {
7376 let hasSideEffects = 0, mayLoad = 1, mayStore = 0 in {
7377 def v16b: BaseSIMDLdSt<1, 1, opcode, 0b00, asm,
7378 (outs !cast<RegisterOperand>(veclist # "16b"):$Vt),
7379 (ins am_simdnoindex:$vaddr), []>;
7380 def v8h : BaseSIMDLdSt<1, 1, opcode, 0b01, asm,
7381 (outs !cast<RegisterOperand>(veclist # "8h"):$Vt),
7382 (ins am_simdnoindex:$vaddr), []>;
7383 def v4s : BaseSIMDLdSt<1, 1, opcode, 0b10, asm,
7384 (outs !cast<RegisterOperand>(veclist # "4s"):$Vt),
7385 (ins am_simdnoindex:$vaddr), []>;
7386 def v2d : BaseSIMDLdSt<1, 1, opcode, 0b11, asm,
7387 (outs !cast<RegisterOperand>(veclist # "2d"):$Vt),
7388 (ins am_simdnoindex:$vaddr), []>;
7389 def v8b : BaseSIMDLdSt<0, 1, opcode, 0b00, asm,
7390 (outs !cast<RegisterOperand>(veclist # "8b"):$Vt),
7391 (ins am_simdnoindex:$vaddr), []>;
7392 def v4h : BaseSIMDLdSt<0, 1, opcode, 0b01, asm,
7393 (outs !cast<RegisterOperand>(veclist # "4h"):$Vt),
7394 (ins am_simdnoindex:$vaddr), []>;
7395 def v2s : BaseSIMDLdSt<0, 1, opcode, 0b10, asm,
7396 (outs !cast<RegisterOperand>(veclist # "2s"):$Vt),
7397 (ins am_simdnoindex:$vaddr), []>;
7398
7399
7400 def v16b_POST: BaseSIMDLdStPost<1, 1, opcode, 0b00, asm,
7401 (outs !cast<RegisterOperand>(veclist # "16b"):$Vt),
7402 (ins am_simdnoindex:$vaddr,
7403 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7404 def v8h_POST : BaseSIMDLdStPost<1, 1, opcode, 0b01, asm,
7405 (outs !cast<RegisterOperand>(veclist # "8h"):$Vt),
7406 (ins am_simdnoindex:$vaddr,
7407 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7408 def v4s_POST : BaseSIMDLdStPost<1, 1, opcode, 0b10, asm,
7409 (outs !cast<RegisterOperand>(veclist # "4s"):$Vt),
7410 (ins am_simdnoindex:$vaddr,
7411 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7412 def v2d_POST : BaseSIMDLdStPost<1, 1, opcode, 0b11, asm,
7413 (outs !cast<RegisterOperand>(veclist # "2d"):$Vt),
7414 (ins am_simdnoindex:$vaddr,
7415 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7416 def v8b_POST : BaseSIMDLdStPost<0, 1, opcode, 0b00, asm,
7417 (outs !cast<RegisterOperand>(veclist # "8b"):$Vt),
7418 (ins am_simdnoindex:$vaddr,
7419 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7420 def v4h_POST : BaseSIMDLdStPost<0, 1, opcode, 0b01, asm,
7421 (outs !cast<RegisterOperand>(veclist # "4h"):$Vt),
7422 (ins am_simdnoindex:$vaddr,
7423 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7424 def v2s_POST : BaseSIMDLdStPost<0, 1, opcode, 0b10, asm,
7425 (outs !cast<RegisterOperand>(veclist # "2s"):$Vt),
7426 (ins am_simdnoindex:$vaddr,
7427 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7428 }
7429
7430 defm : SIMDLdStAliases<asm, "16b", Count, Offset128, 128>;
7431 defm : SIMDLdStAliases<asm, "8h", Count, Offset128, 128>;
7432 defm : SIMDLdStAliases<asm, "4s", Count, Offset128, 128>;
7433 defm : SIMDLdStAliases<asm, "2d", Count, Offset128, 128>;
7434 defm : SIMDLdStAliases<asm, "8b", Count, Offset64, 64>;
7435 defm : SIMDLdStAliases<asm, "4h", Count, Offset64, 64>;
7436 defm : SIMDLdStAliases<asm, "2s", Count, Offset64, 64>;
7437}
7438
7439// Only ld1/st1 has a v1d version.
7440multiclass BaseSIMDStN<string Count, string asm, string veclist, int Offset128,
7441 int Offset64, bits<4> opcode> {
7442 let hasSideEffects = 0, mayStore = 1, mayLoad = 0 in {
7443 def v16b : BaseSIMDLdSt<1, 0, opcode, 0b00, asm, (outs),
7444 (ins !cast<RegisterOperand>(veclist # "16b"):$Vt,
7445 am_simdnoindex:$vaddr), []>;
7446 def v8h : BaseSIMDLdSt<1, 0, opcode, 0b01, asm, (outs),
7447 (ins !cast<RegisterOperand>(veclist # "8h"):$Vt,
7448 am_simdnoindex:$vaddr), []>;
7449 def v4s : BaseSIMDLdSt<1, 0, opcode, 0b10, asm, (outs),
7450 (ins !cast<RegisterOperand>(veclist # "4s"):$Vt,
7451 am_simdnoindex:$vaddr), []>;
7452 def v2d : BaseSIMDLdSt<1, 0, opcode, 0b11, asm, (outs),
7453 (ins !cast<RegisterOperand>(veclist # "2d"):$Vt,
7454 am_simdnoindex:$vaddr), []>;
7455 def v8b : BaseSIMDLdSt<0, 0, opcode, 0b00, asm, (outs),
7456 (ins !cast<RegisterOperand>(veclist # "8b"):$Vt,
7457 am_simdnoindex:$vaddr), []>;
7458 def v4h : BaseSIMDLdSt<0, 0, opcode, 0b01, asm, (outs),
7459 (ins !cast<RegisterOperand>(veclist # "4h"):$Vt,
7460 am_simdnoindex:$vaddr), []>;
7461 def v2s : BaseSIMDLdSt<0, 0, opcode, 0b10, asm, (outs),
7462 (ins !cast<RegisterOperand>(veclist # "2s"):$Vt,
7463 am_simdnoindex:$vaddr), []>;
7464
7465 def v16b_POST : BaseSIMDLdStPost<1, 0, opcode, 0b00, asm, (outs),
7466 (ins !cast<RegisterOperand>(veclist # "16b"):$Vt,
7467 am_simdnoindex:$vaddr,
7468 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7469 def v8h_POST : BaseSIMDLdStPost<1, 0, opcode, 0b01, asm, (outs),
7470 (ins !cast<RegisterOperand>(veclist # "8h"):$Vt,
7471 am_simdnoindex:$vaddr,
7472 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7473 def v4s_POST : BaseSIMDLdStPost<1, 0, opcode, 0b10, asm, (outs),
7474 (ins !cast<RegisterOperand>(veclist # "4s"):$Vt,
7475 am_simdnoindex:$vaddr,
7476 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7477 def v2d_POST : BaseSIMDLdStPost<1, 0, opcode, 0b11, asm, (outs),
7478 (ins !cast<RegisterOperand>(veclist # "2d"):$Vt,
7479 am_simdnoindex:$vaddr,
7480 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7481 def v8b_POST : BaseSIMDLdStPost<0, 0, opcode, 0b00, asm, (outs),
7482 (ins !cast<RegisterOperand>(veclist # "8b"):$Vt,
7483 am_simdnoindex:$vaddr,
7484 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7485 def v4h_POST : BaseSIMDLdStPost<0, 0, opcode, 0b01, asm, (outs),
7486 (ins !cast<RegisterOperand>(veclist # "4h"):$Vt,
7487 am_simdnoindex:$vaddr,
7488 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7489 def v2s_POST : BaseSIMDLdStPost<0, 0, opcode, 0b10, asm, (outs),
7490 (ins !cast<RegisterOperand>(veclist # "2s"):$Vt,
7491 am_simdnoindex:$vaddr,
7492 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7493 }
7494
7495 defm : SIMDLdStAliases<asm, "16b", Count, Offset128, 128>;
7496 defm : SIMDLdStAliases<asm, "8h", Count, Offset128, 128>;
7497 defm : SIMDLdStAliases<asm, "4s", Count, Offset128, 128>;
7498 defm : SIMDLdStAliases<asm, "2d", Count, Offset128, 128>;
7499 defm : SIMDLdStAliases<asm, "8b", Count, Offset64, 64>;
7500 defm : SIMDLdStAliases<asm, "4h", Count, Offset64, 64>;
7501 defm : SIMDLdStAliases<asm, "2s", Count, Offset64, 64>;
7502}
7503
7504multiclass BaseSIMDLd1<string Count, string asm, string veclist,
7505 int Offset128, int Offset64, bits<4> opcode>
7506 : BaseSIMDLdN<Count, asm, veclist, Offset128, Offset64, opcode> {
7507
7508 // LD1 instructions have extra "1d" variants.
7509 let hasSideEffects = 0, mayLoad = 1, mayStore = 0 in {
7510 def v1d : BaseSIMDLdSt<0, 1, opcode, 0b11, asm,
7511 (outs !cast<RegisterOperand>(veclist # "1d"):$Vt),
7512 (ins am_simdnoindex:$vaddr), []>;
7513
7514 def v1d_POST : BaseSIMDLdStPost<0, 1, opcode, 0b11, asm,
7515 (outs !cast<RegisterOperand>(veclist # "1d"):$Vt),
7516 (ins am_simdnoindex:$vaddr,
7517 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7518 }
7519
7520 defm : SIMDLdStAliases<asm, "1d", Count, Offset64, 64>;
7521}
7522
7523multiclass BaseSIMDSt1<string Count, string asm, string veclist,
7524 int Offset128, int Offset64, bits<4> opcode>
7525 : BaseSIMDStN<Count, asm, veclist, Offset128, Offset64, opcode> {
7526
7527 // ST1 instructions have extra "1d" variants.
7528 let hasSideEffects = 0, mayLoad = 0, mayStore = 1 in {
7529 def v1d : BaseSIMDLdSt<0, 0, opcode, 0b11, asm, (outs),
7530 (ins !cast<RegisterOperand>(veclist # "1d"):$Vt,
7531 am_simdnoindex:$vaddr), []>;
7532
7533 def v1d_POST : BaseSIMDLdStPost<0, 0, opcode, 0b11, asm, (outs),
7534 (ins !cast<RegisterOperand>(veclist # "1d"):$Vt,
7535 am_simdnoindex:$vaddr,
7536 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7537 }
7538
7539 defm : SIMDLdStAliases<asm, "1d", Count, Offset64, 64>;
7540}
7541
7542multiclass SIMDLd1Multiple<string asm> {
7543 defm One : BaseSIMDLd1<"One", asm, "VecListOne", 16, 8, 0b0111>;
7544 defm Two : BaseSIMDLd1<"Two", asm, "VecListTwo", 32, 16, 0b1010>;
7545 defm Three : BaseSIMDLd1<"Three", asm, "VecListThree", 48, 24, 0b0110>;
7546 defm Four : BaseSIMDLd1<"Four", asm, "VecListFour", 64, 32, 0b0010>;
7547}
7548
7549multiclass SIMDSt1Multiple<string asm> {
7550 defm One : BaseSIMDSt1<"One", asm, "VecListOne", 16, 8, 0b0111>;
7551 defm Two : BaseSIMDSt1<"Two", asm, "VecListTwo", 32, 16, 0b1010>;
7552 defm Three : BaseSIMDSt1<"Three", asm, "VecListThree", 48, 24, 0b0110>;
7553 defm Four : BaseSIMDSt1<"Four", asm, "VecListFour", 64, 32, 0b0010>;
7554}
7555
7556multiclass SIMDLd2Multiple<string asm> {
7557 defm Two : BaseSIMDLdN<"Two", asm, "VecListTwo", 32, 16, 0b1000>;
7558}
7559
7560multiclass SIMDSt2Multiple<string asm> {
7561 defm Two : BaseSIMDStN<"Two", asm, "VecListTwo", 32, 16, 0b1000>;
7562}
7563
7564multiclass SIMDLd3Multiple<string asm> {
7565 defm Three : BaseSIMDLdN<"Three", asm, "VecListThree", 48, 24, 0b0100>;
7566}
7567
7568multiclass SIMDSt3Multiple<string asm> {
7569 defm Three : BaseSIMDStN<"Three", asm, "VecListThree", 48, 24, 0b0100>;
7570}
7571
7572multiclass SIMDLd4Multiple<string asm> {
7573 defm Four : BaseSIMDLdN<"Four", asm, "VecListFour", 64, 32, 0b0000>;
7574}
7575
7576multiclass SIMDSt4Multiple<string asm> {
7577 defm Four : BaseSIMDStN<"Four", asm, "VecListFour", 64, 32, 0b0000>;
7578}
7579
7580//---
7581// AdvSIMD Load/store single-element
7582//---
7583
7584class BaseSIMDLdStSingle<bit L, bit R, bits<3> opcode,
7585 string asm, string operands, dag oops, dag iops,
7586 list<dag> pattern>
7587 : I<oops, iops, asm, operands, "", pattern> {
7588 bits<5> Vt;
7589 bits<5> vaddr;
7590 let Inst{31} = 0;
7591 let Inst{29-24} = 0b001101;
7592 let Inst{22} = L;
7593 let Inst{21} = R;
7594 let Inst{15-13} = opcode;
7595 let Inst{9-5} = vaddr;
7596 let Inst{4-0} = Vt;
7597 let DecoderMethod = "DecodeSIMDLdStSingle";
7598}
7599
7600class BaseSIMDLdStSingleTied<bit L, bit R, bits<3> opcode,
7601 string asm, string operands, dag oops, dag iops,
7602 list<dag> pattern>
7603 : I<oops, iops, asm, operands, "$Vt = $dst", pattern> {
7604 bits<5> Vt;
7605 bits<5> vaddr;
7606 let Inst{31} = 0;
7607 let Inst{29-24} = 0b001101;
7608 let Inst{22} = L;
7609 let Inst{21} = R;
7610 let Inst{15-13} = opcode;
7611 let Inst{9-5} = vaddr;
7612 let Inst{4-0} = Vt;
7613 let DecoderMethod = "DecodeSIMDLdStSingleTied";
7614}
7615
7616
7617let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
7618class BaseSIMDLdR<bit Q, bit R, bits<3> opcode, bit S, bits<2> size, string asm,
7619 Operand listtype>
7620 : BaseSIMDLdStSingle<1, R, opcode, asm, "\t$Vt, $vaddr",
7621 (outs listtype:$Vt), (ins am_simdnoindex:$vaddr), []> {
7622 let Inst{30} = Q;
7623 let Inst{23} = 0;
7624 let Inst{20-16} = 0b00000;
7625 let Inst{12} = S;
7626 let Inst{11-10} = size;
7627}
7628let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
7629class BaseSIMDLdRPost<bit Q, bit R, bits<3> opcode, bit S, bits<2> size,
7630 string asm, Operand listtype, Operand GPR64pi>
7631 : BaseSIMDLdStSingle<1, R, opcode, asm, "\t$Vt, $vaddr, $Xm",
7632 (outs listtype:$Vt),
7633 (ins am_simdnoindex:$vaddr, GPR64pi:$Xm), []> {
7634 bits<5> Xm;
7635 let Inst{30} = Q;
7636 let Inst{23} = 1;
7637 let Inst{20-16} = Xm;
7638 let Inst{12} = S;
7639 let Inst{11-10} = size;
7640}
7641
7642multiclass SIMDLdrAliases<string asm, string layout, string Count,
7643 int Offset, int Size> {
7644 // E.g. "ld1r { v0.8b }, [x1], #1"
7645 // "ld1r.8b\t$Vt, $vaddr, #1"
7646 // may get mapped to
7647 // (LD1Rv8b_POST VecListOne8b:$Vt, am_simdnoindex:$vaddr, XZR)
7648 def : InstAlias<asm # "\t$Vt, $vaddr, #" # Offset,
7649 (!cast<Instruction>(NAME # "v" # layout # "_POST")
7650 !cast<RegisterOperand>("VecList" # Count # layout):$Vt,
7651 am_simdnoindex:$vaddr, XZR), 1>;
7652
7653 // E.g. "ld1r.8b { v0 }, [x1], #1"
7654 // "ld1r.8b\t$Vt, $vaddr, #1"
7655 // may get mapped to
7656 // (LD1Rv8b_POST VecListOne64:$Vt, am_simdnoindex:$vaddr, XZR)
7657 def : InstAlias<asm # "." # layout # "\t$Vt, $vaddr, #" # Offset,
7658 (!cast<Instruction>(NAME # "v" # layout # "_POST")
7659 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
7660 am_simdnoindex:$vaddr, XZR), 0>;
7661
7662 // E.g. "ld1r.8b { v0 }, [x1]"
7663 // "ld1r.8b\t$Vt, $vaddr"
7664 // may get mapped to
7665 // (LD1Rv8b VecListOne64:$Vt, am_simdnoindex:$vaddr)
7666 def : InstAlias<asm # "." # layout # "\t$Vt, $vaddr",
7667 (!cast<Instruction>(NAME # "v" # layout)
7668 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
7669 am_simdnoindex:$vaddr), 0>;
7670
7671 // E.g. "ld1r.8b { v0 }, [x1], x2"
7672 // "ld1r.8b\t$Vt, $vaddr, $Xm"
7673 // may get mapped to
7674 // (LD1Rv8b_POST VecListOne64:$Vt, am_simdnoindex:$vaddr, GPR64pi1:$Xm)
7675 def : InstAlias<asm # "." # layout # "\t$Vt, $vaddr, $Xm",
7676 (!cast<Instruction>(NAME # "v" # layout # "_POST")
7677 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
7678 am_simdnoindex:$vaddr,
7679 !cast<RegisterOperand>("GPR64pi" # Offset):$Xm), 0>;
7680}
7681
7682multiclass SIMDLdR<bit R, bits<3> opcode, bit S, string asm, string Count,
7683 int Offset1, int Offset2, int Offset4, int Offset8> {
7684 def v8b : BaseSIMDLdR<0, R, opcode, S, 0b00, asm,
7685 !cast<Operand>("VecList" # Count # "8b")>;
7686 def v16b: BaseSIMDLdR<1, R, opcode, S, 0b00, asm,
7687 !cast<Operand>("VecList" # Count #"16b")>;
7688 def v4h : BaseSIMDLdR<0, R, opcode, S, 0b01, asm,
7689 !cast<Operand>("VecList" # Count #"4h")>;
7690 def v8h : BaseSIMDLdR<1, R, opcode, S, 0b01, asm,
7691 !cast<Operand>("VecList" # Count #"8h")>;
7692 def v2s : BaseSIMDLdR<0, R, opcode, S, 0b10, asm,
7693 !cast<Operand>("VecList" # Count #"2s")>;
7694 def v4s : BaseSIMDLdR<1, R, opcode, S, 0b10, asm,
7695 !cast<Operand>("VecList" # Count #"4s")>;
7696 def v1d : BaseSIMDLdR<0, R, opcode, S, 0b11, asm,
7697 !cast<Operand>("VecList" # Count #"1d")>;
7698 def v2d : BaseSIMDLdR<1, R, opcode, S, 0b11, asm,
7699 !cast<Operand>("VecList" # Count #"2d")>;
7700
7701 def v8b_POST : BaseSIMDLdRPost<0, R, opcode, S, 0b00, asm,
7702 !cast<Operand>("VecList" # Count # "8b"),
7703 !cast<Operand>("GPR64pi" # Offset1)>;
7704 def v16b_POST: BaseSIMDLdRPost<1, R, opcode, S, 0b00, asm,
7705 !cast<Operand>("VecList" # Count # "16b"),
7706 !cast<Operand>("GPR64pi" # Offset1)>;
7707 def v4h_POST : BaseSIMDLdRPost<0, R, opcode, S, 0b01, asm,
7708 !cast<Operand>("VecList" # Count # "4h"),
7709 !cast<Operand>("GPR64pi" # Offset2)>;
7710 def v8h_POST : BaseSIMDLdRPost<1, R, opcode, S, 0b01, asm,
7711 !cast<Operand>("VecList" # Count # "8h"),
7712 !cast<Operand>("GPR64pi" # Offset2)>;
7713 def v2s_POST : BaseSIMDLdRPost<0, R, opcode, S, 0b10, asm,
7714 !cast<Operand>("VecList" # Count # "2s"),
7715 !cast<Operand>("GPR64pi" # Offset4)>;
7716 def v4s_POST : BaseSIMDLdRPost<1, R, opcode, S, 0b10, asm,
7717 !cast<Operand>("VecList" # Count # "4s"),
7718 !cast<Operand>("GPR64pi" # Offset4)>;
7719 def v1d_POST : BaseSIMDLdRPost<0, R, opcode, S, 0b11, asm,
7720 !cast<Operand>("VecList" # Count # "1d"),
7721 !cast<Operand>("GPR64pi" # Offset8)>;
7722 def v2d_POST : BaseSIMDLdRPost<1, R, opcode, S, 0b11, asm,
7723 !cast<Operand>("VecList" # Count # "2d"),
7724 !cast<Operand>("GPR64pi" # Offset8)>;
7725
7726 defm : SIMDLdrAliases<asm, "8b", Count, Offset1, 64>;
7727 defm : SIMDLdrAliases<asm, "16b", Count, Offset1, 128>;
7728 defm : SIMDLdrAliases<asm, "4h", Count, Offset2, 64>;
7729 defm : SIMDLdrAliases<asm, "8h", Count, Offset2, 128>;
7730 defm : SIMDLdrAliases<asm, "2s", Count, Offset4, 64>;
7731 defm : SIMDLdrAliases<asm, "4s", Count, Offset4, 128>;
7732 defm : SIMDLdrAliases<asm, "1d", Count, Offset8, 64>;
7733 defm : SIMDLdrAliases<asm, "2d", Count, Offset8, 128>;
7734}
7735
7736class SIMDLdStSingleB<bit L, bit R, bits<3> opcode, string asm,
7737 dag oops, dag iops, list<dag> pattern>
7738 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, $vaddr", oops, iops,
7739 pattern> {
7740 // idx encoded in Q:S:size fields.
7741 bits<4> idx;
7742 let Inst{30} = idx{3};
7743 let Inst{23} = 0;
7744 let Inst{20-16} = 0b00000;
7745 let Inst{12} = idx{2};
7746 let Inst{11-10} = idx{1-0};
7747}
7748class SIMDLdStSingleBTied<bit L, bit R, bits<3> opcode, string asm,
7749 dag oops, dag iops, list<dag> pattern>
7750 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, $vaddr", oops, iops,
7751 pattern> {
7752 // idx encoded in Q:S:size fields.
7753 bits<4> idx;
7754 let Inst{30} = idx{3};
7755 let Inst{23} = 0;
7756 let Inst{20-16} = 0b00000;
7757 let Inst{12} = idx{2};
7758 let Inst{11-10} = idx{1-0};
7759}
7760class SIMDLdStSingleBPost<bit L, bit R, bits<3> opcode, string asm,
7761 dag oops, dag iops>
7762 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, $vaddr, $Xm",
7763 oops, iops, []> {
7764 // idx encoded in Q:S:size fields.
7765 bits<4> idx;
7766 bits<5> Xm;
7767 let Inst{30} = idx{3};
7768 let Inst{23} = 1;
7769 let Inst{20-16} = Xm;
7770 let Inst{12} = idx{2};
7771 let Inst{11-10} = idx{1-0};
7772}
7773class SIMDLdStSingleBTiedPost<bit L, bit R, bits<3> opcode, string asm,
7774 dag oops, dag iops>
7775 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, $vaddr, $Xm",
7776 oops, iops, []> {
7777 // idx encoded in Q:S:size fields.
7778 bits<4> idx;
7779 bits<5> Xm;
7780 let Inst{30} = idx{3};
7781 let Inst{23} = 1;
7782 let Inst{20-16} = Xm;
7783 let Inst{12} = idx{2};
7784 let Inst{11-10} = idx{1-0};
7785}
7786
7787class SIMDLdStSingleH<bit L, bit R, bits<3> opcode, bit size, string asm,
7788 dag oops, dag iops, list<dag> pattern>
7789 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, $vaddr", oops, iops,
7790 pattern> {
7791 // idx encoded in Q:S:size<1> fields.
7792 bits<3> idx;
7793 let Inst{30} = idx{2};
7794 let Inst{23} = 0;
7795 let Inst{20-16} = 0b00000;
7796 let Inst{12} = idx{1};
7797 let Inst{11} = idx{0};
7798 let Inst{10} = size;
7799}
7800class SIMDLdStSingleHTied<bit L, bit R, bits<3> opcode, bit size, string asm,
7801 dag oops, dag iops, list<dag> pattern>
7802 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, $vaddr", oops, iops,
7803 pattern> {
7804 // idx encoded in Q:S:size<1> fields.
7805 bits<3> idx;
7806 let Inst{30} = idx{2};
7807 let Inst{23} = 0;
7808 let Inst{20-16} = 0b00000;
7809 let Inst{12} = idx{1};
7810 let Inst{11} = idx{0};
7811 let Inst{10} = size;
7812}
7813
7814class SIMDLdStSingleHPost<bit L, bit R, bits<3> opcode, bit size, string asm,
7815 dag oops, dag iops>
7816 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, $vaddr, $Xm",
7817 oops, iops, []> {
7818 // idx encoded in Q:S:size<1> fields.
7819 bits<3> idx;
7820 bits<5> Xm;
7821 let Inst{30} = idx{2};
7822 let Inst{23} = 1;
7823 let Inst{20-16} = Xm;
7824 let Inst{12} = idx{1};
7825 let Inst{11} = idx{0};
7826 let Inst{10} = size;
7827}
7828class SIMDLdStSingleHTiedPost<bit L, bit R, bits<3> opcode, bit size, string asm,
7829 dag oops, dag iops>
7830 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, $vaddr, $Xm",
7831 oops, iops, []> {
7832 // idx encoded in Q:S:size<1> fields.
7833 bits<3> idx;
7834 bits<5> Xm;
7835 let Inst{30} = idx{2};
7836 let Inst{23} = 1;
7837 let Inst{20-16} = Xm;
7838 let Inst{12} = idx{1};
7839 let Inst{11} = idx{0};
7840 let Inst{10} = size;
7841}
7842class SIMDLdStSingleS<bit L, bit R, bits<3> opcode, bits<2> size, string asm,
7843 dag oops, dag iops, list<dag> pattern>
7844 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, $vaddr", oops, iops,
7845 pattern> {
7846 // idx encoded in Q:S fields.
7847 bits<2> idx;
7848 let Inst{30} = idx{1};
7849 let Inst{23} = 0;
7850 let Inst{20-16} = 0b00000;
7851 let Inst{12} = idx{0};
7852 let Inst{11-10} = size;
7853}
7854class SIMDLdStSingleSTied<bit L, bit R, bits<3> opcode, bits<2> size, string asm,
7855 dag oops, dag iops, list<dag> pattern>
7856 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, $vaddr", oops, iops,
7857 pattern> {
7858 // idx encoded in Q:S fields.
7859 bits<2> idx;
7860 let Inst{30} = idx{1};
7861 let Inst{23} = 0;
7862 let Inst{20-16} = 0b00000;
7863 let Inst{12} = idx{0};
7864 let Inst{11-10} = size;
7865}
7866class SIMDLdStSingleSPost<bit L, bit R, bits<3> opcode, bits<2> size,
7867 string asm, dag oops, dag iops>
7868 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, $vaddr, $Xm",
7869 oops, iops, []> {
7870 // idx encoded in Q:S fields.
7871 bits<2> idx;
7872 bits<5> Xm;
7873 let Inst{30} = idx{1};
7874 let Inst{23} = 1;
7875 let Inst{20-16} = Xm;
7876 let Inst{12} = idx{0};
7877 let Inst{11-10} = size;
7878}
7879class SIMDLdStSingleSTiedPost<bit L, bit R, bits<3> opcode, bits<2> size,
7880 string asm, dag oops, dag iops>
7881 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, $vaddr, $Xm",
7882 oops, iops, []> {
7883 // idx encoded in Q:S fields.
7884 bits<2> idx;
7885 bits<5> Xm;
7886 let Inst{30} = idx{1};
7887 let Inst{23} = 1;
7888 let Inst{20-16} = Xm;
7889 let Inst{12} = idx{0};
7890 let Inst{11-10} = size;
7891}
7892class SIMDLdStSingleD<bit L, bit R, bits<3> opcode, bits<2> size, string asm,
7893 dag oops, dag iops, list<dag> pattern>
7894 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, $vaddr", oops, iops,
7895 pattern> {
7896 // idx encoded in Q field.
7897 bits<1> idx;
7898 let Inst{30} = idx;
7899 let Inst{23} = 0;
7900 let Inst{20-16} = 0b00000;
7901 let Inst{12} = 0;
7902 let Inst{11-10} = size;
7903}
7904class SIMDLdStSingleDTied<bit L, bit R, bits<3> opcode, bits<2> size, string asm,
7905 dag oops, dag iops, list<dag> pattern>
7906 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, $vaddr", oops, iops,
7907 pattern> {
7908 // idx encoded in Q field.
7909 bits<1> idx;
7910 let Inst{30} = idx;
7911 let Inst{23} = 0;
7912 let Inst{20-16} = 0b00000;
7913 let Inst{12} = 0;
7914 let Inst{11-10} = size;
7915}
7916class SIMDLdStSingleDPost<bit L, bit R, bits<3> opcode, bits<2> size,
7917 string asm, dag oops, dag iops>
7918 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, $vaddr, $Xm",
7919 oops, iops, []> {
7920 // idx encoded in Q field.
7921 bits<1> idx;
7922 bits<5> Xm;
7923 let Inst{30} = idx;
7924 let Inst{23} = 1;
7925 let Inst{20-16} = Xm;
7926 let Inst{12} = 0;
7927 let Inst{11-10} = size;
7928}
7929class SIMDLdStSingleDTiedPost<bit L, bit R, bits<3> opcode, bits<2> size,
7930 string asm, dag oops, dag iops>
7931 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, $vaddr, $Xm",
7932 oops, iops, []> {
7933 // idx encoded in Q field.
7934 bits<1> idx;
7935 bits<5> Xm;
7936 let Inst{30} = idx;
7937 let Inst{23} = 1;
7938 let Inst{20-16} = Xm;
7939 let Inst{12} = 0;
7940 let Inst{11-10} = size;
7941}
7942
7943let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
7944multiclass SIMDLdSingleBTied<bit R, bits<3> opcode, string asm,
7945 RegisterOperand listtype,
7946 RegisterOperand GPR64pi> {
7947 def i8 : SIMDLdStSingleBTied<1, R, opcode, asm,
7948 (outs listtype:$dst),
7949 (ins listtype:$Vt, VectorIndexB:$idx,
7950 am_simdnoindex:$vaddr), []>;
7951
7952 def i8_POST : SIMDLdStSingleBTiedPost<1, R, opcode, asm,
7953 (outs listtype:$dst),
7954 (ins listtype:$Vt, VectorIndexB:$idx,
7955 am_simdnoindex:$vaddr, GPR64pi:$Xm)>;
7956}
7957let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
7958multiclass SIMDLdSingleHTied<bit R, bits<3> opcode, bit size, string asm,
7959 RegisterOperand listtype,
7960 RegisterOperand GPR64pi> {
7961 def i16 : SIMDLdStSingleHTied<1, R, opcode, size, asm,
7962 (outs listtype:$dst),
7963 (ins listtype:$Vt, VectorIndexH:$idx,
7964 am_simdnoindex:$vaddr), []>;
7965
7966 def i16_POST : SIMDLdStSingleHTiedPost<1, R, opcode, size, asm,
7967 (outs listtype:$dst),
7968 (ins listtype:$Vt, VectorIndexH:$idx,
7969 am_simdnoindex:$vaddr, GPR64pi:$Xm)>;
7970}
7971let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
7972multiclass SIMDLdSingleSTied<bit R, bits<3> opcode, bits<2> size,string asm,
7973 RegisterOperand listtype,
7974 RegisterOperand GPR64pi> {
7975 def i32 : SIMDLdStSingleSTied<1, R, opcode, size, asm,
7976 (outs listtype:$dst),
7977 (ins listtype:$Vt, VectorIndexS:$idx,
7978 am_simdnoindex:$vaddr), []>;
7979
7980 def i32_POST : SIMDLdStSingleSTiedPost<1, R, opcode, size, asm,
7981 (outs listtype:$dst),
7982 (ins listtype:$Vt, VectorIndexS:$idx,
7983 am_simdnoindex:$vaddr, GPR64pi:$Xm)>;
7984}
7985let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
7986multiclass SIMDLdSingleDTied<bit R, bits<3> opcode, bits<2> size, string asm,
Tim Northoverff179ba2014-04-01 10:37:09 +00007987 RegisterOperand listtype, RegisterOperand GPR64pi> {
Tim Northover00ed9962014-03-29 10:18:08 +00007988 def i64 : SIMDLdStSingleDTied<1, R, opcode, size, asm,
7989 (outs listtype:$dst),
7990 (ins listtype:$Vt, VectorIndexD:$idx,
7991 am_simdnoindex:$vaddr), []>;
7992
7993 def i64_POST : SIMDLdStSingleDTiedPost<1, R, opcode, size, asm,
7994 (outs listtype:$dst),
7995 (ins listtype:$Vt, VectorIndexD:$idx,
7996 am_simdnoindex:$vaddr, GPR64pi:$Xm)>;
7997}
7998let mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
7999multiclass SIMDStSingleB<bit R, bits<3> opcode, string asm,
Tim Northoverff179ba2014-04-01 10:37:09 +00008000 RegisterOperand listtype, RegisterOperand GPR64pi> {
Tim Northover00ed9962014-03-29 10:18:08 +00008001 def i8 : SIMDLdStSingleB<0, R, opcode, asm,
8002 (outs), (ins listtype:$Vt, VectorIndexB:$idx,
Tim Northoverff179ba2014-04-01 10:37:09 +00008003 am_simdnoindex:$vaddr), []>;
Tim Northover00ed9962014-03-29 10:18:08 +00008004
8005 def i8_POST : SIMDLdStSingleBPost<0, R, opcode, asm,
8006 (outs), (ins listtype:$Vt, VectorIndexB:$idx,
8007 am_simdnoindex:$vaddr, GPR64pi:$Xm)>;
8008}
8009let mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
8010multiclass SIMDStSingleH<bit R, bits<3> opcode, bit size, string asm,
Tim Northoverff179ba2014-04-01 10:37:09 +00008011 RegisterOperand listtype, RegisterOperand GPR64pi> {
Tim Northover00ed9962014-03-29 10:18:08 +00008012 def i16 : SIMDLdStSingleH<0, R, opcode, size, asm,
8013 (outs), (ins listtype:$Vt, VectorIndexH:$idx,
Tim Northoverff179ba2014-04-01 10:37:09 +00008014 am_simdnoindex:$vaddr), []>;
Tim Northover00ed9962014-03-29 10:18:08 +00008015
8016 def i16_POST : SIMDLdStSingleHPost<0, R, opcode, size, asm,
8017 (outs), (ins listtype:$Vt, VectorIndexH:$idx,
8018 am_simdnoindex:$vaddr, GPR64pi:$Xm)>;
8019}
8020let mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
8021multiclass SIMDStSingleS<bit R, bits<3> opcode, bits<2> size,string asm,
Tim Northoverff179ba2014-04-01 10:37:09 +00008022 RegisterOperand listtype, RegisterOperand GPR64pi> {
Tim Northover00ed9962014-03-29 10:18:08 +00008023 def i32 : SIMDLdStSingleS<0, R, opcode, size, asm,
8024 (outs), (ins listtype:$Vt, VectorIndexS:$idx,
Tim Northoverff179ba2014-04-01 10:37:09 +00008025 am_simdnoindex:$vaddr), []>;
Tim Northover00ed9962014-03-29 10:18:08 +00008026
8027 def i32_POST : SIMDLdStSingleSPost<0, R, opcode, size, asm,
8028 (outs), (ins listtype:$Vt, VectorIndexS:$idx,
8029 am_simdnoindex:$vaddr, GPR64pi:$Xm)>;
8030}
8031let mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
8032multiclass SIMDStSingleD<bit R, bits<3> opcode, bits<2> size, string asm,
Tim Northoverff179ba2014-04-01 10:37:09 +00008033 RegisterOperand listtype, RegisterOperand GPR64pi> {
Tim Northover00ed9962014-03-29 10:18:08 +00008034 def i64 : SIMDLdStSingleD<0, R, opcode, size, asm,
8035 (outs), (ins listtype:$Vt, VectorIndexD:$idx,
Tim Northoverff179ba2014-04-01 10:37:09 +00008036 am_simdnoindex:$vaddr), []>;
Tim Northover00ed9962014-03-29 10:18:08 +00008037
8038 def i64_POST : SIMDLdStSingleDPost<0, R, opcode, size, asm,
8039 (outs), (ins listtype:$Vt, VectorIndexD:$idx,
8040 am_simdnoindex:$vaddr, GPR64pi:$Xm)>;
8041}
8042
8043multiclass SIMDLdStSingleAliases<string asm, string layout, string Type,
8044 string Count, int Offset, Operand idxtype> {
8045 // E.g. "ld1 { v0.8b }[0], [x1], #1"
8046 // "ld1\t$Vt, $vaddr, #1"
8047 // may get mapped to
8048 // (LD1Rv8b_POST VecListOne8b:$Vt, am_simdnoindex:$vaddr, XZR)
8049 def : InstAlias<asm # "\t$Vt$idx, $vaddr, #" # Offset,
8050 (!cast<Instruction>(NAME # Type # "_POST")
8051 !cast<RegisterOperand>("VecList" # Count # layout):$Vt,
8052 idxtype:$idx, am_simdnoindex:$vaddr, XZR), 1>;
8053
8054 // E.g. "ld1.8b { v0 }[0], [x1], #1"
8055 // "ld1.8b\t$Vt, $vaddr, #1"
8056 // may get mapped to
8057 // (LD1Rv8b_POST VecListOne64:$Vt, am_simdnoindex:$vaddr, XZR)
8058 def : InstAlias<asm # "." # layout # "\t$Vt$idx, $vaddr, #" # Offset,
8059 (!cast<Instruction>(NAME # Type # "_POST")
8060 !cast<RegisterOperand>("VecList" # Count # "128"):$Vt,
8061 idxtype:$idx, am_simdnoindex:$vaddr, XZR), 0>;
8062
8063 // E.g. "ld1.8b { v0 }[0], [x1]"
8064 // "ld1.8b\t$Vt, $vaddr"
8065 // may get mapped to
8066 // (LD1Rv8b VecListOne64:$Vt, am_simdnoindex:$vaddr)
8067 def : InstAlias<asm # "." # layout # "\t$Vt$idx, $vaddr",
8068 (!cast<Instruction>(NAME # Type)
8069 !cast<RegisterOperand>("VecList" # Count # "128"):$Vt,
8070 idxtype:$idx, am_simdnoindex:$vaddr), 0>;
8071
8072 // E.g. "ld1.8b { v0 }[0], [x1], x2"
8073 // "ld1.8b\t$Vt, $vaddr, $Xm"
8074 // may get mapped to
8075 // (LD1Rv8b_POST VecListOne64:$Vt, am_simdnoindex:$vaddr, GPR64pi1:$Xm)
8076 def : InstAlias<asm # "." # layout # "\t$Vt$idx, $vaddr, $Xm",
8077 (!cast<Instruction>(NAME # Type # "_POST")
8078 !cast<RegisterOperand>("VecList" # Count # "128"):$Vt,
8079 idxtype:$idx, am_simdnoindex:$vaddr,
8080 !cast<RegisterOperand>("GPR64pi" # Offset):$Xm), 0>;
8081}
8082
8083multiclass SIMDLdSt1SingleAliases<string asm> {
8084 defm : SIMDLdStSingleAliases<asm, "b", "i8", "One", 1, VectorIndexB>;
8085 defm : SIMDLdStSingleAliases<asm, "h", "i16", "One", 2, VectorIndexH>;
8086 defm : SIMDLdStSingleAliases<asm, "s", "i32", "One", 4, VectorIndexS>;
8087 defm : SIMDLdStSingleAliases<asm, "d", "i64", "One", 8, VectorIndexD>;
8088}
8089
8090multiclass SIMDLdSt2SingleAliases<string asm> {
8091 defm : SIMDLdStSingleAliases<asm, "b", "i8", "Two", 2, VectorIndexB>;
8092 defm : SIMDLdStSingleAliases<asm, "h", "i16", "Two", 4, VectorIndexH>;
8093 defm : SIMDLdStSingleAliases<asm, "s", "i32", "Two", 8, VectorIndexS>;
8094 defm : SIMDLdStSingleAliases<asm, "d", "i64", "Two", 16, VectorIndexD>;
8095}
8096
8097multiclass SIMDLdSt3SingleAliases<string asm> {
8098 defm : SIMDLdStSingleAliases<asm, "b", "i8", "Three", 3, VectorIndexB>;
8099 defm : SIMDLdStSingleAliases<asm, "h", "i16", "Three", 6, VectorIndexH>;
8100 defm : SIMDLdStSingleAliases<asm, "s", "i32", "Three", 12, VectorIndexS>;
8101 defm : SIMDLdStSingleAliases<asm, "d", "i64", "Three", 24, VectorIndexD>;
8102}
8103
8104multiclass SIMDLdSt4SingleAliases<string asm> {
8105 defm : SIMDLdStSingleAliases<asm, "b", "i8", "Four", 4, VectorIndexB>;
8106 defm : SIMDLdStSingleAliases<asm, "h", "i16", "Four", 8, VectorIndexH>;
8107 defm : SIMDLdStSingleAliases<asm, "s", "i32", "Four", 16, VectorIndexS>;
8108 defm : SIMDLdStSingleAliases<asm, "d", "i64", "Four", 32, VectorIndexD>;
8109}
8110
8111//----------------------------------------------------------------------------
8112// Crypto extensions
8113//----------------------------------------------------------------------------
8114
8115let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
8116class AESBase<bits<4> opc, string asm, dag outs, dag ins, string cstr,
8117 list<dag> pat>
8118 : I<outs, ins, asm, "{\t$Rd.16b, $Rn.16b|.16b\t$Rd, $Rn}", cstr, pat>,
8119 Sched<[WriteV]>{
8120 bits<5> Rd;
8121 bits<5> Rn;
8122 let Inst{31-16} = 0b0100111000101000;
8123 let Inst{15-12} = opc;
8124 let Inst{11-10} = 0b10;
8125 let Inst{9-5} = Rn;
8126 let Inst{4-0} = Rd;
8127}
8128
8129class AESInst<bits<4> opc, string asm, Intrinsic OpNode>
8130 : AESBase<opc, asm, (outs V128:$Rd), (ins V128:$Rn), "",
8131 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn)))]>;
8132
8133class AESTiedInst<bits<4> opc, string asm, Intrinsic OpNode>
8134 : AESBase<opc, asm, (outs V128:$dst), (ins V128:$Rd, V128:$Rn),
8135 "$Rd = $dst",
8136 [(set (v16i8 V128:$dst),
8137 (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn)))]>;
8138
8139let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
8140class SHA3OpTiedInst<bits<3> opc, string asm, string dst_lhs_kind,
8141 dag oops, dag iops, list<dag> pat>
8142 : I<oops, iops, asm,
8143 "{\t$Rd" # dst_lhs_kind # ", $Rn" # dst_lhs_kind # ", $Rm.4s" #
8144 "|.4s\t$Rd, $Rn, $Rm}", "$Rd = $dst", pat>,
8145 Sched<[WriteV]>{
8146 bits<5> Rd;
8147 bits<5> Rn;
8148 bits<5> Rm;
8149 let Inst{31-21} = 0b01011110000;
8150 let Inst{20-16} = Rm;
8151 let Inst{15} = 0;
8152 let Inst{14-12} = opc;
8153 let Inst{11-10} = 0b00;
8154 let Inst{9-5} = Rn;
8155 let Inst{4-0} = Rd;
8156}
8157
8158class SHATiedInstQSV<bits<3> opc, string asm, Intrinsic OpNode>
8159 : SHA3OpTiedInst<opc, asm, "", (outs FPR128:$dst),
8160 (ins FPR128:$Rd, FPR32:$Rn, V128:$Rm),
8161 [(set (v4i32 FPR128:$dst),
8162 (OpNode (v4i32 FPR128:$Rd), (i32 FPR32:$Rn),
8163 (v4i32 V128:$Rm)))]>;
8164
8165class SHATiedInstVVV<bits<3> opc, string asm, Intrinsic OpNode>
8166 : SHA3OpTiedInst<opc, asm, ".4s", (outs V128:$dst),
8167 (ins V128:$Rd, V128:$Rn, V128:$Rm),
8168 [(set (v4i32 V128:$dst),
8169 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn),
8170 (v4i32 V128:$Rm)))]>;
8171
8172class SHATiedInstQQV<bits<3> opc, string asm, Intrinsic OpNode>
8173 : SHA3OpTiedInst<opc, asm, "", (outs FPR128:$dst),
8174 (ins FPR128:$Rd, FPR128:$Rn, V128:$Rm),
8175 [(set (v4i32 FPR128:$dst),
8176 (OpNode (v4i32 FPR128:$Rd), (v4i32 FPR128:$Rn),
8177 (v4i32 V128:$Rm)))]>;
8178
8179let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
8180class SHA2OpInst<bits<4> opc, string asm, string kind,
8181 string cstr, dag oops, dag iops,
8182 list<dag> pat>
8183 : I<oops, iops, asm, "{\t$Rd" # kind # ", $Rn" # kind #
8184 "|" # kind # "\t$Rd, $Rn}", cstr, pat>,
8185 Sched<[WriteV]>{
8186 bits<5> Rd;
8187 bits<5> Rn;
8188 let Inst{31-16} = 0b0101111000101000;
8189 let Inst{15-12} = opc;
8190 let Inst{11-10} = 0b10;
8191 let Inst{9-5} = Rn;
8192 let Inst{4-0} = Rd;
8193}
8194
8195class SHATiedInstVV<bits<4> opc, string asm, Intrinsic OpNode>
8196 : SHA2OpInst<opc, asm, ".4s", "$Rd = $dst", (outs V128:$dst),
8197 (ins V128:$Rd, V128:$Rn),
8198 [(set (v4i32 V128:$dst),
8199 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn)))]>;
8200
8201class SHAInstSS<bits<4> opc, string asm, Intrinsic OpNode>
8202 : SHA2OpInst<opc, asm, "", "", (outs FPR32:$Rd), (ins FPR32:$Rn),
8203 [(set (i32 FPR32:$Rd), (OpNode (i32 FPR32:$Rn)))]>;
8204
8205// Allow the size specifier tokens to be upper case, not just lower.
8206def : TokenAlias<".8B", ".8b">;
8207def : TokenAlias<".4H", ".4h">;
8208def : TokenAlias<".2S", ".2s">;
8209def : TokenAlias<".1D", ".1d">;
8210def : TokenAlias<".16B", ".16b">;
8211def : TokenAlias<".8H", ".8h">;
8212def : TokenAlias<".4S", ".4s">;
8213def : TokenAlias<".2D", ".2d">;
Bradley Smith6d7af172014-04-09 14:42:01 +00008214def : TokenAlias<".1Q", ".1q">;
Tim Northover00ed9962014-03-29 10:18:08 +00008215def : TokenAlias<".B", ".b">;
8216def : TokenAlias<".H", ".h">;
8217def : TokenAlias<".S", ".s">;
8218def : TokenAlias<".D", ".d">;
Bradley Smith6d7af172014-04-09 14:42:01 +00008219def : TokenAlias<".Q", ".q">;