blob: 42326fc182bc7453ae44d94c1503e6a5202ef150 [file] [log] [blame]
Tim Northover3b0846e2014-05-24 12:50:23 +00001//===- AArch64InstrFormats.td - AArch64 Instruction Formats --*- tblgen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9
10//===----------------------------------------------------------------------===//
11// Describe AArch64 instructions format here
12//
13
14// Format specifies the encoding used by the instruction. This is part of the
15// ad-hoc solution used to emit machine instruction encodings by our machine
16// code emitter.
17class Format<bits<2> val> {
18 bits<2> Value = val;
19}
20
21def PseudoFrm : Format<0>;
22def NormalFrm : Format<1>; // Do we need any others?
23
24// AArch64 Instruction Format
25class AArch64Inst<Format f, string cstr> : Instruction {
26 field bits<32> Inst; // Instruction encoding.
27 // Mask of bits that cause an encoding to be UNPREDICTABLE.
28 // If a bit is set, then if the corresponding bit in the
29 // target encoding differs from its value in the "Inst" field,
30 // the instruction is UNPREDICTABLE (SoftFail in abstract parlance).
31 field bits<32> Unpredictable = 0;
32 // SoftFail is the generic name for this field, but we alias it so
33 // as to make it more obvious what it means in ARM-land.
34 field bits<32> SoftFail = Unpredictable;
35 let Namespace = "AArch64";
36 Format F = f;
37 bits<2> Form = F.Value;
38 let Pattern = [];
39 let Constraints = cstr;
40}
41
42// Pseudo instructions (don't have encoding information)
43class Pseudo<dag oops, dag iops, list<dag> pattern, string cstr = "">
44 : AArch64Inst<PseudoFrm, cstr> {
45 dag OutOperandList = oops;
46 dag InOperandList = iops;
47 let Pattern = pattern;
48 let isCodeGenOnly = 1;
49}
50
51// Real instructions (have encoding information)
52class EncodedI<string cstr, list<dag> pattern> : AArch64Inst<NormalFrm, cstr> {
53 let Pattern = pattern;
54 let Size = 4;
55}
56
57// Normal instructions
58class I<dag oops, dag iops, string asm, string operands, string cstr,
59 list<dag> pattern>
60 : EncodedI<cstr, pattern> {
61 dag OutOperandList = oops;
62 dag InOperandList = iops;
63 let AsmString = !strconcat(asm, operands);
64}
65
66class TriOpFrag<dag res> : PatFrag<(ops node:$LHS, node:$MHS, node:$RHS), res>;
67class BinOpFrag<dag res> : PatFrag<(ops node:$LHS, node:$RHS), res>;
68class UnOpFrag<dag res> : PatFrag<(ops node:$LHS), res>;
69
70// Helper fragment for an extract of the high portion of a 128-bit vector.
71def extract_high_v16i8 :
72 UnOpFrag<(extract_subvector (v16i8 node:$LHS), (i64 8))>;
73def extract_high_v8i16 :
74 UnOpFrag<(extract_subvector (v8i16 node:$LHS), (i64 4))>;
75def extract_high_v4i32 :
76 UnOpFrag<(extract_subvector (v4i32 node:$LHS), (i64 2))>;
77def extract_high_v2i64 :
78 UnOpFrag<(extract_subvector (v2i64 node:$LHS), (i64 1))>;
79
80//===----------------------------------------------------------------------===//
81// Asm Operand Classes.
82//
83
84// Shifter operand for arithmetic shifted encodings.
85def ShifterOperand : AsmOperandClass {
86 let Name = "Shifter";
87}
88
89// Shifter operand for mov immediate encodings.
90def MovImm32ShifterOperand : AsmOperandClass {
91 let SuperClasses = [ShifterOperand];
92 let Name = "MovImm32Shifter";
93 let RenderMethod = "addShifterOperands";
94 let DiagnosticType = "InvalidMovImm32Shift";
95}
96def MovImm64ShifterOperand : AsmOperandClass {
97 let SuperClasses = [ShifterOperand];
98 let Name = "MovImm64Shifter";
99 let RenderMethod = "addShifterOperands";
100 let DiagnosticType = "InvalidMovImm64Shift";
101}
102
103// Shifter operand for arithmetic register shifted encodings.
104class ArithmeticShifterOperand<int width> : AsmOperandClass {
105 let SuperClasses = [ShifterOperand];
106 let Name = "ArithmeticShifter" # width;
107 let PredicateMethod = "isArithmeticShifter<" # width # ">";
108 let RenderMethod = "addShifterOperands";
109 let DiagnosticType = "AddSubRegShift" # width;
110}
111
112def ArithmeticShifterOperand32 : ArithmeticShifterOperand<32>;
113def ArithmeticShifterOperand64 : ArithmeticShifterOperand<64>;
114
115// Shifter operand for logical register shifted encodings.
116class LogicalShifterOperand<int width> : AsmOperandClass {
117 let SuperClasses = [ShifterOperand];
118 let Name = "LogicalShifter" # width;
119 let PredicateMethod = "isLogicalShifter<" # width # ">";
120 let RenderMethod = "addShifterOperands";
121 let DiagnosticType = "AddSubRegShift" # width;
122}
123
124def LogicalShifterOperand32 : LogicalShifterOperand<32>;
125def LogicalShifterOperand64 : LogicalShifterOperand<64>;
126
127// Shifter operand for logical vector 128/64-bit shifted encodings.
128def LogicalVecShifterOperand : AsmOperandClass {
129 let SuperClasses = [ShifterOperand];
130 let Name = "LogicalVecShifter";
131 let RenderMethod = "addShifterOperands";
132}
133def LogicalVecHalfWordShifterOperand : AsmOperandClass {
134 let SuperClasses = [LogicalVecShifterOperand];
135 let Name = "LogicalVecHalfWordShifter";
136 let RenderMethod = "addShifterOperands";
137}
138
139// The "MSL" shifter on the vector MOVI instruction.
140def MoveVecShifterOperand : AsmOperandClass {
141 let SuperClasses = [ShifterOperand];
142 let Name = "MoveVecShifter";
143 let RenderMethod = "addShifterOperands";
144}
145
146// Extend operand for arithmetic encodings.
147def ExtendOperand : AsmOperandClass {
148 let Name = "Extend";
149 let DiagnosticType = "AddSubRegExtendLarge";
150}
151def ExtendOperand64 : AsmOperandClass {
152 let SuperClasses = [ExtendOperand];
153 let Name = "Extend64";
154 let DiagnosticType = "AddSubRegExtendSmall";
155}
156// 'extend' that's a lsl of a 64-bit register.
157def ExtendOperandLSL64 : AsmOperandClass {
158 let SuperClasses = [ExtendOperand];
159 let Name = "ExtendLSL64";
160 let RenderMethod = "addExtend64Operands";
161 let DiagnosticType = "AddSubRegExtendLarge";
162}
163
164// 8-bit floating-point immediate encodings.
165def FPImmOperand : AsmOperandClass {
166 let Name = "FPImm";
167 let ParserMethod = "tryParseFPImm";
168 let DiagnosticType = "InvalidFPImm";
169}
170
171def CondCode : AsmOperandClass {
172 let Name = "CondCode";
173 let DiagnosticType = "InvalidCondCode";
174}
175
176// A 32-bit register pasrsed as 64-bit
177def GPR32as64Operand : AsmOperandClass {
178 let Name = "GPR32as64";
179}
180def GPR32as64 : RegisterOperand<GPR32> {
181 let ParserMatchClass = GPR32as64Operand;
182}
183
184// 8-bit immediate for AdvSIMD where 64-bit values of the form:
185// aaaaaaaa bbbbbbbb cccccccc dddddddd eeeeeeee ffffffff gggggggg hhhhhhhh
186// are encoded as the eight bit value 'abcdefgh'.
187def SIMDImmType10Operand : AsmOperandClass { let Name = "SIMDImmType10"; }
188
189
190//===----------------------------------------------------------------------===//
191// Operand Definitions.
192//
193
194// ADR[P] instruction labels.
195def AdrpOperand : AsmOperandClass {
196 let Name = "AdrpLabel";
197 let ParserMethod = "tryParseAdrpLabel";
198 let DiagnosticType = "InvalidLabel";
199}
200def adrplabel : Operand<i64> {
201 let EncoderMethod = "getAdrLabelOpValue";
202 let PrintMethod = "printAdrpLabel";
203 let ParserMatchClass = AdrpOperand;
204}
205
206def AdrOperand : AsmOperandClass {
207 let Name = "AdrLabel";
208 let ParserMethod = "tryParseAdrLabel";
209 let DiagnosticType = "InvalidLabel";
210}
211def adrlabel : Operand<i64> {
212 let EncoderMethod = "getAdrLabelOpValue";
213 let ParserMatchClass = AdrOperand;
214}
215
216// simm9 predicate - True if the immediate is in the range [-256, 255].
217def SImm9Operand : AsmOperandClass {
218 let Name = "SImm9";
219 let DiagnosticType = "InvalidMemoryIndexedSImm9";
220}
221def simm9 : Operand<i64>, ImmLeaf<i64, [{ return Imm >= -256 && Imm < 256; }]> {
222 let ParserMatchClass = SImm9Operand;
223}
224
225// simm7sN predicate - True if the immediate is a multiple of N in the range
226// [-64 * N, 63 * N].
227class SImm7Scaled<int Scale> : AsmOperandClass {
228 let Name = "SImm7s" # Scale;
229 let DiagnosticType = "InvalidMemoryIndexed" # Scale # "SImm7";
230}
231
232def SImm7s4Operand : SImm7Scaled<4>;
233def SImm7s8Operand : SImm7Scaled<8>;
234def SImm7s16Operand : SImm7Scaled<16>;
235
236def simm7s4 : Operand<i32> {
237 let ParserMatchClass = SImm7s4Operand;
238 let PrintMethod = "printImmScale<4>";
239}
240
241def simm7s8 : Operand<i32> {
242 let ParserMatchClass = SImm7s8Operand;
243 let PrintMethod = "printImmScale<8>";
244}
245
246def simm7s16 : Operand<i32> {
247 let ParserMatchClass = SImm7s16Operand;
248 let PrintMethod = "printImmScale<16>";
249}
250
251class AsmImmRange<int Low, int High> : AsmOperandClass {
252 let Name = "Imm" # Low # "_" # High;
253 let DiagnosticType = "InvalidImm" # Low # "_" # High;
254}
255
256def Imm1_8Operand : AsmImmRange<1, 8>;
257def Imm1_16Operand : AsmImmRange<1, 16>;
258def Imm1_32Operand : AsmImmRange<1, 32>;
259def Imm1_64Operand : AsmImmRange<1, 64>;
260
261def MovZSymbolG3AsmOperand : AsmOperandClass {
262 let Name = "MovZSymbolG3";
263 let RenderMethod = "addImmOperands";
264}
265
266def movz_symbol_g3 : Operand<i32> {
267 let ParserMatchClass = MovZSymbolG3AsmOperand;
268}
269
270def MovZSymbolG2AsmOperand : AsmOperandClass {
271 let Name = "MovZSymbolG2";
272 let RenderMethod = "addImmOperands";
273}
274
275def movz_symbol_g2 : Operand<i32> {
276 let ParserMatchClass = MovZSymbolG2AsmOperand;
277}
278
279def MovZSymbolG1AsmOperand : AsmOperandClass {
280 let Name = "MovZSymbolG1";
281 let RenderMethod = "addImmOperands";
282}
283
284def movz_symbol_g1 : Operand<i32> {
285 let ParserMatchClass = MovZSymbolG1AsmOperand;
286}
287
288def MovZSymbolG0AsmOperand : AsmOperandClass {
289 let Name = "MovZSymbolG0";
290 let RenderMethod = "addImmOperands";
291}
292
293def movz_symbol_g0 : Operand<i32> {
294 let ParserMatchClass = MovZSymbolG0AsmOperand;
295}
296
297def MovKSymbolG3AsmOperand : AsmOperandClass {
298 let Name = "MovKSymbolG3";
299 let RenderMethod = "addImmOperands";
300}
301
302def movk_symbol_g3 : Operand<i32> {
303 let ParserMatchClass = MovKSymbolG3AsmOperand;
304}
305
306def MovKSymbolG2AsmOperand : AsmOperandClass {
307 let Name = "MovKSymbolG2";
308 let RenderMethod = "addImmOperands";
309}
310
311def movk_symbol_g2 : Operand<i32> {
312 let ParserMatchClass = MovKSymbolG2AsmOperand;
313}
314
315def MovKSymbolG1AsmOperand : AsmOperandClass {
316 let Name = "MovKSymbolG1";
317 let RenderMethod = "addImmOperands";
318}
319
320def movk_symbol_g1 : Operand<i32> {
321 let ParserMatchClass = MovKSymbolG1AsmOperand;
322}
323
324def MovKSymbolG0AsmOperand : AsmOperandClass {
325 let Name = "MovKSymbolG0";
326 let RenderMethod = "addImmOperands";
327}
328
329def movk_symbol_g0 : Operand<i32> {
330 let ParserMatchClass = MovKSymbolG0AsmOperand;
331}
332
333class fixedpoint_i32<ValueType FloatVT>
334 : Operand<FloatVT>,
335 ComplexPattern<FloatVT, 1, "SelectCVTFixedPosOperand<32>", [fpimm, ld]> {
336 let EncoderMethod = "getFixedPointScaleOpValue";
337 let DecoderMethod = "DecodeFixedPointScaleImm32";
338 let ParserMatchClass = Imm1_32Operand;
339}
340
341class fixedpoint_i64<ValueType FloatVT>
342 : Operand<FloatVT>,
343 ComplexPattern<FloatVT, 1, "SelectCVTFixedPosOperand<64>", [fpimm, ld]> {
344 let EncoderMethod = "getFixedPointScaleOpValue";
345 let DecoderMethod = "DecodeFixedPointScaleImm64";
346 let ParserMatchClass = Imm1_64Operand;
347}
348
349def fixedpoint_f32_i32 : fixedpoint_i32<f32>;
350def fixedpoint_f64_i32 : fixedpoint_i32<f64>;
351
352def fixedpoint_f32_i64 : fixedpoint_i64<f32>;
353def fixedpoint_f64_i64 : fixedpoint_i64<f64>;
354
355def vecshiftR8 : Operand<i32>, ImmLeaf<i32, [{
356 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 9);
357}]> {
358 let EncoderMethod = "getVecShiftR8OpValue";
359 let DecoderMethod = "DecodeVecShiftR8Imm";
360 let ParserMatchClass = Imm1_8Operand;
361}
362def vecshiftR16 : Operand<i32>, ImmLeaf<i32, [{
363 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 17);
364}]> {
365 let EncoderMethod = "getVecShiftR16OpValue";
366 let DecoderMethod = "DecodeVecShiftR16Imm";
367 let ParserMatchClass = Imm1_16Operand;
368}
369def vecshiftR16Narrow : Operand<i32>, ImmLeaf<i32, [{
370 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 9);
371}]> {
372 let EncoderMethod = "getVecShiftR16OpValue";
373 let DecoderMethod = "DecodeVecShiftR16ImmNarrow";
374 let ParserMatchClass = Imm1_8Operand;
375}
376def vecshiftR32 : Operand<i32>, ImmLeaf<i32, [{
377 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 33);
378}]> {
379 let EncoderMethod = "getVecShiftR32OpValue";
380 let DecoderMethod = "DecodeVecShiftR32Imm";
381 let ParserMatchClass = Imm1_32Operand;
382}
383def vecshiftR32Narrow : Operand<i32>, ImmLeaf<i32, [{
384 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 17);
385}]> {
386 let EncoderMethod = "getVecShiftR32OpValue";
387 let DecoderMethod = "DecodeVecShiftR32ImmNarrow";
388 let ParserMatchClass = Imm1_16Operand;
389}
390def vecshiftR64 : Operand<i32>, ImmLeaf<i32, [{
391 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 65);
392}]> {
393 let EncoderMethod = "getVecShiftR64OpValue";
394 let DecoderMethod = "DecodeVecShiftR64Imm";
395 let ParserMatchClass = Imm1_64Operand;
396}
397def vecshiftR64Narrow : Operand<i32>, ImmLeaf<i32, [{
398 return (((uint32_t)Imm) > 0) && (((uint32_t)Imm) < 33);
399}]> {
400 let EncoderMethod = "getVecShiftR64OpValue";
401 let DecoderMethod = "DecodeVecShiftR64ImmNarrow";
402 let ParserMatchClass = Imm1_32Operand;
403}
404
405def Imm0_7Operand : AsmImmRange<0, 7>;
406def Imm0_15Operand : AsmImmRange<0, 15>;
407def Imm0_31Operand : AsmImmRange<0, 31>;
408def Imm0_63Operand : AsmImmRange<0, 63>;
409
410def vecshiftL8 : Operand<i32>, ImmLeaf<i32, [{
411 return (((uint32_t)Imm) < 8);
412}]> {
413 let EncoderMethod = "getVecShiftL8OpValue";
414 let DecoderMethod = "DecodeVecShiftL8Imm";
415 let ParserMatchClass = Imm0_7Operand;
416}
417def vecshiftL16 : Operand<i32>, ImmLeaf<i32, [{
418 return (((uint32_t)Imm) < 16);
419}]> {
420 let EncoderMethod = "getVecShiftL16OpValue";
421 let DecoderMethod = "DecodeVecShiftL16Imm";
422 let ParserMatchClass = Imm0_15Operand;
423}
424def vecshiftL32 : Operand<i32>, ImmLeaf<i32, [{
425 return (((uint32_t)Imm) < 32);
426}]> {
427 let EncoderMethod = "getVecShiftL32OpValue";
428 let DecoderMethod = "DecodeVecShiftL32Imm";
429 let ParserMatchClass = Imm0_31Operand;
430}
431def vecshiftL64 : Operand<i32>, ImmLeaf<i32, [{
432 return (((uint32_t)Imm) < 64);
433}]> {
434 let EncoderMethod = "getVecShiftL64OpValue";
435 let DecoderMethod = "DecodeVecShiftL64Imm";
436 let ParserMatchClass = Imm0_63Operand;
437}
438
439
440// Crazy immediate formats used by 32-bit and 64-bit logical immediate
441// instructions for splatting repeating bit patterns across the immediate.
442def logical_imm32_XFORM : SDNodeXForm<imm, [{
443 uint64_t enc = AArch64_AM::encodeLogicalImmediate(N->getZExtValue(), 32);
444 return CurDAG->getTargetConstant(enc, MVT::i32);
445}]>;
446def logical_imm64_XFORM : SDNodeXForm<imm, [{
447 uint64_t enc = AArch64_AM::encodeLogicalImmediate(N->getZExtValue(), 64);
448 return CurDAG->getTargetConstant(enc, MVT::i32);
449}]>;
450
451def LogicalImm32Operand : AsmOperandClass {
452 let Name = "LogicalImm32";
453 let DiagnosticType = "LogicalSecondSource";
454}
455def LogicalImm64Operand : AsmOperandClass {
456 let Name = "LogicalImm64";
457 let DiagnosticType = "LogicalSecondSource";
458}
459def logical_imm32 : Operand<i32>, PatLeaf<(imm), [{
460 return AArch64_AM::isLogicalImmediate(N->getZExtValue(), 32);
461}], logical_imm32_XFORM> {
462 let PrintMethod = "printLogicalImm32";
463 let ParserMatchClass = LogicalImm32Operand;
464}
465def logical_imm64 : Operand<i64>, PatLeaf<(imm), [{
466 return AArch64_AM::isLogicalImmediate(N->getZExtValue(), 64);
467}], logical_imm64_XFORM> {
468 let PrintMethod = "printLogicalImm64";
469 let ParserMatchClass = LogicalImm64Operand;
470}
471
472// imm0_65535 predicate - True if the immediate is in the range [0,65535].
473def Imm0_65535Operand : AsmImmRange<0, 65535>;
474def imm0_65535 : Operand<i32>, ImmLeaf<i32, [{
475 return ((uint32_t)Imm) < 65536;
476}]> {
477 let ParserMatchClass = Imm0_65535Operand;
478 let PrintMethod = "printHexImm";
479}
480
481// imm0_255 predicate - True if the immediate is in the range [0,255].
482def Imm0_255Operand : AsmOperandClass { let Name = "Imm0_255"; }
483def imm0_255 : Operand<i32>, ImmLeaf<i32, [{
484 return ((uint32_t)Imm) < 256;
485}]> {
486 let ParserMatchClass = Imm0_255Operand;
487 let PrintMethod = "printHexImm";
488}
489
490// imm0_127 predicate - True if the immediate is in the range [0,127]
491def Imm0_127Operand : AsmImmRange<0, 127>;
492def imm0_127 : Operand<i32>, ImmLeaf<i32, [{
493 return ((uint32_t)Imm) < 128;
494}]> {
495 let ParserMatchClass = Imm0_127Operand;
496 let PrintMethod = "printHexImm";
497}
498
499// NOTE: These imm0_N operands have to be of type i64 because i64 is the size
500// for all shift-amounts.
501
502// imm0_63 predicate - True if the immediate is in the range [0,63]
503def imm0_63 : Operand<i64>, ImmLeaf<i64, [{
504 return ((uint64_t)Imm) < 64;
505}]> {
506 let ParserMatchClass = Imm0_63Operand;
507}
508
509// imm0_31 predicate - True if the immediate is in the range [0,31]
510def imm0_31 : Operand<i64>, ImmLeaf<i64, [{
511 return ((uint64_t)Imm) < 32;
512}]> {
513 let ParserMatchClass = Imm0_31Operand;
514}
515
516// imm0_15 predicate - True if the immediate is in the range [0,15]
517def imm0_15 : Operand<i64>, ImmLeaf<i64, [{
518 return ((uint64_t)Imm) < 16;
519}]> {
520 let ParserMatchClass = Imm0_15Operand;
521}
522
523// imm0_7 predicate - True if the immediate is in the range [0,7]
524def imm0_7 : Operand<i64>, ImmLeaf<i64, [{
525 return ((uint64_t)Imm) < 8;
526}]> {
527 let ParserMatchClass = Imm0_7Operand;
528}
529
530// An arithmetic shifter operand:
531// {7-6} - shift type: 00 = lsl, 01 = lsr, 10 = asr
532// {5-0} - imm6
533class arith_shift<ValueType Ty, int width> : Operand<Ty> {
534 let PrintMethod = "printShifter";
535 let ParserMatchClass = !cast<AsmOperandClass>(
536 "ArithmeticShifterOperand" # width);
537}
538
539def arith_shift32 : arith_shift<i32, 32>;
540def arith_shift64 : arith_shift<i64, 64>;
541
542class arith_shifted_reg<ValueType Ty, RegisterClass regclass, int width>
543 : Operand<Ty>,
544 ComplexPattern<Ty, 2, "SelectArithShiftedRegister", []> {
545 let PrintMethod = "printShiftedRegister";
546 let MIOperandInfo = (ops regclass, !cast<Operand>("arith_shift" # width));
547}
548
549def arith_shifted_reg32 : arith_shifted_reg<i32, GPR32, 32>;
550def arith_shifted_reg64 : arith_shifted_reg<i64, GPR64, 64>;
551
552// An arithmetic shifter operand:
553// {7-6} - shift type: 00 = lsl, 01 = lsr, 10 = asr, 11 = ror
554// {5-0} - imm6
555class logical_shift<int width> : Operand<i32> {
556 let PrintMethod = "printShifter";
557 let ParserMatchClass = !cast<AsmOperandClass>(
558 "LogicalShifterOperand" # width);
559}
560
561def logical_shift32 : logical_shift<32>;
562def logical_shift64 : logical_shift<64>;
563
564class logical_shifted_reg<ValueType Ty, RegisterClass regclass, Operand shiftop>
565 : Operand<Ty>,
566 ComplexPattern<Ty, 2, "SelectLogicalShiftedRegister", []> {
567 let PrintMethod = "printShiftedRegister";
568 let MIOperandInfo = (ops regclass, shiftop);
569}
570
571def logical_shifted_reg32 : logical_shifted_reg<i32, GPR32, logical_shift32>;
572def logical_shifted_reg64 : logical_shifted_reg<i64, GPR64, logical_shift64>;
573
574// A logical vector shifter operand:
575// {7-6} - shift type: 00 = lsl
576// {5-0} - imm6: #0, #8, #16, or #24
577def logical_vec_shift : Operand<i32> {
578 let PrintMethod = "printShifter";
579 let EncoderMethod = "getVecShifterOpValue";
580 let ParserMatchClass = LogicalVecShifterOperand;
581}
582
583// A logical vector half-word shifter operand:
584// {7-6} - shift type: 00 = lsl
585// {5-0} - imm6: #0 or #8
586def logical_vec_hw_shift : Operand<i32> {
587 let PrintMethod = "printShifter";
588 let EncoderMethod = "getVecShifterOpValue";
589 let ParserMatchClass = LogicalVecHalfWordShifterOperand;
590}
591
592// A vector move shifter operand:
593// {0} - imm1: #8 or #16
594def move_vec_shift : Operand<i32> {
595 let PrintMethod = "printShifter";
596 let EncoderMethod = "getMoveVecShifterOpValue";
597 let ParserMatchClass = MoveVecShifterOperand;
598}
599
600def AddSubImmOperand : AsmOperandClass {
601 let Name = "AddSubImm";
602 let ParserMethod = "tryParseAddSubImm";
603 let DiagnosticType = "AddSubSecondSource";
604}
605// An ADD/SUB immediate shifter operand:
606// second operand:
607// {7-6} - shift type: 00 = lsl
608// {5-0} - imm6: #0 or #12
609class addsub_shifted_imm<ValueType Ty>
610 : Operand<Ty>, ComplexPattern<Ty, 2, "SelectArithImmed", [imm]> {
611 let PrintMethod = "printAddSubImm";
612 let EncoderMethod = "getAddSubImmOpValue";
613 let ParserMatchClass = AddSubImmOperand;
614 let MIOperandInfo = (ops i32imm, i32imm);
615}
616
617def addsub_shifted_imm32 : addsub_shifted_imm<i32>;
618def addsub_shifted_imm64 : addsub_shifted_imm<i64>;
619
620class neg_addsub_shifted_imm<ValueType Ty>
621 : Operand<Ty>, ComplexPattern<Ty, 2, "SelectNegArithImmed", [imm]> {
622 let PrintMethod = "printAddSubImm";
623 let EncoderMethod = "getAddSubImmOpValue";
624 let ParserMatchClass = AddSubImmOperand;
625 let MIOperandInfo = (ops i32imm, i32imm);
626}
627
628def neg_addsub_shifted_imm32 : neg_addsub_shifted_imm<i32>;
629def neg_addsub_shifted_imm64 : neg_addsub_shifted_imm<i64>;
630
631// An extend operand:
632// {5-3} - extend type
633// {2-0} - imm3
634def arith_extend : Operand<i32> {
635 let PrintMethod = "printArithExtend";
636 let ParserMatchClass = ExtendOperand;
637}
638def arith_extend64 : Operand<i32> {
639 let PrintMethod = "printArithExtend";
640 let ParserMatchClass = ExtendOperand64;
641}
642
643// 'extend' that's a lsl of a 64-bit register.
644def arith_extendlsl64 : Operand<i32> {
645 let PrintMethod = "printArithExtend";
646 let ParserMatchClass = ExtendOperandLSL64;
647}
648
649class arith_extended_reg32<ValueType Ty> : Operand<Ty>,
650 ComplexPattern<Ty, 2, "SelectArithExtendedRegister", []> {
651 let PrintMethod = "printExtendedRegister";
652 let MIOperandInfo = (ops GPR32, arith_extend);
653}
654
655class arith_extended_reg32to64<ValueType Ty> : Operand<Ty>,
656 ComplexPattern<Ty, 2, "SelectArithExtendedRegister", []> {
657 let PrintMethod = "printExtendedRegister";
658 let MIOperandInfo = (ops GPR32, arith_extend64);
659}
660
661// Floating-point immediate.
662def fpimm32 : Operand<f32>,
663 PatLeaf<(f32 fpimm), [{
664 return AArch64_AM::getFP32Imm(N->getValueAPF()) != -1;
665 }], SDNodeXForm<fpimm, [{
666 APFloat InVal = N->getValueAPF();
667 uint32_t enc = AArch64_AM::getFP32Imm(InVal);
668 return CurDAG->getTargetConstant(enc, MVT::i32);
669 }]>> {
670 let ParserMatchClass = FPImmOperand;
671 let PrintMethod = "printFPImmOperand";
672}
673def fpimm64 : Operand<f64>,
674 PatLeaf<(f64 fpimm), [{
675 return AArch64_AM::getFP64Imm(N->getValueAPF()) != -1;
676 }], SDNodeXForm<fpimm, [{
677 APFloat InVal = N->getValueAPF();
678 uint32_t enc = AArch64_AM::getFP64Imm(InVal);
679 return CurDAG->getTargetConstant(enc, MVT::i32);
680 }]>> {
681 let ParserMatchClass = FPImmOperand;
682 let PrintMethod = "printFPImmOperand";
683}
684
685def fpimm8 : Operand<i32> {
686 let ParserMatchClass = FPImmOperand;
687 let PrintMethod = "printFPImmOperand";
688}
689
690def fpimm0 : PatLeaf<(fpimm), [{
691 return N->isExactlyValue(+0.0);
692}]>;
693
694// Vector lane operands
695class AsmVectorIndex<string Suffix> : AsmOperandClass {
696 let Name = "VectorIndex" # Suffix;
697 let DiagnosticType = "InvalidIndex" # Suffix;
698}
699def VectorIndex1Operand : AsmVectorIndex<"1">;
700def VectorIndexBOperand : AsmVectorIndex<"B">;
701def VectorIndexHOperand : AsmVectorIndex<"H">;
702def VectorIndexSOperand : AsmVectorIndex<"S">;
703def VectorIndexDOperand : AsmVectorIndex<"D">;
704
705def VectorIndex1 : Operand<i64>, ImmLeaf<i64, [{
706 return ((uint64_t)Imm) == 1;
707}]> {
708 let ParserMatchClass = VectorIndex1Operand;
709 let PrintMethod = "printVectorIndex";
710 let MIOperandInfo = (ops i64imm);
711}
712def VectorIndexB : Operand<i64>, ImmLeaf<i64, [{
713 return ((uint64_t)Imm) < 16;
714}]> {
715 let ParserMatchClass = VectorIndexBOperand;
716 let PrintMethod = "printVectorIndex";
717 let MIOperandInfo = (ops i64imm);
718}
719def VectorIndexH : Operand<i64>, ImmLeaf<i64, [{
720 return ((uint64_t)Imm) < 8;
721}]> {
722 let ParserMatchClass = VectorIndexHOperand;
723 let PrintMethod = "printVectorIndex";
724 let MIOperandInfo = (ops i64imm);
725}
726def VectorIndexS : Operand<i64>, ImmLeaf<i64, [{
727 return ((uint64_t)Imm) < 4;
728}]> {
729 let ParserMatchClass = VectorIndexSOperand;
730 let PrintMethod = "printVectorIndex";
731 let MIOperandInfo = (ops i64imm);
732}
733def VectorIndexD : Operand<i64>, ImmLeaf<i64, [{
734 return ((uint64_t)Imm) < 2;
735}]> {
736 let ParserMatchClass = VectorIndexDOperand;
737 let PrintMethod = "printVectorIndex";
738 let MIOperandInfo = (ops i64imm);
739}
740
741// 8-bit immediate for AdvSIMD where 64-bit values of the form:
742// aaaaaaaa bbbbbbbb cccccccc dddddddd eeeeeeee ffffffff gggggggg hhhhhhhh
743// are encoded as the eight bit value 'abcdefgh'.
744def simdimmtype10 : Operand<i32>,
745 PatLeaf<(f64 fpimm), [{
746 return AArch64_AM::isAdvSIMDModImmType10(N->getValueAPF()
747 .bitcastToAPInt()
748 .getZExtValue());
749 }], SDNodeXForm<fpimm, [{
750 APFloat InVal = N->getValueAPF();
751 uint32_t enc = AArch64_AM::encodeAdvSIMDModImmType10(N->getValueAPF()
752 .bitcastToAPInt()
753 .getZExtValue());
754 return CurDAG->getTargetConstant(enc, MVT::i32);
755 }]>> {
756 let ParserMatchClass = SIMDImmType10Operand;
757 let PrintMethod = "printSIMDType10Operand";
758}
759
760
761//---
762// System management
763//---
764
765// Base encoding for system instruction operands.
766let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
767class BaseSystemI<bit L, dag oops, dag iops, string asm, string operands>
768 : I<oops, iops, asm, operands, "", []> {
769 let Inst{31-22} = 0b1101010100;
770 let Inst{21} = L;
771}
772
773// System instructions which do not have an Rt register.
774class SimpleSystemI<bit L, dag iops, string asm, string operands>
775 : BaseSystemI<L, (outs), iops, asm, operands> {
776 let Inst{4-0} = 0b11111;
777}
778
779// System instructions which have an Rt register.
780class RtSystemI<bit L, dag oops, dag iops, string asm, string operands>
781 : BaseSystemI<L, oops, iops, asm, operands>,
782 Sched<[WriteSys]> {
783 bits<5> Rt;
784 let Inst{4-0} = Rt;
785}
786
787// Hint instructions that take both a CRm and a 3-bit immediate.
788class HintI<string mnemonic>
789 : SimpleSystemI<0, (ins imm0_127:$imm), mnemonic#" $imm", "">,
790 Sched<[WriteHint]> {
791 bits <7> imm;
792 let Inst{20-12} = 0b000110010;
793 let Inst{11-5} = imm;
794}
795
796// System instructions taking a single literal operand which encodes into
797// CRm. op2 differentiates the opcodes.
798def BarrierAsmOperand : AsmOperandClass {
799 let Name = "Barrier";
800 let ParserMethod = "tryParseBarrierOperand";
801}
802def barrier_op : Operand<i32> {
803 let PrintMethod = "printBarrierOption";
804 let ParserMatchClass = BarrierAsmOperand;
805}
806class CRmSystemI<Operand crmtype, bits<3> opc, string asm>
807 : SimpleSystemI<0, (ins crmtype:$CRm), asm, "\t$CRm">,
808 Sched<[WriteBarrier]> {
809 bits<4> CRm;
810 let Inst{20-12} = 0b000110011;
811 let Inst{11-8} = CRm;
812 let Inst{7-5} = opc;
813}
814
815// MRS/MSR system instructions. These have different operand classes because
816// a different subset of registers can be accessed through each instruction.
817def MRSSystemRegisterOperand : AsmOperandClass {
818 let Name = "MRSSystemRegister";
819 let ParserMethod = "tryParseSysReg";
820 let DiagnosticType = "MRS";
821}
822// concatenation of 1, op0, op1, CRn, CRm, op2. 16-bit immediate.
823def mrs_sysreg_op : Operand<i32> {
824 let ParserMatchClass = MRSSystemRegisterOperand;
825 let DecoderMethod = "DecodeMRSSystemRegister";
826 let PrintMethod = "printMRSSystemRegister";
827}
828
829def MSRSystemRegisterOperand : AsmOperandClass {
830 let Name = "MSRSystemRegister";
831 let ParserMethod = "tryParseSysReg";
832 let DiagnosticType = "MSR";
833}
834def msr_sysreg_op : Operand<i32> {
835 let ParserMatchClass = MSRSystemRegisterOperand;
836 let DecoderMethod = "DecodeMSRSystemRegister";
837 let PrintMethod = "printMSRSystemRegister";
838}
839
840class MRSI : RtSystemI<1, (outs GPR64:$Rt), (ins mrs_sysreg_op:$systemreg),
841 "mrs", "\t$Rt, $systemreg"> {
842 bits<15> systemreg;
843 let Inst{20} = 1;
844 let Inst{19-5} = systemreg;
845}
846
847// FIXME: Some of these def NZCV, others don't. Best way to model that?
848// Explicitly modeling each of the system register as a register class
849// would do it, but feels like overkill at this point.
850class MSRI : RtSystemI<0, (outs), (ins msr_sysreg_op:$systemreg, GPR64:$Rt),
851 "msr", "\t$systemreg, $Rt"> {
852 bits<15> systemreg;
853 let Inst{20} = 1;
854 let Inst{19-5} = systemreg;
855}
856
857def SystemPStateFieldOperand : AsmOperandClass {
858 let Name = "SystemPStateField";
859 let ParserMethod = "tryParseSysReg";
860}
861def pstatefield_op : Operand<i32> {
862 let ParserMatchClass = SystemPStateFieldOperand;
863 let PrintMethod = "printSystemPStateField";
864}
865
866let Defs = [NZCV] in
867class MSRpstateI
868 : SimpleSystemI<0, (ins pstatefield_op:$pstate_field, imm0_15:$imm),
869 "msr", "\t$pstate_field, $imm">,
870 Sched<[WriteSys]> {
871 bits<6> pstatefield;
872 bits<4> imm;
873 let Inst{20-19} = 0b00;
874 let Inst{18-16} = pstatefield{5-3};
875 let Inst{15-12} = 0b0100;
876 let Inst{11-8} = imm;
877 let Inst{7-5} = pstatefield{2-0};
878
879 let DecoderMethod = "DecodeSystemPStateInstruction";
880}
881
882// SYS and SYSL generic system instructions.
883def SysCRAsmOperand : AsmOperandClass {
884 let Name = "SysCR";
885 let ParserMethod = "tryParseSysCROperand";
886}
887
888def sys_cr_op : Operand<i32> {
889 let PrintMethod = "printSysCROperand";
890 let ParserMatchClass = SysCRAsmOperand;
891}
892
893class SystemXtI<bit L, string asm>
894 : RtSystemI<L, (outs),
895 (ins imm0_7:$op1, sys_cr_op:$Cn, sys_cr_op:$Cm, imm0_7:$op2, GPR64:$Rt),
896 asm, "\t$op1, $Cn, $Cm, $op2, $Rt"> {
897 bits<3> op1;
898 bits<4> Cn;
899 bits<4> Cm;
900 bits<3> op2;
901 let Inst{20-19} = 0b01;
902 let Inst{18-16} = op1;
903 let Inst{15-12} = Cn;
904 let Inst{11-8} = Cm;
905 let Inst{7-5} = op2;
906}
907
908class SystemLXtI<bit L, string asm>
909 : RtSystemI<L, (outs),
910 (ins GPR64:$Rt, imm0_7:$op1, sys_cr_op:$Cn, sys_cr_op:$Cm, imm0_7:$op2),
911 asm, "\t$Rt, $op1, $Cn, $Cm, $op2"> {
912 bits<3> op1;
913 bits<4> Cn;
914 bits<4> Cm;
915 bits<3> op2;
916 let Inst{20-19} = 0b01;
917 let Inst{18-16} = op1;
918 let Inst{15-12} = Cn;
919 let Inst{11-8} = Cm;
920 let Inst{7-5} = op2;
921}
922
923
924// Branch (register) instructions:
925//
926// case opc of
927// 0001 blr
928// 0000 br
929// 0101 dret
930// 0100 eret
931// 0010 ret
932// otherwise UNDEFINED
933class BaseBranchReg<bits<4> opc, dag oops, dag iops, string asm,
934 string operands, list<dag> pattern>
935 : I<oops, iops, asm, operands, "", pattern>, Sched<[WriteBrReg]> {
936 let Inst{31-25} = 0b1101011;
937 let Inst{24-21} = opc;
938 let Inst{20-16} = 0b11111;
939 let Inst{15-10} = 0b000000;
940 let Inst{4-0} = 0b00000;
941}
942
943class BranchReg<bits<4> opc, string asm, list<dag> pattern>
944 : BaseBranchReg<opc, (outs), (ins GPR64:$Rn), asm, "\t$Rn", pattern> {
945 bits<5> Rn;
946 let Inst{9-5} = Rn;
947}
948
949let mayLoad = 0, mayStore = 0, hasSideEffects = 1, isReturn = 1 in
950class SpecialReturn<bits<4> opc, string asm>
951 : BaseBranchReg<opc, (outs), (ins), asm, "", []> {
952 let Inst{9-5} = 0b11111;
953}
954
955//---
956// Conditional branch instruction.
957//---
958
959// Condition code.
960// 4-bit immediate. Pretty-printed as <cc>
961def ccode : Operand<i32> {
962 let PrintMethod = "printCondCode";
963 let ParserMatchClass = CondCode;
964}
965def inv_ccode : Operand<i32> {
966 let PrintMethod = "printInverseCondCode";
967 let ParserMatchClass = CondCode;
968}
969
970// Conditional branch target. 19-bit immediate. The low two bits of the target
971// offset are implied zero and so are not part of the immediate.
972def PCRelLabel19Operand : AsmOperandClass {
973 let Name = "PCRelLabel19";
974 let DiagnosticType = "InvalidLabel";
975}
976def am_brcond : Operand<OtherVT> {
977 let EncoderMethod = "getCondBranchTargetOpValue";
978 let DecoderMethod = "DecodePCRelLabel19";
979 let PrintMethod = "printAlignedLabel";
980 let ParserMatchClass = PCRelLabel19Operand;
981}
982
983class BranchCond : I<(outs), (ins ccode:$cond, am_brcond:$target),
984 "b", ".$cond\t$target", "",
985 [(AArch64brcond bb:$target, imm:$cond, NZCV)]>,
986 Sched<[WriteBr]> {
987 let isBranch = 1;
988 let isTerminator = 1;
989 let Uses = [NZCV];
990
991 bits<4> cond;
992 bits<19> target;
993 let Inst{31-24} = 0b01010100;
994 let Inst{23-5} = target;
995 let Inst{4} = 0;
996 let Inst{3-0} = cond;
997}
998
999//---
1000// Compare-and-branch instructions.
1001//---
1002class BaseCmpBranch<RegisterClass regtype, bit op, string asm, SDNode node>
1003 : I<(outs), (ins regtype:$Rt, am_brcond:$target),
1004 asm, "\t$Rt, $target", "",
1005 [(node regtype:$Rt, bb:$target)]>,
1006 Sched<[WriteBr]> {
1007 let isBranch = 1;
1008 let isTerminator = 1;
1009
1010 bits<5> Rt;
1011 bits<19> target;
1012 let Inst{30-25} = 0b011010;
1013 let Inst{24} = op;
1014 let Inst{23-5} = target;
1015 let Inst{4-0} = Rt;
1016}
1017
1018multiclass CmpBranch<bit op, string asm, SDNode node> {
1019 def W : BaseCmpBranch<GPR32, op, asm, node> {
1020 let Inst{31} = 0;
1021 }
1022 def X : BaseCmpBranch<GPR64, op, asm, node> {
1023 let Inst{31} = 1;
1024 }
1025}
1026
1027//---
1028// Test-bit-and-branch instructions.
1029//---
1030// Test-and-branch target. 14-bit sign-extended immediate. The low two bits of
1031// the target offset are implied zero and so are not part of the immediate.
1032def BranchTarget14Operand : AsmOperandClass {
1033 let Name = "BranchTarget14";
1034}
1035def am_tbrcond : Operand<OtherVT> {
1036 let EncoderMethod = "getTestBranchTargetOpValue";
1037 let PrintMethod = "printAlignedLabel";
1038 let ParserMatchClass = BranchTarget14Operand;
1039}
1040
1041// AsmOperand classes to emit (or not) special diagnostics
1042def TBZImm0_31Operand : AsmOperandClass {
1043 let Name = "TBZImm0_31";
1044 let PredicateMethod = "isImm0_31";
1045 let RenderMethod = "addImm0_31Operands";
1046}
1047def TBZImm32_63Operand : AsmOperandClass {
1048 let Name = "Imm32_63";
1049 let DiagnosticType = "InvalidImm0_63";
1050}
1051
1052class tbz_imm0_31<AsmOperandClass matcher> : Operand<i64>, ImmLeaf<i64, [{
1053 return (((uint32_t)Imm) < 32);
1054}]> {
1055 let ParserMatchClass = matcher;
1056}
1057
1058def tbz_imm0_31_diag : tbz_imm0_31<Imm0_31Operand>;
1059def tbz_imm0_31_nodiag : tbz_imm0_31<TBZImm0_31Operand>;
1060
1061def tbz_imm32_63 : Operand<i64>, ImmLeaf<i64, [{
1062 return (((uint32_t)Imm) > 31) && (((uint32_t)Imm) < 64);
1063}]> {
1064 let ParserMatchClass = TBZImm32_63Operand;
1065}
1066
1067class BaseTestBranch<RegisterClass regtype, Operand immtype,
1068 bit op, string asm, SDNode node>
1069 : I<(outs), (ins regtype:$Rt, immtype:$bit_off, am_tbrcond:$target),
1070 asm, "\t$Rt, $bit_off, $target", "",
1071 [(node regtype:$Rt, immtype:$bit_off, bb:$target)]>,
1072 Sched<[WriteBr]> {
1073 let isBranch = 1;
1074 let isTerminator = 1;
1075
1076 bits<5> Rt;
1077 bits<6> bit_off;
1078 bits<14> target;
1079
1080 let Inst{30-25} = 0b011011;
1081 let Inst{24} = op;
1082 let Inst{23-19} = bit_off{4-0};
1083 let Inst{18-5} = target;
1084 let Inst{4-0} = Rt;
1085
1086 let DecoderMethod = "DecodeTestAndBranch";
1087}
1088
1089multiclass TestBranch<bit op, string asm, SDNode node> {
1090 def W : BaseTestBranch<GPR32, tbz_imm0_31_diag, op, asm, node> {
1091 let Inst{31} = 0;
1092 }
1093
1094 def X : BaseTestBranch<GPR64, tbz_imm32_63, op, asm, node> {
1095 let Inst{31} = 1;
1096 }
1097
1098 // Alias X-reg with 0-31 imm to W-Reg.
1099 def : InstAlias<asm # "\t$Rd, $imm, $target",
1100 (!cast<Instruction>(NAME#"W") GPR32as64:$Rd,
1101 tbz_imm0_31_nodiag:$imm, am_tbrcond:$target), 0>;
1102 def : Pat<(node GPR64:$Rn, tbz_imm0_31_diag:$imm, bb:$target),
1103 (!cast<Instruction>(NAME#"W") (EXTRACT_SUBREG GPR64:$Rn, sub_32),
1104 tbz_imm0_31_diag:$imm, bb:$target)>;
1105}
1106
1107//---
1108// Unconditional branch (immediate) instructions.
1109//---
1110def BranchTarget26Operand : AsmOperandClass {
1111 let Name = "BranchTarget26";
1112 let DiagnosticType = "InvalidLabel";
1113}
1114def am_b_target : Operand<OtherVT> {
1115 let EncoderMethod = "getBranchTargetOpValue";
1116 let PrintMethod = "printAlignedLabel";
1117 let ParserMatchClass = BranchTarget26Operand;
1118}
1119def am_bl_target : Operand<i64> {
1120 let EncoderMethod = "getBranchTargetOpValue";
1121 let PrintMethod = "printAlignedLabel";
1122 let ParserMatchClass = BranchTarget26Operand;
1123}
1124
1125class BImm<bit op, dag iops, string asm, list<dag> pattern>
1126 : I<(outs), iops, asm, "\t$addr", "", pattern>, Sched<[WriteBr]> {
1127 bits<26> addr;
1128 let Inst{31} = op;
1129 let Inst{30-26} = 0b00101;
1130 let Inst{25-0} = addr;
1131
1132 let DecoderMethod = "DecodeUnconditionalBranch";
1133}
1134
1135class BranchImm<bit op, string asm, list<dag> pattern>
1136 : BImm<op, (ins am_b_target:$addr), asm, pattern>;
1137class CallImm<bit op, string asm, list<dag> pattern>
1138 : BImm<op, (ins am_bl_target:$addr), asm, pattern>;
1139
1140//---
1141// Basic one-operand data processing instructions.
1142//---
1143
1144let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1145class BaseOneOperandData<bits<3> opc, RegisterClass regtype, string asm,
1146 SDPatternOperator node>
1147 : I<(outs regtype:$Rd), (ins regtype:$Rn), asm, "\t$Rd, $Rn", "",
1148 [(set regtype:$Rd, (node regtype:$Rn))]>,
1149 Sched<[WriteI, ReadI]> {
1150 bits<5> Rd;
1151 bits<5> Rn;
1152
1153 let Inst{30-13} = 0b101101011000000000;
1154 let Inst{12-10} = opc;
1155 let Inst{9-5} = Rn;
1156 let Inst{4-0} = Rd;
1157}
1158
1159let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1160multiclass OneOperandData<bits<3> opc, string asm,
1161 SDPatternOperator node = null_frag> {
1162 def Wr : BaseOneOperandData<opc, GPR32, asm, node> {
1163 let Inst{31} = 0;
1164 }
1165
1166 def Xr : BaseOneOperandData<opc, GPR64, asm, node> {
1167 let Inst{31} = 1;
1168 }
1169}
1170
1171class OneWRegData<bits<3> opc, string asm, SDPatternOperator node>
1172 : BaseOneOperandData<opc, GPR32, asm, node> {
1173 let Inst{31} = 0;
1174}
1175
1176class OneXRegData<bits<3> opc, string asm, SDPatternOperator node>
1177 : BaseOneOperandData<opc, GPR64, asm, node> {
1178 let Inst{31} = 1;
1179}
1180
1181//---
1182// Basic two-operand data processing instructions.
1183//---
1184class BaseBaseAddSubCarry<bit isSub, RegisterClass regtype, string asm,
1185 list<dag> pattern>
1186 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm),
1187 asm, "\t$Rd, $Rn, $Rm", "", pattern>,
1188 Sched<[WriteI, ReadI, ReadI]> {
1189 let Uses = [NZCV];
1190 bits<5> Rd;
1191 bits<5> Rn;
1192 bits<5> Rm;
1193 let Inst{30} = isSub;
1194 let Inst{28-21} = 0b11010000;
1195 let Inst{20-16} = Rm;
1196 let Inst{15-10} = 0;
1197 let Inst{9-5} = Rn;
1198 let Inst{4-0} = Rd;
1199}
1200
1201class BaseAddSubCarry<bit isSub, RegisterClass regtype, string asm,
1202 SDNode OpNode>
1203 : BaseBaseAddSubCarry<isSub, regtype, asm,
1204 [(set regtype:$Rd, (OpNode regtype:$Rn, regtype:$Rm, NZCV))]>;
1205
1206class BaseAddSubCarrySetFlags<bit isSub, RegisterClass regtype, string asm,
1207 SDNode OpNode>
1208 : BaseBaseAddSubCarry<isSub, regtype, asm,
1209 [(set regtype:$Rd, (OpNode regtype:$Rn, regtype:$Rm, NZCV)),
1210 (implicit NZCV)]> {
1211 let Defs = [NZCV];
1212}
1213
1214multiclass AddSubCarry<bit isSub, string asm, string asm_setflags,
1215 SDNode OpNode, SDNode OpNode_setflags> {
1216 def Wr : BaseAddSubCarry<isSub, GPR32, asm, OpNode> {
1217 let Inst{31} = 0;
1218 let Inst{29} = 0;
1219 }
1220 def Xr : BaseAddSubCarry<isSub, GPR64, asm, OpNode> {
1221 let Inst{31} = 1;
1222 let Inst{29} = 0;
1223 }
1224
1225 // Sets flags.
1226 def SWr : BaseAddSubCarrySetFlags<isSub, GPR32, asm_setflags,
1227 OpNode_setflags> {
1228 let Inst{31} = 0;
1229 let Inst{29} = 1;
1230 }
1231 def SXr : BaseAddSubCarrySetFlags<isSub, GPR64, asm_setflags,
1232 OpNode_setflags> {
1233 let Inst{31} = 1;
1234 let Inst{29} = 1;
1235 }
1236}
1237
1238class BaseTwoOperand<bits<4> opc, RegisterClass regtype, string asm,
1239 SDPatternOperator OpNode>
1240 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm),
1241 asm, "\t$Rd, $Rn, $Rm", "",
1242 [(set regtype:$Rd, (OpNode regtype:$Rn, regtype:$Rm))]> {
1243 bits<5> Rd;
1244 bits<5> Rn;
1245 bits<5> Rm;
1246 let Inst{30-21} = 0b0011010110;
1247 let Inst{20-16} = Rm;
1248 let Inst{15-14} = 0b00;
1249 let Inst{13-10} = opc;
1250 let Inst{9-5} = Rn;
1251 let Inst{4-0} = Rd;
1252}
1253
1254class BaseDiv<bit isSigned, RegisterClass regtype, string asm,
1255 SDPatternOperator OpNode>
1256 : BaseTwoOperand<{0,0,1,?}, regtype, asm, OpNode> {
1257 let Inst{10} = isSigned;
1258}
1259
1260multiclass Div<bit isSigned, string asm, SDPatternOperator OpNode> {
1261 def Wr : BaseDiv<isSigned, GPR32, asm, OpNode>,
1262 Sched<[WriteID32, ReadID, ReadID]> {
1263 let Inst{31} = 0;
1264 }
1265 def Xr : BaseDiv<isSigned, GPR64, asm, OpNode>,
1266 Sched<[WriteID64, ReadID, ReadID]> {
1267 let Inst{31} = 1;
1268 }
1269}
1270
1271class BaseShift<bits<2> shift_type, RegisterClass regtype, string asm,
1272 SDPatternOperator OpNode = null_frag>
1273 : BaseTwoOperand<{1,0,?,?}, regtype, asm, OpNode>,
1274 Sched<[WriteIS, ReadI]> {
1275 let Inst{11-10} = shift_type;
1276}
1277
1278multiclass Shift<bits<2> shift_type, string asm, SDNode OpNode> {
1279 def Wr : BaseShift<shift_type, GPR32, asm> {
1280 let Inst{31} = 0;
1281 }
1282
1283 def Xr : BaseShift<shift_type, GPR64, asm, OpNode> {
1284 let Inst{31} = 1;
1285 }
1286
1287 def : Pat<(i32 (OpNode GPR32:$Rn, i64:$Rm)),
1288 (!cast<Instruction>(NAME # "Wr") GPR32:$Rn,
1289 (EXTRACT_SUBREG i64:$Rm, sub_32))>;
1290
1291 def : Pat<(i32 (OpNode GPR32:$Rn, (i64 (zext GPR32:$Rm)))),
1292 (!cast<Instruction>(NAME # "Wr") GPR32:$Rn, GPR32:$Rm)>;
1293
1294 def : Pat<(i32 (OpNode GPR32:$Rn, (i64 (anyext GPR32:$Rm)))),
1295 (!cast<Instruction>(NAME # "Wr") GPR32:$Rn, GPR32:$Rm)>;
1296
1297 def : Pat<(i32 (OpNode GPR32:$Rn, (i64 (sext GPR32:$Rm)))),
1298 (!cast<Instruction>(NAME # "Wr") GPR32:$Rn, GPR32:$Rm)>;
1299}
1300
1301class ShiftAlias<string asm, Instruction inst, RegisterClass regtype>
1302 : InstAlias<asm#" $dst, $src1, $src2",
1303 (inst regtype:$dst, regtype:$src1, regtype:$src2), 0>;
1304
1305class BaseMulAccum<bit isSub, bits<3> opc, RegisterClass multype,
1306 RegisterClass addtype, string asm,
1307 list<dag> pattern>
1308 : I<(outs addtype:$Rd), (ins multype:$Rn, multype:$Rm, addtype:$Ra),
1309 asm, "\t$Rd, $Rn, $Rm, $Ra", "", pattern> {
1310 bits<5> Rd;
1311 bits<5> Rn;
1312 bits<5> Rm;
1313 bits<5> Ra;
1314 let Inst{30-24} = 0b0011011;
1315 let Inst{23-21} = opc;
1316 let Inst{20-16} = Rm;
1317 let Inst{15} = isSub;
1318 let Inst{14-10} = Ra;
1319 let Inst{9-5} = Rn;
1320 let Inst{4-0} = Rd;
1321}
1322
1323multiclass MulAccum<bit isSub, string asm, SDNode AccNode> {
1324 def Wrrr : BaseMulAccum<isSub, 0b000, GPR32, GPR32, asm,
1325 [(set GPR32:$Rd, (AccNode GPR32:$Ra, (mul GPR32:$Rn, GPR32:$Rm)))]>,
Chad Rosier3fe0c872014-06-09 01:54:00 +00001326 Sched<[WriteIM32, ReadIM, ReadIM, ReadIMA]> {
Tim Northover3b0846e2014-05-24 12:50:23 +00001327 let Inst{31} = 0;
1328 }
1329
1330 def Xrrr : BaseMulAccum<isSub, 0b000, GPR64, GPR64, asm,
1331 [(set GPR64:$Rd, (AccNode GPR64:$Ra, (mul GPR64:$Rn, GPR64:$Rm)))]>,
Chad Rosier3fe0c872014-06-09 01:54:00 +00001332 Sched<[WriteIM64, ReadIM, ReadIM, ReadIMA]> {
Tim Northover3b0846e2014-05-24 12:50:23 +00001333 let Inst{31} = 1;
1334 }
1335}
1336
1337class WideMulAccum<bit isSub, bits<3> opc, string asm,
1338 SDNode AccNode, SDNode ExtNode>
1339 : BaseMulAccum<isSub, opc, GPR32, GPR64, asm,
1340 [(set GPR64:$Rd, (AccNode GPR64:$Ra,
1341 (mul (ExtNode GPR32:$Rn), (ExtNode GPR32:$Rm))))]>,
Chad Rosier3fe0c872014-06-09 01:54:00 +00001342 Sched<[WriteIM32, ReadIM, ReadIM, ReadIMA]> {
Tim Northover3b0846e2014-05-24 12:50:23 +00001343 let Inst{31} = 1;
1344}
1345
1346class MulHi<bits<3> opc, string asm, SDNode OpNode>
1347 : I<(outs GPR64:$Rd), (ins GPR64:$Rn, GPR64:$Rm),
1348 asm, "\t$Rd, $Rn, $Rm", "",
1349 [(set GPR64:$Rd, (OpNode GPR64:$Rn, GPR64:$Rm))]>,
1350 Sched<[WriteIM64, ReadIM, ReadIM]> {
1351 bits<5> Rd;
1352 bits<5> Rn;
1353 bits<5> Rm;
1354 let Inst{31-24} = 0b10011011;
1355 let Inst{23-21} = opc;
1356 let Inst{20-16} = Rm;
1357 let Inst{15} = 0;
1358 let Inst{9-5} = Rn;
1359 let Inst{4-0} = Rd;
1360
1361 // The Ra field of SMULH and UMULH is unused: it should be assembled as 31
1362 // (i.e. all bits 1) but is ignored by the processor.
1363 let PostEncoderMethod = "fixMulHigh";
1364}
1365
1366class MulAccumWAlias<string asm, Instruction inst>
1367 : InstAlias<asm#" $dst, $src1, $src2",
1368 (inst GPR32:$dst, GPR32:$src1, GPR32:$src2, WZR)>;
1369class MulAccumXAlias<string asm, Instruction inst>
1370 : InstAlias<asm#" $dst, $src1, $src2",
1371 (inst GPR64:$dst, GPR64:$src1, GPR64:$src2, XZR)>;
1372class WideMulAccumAlias<string asm, Instruction inst>
1373 : InstAlias<asm#" $dst, $src1, $src2",
1374 (inst GPR64:$dst, GPR32:$src1, GPR32:$src2, XZR)>;
1375
1376class BaseCRC32<bit sf, bits<2> sz, bit C, RegisterClass StreamReg,
1377 SDPatternOperator OpNode, string asm>
1378 : I<(outs GPR32:$Rd), (ins GPR32:$Rn, StreamReg:$Rm),
1379 asm, "\t$Rd, $Rn, $Rm", "",
1380 [(set GPR32:$Rd, (OpNode GPR32:$Rn, StreamReg:$Rm))]>,
1381 Sched<[WriteISReg, ReadI, ReadISReg]> {
1382 bits<5> Rd;
1383 bits<5> Rn;
1384 bits<5> Rm;
1385
1386 let Inst{31} = sf;
1387 let Inst{30-21} = 0b0011010110;
1388 let Inst{20-16} = Rm;
1389 let Inst{15-13} = 0b010;
1390 let Inst{12} = C;
1391 let Inst{11-10} = sz;
1392 let Inst{9-5} = Rn;
1393 let Inst{4-0} = Rd;
1394 let Predicates = [HasCRC];
1395}
1396
1397//---
1398// Address generation.
1399//---
1400
1401class ADRI<bit page, string asm, Operand adr, list<dag> pattern>
1402 : I<(outs GPR64:$Xd), (ins adr:$label), asm, "\t$Xd, $label", "",
1403 pattern>,
1404 Sched<[WriteI]> {
1405 bits<5> Xd;
1406 bits<21> label;
1407 let Inst{31} = page;
1408 let Inst{30-29} = label{1-0};
1409 let Inst{28-24} = 0b10000;
1410 let Inst{23-5} = label{20-2};
1411 let Inst{4-0} = Xd;
1412
1413 let DecoderMethod = "DecodeAdrInstruction";
1414}
1415
1416//---
1417// Move immediate.
1418//---
1419
1420def movimm32_imm : Operand<i32> {
1421 let ParserMatchClass = Imm0_65535Operand;
1422 let EncoderMethod = "getMoveWideImmOpValue";
1423 let PrintMethod = "printHexImm";
1424}
1425def movimm32_shift : Operand<i32> {
1426 let PrintMethod = "printShifter";
1427 let ParserMatchClass = MovImm32ShifterOperand;
1428}
1429def movimm64_shift : Operand<i32> {
1430 let PrintMethod = "printShifter";
1431 let ParserMatchClass = MovImm64ShifterOperand;
1432}
1433
1434let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1435class BaseMoveImmediate<bits<2> opc, RegisterClass regtype, Operand shifter,
1436 string asm>
1437 : I<(outs regtype:$Rd), (ins movimm32_imm:$imm, shifter:$shift),
1438 asm, "\t$Rd, $imm$shift", "", []>,
1439 Sched<[WriteImm]> {
1440 bits<5> Rd;
1441 bits<16> imm;
1442 bits<6> shift;
1443 let Inst{30-29} = opc;
1444 let Inst{28-23} = 0b100101;
1445 let Inst{22-21} = shift{5-4};
1446 let Inst{20-5} = imm;
1447 let Inst{4-0} = Rd;
1448
1449 let DecoderMethod = "DecodeMoveImmInstruction";
1450}
1451
1452multiclass MoveImmediate<bits<2> opc, string asm> {
1453 def Wi : BaseMoveImmediate<opc, GPR32, movimm32_shift, asm> {
1454 let Inst{31} = 0;
1455 }
1456
1457 def Xi : BaseMoveImmediate<opc, GPR64, movimm64_shift, asm> {
1458 let Inst{31} = 1;
1459 }
1460}
1461
1462let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1463class BaseInsertImmediate<bits<2> opc, RegisterClass regtype, Operand shifter,
1464 string asm>
1465 : I<(outs regtype:$Rd),
1466 (ins regtype:$src, movimm32_imm:$imm, shifter:$shift),
1467 asm, "\t$Rd, $imm$shift", "$src = $Rd", []>,
1468 Sched<[WriteI, ReadI]> {
1469 bits<5> Rd;
1470 bits<16> imm;
1471 bits<6> shift;
1472 let Inst{30-29} = opc;
1473 let Inst{28-23} = 0b100101;
1474 let Inst{22-21} = shift{5-4};
1475 let Inst{20-5} = imm;
1476 let Inst{4-0} = Rd;
1477
1478 let DecoderMethod = "DecodeMoveImmInstruction";
1479}
1480
1481multiclass InsertImmediate<bits<2> opc, string asm> {
1482 def Wi : BaseInsertImmediate<opc, GPR32, movimm32_shift, asm> {
1483 let Inst{31} = 0;
1484 }
1485
1486 def Xi : BaseInsertImmediate<opc, GPR64, movimm64_shift, asm> {
1487 let Inst{31} = 1;
1488 }
1489}
1490
1491//---
1492// Add/Subtract
1493//---
1494
1495class BaseAddSubImm<bit isSub, bit setFlags, RegisterClass dstRegtype,
1496 RegisterClass srcRegtype, addsub_shifted_imm immtype,
1497 string asm, SDPatternOperator OpNode>
1498 : I<(outs dstRegtype:$Rd), (ins srcRegtype:$Rn, immtype:$imm),
1499 asm, "\t$Rd, $Rn, $imm", "",
1500 [(set dstRegtype:$Rd, (OpNode srcRegtype:$Rn, immtype:$imm))]>,
1501 Sched<[WriteI, ReadI]> {
1502 bits<5> Rd;
1503 bits<5> Rn;
1504 bits<14> imm;
1505 let Inst{30} = isSub;
1506 let Inst{29} = setFlags;
1507 let Inst{28-24} = 0b10001;
1508 let Inst{23-22} = imm{13-12}; // '00' => lsl #0, '01' => lsl #12
1509 let Inst{21-10} = imm{11-0};
1510 let Inst{9-5} = Rn;
1511 let Inst{4-0} = Rd;
1512 let DecoderMethod = "DecodeBaseAddSubImm";
1513}
1514
1515class BaseAddSubRegPseudo<RegisterClass regtype,
1516 SDPatternOperator OpNode>
1517 : Pseudo<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm),
1518 [(set regtype:$Rd, (OpNode regtype:$Rn, regtype:$Rm))]>,
1519 Sched<[WriteI, ReadI, ReadI]>;
1520
1521class BaseAddSubSReg<bit isSub, bit setFlags, RegisterClass regtype,
1522 arith_shifted_reg shifted_regtype, string asm,
1523 SDPatternOperator OpNode>
1524 : I<(outs regtype:$Rd), (ins regtype:$Rn, shifted_regtype:$Rm),
1525 asm, "\t$Rd, $Rn, $Rm", "",
1526 [(set regtype:$Rd, (OpNode regtype:$Rn, shifted_regtype:$Rm))]>,
1527 Sched<[WriteISReg, ReadI, ReadISReg]> {
1528 // The operands are in order to match the 'addr' MI operands, so we
1529 // don't need an encoder method and by-name matching. Just use the default
1530 // in-order handling. Since we're using by-order, make sure the names
1531 // do not match.
1532 bits<5> dst;
1533 bits<5> src1;
1534 bits<5> src2;
1535 bits<8> shift;
1536 let Inst{30} = isSub;
1537 let Inst{29} = setFlags;
1538 let Inst{28-24} = 0b01011;
1539 let Inst{23-22} = shift{7-6};
1540 let Inst{21} = 0;
1541 let Inst{20-16} = src2;
1542 let Inst{15-10} = shift{5-0};
1543 let Inst{9-5} = src1;
1544 let Inst{4-0} = dst;
1545
1546 let DecoderMethod = "DecodeThreeAddrSRegInstruction";
1547}
1548
1549class BaseAddSubEReg<bit isSub, bit setFlags, RegisterClass dstRegtype,
1550 RegisterClass src1Regtype, Operand src2Regtype,
1551 string asm, SDPatternOperator OpNode>
1552 : I<(outs dstRegtype:$R1),
1553 (ins src1Regtype:$R2, src2Regtype:$R3),
1554 asm, "\t$R1, $R2, $R3", "",
1555 [(set dstRegtype:$R1, (OpNode src1Regtype:$R2, src2Regtype:$R3))]>,
1556 Sched<[WriteIEReg, ReadI, ReadIEReg]> {
1557 bits<5> Rd;
1558 bits<5> Rn;
1559 bits<5> Rm;
1560 bits<6> ext;
1561 let Inst{30} = isSub;
1562 let Inst{29} = setFlags;
1563 let Inst{28-24} = 0b01011;
1564 let Inst{23-21} = 0b001;
1565 let Inst{20-16} = Rm;
1566 let Inst{15-13} = ext{5-3};
1567 let Inst{12-10} = ext{2-0};
1568 let Inst{9-5} = Rn;
1569 let Inst{4-0} = Rd;
1570
1571 let DecoderMethod = "DecodeAddSubERegInstruction";
1572}
1573
1574let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1575class BaseAddSubEReg64<bit isSub, bit setFlags, RegisterClass dstRegtype,
1576 RegisterClass src1Regtype, RegisterClass src2Regtype,
1577 Operand ext_op, string asm>
1578 : I<(outs dstRegtype:$Rd),
1579 (ins src1Regtype:$Rn, src2Regtype:$Rm, ext_op:$ext),
1580 asm, "\t$Rd, $Rn, $Rm$ext", "", []>,
1581 Sched<[WriteIEReg, ReadI, ReadIEReg]> {
1582 bits<5> Rd;
1583 bits<5> Rn;
1584 bits<5> Rm;
1585 bits<6> ext;
1586 let Inst{30} = isSub;
1587 let Inst{29} = setFlags;
1588 let Inst{28-24} = 0b01011;
1589 let Inst{23-21} = 0b001;
1590 let Inst{20-16} = Rm;
1591 let Inst{15} = ext{5};
1592 let Inst{12-10} = ext{2-0};
1593 let Inst{9-5} = Rn;
1594 let Inst{4-0} = Rd;
1595
1596 let DecoderMethod = "DecodeAddSubERegInstruction";
1597}
1598
1599// Aliases for register+register add/subtract.
1600class AddSubRegAlias<string asm, Instruction inst, RegisterClass dstRegtype,
1601 RegisterClass src1Regtype, RegisterClass src2Regtype,
1602 int shiftExt>
1603 : InstAlias<asm#" $dst, $src1, $src2",
1604 (inst dstRegtype:$dst, src1Regtype:$src1, src2Regtype:$src2,
1605 shiftExt)>;
1606
1607multiclass AddSub<bit isSub, string mnemonic,
1608 SDPatternOperator OpNode = null_frag> {
1609 let hasSideEffects = 0 in {
1610 // Add/Subtract immediate
1611 def Wri : BaseAddSubImm<isSub, 0, GPR32sp, GPR32sp, addsub_shifted_imm32,
1612 mnemonic, OpNode> {
1613 let Inst{31} = 0;
1614 }
1615 def Xri : BaseAddSubImm<isSub, 0, GPR64sp, GPR64sp, addsub_shifted_imm64,
1616 mnemonic, OpNode> {
1617 let Inst{31} = 1;
1618 }
1619
1620 // Add/Subtract register - Only used for CodeGen
1621 def Wrr : BaseAddSubRegPseudo<GPR32, OpNode>;
1622 def Xrr : BaseAddSubRegPseudo<GPR64, OpNode>;
1623
1624 // Add/Subtract shifted register
1625 def Wrs : BaseAddSubSReg<isSub, 0, GPR32, arith_shifted_reg32, mnemonic,
1626 OpNode> {
1627 let Inst{31} = 0;
1628 }
1629 def Xrs : BaseAddSubSReg<isSub, 0, GPR64, arith_shifted_reg64, mnemonic,
1630 OpNode> {
1631 let Inst{31} = 1;
1632 }
1633 }
1634
1635 // Add/Subtract extended register
1636 let AddedComplexity = 1, hasSideEffects = 0 in {
1637 def Wrx : BaseAddSubEReg<isSub, 0, GPR32sp, GPR32sp,
1638 arith_extended_reg32<i32>, mnemonic, OpNode> {
1639 let Inst{31} = 0;
1640 }
1641 def Xrx : BaseAddSubEReg<isSub, 0, GPR64sp, GPR64sp,
1642 arith_extended_reg32to64<i64>, mnemonic, OpNode> {
1643 let Inst{31} = 1;
1644 }
1645 }
1646
1647 def Xrx64 : BaseAddSubEReg64<isSub, 0, GPR64sp, GPR64sp, GPR64,
1648 arith_extendlsl64, mnemonic> {
1649 // UXTX and SXTX only.
1650 let Inst{14-13} = 0b11;
1651 let Inst{31} = 1;
1652 }
1653
1654 // Register/register aliases with no shift when SP is not used.
1655 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Wrs"),
1656 GPR32, GPR32, GPR32, 0>;
1657 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Xrs"),
1658 GPR64, GPR64, GPR64, 0>;
1659
1660 // Register/register aliases with no shift when either the destination or
1661 // first source register is SP.
1662 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Wrx"),
1663 GPR32sponly, GPR32sp, GPR32, 16>; // UXTW #0
1664 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Wrx"),
1665 GPR32sp, GPR32sponly, GPR32, 16>; // UXTW #0
1666 def : AddSubRegAlias<mnemonic,
1667 !cast<Instruction>(NAME#"Xrx64"),
1668 GPR64sponly, GPR64sp, GPR64, 24>; // UXTX #0
1669 def : AddSubRegAlias<mnemonic,
1670 !cast<Instruction>(NAME#"Xrx64"),
1671 GPR64sp, GPR64sponly, GPR64, 24>; // UXTX #0
1672}
1673
1674multiclass AddSubS<bit isSub, string mnemonic, SDNode OpNode, string cmp> {
1675 let isCompare = 1, Defs = [NZCV] in {
1676 // Add/Subtract immediate
1677 def Wri : BaseAddSubImm<isSub, 1, GPR32, GPR32sp, addsub_shifted_imm32,
1678 mnemonic, OpNode> {
1679 let Inst{31} = 0;
1680 }
1681 def Xri : BaseAddSubImm<isSub, 1, GPR64, GPR64sp, addsub_shifted_imm64,
1682 mnemonic, OpNode> {
1683 let Inst{31} = 1;
1684 }
1685
1686 // Add/Subtract register
1687 def Wrr : BaseAddSubRegPseudo<GPR32, OpNode>;
1688 def Xrr : BaseAddSubRegPseudo<GPR64, OpNode>;
1689
1690 // Add/Subtract shifted register
1691 def Wrs : BaseAddSubSReg<isSub, 1, GPR32, arith_shifted_reg32, mnemonic,
1692 OpNode> {
1693 let Inst{31} = 0;
1694 }
1695 def Xrs : BaseAddSubSReg<isSub, 1, GPR64, arith_shifted_reg64, mnemonic,
1696 OpNode> {
1697 let Inst{31} = 1;
1698 }
1699
1700 // Add/Subtract extended register
1701 let AddedComplexity = 1 in {
1702 def Wrx : BaseAddSubEReg<isSub, 1, GPR32, GPR32sp,
1703 arith_extended_reg32<i32>, mnemonic, OpNode> {
1704 let Inst{31} = 0;
1705 }
1706 def Xrx : BaseAddSubEReg<isSub, 1, GPR64, GPR64sp,
1707 arith_extended_reg32<i64>, mnemonic, OpNode> {
1708 let Inst{31} = 1;
1709 }
1710 }
1711
1712 def Xrx64 : BaseAddSubEReg64<isSub, 1, GPR64, GPR64sp, GPR64,
1713 arith_extendlsl64, mnemonic> {
1714 // UXTX and SXTX only.
1715 let Inst{14-13} = 0b11;
1716 let Inst{31} = 1;
1717 }
1718 } // Defs = [NZCV]
1719
1720 // Compare aliases
1721 def : InstAlias<cmp#" $src, $imm", (!cast<Instruction>(NAME#"Wri")
1722 WZR, GPR32sp:$src, addsub_shifted_imm32:$imm), 5>;
1723 def : InstAlias<cmp#" $src, $imm", (!cast<Instruction>(NAME#"Xri")
1724 XZR, GPR64sp:$src, addsub_shifted_imm64:$imm), 5>;
1725 def : InstAlias<cmp#" $src1, $src2$sh", (!cast<Instruction>(NAME#"Wrx")
1726 WZR, GPR32sp:$src1, GPR32:$src2, arith_extend:$sh), 4>;
1727 def : InstAlias<cmp#" $src1, $src2$sh", (!cast<Instruction>(NAME#"Xrx")
1728 XZR, GPR64sp:$src1, GPR32:$src2, arith_extend:$sh), 4>;
1729 def : InstAlias<cmp#" $src1, $src2$sh", (!cast<Instruction>(NAME#"Xrx64")
1730 XZR, GPR64sp:$src1, GPR64:$src2, arith_extendlsl64:$sh), 4>;
1731 def : InstAlias<cmp#" $src1, $src2$sh", (!cast<Instruction>(NAME#"Wrs")
1732 WZR, GPR32:$src1, GPR32:$src2, arith_shift32:$sh), 4>;
1733 def : InstAlias<cmp#" $src1, $src2$sh", (!cast<Instruction>(NAME#"Xrs")
1734 XZR, GPR64:$src1, GPR64:$src2, arith_shift64:$sh), 4>;
1735
1736 // Compare shorthands
1737 def : InstAlias<cmp#" $src1, $src2", (!cast<Instruction>(NAME#"Wrs")
1738 WZR, GPR32:$src1, GPR32:$src2, 0), 5>;
1739 def : InstAlias<cmp#" $src1, $src2", (!cast<Instruction>(NAME#"Xrs")
1740 XZR, GPR64:$src1, GPR64:$src2, 0), 5>;
Artyom Skrobov82ae94f2014-06-09 11:10:14 +00001741 def : InstAlias<cmp#" $src1, $src2", (!cast<Instruction>(NAME#"Wrx")
1742 WZR, GPR32sponly:$src1, GPR32:$src2, 16), 5>;
1743 def : InstAlias<cmp#" $src1, $src2", (!cast<Instruction>(NAME#"Xrx64")
1744 XZR, GPR64sponly:$src1, GPR64:$src2, 24), 5>;
Tim Northover3b0846e2014-05-24 12:50:23 +00001745
1746 // Register/register aliases with no shift when SP is not used.
1747 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Wrs"),
1748 GPR32, GPR32, GPR32, 0>;
1749 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Xrs"),
1750 GPR64, GPR64, GPR64, 0>;
1751
1752 // Register/register aliases with no shift when the first source register
1753 // is SP.
1754 def : AddSubRegAlias<mnemonic, !cast<Instruction>(NAME#"Wrx"),
1755 GPR32, GPR32sponly, GPR32, 16>; // UXTW #0
1756 def : AddSubRegAlias<mnemonic,
1757 !cast<Instruction>(NAME#"Xrx64"),
1758 GPR64, GPR64sponly, GPR64, 24>; // UXTX #0
1759}
1760
1761//---
1762// Extract
1763//---
1764def SDTA64EXTR : SDTypeProfile<1, 3, [SDTCisSameAs<0, 1>, SDTCisSameAs<0, 2>,
1765 SDTCisPtrTy<3>]>;
1766def AArch64Extr : SDNode<"AArch64ISD::EXTR", SDTA64EXTR>;
1767
1768class BaseExtractImm<RegisterClass regtype, Operand imm_type, string asm,
1769 list<dag> patterns>
1770 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, imm_type:$imm),
1771 asm, "\t$Rd, $Rn, $Rm, $imm", "", patterns>,
1772 Sched<[WriteExtr, ReadExtrHi]> {
1773 bits<5> Rd;
1774 bits<5> Rn;
1775 bits<5> Rm;
1776 bits<6> imm;
1777
1778 let Inst{30-23} = 0b00100111;
1779 let Inst{21} = 0;
1780 let Inst{20-16} = Rm;
1781 let Inst{15-10} = imm;
1782 let Inst{9-5} = Rn;
1783 let Inst{4-0} = Rd;
1784}
1785
1786multiclass ExtractImm<string asm> {
1787 def Wrri : BaseExtractImm<GPR32, imm0_31, asm,
1788 [(set GPR32:$Rd,
1789 (AArch64Extr GPR32:$Rn, GPR32:$Rm, imm0_31:$imm))]> {
1790 let Inst{31} = 0;
1791 let Inst{22} = 0;
1792 // imm<5> must be zero.
1793 let imm{5} = 0;
1794 }
1795 def Xrri : BaseExtractImm<GPR64, imm0_63, asm,
1796 [(set GPR64:$Rd,
1797 (AArch64Extr GPR64:$Rn, GPR64:$Rm, imm0_63:$imm))]> {
1798
1799 let Inst{31} = 1;
1800 let Inst{22} = 1;
1801 }
1802}
1803
1804//---
1805// Bitfield
1806//---
1807
1808let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1809class BaseBitfieldImm<bits<2> opc,
1810 RegisterClass regtype, Operand imm_type, string asm>
1811 : I<(outs regtype:$Rd), (ins regtype:$Rn, imm_type:$immr, imm_type:$imms),
1812 asm, "\t$Rd, $Rn, $immr, $imms", "", []>,
1813 Sched<[WriteIS, ReadI]> {
1814 bits<5> Rd;
1815 bits<5> Rn;
1816 bits<6> immr;
1817 bits<6> imms;
1818
1819 let Inst{30-29} = opc;
1820 let Inst{28-23} = 0b100110;
1821 let Inst{21-16} = immr;
1822 let Inst{15-10} = imms;
1823 let Inst{9-5} = Rn;
1824 let Inst{4-0} = Rd;
1825}
1826
1827multiclass BitfieldImm<bits<2> opc, string asm> {
1828 def Wri : BaseBitfieldImm<opc, GPR32, imm0_31, asm> {
1829 let Inst{31} = 0;
1830 let Inst{22} = 0;
1831 // imms<5> and immr<5> must be zero, else ReservedValue().
1832 let Inst{21} = 0;
1833 let Inst{15} = 0;
1834 }
1835 def Xri : BaseBitfieldImm<opc, GPR64, imm0_63, asm> {
1836 let Inst{31} = 1;
1837 let Inst{22} = 1;
1838 }
1839}
1840
1841let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
1842class BaseBitfieldImmWith2RegArgs<bits<2> opc,
1843 RegisterClass regtype, Operand imm_type, string asm>
1844 : I<(outs regtype:$Rd), (ins regtype:$src, regtype:$Rn, imm_type:$immr,
1845 imm_type:$imms),
1846 asm, "\t$Rd, $Rn, $immr, $imms", "$src = $Rd", []>,
1847 Sched<[WriteIS, ReadI]> {
1848 bits<5> Rd;
1849 bits<5> Rn;
1850 bits<6> immr;
1851 bits<6> imms;
1852
1853 let Inst{30-29} = opc;
1854 let Inst{28-23} = 0b100110;
1855 let Inst{21-16} = immr;
1856 let Inst{15-10} = imms;
1857 let Inst{9-5} = Rn;
1858 let Inst{4-0} = Rd;
1859}
1860
1861multiclass BitfieldImmWith2RegArgs<bits<2> opc, string asm> {
1862 def Wri : BaseBitfieldImmWith2RegArgs<opc, GPR32, imm0_31, asm> {
1863 let Inst{31} = 0;
1864 let Inst{22} = 0;
1865 // imms<5> and immr<5> must be zero, else ReservedValue().
1866 let Inst{21} = 0;
1867 let Inst{15} = 0;
1868 }
1869 def Xri : BaseBitfieldImmWith2RegArgs<opc, GPR64, imm0_63, asm> {
1870 let Inst{31} = 1;
1871 let Inst{22} = 1;
1872 }
1873}
1874
1875//---
1876// Logical
1877//---
1878
1879// Logical (immediate)
1880class BaseLogicalImm<bits<2> opc, RegisterClass dregtype,
1881 RegisterClass sregtype, Operand imm_type, string asm,
1882 list<dag> pattern>
1883 : I<(outs dregtype:$Rd), (ins sregtype:$Rn, imm_type:$imm),
1884 asm, "\t$Rd, $Rn, $imm", "", pattern>,
1885 Sched<[WriteI, ReadI]> {
1886 bits<5> Rd;
1887 bits<5> Rn;
1888 bits<13> imm;
1889 let Inst{30-29} = opc;
1890 let Inst{28-23} = 0b100100;
1891 let Inst{22} = imm{12};
1892 let Inst{21-16} = imm{11-6};
1893 let Inst{15-10} = imm{5-0};
1894 let Inst{9-5} = Rn;
1895 let Inst{4-0} = Rd;
1896
1897 let DecoderMethod = "DecodeLogicalImmInstruction";
1898}
1899
1900// Logical (shifted register)
1901class BaseLogicalSReg<bits<2> opc, bit N, RegisterClass regtype,
1902 logical_shifted_reg shifted_regtype, string asm,
1903 list<dag> pattern>
1904 : I<(outs regtype:$Rd), (ins regtype:$Rn, shifted_regtype:$Rm),
1905 asm, "\t$Rd, $Rn, $Rm", "", pattern>,
1906 Sched<[WriteISReg, ReadI, ReadISReg]> {
1907 // The operands are in order to match the 'addr' MI operands, so we
1908 // don't need an encoder method and by-name matching. Just use the default
1909 // in-order handling. Since we're using by-order, make sure the names
1910 // do not match.
1911 bits<5> dst;
1912 bits<5> src1;
1913 bits<5> src2;
1914 bits<8> shift;
1915 let Inst{30-29} = opc;
1916 let Inst{28-24} = 0b01010;
1917 let Inst{23-22} = shift{7-6};
1918 let Inst{21} = N;
1919 let Inst{20-16} = src2;
1920 let Inst{15-10} = shift{5-0};
1921 let Inst{9-5} = src1;
1922 let Inst{4-0} = dst;
1923
1924 let DecoderMethod = "DecodeThreeAddrSRegInstruction";
1925}
1926
1927// Aliases for register+register logical instructions.
1928class LogicalRegAlias<string asm, Instruction inst, RegisterClass regtype>
1929 : InstAlias<asm#" $dst, $src1, $src2",
1930 (inst regtype:$dst, regtype:$src1, regtype:$src2, 0)>;
1931
1932let AddedComplexity = 6 in
1933multiclass LogicalImm<bits<2> opc, string mnemonic, SDNode OpNode> {
1934 def Wri : BaseLogicalImm<opc, GPR32sp, GPR32, logical_imm32, mnemonic,
1935 [(set GPR32sp:$Rd, (OpNode GPR32:$Rn,
1936 logical_imm32:$imm))]> {
1937 let Inst{31} = 0;
1938 let Inst{22} = 0; // 64-bit version has an additional bit of immediate.
1939 }
1940 def Xri : BaseLogicalImm<opc, GPR64sp, GPR64, logical_imm64, mnemonic,
1941 [(set GPR64sp:$Rd, (OpNode GPR64:$Rn,
1942 logical_imm64:$imm))]> {
1943 let Inst{31} = 1;
1944 }
1945}
1946
1947multiclass LogicalImmS<bits<2> opc, string mnemonic, SDNode OpNode> {
1948 let isCompare = 1, Defs = [NZCV] in {
1949 def Wri : BaseLogicalImm<opc, GPR32, GPR32, logical_imm32, mnemonic,
1950 [(set GPR32:$Rd, (OpNode GPR32:$Rn, logical_imm32:$imm))]> {
1951 let Inst{31} = 0;
1952 let Inst{22} = 0; // 64-bit version has an additional bit of immediate.
1953 }
1954 def Xri : BaseLogicalImm<opc, GPR64, GPR64, logical_imm64, mnemonic,
1955 [(set GPR64:$Rd, (OpNode GPR64:$Rn, logical_imm64:$imm))]> {
1956 let Inst{31} = 1;
1957 }
1958 } // end Defs = [NZCV]
1959}
1960
1961class BaseLogicalRegPseudo<RegisterClass regtype, SDPatternOperator OpNode>
1962 : Pseudo<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm),
1963 [(set regtype:$Rd, (OpNode regtype:$Rn, regtype:$Rm))]>,
1964 Sched<[WriteI, ReadI, ReadI]>;
1965
1966// Split from LogicalImm as not all instructions have both.
1967multiclass LogicalReg<bits<2> opc, bit N, string mnemonic,
1968 SDPatternOperator OpNode> {
1969 def Wrr : BaseLogicalRegPseudo<GPR32, OpNode>;
1970 def Xrr : BaseLogicalRegPseudo<GPR64, OpNode>;
1971
1972 def Wrs : BaseLogicalSReg<opc, N, GPR32, logical_shifted_reg32, mnemonic,
1973 [(set GPR32:$Rd, (OpNode GPR32:$Rn,
1974 logical_shifted_reg32:$Rm))]> {
1975 let Inst{31} = 0;
1976 }
1977 def Xrs : BaseLogicalSReg<opc, N, GPR64, logical_shifted_reg64, mnemonic,
1978 [(set GPR64:$Rd, (OpNode GPR64:$Rn,
1979 logical_shifted_reg64:$Rm))]> {
1980 let Inst{31} = 1;
1981 }
1982
1983 def : LogicalRegAlias<mnemonic,
1984 !cast<Instruction>(NAME#"Wrs"), GPR32>;
1985 def : LogicalRegAlias<mnemonic,
1986 !cast<Instruction>(NAME#"Xrs"), GPR64>;
1987}
1988
1989// Split from LogicalReg to allow setting NZCV Defs
1990multiclass LogicalRegS<bits<2> opc, bit N, string mnemonic,
1991 SDPatternOperator OpNode = null_frag> {
1992 let Defs = [NZCV], mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
1993 def Wrr : BaseLogicalRegPseudo<GPR32, OpNode>;
1994 def Xrr : BaseLogicalRegPseudo<GPR64, OpNode>;
1995
1996 def Wrs : BaseLogicalSReg<opc, N, GPR32, logical_shifted_reg32, mnemonic,
1997 [(set GPR32:$Rd, (OpNode GPR32:$Rn, logical_shifted_reg32:$Rm))]> {
1998 let Inst{31} = 0;
1999 }
2000 def Xrs : BaseLogicalSReg<opc, N, GPR64, logical_shifted_reg64, mnemonic,
2001 [(set GPR64:$Rd, (OpNode GPR64:$Rn, logical_shifted_reg64:$Rm))]> {
2002 let Inst{31} = 1;
2003 }
2004 } // Defs = [NZCV]
2005
2006 def : LogicalRegAlias<mnemonic,
2007 !cast<Instruction>(NAME#"Wrs"), GPR32>;
2008 def : LogicalRegAlias<mnemonic,
2009 !cast<Instruction>(NAME#"Xrs"), GPR64>;
2010}
2011
2012//---
2013// Conditionally set flags
2014//---
2015
2016let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
2017class BaseCondSetFlagsImm<bit op, RegisterClass regtype, string asm>
2018 : I<(outs), (ins regtype:$Rn, imm0_31:$imm, imm0_15:$nzcv, ccode:$cond),
2019 asm, "\t$Rn, $imm, $nzcv, $cond", "", []>,
2020 Sched<[WriteI, ReadI]> {
2021 let Uses = [NZCV];
2022 let Defs = [NZCV];
2023
2024 bits<5> Rn;
2025 bits<5> imm;
2026 bits<4> nzcv;
2027 bits<4> cond;
2028
2029 let Inst{30} = op;
2030 let Inst{29-21} = 0b111010010;
2031 let Inst{20-16} = imm;
2032 let Inst{15-12} = cond;
2033 let Inst{11-10} = 0b10;
2034 let Inst{9-5} = Rn;
2035 let Inst{4} = 0b0;
2036 let Inst{3-0} = nzcv;
2037}
2038
2039multiclass CondSetFlagsImm<bit op, string asm> {
2040 def Wi : BaseCondSetFlagsImm<op, GPR32, asm> {
2041 let Inst{31} = 0;
2042 }
2043 def Xi : BaseCondSetFlagsImm<op, GPR64, asm> {
2044 let Inst{31} = 1;
2045 }
2046}
2047
2048let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
2049class BaseCondSetFlagsReg<bit op, RegisterClass regtype, string asm>
2050 : I<(outs), (ins regtype:$Rn, regtype:$Rm, imm0_15:$nzcv, ccode:$cond),
2051 asm, "\t$Rn, $Rm, $nzcv, $cond", "", []>,
2052 Sched<[WriteI, ReadI, ReadI]> {
2053 let Uses = [NZCV];
2054 let Defs = [NZCV];
2055
2056 bits<5> Rn;
2057 bits<5> Rm;
2058 bits<4> nzcv;
2059 bits<4> cond;
2060
2061 let Inst{30} = op;
2062 let Inst{29-21} = 0b111010010;
2063 let Inst{20-16} = Rm;
2064 let Inst{15-12} = cond;
2065 let Inst{11-10} = 0b00;
2066 let Inst{9-5} = Rn;
2067 let Inst{4} = 0b0;
2068 let Inst{3-0} = nzcv;
2069}
2070
2071multiclass CondSetFlagsReg<bit op, string asm> {
2072 def Wr : BaseCondSetFlagsReg<op, GPR32, asm> {
2073 let Inst{31} = 0;
2074 }
2075 def Xr : BaseCondSetFlagsReg<op, GPR64, asm> {
2076 let Inst{31} = 1;
2077 }
2078}
2079
2080//---
2081// Conditional select
2082//---
2083
2084class BaseCondSelect<bit op, bits<2> op2, RegisterClass regtype, string asm>
2085 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, ccode:$cond),
2086 asm, "\t$Rd, $Rn, $Rm, $cond", "",
2087 [(set regtype:$Rd,
2088 (AArch64csel regtype:$Rn, regtype:$Rm, (i32 imm:$cond), NZCV))]>,
2089 Sched<[WriteI, ReadI, ReadI]> {
2090 let Uses = [NZCV];
2091
2092 bits<5> Rd;
2093 bits<5> Rn;
2094 bits<5> Rm;
2095 bits<4> cond;
2096
2097 let Inst{30} = op;
2098 let Inst{29-21} = 0b011010100;
2099 let Inst{20-16} = Rm;
2100 let Inst{15-12} = cond;
2101 let Inst{11-10} = op2;
2102 let Inst{9-5} = Rn;
2103 let Inst{4-0} = Rd;
2104}
2105
2106multiclass CondSelect<bit op, bits<2> op2, string asm> {
2107 def Wr : BaseCondSelect<op, op2, GPR32, asm> {
2108 let Inst{31} = 0;
2109 }
2110 def Xr : BaseCondSelect<op, op2, GPR64, asm> {
2111 let Inst{31} = 1;
2112 }
2113}
2114
2115class BaseCondSelectOp<bit op, bits<2> op2, RegisterClass regtype, string asm,
2116 PatFrag frag>
2117 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, ccode:$cond),
2118 asm, "\t$Rd, $Rn, $Rm, $cond", "",
2119 [(set regtype:$Rd,
2120 (AArch64csel regtype:$Rn, (frag regtype:$Rm),
2121 (i32 imm:$cond), NZCV))]>,
2122 Sched<[WriteI, ReadI, ReadI]> {
2123 let Uses = [NZCV];
2124
2125 bits<5> Rd;
2126 bits<5> Rn;
2127 bits<5> Rm;
2128 bits<4> cond;
2129
2130 let Inst{30} = op;
2131 let Inst{29-21} = 0b011010100;
2132 let Inst{20-16} = Rm;
2133 let Inst{15-12} = cond;
2134 let Inst{11-10} = op2;
2135 let Inst{9-5} = Rn;
2136 let Inst{4-0} = Rd;
2137}
2138
2139def inv_cond_XFORM : SDNodeXForm<imm, [{
2140 AArch64CC::CondCode CC = static_cast<AArch64CC::CondCode>(N->getZExtValue());
2141 return CurDAG->getTargetConstant(AArch64CC::getInvertedCondCode(CC), MVT::i32);
2142}]>;
2143
2144multiclass CondSelectOp<bit op, bits<2> op2, string asm, PatFrag frag> {
2145 def Wr : BaseCondSelectOp<op, op2, GPR32, asm, frag> {
2146 let Inst{31} = 0;
2147 }
2148 def Xr : BaseCondSelectOp<op, op2, GPR64, asm, frag> {
2149 let Inst{31} = 1;
2150 }
2151
2152 def : Pat<(AArch64csel (frag GPR32:$Rm), GPR32:$Rn, (i32 imm:$cond), NZCV),
2153 (!cast<Instruction>(NAME # Wr) GPR32:$Rn, GPR32:$Rm,
2154 (inv_cond_XFORM imm:$cond))>;
2155
2156 def : Pat<(AArch64csel (frag GPR64:$Rm), GPR64:$Rn, (i32 imm:$cond), NZCV),
2157 (!cast<Instruction>(NAME # Xr) GPR64:$Rn, GPR64:$Rm,
2158 (inv_cond_XFORM imm:$cond))>;
2159}
2160
2161//---
2162// Special Mask Value
2163//---
2164def maski8_or_more : Operand<i32>,
2165 ImmLeaf<i32, [{ return (Imm & 0xff) == 0xff; }]> {
2166}
2167def maski16_or_more : Operand<i32>,
2168 ImmLeaf<i32, [{ return (Imm & 0xffff) == 0xffff; }]> {
2169}
2170
2171
2172//---
2173// Load/store
2174//---
2175
2176// (unsigned immediate)
2177// Indexed for 8-bit registers. offset is in range [0,4095].
2178def am_indexed8 : ComplexPattern<i64, 2, "SelectAddrModeIndexed8", []>;
2179def am_indexed16 : ComplexPattern<i64, 2, "SelectAddrModeIndexed16", []>;
2180def am_indexed32 : ComplexPattern<i64, 2, "SelectAddrModeIndexed32", []>;
2181def am_indexed64 : ComplexPattern<i64, 2, "SelectAddrModeIndexed64", []>;
2182def am_indexed128 : ComplexPattern<i64, 2, "SelectAddrModeIndexed128", []>;
2183
2184class UImm12OffsetOperand<int Scale> : AsmOperandClass {
2185 let Name = "UImm12Offset" # Scale;
2186 let RenderMethod = "addUImm12OffsetOperands<" # Scale # ">";
2187 let PredicateMethod = "isUImm12Offset<" # Scale # ">";
2188 let DiagnosticType = "InvalidMemoryIndexed" # Scale;
2189}
2190
2191def UImm12OffsetScale1Operand : UImm12OffsetOperand<1>;
2192def UImm12OffsetScale2Operand : UImm12OffsetOperand<2>;
2193def UImm12OffsetScale4Operand : UImm12OffsetOperand<4>;
2194def UImm12OffsetScale8Operand : UImm12OffsetOperand<8>;
2195def UImm12OffsetScale16Operand : UImm12OffsetOperand<16>;
2196
2197class uimm12_scaled<int Scale> : Operand<i64> {
2198 let ParserMatchClass
2199 = !cast<AsmOperandClass>("UImm12OffsetScale" # Scale # "Operand");
2200 let EncoderMethod
2201 = "getLdStUImm12OpValue<AArch64::fixup_aarch64_ldst_imm12_scale" # Scale # ">";
2202 let PrintMethod = "printUImm12Offset<" # Scale # ">";
2203}
2204
2205def uimm12s1 : uimm12_scaled<1>;
2206def uimm12s2 : uimm12_scaled<2>;
2207def uimm12s4 : uimm12_scaled<4>;
2208def uimm12s8 : uimm12_scaled<8>;
2209def uimm12s16 : uimm12_scaled<16>;
2210
2211class BaseLoadStoreUI<bits<2> sz, bit V, bits<2> opc, dag oops, dag iops,
2212 string asm, list<dag> pattern>
2213 : I<oops, iops, asm, "\t$Rt, [$Rn, $offset]", "", pattern> {
2214 bits<5> Rt;
2215
2216 bits<5> Rn;
2217 bits<12> offset;
2218
2219 let Inst{31-30} = sz;
2220 let Inst{29-27} = 0b111;
2221 let Inst{26} = V;
2222 let Inst{25-24} = 0b01;
2223 let Inst{23-22} = opc;
2224 let Inst{21-10} = offset;
2225 let Inst{9-5} = Rn;
2226 let Inst{4-0} = Rt;
2227
2228 let DecoderMethod = "DecodeUnsignedLdStInstruction";
2229}
2230
2231multiclass LoadUI<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2232 Operand indextype, string asm, list<dag> pattern> {
2233 let AddedComplexity = 10, mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
2234 def ui : BaseLoadStoreUI<sz, V, opc, (outs regtype:$Rt),
2235 (ins GPR64sp:$Rn, indextype:$offset),
2236 asm, pattern>,
2237 Sched<[WriteLD]>;
2238
2239 def : InstAlias<asm # " $Rt, [$Rn]",
2240 (!cast<Instruction>(NAME # "ui") regtype:$Rt, GPR64sp:$Rn, 0)>;
2241}
2242
2243multiclass StoreUI<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2244 Operand indextype, string asm, list<dag> pattern> {
2245 let AddedComplexity = 10, mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
2246 def ui : BaseLoadStoreUI<sz, V, opc, (outs),
2247 (ins regtype:$Rt, GPR64sp:$Rn, indextype:$offset),
2248 asm, pattern>,
2249 Sched<[WriteST]>;
2250
2251 def : InstAlias<asm # " $Rt, [$Rn]",
2252 (!cast<Instruction>(NAME # "ui") regtype:$Rt, GPR64sp:$Rn, 0)>;
2253}
2254
2255def PrefetchOperand : AsmOperandClass {
2256 let Name = "Prefetch";
2257 let ParserMethod = "tryParsePrefetch";
2258}
2259def prfop : Operand<i32> {
2260 let PrintMethod = "printPrefetchOp";
2261 let ParserMatchClass = PrefetchOperand;
2262}
2263
2264let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
2265class PrefetchUI<bits<2> sz, bit V, bits<2> opc, string asm, list<dag> pat>
2266 : BaseLoadStoreUI<sz, V, opc,
2267 (outs), (ins prfop:$Rt, GPR64sp:$Rn, uimm12s8:$offset),
2268 asm, pat>,
2269 Sched<[WriteLD]>;
2270
2271//---
2272// Load literal
2273//---
2274
2275// Load literal address: 19-bit immediate. The low two bits of the target
2276// offset are implied zero and so are not part of the immediate.
2277def am_ldrlit : Operand<OtherVT> {
2278 let EncoderMethod = "getLoadLiteralOpValue";
2279 let DecoderMethod = "DecodePCRelLabel19";
2280 let PrintMethod = "printAlignedLabel";
2281 let ParserMatchClass = PCRelLabel19Operand;
2282}
2283
2284let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
2285class LoadLiteral<bits<2> opc, bit V, RegisterClass regtype, string asm>
2286 : I<(outs regtype:$Rt), (ins am_ldrlit:$label),
2287 asm, "\t$Rt, $label", "", []>,
2288 Sched<[WriteLD]> {
2289 bits<5> Rt;
2290 bits<19> label;
2291 let Inst{31-30} = opc;
2292 let Inst{29-27} = 0b011;
2293 let Inst{26} = V;
2294 let Inst{25-24} = 0b00;
2295 let Inst{23-5} = label;
2296 let Inst{4-0} = Rt;
2297}
2298
2299let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
2300class PrefetchLiteral<bits<2> opc, bit V, string asm, list<dag> pat>
2301 : I<(outs), (ins prfop:$Rt, am_ldrlit:$label),
2302 asm, "\t$Rt, $label", "", pat>,
2303 Sched<[WriteLD]> {
2304 bits<5> Rt;
2305 bits<19> label;
2306 let Inst{31-30} = opc;
2307 let Inst{29-27} = 0b011;
2308 let Inst{26} = V;
2309 let Inst{25-24} = 0b00;
2310 let Inst{23-5} = label;
2311 let Inst{4-0} = Rt;
2312}
2313
2314//---
2315// Load/store register offset
2316//---
2317
2318def ro_Xindexed8 : ComplexPattern<i64, 4, "SelectAddrModeXRO<8>", []>;
2319def ro_Xindexed16 : ComplexPattern<i64, 4, "SelectAddrModeXRO<16>", []>;
2320def ro_Xindexed32 : ComplexPattern<i64, 4, "SelectAddrModeXRO<32>", []>;
2321def ro_Xindexed64 : ComplexPattern<i64, 4, "SelectAddrModeXRO<64>", []>;
2322def ro_Xindexed128 : ComplexPattern<i64, 4, "SelectAddrModeXRO<128>", []>;
2323
2324def ro_Windexed8 : ComplexPattern<i64, 4, "SelectAddrModeWRO<8>", []>;
2325def ro_Windexed16 : ComplexPattern<i64, 4, "SelectAddrModeWRO<16>", []>;
2326def ro_Windexed32 : ComplexPattern<i64, 4, "SelectAddrModeWRO<32>", []>;
2327def ro_Windexed64 : ComplexPattern<i64, 4, "SelectAddrModeWRO<64>", []>;
2328def ro_Windexed128 : ComplexPattern<i64, 4, "SelectAddrModeWRO<128>", []>;
2329
2330class MemExtendOperand<string Reg, int Width> : AsmOperandClass {
2331 let Name = "Mem" # Reg # "Extend" # Width;
2332 let PredicateMethod = "isMem" # Reg # "Extend<" # Width # ">";
2333 let RenderMethod = "addMemExtendOperands";
2334 let DiagnosticType = "InvalidMemory" # Reg # "Extend" # Width;
2335}
2336
2337def MemWExtend8Operand : MemExtendOperand<"W", 8> {
2338 // The address "[x0, x1, lsl #0]" actually maps to the variant which performs
2339 // the trivial shift.
2340 let RenderMethod = "addMemExtend8Operands";
2341}
2342def MemWExtend16Operand : MemExtendOperand<"W", 16>;
2343def MemWExtend32Operand : MemExtendOperand<"W", 32>;
2344def MemWExtend64Operand : MemExtendOperand<"W", 64>;
2345def MemWExtend128Operand : MemExtendOperand<"W", 128>;
2346
2347def MemXExtend8Operand : MemExtendOperand<"X", 8> {
2348 // The address "[x0, x1, lsl #0]" actually maps to the variant which performs
2349 // the trivial shift.
2350 let RenderMethod = "addMemExtend8Operands";
2351}
2352def MemXExtend16Operand : MemExtendOperand<"X", 16>;
2353def MemXExtend32Operand : MemExtendOperand<"X", 32>;
2354def MemXExtend64Operand : MemExtendOperand<"X", 64>;
2355def MemXExtend128Operand : MemExtendOperand<"X", 128>;
2356
2357class ro_extend<AsmOperandClass ParserClass, string Reg, int Width>
2358 : Operand<i32> {
2359 let ParserMatchClass = ParserClass;
2360 let PrintMethod = "printMemExtend<'" # Reg # "', " # Width # ">";
2361 let DecoderMethod = "DecodeMemExtend";
2362 let EncoderMethod = "getMemExtendOpValue";
2363 let MIOperandInfo = (ops i32imm:$signed, i32imm:$doshift);
2364}
2365
2366def ro_Wextend8 : ro_extend<MemWExtend8Operand, "w", 8>;
2367def ro_Wextend16 : ro_extend<MemWExtend16Operand, "w", 16>;
2368def ro_Wextend32 : ro_extend<MemWExtend32Operand, "w", 32>;
2369def ro_Wextend64 : ro_extend<MemWExtend64Operand, "w", 64>;
2370def ro_Wextend128 : ro_extend<MemWExtend128Operand, "w", 128>;
2371
2372def ro_Xextend8 : ro_extend<MemXExtend8Operand, "x", 8>;
2373def ro_Xextend16 : ro_extend<MemXExtend16Operand, "x", 16>;
2374def ro_Xextend32 : ro_extend<MemXExtend32Operand, "x", 32>;
2375def ro_Xextend64 : ro_extend<MemXExtend64Operand, "x", 64>;
2376def ro_Xextend128 : ro_extend<MemXExtend128Operand, "x", 128>;
2377
2378class ROAddrMode<ComplexPattern windex, ComplexPattern xindex,
2379 Operand wextend, Operand xextend> {
2380 // CodeGen-level pattern covering the entire addressing mode.
2381 ComplexPattern Wpat = windex;
2382 ComplexPattern Xpat = xindex;
2383
2384 // Asm-level Operand covering the valid "uxtw #3" style syntax.
2385 Operand Wext = wextend;
2386 Operand Xext = xextend;
2387}
2388
2389def ro8 : ROAddrMode<ro_Windexed8, ro_Xindexed8, ro_Wextend8, ro_Xextend8>;
2390def ro16 : ROAddrMode<ro_Windexed16, ro_Xindexed16, ro_Wextend16, ro_Xextend16>;
2391def ro32 : ROAddrMode<ro_Windexed32, ro_Xindexed32, ro_Wextend32, ro_Xextend32>;
2392def ro64 : ROAddrMode<ro_Windexed64, ro_Xindexed64, ro_Wextend64, ro_Xextend64>;
2393def ro128 : ROAddrMode<ro_Windexed128, ro_Xindexed128, ro_Wextend128,
2394 ro_Xextend128>;
2395
2396class LoadStore8RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2397 string asm, dag ins, dag outs, list<dag> pat>
2398 : I<ins, outs, asm, "\t$Rt, [$Rn, $Rm, $extend]", "", pat> {
2399 bits<5> Rt;
2400 bits<5> Rn;
2401 bits<5> Rm;
2402 bits<2> extend;
2403 let Inst{31-30} = sz;
2404 let Inst{29-27} = 0b111;
2405 let Inst{26} = V;
2406 let Inst{25-24} = 0b00;
2407 let Inst{23-22} = opc;
2408 let Inst{21} = 1;
2409 let Inst{20-16} = Rm;
2410 let Inst{15} = extend{1}; // sign extend Rm?
2411 let Inst{14} = 1;
2412 let Inst{12} = extend{0}; // do shift?
2413 let Inst{11-10} = 0b10;
2414 let Inst{9-5} = Rn;
2415 let Inst{4-0} = Rt;
2416}
2417
2418class ROInstAlias<string asm, RegisterClass regtype, Instruction INST>
2419 : InstAlias<asm # " $Rt, [$Rn, $Rm]",
2420 (INST regtype:$Rt, GPR64sp:$Rn, GPR64:$Rm, 0, 0)>;
2421
2422multiclass Load8RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2423 string asm, ValueType Ty, SDPatternOperator loadop> {
2424 let AddedComplexity = 10 in
2425 def roW : LoadStore8RO<sz, V, opc, regtype, asm,
2426 (outs regtype:$Rt),
2427 (ins GPR64sp:$Rn, GPR32:$Rm, ro_Wextend8:$extend),
2428 [(set (Ty regtype:$Rt),
2429 (loadop (ro_Windexed8 GPR64sp:$Rn, GPR32:$Rm,
2430 ro_Wextend8:$extend)))]>,
2431 Sched<[WriteLDIdx, ReadAdrBase]> {
2432 let Inst{13} = 0b0;
2433 }
2434
2435 let AddedComplexity = 10 in
2436 def roX : LoadStore8RO<sz, V, opc, regtype, asm,
2437 (outs regtype:$Rt),
2438 (ins GPR64sp:$Rn, GPR64:$Rm, ro_Xextend8:$extend),
2439 [(set (Ty regtype:$Rt),
2440 (loadop (ro_Xindexed8 GPR64sp:$Rn, GPR64:$Rm,
2441 ro_Xextend8:$extend)))]>,
2442 Sched<[WriteLDIdx, ReadAdrBase]> {
2443 let Inst{13} = 0b1;
2444 }
2445
2446 def : ROInstAlias<asm, regtype, !cast<Instruction>(NAME # "roX")>;
2447}
2448
2449multiclass Store8RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2450 string asm, ValueType Ty, SDPatternOperator storeop> {
2451 let AddedComplexity = 10 in
2452 def roW : LoadStore8RO<sz, V, opc, regtype, asm, (outs),
2453 (ins regtype:$Rt, GPR64sp:$Rn, GPR32:$Rm, ro_Wextend8:$extend),
2454 [(storeop (Ty regtype:$Rt),
2455 (ro_Windexed8 GPR64sp:$Rn, GPR32:$Rm,
2456 ro_Wextend8:$extend))]>,
2457 Sched<[WriteSTIdx, ReadAdrBase]> {
2458 let Inst{13} = 0b0;
2459 }
2460
2461 let AddedComplexity = 10 in
2462 def roX : LoadStore8RO<sz, V, opc, regtype, asm, (outs),
2463 (ins regtype:$Rt, GPR64sp:$Rn, GPR64:$Rm, ro_Xextend8:$extend),
2464 [(storeop (Ty regtype:$Rt),
2465 (ro_Xindexed8 GPR64sp:$Rn, GPR64:$Rm,
2466 ro_Xextend8:$extend))]>,
2467 Sched<[WriteSTIdx, ReadAdrBase]> {
2468 let Inst{13} = 0b1;
2469 }
2470
2471 def : ROInstAlias<asm, regtype, !cast<Instruction>(NAME # "roX")>;
2472}
2473
2474class LoadStore16RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2475 string asm, dag ins, dag outs, list<dag> pat>
2476 : I<ins, outs, asm, "\t$Rt, [$Rn, $Rm, $extend]", "", pat> {
2477 bits<5> Rt;
2478 bits<5> Rn;
2479 bits<5> Rm;
2480 bits<2> extend;
2481 let Inst{31-30} = sz;
2482 let Inst{29-27} = 0b111;
2483 let Inst{26} = V;
2484 let Inst{25-24} = 0b00;
2485 let Inst{23-22} = opc;
2486 let Inst{21} = 1;
2487 let Inst{20-16} = Rm;
2488 let Inst{15} = extend{1}; // sign extend Rm?
2489 let Inst{14} = 1;
2490 let Inst{12} = extend{0}; // do shift?
2491 let Inst{11-10} = 0b10;
2492 let Inst{9-5} = Rn;
2493 let Inst{4-0} = Rt;
2494}
2495
2496multiclass Load16RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2497 string asm, ValueType Ty, SDPatternOperator loadop> {
2498 let AddedComplexity = 10 in
2499 def roW : LoadStore16RO<sz, V, opc, regtype, asm, (outs regtype:$Rt),
2500 (ins GPR64sp:$Rn, GPR32:$Rm, ro_Wextend16:$extend),
2501 [(set (Ty regtype:$Rt),
2502 (loadop (ro_Windexed16 GPR64sp:$Rn, GPR32:$Rm,
2503 ro_Wextend16:$extend)))]>,
2504 Sched<[WriteLDIdx, ReadAdrBase]> {
2505 let Inst{13} = 0b0;
2506 }
2507
2508 let AddedComplexity = 10 in
2509 def roX : LoadStore16RO<sz, V, opc, regtype, asm, (outs regtype:$Rt),
2510 (ins GPR64sp:$Rn, GPR64:$Rm, ro_Xextend16:$extend),
2511 [(set (Ty regtype:$Rt),
2512 (loadop (ro_Xindexed16 GPR64sp:$Rn, GPR64:$Rm,
2513 ro_Xextend16:$extend)))]>,
2514 Sched<[WriteLDIdx, ReadAdrBase]> {
2515 let Inst{13} = 0b1;
2516 }
2517
2518 def : ROInstAlias<asm, regtype, !cast<Instruction>(NAME # "roX")>;
2519}
2520
2521multiclass Store16RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2522 string asm, ValueType Ty, SDPatternOperator storeop> {
2523 let AddedComplexity = 10 in
2524 def roW : LoadStore16RO<sz, V, opc, regtype, asm, (outs),
2525 (ins regtype:$Rt, GPR64sp:$Rn, GPR32:$Rm, ro_Wextend16:$extend),
2526 [(storeop (Ty regtype:$Rt),
2527 (ro_Windexed16 GPR64sp:$Rn, GPR32:$Rm,
2528 ro_Wextend16:$extend))]>,
2529 Sched<[WriteSTIdx, ReadAdrBase]> {
2530 let Inst{13} = 0b0;
2531 }
2532
2533 let AddedComplexity = 10 in
2534 def roX : LoadStore16RO<sz, V, opc, regtype, asm, (outs),
2535 (ins regtype:$Rt, GPR64sp:$Rn, GPR64:$Rm, ro_Xextend16:$extend),
2536 [(storeop (Ty regtype:$Rt),
2537 (ro_Xindexed16 GPR64sp:$Rn, GPR64:$Rm,
2538 ro_Xextend16:$extend))]>,
2539 Sched<[WriteSTIdx, ReadAdrBase]> {
2540 let Inst{13} = 0b1;
2541 }
2542
2543 def : ROInstAlias<asm, regtype, !cast<Instruction>(NAME # "roX")>;
2544}
2545
2546class LoadStore32RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2547 string asm, dag ins, dag outs, list<dag> pat>
2548 : I<ins, outs, asm, "\t$Rt, [$Rn, $Rm, $extend]", "", pat> {
2549 bits<5> Rt;
2550 bits<5> Rn;
2551 bits<5> Rm;
2552 bits<2> extend;
2553 let Inst{31-30} = sz;
2554 let Inst{29-27} = 0b111;
2555 let Inst{26} = V;
2556 let Inst{25-24} = 0b00;
2557 let Inst{23-22} = opc;
2558 let Inst{21} = 1;
2559 let Inst{20-16} = Rm;
2560 let Inst{15} = extend{1}; // sign extend Rm?
2561 let Inst{14} = 1;
2562 let Inst{12} = extend{0}; // do shift?
2563 let Inst{11-10} = 0b10;
2564 let Inst{9-5} = Rn;
2565 let Inst{4-0} = Rt;
2566}
2567
2568multiclass Load32RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2569 string asm, ValueType Ty, SDPatternOperator loadop> {
2570 let AddedComplexity = 10 in
2571 def roW : LoadStore32RO<sz, V, opc, regtype, asm, (outs regtype:$Rt),
2572 (ins GPR64sp:$Rn, GPR32:$Rm, ro_Wextend32:$extend),
2573 [(set (Ty regtype:$Rt),
2574 (loadop (ro_Windexed32 GPR64sp:$Rn, GPR32:$Rm,
2575 ro_Wextend32:$extend)))]>,
2576 Sched<[WriteLDIdx, ReadAdrBase]> {
2577 let Inst{13} = 0b0;
2578 }
2579
2580 let AddedComplexity = 10 in
2581 def roX : LoadStore32RO<sz, V, opc, regtype, asm, (outs regtype:$Rt),
2582 (ins GPR64sp:$Rn, GPR64:$Rm, ro_Xextend32:$extend),
2583 [(set (Ty regtype:$Rt),
2584 (loadop (ro_Xindexed32 GPR64sp:$Rn, GPR64:$Rm,
2585 ro_Xextend32:$extend)))]>,
2586 Sched<[WriteLDIdx, ReadAdrBase]> {
2587 let Inst{13} = 0b1;
2588 }
2589
2590 def : ROInstAlias<asm, regtype, !cast<Instruction>(NAME # "roX")>;
2591}
2592
2593multiclass Store32RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2594 string asm, ValueType Ty, SDPatternOperator storeop> {
2595 let AddedComplexity = 10 in
2596 def roW : LoadStore32RO<sz, V, opc, regtype, asm, (outs),
2597 (ins regtype:$Rt, GPR64sp:$Rn, GPR32:$Rm, ro_Wextend32:$extend),
2598 [(storeop (Ty regtype:$Rt),
2599 (ro_Windexed32 GPR64sp:$Rn, GPR32:$Rm,
2600 ro_Wextend32:$extend))]>,
2601 Sched<[WriteSTIdx, ReadAdrBase]> {
2602 let Inst{13} = 0b0;
2603 }
2604
2605 let AddedComplexity = 10 in
2606 def roX : LoadStore32RO<sz, V, opc, regtype, asm, (outs),
2607 (ins regtype:$Rt, GPR64sp:$Rn, GPR64:$Rm, ro_Xextend32:$extend),
2608 [(storeop (Ty regtype:$Rt),
2609 (ro_Xindexed32 GPR64sp:$Rn, GPR64:$Rm,
2610 ro_Xextend32:$extend))]>,
2611 Sched<[WriteSTIdx, ReadAdrBase]> {
2612 let Inst{13} = 0b1;
2613 }
2614
2615 def : ROInstAlias<asm, regtype, !cast<Instruction>(NAME # "roX")>;
2616}
2617
2618class LoadStore64RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2619 string asm, dag ins, dag outs, list<dag> pat>
2620 : I<ins, outs, asm, "\t$Rt, [$Rn, $Rm, $extend]", "", pat> {
2621 bits<5> Rt;
2622 bits<5> Rn;
2623 bits<5> Rm;
2624 bits<2> extend;
2625 let Inst{31-30} = sz;
2626 let Inst{29-27} = 0b111;
2627 let Inst{26} = V;
2628 let Inst{25-24} = 0b00;
2629 let Inst{23-22} = opc;
2630 let Inst{21} = 1;
2631 let Inst{20-16} = Rm;
2632 let Inst{15} = extend{1}; // sign extend Rm?
2633 let Inst{14} = 1;
2634 let Inst{12} = extend{0}; // do shift?
2635 let Inst{11-10} = 0b10;
2636 let Inst{9-5} = Rn;
2637 let Inst{4-0} = Rt;
2638}
2639
2640multiclass Load64RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2641 string asm, ValueType Ty, SDPatternOperator loadop> {
2642 let AddedComplexity = 10, mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
2643 def roW : LoadStore64RO<sz, V, opc, regtype, asm, (outs regtype:$Rt),
2644 (ins GPR64sp:$Rn, GPR32:$Rm, ro_Wextend64:$extend),
2645 [(set (Ty regtype:$Rt),
2646 (loadop (ro_Windexed64 GPR64sp:$Rn, GPR32:$Rm,
2647 ro_Wextend64:$extend)))]>,
2648 Sched<[WriteLDIdx, ReadAdrBase]> {
2649 let Inst{13} = 0b0;
2650 }
2651
2652 let AddedComplexity = 10, mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
2653 def roX : LoadStore64RO<sz, V, opc, regtype, asm, (outs regtype:$Rt),
2654 (ins GPR64sp:$Rn, GPR64:$Rm, ro_Xextend64:$extend),
2655 [(set (Ty regtype:$Rt),
2656 (loadop (ro_Xindexed64 GPR64sp:$Rn, GPR64:$Rm,
2657 ro_Xextend64:$extend)))]>,
2658 Sched<[WriteLDIdx, ReadAdrBase]> {
2659 let Inst{13} = 0b1;
2660 }
2661
2662 def : ROInstAlias<asm, regtype, !cast<Instruction>(NAME # "roX")>;
2663}
2664
2665multiclass Store64RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2666 string asm, ValueType Ty, SDPatternOperator storeop> {
2667 let AddedComplexity = 10, mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
2668 def roW : LoadStore64RO<sz, V, opc, regtype, asm, (outs),
2669 (ins regtype:$Rt, GPR64sp:$Rn, GPR32:$Rm, ro_Wextend64:$extend),
2670 [(storeop (Ty regtype:$Rt),
2671 (ro_Windexed64 GPR64sp:$Rn, GPR32:$Rm,
2672 ro_Wextend64:$extend))]>,
2673 Sched<[WriteSTIdx, ReadAdrBase]> {
2674 let Inst{13} = 0b0;
2675 }
2676
2677 let AddedComplexity = 10, mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
2678 def roX : LoadStore64RO<sz, V, opc, regtype, asm, (outs),
2679 (ins regtype:$Rt, GPR64sp:$Rn, GPR64:$Rm, ro_Xextend64:$extend),
2680 [(storeop (Ty regtype:$Rt),
2681 (ro_Xindexed64 GPR64sp:$Rn, GPR64:$Rm,
2682 ro_Xextend64:$extend))]>,
2683 Sched<[WriteSTIdx, ReadAdrBase]> {
2684 let Inst{13} = 0b1;
2685 }
2686
2687 def : ROInstAlias<asm, regtype, !cast<Instruction>(NAME # "roX")>;
2688}
2689
2690class LoadStore128RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2691 string asm, dag ins, dag outs, list<dag> pat>
2692 : I<ins, outs, asm, "\t$Rt, [$Rn, $Rm, $extend]", "", pat> {
2693 bits<5> Rt;
2694 bits<5> Rn;
2695 bits<5> Rm;
2696 bits<2> extend;
2697 let Inst{31-30} = sz;
2698 let Inst{29-27} = 0b111;
2699 let Inst{26} = V;
2700 let Inst{25-24} = 0b00;
2701 let Inst{23-22} = opc;
2702 let Inst{21} = 1;
2703 let Inst{20-16} = Rm;
2704 let Inst{15} = extend{1}; // sign extend Rm?
2705 let Inst{14} = 1;
2706 let Inst{12} = extend{0}; // do shift?
2707 let Inst{11-10} = 0b10;
2708 let Inst{9-5} = Rn;
2709 let Inst{4-0} = Rt;
2710}
2711
2712multiclass Load128RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2713 string asm, ValueType Ty, SDPatternOperator loadop> {
2714 let AddedComplexity = 10, mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
2715 def roW : LoadStore128RO<sz, V, opc, regtype, asm, (outs regtype:$Rt),
2716 (ins GPR64sp:$Rn, GPR32:$Rm, ro_Wextend128:$extend),
2717 [(set (Ty regtype:$Rt),
2718 (loadop (ro_Windexed128 GPR64sp:$Rn, GPR32:$Rm,
2719 ro_Wextend128:$extend)))]>,
2720 Sched<[WriteLDIdx, ReadAdrBase]> {
2721 let Inst{13} = 0b0;
2722 }
2723
2724 let AddedComplexity = 10, mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
2725 def roX : LoadStore128RO<sz, V, opc, regtype, asm, (outs regtype:$Rt),
2726 (ins GPR64sp:$Rn, GPR64:$Rm, ro_Xextend128:$extend),
2727 [(set (Ty regtype:$Rt),
2728 (loadop (ro_Xindexed128 GPR64sp:$Rn, GPR64:$Rm,
2729 ro_Xextend128:$extend)))]>,
2730 Sched<[WriteLDIdx, ReadAdrBase]> {
2731 let Inst{13} = 0b1;
2732 }
2733
2734 def : ROInstAlias<asm, regtype, !cast<Instruction>(NAME # "roX")>;
2735}
2736
2737multiclass Store128RO<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2738 string asm, ValueType Ty, SDPatternOperator storeop> {
2739 let AddedComplexity = 10, mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
2740 def roW : LoadStore128RO<sz, V, opc, regtype, asm, (outs),
2741 (ins regtype:$Rt, GPR64sp:$Rn, GPR32:$Rm, ro_Wextend128:$extend),
2742 [(storeop (Ty regtype:$Rt),
2743 (ro_Windexed128 GPR64sp:$Rn, GPR32:$Rm,
2744 ro_Wextend128:$extend))]>,
2745 Sched<[WriteSTIdx, ReadAdrBase]> {
2746 let Inst{13} = 0b0;
2747 }
2748
2749 let AddedComplexity = 10, mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
2750 def roX : LoadStore128RO<sz, V, opc, regtype, asm, (outs),
2751 (ins regtype:$Rt, GPR64sp:$Rn, GPR64:$Rm, ro_Xextend128:$extend),
2752 [(storeop (Ty regtype:$Rt),
2753 (ro_Xindexed128 GPR64sp:$Rn, GPR64:$Rm,
2754 ro_Xextend128:$extend))]>,
2755 Sched<[WriteSTIdx, ReadAdrBase]> {
2756 let Inst{13} = 0b1;
2757 }
2758
2759 def : ROInstAlias<asm, regtype, !cast<Instruction>(NAME # "roX")>;
2760}
2761
2762let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
2763class BasePrefetchRO<bits<2> sz, bit V, bits<2> opc, dag outs, dag ins,
2764 string asm, list<dag> pat>
2765 : I<outs, ins, asm, "\t$Rt, [$Rn, $Rm, $extend]", "", pat>,
2766 Sched<[WriteLD]> {
2767 bits<5> Rt;
2768 bits<5> Rn;
2769 bits<5> Rm;
2770 bits<2> extend;
2771 let Inst{31-30} = sz;
2772 let Inst{29-27} = 0b111;
2773 let Inst{26} = V;
2774 let Inst{25-24} = 0b00;
2775 let Inst{23-22} = opc;
2776 let Inst{21} = 1;
2777 let Inst{20-16} = Rm;
2778 let Inst{15} = extend{1}; // sign extend Rm?
2779 let Inst{14} = 1;
2780 let Inst{12} = extend{0}; // do shift?
2781 let Inst{11-10} = 0b10;
2782 let Inst{9-5} = Rn;
2783 let Inst{4-0} = Rt;
2784}
2785
2786multiclass PrefetchRO<bits<2> sz, bit V, bits<2> opc, string asm> {
2787 def roW : BasePrefetchRO<sz, V, opc, (outs),
2788 (ins prfop:$Rt, GPR64sp:$Rn, GPR32:$Rm, ro_Wextend64:$extend),
2789 asm, [(AArch64Prefetch imm:$Rt,
2790 (ro_Windexed64 GPR64sp:$Rn, GPR32:$Rm,
2791 ro_Wextend64:$extend))]> {
2792 let Inst{13} = 0b0;
2793 }
2794
2795 def roX : BasePrefetchRO<sz, V, opc, (outs),
2796 (ins prfop:$Rt, GPR64sp:$Rn, GPR64:$Rm, ro_Xextend64:$extend),
2797 asm, [(AArch64Prefetch imm:$Rt,
2798 (ro_Xindexed64 GPR64sp:$Rn, GPR64:$Rm,
2799 ro_Xextend64:$extend))]> {
2800 let Inst{13} = 0b1;
2801 }
2802
2803 def : InstAlias<"prfm $Rt, [$Rn, $Rm]",
2804 (!cast<Instruction>(NAME # "roX") prfop:$Rt,
2805 GPR64sp:$Rn, GPR64:$Rm, 0, 0)>;
2806}
2807
2808//---
2809// Load/store unscaled immediate
2810//---
2811
2812def am_unscaled8 : ComplexPattern<i64, 2, "SelectAddrModeUnscaled8", []>;
2813def am_unscaled16 : ComplexPattern<i64, 2, "SelectAddrModeUnscaled16", []>;
2814def am_unscaled32 : ComplexPattern<i64, 2, "SelectAddrModeUnscaled32", []>;
2815def am_unscaled64 : ComplexPattern<i64, 2, "SelectAddrModeUnscaled64", []>;
2816def am_unscaled128 :ComplexPattern<i64, 2, "SelectAddrModeUnscaled128", []>;
2817
2818class BaseLoadStoreUnscale<bits<2> sz, bit V, bits<2> opc, dag oops, dag iops,
2819 string asm, list<dag> pattern>
2820 : I<oops, iops, asm, "\t$Rt, [$Rn, $offset]", "", pattern> {
2821 bits<5> Rt;
2822 bits<5> Rn;
2823 bits<9> offset;
2824 let Inst{31-30} = sz;
2825 let Inst{29-27} = 0b111;
2826 let Inst{26} = V;
2827 let Inst{25-24} = 0b00;
2828 let Inst{23-22} = opc;
2829 let Inst{21} = 0;
2830 let Inst{20-12} = offset;
2831 let Inst{11-10} = 0b00;
2832 let Inst{9-5} = Rn;
2833 let Inst{4-0} = Rt;
2834
2835 let DecoderMethod = "DecodeSignedLdStInstruction";
2836}
2837
2838multiclass LoadUnscaled<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2839 string asm, list<dag> pattern> {
2840 let AddedComplexity = 1 in // try this before LoadUI
2841 def i : BaseLoadStoreUnscale<sz, V, opc, (outs regtype:$Rt),
2842 (ins GPR64sp:$Rn, simm9:$offset), asm, pattern>,
2843 Sched<[WriteLD]>;
2844
2845 def : InstAlias<asm # " $Rt, [$Rn]",
2846 (!cast<Instruction>(NAME # "i") regtype:$Rt, GPR64sp:$Rn, 0)>;
2847}
2848
2849multiclass StoreUnscaled<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2850 string asm, list<dag> pattern> {
2851 let AddedComplexity = 1 in // try this before StoreUI
2852 def i : BaseLoadStoreUnscale<sz, V, opc, (outs),
2853 (ins regtype:$Rt, GPR64sp:$Rn, simm9:$offset),
2854 asm, pattern>,
2855 Sched<[WriteST]>;
2856
2857 def : InstAlias<asm # " $Rt, [$Rn]",
2858 (!cast<Instruction>(NAME # "i") regtype:$Rt, GPR64sp:$Rn, 0)>;
2859}
2860
2861multiclass PrefetchUnscaled<bits<2> sz, bit V, bits<2> opc, string asm,
2862 list<dag> pat> {
2863 let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
2864 def i : BaseLoadStoreUnscale<sz, V, opc, (outs),
2865 (ins prfop:$Rt, GPR64sp:$Rn, simm9:$offset),
2866 asm, pat>,
2867 Sched<[WriteLD]>;
2868
2869 def : InstAlias<asm # " $Rt, [$Rn]",
2870 (!cast<Instruction>(NAME # "i") prfop:$Rt, GPR64sp:$Rn, 0)>;
2871}
2872
2873//---
2874// Load/store unscaled immediate, unprivileged
2875//---
2876
2877class BaseLoadStoreUnprivileged<bits<2> sz, bit V, bits<2> opc,
2878 dag oops, dag iops, string asm>
2879 : I<oops, iops, asm, "\t$Rt, [$Rn, $offset]", "", []> {
2880 bits<5> Rt;
2881 bits<5> Rn;
2882 bits<9> offset;
2883 let Inst{31-30} = sz;
2884 let Inst{29-27} = 0b111;
2885 let Inst{26} = V;
2886 let Inst{25-24} = 0b00;
2887 let Inst{23-22} = opc;
2888 let Inst{21} = 0;
2889 let Inst{20-12} = offset;
2890 let Inst{11-10} = 0b10;
2891 let Inst{9-5} = Rn;
2892 let Inst{4-0} = Rt;
2893
2894 let DecoderMethod = "DecodeSignedLdStInstruction";
2895}
2896
2897multiclass LoadUnprivileged<bits<2> sz, bit V, bits<2> opc,
2898 RegisterClass regtype, string asm> {
2899 let mayStore = 0, mayLoad = 1, hasSideEffects = 0 in
2900 def i : BaseLoadStoreUnprivileged<sz, V, opc, (outs regtype:$Rt),
2901 (ins GPR64sp:$Rn, simm9:$offset), asm>,
2902 Sched<[WriteLD]>;
2903
2904 def : InstAlias<asm # " $Rt, [$Rn]",
2905 (!cast<Instruction>(NAME # "i") regtype:$Rt, GPR64sp:$Rn, 0)>;
2906}
2907
2908multiclass StoreUnprivileged<bits<2> sz, bit V, bits<2> opc,
2909 RegisterClass regtype, string asm> {
2910 let mayStore = 1, mayLoad = 0, hasSideEffects = 0 in
2911 def i : BaseLoadStoreUnprivileged<sz, V, opc, (outs),
2912 (ins regtype:$Rt, GPR64sp:$Rn, simm9:$offset),
2913 asm>,
2914 Sched<[WriteST]>;
2915
2916 def : InstAlias<asm # " $Rt, [$Rn]",
2917 (!cast<Instruction>(NAME # "i") regtype:$Rt, GPR64sp:$Rn, 0)>;
2918}
2919
2920//---
2921// Load/store pre-indexed
2922//---
2923
2924class BaseLoadStorePreIdx<bits<2> sz, bit V, bits<2> opc, dag oops, dag iops,
2925 string asm, string cstr, list<dag> pat>
2926 : I<oops, iops, asm, "\t$Rt, [$Rn, $offset]!", cstr, pat> {
2927 bits<5> Rt;
2928 bits<5> Rn;
2929 bits<9> offset;
2930 let Inst{31-30} = sz;
2931 let Inst{29-27} = 0b111;
2932 let Inst{26} = V;
2933 let Inst{25-24} = 0;
2934 let Inst{23-22} = opc;
2935 let Inst{21} = 0;
2936 let Inst{20-12} = offset;
2937 let Inst{11-10} = 0b11;
2938 let Inst{9-5} = Rn;
2939 let Inst{4-0} = Rt;
2940
2941 let DecoderMethod = "DecodeSignedLdStInstruction";
2942}
2943
2944let hasSideEffects = 0 in {
2945let mayStore = 0, mayLoad = 1 in
2946class LoadPreIdx<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2947 string asm>
2948 : BaseLoadStorePreIdx<sz, V, opc,
2949 (outs GPR64sp:$wback, regtype:$Rt),
2950 (ins GPR64sp:$Rn, simm9:$offset), asm,
2951 "$Rn = $wback", []>,
2952 Sched<[WriteLD, WriteAdr]>;
2953
2954let mayStore = 1, mayLoad = 0 in
2955class StorePreIdx<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2956 string asm, SDPatternOperator storeop, ValueType Ty>
2957 : BaseLoadStorePreIdx<sz, V, opc,
2958 (outs GPR64sp:$wback),
2959 (ins regtype:$Rt, GPR64sp:$Rn, simm9:$offset),
2960 asm, "$Rn = $wback",
2961 [(set GPR64sp:$wback,
2962 (storeop (Ty regtype:$Rt), GPR64sp:$Rn, simm9:$offset))]>,
2963 Sched<[WriteAdr, WriteST]>;
2964} // hasSideEffects = 0
2965
2966//---
2967// Load/store post-indexed
2968//---
2969
2970// (pre-index) load/stores.
2971class BaseLoadStorePostIdx<bits<2> sz, bit V, bits<2> opc, dag oops, dag iops,
2972 string asm, string cstr, list<dag> pat>
2973 : I<oops, iops, asm, "\t$Rt, [$Rn], $offset", cstr, pat> {
2974 bits<5> Rt;
2975 bits<5> Rn;
2976 bits<9> offset;
2977 let Inst{31-30} = sz;
2978 let Inst{29-27} = 0b111;
2979 let Inst{26} = V;
2980 let Inst{25-24} = 0b00;
2981 let Inst{23-22} = opc;
2982 let Inst{21} = 0b0;
2983 let Inst{20-12} = offset;
2984 let Inst{11-10} = 0b01;
2985 let Inst{9-5} = Rn;
2986 let Inst{4-0} = Rt;
2987
2988 let DecoderMethod = "DecodeSignedLdStInstruction";
2989}
2990
2991let hasSideEffects = 0 in {
2992let mayStore = 0, mayLoad = 1 in
2993class LoadPostIdx<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
2994 string asm>
2995 : BaseLoadStorePostIdx<sz, V, opc,
2996 (outs GPR64sp:$wback, regtype:$Rt),
2997 (ins GPR64sp:$Rn, simm9:$offset),
2998 asm, "$Rn = $wback", []>,
2999 Sched<[WriteLD, WriteI]>;
3000
3001let mayStore = 1, mayLoad = 0 in
3002class StorePostIdx<bits<2> sz, bit V, bits<2> opc, RegisterClass regtype,
3003 string asm, SDPatternOperator storeop, ValueType Ty>
3004 : BaseLoadStorePostIdx<sz, V, opc,
3005 (outs GPR64sp:$wback),
3006 (ins regtype:$Rt, GPR64sp:$Rn, simm9:$offset),
3007 asm, "$Rn = $wback",
3008 [(set GPR64sp:$wback,
3009 (storeop (Ty regtype:$Rt), GPR64sp:$Rn, simm9:$offset))]>,
3010 Sched<[WriteAdr, WriteST, ReadAdrBase]>;
3011} // hasSideEffects = 0
3012
3013
3014//---
3015// Load/store pair
3016//---
3017
3018// (indexed, offset)
3019
3020class BaseLoadStorePairOffset<bits<2> opc, bit V, bit L, dag oops, dag iops,
3021 string asm>
3022 : I<oops, iops, asm, "\t$Rt, $Rt2, [$Rn, $offset]", "", []> {
3023 bits<5> Rt;
3024 bits<5> Rt2;
3025 bits<5> Rn;
3026 bits<7> offset;
3027 let Inst{31-30} = opc;
3028 let Inst{29-27} = 0b101;
3029 let Inst{26} = V;
3030 let Inst{25-23} = 0b010;
3031 let Inst{22} = L;
3032 let Inst{21-15} = offset;
3033 let Inst{14-10} = Rt2;
3034 let Inst{9-5} = Rn;
3035 let Inst{4-0} = Rt;
3036
3037 let DecoderMethod = "DecodePairLdStInstruction";
3038}
3039
3040multiclass LoadPairOffset<bits<2> opc, bit V, RegisterClass regtype,
3041 Operand indextype, string asm> {
3042 let hasSideEffects = 0, mayStore = 0, mayLoad = 1 in
3043 def i : BaseLoadStorePairOffset<opc, V, 1,
3044 (outs regtype:$Rt, regtype:$Rt2),
3045 (ins GPR64sp:$Rn, indextype:$offset), asm>,
3046 Sched<[WriteLD, WriteLDHi]>;
3047
3048 def : InstAlias<asm # " $Rt, $Rt2, [$Rn]",
3049 (!cast<Instruction>(NAME # "i") regtype:$Rt, regtype:$Rt2,
3050 GPR64sp:$Rn, 0)>;
3051}
3052
3053
3054multiclass StorePairOffset<bits<2> opc, bit V, RegisterClass regtype,
3055 Operand indextype, string asm> {
3056 let hasSideEffects = 0, mayLoad = 0, mayStore = 1 in
3057 def i : BaseLoadStorePairOffset<opc, V, 0, (outs),
3058 (ins regtype:$Rt, regtype:$Rt2,
3059 GPR64sp:$Rn, indextype:$offset),
3060 asm>,
3061 Sched<[WriteSTP]>;
3062
3063 def : InstAlias<asm # " $Rt, $Rt2, [$Rn]",
3064 (!cast<Instruction>(NAME # "i") regtype:$Rt, regtype:$Rt2,
3065 GPR64sp:$Rn, 0)>;
3066}
3067
3068// (pre-indexed)
3069class BaseLoadStorePairPreIdx<bits<2> opc, bit V, bit L, dag oops, dag iops,
3070 string asm>
3071 : I<oops, iops, asm, "\t$Rt, $Rt2, [$Rn, $offset]!", "$Rn = $wback", []> {
3072 bits<5> Rt;
3073 bits<5> Rt2;
3074 bits<5> Rn;
3075 bits<7> offset;
3076 let Inst{31-30} = opc;
3077 let Inst{29-27} = 0b101;
3078 let Inst{26} = V;
3079 let Inst{25-23} = 0b011;
3080 let Inst{22} = L;
3081 let Inst{21-15} = offset;
3082 let Inst{14-10} = Rt2;
3083 let Inst{9-5} = Rn;
3084 let Inst{4-0} = Rt;
3085
3086 let DecoderMethod = "DecodePairLdStInstruction";
3087}
3088
3089let hasSideEffects = 0 in {
3090let mayStore = 0, mayLoad = 1 in
3091class LoadPairPreIdx<bits<2> opc, bit V, RegisterClass regtype,
3092 Operand indextype, string asm>
3093 : BaseLoadStorePairPreIdx<opc, V, 1,
3094 (outs GPR64sp:$wback, regtype:$Rt, regtype:$Rt2),
3095 (ins GPR64sp:$Rn, indextype:$offset), asm>,
3096 Sched<[WriteLD, WriteLDHi, WriteAdr]>;
3097
3098let mayStore = 1, mayLoad = 0 in
3099class StorePairPreIdx<bits<2> opc, bit V, RegisterClass regtype,
3100 Operand indextype, string asm>
3101 : BaseLoadStorePairPreIdx<opc, V, 0, (outs GPR64sp:$wback),
3102 (ins regtype:$Rt, regtype:$Rt2,
3103 GPR64sp:$Rn, indextype:$offset),
3104 asm>,
3105 Sched<[WriteAdr, WriteSTP]>;
3106} // hasSideEffects = 0
3107
3108// (post-indexed)
3109
3110class BaseLoadStorePairPostIdx<bits<2> opc, bit V, bit L, dag oops, dag iops,
3111 string asm>
3112 : I<oops, iops, asm, "\t$Rt, $Rt2, [$Rn], $offset", "$Rn = $wback", []> {
3113 bits<5> Rt;
3114 bits<5> Rt2;
3115 bits<5> Rn;
3116 bits<7> offset;
3117 let Inst{31-30} = opc;
3118 let Inst{29-27} = 0b101;
3119 let Inst{26} = V;
3120 let Inst{25-23} = 0b001;
3121 let Inst{22} = L;
3122 let Inst{21-15} = offset;
3123 let Inst{14-10} = Rt2;
3124 let Inst{9-5} = Rn;
3125 let Inst{4-0} = Rt;
3126
3127 let DecoderMethod = "DecodePairLdStInstruction";
3128}
3129
3130let hasSideEffects = 0 in {
3131let mayStore = 0, mayLoad = 1 in
3132class LoadPairPostIdx<bits<2> opc, bit V, RegisterClass regtype,
3133 Operand idxtype, string asm>
3134 : BaseLoadStorePairPostIdx<opc, V, 1,
3135 (outs GPR64sp:$wback, regtype:$Rt, regtype:$Rt2),
3136 (ins GPR64sp:$Rn, idxtype:$offset), asm>,
3137 Sched<[WriteLD, WriteLDHi, WriteAdr]>;
3138
3139let mayStore = 1, mayLoad = 0 in
3140class StorePairPostIdx<bits<2> opc, bit V, RegisterClass regtype,
3141 Operand idxtype, string asm>
3142 : BaseLoadStorePairPostIdx<opc, V, 0, (outs),
3143 (ins GPR64sp:$wback, regtype:$Rt, regtype:$Rt2,
3144 GPR64sp:$Rn, idxtype:$offset),
3145 asm>,
3146 Sched<[WriteAdr, WriteSTP]>;
3147} // hasSideEffects = 0
3148
3149// (no-allocate)
3150
3151class BaseLoadStorePairNoAlloc<bits<2> opc, bit V, bit L, dag oops, dag iops,
3152 string asm>
3153 : I<oops, iops, asm, "\t$Rt, $Rt2, [$Rn, $offset]", "", []> {
3154 bits<5> Rt;
3155 bits<5> Rt2;
3156 bits<5> Rn;
3157 bits<7> offset;
3158 let Inst{31-30} = opc;
3159 let Inst{29-27} = 0b101;
3160 let Inst{26} = V;
3161 let Inst{25-23} = 0b000;
3162 let Inst{22} = L;
3163 let Inst{21-15} = offset;
3164 let Inst{14-10} = Rt2;
3165 let Inst{9-5} = Rn;
3166 let Inst{4-0} = Rt;
3167
3168 let DecoderMethod = "DecodePairLdStInstruction";
3169}
3170
3171multiclass LoadPairNoAlloc<bits<2> opc, bit V, RegisterClass regtype,
3172 Operand indextype, string asm> {
3173 let hasSideEffects = 0, mayStore = 0, mayLoad = 1 in
3174 def i : BaseLoadStorePairNoAlloc<opc, V, 1,
3175 (outs regtype:$Rt, regtype:$Rt2),
3176 (ins GPR64sp:$Rn, indextype:$offset), asm>,
3177 Sched<[WriteLD, WriteLDHi]>;
3178
3179
3180 def : InstAlias<asm # "\t$Rt, $Rt2, [$Rn]",
3181 (!cast<Instruction>(NAME # "i") regtype:$Rt, regtype:$Rt2,
3182 GPR64sp:$Rn, 0)>;
3183}
3184
3185multiclass StorePairNoAlloc<bits<2> opc, bit V, RegisterClass regtype,
3186 Operand indextype, string asm> {
3187 let hasSideEffects = 0, mayStore = 1, mayLoad = 0 in
3188 def i : BaseLoadStorePairNoAlloc<opc, V, 0, (outs),
3189 (ins regtype:$Rt, regtype:$Rt2,
3190 GPR64sp:$Rn, indextype:$offset),
3191 asm>,
3192 Sched<[WriteSTP]>;
3193
3194 def : InstAlias<asm # "\t$Rt, $Rt2, [$Rn]",
3195 (!cast<Instruction>(NAME # "i") regtype:$Rt, regtype:$Rt2,
3196 GPR64sp:$Rn, 0)>;
3197}
3198
3199//---
3200// Load/store exclusive
3201//---
3202
3203// True exclusive operations write to and/or read from the system's exclusive
3204// monitors, which as far as a compiler is concerned can be modelled as a
3205// random shared memory address. Hence LoadExclusive mayStore.
3206//
3207// Since these instructions have the undefined register bits set to 1 in
3208// their canonical form, we need a post encoder method to set those bits
3209// to 1 when encoding these instructions. We do this using the
3210// fixLoadStoreExclusive function. This function has template parameters:
3211//
3212// fixLoadStoreExclusive<int hasRs, int hasRt2>
3213//
3214// hasRs indicates that the instruction uses the Rs field, so we won't set
3215// it to 1 (and the same for Rt2). We don't need template parameters for
3216// the other register fields since Rt and Rn are always used.
3217//
3218let hasSideEffects = 1, mayLoad = 1, mayStore = 1 in
3219class BaseLoadStoreExclusive<bits<2> sz, bit o2, bit L, bit o1, bit o0,
3220 dag oops, dag iops, string asm, string operands>
3221 : I<oops, iops, asm, operands, "", []> {
3222 let Inst{31-30} = sz;
3223 let Inst{29-24} = 0b001000;
3224 let Inst{23} = o2;
3225 let Inst{22} = L;
3226 let Inst{21} = o1;
3227 let Inst{15} = o0;
3228
3229 let DecoderMethod = "DecodeExclusiveLdStInstruction";
3230}
3231
3232// Neither Rs nor Rt2 operands.
3233class LoadStoreExclusiveSimple<bits<2> sz, bit o2, bit L, bit o1, bit o0,
3234 dag oops, dag iops, string asm, string operands>
3235 : BaseLoadStoreExclusive<sz, o2, L, o1, o0, oops, iops, asm, operands> {
3236 bits<5> Rt;
3237 bits<5> Rn;
3238 let Inst{9-5} = Rn;
3239 let Inst{4-0} = Rt;
3240
3241 let PostEncoderMethod = "fixLoadStoreExclusive<0,0>";
3242}
3243
3244// Simple load acquires don't set the exclusive monitor
3245let mayLoad = 1, mayStore = 0 in
3246class LoadAcquire<bits<2> sz, bit o2, bit L, bit o1, bit o0,
3247 RegisterClass regtype, string asm>
3248 : LoadStoreExclusiveSimple<sz, o2, L, o1, o0, (outs regtype:$Rt),
3249 (ins GPR64sp0:$Rn), asm, "\t$Rt, [$Rn]">,
3250 Sched<[WriteLD]>;
3251
3252class LoadExclusive<bits<2> sz, bit o2, bit L, bit o1, bit o0,
3253 RegisterClass regtype, string asm>
3254 : LoadStoreExclusiveSimple<sz, o2, L, o1, o0, (outs regtype:$Rt),
3255 (ins GPR64sp0:$Rn), asm, "\t$Rt, [$Rn]">,
3256 Sched<[WriteLD]>;
3257
3258class LoadExclusivePair<bits<2> sz, bit o2, bit L, bit o1, bit o0,
3259 RegisterClass regtype, string asm>
3260 : BaseLoadStoreExclusive<sz, o2, L, o1, o0,
3261 (outs regtype:$Rt, regtype:$Rt2),
3262 (ins GPR64sp0:$Rn), asm,
3263 "\t$Rt, $Rt2, [$Rn]">,
3264 Sched<[WriteLD, WriteLDHi]> {
3265 bits<5> Rt;
3266 bits<5> Rt2;
3267 bits<5> Rn;
3268 let Inst{14-10} = Rt2;
3269 let Inst{9-5} = Rn;
3270 let Inst{4-0} = Rt;
3271
3272 let PostEncoderMethod = "fixLoadStoreExclusive<0,1>";
3273}
3274
3275// Simple store release operations do not check the exclusive monitor.
3276let mayLoad = 0, mayStore = 1 in
3277class StoreRelease<bits<2> sz, bit o2, bit L, bit o1, bit o0,
3278 RegisterClass regtype, string asm>
3279 : LoadStoreExclusiveSimple<sz, o2, L, o1, o0, (outs),
3280 (ins regtype:$Rt, GPR64sp0:$Rn),
3281 asm, "\t$Rt, [$Rn]">,
3282 Sched<[WriteST]>;
3283
3284let mayLoad = 1, mayStore = 1 in
3285class StoreExclusive<bits<2> sz, bit o2, bit L, bit o1, bit o0,
3286 RegisterClass regtype, string asm>
3287 : BaseLoadStoreExclusive<sz, o2, L, o1, o0, (outs GPR32:$Ws),
3288 (ins regtype:$Rt, GPR64sp0:$Rn),
3289 asm, "\t$Ws, $Rt, [$Rn]">,
3290 Sched<[WriteSTX]> {
3291 bits<5> Ws;
3292 bits<5> Rt;
3293 bits<5> Rn;
3294 let Inst{20-16} = Ws;
3295 let Inst{9-5} = Rn;
3296 let Inst{4-0} = Rt;
3297
3298 let Constraints = "@earlyclobber $Ws";
3299 let PostEncoderMethod = "fixLoadStoreExclusive<1,0>";
3300}
3301
3302class StoreExclusivePair<bits<2> sz, bit o2, bit L, bit o1, bit o0,
3303 RegisterClass regtype, string asm>
3304 : BaseLoadStoreExclusive<sz, o2, L, o1, o0,
3305 (outs GPR32:$Ws),
3306 (ins regtype:$Rt, regtype:$Rt2, GPR64sp0:$Rn),
3307 asm, "\t$Ws, $Rt, $Rt2, [$Rn]">,
3308 Sched<[WriteSTX]> {
3309 bits<5> Ws;
3310 bits<5> Rt;
3311 bits<5> Rt2;
3312 bits<5> Rn;
3313 let Inst{20-16} = Ws;
3314 let Inst{14-10} = Rt2;
3315 let Inst{9-5} = Rn;
3316 let Inst{4-0} = Rt;
3317
3318 let Constraints = "@earlyclobber $Ws";
3319}
3320
3321//---
3322// Exception generation
3323//---
3324
3325let mayLoad = 0, mayStore = 0, hasSideEffects = 1 in
3326class ExceptionGeneration<bits<3> op1, bits<2> ll, string asm>
3327 : I<(outs), (ins imm0_65535:$imm), asm, "\t$imm", "", []>,
3328 Sched<[WriteSys]> {
3329 bits<16> imm;
3330 let Inst{31-24} = 0b11010100;
3331 let Inst{23-21} = op1;
3332 let Inst{20-5} = imm;
3333 let Inst{4-2} = 0b000;
3334 let Inst{1-0} = ll;
3335}
3336
3337let Predicates = [HasFPARMv8] in {
3338
3339//---
3340// Floating point to integer conversion
3341//---
3342
3343class BaseFPToIntegerUnscaled<bits<2> type, bits<2> rmode, bits<3> opcode,
3344 RegisterClass srcType, RegisterClass dstType,
3345 string asm, list<dag> pattern>
3346 : I<(outs dstType:$Rd), (ins srcType:$Rn),
3347 asm, "\t$Rd, $Rn", "", pattern>,
3348 Sched<[WriteFCvt]> {
3349 bits<5> Rd;
3350 bits<5> Rn;
3351 let Inst{30-29} = 0b00;
3352 let Inst{28-24} = 0b11110;
3353 let Inst{23-22} = type;
3354 let Inst{21} = 1;
3355 let Inst{20-19} = rmode;
3356 let Inst{18-16} = opcode;
3357 let Inst{15-10} = 0;
3358 let Inst{9-5} = Rn;
3359 let Inst{4-0} = Rd;
3360}
3361
3362let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3363class BaseFPToInteger<bits<2> type, bits<2> rmode, bits<3> opcode,
3364 RegisterClass srcType, RegisterClass dstType,
3365 Operand immType, string asm, list<dag> pattern>
3366 : I<(outs dstType:$Rd), (ins srcType:$Rn, immType:$scale),
3367 asm, "\t$Rd, $Rn, $scale", "", pattern>,
3368 Sched<[WriteFCvt]> {
3369 bits<5> Rd;
3370 bits<5> Rn;
3371 bits<6> scale;
3372 let Inst{30-29} = 0b00;
3373 let Inst{28-24} = 0b11110;
3374 let Inst{23-22} = type;
3375 let Inst{21} = 0;
3376 let Inst{20-19} = rmode;
3377 let Inst{18-16} = opcode;
3378 let Inst{15-10} = scale;
3379 let Inst{9-5} = Rn;
3380 let Inst{4-0} = Rd;
3381}
3382
3383multiclass FPToIntegerUnscaled<bits<2> rmode, bits<3> opcode, string asm,
3384 SDPatternOperator OpN> {
3385 // Unscaled single-precision to 32-bit
3386 def UWSr : BaseFPToIntegerUnscaled<0b00, rmode, opcode, FPR32, GPR32, asm,
3387 [(set GPR32:$Rd, (OpN FPR32:$Rn))]> {
3388 let Inst{31} = 0; // 32-bit GPR flag
3389 }
3390
3391 // Unscaled single-precision to 64-bit
3392 def UXSr : BaseFPToIntegerUnscaled<0b00, rmode, opcode, FPR32, GPR64, asm,
3393 [(set GPR64:$Rd, (OpN FPR32:$Rn))]> {
3394 let Inst{31} = 1; // 64-bit GPR flag
3395 }
3396
3397 // Unscaled double-precision to 32-bit
3398 def UWDr : BaseFPToIntegerUnscaled<0b01, rmode, opcode, FPR64, GPR32, asm,
3399 [(set GPR32:$Rd, (OpN (f64 FPR64:$Rn)))]> {
3400 let Inst{31} = 0; // 32-bit GPR flag
3401 }
3402
3403 // Unscaled double-precision to 64-bit
3404 def UXDr : BaseFPToIntegerUnscaled<0b01, rmode, opcode, FPR64, GPR64, asm,
3405 [(set GPR64:$Rd, (OpN (f64 FPR64:$Rn)))]> {
3406 let Inst{31} = 1; // 64-bit GPR flag
3407 }
3408}
3409
3410multiclass FPToIntegerScaled<bits<2> rmode, bits<3> opcode, string asm,
3411 SDPatternOperator OpN> {
3412 // Scaled single-precision to 32-bit
3413 def SWSri : BaseFPToInteger<0b00, rmode, opcode, FPR32, GPR32,
3414 fixedpoint_f32_i32, asm,
3415 [(set GPR32:$Rd, (OpN (fmul FPR32:$Rn,
3416 fixedpoint_f32_i32:$scale)))]> {
3417 let Inst{31} = 0; // 32-bit GPR flag
3418 let scale{5} = 1;
3419 }
3420
3421 // Scaled single-precision to 64-bit
3422 def SXSri : BaseFPToInteger<0b00, rmode, opcode, FPR32, GPR64,
3423 fixedpoint_f32_i64, asm,
3424 [(set GPR64:$Rd, (OpN (fmul FPR32:$Rn,
3425 fixedpoint_f32_i64:$scale)))]> {
3426 let Inst{31} = 1; // 64-bit GPR flag
3427 }
3428
3429 // Scaled double-precision to 32-bit
3430 def SWDri : BaseFPToInteger<0b01, rmode, opcode, FPR64, GPR32,
3431 fixedpoint_f64_i32, asm,
3432 [(set GPR32:$Rd, (OpN (fmul FPR64:$Rn,
3433 fixedpoint_f64_i32:$scale)))]> {
3434 let Inst{31} = 0; // 32-bit GPR flag
3435 let scale{5} = 1;
3436 }
3437
3438 // Scaled double-precision to 64-bit
3439 def SXDri : BaseFPToInteger<0b01, rmode, opcode, FPR64, GPR64,
3440 fixedpoint_f64_i64, asm,
3441 [(set GPR64:$Rd, (OpN (fmul FPR64:$Rn,
3442 fixedpoint_f64_i64:$scale)))]> {
3443 let Inst{31} = 1; // 64-bit GPR flag
3444 }
3445}
3446
3447//---
3448// Integer to floating point conversion
3449//---
3450
3451let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
3452class BaseIntegerToFP<bit isUnsigned,
3453 RegisterClass srcType, RegisterClass dstType,
3454 Operand immType, string asm, list<dag> pattern>
3455 : I<(outs dstType:$Rd), (ins srcType:$Rn, immType:$scale),
3456 asm, "\t$Rd, $Rn, $scale", "", pattern>,
3457 Sched<[WriteFCvt]> {
3458 bits<5> Rd;
3459 bits<5> Rn;
3460 bits<6> scale;
3461 let Inst{30-23} = 0b00111100;
3462 let Inst{21-17} = 0b00001;
3463 let Inst{16} = isUnsigned;
3464 let Inst{15-10} = scale;
3465 let Inst{9-5} = Rn;
3466 let Inst{4-0} = Rd;
3467}
3468
3469class BaseIntegerToFPUnscaled<bit isUnsigned,
3470 RegisterClass srcType, RegisterClass dstType,
3471 ValueType dvt, string asm, SDNode node>
3472 : I<(outs dstType:$Rd), (ins srcType:$Rn),
3473 asm, "\t$Rd, $Rn", "", [(set (dvt dstType:$Rd), (node srcType:$Rn))]>,
3474 Sched<[WriteFCvt]> {
3475 bits<5> Rd;
3476 bits<5> Rn;
3477 bits<6> scale;
3478 let Inst{30-23} = 0b00111100;
3479 let Inst{21-17} = 0b10001;
3480 let Inst{16} = isUnsigned;
3481 let Inst{15-10} = 0b000000;
3482 let Inst{9-5} = Rn;
3483 let Inst{4-0} = Rd;
3484}
3485
3486multiclass IntegerToFP<bit isUnsigned, string asm, SDNode node> {
3487 // Unscaled
3488 def UWSri: BaseIntegerToFPUnscaled<isUnsigned, GPR32, FPR32, f32, asm, node> {
3489 let Inst{31} = 0; // 32-bit GPR flag
3490 let Inst{22} = 0; // 32-bit FPR flag
3491 }
3492
3493 def UWDri: BaseIntegerToFPUnscaled<isUnsigned, GPR32, FPR64, f64, asm, node> {
3494 let Inst{31} = 0; // 32-bit GPR flag
3495 let Inst{22} = 1; // 64-bit FPR flag
3496 }
3497
3498 def UXSri: BaseIntegerToFPUnscaled<isUnsigned, GPR64, FPR32, f32, asm, node> {
3499 let Inst{31} = 1; // 64-bit GPR flag
3500 let Inst{22} = 0; // 32-bit FPR flag
3501 }
3502
3503 def UXDri: BaseIntegerToFPUnscaled<isUnsigned, GPR64, FPR64, f64, asm, node> {
3504 let Inst{31} = 1; // 64-bit GPR flag
3505 let Inst{22} = 1; // 64-bit FPR flag
3506 }
3507
3508 // Scaled
3509 def SWSri: BaseIntegerToFP<isUnsigned, GPR32, FPR32, fixedpoint_f32_i32, asm,
3510 [(set FPR32:$Rd,
3511 (fdiv (node GPR32:$Rn),
3512 fixedpoint_f32_i32:$scale))]> {
3513 let Inst{31} = 0; // 32-bit GPR flag
3514 let Inst{22} = 0; // 32-bit FPR flag
3515 let scale{5} = 1;
3516 }
3517
3518 def SWDri: BaseIntegerToFP<isUnsigned, GPR32, FPR64, fixedpoint_f64_i32, asm,
3519 [(set FPR64:$Rd,
3520 (fdiv (node GPR32:$Rn),
3521 fixedpoint_f64_i32:$scale))]> {
3522 let Inst{31} = 0; // 32-bit GPR flag
3523 let Inst{22} = 1; // 64-bit FPR flag
3524 let scale{5} = 1;
3525 }
3526
3527 def SXSri: BaseIntegerToFP<isUnsigned, GPR64, FPR32, fixedpoint_f32_i64, asm,
3528 [(set FPR32:$Rd,
3529 (fdiv (node GPR64:$Rn),
3530 fixedpoint_f32_i64:$scale))]> {
3531 let Inst{31} = 1; // 64-bit GPR flag
3532 let Inst{22} = 0; // 32-bit FPR flag
3533 }
3534
3535 def SXDri: BaseIntegerToFP<isUnsigned, GPR64, FPR64, fixedpoint_f64_i64, asm,
3536 [(set FPR64:$Rd,
3537 (fdiv (node GPR64:$Rn),
3538 fixedpoint_f64_i64:$scale))]> {
3539 let Inst{31} = 1; // 64-bit GPR flag
3540 let Inst{22} = 1; // 64-bit FPR flag
3541 }
3542}
3543
3544//---
3545// Unscaled integer <-> floating point conversion (i.e. FMOV)
3546//---
3547
3548let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3549class BaseUnscaledConversion<bits<2> rmode, bits<3> opcode,
3550 RegisterClass srcType, RegisterClass dstType,
3551 string asm>
3552 : I<(outs dstType:$Rd), (ins srcType:$Rn), asm, "\t$Rd, $Rn", "",
3553 // We use COPY_TO_REGCLASS for these bitconvert operations.
3554 // copyPhysReg() expands the resultant COPY instructions after
3555 // regalloc is done. This gives greater freedom for the allocator
3556 // and related passes (coalescing, copy propagation, et. al.) to
3557 // be more effective.
3558 [/*(set (dvt dstType:$Rd), (bitconvert (svt srcType:$Rn)))*/]>,
3559 Sched<[WriteFCopy]> {
3560 bits<5> Rd;
3561 bits<5> Rn;
3562 let Inst{30-23} = 0b00111100;
3563 let Inst{21} = 1;
3564 let Inst{20-19} = rmode;
3565 let Inst{18-16} = opcode;
3566 let Inst{15-10} = 0b000000;
3567 let Inst{9-5} = Rn;
3568 let Inst{4-0} = Rd;
3569}
3570
3571let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3572class BaseUnscaledConversionToHigh<bits<2> rmode, bits<3> opcode,
3573 RegisterClass srcType, RegisterOperand dstType, string asm,
3574 string kind>
3575 : I<(outs dstType:$Rd), (ins srcType:$Rn, VectorIndex1:$idx), asm,
3576 "{\t$Rd"#kind#"$idx, $Rn|"#kind#"\t$Rd$idx, $Rn}", "", []>,
3577 Sched<[WriteFCopy]> {
3578 bits<5> Rd;
3579 bits<5> Rn;
3580 let Inst{30-23} = 0b00111101;
3581 let Inst{21} = 1;
3582 let Inst{20-19} = rmode;
3583 let Inst{18-16} = opcode;
3584 let Inst{15-10} = 0b000000;
3585 let Inst{9-5} = Rn;
3586 let Inst{4-0} = Rd;
3587
3588 let DecoderMethod = "DecodeFMOVLaneInstruction";
3589}
3590
3591let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3592class BaseUnscaledConversionFromHigh<bits<2> rmode, bits<3> opcode,
3593 RegisterOperand srcType, RegisterClass dstType, string asm,
3594 string kind>
3595 : I<(outs dstType:$Rd), (ins srcType:$Rn, VectorIndex1:$idx), asm,
3596 "{\t$Rd, $Rn"#kind#"$idx|"#kind#"\t$Rd, $Rn$idx}", "", []>,
3597 Sched<[WriteFCopy]> {
3598 bits<5> Rd;
3599 bits<5> Rn;
3600 let Inst{30-23} = 0b00111101;
3601 let Inst{21} = 1;
3602 let Inst{20-19} = rmode;
3603 let Inst{18-16} = opcode;
3604 let Inst{15-10} = 0b000000;
3605 let Inst{9-5} = Rn;
3606 let Inst{4-0} = Rd;
3607
3608 let DecoderMethod = "DecodeFMOVLaneInstruction";
3609}
3610
3611
3612
3613multiclass UnscaledConversion<string asm> {
3614 def WSr : BaseUnscaledConversion<0b00, 0b111, GPR32, FPR32, asm> {
3615 let Inst{31} = 0; // 32-bit GPR flag
3616 let Inst{22} = 0; // 32-bit FPR flag
3617 }
3618
3619 def XDr : BaseUnscaledConversion<0b00, 0b111, GPR64, FPR64, asm> {
3620 let Inst{31} = 1; // 64-bit GPR flag
3621 let Inst{22} = 1; // 64-bit FPR flag
3622 }
3623
3624 def SWr : BaseUnscaledConversion<0b00, 0b110, FPR32, GPR32, asm> {
3625 let Inst{31} = 0; // 32-bit GPR flag
3626 let Inst{22} = 0; // 32-bit FPR flag
3627 }
3628
3629 def DXr : BaseUnscaledConversion<0b00, 0b110, FPR64, GPR64, asm> {
3630 let Inst{31} = 1; // 64-bit GPR flag
3631 let Inst{22} = 1; // 64-bit FPR flag
3632 }
3633
3634 def XDHighr : BaseUnscaledConversionToHigh<0b01, 0b111, GPR64, V128,
3635 asm, ".d"> {
3636 let Inst{31} = 1;
3637 let Inst{22} = 0;
3638 }
3639
3640 def DXHighr : BaseUnscaledConversionFromHigh<0b01, 0b110, V128, GPR64,
3641 asm, ".d"> {
3642 let Inst{31} = 1;
3643 let Inst{22} = 0;
3644 }
3645}
3646
3647//---
3648// Floating point conversion
3649//---
3650
3651class BaseFPConversion<bits<2> type, bits<2> opcode, RegisterClass dstType,
3652 RegisterClass srcType, string asm, list<dag> pattern>
3653 : I<(outs dstType:$Rd), (ins srcType:$Rn), asm, "\t$Rd, $Rn", "", pattern>,
3654 Sched<[WriteFCvt]> {
3655 bits<5> Rd;
3656 bits<5> Rn;
3657 let Inst{31-24} = 0b00011110;
3658 let Inst{23-22} = type;
3659 let Inst{21-17} = 0b10001;
3660 let Inst{16-15} = opcode;
3661 let Inst{14-10} = 0b10000;
3662 let Inst{9-5} = Rn;
3663 let Inst{4-0} = Rd;
3664}
3665
3666multiclass FPConversion<string asm> {
3667 // Double-precision to Half-precision
3668 def HDr : BaseFPConversion<0b01, 0b11, FPR16, FPR64, asm,
3669 [(set FPR16:$Rd, (fround FPR64:$Rn))]>;
3670
3671 // Double-precision to Single-precision
3672 def SDr : BaseFPConversion<0b01, 0b00, FPR32, FPR64, asm,
3673 [(set FPR32:$Rd, (fround FPR64:$Rn))]>;
3674
3675 // Half-precision to Double-precision
3676 def DHr : BaseFPConversion<0b11, 0b01, FPR64, FPR16, asm,
3677 [(set FPR64:$Rd, (fextend FPR16:$Rn))]>;
3678
3679 // Half-precision to Single-precision
3680 def SHr : BaseFPConversion<0b11, 0b00, FPR32, FPR16, asm,
3681 [(set FPR32:$Rd, (fextend FPR16:$Rn))]>;
3682
3683 // Single-precision to Double-precision
3684 def DSr : BaseFPConversion<0b00, 0b01, FPR64, FPR32, asm,
3685 [(set FPR64:$Rd, (fextend FPR32:$Rn))]>;
3686
3687 // Single-precision to Half-precision
3688 def HSr : BaseFPConversion<0b00, 0b11, FPR16, FPR32, asm,
3689 [(set FPR16:$Rd, (fround FPR32:$Rn))]>;
3690}
3691
3692//---
3693// Single operand floating point data processing
3694//---
3695
3696let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3697class BaseSingleOperandFPData<bits<4> opcode, RegisterClass regtype,
3698 ValueType vt, string asm, SDPatternOperator node>
3699 : I<(outs regtype:$Rd), (ins regtype:$Rn), asm, "\t$Rd, $Rn", "",
3700 [(set (vt regtype:$Rd), (node (vt regtype:$Rn)))]>,
3701 Sched<[WriteF]> {
3702 bits<5> Rd;
3703 bits<5> Rn;
3704 let Inst{31-23} = 0b000111100;
3705 let Inst{21-19} = 0b100;
3706 let Inst{18-15} = opcode;
3707 let Inst{14-10} = 0b10000;
3708 let Inst{9-5} = Rn;
3709 let Inst{4-0} = Rd;
3710}
3711
3712multiclass SingleOperandFPData<bits<4> opcode, string asm,
3713 SDPatternOperator node = null_frag> {
3714 def Sr : BaseSingleOperandFPData<opcode, FPR32, f32, asm, node> {
3715 let Inst{22} = 0; // 32-bit size flag
3716 }
3717
3718 def Dr : BaseSingleOperandFPData<opcode, FPR64, f64, asm, node> {
3719 let Inst{22} = 1; // 64-bit size flag
3720 }
3721}
3722
3723//---
3724// Two operand floating point data processing
3725//---
3726
3727let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3728class BaseTwoOperandFPData<bits<4> opcode, RegisterClass regtype,
3729 string asm, list<dag> pat>
3730 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm),
3731 asm, "\t$Rd, $Rn, $Rm", "", pat>,
3732 Sched<[WriteF]> {
3733 bits<5> Rd;
3734 bits<5> Rn;
3735 bits<5> Rm;
3736 let Inst{31-23} = 0b000111100;
3737 let Inst{21} = 1;
3738 let Inst{20-16} = Rm;
3739 let Inst{15-12} = opcode;
3740 let Inst{11-10} = 0b10;
3741 let Inst{9-5} = Rn;
3742 let Inst{4-0} = Rd;
3743}
3744
3745multiclass TwoOperandFPData<bits<4> opcode, string asm,
3746 SDPatternOperator node = null_frag> {
3747 def Srr : BaseTwoOperandFPData<opcode, FPR32, asm,
3748 [(set (f32 FPR32:$Rd),
3749 (node (f32 FPR32:$Rn), (f32 FPR32:$Rm)))]> {
3750 let Inst{22} = 0; // 32-bit size flag
3751 }
3752
3753 def Drr : BaseTwoOperandFPData<opcode, FPR64, asm,
3754 [(set (f64 FPR64:$Rd),
3755 (node (f64 FPR64:$Rn), (f64 FPR64:$Rm)))]> {
3756 let Inst{22} = 1; // 64-bit size flag
3757 }
3758}
3759
3760multiclass TwoOperandFPDataNeg<bits<4> opcode, string asm, SDNode node> {
3761 def Srr : BaseTwoOperandFPData<opcode, FPR32, asm,
3762 [(set FPR32:$Rd, (fneg (node FPR32:$Rn, (f32 FPR32:$Rm))))]> {
3763 let Inst{22} = 0; // 32-bit size flag
3764 }
3765
3766 def Drr : BaseTwoOperandFPData<opcode, FPR64, asm,
3767 [(set FPR64:$Rd, (fneg (node FPR64:$Rn, (f64 FPR64:$Rm))))]> {
3768 let Inst{22} = 1; // 64-bit size flag
3769 }
3770}
3771
3772
3773//---
3774// Three operand floating point data processing
3775//---
3776
3777class BaseThreeOperandFPData<bit isNegated, bit isSub,
3778 RegisterClass regtype, string asm, list<dag> pat>
3779 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, regtype: $Ra),
3780 asm, "\t$Rd, $Rn, $Rm, $Ra", "", pat>,
3781 Sched<[WriteFMul]> {
3782 bits<5> Rd;
3783 bits<5> Rn;
3784 bits<5> Rm;
3785 bits<5> Ra;
3786 let Inst{31-23} = 0b000111110;
3787 let Inst{21} = isNegated;
3788 let Inst{20-16} = Rm;
3789 let Inst{15} = isSub;
3790 let Inst{14-10} = Ra;
3791 let Inst{9-5} = Rn;
3792 let Inst{4-0} = Rd;
3793}
3794
3795multiclass ThreeOperandFPData<bit isNegated, bit isSub,string asm,
3796 SDPatternOperator node> {
3797 def Srrr : BaseThreeOperandFPData<isNegated, isSub, FPR32, asm,
3798 [(set FPR32:$Rd,
3799 (node (f32 FPR32:$Rn), (f32 FPR32:$Rm), (f32 FPR32:$Ra)))]> {
3800 let Inst{22} = 0; // 32-bit size flag
3801 }
3802
3803 def Drrr : BaseThreeOperandFPData<isNegated, isSub, FPR64, asm,
3804 [(set FPR64:$Rd,
3805 (node (f64 FPR64:$Rn), (f64 FPR64:$Rm), (f64 FPR64:$Ra)))]> {
3806 let Inst{22} = 1; // 64-bit size flag
3807 }
3808}
3809
3810//---
3811// Floating point data comparisons
3812//---
3813
3814let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3815class BaseOneOperandFPComparison<bit signalAllNans,
3816 RegisterClass regtype, string asm,
3817 list<dag> pat>
3818 : I<(outs), (ins regtype:$Rn), asm, "\t$Rn, #0.0", "", pat>,
3819 Sched<[WriteFCmp]> {
3820 bits<5> Rn;
3821 let Inst{31-23} = 0b000111100;
3822 let Inst{21} = 1;
3823
3824 let Inst{15-10} = 0b001000;
3825 let Inst{9-5} = Rn;
3826 let Inst{4} = signalAllNans;
3827 let Inst{3-0} = 0b1000;
3828
3829 // Rm should be 0b00000 canonically, but we need to accept any value.
3830 let PostEncoderMethod = "fixOneOperandFPComparison";
3831}
3832
3833let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3834class BaseTwoOperandFPComparison<bit signalAllNans, RegisterClass regtype,
3835 string asm, list<dag> pat>
3836 : I<(outs), (ins regtype:$Rn, regtype:$Rm), asm, "\t$Rn, $Rm", "", pat>,
3837 Sched<[WriteFCmp]> {
3838 bits<5> Rm;
3839 bits<5> Rn;
3840 let Inst{31-23} = 0b000111100;
3841 let Inst{21} = 1;
3842 let Inst{20-16} = Rm;
3843 let Inst{15-10} = 0b001000;
3844 let Inst{9-5} = Rn;
3845 let Inst{4} = signalAllNans;
3846 let Inst{3-0} = 0b0000;
3847}
3848
3849multiclass FPComparison<bit signalAllNans, string asm,
3850 SDPatternOperator OpNode = null_frag> {
3851 let Defs = [NZCV] in {
3852 def Srr : BaseTwoOperandFPComparison<signalAllNans, FPR32, asm,
3853 [(OpNode FPR32:$Rn, (f32 FPR32:$Rm)), (implicit NZCV)]> {
3854 let Inst{22} = 0;
3855 }
3856
3857 def Sri : BaseOneOperandFPComparison<signalAllNans, FPR32, asm,
3858 [(OpNode (f32 FPR32:$Rn), fpimm0), (implicit NZCV)]> {
3859 let Inst{22} = 0;
3860 }
3861
3862 def Drr : BaseTwoOperandFPComparison<signalAllNans, FPR64, asm,
3863 [(OpNode FPR64:$Rn, (f64 FPR64:$Rm)), (implicit NZCV)]> {
3864 let Inst{22} = 1;
3865 }
3866
3867 def Dri : BaseOneOperandFPComparison<signalAllNans, FPR64, asm,
3868 [(OpNode (f64 FPR64:$Rn), fpimm0), (implicit NZCV)]> {
3869 let Inst{22} = 1;
3870 }
3871 } // Defs = [NZCV]
3872}
3873
3874//---
3875// Floating point conditional comparisons
3876//---
3877
3878let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3879class BaseFPCondComparison<bit signalAllNans,
3880 RegisterClass regtype, string asm>
3881 : I<(outs), (ins regtype:$Rn, regtype:$Rm, imm0_15:$nzcv, ccode:$cond),
3882 asm, "\t$Rn, $Rm, $nzcv, $cond", "", []>,
3883 Sched<[WriteFCmp]> {
3884 bits<5> Rn;
3885 bits<5> Rm;
3886 bits<4> nzcv;
3887 bits<4> cond;
3888
3889 let Inst{31-23} = 0b000111100;
3890 let Inst{21} = 1;
3891 let Inst{20-16} = Rm;
3892 let Inst{15-12} = cond;
3893 let Inst{11-10} = 0b01;
3894 let Inst{9-5} = Rn;
3895 let Inst{4} = signalAllNans;
3896 let Inst{3-0} = nzcv;
3897}
3898
3899multiclass FPCondComparison<bit signalAllNans, string asm> {
3900 let Defs = [NZCV], Uses = [NZCV] in {
3901 def Srr : BaseFPCondComparison<signalAllNans, FPR32, asm> {
3902 let Inst{22} = 0;
3903 }
3904
3905 def Drr : BaseFPCondComparison<signalAllNans, FPR64, asm> {
3906 let Inst{22} = 1;
3907 }
3908 } // Defs = [NZCV], Uses = [NZCV]
3909}
3910
3911//---
3912// Floating point conditional select
3913//---
3914
3915class BaseFPCondSelect<RegisterClass regtype, ValueType vt, string asm>
3916 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, ccode:$cond),
3917 asm, "\t$Rd, $Rn, $Rm, $cond", "",
3918 [(set regtype:$Rd,
3919 (AArch64csel (vt regtype:$Rn), regtype:$Rm,
3920 (i32 imm:$cond), NZCV))]>,
3921 Sched<[WriteF]> {
3922 bits<5> Rd;
3923 bits<5> Rn;
3924 bits<5> Rm;
3925 bits<4> cond;
3926
3927 let Inst{31-23} = 0b000111100;
3928 let Inst{21} = 1;
3929 let Inst{20-16} = Rm;
3930 let Inst{15-12} = cond;
3931 let Inst{11-10} = 0b11;
3932 let Inst{9-5} = Rn;
3933 let Inst{4-0} = Rd;
3934}
3935
3936multiclass FPCondSelect<string asm> {
3937 let Uses = [NZCV] in {
3938 def Srrr : BaseFPCondSelect<FPR32, f32, asm> {
3939 let Inst{22} = 0;
3940 }
3941
3942 def Drrr : BaseFPCondSelect<FPR64, f64, asm> {
3943 let Inst{22} = 1;
3944 }
3945 } // Uses = [NZCV]
3946}
3947
3948//---
3949// Floating move immediate
3950//---
3951
3952class BaseFPMoveImmediate<RegisterClass regtype, Operand fpimmtype, string asm>
3953 : I<(outs regtype:$Rd), (ins fpimmtype:$imm), asm, "\t$Rd, $imm", "",
3954 [(set regtype:$Rd, fpimmtype:$imm)]>,
3955 Sched<[WriteFImm]> {
3956 bits<5> Rd;
3957 bits<8> imm;
3958 let Inst{31-23} = 0b000111100;
3959 let Inst{21} = 1;
3960 let Inst{20-13} = imm;
3961 let Inst{12-5} = 0b10000000;
3962 let Inst{4-0} = Rd;
3963}
3964
3965multiclass FPMoveImmediate<string asm> {
3966 def Si : BaseFPMoveImmediate<FPR32, fpimm32, asm> {
3967 let Inst{22} = 0;
3968 }
3969
3970 def Di : BaseFPMoveImmediate<FPR64, fpimm64, asm> {
3971 let Inst{22} = 1;
3972 }
3973}
3974} // end of 'let Predicates = [HasFPARMv8]'
3975
3976//----------------------------------------------------------------------------
3977// AdvSIMD
3978//----------------------------------------------------------------------------
3979
3980let Predicates = [HasNEON] in {
3981
3982//----------------------------------------------------------------------------
3983// AdvSIMD three register vector instructions
3984//----------------------------------------------------------------------------
3985
3986let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
3987class BaseSIMDThreeSameVector<bit Q, bit U, bits<2> size, bits<5> opcode,
3988 RegisterOperand regtype, string asm, string kind,
3989 list<dag> pattern>
3990 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm), asm,
3991 "{\t$Rd" # kind # ", $Rn" # kind # ", $Rm" # kind #
3992 "|" # kind # "\t$Rd, $Rn, $Rm|}", "", pattern>,
3993 Sched<[WriteV]> {
3994 bits<5> Rd;
3995 bits<5> Rn;
3996 bits<5> Rm;
3997 let Inst{31} = 0;
3998 let Inst{30} = Q;
3999 let Inst{29} = U;
4000 let Inst{28-24} = 0b01110;
4001 let Inst{23-22} = size;
4002 let Inst{21} = 1;
4003 let Inst{20-16} = Rm;
4004 let Inst{15-11} = opcode;
4005 let Inst{10} = 1;
4006 let Inst{9-5} = Rn;
4007 let Inst{4-0} = Rd;
4008}
4009
4010let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
4011class BaseSIMDThreeSameVectorTied<bit Q, bit U, bits<2> size, bits<5> opcode,
4012 RegisterOperand regtype, string asm, string kind,
4013 list<dag> pattern>
4014 : I<(outs regtype:$dst), (ins regtype:$Rd, regtype:$Rn, regtype:$Rm), asm,
4015 "{\t$Rd" # kind # ", $Rn" # kind # ", $Rm" # kind #
4016 "|" # kind # "\t$Rd, $Rn, $Rm}", "$Rd = $dst", pattern>,
4017 Sched<[WriteV]> {
4018 bits<5> Rd;
4019 bits<5> Rn;
4020 bits<5> Rm;
4021 let Inst{31} = 0;
4022 let Inst{30} = Q;
4023 let Inst{29} = U;
4024 let Inst{28-24} = 0b01110;
4025 let Inst{23-22} = size;
4026 let Inst{21} = 1;
4027 let Inst{20-16} = Rm;
4028 let Inst{15-11} = opcode;
4029 let Inst{10} = 1;
4030 let Inst{9-5} = Rn;
4031 let Inst{4-0} = Rd;
4032}
4033
4034// All operand sizes distinguished in the encoding.
4035multiclass SIMDThreeSameVector<bit U, bits<5> opc, string asm,
4036 SDPatternOperator OpNode> {
4037 def v8i8 : BaseSIMDThreeSameVector<0, U, 0b00, opc, V64,
4038 asm, ".8b",
4039 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
4040 def v16i8 : BaseSIMDThreeSameVector<1, U, 0b00, opc, V128,
4041 asm, ".16b",
4042 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn), (v16i8 V128:$Rm)))]>;
4043 def v4i16 : BaseSIMDThreeSameVector<0, U, 0b01, opc, V64,
4044 asm, ".4h",
4045 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
4046 def v8i16 : BaseSIMDThreeSameVector<1, U, 0b01, opc, V128,
4047 asm, ".8h",
4048 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn), (v8i16 V128:$Rm)))]>;
4049 def v2i32 : BaseSIMDThreeSameVector<0, U, 0b10, opc, V64,
4050 asm, ".2s",
4051 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
4052 def v4i32 : BaseSIMDThreeSameVector<1, U, 0b10, opc, V128,
4053 asm, ".4s",
4054 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn), (v4i32 V128:$Rm)))]>;
4055 def v2i64 : BaseSIMDThreeSameVector<1, U, 0b11, opc, V128,
4056 asm, ".2d",
4057 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn), (v2i64 V128:$Rm)))]>;
4058}
4059
4060// As above, but D sized elements unsupported.
4061multiclass SIMDThreeSameVectorBHS<bit U, bits<5> opc, string asm,
4062 SDPatternOperator OpNode> {
4063 def v8i8 : BaseSIMDThreeSameVector<0, U, 0b00, opc, V64,
4064 asm, ".8b",
4065 [(set V64:$Rd, (v8i8 (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm))))]>;
4066 def v16i8 : BaseSIMDThreeSameVector<1, U, 0b00, opc, V128,
4067 asm, ".16b",
4068 [(set V128:$Rd, (v16i8 (OpNode (v16i8 V128:$Rn), (v16i8 V128:$Rm))))]>;
4069 def v4i16 : BaseSIMDThreeSameVector<0, U, 0b01, opc, V64,
4070 asm, ".4h",
4071 [(set V64:$Rd, (v4i16 (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm))))]>;
4072 def v8i16 : BaseSIMDThreeSameVector<1, U, 0b01, opc, V128,
4073 asm, ".8h",
4074 [(set V128:$Rd, (v8i16 (OpNode (v8i16 V128:$Rn), (v8i16 V128:$Rm))))]>;
4075 def v2i32 : BaseSIMDThreeSameVector<0, U, 0b10, opc, V64,
4076 asm, ".2s",
4077 [(set V64:$Rd, (v2i32 (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm))))]>;
4078 def v4i32 : BaseSIMDThreeSameVector<1, U, 0b10, opc, V128,
4079 asm, ".4s",
4080 [(set V128:$Rd, (v4i32 (OpNode (v4i32 V128:$Rn), (v4i32 V128:$Rm))))]>;
4081}
4082
4083multiclass SIMDThreeSameVectorBHSTied<bit U, bits<5> opc, string asm,
4084 SDPatternOperator OpNode> {
4085 def v8i8 : BaseSIMDThreeSameVectorTied<0, U, 0b00, opc, V64,
4086 asm, ".8b",
4087 [(set (v8i8 V64:$dst),
4088 (OpNode (v8i8 V64:$Rd), (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
4089 def v16i8 : BaseSIMDThreeSameVectorTied<1, U, 0b00, opc, V128,
4090 asm, ".16b",
4091 [(set (v16i8 V128:$dst),
4092 (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn), (v16i8 V128:$Rm)))]>;
4093 def v4i16 : BaseSIMDThreeSameVectorTied<0, U, 0b01, opc, V64,
4094 asm, ".4h",
4095 [(set (v4i16 V64:$dst),
4096 (OpNode (v4i16 V64:$Rd), (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
4097 def v8i16 : BaseSIMDThreeSameVectorTied<1, U, 0b01, opc, V128,
4098 asm, ".8h",
4099 [(set (v8i16 V128:$dst),
4100 (OpNode (v8i16 V128:$Rd), (v8i16 V128:$Rn), (v8i16 V128:$Rm)))]>;
4101 def v2i32 : BaseSIMDThreeSameVectorTied<0, U, 0b10, opc, V64,
4102 asm, ".2s",
4103 [(set (v2i32 V64:$dst),
4104 (OpNode (v2i32 V64:$Rd), (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
4105 def v4i32 : BaseSIMDThreeSameVectorTied<1, U, 0b10, opc, V128,
4106 asm, ".4s",
4107 [(set (v4i32 V128:$dst),
4108 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn), (v4i32 V128:$Rm)))]>;
4109}
4110
4111// As above, but only B sized elements supported.
4112multiclass SIMDThreeSameVectorB<bit U, bits<5> opc, string asm,
4113 SDPatternOperator OpNode> {
4114 def v8i8 : BaseSIMDThreeSameVector<0, U, 0b00, opc, V64,
4115 asm, ".8b",
4116 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
4117 def v16i8 : BaseSIMDThreeSameVector<1, U, 0b00, opc, V128,
4118 asm, ".16b",
4119 [(set (v16i8 V128:$Rd),
4120 (OpNode (v16i8 V128:$Rn), (v16i8 V128:$Rm)))]>;
4121}
4122
4123// As above, but only S and D sized floating point elements supported.
4124multiclass SIMDThreeSameVectorFP<bit U, bit S, bits<5> opc,
4125 string asm, SDPatternOperator OpNode> {
4126 def v2f32 : BaseSIMDThreeSameVector<0, U, {S,0}, opc, V64,
4127 asm, ".2s",
4128 [(set (v2f32 V64:$Rd), (OpNode (v2f32 V64:$Rn), (v2f32 V64:$Rm)))]>;
4129 def v4f32 : BaseSIMDThreeSameVector<1, U, {S,0}, opc, V128,
4130 asm, ".4s",
4131 [(set (v4f32 V128:$Rd), (OpNode (v4f32 V128:$Rn), (v4f32 V128:$Rm)))]>;
4132 def v2f64 : BaseSIMDThreeSameVector<1, U, {S,1}, opc, V128,
4133 asm, ".2d",
4134 [(set (v2f64 V128:$Rd), (OpNode (v2f64 V128:$Rn), (v2f64 V128:$Rm)))]>;
4135}
4136
4137multiclass SIMDThreeSameVectorFPCmp<bit U, bit S, bits<5> opc,
4138 string asm,
4139 SDPatternOperator OpNode> {
4140 def v2f32 : BaseSIMDThreeSameVector<0, U, {S,0}, opc, V64,
4141 asm, ".2s",
4142 [(set (v2i32 V64:$Rd), (OpNode (v2f32 V64:$Rn), (v2f32 V64:$Rm)))]>;
4143 def v4f32 : BaseSIMDThreeSameVector<1, U, {S,0}, opc, V128,
4144 asm, ".4s",
4145 [(set (v4i32 V128:$Rd), (OpNode (v4f32 V128:$Rn), (v4f32 V128:$Rm)))]>;
4146 def v2f64 : BaseSIMDThreeSameVector<1, U, {S,1}, opc, V128,
4147 asm, ".2d",
4148 [(set (v2i64 V128:$Rd), (OpNode (v2f64 V128:$Rn), (v2f64 V128:$Rm)))]>;
4149}
4150
4151multiclass SIMDThreeSameVectorFPTied<bit U, bit S, bits<5> opc,
4152 string asm, SDPatternOperator OpNode> {
4153 def v2f32 : BaseSIMDThreeSameVectorTied<0, U, {S,0}, opc, V64,
4154 asm, ".2s",
4155 [(set (v2f32 V64:$dst),
4156 (OpNode (v2f32 V64:$Rd), (v2f32 V64:$Rn), (v2f32 V64:$Rm)))]>;
4157 def v4f32 : BaseSIMDThreeSameVectorTied<1, U, {S,0}, opc, V128,
4158 asm, ".4s",
4159 [(set (v4f32 V128:$dst),
4160 (OpNode (v4f32 V128:$Rd), (v4f32 V128:$Rn), (v4f32 V128:$Rm)))]>;
4161 def v2f64 : BaseSIMDThreeSameVectorTied<1, U, {S,1}, opc, V128,
4162 asm, ".2d",
4163 [(set (v2f64 V128:$dst),
4164 (OpNode (v2f64 V128:$Rd), (v2f64 V128:$Rn), (v2f64 V128:$Rm)))]>;
4165}
4166
4167// As above, but D and B sized elements unsupported.
4168multiclass SIMDThreeSameVectorHS<bit U, bits<5> opc, string asm,
4169 SDPatternOperator OpNode> {
4170 def v4i16 : BaseSIMDThreeSameVector<0, U, 0b01, opc, V64,
4171 asm, ".4h",
4172 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
4173 def v8i16 : BaseSIMDThreeSameVector<1, U, 0b01, opc, V128,
4174 asm, ".8h",
4175 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn), (v8i16 V128:$Rm)))]>;
4176 def v2i32 : BaseSIMDThreeSameVector<0, U, 0b10, opc, V64,
4177 asm, ".2s",
4178 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
4179 def v4i32 : BaseSIMDThreeSameVector<1, U, 0b10, opc, V128,
4180 asm, ".4s",
4181 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn), (v4i32 V128:$Rm)))]>;
4182}
4183
4184// Logical three vector ops share opcode bits, and only use B sized elements.
4185multiclass SIMDLogicalThreeVector<bit U, bits<2> size, string asm,
4186 SDPatternOperator OpNode = null_frag> {
4187 def v8i8 : BaseSIMDThreeSameVector<0, U, size, 0b00011, V64,
4188 asm, ".8b",
4189 [(set (v8i8 V64:$Rd), (OpNode V64:$Rn, V64:$Rm))]>;
4190 def v16i8 : BaseSIMDThreeSameVector<1, U, size, 0b00011, V128,
4191 asm, ".16b",
4192 [(set (v16i8 V128:$Rd), (OpNode V128:$Rn, V128:$Rm))]>;
4193
4194 def : Pat<(v4i16 (OpNode V64:$LHS, V64:$RHS)),
4195 (!cast<Instruction>(NAME#"v8i8") V64:$LHS, V64:$RHS)>;
4196 def : Pat<(v2i32 (OpNode V64:$LHS, V64:$RHS)),
4197 (!cast<Instruction>(NAME#"v8i8") V64:$LHS, V64:$RHS)>;
4198 def : Pat<(v1i64 (OpNode V64:$LHS, V64:$RHS)),
4199 (!cast<Instruction>(NAME#"v8i8") V64:$LHS, V64:$RHS)>;
4200
4201 def : Pat<(v8i16 (OpNode V128:$LHS, V128:$RHS)),
4202 (!cast<Instruction>(NAME#"v16i8") V128:$LHS, V128:$RHS)>;
4203 def : Pat<(v4i32 (OpNode V128:$LHS, V128:$RHS)),
4204 (!cast<Instruction>(NAME#"v16i8") V128:$LHS, V128:$RHS)>;
4205 def : Pat<(v2i64 (OpNode V128:$LHS, V128:$RHS)),
4206 (!cast<Instruction>(NAME#"v16i8") V128:$LHS, V128:$RHS)>;
4207}
4208
4209multiclass SIMDLogicalThreeVectorTied<bit U, bits<2> size,
4210 string asm, SDPatternOperator OpNode> {
4211 def v8i8 : BaseSIMDThreeSameVectorTied<0, U, size, 0b00011, V64,
4212 asm, ".8b",
4213 [(set (v8i8 V64:$dst),
4214 (OpNode (v8i8 V64:$Rd), (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
4215 def v16i8 : BaseSIMDThreeSameVectorTied<1, U, size, 0b00011, V128,
4216 asm, ".16b",
4217 [(set (v16i8 V128:$dst),
4218 (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn),
4219 (v16i8 V128:$Rm)))]>;
4220
4221 def : Pat<(v4i16 (OpNode (v4i16 V64:$LHS), (v4i16 V64:$MHS),
4222 (v4i16 V64:$RHS))),
4223 (!cast<Instruction>(NAME#"v8i8")
4224 V64:$LHS, V64:$MHS, V64:$RHS)>;
4225 def : Pat<(v2i32 (OpNode (v2i32 V64:$LHS), (v2i32 V64:$MHS),
4226 (v2i32 V64:$RHS))),
4227 (!cast<Instruction>(NAME#"v8i8")
4228 V64:$LHS, V64:$MHS, V64:$RHS)>;
4229 def : Pat<(v1i64 (OpNode (v1i64 V64:$LHS), (v1i64 V64:$MHS),
4230 (v1i64 V64:$RHS))),
4231 (!cast<Instruction>(NAME#"v8i8")
4232 V64:$LHS, V64:$MHS, V64:$RHS)>;
4233
4234 def : Pat<(v8i16 (OpNode (v8i16 V128:$LHS), (v8i16 V128:$MHS),
4235 (v8i16 V128:$RHS))),
4236 (!cast<Instruction>(NAME#"v16i8")
4237 V128:$LHS, V128:$MHS, V128:$RHS)>;
4238 def : Pat<(v4i32 (OpNode (v4i32 V128:$LHS), (v4i32 V128:$MHS),
4239 (v4i32 V128:$RHS))),
4240 (!cast<Instruction>(NAME#"v16i8")
4241 V128:$LHS, V128:$MHS, V128:$RHS)>;
4242 def : Pat<(v2i64 (OpNode (v2i64 V128:$LHS), (v2i64 V128:$MHS),
4243 (v2i64 V128:$RHS))),
4244 (!cast<Instruction>(NAME#"v16i8")
4245 V128:$LHS, V128:$MHS, V128:$RHS)>;
4246}
4247
4248
4249//----------------------------------------------------------------------------
4250// AdvSIMD two register vector instructions.
4251//----------------------------------------------------------------------------
4252
4253let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
4254class BaseSIMDTwoSameVector<bit Q, bit U, bits<2> size, bits<5> opcode,
4255 RegisterOperand regtype, string asm, string dstkind,
4256 string srckind, list<dag> pattern>
4257 : I<(outs regtype:$Rd), (ins regtype:$Rn), asm,
4258 "{\t$Rd" # dstkind # ", $Rn" # srckind #
4259 "|" # dstkind # "\t$Rd, $Rn}", "", pattern>,
4260 Sched<[WriteV]> {
4261 bits<5> Rd;
4262 bits<5> Rn;
4263 let Inst{31} = 0;
4264 let Inst{30} = Q;
4265 let Inst{29} = U;
4266 let Inst{28-24} = 0b01110;
4267 let Inst{23-22} = size;
4268 let Inst{21-17} = 0b10000;
4269 let Inst{16-12} = opcode;
4270 let Inst{11-10} = 0b10;
4271 let Inst{9-5} = Rn;
4272 let Inst{4-0} = Rd;
4273}
4274
4275let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
4276class BaseSIMDTwoSameVectorTied<bit Q, bit U, bits<2> size, bits<5> opcode,
4277 RegisterOperand regtype, string asm, string dstkind,
4278 string srckind, list<dag> pattern>
4279 : I<(outs regtype:$dst), (ins regtype:$Rd, regtype:$Rn), asm,
4280 "{\t$Rd" # dstkind # ", $Rn" # srckind #
4281 "|" # dstkind # "\t$Rd, $Rn}", "$Rd = $dst", pattern>,
4282 Sched<[WriteV]> {
4283 bits<5> Rd;
4284 bits<5> Rn;
4285 let Inst{31} = 0;
4286 let Inst{30} = Q;
4287 let Inst{29} = U;
4288 let Inst{28-24} = 0b01110;
4289 let Inst{23-22} = size;
4290 let Inst{21-17} = 0b10000;
4291 let Inst{16-12} = opcode;
4292 let Inst{11-10} = 0b10;
4293 let Inst{9-5} = Rn;
4294 let Inst{4-0} = Rd;
4295}
4296
4297// Supports B, H, and S element sizes.
4298multiclass SIMDTwoVectorBHS<bit U, bits<5> opc, string asm,
4299 SDPatternOperator OpNode> {
4300 def v8i8 : BaseSIMDTwoSameVector<0, U, 0b00, opc, V64,
4301 asm, ".8b", ".8b",
4302 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn)))]>;
4303 def v16i8 : BaseSIMDTwoSameVector<1, U, 0b00, opc, V128,
4304 asm, ".16b", ".16b",
4305 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn)))]>;
4306 def v4i16 : BaseSIMDTwoSameVector<0, U, 0b01, opc, V64,
4307 asm, ".4h", ".4h",
4308 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn)))]>;
4309 def v8i16 : BaseSIMDTwoSameVector<1, U, 0b01, opc, V128,
4310 asm, ".8h", ".8h",
4311 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn)))]>;
4312 def v2i32 : BaseSIMDTwoSameVector<0, U, 0b10, opc, V64,
4313 asm, ".2s", ".2s",
4314 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn)))]>;
4315 def v4i32 : BaseSIMDTwoSameVector<1, U, 0b10, opc, V128,
4316 asm, ".4s", ".4s",
4317 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4318}
4319
4320class BaseSIMDVectorLShiftLongBySize<bit Q, bits<2> size,
4321 RegisterOperand regtype, string asm, string dstkind,
4322 string srckind, string amount>
4323 : I<(outs V128:$Rd), (ins regtype:$Rn), asm,
4324 "{\t$Rd" # dstkind # ", $Rn" # srckind # ", #" # amount #
4325 "|" # dstkind # "\t$Rd, $Rn, #" # amount # "}", "", []>,
4326 Sched<[WriteV]> {
4327 bits<5> Rd;
4328 bits<5> Rn;
4329 let Inst{31} = 0;
4330 let Inst{30} = Q;
4331 let Inst{29-24} = 0b101110;
4332 let Inst{23-22} = size;
4333 let Inst{21-10} = 0b100001001110;
4334 let Inst{9-5} = Rn;
4335 let Inst{4-0} = Rd;
4336}
4337
4338multiclass SIMDVectorLShiftLongBySizeBHS {
4339 let neverHasSideEffects = 1 in {
4340 def v8i8 : BaseSIMDVectorLShiftLongBySize<0, 0b00, V64,
4341 "shll", ".8h", ".8b", "8">;
4342 def v16i8 : BaseSIMDVectorLShiftLongBySize<1, 0b00, V128,
4343 "shll2", ".8h", ".16b", "8">;
4344 def v4i16 : BaseSIMDVectorLShiftLongBySize<0, 0b01, V64,
4345 "shll", ".4s", ".4h", "16">;
4346 def v8i16 : BaseSIMDVectorLShiftLongBySize<1, 0b01, V128,
4347 "shll2", ".4s", ".8h", "16">;
4348 def v2i32 : BaseSIMDVectorLShiftLongBySize<0, 0b10, V64,
4349 "shll", ".2d", ".2s", "32">;
4350 def v4i32 : BaseSIMDVectorLShiftLongBySize<1, 0b10, V128,
4351 "shll2", ".2d", ".4s", "32">;
4352 }
4353}
4354
4355// Supports all element sizes.
4356multiclass SIMDLongTwoVector<bit U, bits<5> opc, string asm,
4357 SDPatternOperator OpNode> {
4358 def v8i8_v4i16 : BaseSIMDTwoSameVector<0, U, 0b00, opc, V64,
4359 asm, ".4h", ".8b",
4360 [(set (v4i16 V64:$Rd), (OpNode (v8i8 V64:$Rn)))]>;
4361 def v16i8_v8i16 : BaseSIMDTwoSameVector<1, U, 0b00, opc, V128,
4362 asm, ".8h", ".16b",
4363 [(set (v8i16 V128:$Rd), (OpNode (v16i8 V128:$Rn)))]>;
4364 def v4i16_v2i32 : BaseSIMDTwoSameVector<0, U, 0b01, opc, V64,
4365 asm, ".2s", ".4h",
4366 [(set (v2i32 V64:$Rd), (OpNode (v4i16 V64:$Rn)))]>;
4367 def v8i16_v4i32 : BaseSIMDTwoSameVector<1, U, 0b01, opc, V128,
4368 asm, ".4s", ".8h",
4369 [(set (v4i32 V128:$Rd), (OpNode (v8i16 V128:$Rn)))]>;
4370 def v2i32_v1i64 : BaseSIMDTwoSameVector<0, U, 0b10, opc, V64,
4371 asm, ".1d", ".2s",
4372 [(set (v1i64 V64:$Rd), (OpNode (v2i32 V64:$Rn)))]>;
4373 def v4i32_v2i64 : BaseSIMDTwoSameVector<1, U, 0b10, opc, V128,
4374 asm, ".2d", ".4s",
4375 [(set (v2i64 V128:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4376}
4377
4378multiclass SIMDLongTwoVectorTied<bit U, bits<5> opc, string asm,
4379 SDPatternOperator OpNode> {
4380 def v8i8_v4i16 : BaseSIMDTwoSameVectorTied<0, U, 0b00, opc, V64,
4381 asm, ".4h", ".8b",
4382 [(set (v4i16 V64:$dst), (OpNode (v4i16 V64:$Rd),
4383 (v8i8 V64:$Rn)))]>;
4384 def v16i8_v8i16 : BaseSIMDTwoSameVectorTied<1, U, 0b00, opc, V128,
4385 asm, ".8h", ".16b",
4386 [(set (v8i16 V128:$dst), (OpNode (v8i16 V128:$Rd),
4387 (v16i8 V128:$Rn)))]>;
4388 def v4i16_v2i32 : BaseSIMDTwoSameVectorTied<0, U, 0b01, opc, V64,
4389 asm, ".2s", ".4h",
4390 [(set (v2i32 V64:$dst), (OpNode (v2i32 V64:$Rd),
4391 (v4i16 V64:$Rn)))]>;
4392 def v8i16_v4i32 : BaseSIMDTwoSameVectorTied<1, U, 0b01, opc, V128,
4393 asm, ".4s", ".8h",
4394 [(set (v4i32 V128:$dst), (OpNode (v4i32 V128:$Rd),
4395 (v8i16 V128:$Rn)))]>;
4396 def v2i32_v1i64 : BaseSIMDTwoSameVectorTied<0, U, 0b10, opc, V64,
4397 asm, ".1d", ".2s",
4398 [(set (v1i64 V64:$dst), (OpNode (v1i64 V64:$Rd),
4399 (v2i32 V64:$Rn)))]>;
4400 def v4i32_v2i64 : BaseSIMDTwoSameVectorTied<1, U, 0b10, opc, V128,
4401 asm, ".2d", ".4s",
4402 [(set (v2i64 V128:$dst), (OpNode (v2i64 V128:$Rd),
4403 (v4i32 V128:$Rn)))]>;
4404}
4405
4406// Supports all element sizes, except 1xD.
4407multiclass SIMDTwoVectorBHSDTied<bit U, bits<5> opc, string asm,
4408 SDPatternOperator OpNode> {
4409 def v8i8 : BaseSIMDTwoSameVectorTied<0, U, 0b00, opc, V64,
4410 asm, ".8b", ".8b",
4411 [(set (v8i8 V64:$dst), (OpNode (v8i8 V64:$Rd), (v8i8 V64:$Rn)))]>;
4412 def v16i8 : BaseSIMDTwoSameVectorTied<1, U, 0b00, opc, V128,
4413 asm, ".16b", ".16b",
4414 [(set (v16i8 V128:$dst), (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn)))]>;
4415 def v4i16 : BaseSIMDTwoSameVectorTied<0, U, 0b01, opc, V64,
4416 asm, ".4h", ".4h",
4417 [(set (v4i16 V64:$dst), (OpNode (v4i16 V64:$Rd), (v4i16 V64:$Rn)))]>;
4418 def v8i16 : BaseSIMDTwoSameVectorTied<1, U, 0b01, opc, V128,
4419 asm, ".8h", ".8h",
4420 [(set (v8i16 V128:$dst), (OpNode (v8i16 V128:$Rd), (v8i16 V128:$Rn)))]>;
4421 def v2i32 : BaseSIMDTwoSameVectorTied<0, U, 0b10, opc, V64,
4422 asm, ".2s", ".2s",
4423 [(set (v2i32 V64:$dst), (OpNode (v2i32 V64:$Rd), (v2i32 V64:$Rn)))]>;
4424 def v4i32 : BaseSIMDTwoSameVectorTied<1, U, 0b10, opc, V128,
4425 asm, ".4s", ".4s",
4426 [(set (v4i32 V128:$dst), (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn)))]>;
4427 def v2i64 : BaseSIMDTwoSameVectorTied<1, U, 0b11, opc, V128,
4428 asm, ".2d", ".2d",
4429 [(set (v2i64 V128:$dst), (OpNode (v2i64 V128:$Rd), (v2i64 V128:$Rn)))]>;
4430}
4431
4432multiclass SIMDTwoVectorBHSD<bit U, bits<5> opc, string asm,
4433 SDPatternOperator OpNode = null_frag> {
4434 def v8i8 : BaseSIMDTwoSameVector<0, U, 0b00, opc, V64,
4435 asm, ".8b", ".8b",
4436 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn)))]>;
4437 def v16i8 : BaseSIMDTwoSameVector<1, U, 0b00, opc, V128,
4438 asm, ".16b", ".16b",
4439 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn)))]>;
4440 def v4i16 : BaseSIMDTwoSameVector<0, U, 0b01, opc, V64,
4441 asm, ".4h", ".4h",
4442 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn)))]>;
4443 def v8i16 : BaseSIMDTwoSameVector<1, U, 0b01, opc, V128,
4444 asm, ".8h", ".8h",
4445 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn)))]>;
4446 def v2i32 : BaseSIMDTwoSameVector<0, U, 0b10, opc, V64,
4447 asm, ".2s", ".2s",
4448 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn)))]>;
4449 def v4i32 : BaseSIMDTwoSameVector<1, U, 0b10, opc, V128,
4450 asm, ".4s", ".4s",
4451 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4452 def v2i64 : BaseSIMDTwoSameVector<1, U, 0b11, opc, V128,
4453 asm, ".2d", ".2d",
4454 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn)))]>;
4455}
4456
4457
4458// Supports only B element sizes.
4459multiclass SIMDTwoVectorB<bit U, bits<2> size, bits<5> opc, string asm,
4460 SDPatternOperator OpNode> {
4461 def v8i8 : BaseSIMDTwoSameVector<0, U, size, opc, V64,
4462 asm, ".8b", ".8b",
4463 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn)))]>;
4464 def v16i8 : BaseSIMDTwoSameVector<1, U, size, opc, V128,
4465 asm, ".16b", ".16b",
4466 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn)))]>;
4467
4468}
4469
4470// Supports only B and H element sizes.
4471multiclass SIMDTwoVectorBH<bit U, bits<5> opc, string asm,
4472 SDPatternOperator OpNode> {
4473 def v8i8 : BaseSIMDTwoSameVector<0, U, 0b00, opc, V64,
4474 asm, ".8b", ".8b",
4475 [(set (v8i8 V64:$Rd), (OpNode V64:$Rn))]>;
4476 def v16i8 : BaseSIMDTwoSameVector<1, U, 0b00, opc, V128,
4477 asm, ".16b", ".16b",
4478 [(set (v16i8 V128:$Rd), (OpNode V128:$Rn))]>;
4479 def v4i16 : BaseSIMDTwoSameVector<0, U, 0b01, opc, V64,
4480 asm, ".4h", ".4h",
4481 [(set (v4i16 V64:$Rd), (OpNode V64:$Rn))]>;
4482 def v8i16 : BaseSIMDTwoSameVector<1, U, 0b01, opc, V128,
4483 asm, ".8h", ".8h",
4484 [(set (v8i16 V128:$Rd), (OpNode V128:$Rn))]>;
4485}
4486
4487// Supports only S and D element sizes, uses high bit of the size field
4488// as an extra opcode bit.
4489multiclass SIMDTwoVectorFP<bit U, bit S, bits<5> opc, string asm,
4490 SDPatternOperator OpNode> {
4491 def v2f32 : BaseSIMDTwoSameVector<0, U, {S,0}, opc, V64,
4492 asm, ".2s", ".2s",
4493 [(set (v2f32 V64:$Rd), (OpNode (v2f32 V64:$Rn)))]>;
4494 def v4f32 : BaseSIMDTwoSameVector<1, U, {S,0}, opc, V128,
4495 asm, ".4s", ".4s",
4496 [(set (v4f32 V128:$Rd), (OpNode (v4f32 V128:$Rn)))]>;
4497 def v2f64 : BaseSIMDTwoSameVector<1, U, {S,1}, opc, V128,
4498 asm, ".2d", ".2d",
4499 [(set (v2f64 V128:$Rd), (OpNode (v2f64 V128:$Rn)))]>;
4500}
4501
4502// Supports only S element size.
4503multiclass SIMDTwoVectorS<bit U, bit S, bits<5> opc, string asm,
4504 SDPatternOperator OpNode> {
4505 def v2i32 : BaseSIMDTwoSameVector<0, U, {S,0}, opc, V64,
4506 asm, ".2s", ".2s",
4507 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn)))]>;
4508 def v4i32 : BaseSIMDTwoSameVector<1, U, {S,0}, opc, V128,
4509 asm, ".4s", ".4s",
4510 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4511}
4512
4513
4514multiclass SIMDTwoVectorFPToInt<bit U, bit S, bits<5> opc, string asm,
4515 SDPatternOperator OpNode> {
4516 def v2f32 : BaseSIMDTwoSameVector<0, U, {S,0}, opc, V64,
4517 asm, ".2s", ".2s",
4518 [(set (v2i32 V64:$Rd), (OpNode (v2f32 V64:$Rn)))]>;
4519 def v4f32 : BaseSIMDTwoSameVector<1, U, {S,0}, opc, V128,
4520 asm, ".4s", ".4s",
4521 [(set (v4i32 V128:$Rd), (OpNode (v4f32 V128:$Rn)))]>;
4522 def v2f64 : BaseSIMDTwoSameVector<1, U, {S,1}, opc, V128,
4523 asm, ".2d", ".2d",
4524 [(set (v2i64 V128:$Rd), (OpNode (v2f64 V128:$Rn)))]>;
4525}
4526
4527multiclass SIMDTwoVectorIntToFP<bit U, bit S, bits<5> opc, string asm,
4528 SDPatternOperator OpNode> {
4529 def v2f32 : BaseSIMDTwoSameVector<0, U, {S,0}, opc, V64,
4530 asm, ".2s", ".2s",
4531 [(set (v2f32 V64:$Rd), (OpNode (v2i32 V64:$Rn)))]>;
4532 def v4f32 : BaseSIMDTwoSameVector<1, U, {S,0}, opc, V128,
4533 asm, ".4s", ".4s",
4534 [(set (v4f32 V128:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4535 def v2f64 : BaseSIMDTwoSameVector<1, U, {S,1}, opc, V128,
4536 asm, ".2d", ".2d",
4537 [(set (v2f64 V128:$Rd), (OpNode (v2i64 V128:$Rn)))]>;
4538}
4539
4540
4541class BaseSIMDMixedTwoVector<bit Q, bit U, bits<2> size, bits<5> opcode,
4542 RegisterOperand inreg, RegisterOperand outreg,
4543 string asm, string outkind, string inkind,
4544 list<dag> pattern>
4545 : I<(outs outreg:$Rd), (ins inreg:$Rn), asm,
4546 "{\t$Rd" # outkind # ", $Rn" # inkind #
4547 "|" # outkind # "\t$Rd, $Rn}", "", pattern>,
4548 Sched<[WriteV]> {
4549 bits<5> Rd;
4550 bits<5> Rn;
4551 let Inst{31} = 0;
4552 let Inst{30} = Q;
4553 let Inst{29} = U;
4554 let Inst{28-24} = 0b01110;
4555 let Inst{23-22} = size;
4556 let Inst{21-17} = 0b10000;
4557 let Inst{16-12} = opcode;
4558 let Inst{11-10} = 0b10;
4559 let Inst{9-5} = Rn;
4560 let Inst{4-0} = Rd;
4561}
4562
4563class BaseSIMDMixedTwoVectorTied<bit Q, bit U, bits<2> size, bits<5> opcode,
4564 RegisterOperand inreg, RegisterOperand outreg,
4565 string asm, string outkind, string inkind,
4566 list<dag> pattern>
4567 : I<(outs outreg:$dst), (ins outreg:$Rd, inreg:$Rn), asm,
4568 "{\t$Rd" # outkind # ", $Rn" # inkind #
4569 "|" # outkind # "\t$Rd, $Rn}", "$Rd = $dst", pattern>,
4570 Sched<[WriteV]> {
4571 bits<5> Rd;
4572 bits<5> Rn;
4573 let Inst{31} = 0;
4574 let Inst{30} = Q;
4575 let Inst{29} = U;
4576 let Inst{28-24} = 0b01110;
4577 let Inst{23-22} = size;
4578 let Inst{21-17} = 0b10000;
4579 let Inst{16-12} = opcode;
4580 let Inst{11-10} = 0b10;
4581 let Inst{9-5} = Rn;
4582 let Inst{4-0} = Rd;
4583}
4584
4585multiclass SIMDMixedTwoVector<bit U, bits<5> opc, string asm,
4586 SDPatternOperator OpNode> {
4587 def v8i8 : BaseSIMDMixedTwoVector<0, U, 0b00, opc, V128, V64,
4588 asm, ".8b", ".8h",
4589 [(set (v8i8 V64:$Rd), (OpNode (v8i16 V128:$Rn)))]>;
4590 def v16i8 : BaseSIMDMixedTwoVectorTied<1, U, 0b00, opc, V128, V128,
4591 asm#"2", ".16b", ".8h", []>;
4592 def v4i16 : BaseSIMDMixedTwoVector<0, U, 0b01, opc, V128, V64,
4593 asm, ".4h", ".4s",
4594 [(set (v4i16 V64:$Rd), (OpNode (v4i32 V128:$Rn)))]>;
4595 def v8i16 : BaseSIMDMixedTwoVectorTied<1, U, 0b01, opc, V128, V128,
4596 asm#"2", ".8h", ".4s", []>;
4597 def v2i32 : BaseSIMDMixedTwoVector<0, U, 0b10, opc, V128, V64,
4598 asm, ".2s", ".2d",
4599 [(set (v2i32 V64:$Rd), (OpNode (v2i64 V128:$Rn)))]>;
4600 def v4i32 : BaseSIMDMixedTwoVectorTied<1, U, 0b10, opc, V128, V128,
4601 asm#"2", ".4s", ".2d", []>;
4602
4603 def : Pat<(concat_vectors (v8i8 V64:$Rd), (OpNode (v8i16 V128:$Rn))),
4604 (!cast<Instruction>(NAME # "v16i8")
4605 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub), V128:$Rn)>;
4606 def : Pat<(concat_vectors (v4i16 V64:$Rd), (OpNode (v4i32 V128:$Rn))),
4607 (!cast<Instruction>(NAME # "v8i16")
4608 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub), V128:$Rn)>;
4609 def : Pat<(concat_vectors (v2i32 V64:$Rd), (OpNode (v2i64 V128:$Rn))),
4610 (!cast<Instruction>(NAME # "v4i32")
4611 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub), V128:$Rn)>;
4612}
4613
4614class BaseSIMDCmpTwoVector<bit Q, bit U, bits<2> size, bits<5> opcode,
4615 RegisterOperand regtype,
4616 string asm, string kind, string zero,
4617 ValueType dty, ValueType sty, SDNode OpNode>
4618 : I<(outs regtype:$Rd), (ins regtype:$Rn), asm,
4619 "{\t$Rd" # kind # ", $Rn" # kind # ", #" # zero #
4620 "|" # kind # "\t$Rd, $Rn, #" # zero # "}", "",
4621 [(set (dty regtype:$Rd), (OpNode (sty regtype:$Rn)))]>,
4622 Sched<[WriteV]> {
4623 bits<5> Rd;
4624 bits<5> Rn;
4625 let Inst{31} = 0;
4626 let Inst{30} = Q;
4627 let Inst{29} = U;
4628 let Inst{28-24} = 0b01110;
4629 let Inst{23-22} = size;
4630 let Inst{21-17} = 0b10000;
4631 let Inst{16-12} = opcode;
4632 let Inst{11-10} = 0b10;
4633 let Inst{9-5} = Rn;
4634 let Inst{4-0} = Rd;
4635}
4636
4637// Comparisons support all element sizes, except 1xD.
4638multiclass SIMDCmpTwoVector<bit U, bits<5> opc, string asm,
4639 SDNode OpNode> {
4640 def v8i8rz : BaseSIMDCmpTwoVector<0, U, 0b00, opc, V64,
4641 asm, ".8b", "0",
4642 v8i8, v8i8, OpNode>;
4643 def v16i8rz : BaseSIMDCmpTwoVector<1, U, 0b00, opc, V128,
4644 asm, ".16b", "0",
4645 v16i8, v16i8, OpNode>;
4646 def v4i16rz : BaseSIMDCmpTwoVector<0, U, 0b01, opc, V64,
4647 asm, ".4h", "0",
4648 v4i16, v4i16, OpNode>;
4649 def v8i16rz : BaseSIMDCmpTwoVector<1, U, 0b01, opc, V128,
4650 asm, ".8h", "0",
4651 v8i16, v8i16, OpNode>;
4652 def v2i32rz : BaseSIMDCmpTwoVector<0, U, 0b10, opc, V64,
4653 asm, ".2s", "0",
4654 v2i32, v2i32, OpNode>;
4655 def v4i32rz : BaseSIMDCmpTwoVector<1, U, 0b10, opc, V128,
4656 asm, ".4s", "0",
4657 v4i32, v4i32, OpNode>;
4658 def v2i64rz : BaseSIMDCmpTwoVector<1, U, 0b11, opc, V128,
4659 asm, ".2d", "0",
4660 v2i64, v2i64, OpNode>;
4661}
4662
4663// FP Comparisons support only S and D element sizes.
4664multiclass SIMDFPCmpTwoVector<bit U, bit S, bits<5> opc,
4665 string asm, SDNode OpNode> {
4666
4667 def v2i32rz : BaseSIMDCmpTwoVector<0, U, {S,0}, opc, V64,
4668 asm, ".2s", "0.0",
4669 v2i32, v2f32, OpNode>;
4670 def v4i32rz : BaseSIMDCmpTwoVector<1, U, {S,0}, opc, V128,
4671 asm, ".4s", "0.0",
4672 v4i32, v4f32, OpNode>;
4673 def v2i64rz : BaseSIMDCmpTwoVector<1, U, {S,1}, opc, V128,
4674 asm, ".2d", "0.0",
4675 v2i64, v2f64, OpNode>;
4676
4677 def : InstAlias<asm # " $Vd.2s, $Vn.2s, #0",
4678 (!cast<Instruction>(NAME # v2i32rz) V64:$Vd, V64:$Vn), 0>;
4679 def : InstAlias<asm # " $Vd.4s, $Vn.4s, #0",
4680 (!cast<Instruction>(NAME # v4i32rz) V128:$Vd, V128:$Vn), 0>;
4681 def : InstAlias<asm # " $Vd.2d, $Vn.2d, #0",
4682 (!cast<Instruction>(NAME # v2i64rz) V128:$Vd, V128:$Vn), 0>;
4683 def : InstAlias<asm # ".2s $Vd, $Vn, #0",
4684 (!cast<Instruction>(NAME # v2i32rz) V64:$Vd, V64:$Vn), 0>;
4685 def : InstAlias<asm # ".4s $Vd, $Vn, #0",
4686 (!cast<Instruction>(NAME # v4i32rz) V128:$Vd, V128:$Vn), 0>;
4687 def : InstAlias<asm # ".2d $Vd, $Vn, #0",
4688 (!cast<Instruction>(NAME # v2i64rz) V128:$Vd, V128:$Vn), 0>;
4689}
4690
4691let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
4692class BaseSIMDFPCvtTwoVector<bit Q, bit U, bits<2> size, bits<5> opcode,
4693 RegisterOperand outtype, RegisterOperand intype,
4694 string asm, string VdTy, string VnTy,
4695 list<dag> pattern>
4696 : I<(outs outtype:$Rd), (ins intype:$Rn), asm,
4697 !strconcat("\t$Rd", VdTy, ", $Rn", VnTy), "", pattern>,
4698 Sched<[WriteV]> {
4699 bits<5> Rd;
4700 bits<5> Rn;
4701 let Inst{31} = 0;
4702 let Inst{30} = Q;
4703 let Inst{29} = U;
4704 let Inst{28-24} = 0b01110;
4705 let Inst{23-22} = size;
4706 let Inst{21-17} = 0b10000;
4707 let Inst{16-12} = opcode;
4708 let Inst{11-10} = 0b10;
4709 let Inst{9-5} = Rn;
4710 let Inst{4-0} = Rd;
4711}
4712
4713class BaseSIMDFPCvtTwoVectorTied<bit Q, bit U, bits<2> size, bits<5> opcode,
4714 RegisterOperand outtype, RegisterOperand intype,
4715 string asm, string VdTy, string VnTy,
4716 list<dag> pattern>
4717 : I<(outs outtype:$dst), (ins outtype:$Rd, intype:$Rn), asm,
4718 !strconcat("\t$Rd", VdTy, ", $Rn", VnTy), "$Rd = $dst", pattern>,
4719 Sched<[WriteV]> {
4720 bits<5> Rd;
4721 bits<5> Rn;
4722 let Inst{31} = 0;
4723 let Inst{30} = Q;
4724 let Inst{29} = U;
4725 let Inst{28-24} = 0b01110;
4726 let Inst{23-22} = size;
4727 let Inst{21-17} = 0b10000;
4728 let Inst{16-12} = opcode;
4729 let Inst{11-10} = 0b10;
4730 let Inst{9-5} = Rn;
4731 let Inst{4-0} = Rd;
4732}
4733
4734multiclass SIMDFPWidenTwoVector<bit U, bit S, bits<5> opc, string asm> {
4735 def v4i16 : BaseSIMDFPCvtTwoVector<0, U, {S,0}, opc, V128, V64,
4736 asm, ".4s", ".4h", []>;
4737 def v8i16 : BaseSIMDFPCvtTwoVector<1, U, {S,0}, opc, V128, V128,
4738 asm#"2", ".4s", ".8h", []>;
4739 def v2i32 : BaseSIMDFPCvtTwoVector<0, U, {S,1}, opc, V128, V64,
4740 asm, ".2d", ".2s", []>;
4741 def v4i32 : BaseSIMDFPCvtTwoVector<1, U, {S,1}, opc, V128, V128,
4742 asm#"2", ".2d", ".4s", []>;
4743}
4744
4745multiclass SIMDFPNarrowTwoVector<bit U, bit S, bits<5> opc, string asm> {
4746 def v4i16 : BaseSIMDFPCvtTwoVector<0, U, {S,0}, opc, V64, V128,
4747 asm, ".4h", ".4s", []>;
4748 def v8i16 : BaseSIMDFPCvtTwoVectorTied<1, U, {S,0}, opc, V128, V128,
4749 asm#"2", ".8h", ".4s", []>;
4750 def v2i32 : BaseSIMDFPCvtTwoVector<0, U, {S,1}, opc, V64, V128,
4751 asm, ".2s", ".2d", []>;
4752 def v4i32 : BaseSIMDFPCvtTwoVectorTied<1, U, {S,1}, opc, V128, V128,
4753 asm#"2", ".4s", ".2d", []>;
4754}
4755
4756multiclass SIMDFPInexactCvtTwoVector<bit U, bit S, bits<5> opc, string asm,
4757 Intrinsic OpNode> {
4758 def v2f32 : BaseSIMDFPCvtTwoVector<0, U, {S,1}, opc, V64, V128,
4759 asm, ".2s", ".2d",
4760 [(set (v2f32 V64:$Rd), (OpNode (v2f64 V128:$Rn)))]>;
4761 def v4f32 : BaseSIMDFPCvtTwoVectorTied<1, U, {S,1}, opc, V128, V128,
4762 asm#"2", ".4s", ".2d", []>;
4763
4764 def : Pat<(concat_vectors (v2f32 V64:$Rd), (OpNode (v2f64 V128:$Rn))),
4765 (!cast<Instruction>(NAME # "v4f32")
4766 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub), V128:$Rn)>;
4767}
4768
4769//----------------------------------------------------------------------------
4770// AdvSIMD three register different-size vector instructions.
4771//----------------------------------------------------------------------------
4772
4773let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
4774class BaseSIMDDifferentThreeVector<bit U, bits<3> size, bits<4> opcode,
4775 RegisterOperand outtype, RegisterOperand intype1,
4776 RegisterOperand intype2, string asm,
4777 string outkind, string inkind1, string inkind2,
4778 list<dag> pattern>
4779 : I<(outs outtype:$Rd), (ins intype1:$Rn, intype2:$Rm), asm,
4780 "{\t$Rd" # outkind # ", $Rn" # inkind1 # ", $Rm" # inkind2 #
4781 "|" # outkind # "\t$Rd, $Rn, $Rm}", "", pattern>,
4782 Sched<[WriteV]> {
4783 bits<5> Rd;
4784 bits<5> Rn;
4785 bits<5> Rm;
4786 let Inst{31} = 0;
4787 let Inst{30} = size{0};
4788 let Inst{29} = U;
4789 let Inst{28-24} = 0b01110;
4790 let Inst{23-22} = size{2-1};
4791 let Inst{21} = 1;
4792 let Inst{20-16} = Rm;
4793 let Inst{15-12} = opcode;
4794 let Inst{11-10} = 0b00;
4795 let Inst{9-5} = Rn;
4796 let Inst{4-0} = Rd;
4797}
4798
4799let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
4800class BaseSIMDDifferentThreeVectorTied<bit U, bits<3> size, bits<4> opcode,
4801 RegisterOperand outtype, RegisterOperand intype1,
4802 RegisterOperand intype2, string asm,
4803 string outkind, string inkind1, string inkind2,
4804 list<dag> pattern>
4805 : I<(outs outtype:$dst), (ins outtype:$Rd, intype1:$Rn, intype2:$Rm), asm,
4806 "{\t$Rd" # outkind # ", $Rn" # inkind1 # ", $Rm" # inkind2 #
4807 "|" # outkind # "\t$Rd, $Rn, $Rm}", "$Rd = $dst", pattern>,
4808 Sched<[WriteV]> {
4809 bits<5> Rd;
4810 bits<5> Rn;
4811 bits<5> Rm;
4812 let Inst{31} = 0;
4813 let Inst{30} = size{0};
4814 let Inst{29} = U;
4815 let Inst{28-24} = 0b01110;
4816 let Inst{23-22} = size{2-1};
4817 let Inst{21} = 1;
4818 let Inst{20-16} = Rm;
4819 let Inst{15-12} = opcode;
4820 let Inst{11-10} = 0b00;
4821 let Inst{9-5} = Rn;
4822 let Inst{4-0} = Rd;
4823}
4824
4825// FIXME: TableGen doesn't know how to deal with expanded types that also
4826// change the element count (in this case, placing the results in
4827// the high elements of the result register rather than the low
4828// elements). Until that's fixed, we can't code-gen those.
4829multiclass SIMDNarrowThreeVectorBHS<bit U, bits<4> opc, string asm,
4830 Intrinsic IntOp> {
4831 def v8i16_v8i8 : BaseSIMDDifferentThreeVector<U, 0b000, opc,
4832 V64, V128, V128,
4833 asm, ".8b", ".8h", ".8h",
4834 [(set (v8i8 V64:$Rd), (IntOp (v8i16 V128:$Rn), (v8i16 V128:$Rm)))]>;
4835 def v8i16_v16i8 : BaseSIMDDifferentThreeVectorTied<U, 0b001, opc,
4836 V128, V128, V128,
4837 asm#"2", ".16b", ".8h", ".8h",
4838 []>;
4839 def v4i32_v4i16 : BaseSIMDDifferentThreeVector<U, 0b010, opc,
4840 V64, V128, V128,
4841 asm, ".4h", ".4s", ".4s",
4842 [(set (v4i16 V64:$Rd), (IntOp (v4i32 V128:$Rn), (v4i32 V128:$Rm)))]>;
4843 def v4i32_v8i16 : BaseSIMDDifferentThreeVectorTied<U, 0b011, opc,
4844 V128, V128, V128,
4845 asm#"2", ".8h", ".4s", ".4s",
4846 []>;
4847 def v2i64_v2i32 : BaseSIMDDifferentThreeVector<U, 0b100, opc,
4848 V64, V128, V128,
4849 asm, ".2s", ".2d", ".2d",
4850 [(set (v2i32 V64:$Rd), (IntOp (v2i64 V128:$Rn), (v2i64 V128:$Rm)))]>;
4851 def v2i64_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b101, opc,
4852 V128, V128, V128,
4853 asm#"2", ".4s", ".2d", ".2d",
4854 []>;
4855
4856
4857 // Patterns for the '2' variants involve INSERT_SUBREG, which you can't put in
4858 // a version attached to an instruction.
4859 def : Pat<(concat_vectors (v8i8 V64:$Rd), (IntOp (v8i16 V128:$Rn),
4860 (v8i16 V128:$Rm))),
4861 (!cast<Instruction>(NAME # "v8i16_v16i8")
4862 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
4863 V128:$Rn, V128:$Rm)>;
4864 def : Pat<(concat_vectors (v4i16 V64:$Rd), (IntOp (v4i32 V128:$Rn),
4865 (v4i32 V128:$Rm))),
4866 (!cast<Instruction>(NAME # "v4i32_v8i16")
4867 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
4868 V128:$Rn, V128:$Rm)>;
4869 def : Pat<(concat_vectors (v2i32 V64:$Rd), (IntOp (v2i64 V128:$Rn),
4870 (v2i64 V128:$Rm))),
4871 (!cast<Instruction>(NAME # "v2i64_v4i32")
4872 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
4873 V128:$Rn, V128:$Rm)>;
4874}
4875
4876multiclass SIMDDifferentThreeVectorBD<bit U, bits<4> opc, string asm,
4877 Intrinsic IntOp> {
4878 def v8i8 : BaseSIMDDifferentThreeVector<U, 0b000, opc,
4879 V128, V64, V64,
4880 asm, ".8h", ".8b", ".8b",
4881 [(set (v8i16 V128:$Rd), (IntOp (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
4882 def v16i8 : BaseSIMDDifferentThreeVector<U, 0b001, opc,
4883 V128, V128, V128,
4884 asm#"2", ".8h", ".16b", ".16b", []>;
4885 let Predicates = [HasCrypto] in {
4886 def v1i64 : BaseSIMDDifferentThreeVector<U, 0b110, opc,
4887 V128, V64, V64,
4888 asm, ".1q", ".1d", ".1d", []>;
4889 def v2i64 : BaseSIMDDifferentThreeVector<U, 0b111, opc,
4890 V128, V128, V128,
4891 asm#"2", ".1q", ".2d", ".2d", []>;
4892 }
4893
4894 def : Pat<(v8i16 (IntOp (v8i8 (extract_high_v16i8 V128:$Rn)),
4895 (v8i8 (extract_high_v16i8 V128:$Rm)))),
4896 (!cast<Instruction>(NAME#"v16i8") V128:$Rn, V128:$Rm)>;
4897}
4898
4899multiclass SIMDLongThreeVectorHS<bit U, bits<4> opc, string asm,
4900 SDPatternOperator OpNode> {
4901 def v4i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b010, opc,
4902 V128, V64, V64,
4903 asm, ".4s", ".4h", ".4h",
4904 [(set (v4i32 V128:$Rd), (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
4905 def v8i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b011, opc,
4906 V128, V128, V128,
4907 asm#"2", ".4s", ".8h", ".8h",
4908 [(set (v4i32 V128:$Rd), (OpNode (extract_high_v8i16 V128:$Rn),
4909 (extract_high_v8i16 V128:$Rm)))]>;
4910 def v2i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b100, opc,
4911 V128, V64, V64,
4912 asm, ".2d", ".2s", ".2s",
4913 [(set (v2i64 V128:$Rd), (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
4914 def v4i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b101, opc,
4915 V128, V128, V128,
4916 asm#"2", ".2d", ".4s", ".4s",
4917 [(set (v2i64 V128:$Rd), (OpNode (extract_high_v4i32 V128:$Rn),
4918 (extract_high_v4i32 V128:$Rm)))]>;
4919}
4920
4921multiclass SIMDLongThreeVectorBHSabdl<bit U, bits<4> opc, string asm,
4922 SDPatternOperator OpNode = null_frag> {
4923 def v8i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b000, opc,
4924 V128, V64, V64,
4925 asm, ".8h", ".8b", ".8b",
4926 [(set (v8i16 V128:$Rd),
4927 (zext (v8i8 (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm)))))]>;
4928 def v16i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b001, opc,
4929 V128, V128, V128,
4930 asm#"2", ".8h", ".16b", ".16b",
4931 [(set (v8i16 V128:$Rd),
4932 (zext (v8i8 (OpNode (extract_high_v16i8 V128:$Rn),
4933 (extract_high_v16i8 V128:$Rm)))))]>;
4934 def v4i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b010, opc,
4935 V128, V64, V64,
4936 asm, ".4s", ".4h", ".4h",
4937 [(set (v4i32 V128:$Rd),
4938 (zext (v4i16 (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm)))))]>;
4939 def v8i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b011, opc,
4940 V128, V128, V128,
4941 asm#"2", ".4s", ".8h", ".8h",
4942 [(set (v4i32 V128:$Rd),
4943 (zext (v4i16 (OpNode (extract_high_v8i16 V128:$Rn),
4944 (extract_high_v8i16 V128:$Rm)))))]>;
4945 def v2i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b100, opc,
4946 V128, V64, V64,
4947 asm, ".2d", ".2s", ".2s",
4948 [(set (v2i64 V128:$Rd),
4949 (zext (v2i32 (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm)))))]>;
4950 def v4i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b101, opc,
4951 V128, V128, V128,
4952 asm#"2", ".2d", ".4s", ".4s",
4953 [(set (v2i64 V128:$Rd),
4954 (zext (v2i32 (OpNode (extract_high_v4i32 V128:$Rn),
4955 (extract_high_v4i32 V128:$Rm)))))]>;
4956}
4957
4958multiclass SIMDLongThreeVectorTiedBHSabal<bit U, bits<4> opc,
4959 string asm,
4960 SDPatternOperator OpNode> {
4961 def v8i8_v8i16 : BaseSIMDDifferentThreeVectorTied<U, 0b000, opc,
4962 V128, V64, V64,
4963 asm, ".8h", ".8b", ".8b",
4964 [(set (v8i16 V128:$dst),
4965 (add (v8i16 V128:$Rd),
4966 (zext (v8i8 (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm))))))]>;
4967 def v16i8_v8i16 : BaseSIMDDifferentThreeVectorTied<U, 0b001, opc,
4968 V128, V128, V128,
4969 asm#"2", ".8h", ".16b", ".16b",
4970 [(set (v8i16 V128:$dst),
4971 (add (v8i16 V128:$Rd),
4972 (zext (v8i8 (OpNode (extract_high_v16i8 V128:$Rn),
4973 (extract_high_v16i8 V128:$Rm))))))]>;
4974 def v4i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b010, opc,
4975 V128, V64, V64,
4976 asm, ".4s", ".4h", ".4h",
4977 [(set (v4i32 V128:$dst),
4978 (add (v4i32 V128:$Rd),
4979 (zext (v4i16 (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm))))))]>;
4980 def v8i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b011, opc,
4981 V128, V128, V128,
4982 asm#"2", ".4s", ".8h", ".8h",
4983 [(set (v4i32 V128:$dst),
4984 (add (v4i32 V128:$Rd),
4985 (zext (v4i16 (OpNode (extract_high_v8i16 V128:$Rn),
4986 (extract_high_v8i16 V128:$Rm))))))]>;
4987 def v2i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b100, opc,
4988 V128, V64, V64,
4989 asm, ".2d", ".2s", ".2s",
4990 [(set (v2i64 V128:$dst),
4991 (add (v2i64 V128:$Rd),
4992 (zext (v2i32 (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm))))))]>;
4993 def v4i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b101, opc,
4994 V128, V128, V128,
4995 asm#"2", ".2d", ".4s", ".4s",
4996 [(set (v2i64 V128:$dst),
4997 (add (v2i64 V128:$Rd),
4998 (zext (v2i32 (OpNode (extract_high_v4i32 V128:$Rn),
4999 (extract_high_v4i32 V128:$Rm))))))]>;
5000}
5001
5002multiclass SIMDLongThreeVectorBHS<bit U, bits<4> opc, string asm,
5003 SDPatternOperator OpNode = null_frag> {
5004 def v8i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b000, opc,
5005 V128, V64, V64,
5006 asm, ".8h", ".8b", ".8b",
5007 [(set (v8i16 V128:$Rd), (OpNode (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
5008 def v16i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b001, opc,
5009 V128, V128, V128,
5010 asm#"2", ".8h", ".16b", ".16b",
5011 [(set (v8i16 V128:$Rd), (OpNode (extract_high_v16i8 V128:$Rn),
5012 (extract_high_v16i8 V128:$Rm)))]>;
5013 def v4i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b010, opc,
5014 V128, V64, V64,
5015 asm, ".4s", ".4h", ".4h",
5016 [(set (v4i32 V128:$Rd), (OpNode (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
5017 def v8i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b011, opc,
5018 V128, V128, V128,
5019 asm#"2", ".4s", ".8h", ".8h",
5020 [(set (v4i32 V128:$Rd), (OpNode (extract_high_v8i16 V128:$Rn),
5021 (extract_high_v8i16 V128:$Rm)))]>;
5022 def v2i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b100, opc,
5023 V128, V64, V64,
5024 asm, ".2d", ".2s", ".2s",
5025 [(set (v2i64 V128:$Rd), (OpNode (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
5026 def v4i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b101, opc,
5027 V128, V128, V128,
5028 asm#"2", ".2d", ".4s", ".4s",
5029 [(set (v2i64 V128:$Rd), (OpNode (extract_high_v4i32 V128:$Rn),
5030 (extract_high_v4i32 V128:$Rm)))]>;
5031}
5032
5033multiclass SIMDLongThreeVectorTiedBHS<bit U, bits<4> opc,
5034 string asm,
5035 SDPatternOperator OpNode> {
5036 def v8i8_v8i16 : BaseSIMDDifferentThreeVectorTied<U, 0b000, opc,
5037 V128, V64, V64,
5038 asm, ".8h", ".8b", ".8b",
5039 [(set (v8i16 V128:$dst),
5040 (OpNode (v8i16 V128:$Rd), (v8i8 V64:$Rn), (v8i8 V64:$Rm)))]>;
5041 def v16i8_v8i16 : BaseSIMDDifferentThreeVectorTied<U, 0b001, opc,
5042 V128, V128, V128,
5043 asm#"2", ".8h", ".16b", ".16b",
5044 [(set (v8i16 V128:$dst),
5045 (OpNode (v8i16 V128:$Rd),
5046 (extract_high_v16i8 V128:$Rn),
5047 (extract_high_v16i8 V128:$Rm)))]>;
5048 def v4i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b010, opc,
5049 V128, V64, V64,
5050 asm, ".4s", ".4h", ".4h",
5051 [(set (v4i32 V128:$dst),
5052 (OpNode (v4i32 V128:$Rd), (v4i16 V64:$Rn), (v4i16 V64:$Rm)))]>;
5053 def v8i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b011, opc,
5054 V128, V128, V128,
5055 asm#"2", ".4s", ".8h", ".8h",
5056 [(set (v4i32 V128:$dst),
5057 (OpNode (v4i32 V128:$Rd),
5058 (extract_high_v8i16 V128:$Rn),
5059 (extract_high_v8i16 V128:$Rm)))]>;
5060 def v2i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b100, opc,
5061 V128, V64, V64,
5062 asm, ".2d", ".2s", ".2s",
5063 [(set (v2i64 V128:$dst),
5064 (OpNode (v2i64 V128:$Rd), (v2i32 V64:$Rn), (v2i32 V64:$Rm)))]>;
5065 def v4i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b101, opc,
5066 V128, V128, V128,
5067 asm#"2", ".2d", ".4s", ".4s",
5068 [(set (v2i64 V128:$dst),
5069 (OpNode (v2i64 V128:$Rd),
5070 (extract_high_v4i32 V128:$Rn),
5071 (extract_high_v4i32 V128:$Rm)))]>;
5072}
5073
5074multiclass SIMDLongThreeVectorSQDMLXTiedHS<bit U, bits<4> opc, string asm,
5075 SDPatternOperator Accum> {
5076 def v4i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b010, opc,
5077 V128, V64, V64,
5078 asm, ".4s", ".4h", ".4h",
5079 [(set (v4i32 V128:$dst),
5080 (Accum (v4i32 V128:$Rd),
5081 (v4i32 (int_aarch64_neon_sqdmull (v4i16 V64:$Rn),
5082 (v4i16 V64:$Rm)))))]>;
5083 def v8i16_v4i32 : BaseSIMDDifferentThreeVectorTied<U, 0b011, opc,
5084 V128, V128, V128,
5085 asm#"2", ".4s", ".8h", ".8h",
5086 [(set (v4i32 V128:$dst),
5087 (Accum (v4i32 V128:$Rd),
5088 (v4i32 (int_aarch64_neon_sqdmull (extract_high_v8i16 V128:$Rn),
5089 (extract_high_v8i16 V128:$Rm)))))]>;
5090 def v2i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b100, opc,
5091 V128, V64, V64,
5092 asm, ".2d", ".2s", ".2s",
5093 [(set (v2i64 V128:$dst),
5094 (Accum (v2i64 V128:$Rd),
5095 (v2i64 (int_aarch64_neon_sqdmull (v2i32 V64:$Rn),
5096 (v2i32 V64:$Rm)))))]>;
5097 def v4i32_v2i64 : BaseSIMDDifferentThreeVectorTied<U, 0b101, opc,
5098 V128, V128, V128,
5099 asm#"2", ".2d", ".4s", ".4s",
5100 [(set (v2i64 V128:$dst),
5101 (Accum (v2i64 V128:$Rd),
5102 (v2i64 (int_aarch64_neon_sqdmull (extract_high_v4i32 V128:$Rn),
5103 (extract_high_v4i32 V128:$Rm)))))]>;
5104}
5105
5106multiclass SIMDWideThreeVectorBHS<bit U, bits<4> opc, string asm,
5107 SDPatternOperator OpNode> {
5108 def v8i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b000, opc,
5109 V128, V128, V64,
5110 asm, ".8h", ".8h", ".8b",
5111 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn), (v8i8 V64:$Rm)))]>;
5112 def v16i8_v8i16 : BaseSIMDDifferentThreeVector<U, 0b001, opc,
5113 V128, V128, V128,
5114 asm#"2", ".8h", ".8h", ".16b",
5115 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn),
5116 (extract_high_v16i8 V128:$Rm)))]>;
5117 def v4i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b010, opc,
5118 V128, V128, V64,
5119 asm, ".4s", ".4s", ".4h",
5120 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn), (v4i16 V64:$Rm)))]>;
5121 def v8i16_v4i32 : BaseSIMDDifferentThreeVector<U, 0b011, opc,
5122 V128, V128, V128,
5123 asm#"2", ".4s", ".4s", ".8h",
5124 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn),
5125 (extract_high_v8i16 V128:$Rm)))]>;
5126 def v2i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b100, opc,
5127 V128, V128, V64,
5128 asm, ".2d", ".2d", ".2s",
5129 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn), (v2i32 V64:$Rm)))]>;
5130 def v4i32_v2i64 : BaseSIMDDifferentThreeVector<U, 0b101, opc,
5131 V128, V128, V128,
5132 asm#"2", ".2d", ".2d", ".4s",
5133 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn),
5134 (extract_high_v4i32 V128:$Rm)))]>;
5135}
5136
5137//----------------------------------------------------------------------------
5138// AdvSIMD bitwise extract from vector
5139//----------------------------------------------------------------------------
5140
5141class BaseSIMDBitwiseExtract<bit size, RegisterOperand regtype, ValueType vty,
5142 string asm, string kind>
5143 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm, i32imm:$imm), asm,
5144 "{\t$Rd" # kind # ", $Rn" # kind # ", $Rm" # kind # ", $imm" #
5145 "|" # kind # "\t$Rd, $Rn, $Rm, $imm}", "",
5146 [(set (vty regtype:$Rd),
5147 (AArch64ext regtype:$Rn, regtype:$Rm, (i32 imm:$imm)))]>,
5148 Sched<[WriteV]> {
5149 bits<5> Rd;
5150 bits<5> Rn;
5151 bits<5> Rm;
5152 bits<4> imm;
5153 let Inst{31} = 0;
5154 let Inst{30} = size;
5155 let Inst{29-21} = 0b101110000;
5156 let Inst{20-16} = Rm;
5157 let Inst{15} = 0;
5158 let Inst{14-11} = imm;
5159 let Inst{10} = 0;
5160 let Inst{9-5} = Rn;
5161 let Inst{4-0} = Rd;
5162}
5163
5164
5165multiclass SIMDBitwiseExtract<string asm> {
5166 def v8i8 : BaseSIMDBitwiseExtract<0, V64, v8i8, asm, ".8b"> {
5167 let imm{3} = 0;
5168 }
5169 def v16i8 : BaseSIMDBitwiseExtract<1, V128, v16i8, asm, ".16b">;
5170}
5171
5172//----------------------------------------------------------------------------
5173// AdvSIMD zip vector
5174//----------------------------------------------------------------------------
5175
5176class BaseSIMDZipVector<bits<3> size, bits<3> opc, RegisterOperand regtype,
5177 string asm, string kind, SDNode OpNode, ValueType valty>
5178 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm), asm,
5179 "{\t$Rd" # kind # ", $Rn" # kind # ", $Rm" # kind #
5180 "|" # kind # "\t$Rd, $Rn, $Rm}", "",
5181 [(set (valty regtype:$Rd), (OpNode regtype:$Rn, regtype:$Rm))]>,
5182 Sched<[WriteV]> {
5183 bits<5> Rd;
5184 bits<5> Rn;
5185 bits<5> Rm;
5186 let Inst{31} = 0;
5187 let Inst{30} = size{0};
5188 let Inst{29-24} = 0b001110;
5189 let Inst{23-22} = size{2-1};
5190 let Inst{21} = 0;
5191 let Inst{20-16} = Rm;
5192 let Inst{15} = 0;
5193 let Inst{14-12} = opc;
5194 let Inst{11-10} = 0b10;
5195 let Inst{9-5} = Rn;
5196 let Inst{4-0} = Rd;
5197}
5198
5199multiclass SIMDZipVector<bits<3>opc, string asm,
5200 SDNode OpNode> {
5201 def v8i8 : BaseSIMDZipVector<0b000, opc, V64,
5202 asm, ".8b", OpNode, v8i8>;
5203 def v16i8 : BaseSIMDZipVector<0b001, opc, V128,
5204 asm, ".16b", OpNode, v16i8>;
5205 def v4i16 : BaseSIMDZipVector<0b010, opc, V64,
5206 asm, ".4h", OpNode, v4i16>;
5207 def v8i16 : BaseSIMDZipVector<0b011, opc, V128,
5208 asm, ".8h", OpNode, v8i16>;
5209 def v2i32 : BaseSIMDZipVector<0b100, opc, V64,
5210 asm, ".2s", OpNode, v2i32>;
5211 def v4i32 : BaseSIMDZipVector<0b101, opc, V128,
5212 asm, ".4s", OpNode, v4i32>;
5213 def v2i64 : BaseSIMDZipVector<0b111, opc, V128,
5214 asm, ".2d", OpNode, v2i64>;
5215
5216 def : Pat<(v2f32 (OpNode V64:$Rn, V64:$Rm)),
5217 (!cast<Instruction>(NAME#"v2i32") V64:$Rn, V64:$Rm)>;
5218 def : Pat<(v4f32 (OpNode V128:$Rn, V128:$Rm)),
5219 (!cast<Instruction>(NAME#"v4i32") V128:$Rn, V128:$Rm)>;
5220 def : Pat<(v2f64 (OpNode V128:$Rn, V128:$Rm)),
5221 (!cast<Instruction>(NAME#"v2i64") V128:$Rn, V128:$Rm)>;
5222}
5223
5224//----------------------------------------------------------------------------
5225// AdvSIMD three register scalar instructions
5226//----------------------------------------------------------------------------
5227
5228let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
5229class BaseSIMDThreeScalar<bit U, bits<2> size, bits<5> opcode,
5230 RegisterClass regtype, string asm,
5231 list<dag> pattern>
5232 : I<(outs regtype:$Rd), (ins regtype:$Rn, regtype:$Rm), asm,
5233 "\t$Rd, $Rn, $Rm", "", pattern>,
5234 Sched<[WriteV]> {
5235 bits<5> Rd;
5236 bits<5> Rn;
5237 bits<5> Rm;
5238 let Inst{31-30} = 0b01;
5239 let Inst{29} = U;
5240 let Inst{28-24} = 0b11110;
5241 let Inst{23-22} = size;
5242 let Inst{21} = 1;
5243 let Inst{20-16} = Rm;
5244 let Inst{15-11} = opcode;
5245 let Inst{10} = 1;
5246 let Inst{9-5} = Rn;
5247 let Inst{4-0} = Rd;
5248}
5249
5250multiclass SIMDThreeScalarD<bit U, bits<5> opc, string asm,
5251 SDPatternOperator OpNode> {
5252 def v1i64 : BaseSIMDThreeScalar<U, 0b11, opc, FPR64, asm,
5253 [(set (v1i64 FPR64:$Rd), (OpNode (v1i64 FPR64:$Rn), (v1i64 FPR64:$Rm)))]>;
5254}
5255
5256multiclass SIMDThreeScalarBHSD<bit U, bits<5> opc, string asm,
5257 SDPatternOperator OpNode> {
5258 def v1i64 : BaseSIMDThreeScalar<U, 0b11, opc, FPR64, asm,
5259 [(set (v1i64 FPR64:$Rd), (OpNode (v1i64 FPR64:$Rn), (v1i64 FPR64:$Rm)))]>;
5260 def v1i32 : BaseSIMDThreeScalar<U, 0b10, opc, FPR32, asm, []>;
5261 def v1i16 : BaseSIMDThreeScalar<U, 0b01, opc, FPR16, asm, []>;
5262 def v1i8 : BaseSIMDThreeScalar<U, 0b00, opc, FPR8 , asm, []>;
5263
5264 def : Pat<(i64 (OpNode (i64 FPR64:$Rn), (i64 FPR64:$Rm))),
5265 (!cast<Instruction>(NAME#"v1i64") FPR64:$Rn, FPR64:$Rm)>;
5266 def : Pat<(i32 (OpNode (i32 FPR32:$Rn), (i32 FPR32:$Rm))),
5267 (!cast<Instruction>(NAME#"v1i32") FPR32:$Rn, FPR32:$Rm)>;
5268}
5269
5270multiclass SIMDThreeScalarHS<bit U, bits<5> opc, string asm,
5271 SDPatternOperator OpNode> {
5272 def v1i32 : BaseSIMDThreeScalar<U, 0b10, opc, FPR32, asm,
5273 [(set FPR32:$Rd, (OpNode FPR32:$Rn, FPR32:$Rm))]>;
5274 def v1i16 : BaseSIMDThreeScalar<U, 0b01, opc, FPR16, asm, []>;
5275}
5276
5277multiclass SIMDThreeScalarSD<bit U, bit S, bits<5> opc, string asm,
5278 SDPatternOperator OpNode = null_frag> {
5279 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
5280 def #NAME#64 : BaseSIMDThreeScalar<U, {S,1}, opc, FPR64, asm,
5281 [(set (f64 FPR64:$Rd), (OpNode (f64 FPR64:$Rn), (f64 FPR64:$Rm)))]>;
5282 def #NAME#32 : BaseSIMDThreeScalar<U, {S,0}, opc, FPR32, asm,
5283 [(set FPR32:$Rd, (OpNode FPR32:$Rn, FPR32:$Rm))]>;
5284 }
5285
5286 def : Pat<(v1f64 (OpNode (v1f64 FPR64:$Rn), (v1f64 FPR64:$Rm))),
5287 (!cast<Instruction>(NAME # "64") FPR64:$Rn, FPR64:$Rm)>;
5288}
5289
5290multiclass SIMDThreeScalarFPCmp<bit U, bit S, bits<5> opc, string asm,
5291 SDPatternOperator OpNode = null_frag> {
5292 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
5293 def #NAME#64 : BaseSIMDThreeScalar<U, {S,1}, opc, FPR64, asm,
5294 [(set (i64 FPR64:$Rd), (OpNode (f64 FPR64:$Rn), (f64 FPR64:$Rm)))]>;
5295 def #NAME#32 : BaseSIMDThreeScalar<U, {S,0}, opc, FPR32, asm,
5296 [(set (i32 FPR32:$Rd), (OpNode (f32 FPR32:$Rn), (f32 FPR32:$Rm)))]>;
5297 }
5298
5299 def : Pat<(v1i64 (OpNode (v1f64 FPR64:$Rn), (v1f64 FPR64:$Rm))),
5300 (!cast<Instruction>(NAME # "64") FPR64:$Rn, FPR64:$Rm)>;
5301}
5302
5303class BaseSIMDThreeScalarMixed<bit U, bits<2> size, bits<5> opcode,
5304 dag oops, dag iops, string asm, string cstr, list<dag> pat>
5305 : I<oops, iops, asm,
5306 "\t$Rd, $Rn, $Rm", cstr, pat>,
5307 Sched<[WriteV]> {
5308 bits<5> Rd;
5309 bits<5> Rn;
5310 bits<5> Rm;
5311 let Inst{31-30} = 0b01;
5312 let Inst{29} = U;
5313 let Inst{28-24} = 0b11110;
5314 let Inst{23-22} = size;
5315 let Inst{21} = 1;
5316 let Inst{20-16} = Rm;
5317 let Inst{15-11} = opcode;
5318 let Inst{10} = 0;
5319 let Inst{9-5} = Rn;
5320 let Inst{4-0} = Rd;
5321}
5322
5323let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5324multiclass SIMDThreeScalarMixedHS<bit U, bits<5> opc, string asm,
5325 SDPatternOperator OpNode = null_frag> {
5326 def i16 : BaseSIMDThreeScalarMixed<U, 0b01, opc,
5327 (outs FPR32:$Rd),
5328 (ins FPR16:$Rn, FPR16:$Rm), asm, "", []>;
5329 def i32 : BaseSIMDThreeScalarMixed<U, 0b10, opc,
5330 (outs FPR64:$Rd),
5331 (ins FPR32:$Rn, FPR32:$Rm), asm, "",
5332 [(set (i64 FPR64:$Rd), (OpNode (i32 FPR32:$Rn), (i32 FPR32:$Rm)))]>;
5333}
5334
5335let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5336multiclass SIMDThreeScalarMixedTiedHS<bit U, bits<5> opc, string asm,
5337 SDPatternOperator OpNode = null_frag> {
5338 def i16 : BaseSIMDThreeScalarMixed<U, 0b01, opc,
5339 (outs FPR32:$dst),
5340 (ins FPR32:$Rd, FPR16:$Rn, FPR16:$Rm),
5341 asm, "$Rd = $dst", []>;
5342 def i32 : BaseSIMDThreeScalarMixed<U, 0b10, opc,
5343 (outs FPR64:$dst),
5344 (ins FPR64:$Rd, FPR32:$Rn, FPR32:$Rm),
5345 asm, "$Rd = $dst",
5346 [(set (i64 FPR64:$dst),
5347 (OpNode (i64 FPR64:$Rd), (i32 FPR32:$Rn), (i32 FPR32:$Rm)))]>;
5348}
5349
5350//----------------------------------------------------------------------------
5351// AdvSIMD two register scalar instructions
5352//----------------------------------------------------------------------------
5353
5354let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5355class BaseSIMDTwoScalar<bit U, bits<2> size, bits<5> opcode,
5356 RegisterClass regtype, RegisterClass regtype2,
5357 string asm, list<dag> pat>
5358 : I<(outs regtype:$Rd), (ins regtype2:$Rn), asm,
5359 "\t$Rd, $Rn", "", pat>,
5360 Sched<[WriteV]> {
5361 bits<5> Rd;
5362 bits<5> Rn;
5363 let Inst{31-30} = 0b01;
5364 let Inst{29} = U;
5365 let Inst{28-24} = 0b11110;
5366 let Inst{23-22} = size;
5367 let Inst{21-17} = 0b10000;
5368 let Inst{16-12} = opcode;
5369 let Inst{11-10} = 0b10;
5370 let Inst{9-5} = Rn;
5371 let Inst{4-0} = Rd;
5372}
5373
5374let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5375class BaseSIMDTwoScalarTied<bit U, bits<2> size, bits<5> opcode,
5376 RegisterClass regtype, RegisterClass regtype2,
5377 string asm, list<dag> pat>
5378 : I<(outs regtype:$dst), (ins regtype:$Rd, regtype2:$Rn), asm,
5379 "\t$Rd, $Rn", "$Rd = $dst", pat>,
5380 Sched<[WriteV]> {
5381 bits<5> Rd;
5382 bits<5> Rn;
5383 let Inst{31-30} = 0b01;
5384 let Inst{29} = U;
5385 let Inst{28-24} = 0b11110;
5386 let Inst{23-22} = size;
5387 let Inst{21-17} = 0b10000;
5388 let Inst{16-12} = opcode;
5389 let Inst{11-10} = 0b10;
5390 let Inst{9-5} = Rn;
5391 let Inst{4-0} = Rd;
5392}
5393
5394
5395let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5396class BaseSIMDCmpTwoScalar<bit U, bits<2> size, bits<5> opcode,
5397 RegisterClass regtype, string asm, string zero>
5398 : I<(outs regtype:$Rd), (ins regtype:$Rn), asm,
5399 "\t$Rd, $Rn, #" # zero, "", []>,
5400 Sched<[WriteV]> {
5401 bits<5> Rd;
5402 bits<5> Rn;
5403 let Inst{31-30} = 0b01;
5404 let Inst{29} = U;
5405 let Inst{28-24} = 0b11110;
5406 let Inst{23-22} = size;
5407 let Inst{21-17} = 0b10000;
5408 let Inst{16-12} = opcode;
5409 let Inst{11-10} = 0b10;
5410 let Inst{9-5} = Rn;
5411 let Inst{4-0} = Rd;
5412}
5413
5414class SIMDInexactCvtTwoScalar<bits<5> opcode, string asm>
5415 : I<(outs FPR32:$Rd), (ins FPR64:$Rn), asm, "\t$Rd, $Rn", "",
5416 [(set (f32 FPR32:$Rd), (int_aarch64_sisd_fcvtxn (f64 FPR64:$Rn)))]>,
5417 Sched<[WriteV]> {
5418 bits<5> Rd;
5419 bits<5> Rn;
5420 let Inst{31-17} = 0b011111100110000;
5421 let Inst{16-12} = opcode;
5422 let Inst{11-10} = 0b10;
5423 let Inst{9-5} = Rn;
5424 let Inst{4-0} = Rd;
5425}
5426
5427multiclass SIMDCmpTwoScalarD<bit U, bits<5> opc, string asm,
5428 SDPatternOperator OpNode> {
5429 def v1i64rz : BaseSIMDCmpTwoScalar<U, 0b11, opc, FPR64, asm, "0">;
5430
5431 def : Pat<(v1i64 (OpNode FPR64:$Rn)),
5432 (!cast<Instruction>(NAME # v1i64rz) FPR64:$Rn)>;
5433}
5434
5435multiclass SIMDCmpTwoScalarSD<bit U, bit S, bits<5> opc, string asm,
5436 SDPatternOperator OpNode> {
5437 def v1i64rz : BaseSIMDCmpTwoScalar<U, {S,1}, opc, FPR64, asm, "0.0">;
5438 def v1i32rz : BaseSIMDCmpTwoScalar<U, {S,0}, opc, FPR32, asm, "0.0">;
5439
5440 def : InstAlias<asm # " $Rd, $Rn, #0",
5441 (!cast<Instruction>(NAME # v1i64rz) FPR64:$Rd, FPR64:$Rn), 0>;
5442 def : InstAlias<asm # " $Rd, $Rn, #0",
5443 (!cast<Instruction>(NAME # v1i32rz) FPR32:$Rd, FPR32:$Rn), 0>;
5444
5445 def : Pat<(v1i64 (OpNode (v1f64 FPR64:$Rn))),
5446 (!cast<Instruction>(NAME # v1i64rz) FPR64:$Rn)>;
5447}
5448
5449multiclass SIMDTwoScalarD<bit U, bits<5> opc, string asm,
5450 SDPatternOperator OpNode = null_frag> {
5451 def v1i64 : BaseSIMDTwoScalar<U, 0b11, opc, FPR64, FPR64, asm,
5452 [(set (v1i64 FPR64:$Rd), (OpNode (v1i64 FPR64:$Rn)))]>;
5453
5454 def : Pat<(i64 (OpNode (i64 FPR64:$Rn))),
5455 (!cast<Instruction>(NAME # "v1i64") FPR64:$Rn)>;
5456}
5457
5458multiclass SIMDTwoScalarSD<bit U, bit S, bits<5> opc, string asm> {
5459 def v1i64 : BaseSIMDTwoScalar<U, {S,1}, opc, FPR64, FPR64, asm,[]>;
5460 def v1i32 : BaseSIMDTwoScalar<U, {S,0}, opc, FPR32, FPR32, asm,[]>;
5461}
5462
5463multiclass SIMDTwoScalarCVTSD<bit U, bit S, bits<5> opc, string asm,
5464 SDPatternOperator OpNode> {
5465 def v1i64 : BaseSIMDTwoScalar<U, {S,1}, opc, FPR64, FPR64, asm,
5466 [(set FPR64:$Rd, (OpNode (f64 FPR64:$Rn)))]>;
5467 def v1i32 : BaseSIMDTwoScalar<U, {S,0}, opc, FPR32, FPR32, asm,
5468 [(set FPR32:$Rd, (OpNode (f32 FPR32:$Rn)))]>;
5469}
5470
5471multiclass SIMDTwoScalarBHSD<bit U, bits<5> opc, string asm,
5472 SDPatternOperator OpNode = null_frag> {
5473 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
5474 def v1i64 : BaseSIMDTwoScalar<U, 0b11, opc, FPR64, FPR64, asm,
5475 [(set (i64 FPR64:$Rd), (OpNode (i64 FPR64:$Rn)))]>;
5476 def v1i32 : BaseSIMDTwoScalar<U, 0b10, opc, FPR32, FPR32, asm,
5477 [(set (i32 FPR32:$Rd), (OpNode (i32 FPR32:$Rn)))]>;
5478 def v1i16 : BaseSIMDTwoScalar<U, 0b01, opc, FPR16, FPR16, asm, []>;
5479 def v1i8 : BaseSIMDTwoScalar<U, 0b00, opc, FPR8 , FPR8 , asm, []>;
5480 }
5481
5482 def : Pat<(v1i64 (OpNode (v1i64 FPR64:$Rn))),
5483 (!cast<Instruction>(NAME # v1i64) FPR64:$Rn)>;
5484}
5485
5486multiclass SIMDTwoScalarBHSDTied<bit U, bits<5> opc, string asm,
5487 Intrinsic OpNode> {
5488 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
5489 def v1i64 : BaseSIMDTwoScalarTied<U, 0b11, opc, FPR64, FPR64, asm,
5490 [(set (i64 FPR64:$dst), (OpNode (i64 FPR64:$Rd), (i64 FPR64:$Rn)))]>;
5491 def v1i32 : BaseSIMDTwoScalarTied<U, 0b10, opc, FPR32, FPR32, asm,
5492 [(set (i32 FPR32:$dst), (OpNode (i32 FPR32:$Rd), (i32 FPR32:$Rn)))]>;
5493 def v1i16 : BaseSIMDTwoScalarTied<U, 0b01, opc, FPR16, FPR16, asm, []>;
5494 def v1i8 : BaseSIMDTwoScalarTied<U, 0b00, opc, FPR8 , FPR8 , asm, []>;
5495 }
5496
5497 def : Pat<(v1i64 (OpNode (v1i64 FPR64:$Rd), (v1i64 FPR64:$Rn))),
5498 (!cast<Instruction>(NAME # v1i64) FPR64:$Rd, FPR64:$Rn)>;
5499}
5500
5501
5502
5503let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5504multiclass SIMDTwoScalarMixedBHS<bit U, bits<5> opc, string asm,
5505 SDPatternOperator OpNode = null_frag> {
5506 def v1i32 : BaseSIMDTwoScalar<U, 0b10, opc, FPR32, FPR64, asm,
5507 [(set (i32 FPR32:$Rd), (OpNode (i64 FPR64:$Rn)))]>;
5508 def v1i16 : BaseSIMDTwoScalar<U, 0b01, opc, FPR16, FPR32, asm, []>;
5509 def v1i8 : BaseSIMDTwoScalar<U, 0b00, opc, FPR8 , FPR16, asm, []>;
5510}
5511
5512//----------------------------------------------------------------------------
5513// AdvSIMD scalar pairwise instructions
5514//----------------------------------------------------------------------------
5515
5516let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5517class BaseSIMDPairwiseScalar<bit U, bits<2> size, bits<5> opcode,
5518 RegisterOperand regtype, RegisterOperand vectype,
5519 string asm, string kind>
5520 : I<(outs regtype:$Rd), (ins vectype:$Rn), asm,
5521 "{\t$Rd, $Rn" # kind # "|" # kind # "\t$Rd, $Rn}", "", []>,
5522 Sched<[WriteV]> {
5523 bits<5> Rd;
5524 bits<5> Rn;
5525 let Inst{31-30} = 0b01;
5526 let Inst{29} = U;
5527 let Inst{28-24} = 0b11110;
5528 let Inst{23-22} = size;
5529 let Inst{21-17} = 0b11000;
5530 let Inst{16-12} = opcode;
5531 let Inst{11-10} = 0b10;
5532 let Inst{9-5} = Rn;
5533 let Inst{4-0} = Rd;
5534}
5535
5536multiclass SIMDPairwiseScalarD<bit U, bits<5> opc, string asm> {
5537 def v2i64p : BaseSIMDPairwiseScalar<U, 0b11, opc, FPR64Op, V128,
5538 asm, ".2d">;
5539}
5540
5541multiclass SIMDPairwiseScalarSD<bit U, bit S, bits<5> opc, string asm> {
5542 def v2i32p : BaseSIMDPairwiseScalar<U, {S,0}, opc, FPR32Op, V64,
5543 asm, ".2s">;
5544 def v2i64p : BaseSIMDPairwiseScalar<U, {S,1}, opc, FPR64Op, V128,
5545 asm, ".2d">;
5546}
5547
5548//----------------------------------------------------------------------------
5549// AdvSIMD across lanes instructions
5550//----------------------------------------------------------------------------
5551
5552let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
5553class BaseSIMDAcrossLanes<bit Q, bit U, bits<2> size, bits<5> opcode,
5554 RegisterClass regtype, RegisterOperand vectype,
5555 string asm, string kind, list<dag> pattern>
5556 : I<(outs regtype:$Rd), (ins vectype:$Rn), asm,
5557 "{\t$Rd, $Rn" # kind # "|" # kind # "\t$Rd, $Rn}", "", pattern>,
5558 Sched<[WriteV]> {
5559 bits<5> Rd;
5560 bits<5> Rn;
5561 let Inst{31} = 0;
5562 let Inst{30} = Q;
5563 let Inst{29} = U;
5564 let Inst{28-24} = 0b01110;
5565 let Inst{23-22} = size;
5566 let Inst{21-17} = 0b11000;
5567 let Inst{16-12} = opcode;
5568 let Inst{11-10} = 0b10;
5569 let Inst{9-5} = Rn;
5570 let Inst{4-0} = Rd;
5571}
5572
5573multiclass SIMDAcrossLanesBHS<bit U, bits<5> opcode,
5574 string asm> {
5575 def v8i8v : BaseSIMDAcrossLanes<0, U, 0b00, opcode, FPR8, V64,
5576 asm, ".8b", []>;
5577 def v16i8v : BaseSIMDAcrossLanes<1, U, 0b00, opcode, FPR8, V128,
5578 asm, ".16b", []>;
5579 def v4i16v : BaseSIMDAcrossLanes<0, U, 0b01, opcode, FPR16, V64,
5580 asm, ".4h", []>;
5581 def v8i16v : BaseSIMDAcrossLanes<1, U, 0b01, opcode, FPR16, V128,
5582 asm, ".8h", []>;
5583 def v4i32v : BaseSIMDAcrossLanes<1, U, 0b10, opcode, FPR32, V128,
5584 asm, ".4s", []>;
5585}
5586
5587multiclass SIMDAcrossLanesHSD<bit U, bits<5> opcode, string asm> {
5588 def v8i8v : BaseSIMDAcrossLanes<0, U, 0b00, opcode, FPR16, V64,
5589 asm, ".8b", []>;
5590 def v16i8v : BaseSIMDAcrossLanes<1, U, 0b00, opcode, FPR16, V128,
5591 asm, ".16b", []>;
5592 def v4i16v : BaseSIMDAcrossLanes<0, U, 0b01, opcode, FPR32, V64,
5593 asm, ".4h", []>;
5594 def v8i16v : BaseSIMDAcrossLanes<1, U, 0b01, opcode, FPR32, V128,
5595 asm, ".8h", []>;
5596 def v4i32v : BaseSIMDAcrossLanes<1, U, 0b10, opcode, FPR64, V128,
5597 asm, ".4s", []>;
5598}
5599
5600multiclass SIMDAcrossLanesS<bits<5> opcode, bit sz1, string asm,
5601 Intrinsic intOp> {
5602 def v4i32v : BaseSIMDAcrossLanes<1, 1, {sz1, 0}, opcode, FPR32, V128,
5603 asm, ".4s",
5604 [(set FPR32:$Rd, (intOp (v4f32 V128:$Rn)))]>;
5605}
5606
5607//----------------------------------------------------------------------------
5608// AdvSIMD INS/DUP instructions
5609//----------------------------------------------------------------------------
5610
5611// FIXME: There has got to be a better way to factor these. ugh.
5612
5613class BaseSIMDInsDup<bit Q, bit op, dag outs, dag ins, string asm,
5614 string operands, string constraints, list<dag> pattern>
5615 : I<outs, ins, asm, operands, constraints, pattern>,
5616 Sched<[WriteV]> {
5617 bits<5> Rd;
5618 bits<5> Rn;
5619 let Inst{31} = 0;
5620 let Inst{30} = Q;
5621 let Inst{29} = op;
5622 let Inst{28-21} = 0b01110000;
5623 let Inst{15} = 0;
5624 let Inst{10} = 1;
5625 let Inst{9-5} = Rn;
5626 let Inst{4-0} = Rd;
5627}
5628
5629class SIMDDupFromMain<bit Q, bits<5> imm5, string size, ValueType vectype,
5630 RegisterOperand vecreg, RegisterClass regtype>
5631 : BaseSIMDInsDup<Q, 0, (outs vecreg:$Rd), (ins regtype:$Rn), "dup",
5632 "{\t$Rd" # size # ", $Rn" #
5633 "|" # size # "\t$Rd, $Rn}", "",
5634 [(set (vectype vecreg:$Rd), (AArch64dup regtype:$Rn))]> {
5635 let Inst{20-16} = imm5;
5636 let Inst{14-11} = 0b0001;
5637}
5638
5639class SIMDDupFromElement<bit Q, string dstkind, string srckind,
5640 ValueType vectype, ValueType insreg,
5641 RegisterOperand vecreg, Operand idxtype,
5642 ValueType elttype, SDNode OpNode>
5643 : BaseSIMDInsDup<Q, 0, (outs vecreg:$Rd), (ins V128:$Rn, idxtype:$idx), "dup",
5644 "{\t$Rd" # dstkind # ", $Rn" # srckind # "$idx" #
5645 "|" # dstkind # "\t$Rd, $Rn$idx}", "",
5646 [(set (vectype vecreg:$Rd),
5647 (OpNode (insreg V128:$Rn), idxtype:$idx))]> {
5648 let Inst{14-11} = 0b0000;
5649}
5650
5651class SIMDDup64FromElement
5652 : SIMDDupFromElement<1, ".2d", ".d", v2i64, v2i64, V128,
5653 VectorIndexD, i64, AArch64duplane64> {
5654 bits<1> idx;
5655 let Inst{20} = idx;
5656 let Inst{19-16} = 0b1000;
5657}
5658
5659class SIMDDup32FromElement<bit Q, string size, ValueType vectype,
5660 RegisterOperand vecreg>
5661 : SIMDDupFromElement<Q, size, ".s", vectype, v4i32, vecreg,
5662 VectorIndexS, i64, AArch64duplane32> {
5663 bits<2> idx;
5664 let Inst{20-19} = idx;
5665 let Inst{18-16} = 0b100;
5666}
5667
5668class SIMDDup16FromElement<bit Q, string size, ValueType vectype,
5669 RegisterOperand vecreg>
5670 : SIMDDupFromElement<Q, size, ".h", vectype, v8i16, vecreg,
5671 VectorIndexH, i64, AArch64duplane16> {
5672 bits<3> idx;
5673 let Inst{20-18} = idx;
5674 let Inst{17-16} = 0b10;
5675}
5676
5677class SIMDDup8FromElement<bit Q, string size, ValueType vectype,
5678 RegisterOperand vecreg>
5679 : SIMDDupFromElement<Q, size, ".b", vectype, v16i8, vecreg,
5680 VectorIndexB, i64, AArch64duplane8> {
5681 bits<4> idx;
5682 let Inst{20-17} = idx;
5683 let Inst{16} = 1;
5684}
5685
5686class BaseSIMDMov<bit Q, string size, bits<4> imm4, RegisterClass regtype,
5687 Operand idxtype, string asm, list<dag> pattern>
5688 : BaseSIMDInsDup<Q, 0, (outs regtype:$Rd), (ins V128:$Rn, idxtype:$idx), asm,
5689 "{\t$Rd, $Rn" # size # "$idx" #
5690 "|" # size # "\t$Rd, $Rn$idx}", "", pattern> {
5691 let Inst{14-11} = imm4;
5692}
5693
5694class SIMDSMov<bit Q, string size, RegisterClass regtype,
5695 Operand idxtype>
5696 : BaseSIMDMov<Q, size, 0b0101, regtype, idxtype, "smov", []>;
5697class SIMDUMov<bit Q, string size, ValueType vectype, RegisterClass regtype,
5698 Operand idxtype>
5699 : BaseSIMDMov<Q, size, 0b0111, regtype, idxtype, "umov",
5700 [(set regtype:$Rd, (vector_extract (vectype V128:$Rn), idxtype:$idx))]>;
5701
5702class SIMDMovAlias<string asm, string size, Instruction inst,
5703 RegisterClass regtype, Operand idxtype>
5704 : InstAlias<asm#"{\t$dst, $src"#size#"$idx" #
5705 "|" # size # "\t$dst, $src$idx}",
5706 (inst regtype:$dst, V128:$src, idxtype:$idx)>;
5707
5708multiclass SMov {
5709 def vi8to32 : SIMDSMov<0, ".b", GPR32, VectorIndexB> {
5710 bits<4> idx;
5711 let Inst{20-17} = idx;
5712 let Inst{16} = 1;
5713 }
5714 def vi8to64 : SIMDSMov<1, ".b", GPR64, VectorIndexB> {
5715 bits<4> idx;
5716 let Inst{20-17} = idx;
5717 let Inst{16} = 1;
5718 }
5719 def vi16to32 : SIMDSMov<0, ".h", GPR32, VectorIndexH> {
5720 bits<3> idx;
5721 let Inst{20-18} = idx;
5722 let Inst{17-16} = 0b10;
5723 }
5724 def vi16to64 : SIMDSMov<1, ".h", GPR64, VectorIndexH> {
5725 bits<3> idx;
5726 let Inst{20-18} = idx;
5727 let Inst{17-16} = 0b10;
5728 }
5729 def vi32to64 : SIMDSMov<1, ".s", GPR64, VectorIndexS> {
5730 bits<2> idx;
5731 let Inst{20-19} = idx;
5732 let Inst{18-16} = 0b100;
5733 }
5734}
5735
5736multiclass UMov {
5737 def vi8 : SIMDUMov<0, ".b", v16i8, GPR32, VectorIndexB> {
5738 bits<4> idx;
5739 let Inst{20-17} = idx;
5740 let Inst{16} = 1;
5741 }
5742 def vi16 : SIMDUMov<0, ".h", v8i16, GPR32, VectorIndexH> {
5743 bits<3> idx;
5744 let Inst{20-18} = idx;
5745 let Inst{17-16} = 0b10;
5746 }
5747 def vi32 : SIMDUMov<0, ".s", v4i32, GPR32, VectorIndexS> {
5748 bits<2> idx;
5749 let Inst{20-19} = idx;
5750 let Inst{18-16} = 0b100;
5751 }
5752 def vi64 : SIMDUMov<1, ".d", v2i64, GPR64, VectorIndexD> {
5753 bits<1> idx;
5754 let Inst{20} = idx;
5755 let Inst{19-16} = 0b1000;
5756 }
5757 def : SIMDMovAlias<"mov", ".s",
5758 !cast<Instruction>(NAME#"vi32"),
5759 GPR32, VectorIndexS>;
5760 def : SIMDMovAlias<"mov", ".d",
5761 !cast<Instruction>(NAME#"vi64"),
5762 GPR64, VectorIndexD>;
5763}
5764
5765class SIMDInsFromMain<string size, ValueType vectype,
5766 RegisterClass regtype, Operand idxtype>
5767 : BaseSIMDInsDup<1, 0, (outs V128:$dst),
5768 (ins V128:$Rd, idxtype:$idx, regtype:$Rn), "ins",
5769 "{\t$Rd" # size # "$idx, $Rn" #
5770 "|" # size # "\t$Rd$idx, $Rn}",
5771 "$Rd = $dst",
5772 [(set V128:$dst,
5773 (vector_insert (vectype V128:$Rd), regtype:$Rn, idxtype:$idx))]> {
5774 let Inst{14-11} = 0b0011;
5775}
5776
5777class SIMDInsFromElement<string size, ValueType vectype,
5778 ValueType elttype, Operand idxtype>
5779 : BaseSIMDInsDup<1, 1, (outs V128:$dst),
5780 (ins V128:$Rd, idxtype:$idx, V128:$Rn, idxtype:$idx2), "ins",
5781 "{\t$Rd" # size # "$idx, $Rn" # size # "$idx2" #
5782 "|" # size # "\t$Rd$idx, $Rn$idx2}",
5783 "$Rd = $dst",
5784 [(set V128:$dst,
5785 (vector_insert
5786 (vectype V128:$Rd),
5787 (elttype (vector_extract (vectype V128:$Rn), idxtype:$idx2)),
5788 idxtype:$idx))]>;
5789
5790class SIMDInsMainMovAlias<string size, Instruction inst,
5791 RegisterClass regtype, Operand idxtype>
5792 : InstAlias<"mov" # "{\t$dst" # size # "$idx, $src" #
5793 "|" # size #"\t$dst$idx, $src}",
5794 (inst V128:$dst, idxtype:$idx, regtype:$src)>;
5795class SIMDInsElementMovAlias<string size, Instruction inst,
5796 Operand idxtype>
5797 : InstAlias<"mov" # "{\t$dst" # size # "$idx, $src" # size # "$idx2" #
5798 # "|" # size #" $dst$idx, $src$idx2}",
5799 (inst V128:$dst, idxtype:$idx, V128:$src, idxtype:$idx2)>;
5800
5801
5802multiclass SIMDIns {
5803 def vi8gpr : SIMDInsFromMain<".b", v16i8, GPR32, VectorIndexB> {
5804 bits<4> idx;
5805 let Inst{20-17} = idx;
5806 let Inst{16} = 1;
5807 }
5808 def vi16gpr : SIMDInsFromMain<".h", v8i16, GPR32, VectorIndexH> {
5809 bits<3> idx;
5810 let Inst{20-18} = idx;
5811 let Inst{17-16} = 0b10;
5812 }
5813 def vi32gpr : SIMDInsFromMain<".s", v4i32, GPR32, VectorIndexS> {
5814 bits<2> idx;
5815 let Inst{20-19} = idx;
5816 let Inst{18-16} = 0b100;
5817 }
5818 def vi64gpr : SIMDInsFromMain<".d", v2i64, GPR64, VectorIndexD> {
5819 bits<1> idx;
5820 let Inst{20} = idx;
5821 let Inst{19-16} = 0b1000;
5822 }
5823
5824 def vi8lane : SIMDInsFromElement<".b", v16i8, i32, VectorIndexB> {
5825 bits<4> idx;
5826 bits<4> idx2;
5827 let Inst{20-17} = idx;
5828 let Inst{16} = 1;
5829 let Inst{14-11} = idx2;
5830 }
5831 def vi16lane : SIMDInsFromElement<".h", v8i16, i32, VectorIndexH> {
5832 bits<3> idx;
5833 bits<3> idx2;
5834 let Inst{20-18} = idx;
5835 let Inst{17-16} = 0b10;
5836 let Inst{14-12} = idx2;
5837 let Inst{11} = 0;
5838 }
5839 def vi32lane : SIMDInsFromElement<".s", v4i32, i32, VectorIndexS> {
5840 bits<2> idx;
5841 bits<2> idx2;
5842 let Inst{20-19} = idx;
5843 let Inst{18-16} = 0b100;
5844 let Inst{14-13} = idx2;
5845 let Inst{12-11} = 0;
5846 }
5847 def vi64lane : SIMDInsFromElement<".d", v2i64, i64, VectorIndexD> {
5848 bits<1> idx;
5849 bits<1> idx2;
5850 let Inst{20} = idx;
5851 let Inst{19-16} = 0b1000;
5852 let Inst{14} = idx2;
5853 let Inst{13-11} = 0;
5854 }
5855
5856 // For all forms of the INS instruction, the "mov" mnemonic is the
5857 // preferred alias. Why they didn't just call the instruction "mov" in
5858 // the first place is a very good question indeed...
5859 def : SIMDInsMainMovAlias<".b", !cast<Instruction>(NAME#"vi8gpr"),
5860 GPR32, VectorIndexB>;
5861 def : SIMDInsMainMovAlias<".h", !cast<Instruction>(NAME#"vi16gpr"),
5862 GPR32, VectorIndexH>;
5863 def : SIMDInsMainMovAlias<".s", !cast<Instruction>(NAME#"vi32gpr"),
5864 GPR32, VectorIndexS>;
5865 def : SIMDInsMainMovAlias<".d", !cast<Instruction>(NAME#"vi64gpr"),
5866 GPR64, VectorIndexD>;
5867
5868 def : SIMDInsElementMovAlias<".b", !cast<Instruction>(NAME#"vi8lane"),
5869 VectorIndexB>;
5870 def : SIMDInsElementMovAlias<".h", !cast<Instruction>(NAME#"vi16lane"),
5871 VectorIndexH>;
5872 def : SIMDInsElementMovAlias<".s", !cast<Instruction>(NAME#"vi32lane"),
5873 VectorIndexS>;
5874 def : SIMDInsElementMovAlias<".d", !cast<Instruction>(NAME#"vi64lane"),
5875 VectorIndexD>;
5876}
5877
5878//----------------------------------------------------------------------------
5879// AdvSIMD TBL/TBX
5880//----------------------------------------------------------------------------
5881
5882let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
5883class BaseSIMDTableLookup<bit Q, bits<2> len, bit op, RegisterOperand vectype,
5884 RegisterOperand listtype, string asm, string kind>
5885 : I<(outs vectype:$Vd), (ins listtype:$Vn, vectype:$Vm), asm,
5886 "\t$Vd" # kind # ", $Vn, $Vm" # kind, "", []>,
5887 Sched<[WriteV]> {
5888 bits<5> Vd;
5889 bits<5> Vn;
5890 bits<5> Vm;
5891 let Inst{31} = 0;
5892 let Inst{30} = Q;
5893 let Inst{29-21} = 0b001110000;
5894 let Inst{20-16} = Vm;
5895 let Inst{15} = 0;
5896 let Inst{14-13} = len;
5897 let Inst{12} = op;
5898 let Inst{11-10} = 0b00;
5899 let Inst{9-5} = Vn;
5900 let Inst{4-0} = Vd;
5901}
5902
5903let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
5904class BaseSIMDTableLookupTied<bit Q, bits<2> len, bit op, RegisterOperand vectype,
5905 RegisterOperand listtype, string asm, string kind>
5906 : I<(outs vectype:$dst), (ins vectype:$Vd, listtype:$Vn, vectype:$Vm), asm,
5907 "\t$Vd" # kind # ", $Vn, $Vm" # kind, "$Vd = $dst", []>,
5908 Sched<[WriteV]> {
5909 bits<5> Vd;
5910 bits<5> Vn;
5911 bits<5> Vm;
5912 let Inst{31} = 0;
5913 let Inst{30} = Q;
5914 let Inst{29-21} = 0b001110000;
5915 let Inst{20-16} = Vm;
5916 let Inst{15} = 0;
5917 let Inst{14-13} = len;
5918 let Inst{12} = op;
5919 let Inst{11-10} = 0b00;
5920 let Inst{9-5} = Vn;
5921 let Inst{4-0} = Vd;
5922}
5923
5924class SIMDTableLookupAlias<string asm, Instruction inst,
5925 RegisterOperand vectype, RegisterOperand listtype>
5926 : InstAlias<!strconcat(asm, "\t$dst, $lst, $index"),
5927 (inst vectype:$dst, listtype:$lst, vectype:$index), 0>;
5928
5929multiclass SIMDTableLookup<bit op, string asm> {
5930 def v8i8One : BaseSIMDTableLookup<0, 0b00, op, V64, VecListOne16b,
5931 asm, ".8b">;
5932 def v8i8Two : BaseSIMDTableLookup<0, 0b01, op, V64, VecListTwo16b,
5933 asm, ".8b">;
5934 def v8i8Three : BaseSIMDTableLookup<0, 0b10, op, V64, VecListThree16b,
5935 asm, ".8b">;
5936 def v8i8Four : BaseSIMDTableLookup<0, 0b11, op, V64, VecListFour16b,
5937 asm, ".8b">;
5938 def v16i8One : BaseSIMDTableLookup<1, 0b00, op, V128, VecListOne16b,
5939 asm, ".16b">;
5940 def v16i8Two : BaseSIMDTableLookup<1, 0b01, op, V128, VecListTwo16b,
5941 asm, ".16b">;
5942 def v16i8Three: BaseSIMDTableLookup<1, 0b10, op, V128, VecListThree16b,
5943 asm, ".16b">;
5944 def v16i8Four : BaseSIMDTableLookup<1, 0b11, op, V128, VecListFour16b,
5945 asm, ".16b">;
5946
5947 def : SIMDTableLookupAlias<asm # ".8b",
5948 !cast<Instruction>(NAME#"v8i8One"),
5949 V64, VecListOne128>;
5950 def : SIMDTableLookupAlias<asm # ".8b",
5951 !cast<Instruction>(NAME#"v8i8Two"),
5952 V64, VecListTwo128>;
5953 def : SIMDTableLookupAlias<asm # ".8b",
5954 !cast<Instruction>(NAME#"v8i8Three"),
5955 V64, VecListThree128>;
5956 def : SIMDTableLookupAlias<asm # ".8b",
5957 !cast<Instruction>(NAME#"v8i8Four"),
5958 V64, VecListFour128>;
5959 def : SIMDTableLookupAlias<asm # ".16b",
5960 !cast<Instruction>(NAME#"v16i8One"),
5961 V128, VecListOne128>;
5962 def : SIMDTableLookupAlias<asm # ".16b",
5963 !cast<Instruction>(NAME#"v16i8Two"),
5964 V128, VecListTwo128>;
5965 def : SIMDTableLookupAlias<asm # ".16b",
5966 !cast<Instruction>(NAME#"v16i8Three"),
5967 V128, VecListThree128>;
5968 def : SIMDTableLookupAlias<asm # ".16b",
5969 !cast<Instruction>(NAME#"v16i8Four"),
5970 V128, VecListFour128>;
5971}
5972
5973multiclass SIMDTableLookupTied<bit op, string asm> {
5974 def v8i8One : BaseSIMDTableLookupTied<0, 0b00, op, V64, VecListOne16b,
5975 asm, ".8b">;
5976 def v8i8Two : BaseSIMDTableLookupTied<0, 0b01, op, V64, VecListTwo16b,
5977 asm, ".8b">;
5978 def v8i8Three : BaseSIMDTableLookupTied<0, 0b10, op, V64, VecListThree16b,
5979 asm, ".8b">;
5980 def v8i8Four : BaseSIMDTableLookupTied<0, 0b11, op, V64, VecListFour16b,
5981 asm, ".8b">;
5982 def v16i8One : BaseSIMDTableLookupTied<1, 0b00, op, V128, VecListOne16b,
5983 asm, ".16b">;
5984 def v16i8Two : BaseSIMDTableLookupTied<1, 0b01, op, V128, VecListTwo16b,
5985 asm, ".16b">;
5986 def v16i8Three: BaseSIMDTableLookupTied<1, 0b10, op, V128, VecListThree16b,
5987 asm, ".16b">;
5988 def v16i8Four : BaseSIMDTableLookupTied<1, 0b11, op, V128, VecListFour16b,
5989 asm, ".16b">;
5990
5991 def : SIMDTableLookupAlias<asm # ".8b",
5992 !cast<Instruction>(NAME#"v8i8One"),
5993 V64, VecListOne128>;
5994 def : SIMDTableLookupAlias<asm # ".8b",
5995 !cast<Instruction>(NAME#"v8i8Two"),
5996 V64, VecListTwo128>;
5997 def : SIMDTableLookupAlias<asm # ".8b",
5998 !cast<Instruction>(NAME#"v8i8Three"),
5999 V64, VecListThree128>;
6000 def : SIMDTableLookupAlias<asm # ".8b",
6001 !cast<Instruction>(NAME#"v8i8Four"),
6002 V64, VecListFour128>;
6003 def : SIMDTableLookupAlias<asm # ".16b",
6004 !cast<Instruction>(NAME#"v16i8One"),
6005 V128, VecListOne128>;
6006 def : SIMDTableLookupAlias<asm # ".16b",
6007 !cast<Instruction>(NAME#"v16i8Two"),
6008 V128, VecListTwo128>;
6009 def : SIMDTableLookupAlias<asm # ".16b",
6010 !cast<Instruction>(NAME#"v16i8Three"),
6011 V128, VecListThree128>;
6012 def : SIMDTableLookupAlias<asm # ".16b",
6013 !cast<Instruction>(NAME#"v16i8Four"),
6014 V128, VecListFour128>;
6015}
6016
6017
6018//----------------------------------------------------------------------------
6019// AdvSIMD scalar CPY
6020//----------------------------------------------------------------------------
6021let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
6022class BaseSIMDScalarCPY<RegisterClass regtype, RegisterOperand vectype,
6023 string kind, Operand idxtype>
6024 : I<(outs regtype:$dst), (ins vectype:$src, idxtype:$idx), "mov",
6025 "{\t$dst, $src" # kind # "$idx" #
6026 "|\t$dst, $src$idx}", "", []>,
6027 Sched<[WriteV]> {
6028 bits<5> dst;
6029 bits<5> src;
6030 let Inst{31-21} = 0b01011110000;
6031 let Inst{15-10} = 0b000001;
6032 let Inst{9-5} = src;
6033 let Inst{4-0} = dst;
6034}
6035
6036class SIMDScalarCPYAlias<string asm, string size, Instruction inst,
6037 RegisterClass regtype, RegisterOperand vectype, Operand idxtype>
6038 : InstAlias<asm # "{\t$dst, $src" # size # "$index" #
6039 # "|\t$dst, $src$index}",
6040 (inst regtype:$dst, vectype:$src, idxtype:$index), 0>;
6041
6042
6043multiclass SIMDScalarCPY<string asm> {
6044 def i8 : BaseSIMDScalarCPY<FPR8, V128, ".b", VectorIndexB> {
6045 bits<4> idx;
6046 let Inst{20-17} = idx;
6047 let Inst{16} = 1;
6048 }
6049 def i16 : BaseSIMDScalarCPY<FPR16, V128, ".h", VectorIndexH> {
6050 bits<3> idx;
6051 let Inst{20-18} = idx;
6052 let Inst{17-16} = 0b10;
6053 }
6054 def i32 : BaseSIMDScalarCPY<FPR32, V128, ".s", VectorIndexS> {
6055 bits<2> idx;
6056 let Inst{20-19} = idx;
6057 let Inst{18-16} = 0b100;
6058 }
6059 def i64 : BaseSIMDScalarCPY<FPR64, V128, ".d", VectorIndexD> {
6060 bits<1> idx;
6061 let Inst{20} = idx;
6062 let Inst{19-16} = 0b1000;
6063 }
6064
6065 def : Pat<(v1i64 (scalar_to_vector (i64 (vector_extract (v2i64 V128:$src),
6066 VectorIndexD:$idx)))),
6067 (!cast<Instruction>(NAME # i64) V128:$src, VectorIndexD:$idx)>;
6068
6069 // 'DUP' mnemonic aliases.
6070 def : SIMDScalarCPYAlias<"dup", ".b",
6071 !cast<Instruction>(NAME#"i8"),
6072 FPR8, V128, VectorIndexB>;
6073 def : SIMDScalarCPYAlias<"dup", ".h",
6074 !cast<Instruction>(NAME#"i16"),
6075 FPR16, V128, VectorIndexH>;
6076 def : SIMDScalarCPYAlias<"dup", ".s",
6077 !cast<Instruction>(NAME#"i32"),
6078 FPR32, V128, VectorIndexS>;
6079 def : SIMDScalarCPYAlias<"dup", ".d",
6080 !cast<Instruction>(NAME#"i64"),
6081 FPR64, V128, VectorIndexD>;
6082}
6083
6084//----------------------------------------------------------------------------
6085// AdvSIMD modified immediate instructions
6086//----------------------------------------------------------------------------
6087
6088class BaseSIMDModifiedImm<bit Q, bit op, dag oops, dag iops,
6089 string asm, string op_string,
6090 string cstr, list<dag> pattern>
6091 : I<oops, iops, asm, op_string, cstr, pattern>,
6092 Sched<[WriteV]> {
6093 bits<5> Rd;
6094 bits<8> imm8;
6095 let Inst{31} = 0;
6096 let Inst{30} = Q;
6097 let Inst{29} = op;
6098 let Inst{28-19} = 0b0111100000;
6099 let Inst{18-16} = imm8{7-5};
6100 let Inst{11-10} = 0b01;
6101 let Inst{9-5} = imm8{4-0};
6102 let Inst{4-0} = Rd;
6103}
6104
6105class BaseSIMDModifiedImmVector<bit Q, bit op, RegisterOperand vectype,
6106 Operand immtype, dag opt_shift_iop,
6107 string opt_shift, string asm, string kind,
6108 list<dag> pattern>
6109 : BaseSIMDModifiedImm<Q, op, (outs vectype:$Rd),
6110 !con((ins immtype:$imm8), opt_shift_iop), asm,
6111 "{\t$Rd" # kind # ", $imm8" # opt_shift #
6112 "|" # kind # "\t$Rd, $imm8" # opt_shift # "}",
6113 "", pattern> {
6114 let DecoderMethod = "DecodeModImmInstruction";
6115}
6116
6117class BaseSIMDModifiedImmVectorTied<bit Q, bit op, RegisterOperand vectype,
6118 Operand immtype, dag opt_shift_iop,
6119 string opt_shift, string asm, string kind,
6120 list<dag> pattern>
6121 : BaseSIMDModifiedImm<Q, op, (outs vectype:$dst),
6122 !con((ins vectype:$Rd, immtype:$imm8), opt_shift_iop),
6123 asm, "{\t$Rd" # kind # ", $imm8" # opt_shift #
6124 "|" # kind # "\t$Rd, $imm8" # opt_shift # "}",
6125 "$Rd = $dst", pattern> {
6126 let DecoderMethod = "DecodeModImmTiedInstruction";
6127}
6128
6129class BaseSIMDModifiedImmVectorShift<bit Q, bit op, bits<2> b15_b12,
6130 RegisterOperand vectype, string asm,
6131 string kind, list<dag> pattern>
6132 : BaseSIMDModifiedImmVector<Q, op, vectype, imm0_255,
6133 (ins logical_vec_shift:$shift),
6134 "$shift", asm, kind, pattern> {
6135 bits<2> shift;
6136 let Inst{15} = b15_b12{1};
6137 let Inst{14-13} = shift;
6138 let Inst{12} = b15_b12{0};
6139}
6140
6141class BaseSIMDModifiedImmVectorShiftTied<bit Q, bit op, bits<2> b15_b12,
6142 RegisterOperand vectype, string asm,
6143 string kind, list<dag> pattern>
6144 : BaseSIMDModifiedImmVectorTied<Q, op, vectype, imm0_255,
6145 (ins logical_vec_shift:$shift),
6146 "$shift", asm, kind, pattern> {
6147 bits<2> shift;
6148 let Inst{15} = b15_b12{1};
6149 let Inst{14-13} = shift;
6150 let Inst{12} = b15_b12{0};
6151}
6152
6153
6154class BaseSIMDModifiedImmVectorShiftHalf<bit Q, bit op, bits<2> b15_b12,
6155 RegisterOperand vectype, string asm,
6156 string kind, list<dag> pattern>
6157 : BaseSIMDModifiedImmVector<Q, op, vectype, imm0_255,
6158 (ins logical_vec_hw_shift:$shift),
6159 "$shift", asm, kind, pattern> {
6160 bits<2> shift;
6161 let Inst{15} = b15_b12{1};
6162 let Inst{14} = 0;
6163 let Inst{13} = shift{0};
6164 let Inst{12} = b15_b12{0};
6165}
6166
6167class BaseSIMDModifiedImmVectorShiftHalfTied<bit Q, bit op, bits<2> b15_b12,
6168 RegisterOperand vectype, string asm,
6169 string kind, list<dag> pattern>
6170 : BaseSIMDModifiedImmVectorTied<Q, op, vectype, imm0_255,
6171 (ins logical_vec_hw_shift:$shift),
6172 "$shift", asm, kind, pattern> {
6173 bits<2> shift;
6174 let Inst{15} = b15_b12{1};
6175 let Inst{14} = 0;
6176 let Inst{13} = shift{0};
6177 let Inst{12} = b15_b12{0};
6178}
6179
6180multiclass SIMDModifiedImmVectorShift<bit op, bits<2> hw_cmode, bits<2> w_cmode,
6181 string asm> {
6182 def v4i16 : BaseSIMDModifiedImmVectorShiftHalf<0, op, hw_cmode, V64,
6183 asm, ".4h", []>;
6184 def v8i16 : BaseSIMDModifiedImmVectorShiftHalf<1, op, hw_cmode, V128,
6185 asm, ".8h", []>;
6186
6187 def v2i32 : BaseSIMDModifiedImmVectorShift<0, op, w_cmode, V64,
6188 asm, ".2s", []>;
6189 def v4i32 : BaseSIMDModifiedImmVectorShift<1, op, w_cmode, V128,
6190 asm, ".4s", []>;
6191}
6192
6193multiclass SIMDModifiedImmVectorShiftTied<bit op, bits<2> hw_cmode,
6194 bits<2> w_cmode, string asm,
6195 SDNode OpNode> {
6196 def v4i16 : BaseSIMDModifiedImmVectorShiftHalfTied<0, op, hw_cmode, V64,
6197 asm, ".4h",
6198 [(set (v4i16 V64:$dst), (OpNode V64:$Rd,
6199 imm0_255:$imm8,
6200 (i32 imm:$shift)))]>;
6201 def v8i16 : BaseSIMDModifiedImmVectorShiftHalfTied<1, op, hw_cmode, V128,
6202 asm, ".8h",
6203 [(set (v8i16 V128:$dst), (OpNode V128:$Rd,
6204 imm0_255:$imm8,
6205 (i32 imm:$shift)))]>;
6206
6207 def v2i32 : BaseSIMDModifiedImmVectorShiftTied<0, op, w_cmode, V64,
6208 asm, ".2s",
6209 [(set (v2i32 V64:$dst), (OpNode V64:$Rd,
6210 imm0_255:$imm8,
6211 (i32 imm:$shift)))]>;
6212 def v4i32 : BaseSIMDModifiedImmVectorShiftTied<1, op, w_cmode, V128,
6213 asm, ".4s",
6214 [(set (v4i32 V128:$dst), (OpNode V128:$Rd,
6215 imm0_255:$imm8,
6216 (i32 imm:$shift)))]>;
6217}
6218
6219class SIMDModifiedImmMoveMSL<bit Q, bit op, bits<4> cmode,
6220 RegisterOperand vectype, string asm,
6221 string kind, list<dag> pattern>
6222 : BaseSIMDModifiedImmVector<Q, op, vectype, imm0_255,
6223 (ins move_vec_shift:$shift),
6224 "$shift", asm, kind, pattern> {
6225 bits<1> shift;
6226 let Inst{15-13} = cmode{3-1};
6227 let Inst{12} = shift;
6228}
6229
6230class SIMDModifiedImmVectorNoShift<bit Q, bit op, bits<4> cmode,
6231 RegisterOperand vectype,
6232 Operand imm_type, string asm,
6233 string kind, list<dag> pattern>
6234 : BaseSIMDModifiedImmVector<Q, op, vectype, imm_type, (ins), "",
6235 asm, kind, pattern> {
6236 let Inst{15-12} = cmode;
6237}
6238
6239class SIMDModifiedImmScalarNoShift<bit Q, bit op, bits<4> cmode, string asm,
6240 list<dag> pattern>
6241 : BaseSIMDModifiedImm<Q, op, (outs FPR64:$Rd), (ins simdimmtype10:$imm8), asm,
6242 "\t$Rd, $imm8", "", pattern> {
6243 let Inst{15-12} = cmode;
6244 let DecoderMethod = "DecodeModImmInstruction";
6245}
6246
6247//----------------------------------------------------------------------------
6248// AdvSIMD indexed element
6249//----------------------------------------------------------------------------
6250
6251let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
6252class BaseSIMDIndexed<bit Q, bit U, bit Scalar, bits<2> size, bits<4> opc,
6253 RegisterOperand dst_reg, RegisterOperand lhs_reg,
6254 RegisterOperand rhs_reg, Operand vec_idx, string asm,
6255 string apple_kind, string dst_kind, string lhs_kind,
6256 string rhs_kind, list<dag> pattern>
6257 : I<(outs dst_reg:$Rd), (ins lhs_reg:$Rn, rhs_reg:$Rm, vec_idx:$idx),
6258 asm,
6259 "{\t$Rd" # dst_kind # ", $Rn" # lhs_kind # ", $Rm" # rhs_kind # "$idx" #
6260 "|" # apple_kind # "\t$Rd, $Rn, $Rm$idx}", "", pattern>,
6261 Sched<[WriteV]> {
6262 bits<5> Rd;
6263 bits<5> Rn;
6264 bits<5> Rm;
6265
6266 let Inst{31} = 0;
6267 let Inst{30} = Q;
6268 let Inst{29} = U;
6269 let Inst{28} = Scalar;
6270 let Inst{27-24} = 0b1111;
6271 let Inst{23-22} = size;
6272 // Bit 21 must be set by the derived class.
6273 let Inst{20-16} = Rm;
6274 let Inst{15-12} = opc;
6275 // Bit 11 must be set by the derived class.
6276 let Inst{10} = 0;
6277 let Inst{9-5} = Rn;
6278 let Inst{4-0} = Rd;
6279}
6280
6281let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
6282class BaseSIMDIndexedTied<bit Q, bit U, bit Scalar, bits<2> size, bits<4> opc,
6283 RegisterOperand dst_reg, RegisterOperand lhs_reg,
6284 RegisterOperand rhs_reg, Operand vec_idx, string asm,
6285 string apple_kind, string dst_kind, string lhs_kind,
6286 string rhs_kind, list<dag> pattern>
6287 : I<(outs dst_reg:$dst),
6288 (ins dst_reg:$Rd, lhs_reg:$Rn, rhs_reg:$Rm, vec_idx:$idx), asm,
6289 "{\t$Rd" # dst_kind # ", $Rn" # lhs_kind # ", $Rm" # rhs_kind # "$idx" #
6290 "|" # apple_kind # "\t$Rd, $Rn, $Rm$idx}", "$Rd = $dst", pattern>,
6291 Sched<[WriteV]> {
6292 bits<5> Rd;
6293 bits<5> Rn;
6294 bits<5> Rm;
6295
6296 let Inst{31} = 0;
6297 let Inst{30} = Q;
6298 let Inst{29} = U;
6299 let Inst{28} = Scalar;
6300 let Inst{27-24} = 0b1111;
6301 let Inst{23-22} = size;
6302 // Bit 21 must be set by the derived class.
6303 let Inst{20-16} = Rm;
6304 let Inst{15-12} = opc;
6305 // Bit 11 must be set by the derived class.
6306 let Inst{10} = 0;
6307 let Inst{9-5} = Rn;
6308 let Inst{4-0} = Rd;
6309}
6310
6311multiclass SIMDFPIndexedSD<bit U, bits<4> opc, string asm,
6312 SDPatternOperator OpNode> {
6313 def v2i32_indexed : BaseSIMDIndexed<0, U, 0, 0b10, opc,
6314 V64, V64,
6315 V128, VectorIndexS,
6316 asm, ".2s", ".2s", ".2s", ".s",
6317 [(set (v2f32 V64:$Rd),
6318 (OpNode (v2f32 V64:$Rn),
6319 (v2f32 (AArch64duplane32 (v4f32 V128:$Rm), VectorIndexS:$idx))))]> {
6320 bits<2> idx;
6321 let Inst{11} = idx{1};
6322 let Inst{21} = idx{0};
6323 }
6324
6325 def v4i32_indexed : BaseSIMDIndexed<1, U, 0, 0b10, opc,
6326 V128, V128,
6327 V128, VectorIndexS,
6328 asm, ".4s", ".4s", ".4s", ".s",
6329 [(set (v4f32 V128:$Rd),
6330 (OpNode (v4f32 V128:$Rn),
6331 (v4f32 (AArch64duplane32 (v4f32 V128:$Rm), VectorIndexS:$idx))))]> {
6332 bits<2> idx;
6333 let Inst{11} = idx{1};
6334 let Inst{21} = idx{0};
6335 }
6336
6337 def v2i64_indexed : BaseSIMDIndexed<1, U, 0, 0b11, opc,
6338 V128, V128,
6339 V128, VectorIndexD,
6340 asm, ".2d", ".2d", ".2d", ".d",
6341 [(set (v2f64 V128:$Rd),
6342 (OpNode (v2f64 V128:$Rn),
6343 (v2f64 (AArch64duplane64 (v2f64 V128:$Rm), VectorIndexD:$idx))))]> {
6344 bits<1> idx;
6345 let Inst{11} = idx{0};
6346 let Inst{21} = 0;
6347 }
6348
6349 def v1i32_indexed : BaseSIMDIndexed<1, U, 1, 0b10, opc,
6350 FPR32Op, FPR32Op, V128, VectorIndexS,
6351 asm, ".s", "", "", ".s",
6352 [(set (f32 FPR32Op:$Rd),
6353 (OpNode (f32 FPR32Op:$Rn),
6354 (f32 (vector_extract (v4f32 V128:$Rm),
6355 VectorIndexS:$idx))))]> {
6356 bits<2> idx;
6357 let Inst{11} = idx{1};
6358 let Inst{21} = idx{0};
6359 }
6360
6361 def v1i64_indexed : BaseSIMDIndexed<1, U, 1, 0b11, opc,
6362 FPR64Op, FPR64Op, V128, VectorIndexD,
6363 asm, ".d", "", "", ".d",
6364 [(set (f64 FPR64Op:$Rd),
6365 (OpNode (f64 FPR64Op:$Rn),
6366 (f64 (vector_extract (v2f64 V128:$Rm),
6367 VectorIndexD:$idx))))]> {
6368 bits<1> idx;
6369 let Inst{11} = idx{0};
6370 let Inst{21} = 0;
6371 }
6372}
6373
6374multiclass SIMDFPIndexedSDTiedPatterns<string INST, SDPatternOperator OpNode> {
6375 // 2 variants for the .2s version: DUPLANE from 128-bit and DUP scalar.
6376 def : Pat<(v2f32 (OpNode (v2f32 V64:$Rd), (v2f32 V64:$Rn),
6377 (AArch64duplane32 (v4f32 V128:$Rm),
6378 VectorIndexS:$idx))),
6379 (!cast<Instruction>(INST # v2i32_indexed)
6380 V64:$Rd, V64:$Rn, V128:$Rm, VectorIndexS:$idx)>;
6381 def : Pat<(v2f32 (OpNode (v2f32 V64:$Rd), (v2f32 V64:$Rn),
6382 (AArch64dup (f32 FPR32Op:$Rm)))),
6383 (!cast<Instruction>(INST # "v2i32_indexed") V64:$Rd, V64:$Rn,
6384 (SUBREG_TO_REG (i32 0), FPR32Op:$Rm, ssub), (i64 0))>;
6385
6386
6387 // 2 variants for the .4s version: DUPLANE from 128-bit and DUP scalar.
6388 def : Pat<(v4f32 (OpNode (v4f32 V128:$Rd), (v4f32 V128:$Rn),
6389 (AArch64duplane32 (v4f32 V128:$Rm),
6390 VectorIndexS:$idx))),
6391 (!cast<Instruction>(INST # "v4i32_indexed")
6392 V128:$Rd, V128:$Rn, V128:$Rm, VectorIndexS:$idx)>;
6393 def : Pat<(v4f32 (OpNode (v4f32 V128:$Rd), (v4f32 V128:$Rn),
6394 (AArch64dup (f32 FPR32Op:$Rm)))),
6395 (!cast<Instruction>(INST # "v4i32_indexed") V128:$Rd, V128:$Rn,
6396 (SUBREG_TO_REG (i32 0), FPR32Op:$Rm, ssub), (i64 0))>;
6397
6398 // 2 variants for the .2d version: DUPLANE from 128-bit and DUP scalar.
6399 def : Pat<(v2f64 (OpNode (v2f64 V128:$Rd), (v2f64 V128:$Rn),
6400 (AArch64duplane64 (v2f64 V128:$Rm),
6401 VectorIndexD:$idx))),
6402 (!cast<Instruction>(INST # "v2i64_indexed")
6403 V128:$Rd, V128:$Rn, V128:$Rm, VectorIndexS:$idx)>;
6404 def : Pat<(v2f64 (OpNode (v2f64 V128:$Rd), (v2f64 V128:$Rn),
6405 (AArch64dup (f64 FPR64Op:$Rm)))),
6406 (!cast<Instruction>(INST # "v2i64_indexed") V128:$Rd, V128:$Rn,
6407 (SUBREG_TO_REG (i32 0), FPR64Op:$Rm, dsub), (i64 0))>;
6408
6409 // 2 variants for 32-bit scalar version: extract from .2s or from .4s
6410 def : Pat<(f32 (OpNode (f32 FPR32:$Rd), (f32 FPR32:$Rn),
6411 (vector_extract (v4f32 V128:$Rm), VectorIndexS:$idx))),
6412 (!cast<Instruction>(INST # "v1i32_indexed") FPR32:$Rd, FPR32:$Rn,
6413 V128:$Rm, VectorIndexS:$idx)>;
6414 def : Pat<(f32 (OpNode (f32 FPR32:$Rd), (f32 FPR32:$Rn),
6415 (vector_extract (v2f32 V64:$Rm), VectorIndexS:$idx))),
6416 (!cast<Instruction>(INST # "v1i32_indexed") FPR32:$Rd, FPR32:$Rn,
6417 (SUBREG_TO_REG (i32 0), V64:$Rm, dsub), VectorIndexS:$idx)>;
6418
6419 // 1 variant for 64-bit scalar version: extract from .1d or from .2d
6420 def : Pat<(f64 (OpNode (f64 FPR64:$Rd), (f64 FPR64:$Rn),
6421 (vector_extract (v2f64 V128:$Rm), VectorIndexD:$idx))),
6422 (!cast<Instruction>(INST # "v1i64_indexed") FPR64:$Rd, FPR64:$Rn,
6423 V128:$Rm, VectorIndexD:$idx)>;
6424}
6425
6426multiclass SIMDFPIndexedSDTied<bit U, bits<4> opc, string asm> {
6427 def v2i32_indexed : BaseSIMDIndexedTied<0, U, 0, 0b10, opc, V64, V64,
6428 V128, VectorIndexS,
6429 asm, ".2s", ".2s", ".2s", ".s", []> {
6430 bits<2> idx;
6431 let Inst{11} = idx{1};
6432 let Inst{21} = idx{0};
6433 }
6434
6435 def v4i32_indexed : BaseSIMDIndexedTied<1, U, 0, 0b10, opc,
6436 V128, V128,
6437 V128, VectorIndexS,
6438 asm, ".4s", ".4s", ".4s", ".s", []> {
6439 bits<2> idx;
6440 let Inst{11} = idx{1};
6441 let Inst{21} = idx{0};
6442 }
6443
6444 def v2i64_indexed : BaseSIMDIndexedTied<1, U, 0, 0b11, opc,
6445 V128, V128,
6446 V128, VectorIndexD,
6447 asm, ".2d", ".2d", ".2d", ".d", []> {
6448 bits<1> idx;
6449 let Inst{11} = idx{0};
6450 let Inst{21} = 0;
6451 }
6452
6453
6454 def v1i32_indexed : BaseSIMDIndexedTied<1, U, 1, 0b10, opc,
6455 FPR32Op, FPR32Op, V128, VectorIndexS,
6456 asm, ".s", "", "", ".s", []> {
6457 bits<2> idx;
6458 let Inst{11} = idx{1};
6459 let Inst{21} = idx{0};
6460 }
6461
6462 def v1i64_indexed : BaseSIMDIndexedTied<1, U, 1, 0b11, opc,
6463 FPR64Op, FPR64Op, V128, VectorIndexD,
6464 asm, ".d", "", "", ".d", []> {
6465 bits<1> idx;
6466 let Inst{11} = idx{0};
6467 let Inst{21} = 0;
6468 }
6469}
6470
6471multiclass SIMDIndexedHS<bit U, bits<4> opc, string asm,
6472 SDPatternOperator OpNode> {
6473 def v4i16_indexed : BaseSIMDIndexed<0, U, 0, 0b01, opc, V64, V64,
6474 V128_lo, VectorIndexH,
6475 asm, ".4h", ".4h", ".4h", ".h",
6476 [(set (v4i16 V64:$Rd),
6477 (OpNode (v4i16 V64:$Rn),
6478 (v4i16 (AArch64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6479 bits<3> idx;
6480 let Inst{11} = idx{2};
6481 let Inst{21} = idx{1};
6482 let Inst{20} = idx{0};
6483 }
6484
6485 def v8i16_indexed : BaseSIMDIndexed<1, U, 0, 0b01, opc,
6486 V128, V128,
6487 V128_lo, VectorIndexH,
6488 asm, ".8h", ".8h", ".8h", ".h",
6489 [(set (v8i16 V128:$Rd),
6490 (OpNode (v8i16 V128:$Rn),
6491 (v8i16 (AArch64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6492 bits<3> idx;
6493 let Inst{11} = idx{2};
6494 let Inst{21} = idx{1};
6495 let Inst{20} = idx{0};
6496 }
6497
6498 def v2i32_indexed : BaseSIMDIndexed<0, U, 0, 0b10, opc,
6499 V64, V64,
6500 V128, VectorIndexS,
6501 asm, ".2s", ".2s", ".2s", ".s",
6502 [(set (v2i32 V64:$Rd),
6503 (OpNode (v2i32 V64:$Rn),
6504 (v2i32 (AArch64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6505 bits<2> idx;
6506 let Inst{11} = idx{1};
6507 let Inst{21} = idx{0};
6508 }
6509
6510 def v4i32_indexed : BaseSIMDIndexed<1, U, 0, 0b10, opc,
6511 V128, V128,
6512 V128, VectorIndexS,
6513 asm, ".4s", ".4s", ".4s", ".s",
6514 [(set (v4i32 V128:$Rd),
6515 (OpNode (v4i32 V128:$Rn),
6516 (v4i32 (AArch64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6517 bits<2> idx;
6518 let Inst{11} = idx{1};
6519 let Inst{21} = idx{0};
6520 }
6521
6522 def v1i16_indexed : BaseSIMDIndexed<1, U, 1, 0b01, opc,
6523 FPR16Op, FPR16Op, V128_lo, VectorIndexH,
6524 asm, ".h", "", "", ".h", []> {
6525 bits<3> idx;
6526 let Inst{11} = idx{2};
6527 let Inst{21} = idx{1};
6528 let Inst{20} = idx{0};
6529 }
6530
6531 def v1i32_indexed : BaseSIMDIndexed<1, U, 1, 0b10, opc,
6532 FPR32Op, FPR32Op, V128, VectorIndexS,
6533 asm, ".s", "", "", ".s",
6534 [(set (i32 FPR32Op:$Rd),
6535 (OpNode FPR32Op:$Rn,
6536 (i32 (vector_extract (v4i32 V128:$Rm),
6537 VectorIndexS:$idx))))]> {
6538 bits<2> idx;
6539 let Inst{11} = idx{1};
6540 let Inst{21} = idx{0};
6541 }
6542}
6543
6544multiclass SIMDVectorIndexedHS<bit U, bits<4> opc, string asm,
6545 SDPatternOperator OpNode> {
6546 def v4i16_indexed : BaseSIMDIndexed<0, U, 0, 0b01, opc,
6547 V64, V64,
6548 V128_lo, VectorIndexH,
6549 asm, ".4h", ".4h", ".4h", ".h",
6550 [(set (v4i16 V64:$Rd),
6551 (OpNode (v4i16 V64:$Rn),
6552 (v4i16 (AArch64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6553 bits<3> idx;
6554 let Inst{11} = idx{2};
6555 let Inst{21} = idx{1};
6556 let Inst{20} = idx{0};
6557 }
6558
6559 def v8i16_indexed : BaseSIMDIndexed<1, U, 0, 0b01, opc,
6560 V128, V128,
6561 V128_lo, VectorIndexH,
6562 asm, ".8h", ".8h", ".8h", ".h",
6563 [(set (v8i16 V128:$Rd),
6564 (OpNode (v8i16 V128:$Rn),
6565 (v8i16 (AArch64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6566 bits<3> idx;
6567 let Inst{11} = idx{2};
6568 let Inst{21} = idx{1};
6569 let Inst{20} = idx{0};
6570 }
6571
6572 def v2i32_indexed : BaseSIMDIndexed<0, U, 0, 0b10, opc,
6573 V64, V64,
6574 V128, VectorIndexS,
6575 asm, ".2s", ".2s", ".2s", ".s",
6576 [(set (v2i32 V64:$Rd),
6577 (OpNode (v2i32 V64:$Rn),
6578 (v2i32 (AArch64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6579 bits<2> idx;
6580 let Inst{11} = idx{1};
6581 let Inst{21} = idx{0};
6582 }
6583
6584 def v4i32_indexed : BaseSIMDIndexed<1, U, 0, 0b10, opc,
6585 V128, V128,
6586 V128, VectorIndexS,
6587 asm, ".4s", ".4s", ".4s", ".s",
6588 [(set (v4i32 V128:$Rd),
6589 (OpNode (v4i32 V128:$Rn),
6590 (v4i32 (AArch64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6591 bits<2> idx;
6592 let Inst{11} = idx{1};
6593 let Inst{21} = idx{0};
6594 }
6595}
6596
6597multiclass SIMDVectorIndexedHSTied<bit U, bits<4> opc, string asm,
6598 SDPatternOperator OpNode> {
6599 def v4i16_indexed : BaseSIMDIndexedTied<0, U, 0, 0b01, opc, V64, V64,
6600 V128_lo, VectorIndexH,
6601 asm, ".4h", ".4h", ".4h", ".h",
6602 [(set (v4i16 V64:$dst),
6603 (OpNode (v4i16 V64:$Rd),(v4i16 V64:$Rn),
6604 (v4i16 (AArch64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6605 bits<3> idx;
6606 let Inst{11} = idx{2};
6607 let Inst{21} = idx{1};
6608 let Inst{20} = idx{0};
6609 }
6610
6611 def v8i16_indexed : BaseSIMDIndexedTied<1, U, 0, 0b01, opc,
6612 V128, V128,
6613 V128_lo, VectorIndexH,
6614 asm, ".8h", ".8h", ".8h", ".h",
6615 [(set (v8i16 V128:$dst),
6616 (OpNode (v8i16 V128:$Rd), (v8i16 V128:$Rn),
6617 (v8i16 (AArch64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6618 bits<3> idx;
6619 let Inst{11} = idx{2};
6620 let Inst{21} = idx{1};
6621 let Inst{20} = idx{0};
6622 }
6623
6624 def v2i32_indexed : BaseSIMDIndexedTied<0, U, 0, 0b10, opc,
6625 V64, V64,
6626 V128, VectorIndexS,
6627 asm, ".2s", ".2s", ".2s", ".s",
6628 [(set (v2i32 V64:$dst),
6629 (OpNode (v2i32 V64:$Rd), (v2i32 V64:$Rn),
6630 (v2i32 (AArch64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6631 bits<2> idx;
6632 let Inst{11} = idx{1};
6633 let Inst{21} = idx{0};
6634 }
6635
6636 def v4i32_indexed : BaseSIMDIndexedTied<1, U, 0, 0b10, opc,
6637 V128, V128,
6638 V128, VectorIndexS,
6639 asm, ".4s", ".4s", ".4s", ".s",
6640 [(set (v4i32 V128:$dst),
6641 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn),
6642 (v4i32 (AArch64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6643 bits<2> idx;
6644 let Inst{11} = idx{1};
6645 let Inst{21} = idx{0};
6646 }
6647}
6648
6649multiclass SIMDIndexedLongSD<bit U, bits<4> opc, string asm,
6650 SDPatternOperator OpNode> {
6651 def v4i16_indexed : BaseSIMDIndexed<0, U, 0, 0b01, opc,
6652 V128, V64,
6653 V128_lo, VectorIndexH,
6654 asm, ".4s", ".4s", ".4h", ".h",
6655 [(set (v4i32 V128:$Rd),
6656 (OpNode (v4i16 V64:$Rn),
6657 (v4i16 (AArch64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6658 bits<3> idx;
6659 let Inst{11} = idx{2};
6660 let Inst{21} = idx{1};
6661 let Inst{20} = idx{0};
6662 }
6663
6664 def v8i16_indexed : BaseSIMDIndexed<1, U, 0, 0b01, opc,
6665 V128, V128,
6666 V128_lo, VectorIndexH,
6667 asm#"2", ".4s", ".4s", ".8h", ".h",
6668 [(set (v4i32 V128:$Rd),
6669 (OpNode (extract_high_v8i16 V128:$Rn),
6670 (extract_high_v8i16 (AArch64duplane16 (v8i16 V128_lo:$Rm),
6671 VectorIndexH:$idx))))]> {
6672
6673 bits<3> idx;
6674 let Inst{11} = idx{2};
6675 let Inst{21} = idx{1};
6676 let Inst{20} = idx{0};
6677 }
6678
6679 def v2i32_indexed : BaseSIMDIndexed<0, U, 0, 0b10, opc,
6680 V128, V64,
6681 V128, VectorIndexS,
6682 asm, ".2d", ".2d", ".2s", ".s",
6683 [(set (v2i64 V128:$Rd),
6684 (OpNode (v2i32 V64:$Rn),
6685 (v2i32 (AArch64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6686 bits<2> idx;
6687 let Inst{11} = idx{1};
6688 let Inst{21} = idx{0};
6689 }
6690
6691 def v4i32_indexed : BaseSIMDIndexed<1, U, 0, 0b10, opc,
6692 V128, V128,
6693 V128, VectorIndexS,
6694 asm#"2", ".2d", ".2d", ".4s", ".s",
6695 [(set (v2i64 V128:$Rd),
6696 (OpNode (extract_high_v4i32 V128:$Rn),
6697 (extract_high_v4i32 (AArch64duplane32 (v4i32 V128:$Rm),
6698 VectorIndexS:$idx))))]> {
6699 bits<2> idx;
6700 let Inst{11} = idx{1};
6701 let Inst{21} = idx{0};
6702 }
6703
6704 def v1i32_indexed : BaseSIMDIndexed<1, U, 1, 0b01, opc,
6705 FPR32Op, FPR16Op, V128_lo, VectorIndexH,
6706 asm, ".h", "", "", ".h", []> {
6707 bits<3> idx;
6708 let Inst{11} = idx{2};
6709 let Inst{21} = idx{1};
6710 let Inst{20} = idx{0};
6711 }
6712
6713 def v1i64_indexed : BaseSIMDIndexed<1, U, 1, 0b10, opc,
6714 FPR64Op, FPR32Op, V128, VectorIndexS,
6715 asm, ".s", "", "", ".s", []> {
6716 bits<2> idx;
6717 let Inst{11} = idx{1};
6718 let Inst{21} = idx{0};
6719 }
6720}
6721
6722multiclass SIMDIndexedLongSQDMLXSDTied<bit U, bits<4> opc, string asm,
6723 SDPatternOperator Accum> {
6724 def v4i16_indexed : BaseSIMDIndexedTied<0, U, 0, 0b01, opc,
6725 V128, V64,
6726 V128_lo, VectorIndexH,
6727 asm, ".4s", ".4s", ".4h", ".h",
6728 [(set (v4i32 V128:$dst),
6729 (Accum (v4i32 V128:$Rd),
6730 (v4i32 (int_aarch64_neon_sqdmull
6731 (v4i16 V64:$Rn),
6732 (v4i16 (AArch64duplane16 (v8i16 V128_lo:$Rm),
6733 VectorIndexH:$idx))))))]> {
6734 bits<3> idx;
6735 let Inst{11} = idx{2};
6736 let Inst{21} = idx{1};
6737 let Inst{20} = idx{0};
6738 }
6739
6740 // FIXME: it would be nice to use the scalar (v1i32) instruction here, but an
6741 // intermediate EXTRACT_SUBREG would be untyped.
6742 def : Pat<(i32 (Accum (i32 FPR32Op:$Rd),
6743 (i32 (vector_extract (v4i32
6744 (int_aarch64_neon_sqdmull (v4i16 V64:$Rn),
6745 (v4i16 (AArch64duplane16 (v8i16 V128_lo:$Rm),
6746 VectorIndexH:$idx)))),
6747 (i64 0))))),
6748 (EXTRACT_SUBREG
6749 (!cast<Instruction>(NAME # v4i16_indexed)
6750 (SUBREG_TO_REG (i32 0), FPR32Op:$Rd, ssub), V64:$Rn,
6751 V128_lo:$Rm, VectorIndexH:$idx),
6752 ssub)>;
6753
6754 def v8i16_indexed : BaseSIMDIndexedTied<1, U, 0, 0b01, opc,
6755 V128, V128,
6756 V128_lo, VectorIndexH,
6757 asm#"2", ".4s", ".4s", ".8h", ".h",
6758 [(set (v4i32 V128:$dst),
6759 (Accum (v4i32 V128:$Rd),
6760 (v4i32 (int_aarch64_neon_sqdmull
6761 (extract_high_v8i16 V128:$Rn),
6762 (extract_high_v8i16
6763 (AArch64duplane16 (v8i16 V128_lo:$Rm),
6764 VectorIndexH:$idx))))))]> {
6765 bits<3> idx;
6766 let Inst{11} = idx{2};
6767 let Inst{21} = idx{1};
6768 let Inst{20} = idx{0};
6769 }
6770
6771 def v2i32_indexed : BaseSIMDIndexedTied<0, U, 0, 0b10, opc,
6772 V128, V64,
6773 V128, VectorIndexS,
6774 asm, ".2d", ".2d", ".2s", ".s",
6775 [(set (v2i64 V128:$dst),
6776 (Accum (v2i64 V128:$Rd),
6777 (v2i64 (int_aarch64_neon_sqdmull
6778 (v2i32 V64:$Rn),
6779 (v2i32 (AArch64duplane32 (v4i32 V128:$Rm),
6780 VectorIndexS:$idx))))))]> {
6781 bits<2> idx;
6782 let Inst{11} = idx{1};
6783 let Inst{21} = idx{0};
6784 }
6785
6786 def v4i32_indexed : BaseSIMDIndexedTied<1, U, 0, 0b10, opc,
6787 V128, V128,
6788 V128, VectorIndexS,
6789 asm#"2", ".2d", ".2d", ".4s", ".s",
6790 [(set (v2i64 V128:$dst),
6791 (Accum (v2i64 V128:$Rd),
6792 (v2i64 (int_aarch64_neon_sqdmull
6793 (extract_high_v4i32 V128:$Rn),
6794 (extract_high_v4i32
6795 (AArch64duplane32 (v4i32 V128:$Rm),
6796 VectorIndexS:$idx))))))]> {
6797 bits<2> idx;
6798 let Inst{11} = idx{1};
6799 let Inst{21} = idx{0};
6800 }
6801
6802 def v1i32_indexed : BaseSIMDIndexedTied<1, U, 1, 0b01, opc,
6803 FPR32Op, FPR16Op, V128_lo, VectorIndexH,
6804 asm, ".h", "", "", ".h", []> {
6805 bits<3> idx;
6806 let Inst{11} = idx{2};
6807 let Inst{21} = idx{1};
6808 let Inst{20} = idx{0};
6809 }
6810
6811
6812 def v1i64_indexed : BaseSIMDIndexedTied<1, U, 1, 0b10, opc,
6813 FPR64Op, FPR32Op, V128, VectorIndexS,
6814 asm, ".s", "", "", ".s",
6815 [(set (i64 FPR64Op:$dst),
6816 (Accum (i64 FPR64Op:$Rd),
6817 (i64 (int_aarch64_neon_sqdmulls_scalar
6818 (i32 FPR32Op:$Rn),
6819 (i32 (vector_extract (v4i32 V128:$Rm),
6820 VectorIndexS:$idx))))))]> {
6821
6822 bits<2> idx;
6823 let Inst{11} = idx{1};
6824 let Inst{21} = idx{0};
6825 }
6826}
6827
6828multiclass SIMDVectorIndexedLongSD<bit U, bits<4> opc, string asm,
6829 SDPatternOperator OpNode> {
6830 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
6831 def v4i16_indexed : BaseSIMDIndexed<0, U, 0, 0b01, opc,
6832 V128, V64,
6833 V128_lo, VectorIndexH,
6834 asm, ".4s", ".4s", ".4h", ".h",
6835 [(set (v4i32 V128:$Rd),
6836 (OpNode (v4i16 V64:$Rn),
6837 (v4i16 (AArch64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6838 bits<3> idx;
6839 let Inst{11} = idx{2};
6840 let Inst{21} = idx{1};
6841 let Inst{20} = idx{0};
6842 }
6843
6844 def v8i16_indexed : BaseSIMDIndexed<1, U, 0, 0b01, opc,
6845 V128, V128,
6846 V128_lo, VectorIndexH,
6847 asm#"2", ".4s", ".4s", ".8h", ".h",
6848 [(set (v4i32 V128:$Rd),
6849 (OpNode (extract_high_v8i16 V128:$Rn),
6850 (extract_high_v8i16 (AArch64duplane16 (v8i16 V128_lo:$Rm),
6851 VectorIndexH:$idx))))]> {
6852
6853 bits<3> idx;
6854 let Inst{11} = idx{2};
6855 let Inst{21} = idx{1};
6856 let Inst{20} = idx{0};
6857 }
6858
6859 def v2i32_indexed : BaseSIMDIndexed<0, U, 0, 0b10, opc,
6860 V128, V64,
6861 V128, VectorIndexS,
6862 asm, ".2d", ".2d", ".2s", ".s",
6863 [(set (v2i64 V128:$Rd),
6864 (OpNode (v2i32 V64:$Rn),
6865 (v2i32 (AArch64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6866 bits<2> idx;
6867 let Inst{11} = idx{1};
6868 let Inst{21} = idx{0};
6869 }
6870
6871 def v4i32_indexed : BaseSIMDIndexed<1, U, 0, 0b10, opc,
6872 V128, V128,
6873 V128, VectorIndexS,
6874 asm#"2", ".2d", ".2d", ".4s", ".s",
6875 [(set (v2i64 V128:$Rd),
6876 (OpNode (extract_high_v4i32 V128:$Rn),
6877 (extract_high_v4i32 (AArch64duplane32 (v4i32 V128:$Rm),
6878 VectorIndexS:$idx))))]> {
6879 bits<2> idx;
6880 let Inst{11} = idx{1};
6881 let Inst{21} = idx{0};
6882 }
6883 }
6884}
6885
6886multiclass SIMDVectorIndexedLongSDTied<bit U, bits<4> opc, string asm,
6887 SDPatternOperator OpNode> {
6888 let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in {
6889 def v4i16_indexed : BaseSIMDIndexedTied<0, U, 0, 0b01, opc,
6890 V128, V64,
6891 V128_lo, VectorIndexH,
6892 asm, ".4s", ".4s", ".4h", ".h",
6893 [(set (v4i32 V128:$dst),
6894 (OpNode (v4i32 V128:$Rd), (v4i16 V64:$Rn),
6895 (v4i16 (AArch64duplane16 (v8i16 V128_lo:$Rm), VectorIndexH:$idx))))]> {
6896 bits<3> idx;
6897 let Inst{11} = idx{2};
6898 let Inst{21} = idx{1};
6899 let Inst{20} = idx{0};
6900 }
6901
6902 def v8i16_indexed : BaseSIMDIndexedTied<1, U, 0, 0b01, opc,
6903 V128, V128,
6904 V128_lo, VectorIndexH,
6905 asm#"2", ".4s", ".4s", ".8h", ".h",
6906 [(set (v4i32 V128:$dst),
6907 (OpNode (v4i32 V128:$Rd),
6908 (extract_high_v8i16 V128:$Rn),
6909 (extract_high_v8i16 (AArch64duplane16 (v8i16 V128_lo:$Rm),
6910 VectorIndexH:$idx))))]> {
6911 bits<3> idx;
6912 let Inst{11} = idx{2};
6913 let Inst{21} = idx{1};
6914 let Inst{20} = idx{0};
6915 }
6916
6917 def v2i32_indexed : BaseSIMDIndexedTied<0, U, 0, 0b10, opc,
6918 V128, V64,
6919 V128, VectorIndexS,
6920 asm, ".2d", ".2d", ".2s", ".s",
6921 [(set (v2i64 V128:$dst),
6922 (OpNode (v2i64 V128:$Rd), (v2i32 V64:$Rn),
6923 (v2i32 (AArch64duplane32 (v4i32 V128:$Rm), VectorIndexS:$idx))))]> {
6924 bits<2> idx;
6925 let Inst{11} = idx{1};
6926 let Inst{21} = idx{0};
6927 }
6928
6929 def v4i32_indexed : BaseSIMDIndexedTied<1, U, 0, 0b10, opc,
6930 V128, V128,
6931 V128, VectorIndexS,
6932 asm#"2", ".2d", ".2d", ".4s", ".s",
6933 [(set (v2i64 V128:$dst),
6934 (OpNode (v2i64 V128:$Rd),
6935 (extract_high_v4i32 V128:$Rn),
6936 (extract_high_v4i32 (AArch64duplane32 (v4i32 V128:$Rm),
6937 VectorIndexS:$idx))))]> {
6938 bits<2> idx;
6939 let Inst{11} = idx{1};
6940 let Inst{21} = idx{0};
6941 }
6942 }
6943}
6944
6945//----------------------------------------------------------------------------
6946// AdvSIMD scalar shift by immediate
6947//----------------------------------------------------------------------------
6948
6949let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
6950class BaseSIMDScalarShift<bit U, bits<5> opc, bits<7> fixed_imm,
6951 RegisterClass regtype1, RegisterClass regtype2,
6952 Operand immtype, string asm, list<dag> pattern>
6953 : I<(outs regtype1:$Rd), (ins regtype2:$Rn, immtype:$imm),
6954 asm, "\t$Rd, $Rn, $imm", "", pattern>,
6955 Sched<[WriteV]> {
6956 bits<5> Rd;
6957 bits<5> Rn;
6958 bits<7> imm;
6959 let Inst{31-30} = 0b01;
6960 let Inst{29} = U;
6961 let Inst{28-23} = 0b111110;
6962 let Inst{22-16} = fixed_imm;
6963 let Inst{15-11} = opc;
6964 let Inst{10} = 1;
6965 let Inst{9-5} = Rn;
6966 let Inst{4-0} = Rd;
6967}
6968
6969let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
6970class BaseSIMDScalarShiftTied<bit U, bits<5> opc, bits<7> fixed_imm,
6971 RegisterClass regtype1, RegisterClass regtype2,
6972 Operand immtype, string asm, list<dag> pattern>
6973 : I<(outs regtype1:$dst), (ins regtype1:$Rd, regtype2:$Rn, immtype:$imm),
6974 asm, "\t$Rd, $Rn, $imm", "$Rd = $dst", pattern>,
6975 Sched<[WriteV]> {
6976 bits<5> Rd;
6977 bits<5> Rn;
6978 bits<7> imm;
6979 let Inst{31-30} = 0b01;
6980 let Inst{29} = U;
6981 let Inst{28-23} = 0b111110;
6982 let Inst{22-16} = fixed_imm;
6983 let Inst{15-11} = opc;
6984 let Inst{10} = 1;
6985 let Inst{9-5} = Rn;
6986 let Inst{4-0} = Rd;
6987}
6988
6989
6990multiclass SIMDScalarRShiftSD<bit U, bits<5> opc, string asm> {
6991 def s : BaseSIMDScalarShift<U, opc, {0,1,?,?,?,?,?},
6992 FPR32, FPR32, vecshiftR32, asm, []> {
6993 let Inst{20-16} = imm{4-0};
6994 }
6995
6996 def d : BaseSIMDScalarShift<U, opc, {1,?,?,?,?,?,?},
6997 FPR64, FPR64, vecshiftR64, asm, []> {
6998 let Inst{21-16} = imm{5-0};
6999 }
7000}
7001
7002multiclass SIMDScalarRShiftD<bit U, bits<5> opc, string asm,
7003 SDPatternOperator OpNode> {
7004 def d : BaseSIMDScalarShift<U, opc, {1,?,?,?,?,?,?},
7005 FPR64, FPR64, vecshiftR64, asm,
7006 [(set (i64 FPR64:$Rd),
7007 (OpNode (i64 FPR64:$Rn), (i32 vecshiftR64:$imm)))]> {
7008 let Inst{21-16} = imm{5-0};
7009 }
7010
7011 def : Pat<(v1i64 (OpNode (v1i64 FPR64:$Rn), (i32 vecshiftR64:$imm))),
7012 (!cast<Instruction>(NAME # "d") FPR64:$Rn, vecshiftR64:$imm)>;
7013}
7014
7015multiclass SIMDScalarRShiftDTied<bit U, bits<5> opc, string asm,
7016 SDPatternOperator OpNode = null_frag> {
7017 def d : BaseSIMDScalarShiftTied<U, opc, {1,?,?,?,?,?,?},
7018 FPR64, FPR64, vecshiftR64, asm,
7019 [(set (i64 FPR64:$dst), (OpNode (i64 FPR64:$Rd), (i64 FPR64:$Rn),
7020 (i32 vecshiftR64:$imm)))]> {
7021 let Inst{21-16} = imm{5-0};
7022 }
7023
7024 def : Pat<(v1i64 (OpNode (v1i64 FPR64:$Rd), (v1i64 FPR64:$Rn),
7025 (i32 vecshiftR64:$imm))),
7026 (!cast<Instruction>(NAME # "d") FPR64:$Rd, FPR64:$Rn,
7027 vecshiftR64:$imm)>;
7028}
7029
7030multiclass SIMDScalarLShiftD<bit U, bits<5> opc, string asm,
7031 SDPatternOperator OpNode> {
7032 def d : BaseSIMDScalarShift<U, opc, {1,?,?,?,?,?,?},
7033 FPR64, FPR64, vecshiftL64, asm,
7034 [(set (v1i64 FPR64:$Rd),
7035 (OpNode (v1i64 FPR64:$Rn), (i32 vecshiftL64:$imm)))]> {
7036 let Inst{21-16} = imm{5-0};
7037 }
7038}
7039
7040let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
7041multiclass SIMDScalarLShiftDTied<bit U, bits<5> opc, string asm> {
7042 def d : BaseSIMDScalarShiftTied<U, opc, {1,?,?,?,?,?,?},
7043 FPR64, FPR64, vecshiftL64, asm, []> {
7044 let Inst{21-16} = imm{5-0};
7045 }
7046}
7047
7048let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
7049multiclass SIMDScalarRShiftBHS<bit U, bits<5> opc, string asm,
7050 SDPatternOperator OpNode = null_frag> {
7051 def b : BaseSIMDScalarShift<U, opc, {0,0,0,1,?,?,?},
7052 FPR8, FPR16, vecshiftR8, asm, []> {
7053 let Inst{18-16} = imm{2-0};
7054 }
7055
7056 def h : BaseSIMDScalarShift<U, opc, {0,0,1,?,?,?,?},
7057 FPR16, FPR32, vecshiftR16, asm, []> {
7058 let Inst{19-16} = imm{3-0};
7059 }
7060
7061 def s : BaseSIMDScalarShift<U, opc, {0,1,?,?,?,?,?},
7062 FPR32, FPR64, vecshiftR32, asm,
7063 [(set (i32 FPR32:$Rd), (OpNode (i64 FPR64:$Rn), vecshiftR32:$imm))]> {
7064 let Inst{20-16} = imm{4-0};
7065 }
7066}
7067
7068multiclass SIMDScalarLShiftBHSD<bit U, bits<5> opc, string asm,
7069 SDPatternOperator OpNode> {
7070 def b : BaseSIMDScalarShift<U, opc, {0,0,0,1,?,?,?},
7071 FPR8, FPR8, vecshiftL8, asm, []> {
7072 let Inst{18-16} = imm{2-0};
7073 }
7074
7075 def h : BaseSIMDScalarShift<U, opc, {0,0,1,?,?,?,?},
7076 FPR16, FPR16, vecshiftL16, asm, []> {
7077 let Inst{19-16} = imm{3-0};
7078 }
7079
7080 def s : BaseSIMDScalarShift<U, opc, {0,1,?,?,?,?,?},
7081 FPR32, FPR32, vecshiftL32, asm,
7082 [(set (i32 FPR32:$Rd), (OpNode (i32 FPR32:$Rn), (i32 vecshiftL32:$imm)))]> {
7083 let Inst{20-16} = imm{4-0};
7084 }
7085
7086 def d : BaseSIMDScalarShift<U, opc, {1,?,?,?,?,?,?},
7087 FPR64, FPR64, vecshiftL64, asm,
7088 [(set (i64 FPR64:$Rd), (OpNode (i64 FPR64:$Rn), (i32 vecshiftL64:$imm)))]> {
7089 let Inst{21-16} = imm{5-0};
7090 }
7091
7092 def : Pat<(v1i64 (OpNode (v1i64 FPR64:$Rn), (i32 vecshiftL64:$imm))),
7093 (!cast<Instruction>(NAME # "d") FPR64:$Rn, vecshiftL64:$imm)>;
7094}
7095
7096multiclass SIMDScalarRShiftBHSD<bit U, bits<5> opc, string asm> {
7097 def b : BaseSIMDScalarShift<U, opc, {0,0,0,1,?,?,?},
7098 FPR8, FPR8, vecshiftR8, asm, []> {
7099 let Inst{18-16} = imm{2-0};
7100 }
7101
7102 def h : BaseSIMDScalarShift<U, opc, {0,0,1,?,?,?,?},
7103 FPR16, FPR16, vecshiftR16, asm, []> {
7104 let Inst{19-16} = imm{3-0};
7105 }
7106
7107 def s : BaseSIMDScalarShift<U, opc, {0,1,?,?,?,?,?},
7108 FPR32, FPR32, vecshiftR32, asm, []> {
7109 let Inst{20-16} = imm{4-0};
7110 }
7111
7112 def d : BaseSIMDScalarShift<U, opc, {1,?,?,?,?,?,?},
7113 FPR64, FPR64, vecshiftR64, asm, []> {
7114 let Inst{21-16} = imm{5-0};
7115 }
7116}
7117
7118//----------------------------------------------------------------------------
7119// AdvSIMD vector x indexed element
7120//----------------------------------------------------------------------------
7121
7122let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
7123class BaseSIMDVectorShift<bit Q, bit U, bits<5> opc, bits<7> fixed_imm,
7124 RegisterOperand dst_reg, RegisterOperand src_reg,
7125 Operand immtype,
7126 string asm, string dst_kind, string src_kind,
7127 list<dag> pattern>
7128 : I<(outs dst_reg:$Rd), (ins src_reg:$Rn, immtype:$imm),
7129 asm, "{\t$Rd" # dst_kind # ", $Rn" # src_kind # ", $imm" #
7130 "|" # dst_kind # "\t$Rd, $Rn, $imm}", "", pattern>,
7131 Sched<[WriteV]> {
7132 bits<5> Rd;
7133 bits<5> Rn;
7134 let Inst{31} = 0;
7135 let Inst{30} = Q;
7136 let Inst{29} = U;
7137 let Inst{28-23} = 0b011110;
7138 let Inst{22-16} = fixed_imm;
7139 let Inst{15-11} = opc;
7140 let Inst{10} = 1;
7141 let Inst{9-5} = Rn;
7142 let Inst{4-0} = Rd;
7143}
7144
7145let mayStore = 0, mayLoad = 0, hasSideEffects = 0 in
7146class BaseSIMDVectorShiftTied<bit Q, bit U, bits<5> opc, bits<7> fixed_imm,
7147 RegisterOperand vectype1, RegisterOperand vectype2,
7148 Operand immtype,
7149 string asm, string dst_kind, string src_kind,
7150 list<dag> pattern>
7151 : I<(outs vectype1:$dst), (ins vectype1:$Rd, vectype2:$Rn, immtype:$imm),
7152 asm, "{\t$Rd" # dst_kind # ", $Rn" # src_kind # ", $imm" #
7153 "|" # dst_kind # "\t$Rd, $Rn, $imm}", "$Rd = $dst", pattern>,
7154 Sched<[WriteV]> {
7155 bits<5> Rd;
7156 bits<5> Rn;
7157 let Inst{31} = 0;
7158 let Inst{30} = Q;
7159 let Inst{29} = U;
7160 let Inst{28-23} = 0b011110;
7161 let Inst{22-16} = fixed_imm;
7162 let Inst{15-11} = opc;
7163 let Inst{10} = 1;
7164 let Inst{9-5} = Rn;
7165 let Inst{4-0} = Rd;
7166}
7167
7168multiclass SIMDVectorRShiftSD<bit U, bits<5> opc, string asm,
7169 Intrinsic OpNode> {
7170 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
7171 V64, V64, vecshiftR32,
7172 asm, ".2s", ".2s",
7173 [(set (v2i32 V64:$Rd), (OpNode (v2f32 V64:$Rn), (i32 imm:$imm)))]> {
7174 bits<5> imm;
7175 let Inst{20-16} = imm;
7176 }
7177
7178 def v4i32_shift : BaseSIMDVectorShift<1, U, opc, {0,1,?,?,?,?,?},
7179 V128, V128, vecshiftR32,
7180 asm, ".4s", ".4s",
7181 [(set (v4i32 V128:$Rd), (OpNode (v4f32 V128:$Rn), (i32 imm:$imm)))]> {
7182 bits<5> imm;
7183 let Inst{20-16} = imm;
7184 }
7185
7186 def v2i64_shift : BaseSIMDVectorShift<1, U, opc, {1,?,?,?,?,?,?},
7187 V128, V128, vecshiftR64,
7188 asm, ".2d", ".2d",
7189 [(set (v2i64 V128:$Rd), (OpNode (v2f64 V128:$Rn), (i32 imm:$imm)))]> {
7190 bits<6> imm;
7191 let Inst{21-16} = imm;
7192 }
7193}
7194
7195multiclass SIMDVectorRShiftSDToFP<bit U, bits<5> opc, string asm,
7196 Intrinsic OpNode> {
7197 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
7198 V64, V64, vecshiftR32,
7199 asm, ".2s", ".2s",
7200 [(set (v2f32 V64:$Rd), (OpNode (v2i32 V64:$Rn), (i32 imm:$imm)))]> {
7201 bits<5> imm;
7202 let Inst{20-16} = imm;
7203 }
7204
7205 def v4i32_shift : BaseSIMDVectorShift<1, U, opc, {0,1,?,?,?,?,?},
7206 V128, V128, vecshiftR32,
7207 asm, ".4s", ".4s",
7208 [(set (v4f32 V128:$Rd), (OpNode (v4i32 V128:$Rn), (i32 imm:$imm)))]> {
7209 bits<5> imm;
7210 let Inst{20-16} = imm;
7211 }
7212
7213 def v2i64_shift : BaseSIMDVectorShift<1, U, opc, {1,?,?,?,?,?,?},
7214 V128, V128, vecshiftR64,
7215 asm, ".2d", ".2d",
7216 [(set (v2f64 V128:$Rd), (OpNode (v2i64 V128:$Rn), (i32 imm:$imm)))]> {
7217 bits<6> imm;
7218 let Inst{21-16} = imm;
7219 }
7220}
7221
7222multiclass SIMDVectorRShiftNarrowBHS<bit U, bits<5> opc, string asm,
7223 SDPatternOperator OpNode> {
7224 def v8i8_shift : BaseSIMDVectorShift<0, U, opc, {0,0,0,1,?,?,?},
7225 V64, V128, vecshiftR16Narrow,
7226 asm, ".8b", ".8h",
7227 [(set (v8i8 V64:$Rd), (OpNode (v8i16 V128:$Rn), vecshiftR16Narrow:$imm))]> {
7228 bits<3> imm;
7229 let Inst{18-16} = imm;
7230 }
7231
7232 def v16i8_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,0,1,?,?,?},
7233 V128, V128, vecshiftR16Narrow,
7234 asm#"2", ".16b", ".8h", []> {
7235 bits<3> imm;
7236 let Inst{18-16} = imm;
7237 let hasSideEffects = 0;
7238 }
7239
7240 def v4i16_shift : BaseSIMDVectorShift<0, U, opc, {0,0,1,?,?,?,?},
7241 V64, V128, vecshiftR32Narrow,
7242 asm, ".4h", ".4s",
7243 [(set (v4i16 V64:$Rd), (OpNode (v4i32 V128:$Rn), vecshiftR32Narrow:$imm))]> {
7244 bits<4> imm;
7245 let Inst{19-16} = imm;
7246 }
7247
7248 def v8i16_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,1,?,?,?,?},
7249 V128, V128, vecshiftR32Narrow,
7250 asm#"2", ".8h", ".4s", []> {
7251 bits<4> imm;
7252 let Inst{19-16} = imm;
7253 let hasSideEffects = 0;
7254 }
7255
7256 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
7257 V64, V128, vecshiftR64Narrow,
7258 asm, ".2s", ".2d",
7259 [(set (v2i32 V64:$Rd), (OpNode (v2i64 V128:$Rn), vecshiftR64Narrow:$imm))]> {
7260 bits<5> imm;
7261 let Inst{20-16} = imm;
7262 }
7263
7264 def v4i32_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,1,?,?,?,?,?},
7265 V128, V128, vecshiftR64Narrow,
7266 asm#"2", ".4s", ".2d", []> {
7267 bits<5> imm;
7268 let Inst{20-16} = imm;
7269 let hasSideEffects = 0;
7270 }
7271
7272 // TableGen doesn't like patters w/ INSERT_SUBREG on the instructions
7273 // themselves, so put them here instead.
7274
7275 // Patterns involving what's effectively an insert high and a normal
7276 // intrinsic, represented by CONCAT_VECTORS.
7277 def : Pat<(concat_vectors (v8i8 V64:$Rd),(OpNode (v8i16 V128:$Rn),
7278 vecshiftR16Narrow:$imm)),
7279 (!cast<Instruction>(NAME # "v16i8_shift")
7280 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
7281 V128:$Rn, vecshiftR16Narrow:$imm)>;
7282 def : Pat<(concat_vectors (v4i16 V64:$Rd), (OpNode (v4i32 V128:$Rn),
7283 vecshiftR32Narrow:$imm)),
7284 (!cast<Instruction>(NAME # "v8i16_shift")
7285 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
7286 V128:$Rn, vecshiftR32Narrow:$imm)>;
7287 def : Pat<(concat_vectors (v2i32 V64:$Rd), (OpNode (v2i64 V128:$Rn),
7288 vecshiftR64Narrow:$imm)),
7289 (!cast<Instruction>(NAME # "v4i32_shift")
7290 (INSERT_SUBREG (IMPLICIT_DEF), V64:$Rd, dsub),
7291 V128:$Rn, vecshiftR64Narrow:$imm)>;
7292}
7293
7294multiclass SIMDVectorLShiftBHSD<bit U, bits<5> opc, string asm,
7295 SDPatternOperator OpNode> {
7296 def v8i8_shift : BaseSIMDVectorShift<0, U, opc, {0,0,0,1,?,?,?},
7297 V64, V64, vecshiftL8,
7298 asm, ".8b", ".8b",
7299 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn),
7300 (i32 vecshiftL8:$imm)))]> {
7301 bits<3> imm;
7302 let Inst{18-16} = imm;
7303 }
7304
7305 def v16i8_shift : BaseSIMDVectorShift<1, U, opc, {0,0,0,1,?,?,?},
7306 V128, V128, vecshiftL8,
7307 asm, ".16b", ".16b",
7308 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn),
7309 (i32 vecshiftL8:$imm)))]> {
7310 bits<3> imm;
7311 let Inst{18-16} = imm;
7312 }
7313
7314 def v4i16_shift : BaseSIMDVectorShift<0, U, opc, {0,0,1,?,?,?,?},
7315 V64, V64, vecshiftL16,
7316 asm, ".4h", ".4h",
7317 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn),
7318 (i32 vecshiftL16:$imm)))]> {
7319 bits<4> imm;
7320 let Inst{19-16} = imm;
7321 }
7322
7323 def v8i16_shift : BaseSIMDVectorShift<1, U, opc, {0,0,1,?,?,?,?},
7324 V128, V128, vecshiftL16,
7325 asm, ".8h", ".8h",
7326 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn),
7327 (i32 vecshiftL16:$imm)))]> {
7328 bits<4> imm;
7329 let Inst{19-16} = imm;
7330 }
7331
7332 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
7333 V64, V64, vecshiftL32,
7334 asm, ".2s", ".2s",
7335 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn),
7336 (i32 vecshiftL32:$imm)))]> {
7337 bits<5> imm;
7338 let Inst{20-16} = imm;
7339 }
7340
7341 def v4i32_shift : BaseSIMDVectorShift<1, U, opc, {0,1,?,?,?,?,?},
7342 V128, V128, vecshiftL32,
7343 asm, ".4s", ".4s",
7344 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn),
7345 (i32 vecshiftL32:$imm)))]> {
7346 bits<5> imm;
7347 let Inst{20-16} = imm;
7348 }
7349
7350 def v2i64_shift : BaseSIMDVectorShift<1, U, opc, {1,?,?,?,?,?,?},
7351 V128, V128, vecshiftL64,
7352 asm, ".2d", ".2d",
7353 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn),
7354 (i32 vecshiftL64:$imm)))]> {
7355 bits<6> imm;
7356 let Inst{21-16} = imm;
7357 }
7358}
7359
7360multiclass SIMDVectorRShiftBHSD<bit U, bits<5> opc, string asm,
7361 SDPatternOperator OpNode> {
7362 def v8i8_shift : BaseSIMDVectorShift<0, U, opc, {0,0,0,1,?,?,?},
7363 V64, V64, vecshiftR8,
7364 asm, ".8b", ".8b",
7365 [(set (v8i8 V64:$Rd), (OpNode (v8i8 V64:$Rn),
7366 (i32 vecshiftR8:$imm)))]> {
7367 bits<3> imm;
7368 let Inst{18-16} = imm;
7369 }
7370
7371 def v16i8_shift : BaseSIMDVectorShift<1, U, opc, {0,0,0,1,?,?,?},
7372 V128, V128, vecshiftR8,
7373 asm, ".16b", ".16b",
7374 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn),
7375 (i32 vecshiftR8:$imm)))]> {
7376 bits<3> imm;
7377 let Inst{18-16} = imm;
7378 }
7379
7380 def v4i16_shift : BaseSIMDVectorShift<0, U, opc, {0,0,1,?,?,?,?},
7381 V64, V64, vecshiftR16,
7382 asm, ".4h", ".4h",
7383 [(set (v4i16 V64:$Rd), (OpNode (v4i16 V64:$Rn),
7384 (i32 vecshiftR16:$imm)))]> {
7385 bits<4> imm;
7386 let Inst{19-16} = imm;
7387 }
7388
7389 def v8i16_shift : BaseSIMDVectorShift<1, U, opc, {0,0,1,?,?,?,?},
7390 V128, V128, vecshiftR16,
7391 asm, ".8h", ".8h",
7392 [(set (v8i16 V128:$Rd), (OpNode (v8i16 V128:$Rn),
7393 (i32 vecshiftR16:$imm)))]> {
7394 bits<4> imm;
7395 let Inst{19-16} = imm;
7396 }
7397
7398 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
7399 V64, V64, vecshiftR32,
7400 asm, ".2s", ".2s",
7401 [(set (v2i32 V64:$Rd), (OpNode (v2i32 V64:$Rn),
7402 (i32 vecshiftR32:$imm)))]> {
7403 bits<5> imm;
7404 let Inst{20-16} = imm;
7405 }
7406
7407 def v4i32_shift : BaseSIMDVectorShift<1, U, opc, {0,1,?,?,?,?,?},
7408 V128, V128, vecshiftR32,
7409 asm, ".4s", ".4s",
7410 [(set (v4i32 V128:$Rd), (OpNode (v4i32 V128:$Rn),
7411 (i32 vecshiftR32:$imm)))]> {
7412 bits<5> imm;
7413 let Inst{20-16} = imm;
7414 }
7415
7416 def v2i64_shift : BaseSIMDVectorShift<1, U, opc, {1,?,?,?,?,?,?},
7417 V128, V128, vecshiftR64,
7418 asm, ".2d", ".2d",
7419 [(set (v2i64 V128:$Rd), (OpNode (v2i64 V128:$Rn),
7420 (i32 vecshiftR64:$imm)))]> {
7421 bits<6> imm;
7422 let Inst{21-16} = imm;
7423 }
7424}
7425
7426let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
7427multiclass SIMDVectorRShiftBHSDTied<bit U, bits<5> opc, string asm,
7428 SDPatternOperator OpNode = null_frag> {
7429 def v8i8_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,0,0,1,?,?,?},
7430 V64, V64, vecshiftR8, asm, ".8b", ".8b",
7431 [(set (v8i8 V64:$dst),
7432 (OpNode (v8i8 V64:$Rd), (v8i8 V64:$Rn),
7433 (i32 vecshiftR8:$imm)))]> {
7434 bits<3> imm;
7435 let Inst{18-16} = imm;
7436 }
7437
7438 def v16i8_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,0,1,?,?,?},
7439 V128, V128, vecshiftR8, asm, ".16b", ".16b",
7440 [(set (v16i8 V128:$dst),
7441 (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn),
7442 (i32 vecshiftR8:$imm)))]> {
7443 bits<3> imm;
7444 let Inst{18-16} = imm;
7445 }
7446
7447 def v4i16_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,0,1,?,?,?,?},
7448 V64, V64, vecshiftR16, asm, ".4h", ".4h",
7449 [(set (v4i16 V64:$dst),
7450 (OpNode (v4i16 V64:$Rd), (v4i16 V64:$Rn),
7451 (i32 vecshiftR16:$imm)))]> {
7452 bits<4> imm;
7453 let Inst{19-16} = imm;
7454 }
7455
7456 def v8i16_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,1,?,?,?,?},
7457 V128, V128, vecshiftR16, asm, ".8h", ".8h",
7458 [(set (v8i16 V128:$dst),
7459 (OpNode (v8i16 V128:$Rd), (v8i16 V128:$Rn),
7460 (i32 vecshiftR16:$imm)))]> {
7461 bits<4> imm;
7462 let Inst{19-16} = imm;
7463 }
7464
7465 def v2i32_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,1,?,?,?,?,?},
7466 V64, V64, vecshiftR32, asm, ".2s", ".2s",
7467 [(set (v2i32 V64:$dst),
7468 (OpNode (v2i32 V64:$Rd), (v2i32 V64:$Rn),
7469 (i32 vecshiftR32:$imm)))]> {
7470 bits<5> imm;
7471 let Inst{20-16} = imm;
7472 }
7473
7474 def v4i32_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,1,?,?,?,?,?},
7475 V128, V128, vecshiftR32, asm, ".4s", ".4s",
7476 [(set (v4i32 V128:$dst),
7477 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn),
7478 (i32 vecshiftR32:$imm)))]> {
7479 bits<5> imm;
7480 let Inst{20-16} = imm;
7481 }
7482
7483 def v2i64_shift : BaseSIMDVectorShiftTied<1, U, opc, {1,?,?,?,?,?,?},
7484 V128, V128, vecshiftR64,
7485 asm, ".2d", ".2d", [(set (v2i64 V128:$dst),
7486 (OpNode (v2i64 V128:$Rd), (v2i64 V128:$Rn),
7487 (i32 vecshiftR64:$imm)))]> {
7488 bits<6> imm;
7489 let Inst{21-16} = imm;
7490 }
7491}
7492
7493multiclass SIMDVectorLShiftBHSDTied<bit U, bits<5> opc, string asm,
7494 SDPatternOperator OpNode = null_frag> {
7495 def v8i8_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,0,0,1,?,?,?},
7496 V64, V64, vecshiftL8,
7497 asm, ".8b", ".8b",
7498 [(set (v8i8 V64:$dst),
7499 (OpNode (v8i8 V64:$Rd), (v8i8 V64:$Rn),
7500 (i32 vecshiftL8:$imm)))]> {
7501 bits<3> imm;
7502 let Inst{18-16} = imm;
7503 }
7504
7505 def v16i8_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,0,1,?,?,?},
7506 V128, V128, vecshiftL8,
7507 asm, ".16b", ".16b",
7508 [(set (v16i8 V128:$dst),
7509 (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn),
7510 (i32 vecshiftL8:$imm)))]> {
7511 bits<3> imm;
7512 let Inst{18-16} = imm;
7513 }
7514
7515 def v4i16_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,0,1,?,?,?,?},
7516 V64, V64, vecshiftL16,
7517 asm, ".4h", ".4h",
7518 [(set (v4i16 V64:$dst),
7519 (OpNode (v4i16 V64:$Rd), (v4i16 V64:$Rn),
7520 (i32 vecshiftL16:$imm)))]> {
7521 bits<4> imm;
7522 let Inst{19-16} = imm;
7523 }
7524
7525 def v8i16_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,0,1,?,?,?,?},
7526 V128, V128, vecshiftL16,
7527 asm, ".8h", ".8h",
7528 [(set (v8i16 V128:$dst),
7529 (OpNode (v8i16 V128:$Rd), (v8i16 V128:$Rn),
7530 (i32 vecshiftL16:$imm)))]> {
7531 bits<4> imm;
7532 let Inst{19-16} = imm;
7533 }
7534
7535 def v2i32_shift : BaseSIMDVectorShiftTied<0, U, opc, {0,1,?,?,?,?,?},
7536 V64, V64, vecshiftL32,
7537 asm, ".2s", ".2s",
7538 [(set (v2i32 V64:$dst),
7539 (OpNode (v2i32 V64:$Rd), (v2i32 V64:$Rn),
7540 (i32 vecshiftL32:$imm)))]> {
7541 bits<5> imm;
7542 let Inst{20-16} = imm;
7543 }
7544
7545 def v4i32_shift : BaseSIMDVectorShiftTied<1, U, opc, {0,1,?,?,?,?,?},
7546 V128, V128, vecshiftL32,
7547 asm, ".4s", ".4s",
7548 [(set (v4i32 V128:$dst),
7549 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn),
7550 (i32 vecshiftL32:$imm)))]> {
7551 bits<5> imm;
7552 let Inst{20-16} = imm;
7553 }
7554
7555 def v2i64_shift : BaseSIMDVectorShiftTied<1, U, opc, {1,?,?,?,?,?,?},
7556 V128, V128, vecshiftL64,
7557 asm, ".2d", ".2d",
7558 [(set (v2i64 V128:$dst),
7559 (OpNode (v2i64 V128:$Rd), (v2i64 V128:$Rn),
7560 (i32 vecshiftL64:$imm)))]> {
7561 bits<6> imm;
7562 let Inst{21-16} = imm;
7563 }
7564}
7565
7566multiclass SIMDVectorLShiftLongBHSD<bit U, bits<5> opc, string asm,
7567 SDPatternOperator OpNode> {
7568 def v8i8_shift : BaseSIMDVectorShift<0, U, opc, {0,0,0,1,?,?,?},
7569 V128, V64, vecshiftL8, asm, ".8h", ".8b",
7570 [(set (v8i16 V128:$Rd), (OpNode (v8i8 V64:$Rn), vecshiftL8:$imm))]> {
7571 bits<3> imm;
7572 let Inst{18-16} = imm;
7573 }
7574
7575 def v16i8_shift : BaseSIMDVectorShift<1, U, opc, {0,0,0,1,?,?,?},
7576 V128, V128, vecshiftL8,
7577 asm#"2", ".8h", ".16b",
7578 [(set (v8i16 V128:$Rd),
7579 (OpNode (extract_high_v16i8 V128:$Rn), vecshiftL8:$imm))]> {
7580 bits<3> imm;
7581 let Inst{18-16} = imm;
7582 }
7583
7584 def v4i16_shift : BaseSIMDVectorShift<0, U, opc, {0,0,1,?,?,?,?},
7585 V128, V64, vecshiftL16, asm, ".4s", ".4h",
7586 [(set (v4i32 V128:$Rd), (OpNode (v4i16 V64:$Rn), vecshiftL16:$imm))]> {
7587 bits<4> imm;
7588 let Inst{19-16} = imm;
7589 }
7590
7591 def v8i16_shift : BaseSIMDVectorShift<1, U, opc, {0,0,1,?,?,?,?},
7592 V128, V128, vecshiftL16,
7593 asm#"2", ".4s", ".8h",
7594 [(set (v4i32 V128:$Rd),
7595 (OpNode (extract_high_v8i16 V128:$Rn), vecshiftL16:$imm))]> {
7596
7597 bits<4> imm;
7598 let Inst{19-16} = imm;
7599 }
7600
7601 def v2i32_shift : BaseSIMDVectorShift<0, U, opc, {0,1,?,?,?,?,?},
7602 V128, V64, vecshiftL32, asm, ".2d", ".2s",
7603 [(set (v2i64 V128:$Rd), (OpNode (v2i32 V64:$Rn), vecshiftL32:$imm))]> {
7604 bits<5> imm;
7605 let Inst{20-16} = imm;
7606 }
7607
7608 def v4i32_shift : BaseSIMDVectorShift<1, U, opc, {0,1,?,?,?,?,?},
7609 V128, V128, vecshiftL32,
7610 asm#"2", ".2d", ".4s",
7611 [(set (v2i64 V128:$Rd),
7612 (OpNode (extract_high_v4i32 V128:$Rn), vecshiftL32:$imm))]> {
7613 bits<5> imm;
7614 let Inst{20-16} = imm;
7615 }
7616}
7617
7618
7619//---
7620// Vector load/store
7621//---
7622// SIMD ldX/stX no-index memory references don't allow the optional
7623// ", #0" constant and handle post-indexing explicitly, so we use
7624// a more specialized parse method for them. Otherwise, it's the same as
7625// the general GPR64sp handling.
7626
7627class BaseSIMDLdSt<bit Q, bit L, bits<4> opcode, bits<2> size,
7628 string asm, dag oops, dag iops, list<dag> pattern>
7629 : I<oops, iops, asm, "\t$Vt, [$Rn]", "", pattern> {
7630 bits<5> Vt;
7631 bits<5> Rn;
7632 let Inst{31} = 0;
7633 let Inst{30} = Q;
7634 let Inst{29-23} = 0b0011000;
7635 let Inst{22} = L;
7636 let Inst{21-16} = 0b000000;
7637 let Inst{15-12} = opcode;
7638 let Inst{11-10} = size;
7639 let Inst{9-5} = Rn;
7640 let Inst{4-0} = Vt;
7641}
7642
7643class BaseSIMDLdStPost<bit Q, bit L, bits<4> opcode, bits<2> size,
7644 string asm, dag oops, dag iops>
7645 : I<oops, iops, asm, "\t$Vt, [$Rn], $Xm", "$Rn = $wback", []> {
7646 bits<5> Vt;
7647 bits<5> Rn;
7648 bits<5> Xm;
7649 let Inst{31} = 0;
7650 let Inst{30} = Q;
7651 let Inst{29-23} = 0b0011001;
7652 let Inst{22} = L;
7653 let Inst{21} = 0;
7654 let Inst{20-16} = Xm;
7655 let Inst{15-12} = opcode;
7656 let Inst{11-10} = size;
7657 let Inst{9-5} = Rn;
7658 let Inst{4-0} = Vt;
7659}
7660
7661// The immediate form of AdvSIMD post-indexed addressing is encoded with
7662// register post-index addressing from the zero register.
7663multiclass SIMDLdStAliases<string asm, string layout, string Count,
7664 int Offset, int Size> {
7665 // E.g. "ld1 { v0.8b, v1.8b }, [x1], #16"
7666 // "ld1\t$Vt, [$Rn], #16"
7667 // may get mapped to
7668 // (LD1Twov8b_POST VecListTwo8b:$Vt, GPR64sp:$Rn, XZR)
7669 def : InstAlias<asm # "\t$Vt, [$Rn], #" # Offset,
7670 (!cast<Instruction>(NAME # Count # "v" # layout # "_POST")
7671 GPR64sp:$Rn,
7672 !cast<RegisterOperand>("VecList" # Count # layout):$Vt,
7673 XZR), 1>;
7674
7675 // E.g. "ld1.8b { v0, v1 }, [x1], #16"
7676 // "ld1.8b\t$Vt, [$Rn], #16"
7677 // may get mapped to
7678 // (LD1Twov8b_POST VecListTwo64:$Vt, GPR64sp:$Rn, XZR)
7679 def : InstAlias<asm # "." # layout # "\t$Vt, [$Rn], #" # Offset,
7680 (!cast<Instruction>(NAME # Count # "v" # layout # "_POST")
7681 GPR64sp:$Rn,
7682 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
7683 XZR), 0>;
7684
7685 // E.g. "ld1.8b { v0, v1 }, [x1]"
7686 // "ld1\t$Vt, [$Rn]"
7687 // may get mapped to
7688 // (LD1Twov8b VecListTwo64:$Vt, GPR64sp:$Rn)
7689 def : InstAlias<asm # "." # layout # "\t$Vt, [$Rn]",
7690 (!cast<Instruction>(NAME # Count # "v" # layout)
7691 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
7692 GPR64sp:$Rn), 0>;
7693
7694 // E.g. "ld1.8b { v0, v1 }, [x1], x2"
7695 // "ld1\t$Vt, [$Rn], $Xm"
7696 // may get mapped to
7697 // (LD1Twov8b_POST VecListTwo64:$Vt, GPR64sp:$Rn, GPR64pi8:$Xm)
7698 def : InstAlias<asm # "." # layout # "\t$Vt, [$Rn], $Xm",
7699 (!cast<Instruction>(NAME # Count # "v" # layout # "_POST")
7700 GPR64sp:$Rn,
7701 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
7702 !cast<RegisterOperand>("GPR64pi" # Offset):$Xm), 0>;
7703}
7704
7705multiclass BaseSIMDLdN<string Count, string asm, string veclist, int Offset128,
7706 int Offset64, bits<4> opcode> {
7707 let hasSideEffects = 0, mayLoad = 1, mayStore = 0 in {
7708 def v16b: BaseSIMDLdSt<1, 1, opcode, 0b00, asm,
7709 (outs !cast<RegisterOperand>(veclist # "16b"):$Vt),
7710 (ins GPR64sp:$Rn), []>;
7711 def v8h : BaseSIMDLdSt<1, 1, opcode, 0b01, asm,
7712 (outs !cast<RegisterOperand>(veclist # "8h"):$Vt),
7713 (ins GPR64sp:$Rn), []>;
7714 def v4s : BaseSIMDLdSt<1, 1, opcode, 0b10, asm,
7715 (outs !cast<RegisterOperand>(veclist # "4s"):$Vt),
7716 (ins GPR64sp:$Rn), []>;
7717 def v2d : BaseSIMDLdSt<1, 1, opcode, 0b11, asm,
7718 (outs !cast<RegisterOperand>(veclist # "2d"):$Vt),
7719 (ins GPR64sp:$Rn), []>;
7720 def v8b : BaseSIMDLdSt<0, 1, opcode, 0b00, asm,
7721 (outs !cast<RegisterOperand>(veclist # "8b"):$Vt),
7722 (ins GPR64sp:$Rn), []>;
7723 def v4h : BaseSIMDLdSt<0, 1, opcode, 0b01, asm,
7724 (outs !cast<RegisterOperand>(veclist # "4h"):$Vt),
7725 (ins GPR64sp:$Rn), []>;
7726 def v2s : BaseSIMDLdSt<0, 1, opcode, 0b10, asm,
7727 (outs !cast<RegisterOperand>(veclist # "2s"):$Vt),
7728 (ins GPR64sp:$Rn), []>;
7729
7730
7731 def v16b_POST: BaseSIMDLdStPost<1, 1, opcode, 0b00, asm,
7732 (outs GPR64sp:$wback,
7733 !cast<RegisterOperand>(veclist # "16b"):$Vt),
7734 (ins GPR64sp:$Rn,
7735 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7736 def v8h_POST : BaseSIMDLdStPost<1, 1, opcode, 0b01, asm,
7737 (outs GPR64sp:$wback,
7738 !cast<RegisterOperand>(veclist # "8h"):$Vt),
7739 (ins GPR64sp:$Rn,
7740 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7741 def v4s_POST : BaseSIMDLdStPost<1, 1, opcode, 0b10, asm,
7742 (outs GPR64sp:$wback,
7743 !cast<RegisterOperand>(veclist # "4s"):$Vt),
7744 (ins GPR64sp:$Rn,
7745 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7746 def v2d_POST : BaseSIMDLdStPost<1, 1, opcode, 0b11, asm,
7747 (outs GPR64sp:$wback,
7748 !cast<RegisterOperand>(veclist # "2d"):$Vt),
7749 (ins GPR64sp:$Rn,
7750 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7751 def v8b_POST : BaseSIMDLdStPost<0, 1, opcode, 0b00, asm,
7752 (outs GPR64sp:$wback,
7753 !cast<RegisterOperand>(veclist # "8b"):$Vt),
7754 (ins GPR64sp:$Rn,
7755 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7756 def v4h_POST : BaseSIMDLdStPost<0, 1, opcode, 0b01, asm,
7757 (outs GPR64sp:$wback,
7758 !cast<RegisterOperand>(veclist # "4h"):$Vt),
7759 (ins GPR64sp:$Rn,
7760 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7761 def v2s_POST : BaseSIMDLdStPost<0, 1, opcode, 0b10, asm,
7762 (outs GPR64sp:$wback,
7763 !cast<RegisterOperand>(veclist # "2s"):$Vt),
7764 (ins GPR64sp:$Rn,
7765 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7766 }
7767
7768 defm : SIMDLdStAliases<asm, "16b", Count, Offset128, 128>;
7769 defm : SIMDLdStAliases<asm, "8h", Count, Offset128, 128>;
7770 defm : SIMDLdStAliases<asm, "4s", Count, Offset128, 128>;
7771 defm : SIMDLdStAliases<asm, "2d", Count, Offset128, 128>;
7772 defm : SIMDLdStAliases<asm, "8b", Count, Offset64, 64>;
7773 defm : SIMDLdStAliases<asm, "4h", Count, Offset64, 64>;
7774 defm : SIMDLdStAliases<asm, "2s", Count, Offset64, 64>;
7775}
7776
7777// Only ld1/st1 has a v1d version.
7778multiclass BaseSIMDStN<string Count, string asm, string veclist, int Offset128,
7779 int Offset64, bits<4> opcode> {
7780 let hasSideEffects = 0, mayStore = 1, mayLoad = 0 in {
7781 def v16b : BaseSIMDLdSt<1, 0, opcode, 0b00, asm, (outs),
7782 (ins !cast<RegisterOperand>(veclist # "16b"):$Vt,
7783 GPR64sp:$Rn), []>;
7784 def v8h : BaseSIMDLdSt<1, 0, opcode, 0b01, asm, (outs),
7785 (ins !cast<RegisterOperand>(veclist # "8h"):$Vt,
7786 GPR64sp:$Rn), []>;
7787 def v4s : BaseSIMDLdSt<1, 0, opcode, 0b10, asm, (outs),
7788 (ins !cast<RegisterOperand>(veclist # "4s"):$Vt,
7789 GPR64sp:$Rn), []>;
7790 def v2d : BaseSIMDLdSt<1, 0, opcode, 0b11, asm, (outs),
7791 (ins !cast<RegisterOperand>(veclist # "2d"):$Vt,
7792 GPR64sp:$Rn), []>;
7793 def v8b : BaseSIMDLdSt<0, 0, opcode, 0b00, asm, (outs),
7794 (ins !cast<RegisterOperand>(veclist # "8b"):$Vt,
7795 GPR64sp:$Rn), []>;
7796 def v4h : BaseSIMDLdSt<0, 0, opcode, 0b01, asm, (outs),
7797 (ins !cast<RegisterOperand>(veclist # "4h"):$Vt,
7798 GPR64sp:$Rn), []>;
7799 def v2s : BaseSIMDLdSt<0, 0, opcode, 0b10, asm, (outs),
7800 (ins !cast<RegisterOperand>(veclist # "2s"):$Vt,
7801 GPR64sp:$Rn), []>;
7802
7803 def v16b_POST : BaseSIMDLdStPost<1, 0, opcode, 0b00, asm,
7804 (outs GPR64sp:$wback),
7805 (ins !cast<RegisterOperand>(veclist # "16b"):$Vt,
7806 GPR64sp:$Rn,
7807 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7808 def v8h_POST : BaseSIMDLdStPost<1, 0, opcode, 0b01, asm,
7809 (outs GPR64sp:$wback),
7810 (ins !cast<RegisterOperand>(veclist # "8h"):$Vt,
7811 GPR64sp:$Rn,
7812 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7813 def v4s_POST : BaseSIMDLdStPost<1, 0, opcode, 0b10, asm,
7814 (outs GPR64sp:$wback),
7815 (ins !cast<RegisterOperand>(veclist # "4s"):$Vt,
7816 GPR64sp:$Rn,
7817 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7818 def v2d_POST : BaseSIMDLdStPost<1, 0, opcode, 0b11, asm,
7819 (outs GPR64sp:$wback),
7820 (ins !cast<RegisterOperand>(veclist # "2d"):$Vt,
7821 GPR64sp:$Rn,
7822 !cast<RegisterOperand>("GPR64pi" # Offset128):$Xm)>;
7823 def v8b_POST : BaseSIMDLdStPost<0, 0, opcode, 0b00, asm,
7824 (outs GPR64sp:$wback),
7825 (ins !cast<RegisterOperand>(veclist # "8b"):$Vt,
7826 GPR64sp:$Rn,
7827 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7828 def v4h_POST : BaseSIMDLdStPost<0, 0, opcode, 0b01, asm,
7829 (outs GPR64sp:$wback),
7830 (ins !cast<RegisterOperand>(veclist # "4h"):$Vt,
7831 GPR64sp:$Rn,
7832 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7833 def v2s_POST : BaseSIMDLdStPost<0, 0, opcode, 0b10, asm,
7834 (outs GPR64sp:$wback),
7835 (ins !cast<RegisterOperand>(veclist # "2s"):$Vt,
7836 GPR64sp:$Rn,
7837 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7838 }
7839
7840 defm : SIMDLdStAliases<asm, "16b", Count, Offset128, 128>;
7841 defm : SIMDLdStAliases<asm, "8h", Count, Offset128, 128>;
7842 defm : SIMDLdStAliases<asm, "4s", Count, Offset128, 128>;
7843 defm : SIMDLdStAliases<asm, "2d", Count, Offset128, 128>;
7844 defm : SIMDLdStAliases<asm, "8b", Count, Offset64, 64>;
7845 defm : SIMDLdStAliases<asm, "4h", Count, Offset64, 64>;
7846 defm : SIMDLdStAliases<asm, "2s", Count, Offset64, 64>;
7847}
7848
7849multiclass BaseSIMDLd1<string Count, string asm, string veclist,
7850 int Offset128, int Offset64, bits<4> opcode>
7851 : BaseSIMDLdN<Count, asm, veclist, Offset128, Offset64, opcode> {
7852
7853 // LD1 instructions have extra "1d" variants.
7854 let hasSideEffects = 0, mayLoad = 1, mayStore = 0 in {
7855 def v1d : BaseSIMDLdSt<0, 1, opcode, 0b11, asm,
7856 (outs !cast<RegisterOperand>(veclist # "1d"):$Vt),
7857 (ins GPR64sp:$Rn), []>;
7858
7859 def v1d_POST : BaseSIMDLdStPost<0, 1, opcode, 0b11, asm,
7860 (outs GPR64sp:$wback,
7861 !cast<RegisterOperand>(veclist # "1d"):$Vt),
7862 (ins GPR64sp:$Rn,
7863 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7864 }
7865
7866 defm : SIMDLdStAliases<asm, "1d", Count, Offset64, 64>;
7867}
7868
7869multiclass BaseSIMDSt1<string Count, string asm, string veclist,
7870 int Offset128, int Offset64, bits<4> opcode>
7871 : BaseSIMDStN<Count, asm, veclist, Offset128, Offset64, opcode> {
7872
7873 // ST1 instructions have extra "1d" variants.
7874 let hasSideEffects = 0, mayLoad = 0, mayStore = 1 in {
7875 def v1d : BaseSIMDLdSt<0, 0, opcode, 0b11, asm, (outs),
7876 (ins !cast<RegisterOperand>(veclist # "1d"):$Vt,
7877 GPR64sp:$Rn), []>;
7878
7879 def v1d_POST : BaseSIMDLdStPost<0, 0, opcode, 0b11, asm,
7880 (outs GPR64sp:$wback),
7881 (ins !cast<RegisterOperand>(veclist # "1d"):$Vt,
7882 GPR64sp:$Rn,
7883 !cast<RegisterOperand>("GPR64pi" # Offset64):$Xm)>;
7884 }
7885
7886 defm : SIMDLdStAliases<asm, "1d", Count, Offset64, 64>;
7887}
7888
7889multiclass SIMDLd1Multiple<string asm> {
7890 defm One : BaseSIMDLd1<"One", asm, "VecListOne", 16, 8, 0b0111>;
7891 defm Two : BaseSIMDLd1<"Two", asm, "VecListTwo", 32, 16, 0b1010>;
7892 defm Three : BaseSIMDLd1<"Three", asm, "VecListThree", 48, 24, 0b0110>;
7893 defm Four : BaseSIMDLd1<"Four", asm, "VecListFour", 64, 32, 0b0010>;
7894}
7895
7896multiclass SIMDSt1Multiple<string asm> {
7897 defm One : BaseSIMDSt1<"One", asm, "VecListOne", 16, 8, 0b0111>;
7898 defm Two : BaseSIMDSt1<"Two", asm, "VecListTwo", 32, 16, 0b1010>;
7899 defm Three : BaseSIMDSt1<"Three", asm, "VecListThree", 48, 24, 0b0110>;
7900 defm Four : BaseSIMDSt1<"Four", asm, "VecListFour", 64, 32, 0b0010>;
7901}
7902
7903multiclass SIMDLd2Multiple<string asm> {
7904 defm Two : BaseSIMDLdN<"Two", asm, "VecListTwo", 32, 16, 0b1000>;
7905}
7906
7907multiclass SIMDSt2Multiple<string asm> {
7908 defm Two : BaseSIMDStN<"Two", asm, "VecListTwo", 32, 16, 0b1000>;
7909}
7910
7911multiclass SIMDLd3Multiple<string asm> {
7912 defm Three : BaseSIMDLdN<"Three", asm, "VecListThree", 48, 24, 0b0100>;
7913}
7914
7915multiclass SIMDSt3Multiple<string asm> {
7916 defm Three : BaseSIMDStN<"Three", asm, "VecListThree", 48, 24, 0b0100>;
7917}
7918
7919multiclass SIMDLd4Multiple<string asm> {
7920 defm Four : BaseSIMDLdN<"Four", asm, "VecListFour", 64, 32, 0b0000>;
7921}
7922
7923multiclass SIMDSt4Multiple<string asm> {
7924 defm Four : BaseSIMDStN<"Four", asm, "VecListFour", 64, 32, 0b0000>;
7925}
7926
7927//---
7928// AdvSIMD Load/store single-element
7929//---
7930
7931class BaseSIMDLdStSingle<bit L, bit R, bits<3> opcode,
7932 string asm, string operands, string cst,
7933 dag oops, dag iops, list<dag> pattern>
7934 : I<oops, iops, asm, operands, cst, pattern> {
7935 bits<5> Vt;
7936 bits<5> Rn;
7937 let Inst{31} = 0;
7938 let Inst{29-24} = 0b001101;
7939 let Inst{22} = L;
7940 let Inst{21} = R;
7941 let Inst{15-13} = opcode;
7942 let Inst{9-5} = Rn;
7943 let Inst{4-0} = Vt;
7944}
7945
7946class BaseSIMDLdStSingleTied<bit L, bit R, bits<3> opcode,
7947 string asm, string operands, string cst,
7948 dag oops, dag iops, list<dag> pattern>
7949 : I<oops, iops, asm, operands, "$Vt = $dst," # cst, pattern> {
7950 bits<5> Vt;
7951 bits<5> Rn;
7952 let Inst{31} = 0;
7953 let Inst{29-24} = 0b001101;
7954 let Inst{22} = L;
7955 let Inst{21} = R;
7956 let Inst{15-13} = opcode;
7957 let Inst{9-5} = Rn;
7958 let Inst{4-0} = Vt;
7959}
7960
7961
7962let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
7963class BaseSIMDLdR<bit Q, bit R, bits<3> opcode, bit S, bits<2> size, string asm,
7964 Operand listtype>
7965 : BaseSIMDLdStSingle<1, R, opcode, asm, "\t$Vt, [$Rn]", "",
7966 (outs listtype:$Vt), (ins GPR64sp:$Rn),
7967 []> {
7968 let Inst{30} = Q;
7969 let Inst{23} = 0;
7970 let Inst{20-16} = 0b00000;
7971 let Inst{12} = S;
7972 let Inst{11-10} = size;
7973}
7974let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
7975class BaseSIMDLdRPost<bit Q, bit R, bits<3> opcode, bit S, bits<2> size,
7976 string asm, Operand listtype, Operand GPR64pi>
7977 : BaseSIMDLdStSingle<1, R, opcode, asm, "\t$Vt, [$Rn], $Xm",
7978 "$Rn = $wback",
7979 (outs GPR64sp:$wback, listtype:$Vt),
7980 (ins GPR64sp:$Rn, GPR64pi:$Xm), []> {
7981 bits<5> Xm;
7982 let Inst{30} = Q;
7983 let Inst{23} = 1;
7984 let Inst{20-16} = Xm;
7985 let Inst{12} = S;
7986 let Inst{11-10} = size;
7987}
7988
7989multiclass SIMDLdrAliases<string asm, string layout, string Count,
7990 int Offset, int Size> {
7991 // E.g. "ld1r { v0.8b }, [x1], #1"
7992 // "ld1r.8b\t$Vt, [$Rn], #1"
7993 // may get mapped to
7994 // (LD1Rv8b_POST VecListOne8b:$Vt, GPR64sp:$Rn, XZR)
7995 def : InstAlias<asm # "\t$Vt, [$Rn], #" # Offset,
7996 (!cast<Instruction>(NAME # "v" # layout # "_POST")
7997 GPR64sp:$Rn,
7998 !cast<RegisterOperand>("VecList" # Count # layout):$Vt,
7999 XZR), 1>;
8000
8001 // E.g. "ld1r.8b { v0 }, [x1], #1"
8002 // "ld1r.8b\t$Vt, [$Rn], #1"
8003 // may get mapped to
8004 // (LD1Rv8b_POST VecListOne64:$Vt, GPR64sp:$Rn, XZR)
8005 def : InstAlias<asm # "." # layout # "\t$Vt, [$Rn], #" # Offset,
8006 (!cast<Instruction>(NAME # "v" # layout # "_POST")
8007 GPR64sp:$Rn,
8008 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
8009 XZR), 0>;
8010
8011 // E.g. "ld1r.8b { v0 }, [x1]"
8012 // "ld1r.8b\t$Vt, [$Rn]"
8013 // may get mapped to
8014 // (LD1Rv8b VecListOne64:$Vt, GPR64sp:$Rn)
8015 def : InstAlias<asm # "." # layout # "\t$Vt, [$Rn]",
8016 (!cast<Instruction>(NAME # "v" # layout)
8017 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
8018 GPR64sp:$Rn), 0>;
8019
8020 // E.g. "ld1r.8b { v0 }, [x1], x2"
8021 // "ld1r.8b\t$Vt, [$Rn], $Xm"
8022 // may get mapped to
8023 // (LD1Rv8b_POST VecListOne64:$Vt, GPR64sp:$Rn, GPR64pi1:$Xm)
8024 def : InstAlias<asm # "." # layout # "\t$Vt, [$Rn], $Xm",
8025 (!cast<Instruction>(NAME # "v" # layout # "_POST")
8026 GPR64sp:$Rn,
8027 !cast<RegisterOperand>("VecList" # Count # Size):$Vt,
8028 !cast<RegisterOperand>("GPR64pi" # Offset):$Xm), 0>;
8029}
8030
8031multiclass SIMDLdR<bit R, bits<3> opcode, bit S, string asm, string Count,
8032 int Offset1, int Offset2, int Offset4, int Offset8> {
8033 def v8b : BaseSIMDLdR<0, R, opcode, S, 0b00, asm,
8034 !cast<Operand>("VecList" # Count # "8b")>;
8035 def v16b: BaseSIMDLdR<1, R, opcode, S, 0b00, asm,
8036 !cast<Operand>("VecList" # Count #"16b")>;
8037 def v4h : BaseSIMDLdR<0, R, opcode, S, 0b01, asm,
8038 !cast<Operand>("VecList" # Count #"4h")>;
8039 def v8h : BaseSIMDLdR<1, R, opcode, S, 0b01, asm,
8040 !cast<Operand>("VecList" # Count #"8h")>;
8041 def v2s : BaseSIMDLdR<0, R, opcode, S, 0b10, asm,
8042 !cast<Operand>("VecList" # Count #"2s")>;
8043 def v4s : BaseSIMDLdR<1, R, opcode, S, 0b10, asm,
8044 !cast<Operand>("VecList" # Count #"4s")>;
8045 def v1d : BaseSIMDLdR<0, R, opcode, S, 0b11, asm,
8046 !cast<Operand>("VecList" # Count #"1d")>;
8047 def v2d : BaseSIMDLdR<1, R, opcode, S, 0b11, asm,
8048 !cast<Operand>("VecList" # Count #"2d")>;
8049
8050 def v8b_POST : BaseSIMDLdRPost<0, R, opcode, S, 0b00, asm,
8051 !cast<Operand>("VecList" # Count # "8b"),
8052 !cast<Operand>("GPR64pi" # Offset1)>;
8053 def v16b_POST: BaseSIMDLdRPost<1, R, opcode, S, 0b00, asm,
8054 !cast<Operand>("VecList" # Count # "16b"),
8055 !cast<Operand>("GPR64pi" # Offset1)>;
8056 def v4h_POST : BaseSIMDLdRPost<0, R, opcode, S, 0b01, asm,
8057 !cast<Operand>("VecList" # Count # "4h"),
8058 !cast<Operand>("GPR64pi" # Offset2)>;
8059 def v8h_POST : BaseSIMDLdRPost<1, R, opcode, S, 0b01, asm,
8060 !cast<Operand>("VecList" # Count # "8h"),
8061 !cast<Operand>("GPR64pi" # Offset2)>;
8062 def v2s_POST : BaseSIMDLdRPost<0, R, opcode, S, 0b10, asm,
8063 !cast<Operand>("VecList" # Count # "2s"),
8064 !cast<Operand>("GPR64pi" # Offset4)>;
8065 def v4s_POST : BaseSIMDLdRPost<1, R, opcode, S, 0b10, asm,
8066 !cast<Operand>("VecList" # Count # "4s"),
8067 !cast<Operand>("GPR64pi" # Offset4)>;
8068 def v1d_POST : BaseSIMDLdRPost<0, R, opcode, S, 0b11, asm,
8069 !cast<Operand>("VecList" # Count # "1d"),
8070 !cast<Operand>("GPR64pi" # Offset8)>;
8071 def v2d_POST : BaseSIMDLdRPost<1, R, opcode, S, 0b11, asm,
8072 !cast<Operand>("VecList" # Count # "2d"),
8073 !cast<Operand>("GPR64pi" # Offset8)>;
8074
8075 defm : SIMDLdrAliases<asm, "8b", Count, Offset1, 64>;
8076 defm : SIMDLdrAliases<asm, "16b", Count, Offset1, 128>;
8077 defm : SIMDLdrAliases<asm, "4h", Count, Offset2, 64>;
8078 defm : SIMDLdrAliases<asm, "8h", Count, Offset2, 128>;
8079 defm : SIMDLdrAliases<asm, "2s", Count, Offset4, 64>;
8080 defm : SIMDLdrAliases<asm, "4s", Count, Offset4, 128>;
8081 defm : SIMDLdrAliases<asm, "1d", Count, Offset8, 64>;
8082 defm : SIMDLdrAliases<asm, "2d", Count, Offset8, 128>;
8083}
8084
8085class SIMDLdStSingleB<bit L, bit R, bits<3> opcode, string asm,
8086 dag oops, dag iops, list<dag> pattern>
8087 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, [$Rn]", "", oops, iops,
8088 pattern> {
8089 // idx encoded in Q:S:size fields.
8090 bits<4> idx;
8091 let Inst{30} = idx{3};
8092 let Inst{23} = 0;
8093 let Inst{20-16} = 0b00000;
8094 let Inst{12} = idx{2};
8095 let Inst{11-10} = idx{1-0};
8096}
8097class SIMDLdStSingleBTied<bit L, bit R, bits<3> opcode, string asm,
8098 dag oops, dag iops, list<dag> pattern>
8099 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, [$Rn]", "",
8100 oops, iops, pattern> {
8101 // idx encoded in Q:S:size fields.
8102 bits<4> idx;
8103 let Inst{30} = idx{3};
8104 let Inst{23} = 0;
8105 let Inst{20-16} = 0b00000;
8106 let Inst{12} = idx{2};
8107 let Inst{11-10} = idx{1-0};
8108}
8109class SIMDLdStSingleBPost<bit L, bit R, bits<3> opcode, string asm,
8110 dag oops, dag iops>
8111 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, [$Rn], $Xm",
8112 "$Rn = $wback", oops, iops, []> {
8113 // idx encoded in Q:S:size fields.
8114 bits<4> idx;
8115 bits<5> Xm;
8116 let Inst{30} = idx{3};
8117 let Inst{23} = 1;
8118 let Inst{20-16} = Xm;
8119 let Inst{12} = idx{2};
8120 let Inst{11-10} = idx{1-0};
8121}
8122class SIMDLdStSingleBTiedPost<bit L, bit R, bits<3> opcode, string asm,
8123 dag oops, dag iops>
8124 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, [$Rn], $Xm",
8125 "$Rn = $wback", oops, iops, []> {
8126 // idx encoded in Q:S:size fields.
8127 bits<4> idx;
8128 bits<5> Xm;
8129 let Inst{30} = idx{3};
8130 let Inst{23} = 1;
8131 let Inst{20-16} = Xm;
8132 let Inst{12} = idx{2};
8133 let Inst{11-10} = idx{1-0};
8134}
8135
8136class SIMDLdStSingleH<bit L, bit R, bits<3> opcode, bit size, string asm,
8137 dag oops, dag iops, list<dag> pattern>
8138 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, [$Rn]", "", oops, iops,
8139 pattern> {
8140 // idx encoded in Q:S:size<1> fields.
8141 bits<3> idx;
8142 let Inst{30} = idx{2};
8143 let Inst{23} = 0;
8144 let Inst{20-16} = 0b00000;
8145 let Inst{12} = idx{1};
8146 let Inst{11} = idx{0};
8147 let Inst{10} = size;
8148}
8149class SIMDLdStSingleHTied<bit L, bit R, bits<3> opcode, bit size, string asm,
8150 dag oops, dag iops, list<dag> pattern>
8151 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, [$Rn]", "",
8152 oops, iops, pattern> {
8153 // idx encoded in Q:S:size<1> fields.
8154 bits<3> idx;
8155 let Inst{30} = idx{2};
8156 let Inst{23} = 0;
8157 let Inst{20-16} = 0b00000;
8158 let Inst{12} = idx{1};
8159 let Inst{11} = idx{0};
8160 let Inst{10} = size;
8161}
8162
8163class SIMDLdStSingleHPost<bit L, bit R, bits<3> opcode, bit size, string asm,
8164 dag oops, dag iops>
8165 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, [$Rn], $Xm",
8166 "$Rn = $wback", oops, iops, []> {
8167 // idx encoded in Q:S:size<1> fields.
8168 bits<3> idx;
8169 bits<5> Xm;
8170 let Inst{30} = idx{2};
8171 let Inst{23} = 1;
8172 let Inst{20-16} = Xm;
8173 let Inst{12} = idx{1};
8174 let Inst{11} = idx{0};
8175 let Inst{10} = size;
8176}
8177class SIMDLdStSingleHTiedPost<bit L, bit R, bits<3> opcode, bit size, string asm,
8178 dag oops, dag iops>
8179 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, [$Rn], $Xm",
8180 "$Rn = $wback", oops, iops, []> {
8181 // idx encoded in Q:S:size<1> fields.
8182 bits<3> idx;
8183 bits<5> Xm;
8184 let Inst{30} = idx{2};
8185 let Inst{23} = 1;
8186 let Inst{20-16} = Xm;
8187 let Inst{12} = idx{1};
8188 let Inst{11} = idx{0};
8189 let Inst{10} = size;
8190}
8191class SIMDLdStSingleS<bit L, bit R, bits<3> opcode, bits<2> size, string asm,
8192 dag oops, dag iops, list<dag> pattern>
8193 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, [$Rn]", "", oops, iops,
8194 pattern> {
8195 // idx encoded in Q:S fields.
8196 bits<2> idx;
8197 let Inst{30} = idx{1};
8198 let Inst{23} = 0;
8199 let Inst{20-16} = 0b00000;
8200 let Inst{12} = idx{0};
8201 let Inst{11-10} = size;
8202}
8203class SIMDLdStSingleSTied<bit L, bit R, bits<3> opcode, bits<2> size, string asm,
8204 dag oops, dag iops, list<dag> pattern>
8205 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, [$Rn]", "",
8206 oops, iops, pattern> {
8207 // idx encoded in Q:S fields.
8208 bits<2> idx;
8209 let Inst{30} = idx{1};
8210 let Inst{23} = 0;
8211 let Inst{20-16} = 0b00000;
8212 let Inst{12} = idx{0};
8213 let Inst{11-10} = size;
8214}
8215class SIMDLdStSingleSPost<bit L, bit R, bits<3> opcode, bits<2> size,
8216 string asm, dag oops, dag iops>
8217 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, [$Rn], $Xm",
8218 "$Rn = $wback", oops, iops, []> {
8219 // idx encoded in Q:S fields.
8220 bits<2> idx;
8221 bits<5> Xm;
8222 let Inst{30} = idx{1};
8223 let Inst{23} = 1;
8224 let Inst{20-16} = Xm;
8225 let Inst{12} = idx{0};
8226 let Inst{11-10} = size;
8227}
8228class SIMDLdStSingleSTiedPost<bit L, bit R, bits<3> opcode, bits<2> size,
8229 string asm, dag oops, dag iops>
8230 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, [$Rn], $Xm",
8231 "$Rn = $wback", oops, iops, []> {
8232 // idx encoded in Q:S fields.
8233 bits<2> idx;
8234 bits<5> Xm;
8235 let Inst{30} = idx{1};
8236 let Inst{23} = 1;
8237 let Inst{20-16} = Xm;
8238 let Inst{12} = idx{0};
8239 let Inst{11-10} = size;
8240}
8241class SIMDLdStSingleD<bit L, bit R, bits<3> opcode, bits<2> size, string asm,
8242 dag oops, dag iops, list<dag> pattern>
8243 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, [$Rn]", "", oops, iops,
8244 pattern> {
8245 // idx encoded in Q field.
8246 bits<1> idx;
8247 let Inst{30} = idx;
8248 let Inst{23} = 0;
8249 let Inst{20-16} = 0b00000;
8250 let Inst{12} = 0;
8251 let Inst{11-10} = size;
8252}
8253class SIMDLdStSingleDTied<bit L, bit R, bits<3> opcode, bits<2> size, string asm,
8254 dag oops, dag iops, list<dag> pattern>
8255 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, [$Rn]", "",
8256 oops, iops, pattern> {
8257 // idx encoded in Q field.
8258 bits<1> idx;
8259 let Inst{30} = idx;
8260 let Inst{23} = 0;
8261 let Inst{20-16} = 0b00000;
8262 let Inst{12} = 0;
8263 let Inst{11-10} = size;
8264}
8265class SIMDLdStSingleDPost<bit L, bit R, bits<3> opcode, bits<2> size,
8266 string asm, dag oops, dag iops>
8267 : BaseSIMDLdStSingle<L, R, opcode, asm, "\t$Vt$idx, [$Rn], $Xm",
8268 "$Rn = $wback", oops, iops, []> {
8269 // idx encoded in Q field.
8270 bits<1> idx;
8271 bits<5> Xm;
8272 let Inst{30} = idx;
8273 let Inst{23} = 1;
8274 let Inst{20-16} = Xm;
8275 let Inst{12} = 0;
8276 let Inst{11-10} = size;
8277}
8278class SIMDLdStSingleDTiedPost<bit L, bit R, bits<3> opcode, bits<2> size,
8279 string asm, dag oops, dag iops>
8280 : BaseSIMDLdStSingleTied<L, R, opcode, asm, "\t$Vt$idx, [$Rn], $Xm",
8281 "$Rn = $wback", oops, iops, []> {
8282 // idx encoded in Q field.
8283 bits<1> idx;
8284 bits<5> Xm;
8285 let Inst{30} = idx;
8286 let Inst{23} = 1;
8287 let Inst{20-16} = Xm;
8288 let Inst{12} = 0;
8289 let Inst{11-10} = size;
8290}
8291
8292let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
8293multiclass SIMDLdSingleBTied<bit R, bits<3> opcode, string asm,
8294 RegisterOperand listtype,
8295 RegisterOperand GPR64pi> {
8296 def i8 : SIMDLdStSingleBTied<1, R, opcode, asm,
8297 (outs listtype:$dst),
8298 (ins listtype:$Vt, VectorIndexB:$idx,
8299 GPR64sp:$Rn), []>;
8300
8301 def i8_POST : SIMDLdStSingleBTiedPost<1, R, opcode, asm,
8302 (outs GPR64sp:$wback, listtype:$dst),
8303 (ins listtype:$Vt, VectorIndexB:$idx,
8304 GPR64sp:$Rn, GPR64pi:$Xm)>;
8305}
8306let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
8307multiclass SIMDLdSingleHTied<bit R, bits<3> opcode, bit size, string asm,
8308 RegisterOperand listtype,
8309 RegisterOperand GPR64pi> {
8310 def i16 : SIMDLdStSingleHTied<1, R, opcode, size, asm,
8311 (outs listtype:$dst),
8312 (ins listtype:$Vt, VectorIndexH:$idx,
8313 GPR64sp:$Rn), []>;
8314
8315 def i16_POST : SIMDLdStSingleHTiedPost<1, R, opcode, size, asm,
8316 (outs GPR64sp:$wback, listtype:$dst),
8317 (ins listtype:$Vt, VectorIndexH:$idx,
8318 GPR64sp:$Rn, GPR64pi:$Xm)>;
8319}
8320let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
8321multiclass SIMDLdSingleSTied<bit R, bits<3> opcode, bits<2> size,string asm,
8322 RegisterOperand listtype,
8323 RegisterOperand GPR64pi> {
8324 def i32 : SIMDLdStSingleSTied<1, R, opcode, size, asm,
8325 (outs listtype:$dst),
8326 (ins listtype:$Vt, VectorIndexS:$idx,
8327 GPR64sp:$Rn), []>;
8328
8329 def i32_POST : SIMDLdStSingleSTiedPost<1, R, opcode, size, asm,
8330 (outs GPR64sp:$wback, listtype:$dst),
8331 (ins listtype:$Vt, VectorIndexS:$idx,
8332 GPR64sp:$Rn, GPR64pi:$Xm)>;
8333}
8334let mayLoad = 1, mayStore = 0, hasSideEffects = 0 in
8335multiclass SIMDLdSingleDTied<bit R, bits<3> opcode, bits<2> size, string asm,
8336 RegisterOperand listtype, RegisterOperand GPR64pi> {
8337 def i64 : SIMDLdStSingleDTied<1, R, opcode, size, asm,
8338 (outs listtype:$dst),
8339 (ins listtype:$Vt, VectorIndexD:$idx,
8340 GPR64sp:$Rn), []>;
8341
8342 def i64_POST : SIMDLdStSingleDTiedPost<1, R, opcode, size, asm,
8343 (outs GPR64sp:$wback, listtype:$dst),
8344 (ins listtype:$Vt, VectorIndexD:$idx,
8345 GPR64sp:$Rn, GPR64pi:$Xm)>;
8346}
8347let mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
8348multiclass SIMDStSingleB<bit R, bits<3> opcode, string asm,
8349 RegisterOperand listtype, RegisterOperand GPR64pi> {
8350 def i8 : SIMDLdStSingleB<0, R, opcode, asm,
8351 (outs), (ins listtype:$Vt, VectorIndexB:$idx,
8352 GPR64sp:$Rn), []>;
8353
8354 def i8_POST : SIMDLdStSingleBPost<0, R, opcode, asm,
8355 (outs GPR64sp:$wback),
8356 (ins listtype:$Vt, VectorIndexB:$idx,
8357 GPR64sp:$Rn, GPR64pi:$Xm)>;
8358}
8359let mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
8360multiclass SIMDStSingleH<bit R, bits<3> opcode, bit size, string asm,
8361 RegisterOperand listtype, RegisterOperand GPR64pi> {
8362 def i16 : SIMDLdStSingleH<0, R, opcode, size, asm,
8363 (outs), (ins listtype:$Vt, VectorIndexH:$idx,
8364 GPR64sp:$Rn), []>;
8365
8366 def i16_POST : SIMDLdStSingleHPost<0, R, opcode, size, asm,
8367 (outs GPR64sp:$wback),
8368 (ins listtype:$Vt, VectorIndexH:$idx,
8369 GPR64sp:$Rn, GPR64pi:$Xm)>;
8370}
8371let mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
8372multiclass SIMDStSingleS<bit R, bits<3> opcode, bits<2> size,string asm,
8373 RegisterOperand listtype, RegisterOperand GPR64pi> {
8374 def i32 : SIMDLdStSingleS<0, R, opcode, size, asm,
8375 (outs), (ins listtype:$Vt, VectorIndexS:$idx,
8376 GPR64sp:$Rn), []>;
8377
8378 def i32_POST : SIMDLdStSingleSPost<0, R, opcode, size, asm,
8379 (outs GPR64sp:$wback),
8380 (ins listtype:$Vt, VectorIndexS:$idx,
8381 GPR64sp:$Rn, GPR64pi:$Xm)>;
8382}
8383let mayLoad = 0, mayStore = 1, hasSideEffects = 0 in
8384multiclass SIMDStSingleD<bit R, bits<3> opcode, bits<2> size, string asm,
8385 RegisterOperand listtype, RegisterOperand GPR64pi> {
8386 def i64 : SIMDLdStSingleD<0, R, opcode, size, asm,
8387 (outs), (ins listtype:$Vt, VectorIndexD:$idx,
8388 GPR64sp:$Rn), []>;
8389
8390 def i64_POST : SIMDLdStSingleDPost<0, R, opcode, size, asm,
8391 (outs GPR64sp:$wback),
8392 (ins listtype:$Vt, VectorIndexD:$idx,
8393 GPR64sp:$Rn, GPR64pi:$Xm)>;
8394}
8395
8396multiclass SIMDLdStSingleAliases<string asm, string layout, string Type,
8397 string Count, int Offset, Operand idxtype> {
8398 // E.g. "ld1 { v0.8b }[0], [x1], #1"
8399 // "ld1\t$Vt, [$Rn], #1"
8400 // may get mapped to
8401 // (LD1Rv8b_POST VecListOne8b:$Vt, GPR64sp:$Rn, XZR)
8402 def : InstAlias<asm # "\t$Vt$idx, [$Rn], #" # Offset,
8403 (!cast<Instruction>(NAME # Type # "_POST")
8404 GPR64sp:$Rn,
8405 !cast<RegisterOperand>("VecList" # Count # layout):$Vt,
8406 idxtype:$idx, XZR), 1>;
8407
8408 // E.g. "ld1.8b { v0 }[0], [x1], #1"
8409 // "ld1.8b\t$Vt, [$Rn], #1"
8410 // may get mapped to
8411 // (LD1Rv8b_POST VecListOne64:$Vt, GPR64sp:$Rn, XZR)
8412 def : InstAlias<asm # "." # layout # "\t$Vt$idx, [$Rn], #" # Offset,
8413 (!cast<Instruction>(NAME # Type # "_POST")
8414 GPR64sp:$Rn,
8415 !cast<RegisterOperand>("VecList" # Count # "128"):$Vt,
8416 idxtype:$idx, XZR), 0>;
8417
8418 // E.g. "ld1.8b { v0 }[0], [x1]"
8419 // "ld1.8b\t$Vt, [$Rn]"
8420 // may get mapped to
8421 // (LD1Rv8b VecListOne64:$Vt, GPR64sp:$Rn)
8422 def : InstAlias<asm # "." # layout # "\t$Vt$idx, [$Rn]",
8423 (!cast<Instruction>(NAME # Type)
8424 !cast<RegisterOperand>("VecList" # Count # "128"):$Vt,
8425 idxtype:$idx, GPR64sp:$Rn), 0>;
8426
8427 // E.g. "ld1.8b { v0 }[0], [x1], x2"
8428 // "ld1.8b\t$Vt, [$Rn], $Xm"
8429 // may get mapped to
8430 // (LD1Rv8b_POST VecListOne64:$Vt, GPR64sp:$Rn, GPR64pi1:$Xm)
8431 def : InstAlias<asm # "." # layout # "\t$Vt$idx, [$Rn], $Xm",
8432 (!cast<Instruction>(NAME # Type # "_POST")
8433 GPR64sp:$Rn,
8434 !cast<RegisterOperand>("VecList" # Count # "128"):$Vt,
8435 idxtype:$idx,
8436 !cast<RegisterOperand>("GPR64pi" # Offset):$Xm), 0>;
8437}
8438
8439multiclass SIMDLdSt1SingleAliases<string asm> {
8440 defm : SIMDLdStSingleAliases<asm, "b", "i8", "One", 1, VectorIndexB>;
8441 defm : SIMDLdStSingleAliases<asm, "h", "i16", "One", 2, VectorIndexH>;
8442 defm : SIMDLdStSingleAliases<asm, "s", "i32", "One", 4, VectorIndexS>;
8443 defm : SIMDLdStSingleAliases<asm, "d", "i64", "One", 8, VectorIndexD>;
8444}
8445
8446multiclass SIMDLdSt2SingleAliases<string asm> {
8447 defm : SIMDLdStSingleAliases<asm, "b", "i8", "Two", 2, VectorIndexB>;
8448 defm : SIMDLdStSingleAliases<asm, "h", "i16", "Two", 4, VectorIndexH>;
8449 defm : SIMDLdStSingleAliases<asm, "s", "i32", "Two", 8, VectorIndexS>;
8450 defm : SIMDLdStSingleAliases<asm, "d", "i64", "Two", 16, VectorIndexD>;
8451}
8452
8453multiclass SIMDLdSt3SingleAliases<string asm> {
8454 defm : SIMDLdStSingleAliases<asm, "b", "i8", "Three", 3, VectorIndexB>;
8455 defm : SIMDLdStSingleAliases<asm, "h", "i16", "Three", 6, VectorIndexH>;
8456 defm : SIMDLdStSingleAliases<asm, "s", "i32", "Three", 12, VectorIndexS>;
8457 defm : SIMDLdStSingleAliases<asm, "d", "i64", "Three", 24, VectorIndexD>;
8458}
8459
8460multiclass SIMDLdSt4SingleAliases<string asm> {
8461 defm : SIMDLdStSingleAliases<asm, "b", "i8", "Four", 4, VectorIndexB>;
8462 defm : SIMDLdStSingleAliases<asm, "h", "i16", "Four", 8, VectorIndexH>;
8463 defm : SIMDLdStSingleAliases<asm, "s", "i32", "Four", 16, VectorIndexS>;
8464 defm : SIMDLdStSingleAliases<asm, "d", "i64", "Four", 32, VectorIndexD>;
8465}
8466} // end of 'let Predicates = [HasNEON]'
8467
8468//----------------------------------------------------------------------------
8469// Crypto extensions
8470//----------------------------------------------------------------------------
8471
8472let Predicates = [HasCrypto] in {
8473let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
8474class AESBase<bits<4> opc, string asm, dag outs, dag ins, string cstr,
8475 list<dag> pat>
8476 : I<outs, ins, asm, "{\t$Rd.16b, $Rn.16b|.16b\t$Rd, $Rn}", cstr, pat>,
8477 Sched<[WriteV]>{
8478 bits<5> Rd;
8479 bits<5> Rn;
8480 let Inst{31-16} = 0b0100111000101000;
8481 let Inst{15-12} = opc;
8482 let Inst{11-10} = 0b10;
8483 let Inst{9-5} = Rn;
8484 let Inst{4-0} = Rd;
8485}
8486
8487class AESInst<bits<4> opc, string asm, Intrinsic OpNode>
8488 : AESBase<opc, asm, (outs V128:$Rd), (ins V128:$Rn), "",
8489 [(set (v16i8 V128:$Rd), (OpNode (v16i8 V128:$Rn)))]>;
8490
8491class AESTiedInst<bits<4> opc, string asm, Intrinsic OpNode>
8492 : AESBase<opc, asm, (outs V128:$dst), (ins V128:$Rd, V128:$Rn),
8493 "$Rd = $dst",
8494 [(set (v16i8 V128:$dst),
8495 (OpNode (v16i8 V128:$Rd), (v16i8 V128:$Rn)))]>;
8496
8497let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
8498class SHA3OpTiedInst<bits<3> opc, string asm, string dst_lhs_kind,
8499 dag oops, dag iops, list<dag> pat>
8500 : I<oops, iops, asm,
8501 "{\t$Rd" # dst_lhs_kind # ", $Rn" # dst_lhs_kind # ", $Rm.4s" #
8502 "|.4s\t$Rd, $Rn, $Rm}", "$Rd = $dst", pat>,
8503 Sched<[WriteV]>{
8504 bits<5> Rd;
8505 bits<5> Rn;
8506 bits<5> Rm;
8507 let Inst{31-21} = 0b01011110000;
8508 let Inst{20-16} = Rm;
8509 let Inst{15} = 0;
8510 let Inst{14-12} = opc;
8511 let Inst{11-10} = 0b00;
8512 let Inst{9-5} = Rn;
8513 let Inst{4-0} = Rd;
8514}
8515
8516class SHATiedInstQSV<bits<3> opc, string asm, Intrinsic OpNode>
8517 : SHA3OpTiedInst<opc, asm, "", (outs FPR128:$dst),
8518 (ins FPR128:$Rd, FPR32:$Rn, V128:$Rm),
8519 [(set (v4i32 FPR128:$dst),
8520 (OpNode (v4i32 FPR128:$Rd), (i32 FPR32:$Rn),
8521 (v4i32 V128:$Rm)))]>;
8522
8523class SHATiedInstVVV<bits<3> opc, string asm, Intrinsic OpNode>
8524 : SHA3OpTiedInst<opc, asm, ".4s", (outs V128:$dst),
8525 (ins V128:$Rd, V128:$Rn, V128:$Rm),
8526 [(set (v4i32 V128:$dst),
8527 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn),
8528 (v4i32 V128:$Rm)))]>;
8529
8530class SHATiedInstQQV<bits<3> opc, string asm, Intrinsic OpNode>
8531 : SHA3OpTiedInst<opc, asm, "", (outs FPR128:$dst),
8532 (ins FPR128:$Rd, FPR128:$Rn, V128:$Rm),
8533 [(set (v4i32 FPR128:$dst),
8534 (OpNode (v4i32 FPR128:$Rd), (v4i32 FPR128:$Rn),
8535 (v4i32 V128:$Rm)))]>;
8536
8537let mayLoad = 0, mayStore = 0, hasSideEffects = 0 in
8538class SHA2OpInst<bits<4> opc, string asm, string kind,
8539 string cstr, dag oops, dag iops,
8540 list<dag> pat>
8541 : I<oops, iops, asm, "{\t$Rd" # kind # ", $Rn" # kind #
8542 "|" # kind # "\t$Rd, $Rn}", cstr, pat>,
8543 Sched<[WriteV]>{
8544 bits<5> Rd;
8545 bits<5> Rn;
8546 let Inst{31-16} = 0b0101111000101000;
8547 let Inst{15-12} = opc;
8548 let Inst{11-10} = 0b10;
8549 let Inst{9-5} = Rn;
8550 let Inst{4-0} = Rd;
8551}
8552
8553class SHATiedInstVV<bits<4> opc, string asm, Intrinsic OpNode>
8554 : SHA2OpInst<opc, asm, ".4s", "$Rd = $dst", (outs V128:$dst),
8555 (ins V128:$Rd, V128:$Rn),
8556 [(set (v4i32 V128:$dst),
8557 (OpNode (v4i32 V128:$Rd), (v4i32 V128:$Rn)))]>;
8558
8559class SHAInstSS<bits<4> opc, string asm, Intrinsic OpNode>
8560 : SHA2OpInst<opc, asm, "", "", (outs FPR32:$Rd), (ins FPR32:$Rn),
8561 [(set (i32 FPR32:$Rd), (OpNode (i32 FPR32:$Rn)))]>;
8562} // end of 'let Predicates = [HasCrypto]'
8563
8564// Allow the size specifier tokens to be upper case, not just lower.
8565def : TokenAlias<".8B", ".8b">;
8566def : TokenAlias<".4H", ".4h">;
8567def : TokenAlias<".2S", ".2s">;
8568def : TokenAlias<".1D", ".1d">;
8569def : TokenAlias<".16B", ".16b">;
8570def : TokenAlias<".8H", ".8h">;
8571def : TokenAlias<".4S", ".4s">;
8572def : TokenAlias<".2D", ".2d">;
8573def : TokenAlias<".1Q", ".1q">;
8574def : TokenAlias<".B", ".b">;
8575def : TokenAlias<".H", ".h">;
8576def : TokenAlias<".S", ".s">;
8577def : TokenAlias<".D", ".d">;
8578def : TokenAlias<".Q", ".q">;