blob: 04a13e204ac20e8b1f0a0a108192f4ab2d05a742 [file] [log] [blame]
Hal Finkel27774d92014-03-13 07:58:58 +00001//===- PPCInstrVSX.td - The PowerPC VSX Extension --*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file describes the VSX extension to the PowerPC instruction set.
11//
12//===----------------------------------------------------------------------===//
13
Bill Schmidtfe723b92015-04-27 19:57:34 +000014// *********************************** NOTE ***********************************
15// ** For POWER8 Little Endian, the VSX swap optimization relies on knowing **
16// ** which VMX and VSX instructions are lane-sensitive and which are not. **
17// ** A lane-sensitive instruction relies, implicitly or explicitly, on **
18// ** whether lanes are numbered from left to right. An instruction like **
19// ** VADDFP is not lane-sensitive, because each lane of the result vector **
20// ** relies only on the corresponding lane of the source vectors. However, **
21// ** an instruction like VMULESB is lane-sensitive, because "even" and **
22// ** "odd" lanes are different for big-endian and little-endian numbering. **
23// ** **
24// ** When adding new VMX and VSX instructions, please consider whether they **
25// ** are lane-sensitive. If so, they must be added to a switch statement **
26// ** in PPCVSXSwapRemoval::gatherVectorInstructions(). **
27// ****************************************************************************
28
Hal Finkel27774d92014-03-13 07:58:58 +000029def PPCRegVSRCAsmOperand : AsmOperandClass {
30 let Name = "RegVSRC"; let PredicateMethod = "isVSRegNumber";
31}
32def vsrc : RegisterOperand<VSRC> {
33 let ParserMatchClass = PPCRegVSRCAsmOperand;
34}
35
Hal Finkel19be5062014-03-29 05:29:01 +000036def PPCRegVSFRCAsmOperand : AsmOperandClass {
37 let Name = "RegVSFRC"; let PredicateMethod = "isVSRegNumber";
38}
39def vsfrc : RegisterOperand<VSFRC> {
40 let ParserMatchClass = PPCRegVSFRCAsmOperand;
41}
42
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +000043def PPCRegVSSRCAsmOperand : AsmOperandClass {
44 let Name = "RegVSSRC"; let PredicateMethod = "isVSRegNumber";
45}
46def vssrc : RegisterOperand<VSSRC> {
47 let ParserMatchClass = PPCRegVSSRCAsmOperand;
48}
49
Zaara Syedafcd96972017-09-21 16:12:33 +000050def PPCRegSPILLTOVSRRCAsmOperand : AsmOperandClass {
51 let Name = "RegSPILLTOVSRRC"; let PredicateMethod = "isVSRegNumber";
52}
53
54def spilltovsrrc : RegisterOperand<SPILLTOVSRRC> {
55 let ParserMatchClass = PPCRegSPILLTOVSRRCAsmOperand;
56}
Bill Schmidtfae5d712014-12-09 16:35:51 +000057// Little-endian-specific nodes.
58def SDT_PPClxvd2x : SDTypeProfile<1, 1, [
59 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
60]>;
61def SDT_PPCstxvd2x : SDTypeProfile<0, 2, [
62 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
63]>;
64def SDT_PPCxxswapd : SDTypeProfile<1, 1, [
65 SDTCisSameAs<0, 1>
66]>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000067def SDTVecConv : SDTypeProfile<1, 2, [
68 SDTCisVec<0>, SDTCisVec<1>, SDTCisPtrTy<2>
69]>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000070
71def PPClxvd2x : SDNode<"PPCISD::LXVD2X", SDT_PPClxvd2x,
Sean Fertile3c8c3852017-01-26 18:59:15 +000072 [SDNPHasChain, SDNPMayLoad, SDNPMemOperand]>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000073def PPCstxvd2x : SDNode<"PPCISD::STXVD2X", SDT_PPCstxvd2x,
74 [SDNPHasChain, SDNPMayStore]>;
75def PPCxxswapd : SDNode<"PPCISD::XXSWAPD", SDT_PPCxxswapd, [SDNPHasChain]>;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +000076def PPCmfvsr : SDNode<"PPCISD::MFVSR", SDTUnaryOp, []>;
77def PPCmtvsra : SDNode<"PPCISD::MTVSRA", SDTUnaryOp, []>;
78def PPCmtvsrz : SDNode<"PPCISD::MTVSRZ", SDTUnaryOp, []>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000079def PPCsvec2fp : SDNode<"PPCISD::SINT_VEC_TO_FP", SDTVecConv, []>;
80def PPCuvec2fp: SDNode<"PPCISD::UINT_VEC_TO_FP", SDTVecConv, []>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +000081def PPCswapNoChain : SDNode<"PPCISD::SWAP_NO_CHAIN", SDT_PPCxxswapd>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000082
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000083multiclass XX3Form_Rcr<bits<6> opcode, bits<7> xo, string asmbase,
84 string asmstr, InstrItinClass itin, Intrinsic Int,
85 ValueType OutTy, ValueType InTy> {
Hal Finkel27774d92014-03-13 07:58:58 +000086 let BaseName = asmbase in {
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000087 def NAME : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000088 !strconcat(asmbase, !strconcat(" ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000089 [(set OutTy:$XT, (Int InTy:$XA, InTy:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +000090 let Defs = [CR6] in
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000091 def o : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000092 !strconcat(asmbase, !strconcat(". ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000093 [(set InTy:$XT,
94 (InTy (PPCvcmp_o InTy:$XA, InTy:$XB, xo)))]>,
95 isDOT;
Hal Finkel27774d92014-03-13 07:58:58 +000096 }
97}
98
Nemanja Ivanovic11049f82016-10-04 06:59:23 +000099// Instruction form with a single input register for instructions such as
100// XXPERMDI. The reason for defining this is that specifying multiple chained
101// operands (such as loads) to an instruction will perform both chained
102// operations rather than coalescing them into a single register - even though
103// the source memory location is the same. This simply forces the instruction
104// to use the same register for both inputs.
105// For example, an output DAG such as this:
106// (XXPERMDI (LXSIBZX xoaddr:$src), (LXSIBZX xoaddr:$src ), 0))
107// would result in two load instructions emitted and used as separate inputs
108// to the XXPERMDI instruction.
109class XX3Form_2s<bits<6> opcode, bits<5> xo, dag OOL, dag IOL, string asmstr,
110 InstrItinClass itin, list<dag> pattern>
111 : XX3Form_2<opcode, xo, OOL, IOL, asmstr, itin, pattern> {
112 let XB = XA;
113}
114
Eric Christopher1b8e7632014-05-22 01:07:24 +0000115def HasVSX : Predicate<"PPCSubTarget->hasVSX()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000116def IsLittleEndian : Predicate<"PPCSubTarget->isLittleEndian()">;
117def IsBigEndian : Predicate<"!PPCSubTarget->isLittleEndian()">;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000118def HasOnlySwappingMemOps : Predicate<"!PPCSubTarget->hasP9Vector()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000119
Hal Finkel27774d92014-03-13 07:58:58 +0000120let Predicates = [HasVSX] in {
121let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000122let UseVSXReg = 1 in {
Craig Topperc50d64b2014-11-26 00:46:26 +0000123let hasSideEffects = 0 in { // VSX instructions don't have side effects.
Hal Finkel27774d92014-03-13 07:58:58 +0000124let Uses = [RM] in {
125
126 // Load indexed instructions
Sean Fertile3c8c3852017-01-26 18:59:15 +0000127 let mayLoad = 1, mayStore = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000128 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000129 def LXSDX : XX1Form_memOp<31, 588,
Hal Finkel19be5062014-03-29 05:29:01 +0000130 (outs vsfrc:$XT), (ins memrr:$src),
Hal Finkel27774d92014-03-13 07:58:58 +0000131 "lxsdx $XT, $src", IIC_LdStLFD,
132 [(set f64:$XT, (load xoaddr:$src))]>;
133
Tony Jiang438bf4a2017-11-20 14:38:30 +0000134 // Pseudo instruction XFLOADf64 will be expanded to LXSDX or LFDX later
135 let isPseudo = 1, CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000136 def XFLOADf64 : PseudoXFormMemOp<(outs vsfrc:$XT), (ins memrr:$src),
Tony Jiang438bf4a2017-11-20 14:38:30 +0000137 "#XFLOADf64",
138 [(set f64:$XT, (load xoaddr:$src))]>;
139
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000140 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000141 def LXVD2X : XX1Form_memOp<31, 844,
Hal Finkel27774d92014-03-13 07:58:58 +0000142 (outs vsrc:$XT), (ins memrr:$src),
143 "lxvd2x $XT, $src", IIC_LdStLFD,
Bill Schmidt72954782014-11-12 04:19:40 +0000144 [(set v2f64:$XT, (int_ppc_vsx_lxvd2x xoaddr:$src))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000145
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000146 def LXVDSX : XX1Form_memOp<31, 332,
Hal Finkel27774d92014-03-13 07:58:58 +0000147 (outs vsrc:$XT), (ins memrr:$src),
148 "lxvdsx $XT, $src", IIC_LdStLFD, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000149
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000150 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000151 def LXVW4X : XX1Form_memOp<31, 780,
Hal Finkel27774d92014-03-13 07:58:58 +0000152 (outs vsrc:$XT), (ins memrr:$src),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000153 "lxvw4x $XT, $src", IIC_LdStLFD,
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +0000154 []>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000155 } // mayLoad
Hal Finkel27774d92014-03-13 07:58:58 +0000156
157 // Store indexed instructions
Sean Fertile3c8c3852017-01-26 18:59:15 +0000158 let mayStore = 1, mayLoad = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000159 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000160 def STXSDX : XX1Form_memOp<31, 716,
Hal Finkel19be5062014-03-29 05:29:01 +0000161 (outs), (ins vsfrc:$XT, memrr:$dst),
Hal Finkel27774d92014-03-13 07:58:58 +0000162 "stxsdx $XT, $dst", IIC_LdStSTFD,
163 [(store f64:$XT, xoaddr:$dst)]>;
164
Tony Jiang438bf4a2017-11-20 14:38:30 +0000165 // Pseudo instruction XFSTOREf64 will be expanded to STXSDX or STFDX later
166 let isPseudo = 1, CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000167 def XFSTOREf64 : PseudoXFormMemOp<(outs), (ins vsfrc:$XT, memrr:$dst),
Tony Jiang438bf4a2017-11-20 14:38:30 +0000168 "#XFSTOREf64",
169 [(store f64:$XT, xoaddr:$dst)]>;
170
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000171 let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000172 // The behaviour of this instruction is endianness-specific so we provide no
173 // pattern to match it without considering endianness.
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000174 def STXVD2X : XX1Form_memOp<31, 972,
Hal Finkel27774d92014-03-13 07:58:58 +0000175 (outs), (ins vsrc:$XT, memrr:$dst),
176 "stxvd2x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000177 []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000178
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000179 def STXVW4X : XX1Form_memOp<31, 908,
Hal Finkel27774d92014-03-13 07:58:58 +0000180 (outs), (ins vsrc:$XT, memrr:$dst),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000181 "stxvw4x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +0000182 []>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000183 }
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000184 } // mayStore
Hal Finkel27774d92014-03-13 07:58:58 +0000185
186 // Add/Mul Instructions
187 let isCommutable = 1 in {
188 def XSADDDP : XX3Form<60, 32,
Hal Finkel19be5062014-03-29 05:29:01 +0000189 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000190 "xsadddp $XT, $XA, $XB", IIC_VecFP,
191 [(set f64:$XT, (fadd f64:$XA, f64:$XB))]>;
192 def XSMULDP : XX3Form<60, 48,
Hal Finkel19be5062014-03-29 05:29:01 +0000193 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000194 "xsmuldp $XT, $XA, $XB", IIC_VecFP,
195 [(set f64:$XT, (fmul f64:$XA, f64:$XB))]>;
196
197 def XVADDDP : XX3Form<60, 96,
198 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
199 "xvadddp $XT, $XA, $XB", IIC_VecFP,
200 [(set v2f64:$XT, (fadd v2f64:$XA, v2f64:$XB))]>;
201
202 def XVADDSP : XX3Form<60, 64,
203 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
204 "xvaddsp $XT, $XA, $XB", IIC_VecFP,
205 [(set v4f32:$XT, (fadd v4f32:$XA, v4f32:$XB))]>;
206
207 def XVMULDP : XX3Form<60, 112,
208 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
209 "xvmuldp $XT, $XA, $XB", IIC_VecFP,
210 [(set v2f64:$XT, (fmul v2f64:$XA, v2f64:$XB))]>;
211
212 def XVMULSP : XX3Form<60, 80,
213 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
214 "xvmulsp $XT, $XA, $XB", IIC_VecFP,
215 [(set v4f32:$XT, (fmul v4f32:$XA, v4f32:$XB))]>;
216 }
217
218 // Subtract Instructions
219 def XSSUBDP : XX3Form<60, 40,
Hal Finkel19be5062014-03-29 05:29:01 +0000220 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000221 "xssubdp $XT, $XA, $XB", IIC_VecFP,
222 [(set f64:$XT, (fsub f64:$XA, f64:$XB))]>;
223
224 def XVSUBDP : XX3Form<60, 104,
225 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
226 "xvsubdp $XT, $XA, $XB", IIC_VecFP,
227 [(set v2f64:$XT, (fsub v2f64:$XA, v2f64:$XB))]>;
228 def XVSUBSP : XX3Form<60, 72,
229 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
230 "xvsubsp $XT, $XA, $XB", IIC_VecFP,
231 [(set v4f32:$XT, (fsub v4f32:$XA, v4f32:$XB))]>;
232
233 // FMA Instructions
Hal Finkel25e04542014-03-25 18:55:11 +0000234 let BaseName = "XSMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000235 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000236 def XSMADDADP : XX3Form<60, 33,
Hal Finkel19be5062014-03-29 05:29:01 +0000237 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000238 "xsmaddadp $XT, $XA, $XB", IIC_VecFP,
239 [(set f64:$XT, (fma f64:$XA, f64:$XB, f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000240 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
241 AltVSXFMARel;
242 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000243 def XSMADDMDP : XX3Form<60, 41,
Hal Finkel19be5062014-03-29 05:29:01 +0000244 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000245 "xsmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000246 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
247 AltVSXFMARel;
248 }
Hal Finkel27774d92014-03-13 07:58:58 +0000249
Hal Finkel25e04542014-03-25 18:55:11 +0000250 let BaseName = "XSMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000251 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000252 def XSMSUBADP : XX3Form<60, 49,
Hal Finkel19be5062014-03-29 05:29:01 +0000253 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000254 "xsmsubadp $XT, $XA, $XB", IIC_VecFP,
255 [(set f64:$XT, (fma f64:$XA, f64:$XB, (fneg f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000256 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
257 AltVSXFMARel;
258 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000259 def XSMSUBMDP : XX3Form<60, 57,
Hal Finkel19be5062014-03-29 05:29:01 +0000260 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000261 "xsmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000262 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
263 AltVSXFMARel;
264 }
Hal Finkel27774d92014-03-13 07:58:58 +0000265
Hal Finkel25e04542014-03-25 18:55:11 +0000266 let BaseName = "XSNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000267 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000268 def XSNMADDADP : XX3Form<60, 161,
Hal Finkel19be5062014-03-29 05:29:01 +0000269 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000270 "xsnmaddadp $XT, $XA, $XB", IIC_VecFP,
271 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000272 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
273 AltVSXFMARel;
274 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000275 def XSNMADDMDP : XX3Form<60, 169,
Hal Finkel19be5062014-03-29 05:29:01 +0000276 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000277 "xsnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000278 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
279 AltVSXFMARel;
280 }
Hal Finkel27774d92014-03-13 07:58:58 +0000281
Hal Finkel25e04542014-03-25 18:55:11 +0000282 let BaseName = "XSNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000283 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000284 def XSNMSUBADP : XX3Form<60, 177,
Hal Finkel19be5062014-03-29 05:29:01 +0000285 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000286 "xsnmsubadp $XT, $XA, $XB", IIC_VecFP,
287 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, (fneg f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000288 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
289 AltVSXFMARel;
290 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000291 def XSNMSUBMDP : XX3Form<60, 185,
Hal Finkel19be5062014-03-29 05:29:01 +0000292 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000293 "xsnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000294 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
295 AltVSXFMARel;
296 }
Hal Finkel27774d92014-03-13 07:58:58 +0000297
Hal Finkel25e04542014-03-25 18:55:11 +0000298 let BaseName = "XVMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000299 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000300 def XVMADDADP : XX3Form<60, 97,
301 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
302 "xvmaddadp $XT, $XA, $XB", IIC_VecFP,
303 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000304 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
305 AltVSXFMARel;
306 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000307 def XVMADDMDP : XX3Form<60, 105,
308 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
309 "xvmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000310 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
311 AltVSXFMARel;
312 }
Hal Finkel27774d92014-03-13 07:58:58 +0000313
Hal Finkel25e04542014-03-25 18:55:11 +0000314 let BaseName = "XVMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000315 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000316 def XVMADDASP : XX3Form<60, 65,
317 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
318 "xvmaddasp $XT, $XA, $XB", IIC_VecFP,
319 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000320 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
321 AltVSXFMARel;
322 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000323 def XVMADDMSP : XX3Form<60, 73,
324 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
325 "xvmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000326 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
327 AltVSXFMARel;
328 }
Hal Finkel27774d92014-03-13 07:58:58 +0000329
Hal Finkel25e04542014-03-25 18:55:11 +0000330 let BaseName = "XVMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000331 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000332 def XVMSUBADP : XX3Form<60, 113,
333 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
334 "xvmsubadp $XT, $XA, $XB", IIC_VecFP,
335 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000336 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
337 AltVSXFMARel;
338 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000339 def XVMSUBMDP : XX3Form<60, 121,
340 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
341 "xvmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000342 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
343 AltVSXFMARel;
344 }
Hal Finkel27774d92014-03-13 07:58:58 +0000345
Hal Finkel25e04542014-03-25 18:55:11 +0000346 let BaseName = "XVMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000347 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000348 def XVMSUBASP : XX3Form<60, 81,
349 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
350 "xvmsubasp $XT, $XA, $XB", IIC_VecFP,
351 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000352 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
353 AltVSXFMARel;
354 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000355 def XVMSUBMSP : XX3Form<60, 89,
356 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
357 "xvmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000358 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
359 AltVSXFMARel;
360 }
Hal Finkel27774d92014-03-13 07:58:58 +0000361
Hal Finkel25e04542014-03-25 18:55:11 +0000362 let BaseName = "XVNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000363 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000364 def XVNMADDADP : XX3Form<60, 225,
365 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
366 "xvnmaddadp $XT, $XA, $XB", IIC_VecFP,
367 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000368 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
369 AltVSXFMARel;
370 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000371 def XVNMADDMDP : XX3Form<60, 233,
372 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
373 "xvnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000374 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
375 AltVSXFMARel;
376 }
Hal Finkel27774d92014-03-13 07:58:58 +0000377
Hal Finkel25e04542014-03-25 18:55:11 +0000378 let BaseName = "XVNMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000379 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000380 def XVNMADDASP : XX3Form<60, 193,
381 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
382 "xvnmaddasp $XT, $XA, $XB", IIC_VecFP,
383 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000384 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
385 AltVSXFMARel;
386 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000387 def XVNMADDMSP : XX3Form<60, 201,
388 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
389 "xvnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000390 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
391 AltVSXFMARel;
392 }
Hal Finkel27774d92014-03-13 07:58:58 +0000393
Hal Finkel25e04542014-03-25 18:55:11 +0000394 let BaseName = "XVNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000395 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000396 def XVNMSUBADP : XX3Form<60, 241,
397 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
398 "xvnmsubadp $XT, $XA, $XB", IIC_VecFP,
399 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000400 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
401 AltVSXFMARel;
402 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000403 def XVNMSUBMDP : XX3Form<60, 249,
404 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
405 "xvnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000406 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
407 AltVSXFMARel;
408 }
Hal Finkel27774d92014-03-13 07:58:58 +0000409
Hal Finkel25e04542014-03-25 18:55:11 +0000410 let BaseName = "XVNMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000411 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000412 def XVNMSUBASP : XX3Form<60, 209,
413 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
414 "xvnmsubasp $XT, $XA, $XB", IIC_VecFP,
415 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000416 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
417 AltVSXFMARel;
418 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000419 def XVNMSUBMSP : XX3Form<60, 217,
420 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
421 "xvnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000422 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
423 AltVSXFMARel;
424 }
Hal Finkel27774d92014-03-13 07:58:58 +0000425
426 // Division Instructions
427 def XSDIVDP : XX3Form<60, 56,
Hal Finkel19be5062014-03-29 05:29:01 +0000428 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000429 "xsdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000430 [(set f64:$XT, (fdiv f64:$XA, f64:$XB))]>;
431 def XSSQRTDP : XX2Form<60, 75,
Hal Finkel19be5062014-03-29 05:29:01 +0000432 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000433 "xssqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000434 [(set f64:$XT, (fsqrt f64:$XB))]>;
435
436 def XSREDP : XX2Form<60, 90,
Hal Finkel19be5062014-03-29 05:29:01 +0000437 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000438 "xsredp $XT, $XB", IIC_VecFP,
439 [(set f64:$XT, (PPCfre f64:$XB))]>;
440 def XSRSQRTEDP : XX2Form<60, 74,
Hal Finkel19be5062014-03-29 05:29:01 +0000441 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000442 "xsrsqrtedp $XT, $XB", IIC_VecFP,
443 [(set f64:$XT, (PPCfrsqrte f64:$XB))]>;
444
445 def XSTDIVDP : XX3Form_1<60, 61,
Hal Finkel19be5062014-03-29 05:29:01 +0000446 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000447 "xstdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000448 def XSTSQRTDP : XX2Form_1<60, 106,
Hal Finkel19be5062014-03-29 05:29:01 +0000449 (outs crrc:$crD), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000450 "xstsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000451
452 def XVDIVDP : XX3Form<60, 120,
453 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000454 "xvdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000455 [(set v2f64:$XT, (fdiv v2f64:$XA, v2f64:$XB))]>;
456 def XVDIVSP : XX3Form<60, 88,
457 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000458 "xvdivsp $XT, $XA, $XB", IIC_FPDivS,
Hal Finkel27774d92014-03-13 07:58:58 +0000459 [(set v4f32:$XT, (fdiv v4f32:$XA, v4f32:$XB))]>;
460
461 def XVSQRTDP : XX2Form<60, 203,
462 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000463 "xvsqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000464 [(set v2f64:$XT, (fsqrt v2f64:$XB))]>;
465 def XVSQRTSP : XX2Form<60, 139,
466 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000467 "xvsqrtsp $XT, $XB", IIC_FPSqrtS,
Hal Finkel27774d92014-03-13 07:58:58 +0000468 [(set v4f32:$XT, (fsqrt v4f32:$XB))]>;
469
470 def XVTDIVDP : XX3Form_1<60, 125,
471 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000472 "xvtdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000473 def XVTDIVSP : XX3Form_1<60, 93,
474 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000475 "xvtdivsp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000476
477 def XVTSQRTDP : XX2Form_1<60, 234,
478 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000479 "xvtsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000480 def XVTSQRTSP : XX2Form_1<60, 170,
481 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000482 "xvtsqrtsp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000483
484 def XVREDP : XX2Form<60, 218,
485 (outs vsrc:$XT), (ins vsrc:$XB),
486 "xvredp $XT, $XB", IIC_VecFP,
487 [(set v2f64:$XT, (PPCfre v2f64:$XB))]>;
488 def XVRESP : XX2Form<60, 154,
489 (outs vsrc:$XT), (ins vsrc:$XB),
490 "xvresp $XT, $XB", IIC_VecFP,
491 [(set v4f32:$XT, (PPCfre v4f32:$XB))]>;
492
493 def XVRSQRTEDP : XX2Form<60, 202,
494 (outs vsrc:$XT), (ins vsrc:$XB),
495 "xvrsqrtedp $XT, $XB", IIC_VecFP,
496 [(set v2f64:$XT, (PPCfrsqrte v2f64:$XB))]>;
497 def XVRSQRTESP : XX2Form<60, 138,
498 (outs vsrc:$XT), (ins vsrc:$XB),
499 "xvrsqrtesp $XT, $XB", IIC_VecFP,
500 [(set v4f32:$XT, (PPCfrsqrte v4f32:$XB))]>;
501
502 // Compare Instructions
503 def XSCMPODP : XX3Form_1<60, 43,
Hal Finkel19be5062014-03-29 05:29:01 +0000504 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000505 "xscmpodp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000506 def XSCMPUDP : XX3Form_1<60, 35,
Hal Finkel19be5062014-03-29 05:29:01 +0000507 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000508 "xscmpudp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000509
510 defm XVCMPEQDP : XX3Form_Rcr<60, 99,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000511 "xvcmpeqdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000512 int_ppc_vsx_xvcmpeqdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000513 defm XVCMPEQSP : XX3Form_Rcr<60, 67,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000514 "xvcmpeqsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000515 int_ppc_vsx_xvcmpeqsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000516 defm XVCMPGEDP : XX3Form_Rcr<60, 115,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000517 "xvcmpgedp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000518 int_ppc_vsx_xvcmpgedp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000519 defm XVCMPGESP : XX3Form_Rcr<60, 83,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000520 "xvcmpgesp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000521 int_ppc_vsx_xvcmpgesp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000522 defm XVCMPGTDP : XX3Form_Rcr<60, 107,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000523 "xvcmpgtdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000524 int_ppc_vsx_xvcmpgtdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000525 defm XVCMPGTSP : XX3Form_Rcr<60, 75,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000526 "xvcmpgtsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000527 int_ppc_vsx_xvcmpgtsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000528
529 // Move Instructions
530 def XSABSDP : XX2Form<60, 345,
Hal Finkel19be5062014-03-29 05:29:01 +0000531 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000532 "xsabsdp $XT, $XB", IIC_VecFP,
533 [(set f64:$XT, (fabs f64:$XB))]>;
534 def XSNABSDP : XX2Form<60, 361,
Hal Finkel19be5062014-03-29 05:29:01 +0000535 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000536 "xsnabsdp $XT, $XB", IIC_VecFP,
537 [(set f64:$XT, (fneg (fabs f64:$XB)))]>;
538 def XSNEGDP : XX2Form<60, 377,
Hal Finkel19be5062014-03-29 05:29:01 +0000539 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000540 "xsnegdp $XT, $XB", IIC_VecFP,
541 [(set f64:$XT, (fneg f64:$XB))]>;
542 def XSCPSGNDP : XX3Form<60, 176,
Hal Finkel19be5062014-03-29 05:29:01 +0000543 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000544 "xscpsgndp $XT, $XA, $XB", IIC_VecFP,
545 [(set f64:$XT, (fcopysign f64:$XB, f64:$XA))]>;
546
547 def XVABSDP : XX2Form<60, 473,
548 (outs vsrc:$XT), (ins vsrc:$XB),
549 "xvabsdp $XT, $XB", IIC_VecFP,
550 [(set v2f64:$XT, (fabs v2f64:$XB))]>;
551
552 def XVABSSP : XX2Form<60, 409,
553 (outs vsrc:$XT), (ins vsrc:$XB),
554 "xvabssp $XT, $XB", IIC_VecFP,
555 [(set v4f32:$XT, (fabs v4f32:$XB))]>;
556
557 def XVCPSGNDP : XX3Form<60, 240,
558 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
559 "xvcpsgndp $XT, $XA, $XB", IIC_VecFP,
560 [(set v2f64:$XT, (fcopysign v2f64:$XB, v2f64:$XA))]>;
561 def XVCPSGNSP : XX3Form<60, 208,
562 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
563 "xvcpsgnsp $XT, $XA, $XB", IIC_VecFP,
564 [(set v4f32:$XT, (fcopysign v4f32:$XB, v4f32:$XA))]>;
565
566 def XVNABSDP : XX2Form<60, 489,
567 (outs vsrc:$XT), (ins vsrc:$XB),
568 "xvnabsdp $XT, $XB", IIC_VecFP,
569 [(set v2f64:$XT, (fneg (fabs v2f64:$XB)))]>;
570 def XVNABSSP : XX2Form<60, 425,
571 (outs vsrc:$XT), (ins vsrc:$XB),
572 "xvnabssp $XT, $XB", IIC_VecFP,
573 [(set v4f32:$XT, (fneg (fabs v4f32:$XB)))]>;
574
575 def XVNEGDP : XX2Form<60, 505,
576 (outs vsrc:$XT), (ins vsrc:$XB),
577 "xvnegdp $XT, $XB", IIC_VecFP,
578 [(set v2f64:$XT, (fneg v2f64:$XB))]>;
579 def XVNEGSP : XX2Form<60, 441,
580 (outs vsrc:$XT), (ins vsrc:$XB),
581 "xvnegsp $XT, $XB", IIC_VecFP,
582 [(set v4f32:$XT, (fneg v4f32:$XB))]>;
583
584 // Conversion Instructions
585 def XSCVDPSP : XX2Form<60, 265,
Hal Finkel19be5062014-03-29 05:29:01 +0000586 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000587 "xscvdpsp $XT, $XB", IIC_VecFP, []>;
588 def XSCVDPSXDS : XX2Form<60, 344,
Hal Finkel19be5062014-03-29 05:29:01 +0000589 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000590 "xscvdpsxds $XT, $XB", IIC_VecFP,
591 [(set f64:$XT, (PPCfctidz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000592 let isCodeGenOnly = 1 in
593 def XSCVDPSXDSs : XX2Form<60, 344,
594 (outs vssrc:$XT), (ins vssrc:$XB),
595 "xscvdpsxds $XT, $XB", IIC_VecFP,
596 [(set f32:$XT, (PPCfctidz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000597 def XSCVDPSXWS : XX2Form<60, 88,
Hal Finkel19be5062014-03-29 05:29:01 +0000598 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000599 "xscvdpsxws $XT, $XB", IIC_VecFP,
600 [(set f64:$XT, (PPCfctiwz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000601 let isCodeGenOnly = 1 in
602 def XSCVDPSXWSs : XX2Form<60, 88,
603 (outs vssrc:$XT), (ins vssrc:$XB),
604 "xscvdpsxws $XT, $XB", IIC_VecFP,
605 [(set f32:$XT, (PPCfctiwz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000606 def XSCVDPUXDS : XX2Form<60, 328,
Hal Finkel19be5062014-03-29 05:29:01 +0000607 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000608 "xscvdpuxds $XT, $XB", IIC_VecFP,
609 [(set f64:$XT, (PPCfctiduz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000610 let isCodeGenOnly = 1 in
611 def XSCVDPUXDSs : XX2Form<60, 328,
612 (outs vssrc:$XT), (ins vssrc:$XB),
613 "xscvdpuxds $XT, $XB", IIC_VecFP,
614 [(set f32:$XT, (PPCfctiduz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000615 def XSCVDPUXWS : XX2Form<60, 72,
Hal Finkel19be5062014-03-29 05:29:01 +0000616 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000617 "xscvdpuxws $XT, $XB", IIC_VecFP,
618 [(set f64:$XT, (PPCfctiwuz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000619 let isCodeGenOnly = 1 in
620 def XSCVDPUXWSs : XX2Form<60, 72,
621 (outs vssrc:$XT), (ins vssrc:$XB),
622 "xscvdpuxws $XT, $XB", IIC_VecFP,
623 [(set f32:$XT, (PPCfctiwuz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000624 def XSCVSPDP : XX2Form<60, 329,
Hal Finkel19be5062014-03-29 05:29:01 +0000625 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000626 "xscvspdp $XT, $XB", IIC_VecFP, []>;
627 def XSCVSXDDP : XX2Form<60, 376,
Hal Finkel19be5062014-03-29 05:29:01 +0000628 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000629 "xscvsxddp $XT, $XB", IIC_VecFP,
630 [(set f64:$XT, (PPCfcfid f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000631 def XSCVUXDDP : XX2Form<60, 360,
Hal Finkel19be5062014-03-29 05:29:01 +0000632 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000633 "xscvuxddp $XT, $XB", IIC_VecFP,
634 [(set f64:$XT, (PPCfcfidu f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000635
636 def XVCVDPSP : XX2Form<60, 393,
637 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000638 "xvcvdpsp $XT, $XB", IIC_VecFP,
639 [(set v4f32:$XT, (int_ppc_vsx_xvcvdpsp v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000640 def XVCVDPSXDS : XX2Form<60, 472,
641 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000642 "xvcvdpsxds $XT, $XB", IIC_VecFP,
643 [(set v2i64:$XT, (fp_to_sint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000644 def XVCVDPSXWS : XX2Form<60, 216,
645 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000646 "xvcvdpsxws $XT, $XB", IIC_VecFP,
647 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpsxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000648 def XVCVDPUXDS : XX2Form<60, 456,
649 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000650 "xvcvdpuxds $XT, $XB", IIC_VecFP,
651 [(set v2i64:$XT, (fp_to_uint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000652 def XVCVDPUXWS : XX2Form<60, 200,
653 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000654 "xvcvdpuxws $XT, $XB", IIC_VecFP,
655 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpuxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000656
657 def XVCVSPDP : XX2Form<60, 457,
658 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000659 "xvcvspdp $XT, $XB", IIC_VecFP,
660 [(set v2f64:$XT, (int_ppc_vsx_xvcvspdp v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000661 def XVCVSPSXDS : XX2Form<60, 408,
662 (outs vsrc:$XT), (ins vsrc:$XB),
663 "xvcvspsxds $XT, $XB", IIC_VecFP, []>;
664 def XVCVSPSXWS : XX2Form<60, 152,
665 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000666 "xvcvspsxws $XT, $XB", IIC_VecFP,
667 [(set v4i32:$XT, (fp_to_sint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000668 def XVCVSPUXDS : XX2Form<60, 392,
669 (outs vsrc:$XT), (ins vsrc:$XB),
670 "xvcvspuxds $XT, $XB", IIC_VecFP, []>;
671 def XVCVSPUXWS : XX2Form<60, 136,
672 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000673 "xvcvspuxws $XT, $XB", IIC_VecFP,
674 [(set v4i32:$XT, (fp_to_uint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000675 def XVCVSXDDP : XX2Form<60, 504,
676 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000677 "xvcvsxddp $XT, $XB", IIC_VecFP,
678 [(set v2f64:$XT, (sint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000679 def XVCVSXDSP : XX2Form<60, 440,
680 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000681 "xvcvsxdsp $XT, $XB", IIC_VecFP,
682 [(set v4f32:$XT, (int_ppc_vsx_xvcvsxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000683 def XVCVSXWDP : XX2Form<60, 248,
684 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000685 "xvcvsxwdp $XT, $XB", IIC_VecFP,
686 [(set v2f64:$XT, (int_ppc_vsx_xvcvsxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000687 def XVCVSXWSP : XX2Form<60, 184,
688 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic44513e52016-07-05 09:22:29 +0000689 "xvcvsxwsp $XT, $XB", IIC_VecFP,
690 [(set v4f32:$XT, (sint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000691 def XVCVUXDDP : XX2Form<60, 488,
692 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000693 "xvcvuxddp $XT, $XB", IIC_VecFP,
694 [(set v2f64:$XT, (uint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000695 def XVCVUXDSP : XX2Form<60, 424,
696 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000697 "xvcvuxdsp $XT, $XB", IIC_VecFP,
698 [(set v4f32:$XT, (int_ppc_vsx_xvcvuxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000699 def XVCVUXWDP : XX2Form<60, 232,
700 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000701 "xvcvuxwdp $XT, $XB", IIC_VecFP,
702 [(set v2f64:$XT, (int_ppc_vsx_xvcvuxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000703 def XVCVUXWSP : XX2Form<60, 168,
704 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000705 "xvcvuxwsp $XT, $XB", IIC_VecFP,
706 [(set v4f32:$XT, (uint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000707
708 // Rounding Instructions
709 def XSRDPI : XX2Form<60, 73,
Hal Finkel19be5062014-03-29 05:29:01 +0000710 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000711 "xsrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000712 [(set f64:$XT, (fround f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000713 def XSRDPIC : XX2Form<60, 107,
Hal Finkel19be5062014-03-29 05:29:01 +0000714 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000715 "xsrdpic $XT, $XB", IIC_VecFP,
716 [(set f64:$XT, (fnearbyint f64:$XB))]>;
717 def XSRDPIM : XX2Form<60, 121,
Hal Finkel19be5062014-03-29 05:29:01 +0000718 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000719 "xsrdpim $XT, $XB", IIC_VecFP,
720 [(set f64:$XT, (ffloor f64:$XB))]>;
721 def XSRDPIP : XX2Form<60, 105,
Hal Finkel19be5062014-03-29 05:29:01 +0000722 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000723 "xsrdpip $XT, $XB", IIC_VecFP,
724 [(set f64:$XT, (fceil f64:$XB))]>;
725 def XSRDPIZ : XX2Form<60, 89,
Hal Finkel19be5062014-03-29 05:29:01 +0000726 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000727 "xsrdpiz $XT, $XB", IIC_VecFP,
728 [(set f64:$XT, (ftrunc f64:$XB))]>;
729
730 def XVRDPI : XX2Form<60, 201,
731 (outs vsrc:$XT), (ins vsrc:$XB),
732 "xvrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000733 [(set v2f64:$XT, (fround v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000734 def XVRDPIC : XX2Form<60, 235,
735 (outs vsrc:$XT), (ins vsrc:$XB),
736 "xvrdpic $XT, $XB", IIC_VecFP,
737 [(set v2f64:$XT, (fnearbyint v2f64:$XB))]>;
738 def XVRDPIM : XX2Form<60, 249,
739 (outs vsrc:$XT), (ins vsrc:$XB),
740 "xvrdpim $XT, $XB", IIC_VecFP,
741 [(set v2f64:$XT, (ffloor v2f64:$XB))]>;
742 def XVRDPIP : XX2Form<60, 233,
743 (outs vsrc:$XT), (ins vsrc:$XB),
744 "xvrdpip $XT, $XB", IIC_VecFP,
745 [(set v2f64:$XT, (fceil v2f64:$XB))]>;
746 def XVRDPIZ : XX2Form<60, 217,
747 (outs vsrc:$XT), (ins vsrc:$XB),
748 "xvrdpiz $XT, $XB", IIC_VecFP,
749 [(set v2f64:$XT, (ftrunc v2f64:$XB))]>;
750
751 def XVRSPI : XX2Form<60, 137,
752 (outs vsrc:$XT), (ins vsrc:$XB),
753 "xvrspi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000754 [(set v4f32:$XT, (fround v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000755 def XVRSPIC : XX2Form<60, 171,
756 (outs vsrc:$XT), (ins vsrc:$XB),
757 "xvrspic $XT, $XB", IIC_VecFP,
758 [(set v4f32:$XT, (fnearbyint v4f32:$XB))]>;
759 def XVRSPIM : XX2Form<60, 185,
760 (outs vsrc:$XT), (ins vsrc:$XB),
761 "xvrspim $XT, $XB", IIC_VecFP,
762 [(set v4f32:$XT, (ffloor v4f32:$XB))]>;
763 def XVRSPIP : XX2Form<60, 169,
764 (outs vsrc:$XT), (ins vsrc:$XB),
765 "xvrspip $XT, $XB", IIC_VecFP,
766 [(set v4f32:$XT, (fceil v4f32:$XB))]>;
767 def XVRSPIZ : XX2Form<60, 153,
768 (outs vsrc:$XT), (ins vsrc:$XB),
769 "xvrspiz $XT, $XB", IIC_VecFP,
770 [(set v4f32:$XT, (ftrunc v4f32:$XB))]>;
771
772 // Max/Min Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000773 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000774 def XSMAXDP : XX3Form<60, 160,
Hal Finkel19be5062014-03-29 05:29:01 +0000775 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000776 "xsmaxdp $XT, $XA, $XB", IIC_VecFP,
777 [(set vsfrc:$XT,
778 (int_ppc_vsx_xsmaxdp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000779 def XSMINDP : XX3Form<60, 168,
Hal Finkel19be5062014-03-29 05:29:01 +0000780 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000781 "xsmindp $XT, $XA, $XB", IIC_VecFP,
782 [(set vsfrc:$XT,
783 (int_ppc_vsx_xsmindp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000784
785 def XVMAXDP : XX3Form<60, 224,
786 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000787 "xvmaxdp $XT, $XA, $XB", IIC_VecFP,
788 [(set vsrc:$XT,
789 (int_ppc_vsx_xvmaxdp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000790 def XVMINDP : XX3Form<60, 232,
791 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000792 "xvmindp $XT, $XA, $XB", IIC_VecFP,
793 [(set vsrc:$XT,
794 (int_ppc_vsx_xvmindp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000795
796 def XVMAXSP : XX3Form<60, 192,
797 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000798 "xvmaxsp $XT, $XA, $XB", IIC_VecFP,
799 [(set vsrc:$XT,
800 (int_ppc_vsx_xvmaxsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000801 def XVMINSP : XX3Form<60, 200,
802 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000803 "xvminsp $XT, $XA, $XB", IIC_VecFP,
804 [(set vsrc:$XT,
805 (int_ppc_vsx_xvminsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000806 } // isCommutable
Hal Finkel27774d92014-03-13 07:58:58 +0000807} // Uses = [RM]
808
809 // Logical Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000810 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000811 def XXLAND : XX3Form<60, 130,
812 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000813 "xxland $XT, $XA, $XB", IIC_VecGeneral,
814 [(set v4i32:$XT, (and v4i32:$XA, v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000815 def XXLANDC : XX3Form<60, 138,
816 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000817 "xxlandc $XT, $XA, $XB", IIC_VecGeneral,
818 [(set v4i32:$XT, (and v4i32:$XA,
819 (vnot_ppc v4i32:$XB)))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000820 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000821 def XXLNOR : XX3Form<60, 162,
822 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000823 "xxlnor $XT, $XA, $XB", IIC_VecGeneral,
824 [(set v4i32:$XT, (vnot_ppc (or v4i32:$XA,
825 v4i32:$XB)))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000826 def XXLOR : XX3Form<60, 146,
827 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000828 "xxlor $XT, $XA, $XB", IIC_VecGeneral,
829 [(set v4i32:$XT, (or v4i32:$XA, v4i32:$XB))]>;
Hal Finkel19be5062014-03-29 05:29:01 +0000830 let isCodeGenOnly = 1 in
831 def XXLORf: XX3Form<60, 146,
832 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
833 "xxlor $XT, $XA, $XB", IIC_VecGeneral, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000834 def XXLXOR : XX3Form<60, 154,
835 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000836 "xxlxor $XT, $XA, $XB", IIC_VecGeneral,
837 [(set v4i32:$XT, (xor v4i32:$XA, v4i32:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000838 } // isCommutable
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +0000839 let isCodeGenOnly = 1 in
840 def XXLXORz : XX3Form_Zero<60, 154, (outs vsrc:$XT), (ins),
841 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
842 [(set v4i32:$XT, (v4i32 immAllZerosV))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000843
Ehsan Amiric90b02c2016-10-24 17:31:09 +0000844 let isCodeGenOnly = 1 in {
845 def XXLXORdpz : XX3Form_SetZero<60, 154,
846 (outs vsfrc:$XT), (ins),
847 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
848 [(set f64:$XT, (fpimm0))]>;
849 def XXLXORspz : XX3Form_SetZero<60, 154,
850 (outs vssrc:$XT), (ins),
851 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
852 [(set f32:$XT, (fpimm0))]>;
853 }
854
Hal Finkel27774d92014-03-13 07:58:58 +0000855 // Permutation Instructions
856 def XXMRGHW : XX3Form<60, 18,
857 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
858 "xxmrghw $XT, $XA, $XB", IIC_VecPerm, []>;
859 def XXMRGLW : XX3Form<60, 50,
860 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
861 "xxmrglw $XT, $XA, $XB", IIC_VecPerm, []>;
862
863 def XXPERMDI : XX3Form_2<60, 10,
864 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$DM),
Tony Jiang60c247d2017-05-31 13:09:57 +0000865 "xxpermdi $XT, $XA, $XB, $DM", IIC_VecPerm,
866 [(set v2i64:$XT, (PPCxxpermdi v2i64:$XA, v2i64:$XB,
867 imm32SExt16:$DM))]>;
Nemanja Ivanovic15748f42016-12-06 11:47:14 +0000868 let isCodeGenOnly = 1 in
869 def XXPERMDIs : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vsfrc:$XA, u2imm:$DM),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000870 "xxpermdi $XT, $XA, $XA, $DM", IIC_VecPerm, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000871 def XXSEL : XX4Form<60, 3,
872 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, vsrc:$XC),
873 "xxsel $XT, $XA, $XB, $XC", IIC_VecPerm, []>;
874
875 def XXSLDWI : XX3Form_2<60, 2,
876 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$SHW),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +0000877 "xxsldwi $XT, $XA, $XB, $SHW", IIC_VecPerm,
878 [(set v4i32:$XT, (PPCvecshl v4i32:$XA, v4i32:$XB,
879 imm32SExt16:$SHW))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000880 def XXSPLTW : XX2Form_2<60, 164,
881 (outs vsrc:$XT), (ins vsrc:$XB, u2imm:$UIM),
Nemanja Ivanovic1a2b2f02016-05-04 16:04:02 +0000882 "xxspltw $XT, $XB, $UIM", IIC_VecPerm,
883 [(set v4i32:$XT,
884 (PPCxxsplt v4i32:$XB, imm32SExt16:$UIM))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000885 let isCodeGenOnly = 1 in
886 def XXSPLTWs : XX2Form_2<60, 164,
887 (outs vsrc:$XT), (ins vfrc:$XB, u2imm:$UIM),
888 "xxspltw $XT, $XB, $UIM", IIC_VecPerm, []>;
Craig Topperc50d64b2014-11-26 00:46:26 +0000889} // hasSideEffects
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000890} // UseVSXReg = 1
Hal Finkel27774d92014-03-13 07:58:58 +0000891
Bill Schmidt61e65232014-10-22 13:13:40 +0000892// SELECT_CC_* - Used to implement the SELECT_CC DAG operation. Expanded after
893// instruction selection into a branch sequence.
894let usesCustomInserter = 1, // Expanded after instruction selection.
895 PPC970_Single = 1 in {
896
897 def SELECT_CC_VSRC: Pseudo<(outs vsrc:$dst),
898 (ins crrc:$cond, vsrc:$T, vsrc:$F, i32imm:$BROPC),
899 "#SELECT_CC_VSRC",
900 []>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000901 def SELECT_VSRC: Pseudo<(outs vsrc:$dst),
902 (ins crbitrc:$cond, vsrc:$T, vsrc:$F),
903 "#SELECT_VSRC",
Bill Schmidt61e65232014-10-22 13:13:40 +0000904 [(set v2f64:$dst,
905 (select i1:$cond, v2f64:$T, v2f64:$F))]>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000906 def SELECT_CC_VSFRC: Pseudo<(outs f8rc:$dst),
907 (ins crrc:$cond, f8rc:$T, f8rc:$F,
908 i32imm:$BROPC), "#SELECT_CC_VSFRC",
909 []>;
910 def SELECT_VSFRC: Pseudo<(outs f8rc:$dst),
911 (ins crbitrc:$cond, f8rc:$T, f8rc:$F),
912 "#SELECT_VSFRC",
913 [(set f64:$dst,
914 (select i1:$cond, f64:$T, f64:$F))]>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000915 def SELECT_CC_VSSRC: Pseudo<(outs f4rc:$dst),
916 (ins crrc:$cond, f4rc:$T, f4rc:$F,
917 i32imm:$BROPC), "#SELECT_CC_VSSRC",
918 []>;
919 def SELECT_VSSRC: Pseudo<(outs f4rc:$dst),
920 (ins crbitrc:$cond, f4rc:$T, f4rc:$F),
921 "#SELECT_VSSRC",
922 [(set f32:$dst,
923 (select i1:$cond, f32:$T, f32:$F))]>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000924} // usesCustomInserter
925} // AddedComplexity
Bill Schmidt61e65232014-10-22 13:13:40 +0000926
Hal Finkel27774d92014-03-13 07:58:58 +0000927def : InstAlias<"xvmovdp $XT, $XB",
928 (XVCPSGNDP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
929def : InstAlias<"xvmovsp $XT, $XB",
930 (XVCPSGNSP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
931
932def : InstAlias<"xxspltd $XT, $XB, 0",
933 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 0)>;
934def : InstAlias<"xxspltd $XT, $XB, 1",
935 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 3)>;
936def : InstAlias<"xxmrghd $XT, $XA, $XB",
937 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 0)>;
938def : InstAlias<"xxmrgld $XT, $XA, $XB",
939 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 3)>;
940def : InstAlias<"xxswapd $XT, $XB",
941 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 2)>;
Nemanja Ivanovic15748f42016-12-06 11:47:14 +0000942def : InstAlias<"xxspltd $XT, $XB, 0",
943 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 0)>;
944def : InstAlias<"xxspltd $XT, $XB, 1",
945 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 3)>;
946def : InstAlias<"xxswapd $XT, $XB",
947 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 2)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000948
949let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000950
Nemanja Ivanovic6f22b412016-09-27 08:42:12 +0000951def : Pat<(v4i32 (vnot_ppc v4i32:$A)),
952 (v4i32 (XXLNOR $A, $A))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000953let Predicates = [IsBigEndian] in {
Hal Finkel27774d92014-03-13 07:58:58 +0000954def : Pat<(v2f64 (scalar_to_vector f64:$A)),
Hal Finkel19be5062014-03-29 05:29:01 +0000955 (v2f64 (SUBREG_TO_REG (i64 1), $A, sub_64))>;
Hal Finkel27774d92014-03-13 07:58:58 +0000956
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000957def : Pat<(f64 (extractelt v2f64:$S, 0)),
Hal Finkel19be5062014-03-29 05:29:01 +0000958 (f64 (EXTRACT_SUBREG $S, sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000959def : Pat<(f64 (extractelt v2f64:$S, 1)),
Hal Finkel19be5062014-03-29 05:29:01 +0000960 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000961}
962
963let Predicates = [IsLittleEndian] in {
964def : Pat<(v2f64 (scalar_to_vector f64:$A)),
965 (v2f64 (XXPERMDI (SUBREG_TO_REG (i64 1), $A, sub_64),
966 (SUBREG_TO_REG (i64 1), $A, sub_64), 0))>;
967
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000968def : Pat<(f64 (extractelt v2f64:$S, 0)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000969 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000970def : Pat<(f64 (extractelt v2f64:$S, 1)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000971 (f64 (EXTRACT_SUBREG $S, sub_64))>;
972}
Hal Finkel27774d92014-03-13 07:58:58 +0000973
974// Additional fnmsub patterns: -a*c + b == -(a*c - b)
975def : Pat<(fma (fneg f64:$A), f64:$C, f64:$B),
976 (XSNMSUBADP $B, $C, $A)>;
977def : Pat<(fma f64:$A, (fneg f64:$C), f64:$B),
978 (XSNMSUBADP $B, $C, $A)>;
979
980def : Pat<(fma (fneg v2f64:$A), v2f64:$C, v2f64:$B),
981 (XVNMSUBADP $B, $C, $A)>;
982def : Pat<(fma v2f64:$A, (fneg v2f64:$C), v2f64:$B),
983 (XVNMSUBADP $B, $C, $A)>;
984
985def : Pat<(fma (fneg v4f32:$A), v4f32:$C, v4f32:$B),
986 (XVNMSUBASP $B, $C, $A)>;
987def : Pat<(fma v4f32:$A, (fneg v4f32:$C), v4f32:$B),
988 (XVNMSUBASP $B, $C, $A)>;
989
Hal Finkel9e0baa62014-04-01 19:24:27 +0000990def : Pat<(v2f64 (bitconvert v4f32:$A)),
991 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000992def : Pat<(v2f64 (bitconvert v4i32:$A)),
993 (COPY_TO_REGCLASS $A, VSRC)>;
994def : Pat<(v2f64 (bitconvert v8i16:$A)),
995 (COPY_TO_REGCLASS $A, VSRC)>;
996def : Pat<(v2f64 (bitconvert v16i8:$A)),
997 (COPY_TO_REGCLASS $A, VSRC)>;
998
Hal Finkel9e0baa62014-04-01 19:24:27 +0000999def : Pat<(v4f32 (bitconvert v2f64:$A)),
1000 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +00001001def : Pat<(v4i32 (bitconvert v2f64:$A)),
1002 (COPY_TO_REGCLASS $A, VRRC)>;
1003def : Pat<(v8i16 (bitconvert v2f64:$A)),
1004 (COPY_TO_REGCLASS $A, VRRC)>;
1005def : Pat<(v16i8 (bitconvert v2f64:$A)),
1006 (COPY_TO_REGCLASS $A, VRRC)>;
1007
Hal Finkel9e0baa62014-04-01 19:24:27 +00001008def : Pat<(v2i64 (bitconvert v4f32:$A)),
1009 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +00001010def : Pat<(v2i64 (bitconvert v4i32:$A)),
1011 (COPY_TO_REGCLASS $A, VSRC)>;
1012def : Pat<(v2i64 (bitconvert v8i16:$A)),
1013 (COPY_TO_REGCLASS $A, VSRC)>;
1014def : Pat<(v2i64 (bitconvert v16i8:$A)),
1015 (COPY_TO_REGCLASS $A, VSRC)>;
1016
Hal Finkel9e0baa62014-04-01 19:24:27 +00001017def : Pat<(v4f32 (bitconvert v2i64:$A)),
1018 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +00001019def : Pat<(v4i32 (bitconvert v2i64:$A)),
1020 (COPY_TO_REGCLASS $A, VRRC)>;
1021def : Pat<(v8i16 (bitconvert v2i64:$A)),
1022 (COPY_TO_REGCLASS $A, VRRC)>;
1023def : Pat<(v16i8 (bitconvert v2i64:$A)),
1024 (COPY_TO_REGCLASS $A, VRRC)>;
1025
Hal Finkel9281c9a2014-03-26 18:26:30 +00001026def : Pat<(v2f64 (bitconvert v2i64:$A)),
1027 (COPY_TO_REGCLASS $A, VRRC)>;
1028def : Pat<(v2i64 (bitconvert v2f64:$A)),
1029 (COPY_TO_REGCLASS $A, VRRC)>;
1030
Kit Bartond4eb73c2015-05-05 16:10:44 +00001031def : Pat<(v2f64 (bitconvert v1i128:$A)),
1032 (COPY_TO_REGCLASS $A, VRRC)>;
1033def : Pat<(v1i128 (bitconvert v2f64:$A)),
1034 (COPY_TO_REGCLASS $A, VRRC)>;
1035
Hal Finkel5c0d1452014-03-30 13:22:59 +00001036// sign extension patterns
1037// To extend "in place" from v2i32 to v2i64, we have input data like:
1038// | undef | i32 | undef | i32 |
1039// but xvcvsxwdp expects the input in big-Endian format:
1040// | i32 | undef | i32 | undef |
1041// so we need to shift everything to the left by one i32 (word) before
1042// the conversion.
1043def : Pat<(sext_inreg v2i64:$C, v2i32),
1044 (XVCVDPSXDS (XVCVSXWDP (XXSLDWI $C, $C, 1)))>;
1045def : Pat<(v2f64 (sint_to_fp (sext_inreg v2i64:$C, v2i32))),
1046 (XVCVSXWDP (XXSLDWI $C, $C, 1))>;
1047
Nemanja Ivanovic44513e52016-07-05 09:22:29 +00001048def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 0)),
1049 (v2f64 (XVCVSXWDP (v2i64 (XXMRGHW $C, $C))))>;
1050def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 1)),
1051 (v2f64 (XVCVSXWDP (v2i64 (XXMRGLW $C, $C))))>;
1052
1053def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 0)),
1054 (v2f64 (XVCVUXWDP (v2i64 (XXMRGHW $C, $C))))>;
1055def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 1)),
1056 (v2f64 (XVCVUXWDP (v2i64 (XXMRGLW $C, $C))))>;
1057
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001058// Loads.
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001059let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001060 def : Pat<(v2f64 (PPClxvd2x xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001061
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001062 // Stores.
1063 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
1064 (STXVD2X $rS, xoaddr:$dst)>;
Tony Jiang5f850cd2016-11-15 14:25:56 +00001065 def : Pat<(int_ppc_vsx_stxvd2x_be v2f64:$rS, xoaddr:$dst),
1066 (STXVD2X $rS, xoaddr:$dst)>;
1067 def : Pat<(int_ppc_vsx_stxvw4x_be v4i32:$rS, xoaddr:$dst),
1068 (STXVW4X $rS, xoaddr:$dst)>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001069 def : Pat<(PPCstxvd2x v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1070}
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001071let Predicates = [IsBigEndian, HasVSX, HasOnlySwappingMemOps] in {
1072 def : Pat<(v2f64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1073 def : Pat<(v2i64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1074 def : Pat<(v4i32 (load xoaddr:$src)), (LXVW4X xoaddr:$src)>;
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +00001075 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x xoaddr:$src)), (LXVW4X xoaddr:$src)>;
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001076 def : Pat<(store v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1077 def : Pat<(store v2i64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +00001078 def : Pat<(store v4i32:$XT, xoaddr:$dst), (STXVW4X $XT, xoaddr:$dst)>;
1079 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
1080 (STXVW4X $rS, xoaddr:$dst)>;
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001081}
Bill Schmidtfae5d712014-12-09 16:35:51 +00001082
1083// Permutes.
1084def : Pat<(v2f64 (PPCxxswapd v2f64:$src)), (XXPERMDI $src, $src, 2)>;
1085def : Pat<(v2i64 (PPCxxswapd v2i64:$src)), (XXPERMDI $src, $src, 2)>;
1086def : Pat<(v4f32 (PPCxxswapd v4f32:$src)), (XXPERMDI $src, $src, 2)>;
1087def : Pat<(v4i32 (PPCxxswapd v4i32:$src)), (XXPERMDI $src, $src, 2)>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001088def : Pat<(v2f64 (PPCswapNoChain v2f64:$src)), (XXPERMDI $src, $src, 2)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001089
Tony Jiang0a429f02017-05-24 23:48:29 +00001090// PPCvecshl XT, XA, XA, 2 can be selected to both XXSLDWI XT,XA,XA,2 and
1091// XXSWAPD XT,XA (i.e. XXPERMDI XT,XA,XA,2), the later one is more profitable.
1092def : Pat<(v4i32 (PPCvecshl v4i32:$src, v4i32:$src, 2)), (XXPERMDI $src, $src, 2)>;
1093
Bill Schmidt61e65232014-10-22 13:13:40 +00001094// Selects.
1095def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001096 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1097def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001098 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1099def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001100 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1101def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001102 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1103def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETEQ)),
1104 (SELECT_VSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1105def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001106 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1107def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001108 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1109def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001110 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1111def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001112 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1113def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETNE)),
1114 (SELECT_VSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1115
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001116def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001117 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1118def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001119 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1120def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001121 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1122def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001123 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1124def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETEQ)),
1125 (SELECT_VSFRC (CREQV $lhs, $rhs), $tval, $fval)>;
1126def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001127 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1128def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001129 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1130def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001131 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1132def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001133 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1134def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETNE)),
1135 (SELECT_VSFRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1136
Bill Schmidt76746922014-11-14 12:10:40 +00001137// Divides.
1138def : Pat<(int_ppc_vsx_xvdivsp v4f32:$A, v4f32:$B),
1139 (XVDIVSP $A, $B)>;
1140def : Pat<(int_ppc_vsx_xvdivdp v2f64:$A, v2f64:$B),
1141 (XVDIVDP $A, $B)>;
1142
Nemanja Ivanovic984a3612015-07-14 17:25:20 +00001143// Reciprocal estimate
1144def : Pat<(int_ppc_vsx_xvresp v4f32:$A),
1145 (XVRESP $A)>;
1146def : Pat<(int_ppc_vsx_xvredp v2f64:$A),
1147 (XVREDP $A)>;
1148
Nemanja Ivanovicd358b8f2015-07-05 06:03:51 +00001149// Recip. square root estimate
1150def : Pat<(int_ppc_vsx_xvrsqrtesp v4f32:$A),
1151 (XVRSQRTESP $A)>;
1152def : Pat<(int_ppc_vsx_xvrsqrtedp v2f64:$A),
1153 (XVRSQRTEDP $A)>;
1154
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001155let Predicates = [IsLittleEndian] in {
1156def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1157 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1158def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1159 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1160def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1161 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1162def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1163 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1164} // IsLittleEndian
1165
1166let Predicates = [IsBigEndian] in {
1167def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1168 (f64 (XSCVSXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1169def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1170 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1171def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1172 (f64 (XSCVUXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1173def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1174 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1175} // IsBigEndian
1176
Hal Finkel27774d92014-03-13 07:58:58 +00001177} // AddedComplexity
1178} // HasVSX
1179
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001180def ScalarLoads {
1181 dag Li8 = (i32 (extloadi8 xoaddr:$src));
1182 dag ZELi8 = (i32 (zextloadi8 xoaddr:$src));
1183 dag ZELi8i64 = (i64 (zextloadi8 xoaddr:$src));
1184 dag SELi8 = (i32 (sext_inreg (extloadi8 xoaddr:$src), i8));
1185 dag SELi8i64 = (i64 (sext_inreg (extloadi8 xoaddr:$src), i8));
1186
1187 dag Li16 = (i32 (extloadi16 xoaddr:$src));
1188 dag ZELi16 = (i32 (zextloadi16 xoaddr:$src));
1189 dag ZELi16i64 = (i64 (zextloadi16 xoaddr:$src));
1190 dag SELi16 = (i32 (sextloadi16 xoaddr:$src));
1191 dag SELi16i64 = (i64 (sextloadi16 xoaddr:$src));
1192
1193 dag Li32 = (i32 (load xoaddr:$src));
1194}
1195
Kit Barton298beb52015-02-18 16:21:46 +00001196// The following VSX instructions were introduced in Power ISA 2.07
1197/* FIXME: if the operands are v2i64, these patterns will not match.
1198 we should define new patterns or otherwise match the same patterns
1199 when the elements are larger than i32.
1200*/
1201def HasP8Vector : Predicate<"PPCSubTarget->hasP8Vector()">;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001202def HasDirectMove : Predicate<"PPCSubTarget->hasDirectMove()">;
Kit Barton298beb52015-02-18 16:21:46 +00001203let Predicates = [HasP8Vector] in {
1204let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001205 let isCommutable = 1, UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001206 def XXLEQV : XX3Form<60, 186,
1207 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1208 "xxleqv $XT, $XA, $XB", IIC_VecGeneral,
1209 [(set v4i32:$XT, (vnot_ppc (xor v4i32:$XA, v4i32:$XB)))]>;
1210 def XXLNAND : XX3Form<60, 178,
1211 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1212 "xxlnand $XT, $XA, $XB", IIC_VecGeneral,
1213 [(set v4i32:$XT, (vnot_ppc (and v4i32:$XA,
Kit Barton298beb52015-02-18 16:21:46 +00001214 v4i32:$XB)))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001215 } // isCommutable, UseVSXReg
Nemanja Ivanovicd9e4b4f2015-07-10 14:25:17 +00001216
Nemanja Ivanovic5655fb32015-07-10 12:38:08 +00001217 def : Pat<(int_ppc_vsx_xxleqv v4i32:$A, v4i32:$B),
1218 (XXLEQV $A, $B)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001219
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001220 let UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001221 def XXLORC : XX3Form<60, 170,
1222 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1223 "xxlorc $XT, $XA, $XB", IIC_VecGeneral,
1224 [(set v4i32:$XT, (or v4i32:$XA, (vnot_ppc v4i32:$XB)))]>;
1225
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001226 // VSX scalar loads introduced in ISA 2.07
Sean Fertile3c8c3852017-01-26 18:59:15 +00001227 let mayLoad = 1, mayStore = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001228 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001229 def LXSSPX : XX1Form_memOp<31, 524, (outs vssrc:$XT), (ins memrr:$src),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001230 "lxsspx $XT, $src", IIC_LdStLFD, []>;
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001231 def LXSIWAX : XX1Form_memOp<31, 76, (outs vsfrc:$XT), (ins memrr:$src),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001232 "lxsiwax $XT, $src", IIC_LdStLFD, []>;
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001233 def LXSIWZX : XX1Form_memOp<31, 12, (outs vsfrc:$XT), (ins memrr:$src),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001234 "lxsiwzx $XT, $src", IIC_LdStLFD, []>;
1235
1236 // Please note let isPseudo = 1 is not part of class Pseudo<>. Missing it
1237 // would cause these Pseudos are not expanded in expandPostRAPseudos()
1238 let isPseudo = 1 in {
1239 // Pseudo instruction XFLOADf32 will be expanded to LXSSPX or LFSX later
1240 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001241 def XFLOADf32 : PseudoXFormMemOp<(outs vssrc:$XT), (ins memrr:$src),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001242 "#XFLOADf32",
1243 [(set f32:$XT, (load xoaddr:$src))]>;
1244 // Pseudo instruction LIWAX will be expanded to LXSIWAX or LFIWAX later
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001245 def LIWAX : PseudoXFormMemOp<(outs vsfrc:$XT), (ins memrr:$src),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001246 "#LIWAX",
1247 [(set f64:$XT, (PPClfiwax xoaddr:$src))]>;
1248 // Pseudo instruction LIWZX will be expanded to LXSIWZX or LFIWZX later
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001249 def LIWZX : PseudoXFormMemOp<(outs vsfrc:$XT), (ins memrr:$src),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001250 "#LIWZX",
1251 [(set f64:$XT, (PPClfiwzx xoaddr:$src))]>;
1252 }
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001253 } // mayLoad
1254
1255 // VSX scalar stores introduced in ISA 2.07
Sean Fertile3c8c3852017-01-26 18:59:15 +00001256 let mayStore = 1, mayLoad = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001257 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001258 def STXSSPX : XX1Form_memOp<31, 652, (outs), (ins vssrc:$XT, memrr:$dst),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001259 "stxsspx $XT, $dst", IIC_LdStSTFD, []>;
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001260 def STXSIWX : XX1Form_memOp<31, 140, (outs), (ins vsfrc:$XT, memrr:$dst),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001261 "stxsiwx $XT, $dst", IIC_LdStSTFD, []>;
1262
1263 // Please note let isPseudo = 1 is not part of class Pseudo<>. Missing it
1264 // would cause these Pseudos are not expanded in expandPostRAPseudos()
1265 let isPseudo = 1 in {
1266 // Pseudo instruction XFSTOREf32 will be expanded to STXSSPX or STFSX later
1267 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001268 def XFSTOREf32 : PseudoXFormMemOp<(outs), (ins vssrc:$XT, memrr:$dst),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001269 "#XFSTOREf32",
1270 [(store f32:$XT, xoaddr:$dst)]>;
1271 // Pseudo instruction STIWX will be expanded to STXSIWX or STFIWX later
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001272 def STIWX : PseudoXFormMemOp<(outs), (ins vsfrc:$XT, memrr:$dst),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001273 "#STIWX",
1274 [(PPCstfiwx f64:$XT, xoaddr:$dst)]>;
1275 }
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001276 } // mayStore
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001277 } // UseVSXReg = 1
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001278
1279 def : Pat<(f64 (extloadf32 xoaddr:$src)),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001280 (COPY_TO_REGCLASS (XFLOADf32 xoaddr:$src), VSFRC)>;
Lei Huangcd4f3852018-03-12 19:26:18 +00001281 def : Pat<(f32 (fpround (f64 (extloadf32 xoaddr:$src)))),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001282 (f32 (XFLOADf32 xoaddr:$src))>;
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +00001283 def : Pat<(f64 (fpextend f32:$src)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001284 (COPY_TO_REGCLASS $src, VSFRC)>;
Hal Finkela2cdbce2015-08-30 22:12:50 +00001285
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001286 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001287 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1288 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001289 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1290 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001291 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1292 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001293 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1294 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETEQ)),
1295 (SELECT_VSSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1296 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001297 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1298 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001299 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1300 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001301 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1302 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001303 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1304 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETNE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001305 (SELECT_VSSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001306
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001307 let UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001308 // VSX Elementary Scalar FP arithmetic (SP)
1309 let isCommutable = 1 in {
1310 def XSADDSP : XX3Form<60, 0,
1311 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1312 "xsaddsp $XT, $XA, $XB", IIC_VecFP,
1313 [(set f32:$XT, (fadd f32:$XA, f32:$XB))]>;
1314 def XSMULSP : XX3Form<60, 16,
1315 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1316 "xsmulsp $XT, $XA, $XB", IIC_VecFP,
1317 [(set f32:$XT, (fmul f32:$XA, f32:$XB))]>;
1318 } // isCommutable
1319
1320 def XSDIVSP : XX3Form<60, 24,
1321 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1322 "xsdivsp $XT, $XA, $XB", IIC_FPDivS,
1323 [(set f32:$XT, (fdiv f32:$XA, f32:$XB))]>;
1324 def XSRESP : XX2Form<60, 26,
1325 (outs vssrc:$XT), (ins vssrc:$XB),
1326 "xsresp $XT, $XB", IIC_VecFP,
1327 [(set f32:$XT, (PPCfre f32:$XB))]>;
1328 def XSSQRTSP : XX2Form<60, 11,
1329 (outs vssrc:$XT), (ins vssrc:$XB),
1330 "xssqrtsp $XT, $XB", IIC_FPSqrtS,
1331 [(set f32:$XT, (fsqrt f32:$XB))]>;
1332 def XSRSQRTESP : XX2Form<60, 10,
1333 (outs vssrc:$XT), (ins vssrc:$XB),
1334 "xsrsqrtesp $XT, $XB", IIC_VecFP,
1335 [(set f32:$XT, (PPCfrsqrte f32:$XB))]>;
1336 def XSSUBSP : XX3Form<60, 8,
1337 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1338 "xssubsp $XT, $XA, $XB", IIC_VecFP,
1339 [(set f32:$XT, (fsub f32:$XA, f32:$XB))]>;
Nemanja Ivanovic376e1732015-05-29 17:13:25 +00001340
1341 // FMA Instructions
1342 let BaseName = "XSMADDASP" in {
1343 let isCommutable = 1 in
1344 def XSMADDASP : XX3Form<60, 1,
1345 (outs vssrc:$XT),
1346 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1347 "xsmaddasp $XT, $XA, $XB", IIC_VecFP,
1348 [(set f32:$XT, (fma f32:$XA, f32:$XB, f32:$XTi))]>,
1349 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1350 AltVSXFMARel;
1351 let IsVSXFMAAlt = 1 in
1352 def XSMADDMSP : XX3Form<60, 9,
1353 (outs vssrc:$XT),
1354 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1355 "xsmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1356 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1357 AltVSXFMARel;
1358 }
1359
1360 let BaseName = "XSMSUBASP" in {
1361 let isCommutable = 1 in
1362 def XSMSUBASP : XX3Form<60, 17,
1363 (outs vssrc:$XT),
1364 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1365 "xsmsubasp $XT, $XA, $XB", IIC_VecFP,
1366 [(set f32:$XT, (fma f32:$XA, f32:$XB,
1367 (fneg f32:$XTi)))]>,
1368 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1369 AltVSXFMARel;
1370 let IsVSXFMAAlt = 1 in
1371 def XSMSUBMSP : XX3Form<60, 25,
1372 (outs vssrc:$XT),
1373 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1374 "xsmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1375 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1376 AltVSXFMARel;
1377 }
1378
1379 let BaseName = "XSNMADDASP" in {
1380 let isCommutable = 1 in
1381 def XSNMADDASP : XX3Form<60, 129,
1382 (outs vssrc:$XT),
1383 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1384 "xsnmaddasp $XT, $XA, $XB", IIC_VecFP,
1385 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1386 f32:$XTi)))]>,
1387 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1388 AltVSXFMARel;
1389 let IsVSXFMAAlt = 1 in
1390 def XSNMADDMSP : XX3Form<60, 137,
1391 (outs vssrc:$XT),
1392 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1393 "xsnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1394 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1395 AltVSXFMARel;
1396 }
1397
1398 let BaseName = "XSNMSUBASP" in {
1399 let isCommutable = 1 in
1400 def XSNMSUBASP : XX3Form<60, 145,
1401 (outs vssrc:$XT),
1402 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1403 "xsnmsubasp $XT, $XA, $XB", IIC_VecFP,
1404 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1405 (fneg f32:$XTi))))]>,
1406 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1407 AltVSXFMARel;
1408 let IsVSXFMAAlt = 1 in
1409 def XSNMSUBMSP : XX3Form<60, 153,
1410 (outs vssrc:$XT),
1411 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1412 "xsnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1413 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1414 AltVSXFMARel;
1415 }
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001416
1417 // Single Precision Conversions (FP <-> INT)
1418 def XSCVSXDSP : XX2Form<60, 312,
1419 (outs vssrc:$XT), (ins vsfrc:$XB),
1420 "xscvsxdsp $XT, $XB", IIC_VecFP,
1421 [(set f32:$XT, (PPCfcfids f64:$XB))]>;
1422 def XSCVUXDSP : XX2Form<60, 296,
1423 (outs vssrc:$XT), (ins vsfrc:$XB),
1424 "xscvuxdsp $XT, $XB", IIC_VecFP,
1425 [(set f32:$XT, (PPCfcfidus f64:$XB))]>;
1426
1427 // Conversions between vector and scalar single precision
1428 def XSCVDPSPN : XX2Form<60, 267, (outs vsrc:$XT), (ins vssrc:$XB),
1429 "xscvdpspn $XT, $XB", IIC_VecFP, []>;
1430 def XSCVSPDPN : XX2Form<60, 331, (outs vssrc:$XT), (ins vsrc:$XB),
1431 "xscvspdpn $XT, $XB", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001432 } // UseVSXReg = 1
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001433
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001434 let Predicates = [IsLittleEndian] in {
Lei Huangcd4f3852018-03-12 19:26:18 +00001435 def : Pat<(f32 (PPCfcfids
1436 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S, 0)))))),
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001437 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00001438 def : Pat<(f32 (PPCfcfids
1439 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S, 1)))))),
1440 (f32 (XSCVSXDSP (COPY_TO_REGCLASS
1441 (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1442 def : Pat<(f32 (PPCfcfidus
1443 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S, 0)))))),
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001444 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00001445 def : Pat<(f32 (PPCfcfidus
1446 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S, 1)))))),
1447 (f32 (XSCVUXDSP (COPY_TO_REGCLASS
1448 (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001449 }
1450
1451 let Predicates = [IsBigEndian] in {
Lei Huangcd4f3852018-03-12 19:26:18 +00001452 def : Pat<(f32 (PPCfcfids
1453 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S, 0)))))),
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001454 (f32 (XSCVSXDSP (COPY_TO_REGCLASS $S, VSFRC)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00001455 def : Pat<(f32 (PPCfcfids
1456 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S, 1)))))),
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001457 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00001458 def : Pat<(f32 (PPCfcfidus
1459 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S, 0)))))),
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001460 (f32 (XSCVUXDSP (COPY_TO_REGCLASS $S, VSFRC)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00001461 def : Pat<(f32 (PPCfcfidus
1462 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S, 1)))))),
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001463 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1464 }
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001465 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.Li32)),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001466 (v4i32 (XXSPLTWs (LIWAX xoaddr:$src), 1))>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001467} // AddedComplexity = 400
Kit Barton298beb52015-02-18 16:21:46 +00001468} // HasP8Vector
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001469
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001470let UseVSXReg = 1, AddedComplexity = 400 in {
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001471let Predicates = [HasDirectMove] in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001472 // VSX direct move instructions
1473 def MFVSRD : XX1_RS6_RD5_XO<31, 51, (outs g8rc:$rA), (ins vsfrc:$XT),
1474 "mfvsrd $rA, $XT", IIC_VecGeneral,
1475 [(set i64:$rA, (PPCmfvsr f64:$XT))]>,
1476 Requires<[In64BitMode]>;
Nemanja Ivanovicffcf0fb2017-03-15 16:04:53 +00001477 let isCodeGenOnly = 1 in
1478 def MFVRD : XX1_RS6_RD5_XO<31, 51, (outs g8rc:$rA), (ins vrrc:$XT),
1479 "mfvsrd $rA, $XT", IIC_VecGeneral,
1480 []>,
1481 Requires<[In64BitMode]>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001482 def MFVSRWZ : XX1_RS6_RD5_XO<31, 115, (outs gprc:$rA), (ins vsfrc:$XT),
1483 "mfvsrwz $rA, $XT", IIC_VecGeneral,
1484 [(set i32:$rA, (PPCmfvsr f64:$XT))]>;
1485 def MTVSRD : XX1_RS6_RD5_XO<31, 179, (outs vsfrc:$XT), (ins g8rc:$rA),
1486 "mtvsrd $XT, $rA", IIC_VecGeneral,
1487 [(set f64:$XT, (PPCmtvsra i64:$rA))]>,
1488 Requires<[In64BitMode]>;
1489 def MTVSRWA : XX1_RS6_RD5_XO<31, 211, (outs vsfrc:$XT), (ins gprc:$rA),
1490 "mtvsrwa $XT, $rA", IIC_VecGeneral,
1491 [(set f64:$XT, (PPCmtvsra i32:$rA))]>;
1492 def MTVSRWZ : XX1_RS6_RD5_XO<31, 243, (outs vsfrc:$XT), (ins gprc:$rA),
1493 "mtvsrwz $XT, $rA", IIC_VecGeneral,
1494 [(set f64:$XT, (PPCmtvsrz i32:$rA))]>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001495} // HasDirectMove
1496
1497let Predicates = [IsISA3_0, HasDirectMove] in {
1498 def MTVSRWS: XX1_RS6_RD5_XO<31, 403, (outs vsrc:$XT), (ins gprc:$rA),
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00001499 "mtvsrws $XT, $rA", IIC_VecGeneral, []>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001500
Guozhi Wei22e7da92017-05-11 22:17:35 +00001501 def MTVSRDD: XX1Form<31, 435, (outs vsrc:$XT), (ins g8rc_nox0:$rA, g8rc:$rB),
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001502 "mtvsrdd $XT, $rA, $rB", IIC_VecGeneral,
1503 []>, Requires<[In64BitMode]>;
1504
1505 def MFVSRLD: XX1_RS6_RD5_XO<31, 307, (outs g8rc:$rA), (ins vsrc:$XT),
1506 "mfvsrld $rA, $XT", IIC_VecGeneral,
1507 []>, Requires<[In64BitMode]>;
1508
1509} // IsISA3_0, HasDirectMove
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001510} // UseVSXReg = 1
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001511
Nemanja Ivanovicffcf0fb2017-03-15 16:04:53 +00001512// We want to parse this from asm, but we don't want to emit this as it would
1513// be emitted with a VSX reg. So leave Emit = 0 here.
1514def : InstAlias<"mfvrd $rA, $XT",
1515 (MFVRD g8rc:$rA, vrrc:$XT), 0>;
1516def : InstAlias<"mffprd $rA, $src",
1517 (MFVSRD g8rc:$rA, f8rc:$src)>;
1518
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001519/* Direct moves of various widths from GPR's into VSR's. Each move lines
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001520 the value up into element 0 (both BE and LE). Namely, entities smaller than
1521 a doubleword are shifted left and moved for BE. For LE, they're moved, then
1522 swapped to go into the least significant element of the VSR.
1523*/
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001524def MovesToVSR {
1525 dag BE_BYTE_0 =
1526 (MTVSRD
1527 (RLDICR
1528 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 56, 7));
1529 dag BE_HALF_0 =
1530 (MTVSRD
1531 (RLDICR
1532 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 48, 15));
1533 dag BE_WORD_0 =
1534 (MTVSRD
1535 (RLDICR
1536 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 32, 31));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001537 dag BE_DWORD_0 = (MTVSRD $A);
1538
1539 dag LE_MTVSRW = (MTVSRD (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001540 dag LE_WORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1541 LE_MTVSRW, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001542 dag LE_WORD_0 = (XXPERMDI LE_WORD_1, LE_WORD_1, 2);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001543 dag LE_DWORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1544 BE_DWORD_0, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001545 dag LE_DWORD_0 = (XXPERMDI LE_DWORD_1, LE_DWORD_1, 2);
1546}
1547
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001548/* Patterns for extracting elements out of vectors. Integer elements are
1549 extracted using direct move operations. Patterns for extracting elements
1550 whose indices are not available at compile time are also provided with
1551 various _VARIABLE_ patterns.
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001552 The numbering for the DAG's is for LE, but when used on BE, the correct
1553 LE element can just be used (i.e. LE_BYTE_2 == BE_BYTE_13).
1554*/
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001555def VectorExtractions {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001556 // Doubleword extraction
1557 dag LE_DWORD_0 =
1558 (MFVSRD
1559 (EXTRACT_SUBREG
1560 (XXPERMDI (COPY_TO_REGCLASS $S, VSRC),
1561 (COPY_TO_REGCLASS $S, VSRC), 2), sub_64));
1562 dag LE_DWORD_1 = (MFVSRD
1563 (EXTRACT_SUBREG
1564 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1565
1566 // Word extraction
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001567 dag LE_WORD_0 = (MFVSRWZ (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001568 dag LE_WORD_1 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 1), sub_64));
1569 dag LE_WORD_2 = (MFVSRWZ (EXTRACT_SUBREG
1570 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1571 dag LE_WORD_3 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 3), sub_64));
1572
1573 // Halfword extraction
1574 dag LE_HALF_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 48), sub_32));
1575 dag LE_HALF_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 48), sub_32));
1576 dag LE_HALF_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 48), sub_32));
1577 dag LE_HALF_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 48), sub_32));
1578 dag LE_HALF_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 48), sub_32));
1579 dag LE_HALF_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 48), sub_32));
1580 dag LE_HALF_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 48), sub_32));
1581 dag LE_HALF_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 48), sub_32));
1582
1583 // Byte extraction
1584 dag LE_BYTE_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 56), sub_32));
1585 dag LE_BYTE_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 56, 56), sub_32));
1586 dag LE_BYTE_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 56), sub_32));
1587 dag LE_BYTE_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 40, 56), sub_32));
1588 dag LE_BYTE_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 56), sub_32));
1589 dag LE_BYTE_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 24, 56), sub_32));
1590 dag LE_BYTE_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 56), sub_32));
1591 dag LE_BYTE_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 8, 56), sub_32));
1592 dag LE_BYTE_8 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 56), sub_32));
1593 dag LE_BYTE_9 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 56, 56), sub_32));
1594 dag LE_BYTE_10 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 56), sub_32));
1595 dag LE_BYTE_11 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 40, 56), sub_32));
1596 dag LE_BYTE_12 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 56), sub_32));
1597 dag LE_BYTE_13 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 24, 56), sub_32));
1598 dag LE_BYTE_14 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 56), sub_32));
1599 dag LE_BYTE_15 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 8, 56), sub_32));
1600
1601 /* Variable element number (BE and LE patterns must be specified separately)
1602 This is a rather involved process.
1603
1604 Conceptually, this is how the move is accomplished:
1605 1. Identify which doubleword contains the element
1606 2. Shift in the VMX register so that the correct doubleword is correctly
1607 lined up for the MFVSRD
1608 3. Perform the move so that the element (along with some extra stuff)
1609 is in the GPR
1610 4. Right shift within the GPR so that the element is right-justified
1611
1612 Of course, the index is an element number which has a different meaning
1613 on LE/BE so the patterns have to be specified separately.
1614
1615 Note: The final result will be the element right-justified with high
1616 order bits being arbitrarily defined (namely, whatever was in the
1617 vector register to the left of the value originally).
1618 */
1619
1620 /* LE variable byte
1621 Number 1. above:
1622 - For elements 0-7, we shift left by 8 bytes since they're on the right
1623 - For elements 8-15, we need not shift (shift left by zero bytes)
1624 This is accomplished by inverting the bits of the index and AND-ing
1625 with 0x8 (i.e. clearing all bits of the index and inverting bit 60).
1626 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001627 dag LE_VBYTE_PERM_VEC = (v16i8 (LVSL ZERO8, (ANDC8 (LI8 8), $Idx)));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001628
1629 // Number 2. above:
1630 // - Now that we set up the shift amount, we shift in the VMX register
Lei Huangcd4f3852018-03-12 19:26:18 +00001631 dag LE_VBYTE_PERMUTE = (v16i8 (VPERM $S, $S, LE_VBYTE_PERM_VEC));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001632
1633 // Number 3. above:
1634 // - The doubleword containing our element is moved to a GPR
1635 dag LE_MV_VBYTE = (MFVSRD
1636 (EXTRACT_SUBREG
1637 (v2i64 (COPY_TO_REGCLASS LE_VBYTE_PERMUTE, VSRC)),
1638 sub_64));
1639
1640 /* Number 4. above:
1641 - Truncate the element number to the range 0-7 (8-15 are symmetrical
1642 and out of range values are truncated accordingly)
1643 - Multiply by 8 as we need to shift right by the number of bits, not bytes
1644 - Shift right in the GPR by the calculated value
1645 */
1646 dag LE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 7), $Idx), 3, 60),
1647 sub_32);
1648 dag LE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD LE_MV_VBYTE, LE_VBYTE_SHIFT),
1649 sub_32);
1650
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001651 /* LE variable halfword
1652 Number 1. above:
1653 - For elements 0-3, we shift left by 8 since they're on the right
1654 - For elements 4-7, we need not shift (shift left by zero bytes)
1655 Similarly to the byte pattern, we invert the bits of the index, but we
1656 AND with 0x4 (i.e. clear all bits of the index and invert bit 61).
1657 Of course, the shift is still by 8 bytes, so we must multiply by 2.
1658 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001659 dag LE_VHALF_PERM_VEC =
1660 (v16i8 (LVSL ZERO8, (RLDICR (ANDC8 (LI8 4), $Idx), 1, 62)));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001661
1662 // Number 2. above:
1663 // - Now that we set up the shift amount, we shift in the VMX register
Lei Huangcd4f3852018-03-12 19:26:18 +00001664 dag LE_VHALF_PERMUTE = (v16i8 (VPERM $S, $S, LE_VHALF_PERM_VEC));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001665
1666 // Number 3. above:
1667 // - The doubleword containing our element is moved to a GPR
1668 dag LE_MV_VHALF = (MFVSRD
1669 (EXTRACT_SUBREG
1670 (v2i64 (COPY_TO_REGCLASS LE_VHALF_PERMUTE, VSRC)),
1671 sub_64));
1672
1673 /* Number 4. above:
1674 - Truncate the element number to the range 0-3 (4-7 are symmetrical
1675 and out of range values are truncated accordingly)
1676 - Multiply by 16 as we need to shift right by the number of bits
1677 - Shift right in the GPR by the calculated value
1678 */
1679 dag LE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 3), $Idx), 4, 59),
1680 sub_32);
1681 dag LE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD LE_MV_VHALF, LE_VHALF_SHIFT),
1682 sub_32);
1683
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001684 /* LE variable word
1685 Number 1. above:
1686 - For elements 0-1, we shift left by 8 since they're on the right
1687 - For elements 2-3, we need not shift
1688 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001689 dag LE_VWORD_PERM_VEC = (v16i8 (LVSL ZERO8,
1690 (RLDICR (ANDC8 (LI8 2), $Idx), 2, 61)));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001691
1692 // Number 2. above:
1693 // - Now that we set up the shift amount, we shift in the VMX register
Lei Huangcd4f3852018-03-12 19:26:18 +00001694 dag LE_VWORD_PERMUTE = (v16i8 (VPERM $S, $S, LE_VWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001695
1696 // Number 3. above:
1697 // - The doubleword containing our element is moved to a GPR
1698 dag LE_MV_VWORD = (MFVSRD
1699 (EXTRACT_SUBREG
1700 (v2i64 (COPY_TO_REGCLASS LE_VWORD_PERMUTE, VSRC)),
1701 sub_64));
1702
1703 /* Number 4. above:
1704 - Truncate the element number to the range 0-1 (2-3 are symmetrical
1705 and out of range values are truncated accordingly)
1706 - Multiply by 32 as we need to shift right by the number of bits
1707 - Shift right in the GPR by the calculated value
1708 */
1709 dag LE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 1), $Idx), 5, 58),
1710 sub_32);
1711 dag LE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD LE_MV_VWORD, LE_VWORD_SHIFT),
1712 sub_32);
1713
1714 /* LE variable doubleword
1715 Number 1. above:
1716 - For element 0, we shift left by 8 since it's on the right
1717 - For element 1, we need not shift
1718 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001719 dag LE_VDWORD_PERM_VEC = (v16i8 (LVSL ZERO8,
1720 (RLDICR (ANDC8 (LI8 1), $Idx), 3, 60)));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001721
1722 // Number 2. above:
1723 // - Now that we set up the shift amount, we shift in the VMX register
Lei Huangcd4f3852018-03-12 19:26:18 +00001724 dag LE_VDWORD_PERMUTE = (v16i8 (VPERM $S, $S, LE_VDWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001725
1726 // Number 3. above:
1727 // - The doubleword containing our element is moved to a GPR
1728 // - Number 4. is not needed for the doubleword as the value is 64-bits
1729 dag LE_VARIABLE_DWORD =
1730 (MFVSRD (EXTRACT_SUBREG
1731 (v2i64 (COPY_TO_REGCLASS LE_VDWORD_PERMUTE, VSRC)),
1732 sub_64));
1733
1734 /* LE variable float
1735 - Shift the vector to line up the desired element to BE Word 0
1736 - Convert 32-bit float to a 64-bit single precision float
1737 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001738 dag LE_VFLOAT_PERM_VEC = (v16i8 (LVSL ZERO8,
1739 (RLDICR (XOR8 (LI8 3), $Idx), 2, 61)));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001740 dag LE_VFLOAT_PERMUTE = (VPERM $S, $S, LE_VFLOAT_PERM_VEC);
1741 dag LE_VARIABLE_FLOAT = (XSCVSPDPN LE_VFLOAT_PERMUTE);
1742
1743 /* LE variable double
1744 Same as the LE doubleword except there is no move.
1745 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001746 dag LE_VDOUBLE_PERMUTE = (v16i8 (VPERM (v16i8 (COPY_TO_REGCLASS $S, VRRC)),
1747 (v16i8 (COPY_TO_REGCLASS $S, VRRC)),
1748 LE_VDWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001749 dag LE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS LE_VDOUBLE_PERMUTE, VSRC);
1750
1751 /* BE variable byte
1752 The algorithm here is the same as the LE variable byte except:
1753 - The shift in the VMX register is by 0/8 for opposite element numbers so
1754 we simply AND the element number with 0x8
1755 - The order of elements after the move to GPR is reversed, so we invert
1756 the bits of the index prior to truncating to the range 0-7
1757 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001758 dag BE_VBYTE_PERM_VEC = (v16i8 (LVSL ZERO8, (ANDIo8 $Idx, 8)));
1759 dag BE_VBYTE_PERMUTE = (v16i8 (VPERM $S, $S, BE_VBYTE_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001760 dag BE_MV_VBYTE = (MFVSRD
1761 (EXTRACT_SUBREG
1762 (v2i64 (COPY_TO_REGCLASS BE_VBYTE_PERMUTE, VSRC)),
1763 sub_64));
1764 dag BE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 7), $Idx), 3, 60),
1765 sub_32);
1766 dag BE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD BE_MV_VBYTE, BE_VBYTE_SHIFT),
1767 sub_32);
1768
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001769 /* BE variable halfword
1770 The algorithm here is the same as the LE variable halfword except:
1771 - The shift in the VMX register is by 0/8 for opposite element numbers so
1772 we simply AND the element number with 0x4 and multiply by 2
1773 - The order of elements after the move to GPR is reversed, so we invert
1774 the bits of the index prior to truncating to the range 0-3
1775 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001776 dag BE_VHALF_PERM_VEC = (v16i8 (LVSL ZERO8,
1777 (RLDICR (ANDIo8 $Idx, 4), 1, 62)));
1778 dag BE_VHALF_PERMUTE = (v16i8 (VPERM $S, $S, BE_VHALF_PERM_VEC));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001779 dag BE_MV_VHALF = (MFVSRD
1780 (EXTRACT_SUBREG
1781 (v2i64 (COPY_TO_REGCLASS BE_VHALF_PERMUTE, VSRC)),
1782 sub_64));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001783 dag BE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 3), $Idx), 4, 59),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001784 sub_32);
1785 dag BE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD BE_MV_VHALF, BE_VHALF_SHIFT),
1786 sub_32);
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001787
1788 /* BE variable word
1789 The algorithm is the same as the LE variable word except:
1790 - The shift in the VMX register happens for opposite element numbers
1791 - The order of elements after the move to GPR is reversed, so we invert
1792 the bits of the index prior to truncating to the range 0-1
1793 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001794 dag BE_VWORD_PERM_VEC = (v16i8 (LVSL ZERO8,
1795 (RLDICR (ANDIo8 $Idx, 2), 2, 61)));
1796 dag BE_VWORD_PERMUTE = (v16i8 (VPERM $S, $S, BE_VWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001797 dag BE_MV_VWORD = (MFVSRD
1798 (EXTRACT_SUBREG
1799 (v2i64 (COPY_TO_REGCLASS BE_VWORD_PERMUTE, VSRC)),
1800 sub_64));
1801 dag BE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 1), $Idx), 5, 58),
1802 sub_32);
1803 dag BE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD BE_MV_VWORD, BE_VWORD_SHIFT),
1804 sub_32);
1805
1806 /* BE variable doubleword
1807 Same as the LE doubleword except we shift in the VMX register for opposite
1808 element indices.
1809 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001810 dag BE_VDWORD_PERM_VEC = (v16i8 (LVSL ZERO8,
1811 (RLDICR (ANDIo8 $Idx, 1), 3, 60)));
1812 dag BE_VDWORD_PERMUTE = (v16i8 (VPERM $S, $S, BE_VDWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001813 dag BE_VARIABLE_DWORD =
1814 (MFVSRD (EXTRACT_SUBREG
1815 (v2i64 (COPY_TO_REGCLASS BE_VDWORD_PERMUTE, VSRC)),
1816 sub_64));
1817
1818 /* BE variable float
1819 - Shift the vector to line up the desired element to BE Word 0
1820 - Convert 32-bit float to a 64-bit single precision float
1821 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001822 dag BE_VFLOAT_PERM_VEC = (v16i8 (LVSL ZERO8, (RLDICR $Idx, 2, 61)));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001823 dag BE_VFLOAT_PERMUTE = (VPERM $S, $S, BE_VFLOAT_PERM_VEC);
1824 dag BE_VARIABLE_FLOAT = (XSCVSPDPN BE_VFLOAT_PERMUTE);
1825
1826 /* BE variable double
1827 Same as the BE doubleword except there is no move.
1828 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001829 dag BE_VDOUBLE_PERMUTE = (v16i8 (VPERM (v16i8 (COPY_TO_REGCLASS $S, VRRC)),
1830 (v16i8 (COPY_TO_REGCLASS $S, VRRC)),
1831 BE_VDWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001832 dag BE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS BE_VDOUBLE_PERMUTE, VSRC);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001833}
1834
Zaara Syeda48cb3c12017-11-27 17:11:03 +00001835def NoP9Altivec : Predicate<"!PPCSubTarget->hasP9Altivec()">;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001836let AddedComplexity = 400 in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001837// v4f32 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001838let Predicates = [IsBigEndian, HasP8Vector] in {
1839 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1840 (v4f32 (XSCVDPSPN $A))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001841 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1842 (f32 (XSCVSPDPN $S))>;
1843 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
1844 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
1845 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001846 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001847 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
1848 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001849 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
1850 (f32 VectorExtractions.BE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001851} // IsBigEndian, HasP8Vector
1852
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001853// Variable index vector_extract for v2f64 does not require P8Vector
1854let Predicates = [IsBigEndian, HasVSX] in
1855 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
1856 (f64 VectorExtractions.BE_VARIABLE_DOUBLE)>;
1857
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001858let Predicates = [IsBigEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001859 // v16i8 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001860 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001861 (v16i8 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_BYTE_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001862 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001863 (v8i16 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_HALF_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001864 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001865 (v4i32 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_WORD_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001866 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001867 (v2i64 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_DWORD_0, sub_64))>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00001868
1869 // v2i64 scalar <-> vector conversions (BE)
1870 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
1871 (i64 VectorExtractions.LE_DWORD_1)>;
1872 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
1873 (i64 VectorExtractions.LE_DWORD_0)>;
1874 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
1875 (i64 VectorExtractions.BE_VARIABLE_DWORD)>;
1876} // IsBigEndian, HasDirectMove
1877
1878let Predicates = [IsBigEndian, HasDirectMove, NoP9Altivec] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001879 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001880 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001881 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001882 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001883 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001884 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001885 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001886 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001887 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001888 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001889 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001890 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001891 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001892 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001893 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001894 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001895 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001896 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001897 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001898 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001899 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001900 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001901 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001902 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001903 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001904 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001905 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001906 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001907 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001908 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001909 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001910 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001911 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001912 (i32 VectorExtractions.BE_VARIABLE_BYTE)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001913
1914 // v8i16 scalar <-> vector conversions (BE)
1915 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001916 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001917 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001918 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001919 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001920 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001921 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001922 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001923 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001924 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001925 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001926 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001927 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001928 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001929 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001930 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001931 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001932 (i32 VectorExtractions.BE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001933
1934 // v4i32 scalar <-> vector conversions (BE)
1935 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001936 (i32 VectorExtractions.LE_WORD_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001937 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001938 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001939 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001940 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001941 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001942 (i32 VectorExtractions.LE_WORD_0)>;
1943 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
1944 (i32 VectorExtractions.BE_VARIABLE_WORD)>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00001945} // IsBigEndian, HasDirectMove, NoP9Altivec
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001946
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001947// v4f32 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001948let Predicates = [IsLittleEndian, HasP8Vector] in {
1949 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1950 (v4f32 (XXSLDWI (XSCVDPSPN $A), (XSCVDPSPN $A), 1))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001951 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1952 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
1953 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001954 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001955 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
1956 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
1957 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
1958 (f32 (XSCVSPDPN $S))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001959 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
1960 (f32 VectorExtractions.LE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001961} // IsLittleEndian, HasP8Vector
1962
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001963// Variable index vector_extract for v2f64 does not require P8Vector
1964let Predicates = [IsLittleEndian, HasVSX] in
1965 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
1966 (f64 VectorExtractions.LE_VARIABLE_DOUBLE)>;
1967
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +00001968def : Pat<(v4i32 (int_ppc_vsx_lxvw4x_be xoaddr:$src)), (LXVW4X xoaddr:$src)>;
1969def : Pat<(v2f64 (int_ppc_vsx_lxvd2x_be xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Tony Jiang5f850cd2016-11-15 14:25:56 +00001970
Tony Jiangaa5a6a12017-07-05 16:55:00 +00001971// Variable index unsigned vector_extract on Power9
1972let Predicates = [HasP9Altivec, IsLittleEndian] in {
1973 def : Pat<(i64 (anyext (i32 (vector_extract v16i8:$S, i64:$Idx)))),
1974 (VEXTUBRX $Idx, $S)>;
1975
1976 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, i64:$Idx)))),
1977 (VEXTUHRX (RLWINM8 $Idx, 1, 28, 30), $S)>;
1978 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 0)))),
1979 (VEXTUHRX (LI8 0), $S)>;
1980 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 1)))),
1981 (VEXTUHRX (LI8 2), $S)>;
1982 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 2)))),
1983 (VEXTUHRX (LI8 4), $S)>;
1984 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 3)))),
1985 (VEXTUHRX (LI8 6), $S)>;
1986 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 4)))),
1987 (VEXTUHRX (LI8 8), $S)>;
1988 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 5)))),
1989 (VEXTUHRX (LI8 10), $S)>;
1990 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 6)))),
1991 (VEXTUHRX (LI8 12), $S)>;
1992 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 7)))),
1993 (VEXTUHRX (LI8 14), $S)>;
1994
1995 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
1996 (VEXTUWRX (RLWINM8 $Idx, 2, 28, 29), $S)>;
1997 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 0)))),
1998 (VEXTUWRX (LI8 0), $S)>;
1999 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 1)))),
2000 (VEXTUWRX (LI8 4), $S)>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002001 // For extracting LE word 2, MFVSRWZ is better than VEXTUWRX
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002002 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 2)))),
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002003 (INSERT_SUBREG (i64 (IMPLICIT_DEF)),
2004 (i32 VectorExtractions.LE_WORD_2), sub_32)>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002005 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 3)))),
2006 (VEXTUWRX (LI8 12), $S)>;
2007
2008 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
2009 (EXTSW (VEXTUWRX (RLWINM8 $Idx, 2, 28, 29), $S))>;
2010 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 0)))),
2011 (EXTSW (VEXTUWRX (LI8 0), $S))>;
2012 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 1)))),
2013 (EXTSW (VEXTUWRX (LI8 4), $S))>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002014 // For extracting LE word 2, MFVSRWZ is better than VEXTUWRX
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002015 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 2)))),
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002016 (EXTSW (INSERT_SUBREG (i64 (IMPLICIT_DEF)),
2017 (i32 VectorExtractions.LE_WORD_2), sub_32))>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002018 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 3)))),
2019 (EXTSW (VEXTUWRX (LI8 12), $S))>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002020
2021 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
2022 (i32 (EXTRACT_SUBREG (VEXTUBRX $Idx, $S), sub_32))>;
2023 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
2024 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 0), $S), sub_32))>;
2025 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
2026 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 1), $S), sub_32))>;
2027 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
2028 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 2), $S), sub_32))>;
2029 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
2030 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 3), $S), sub_32))>;
2031 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
2032 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 4), $S), sub_32))>;
2033 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
2034 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 5), $S), sub_32))>;
2035 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
2036 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 6), $S), sub_32))>;
2037 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
2038 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 7), $S), sub_32))>;
2039 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
2040 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 8), $S), sub_32))>;
2041 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
2042 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 9), $S), sub_32))>;
2043 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
2044 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 10), $S), sub_32))>;
2045 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
2046 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 11), $S), sub_32))>;
2047 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
2048 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 12), $S), sub_32))>;
2049 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
2050 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 13), $S), sub_32))>;
2051 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
2052 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 14), $S), sub_32))>;
2053 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
2054 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 15), $S), sub_32))>;
2055
2056 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
2057 (i32 (EXTRACT_SUBREG (VEXTUHRX
2058 (RLWINM8 $Idx, 1, 28, 30), $S), sub_32))>;
2059 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
2060 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 0), $S), sub_32))>;
2061 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
2062 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 2), $S), sub_32))>;
2063 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
2064 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 4), $S), sub_32))>;
2065 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
2066 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 6), $S), sub_32))>;
2067 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
2068 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 8), $S), sub_32))>;
2069 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
2070 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 10), $S), sub_32))>;
2071 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
2072 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 12), $S), sub_32))>;
2073 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
2074 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 14), $S), sub_32))>;
2075
2076 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
2077 (i32 (EXTRACT_SUBREG (VEXTUWRX
2078 (RLWINM8 $Idx, 2, 28, 29), $S), sub_32))>;
2079 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
2080 (i32 (EXTRACT_SUBREG (VEXTUWRX (LI8 0), $S), sub_32))>;
2081 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
2082 (i32 (EXTRACT_SUBREG (VEXTUWRX (LI8 4), $S), sub_32))>;
2083 // For extracting LE word 2, MFVSRWZ is better than VEXTUWRX
2084 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
2085 (i32 VectorExtractions.LE_WORD_2)>;
2086 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
2087 (i32 (EXTRACT_SUBREG (VEXTUWRX (LI8 12), $S), sub_32))>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002088}
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002089
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002090let Predicates = [HasP9Altivec, IsBigEndian] in {
2091 def : Pat<(i64 (anyext (i32 (vector_extract v16i8:$S, i64:$Idx)))),
2092 (VEXTUBLX $Idx, $S)>;
2093
2094 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, i64:$Idx)))),
2095 (VEXTUHLX (RLWINM8 $Idx, 1, 28, 30), $S)>;
2096 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 0)))),
2097 (VEXTUHLX (LI8 0), $S)>;
2098 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 1)))),
2099 (VEXTUHLX (LI8 2), $S)>;
2100 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 2)))),
2101 (VEXTUHLX (LI8 4), $S)>;
2102 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 3)))),
2103 (VEXTUHLX (LI8 6), $S)>;
2104 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 4)))),
2105 (VEXTUHLX (LI8 8), $S)>;
2106 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 5)))),
2107 (VEXTUHLX (LI8 10), $S)>;
2108 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 6)))),
2109 (VEXTUHLX (LI8 12), $S)>;
2110 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 7)))),
2111 (VEXTUHLX (LI8 14), $S)>;
2112
2113 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
2114 (VEXTUWLX (RLWINM8 $Idx, 2, 28, 29), $S)>;
2115 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 0)))),
2116 (VEXTUWLX (LI8 0), $S)>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002117
2118 // For extracting BE word 1, MFVSRWZ is better than VEXTUWLX
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002119 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 1)))),
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002120 (INSERT_SUBREG (i64 (IMPLICIT_DEF)),
2121 (i32 VectorExtractions.LE_WORD_2), sub_32)>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002122 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 2)))),
2123 (VEXTUWLX (LI8 8), $S)>;
2124 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 3)))),
2125 (VEXTUWLX (LI8 12), $S)>;
2126
2127 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
2128 (EXTSW (VEXTUWLX (RLWINM8 $Idx, 2, 28, 29), $S))>;
2129 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 0)))),
2130 (EXTSW (VEXTUWLX (LI8 0), $S))>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002131 // For extracting BE word 1, MFVSRWZ is better than VEXTUWLX
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002132 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 1)))),
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002133 (EXTSW (INSERT_SUBREG (i64 (IMPLICIT_DEF)),
2134 (i32 VectorExtractions.LE_WORD_2), sub_32))>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002135 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 2)))),
2136 (EXTSW (VEXTUWLX (LI8 8), $S))>;
2137 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 3)))),
2138 (EXTSW (VEXTUWLX (LI8 12), $S))>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002139
2140 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
2141 (i32 (EXTRACT_SUBREG (VEXTUBLX $Idx, $S), sub_32))>;
2142 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
2143 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 0), $S), sub_32))>;
2144 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
2145 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 1), $S), sub_32))>;
2146 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
2147 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 2), $S), sub_32))>;
2148 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
2149 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 3), $S), sub_32))>;
2150 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
2151 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 4), $S), sub_32))>;
2152 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
2153 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 5), $S), sub_32))>;
2154 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
2155 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 6), $S), sub_32))>;
2156 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
2157 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 7), $S), sub_32))>;
2158 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
2159 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 8), $S), sub_32))>;
2160 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
2161 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 9), $S), sub_32))>;
2162 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
2163 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 10), $S), sub_32))>;
2164 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
2165 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 11), $S), sub_32))>;
2166 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
2167 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 12), $S), sub_32))>;
2168 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
2169 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 13), $S), sub_32))>;
2170 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
2171 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 14), $S), sub_32))>;
2172 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
2173 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 15), $S), sub_32))>;
2174
2175 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
2176 (i32 (EXTRACT_SUBREG (VEXTUHLX
2177 (RLWINM8 $Idx, 1, 28, 30), $S), sub_32))>;
2178 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
2179 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 0), $S), sub_32))>;
2180 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
2181 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 2), $S), sub_32))>;
2182 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
2183 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 4), $S), sub_32))>;
2184 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
2185 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 6), $S), sub_32))>;
2186 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
2187 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 8), $S), sub_32))>;
2188 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
2189 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 10), $S), sub_32))>;
2190 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
2191 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 12), $S), sub_32))>;
2192 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
2193 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 14), $S), sub_32))>;
2194
2195 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
2196 (i32 (EXTRACT_SUBREG (VEXTUWLX
2197 (RLWINM8 $Idx, 2, 28, 29), $S), sub_32))>;
2198 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
2199 (i32 (EXTRACT_SUBREG (VEXTUWLX (LI8 0), $S), sub_32))>;
2200 // For extracting BE word 1, MFVSRWZ is better than VEXTUWLX
2201 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
2202 (i32 VectorExtractions.LE_WORD_2)>;
2203 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
2204 (i32 (EXTRACT_SUBREG (VEXTUWLX (LI8 8), $S), sub_32))>;
2205 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
2206 (i32 (EXTRACT_SUBREG (VEXTUWLX (LI8 12), $S), sub_32))>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002207}
2208
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002209let Predicates = [IsLittleEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002210 // v16i8 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002211 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002212 (v16i8 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002213 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002214 (v8i16 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002215 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002216 (v4i32 MovesToVSR.LE_WORD_0)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002217 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002218 (v2i64 MovesToVSR.LE_DWORD_0)>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002219 // v2i64 scalar <-> vector conversions (LE)
2220 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
2221 (i64 VectorExtractions.LE_DWORD_0)>;
2222 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
2223 (i64 VectorExtractions.LE_DWORD_1)>;
2224 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
2225 (i64 VectorExtractions.LE_VARIABLE_DWORD)>;
2226} // IsLittleEndian, HasDirectMove
2227
2228let Predicates = [IsLittleEndian, HasDirectMove, NoP9Altivec] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002229 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002230 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002231 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002232 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002233 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002234 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002235 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002236 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002237 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002238 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002239 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002240 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002241 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002242 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002243 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002244 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002245 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002246 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002247 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002248 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002249 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002250 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002251 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002252 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002253 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002254 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002255 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002256 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002257 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002258 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002259 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002260 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002261 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002262 (i32 VectorExtractions.LE_VARIABLE_BYTE)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002263
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002264 // v8i16 scalar <-> vector conversions (LE)
2265 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002266 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002267 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002268 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002269 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002270 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002271 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002272 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002273 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002274 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002275 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002276 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002277 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002278 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002279 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002280 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002281 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002282 (i32 VectorExtractions.LE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002283
2284 // v4i32 scalar <-> vector conversions (LE)
2285 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002286 (i32 VectorExtractions.LE_WORD_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002287 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002288 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002289 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002290 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002291 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002292 (i32 VectorExtractions.LE_WORD_3)>;
2293 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
2294 (i32 VectorExtractions.LE_VARIABLE_WORD)>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002295} // IsLittleEndian, HasDirectMove, NoP9Altivec
Nemanja Ivanovic89224762015-12-15 14:50:34 +00002296
2297let Predicates = [HasDirectMove, HasVSX] in {
2298// bitconvert f32 -> i32
2299// (convert to 32-bit fp single, shift right 1 word, move to GPR)
2300def : Pat<(i32 (bitconvert f32:$S)),
2301 (i32 (MFVSRWZ (EXTRACT_SUBREG
Lei Huangcd4f3852018-03-12 19:26:18 +00002302 (XXSLDWI (XSCVDPSPN $S), (XSCVDPSPN $S), 3),
Nemanja Ivanovic89224762015-12-15 14:50:34 +00002303 sub_64)))>;
2304// bitconvert i32 -> f32
2305// (move to FPR, shift left 1 word, convert to 64-bit fp single)
2306def : Pat<(f32 (bitconvert i32:$A)),
2307 (f32 (XSCVSPDPN
2308 (XXSLDWI MovesToVSR.LE_WORD_1, MovesToVSR.LE_WORD_1, 1)))>;
2309
2310// bitconvert f64 -> i64
2311// (move to GPR, nothing else needed)
2312def : Pat<(i64 (bitconvert f64:$S)),
2313 (i64 (MFVSRD $S))>;
2314
2315// bitconvert i64 -> f64
2316// (move to FPR, nothing else needed)
2317def : Pat<(f64 (bitconvert i64:$S)),
2318 (f64 (MTVSRD $S))>;
2319}
Kit Barton93612ec2016-02-26 21:11:55 +00002320
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002321// Materialize a zero-vector of long long
2322def : Pat<(v2i64 immAllZerosV),
2323 (v2i64 (XXLXORz))>;
2324}
2325
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002326def AlignValues {
2327 dag F32_TO_BE_WORD1 = (v4f32 (XXSLDWI (XSCVDPSPN $B), (XSCVDPSPN $B), 3));
2328 dag I32_TO_BE_WORD1 = (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC);
2329}
2330
Kit Barton93612ec2016-02-26 21:11:55 +00002331// The following VSX instructions were introduced in Power ISA 3.0
2332def HasP9Vector : Predicate<"PPCSubTarget->hasP9Vector()">;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002333let AddedComplexity = 400, Predicates = [HasP9Vector] in {
Kit Barton93612ec2016-02-26 21:11:55 +00002334
2335 // [PO VRT XO VRB XO /]
2336 class X_VT5_XO5_VB5<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2337 list<dag> pattern>
2338 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vrrc:$vB),
2339 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2340
2341 // [PO VRT XO VRB XO RO], Round to Odd version of [PO VRT XO VRB XO /]
2342 class X_VT5_XO5_VB5_Ro<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2343 list<dag> pattern>
2344 : X_VT5_XO5_VB5<opcode, xo2, xo, opc, pattern>, isDOT;
2345
2346 // [PO VRT XO VRB XO /], but the VRB is only used the left 64 bits (or less),
2347 // So we use different operand class for VRB
2348 class X_VT5_XO5_VB5_TyVB<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2349 RegisterOperand vbtype, list<dag> pattern>
2350 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vbtype:$vB),
2351 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2352
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002353 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002354 // [PO T XO B XO BX /]
2355 class XX2_RT5_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2356 list<dag> pattern>
2357 : XX2_RD5_XO5_RS6<opcode, xo2, xo, (outs g8rc:$rT), (ins vsfrc:$XB),
2358 !strconcat(opc, " $rT, $XB"), IIC_VecFP, pattern>;
2359
Kit Barton93612ec2016-02-26 21:11:55 +00002360 // [PO T XO B XO BX TX]
2361 class XX2_XT6_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2362 RegisterOperand vtype, list<dag> pattern>
2363 : XX2_RD6_XO5_RS6<opcode, xo2, xo, (outs vtype:$XT), (ins vtype:$XB),
2364 !strconcat(opc, " $XT, $XB"), IIC_VecFP, pattern>;
2365
2366 // [PO T A B XO AX BX TX], src and dest register use different operand class
2367 class XX3_XT5_XA5_XB5<bits<6> opcode, bits<8> xo, string opc,
2368 RegisterOperand xty, RegisterOperand aty, RegisterOperand bty,
2369 InstrItinClass itin, list<dag> pattern>
2370 : XX3Form<opcode, xo, (outs xty:$XT), (ins aty:$XA, bty:$XB),
2371 !strconcat(opc, " $XT, $XA, $XB"), itin, pattern>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002372 } // UseVSXReg = 1
Kit Barton93612ec2016-02-26 21:11:55 +00002373
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002374 // [PO VRT VRA VRB XO /]
2375 class X_VT5_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2376 list<dag> pattern>
2377 : XForm_1<opcode, xo, (outs vrrc:$vT), (ins vrrc:$vA, vrrc:$vB),
2378 !strconcat(opc, " $vT, $vA, $vB"), IIC_VecFP, pattern>;
2379
2380 // [PO VRT VRA VRB XO RO], Round to Odd version of [PO VRT VRA VRB XO /]
2381 class X_VT5_VA5_VB5_Ro<bits<6> opcode, bits<10> xo, string opc,
2382 list<dag> pattern>
2383 : X_VT5_VA5_VB5<opcode, xo, opc, pattern>, isDOT;
2384
Lei Huang09fda632018-04-04 16:43:50 +00002385 // [PO VRT VRA VRB XO /]
2386 class X_VT5_VA5_VB5_FMA<bits<6> opcode, bits<10> xo, string opc,
2387 list<dag> pattern>
2388 : XForm_1<opcode, xo, (outs vrrc:$vT), (ins vrrc:$vTi, vrrc:$vA, vrrc:$vB),
2389 !strconcat(opc, " $vT, $vA, $vB"), IIC_VecFP, pattern>,
2390 RegConstraint<"$vTi = $vT">, NoEncode<"$vTi">;
2391
2392 // [PO VRT VRA VRB XO RO], Round to Odd version of [PO VRT VRA VRB XO /]
2393 class X_VT5_VA5_VB5_FMA_Ro<bits<6> opcode, bits<10> xo, string opc,
2394 list<dag> pattern>
2395 : X_VT5_VA5_VB5_FMA<opcode, xo, opc, pattern>, isDOT;
2396
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002397 //===--------------------------------------------------------------------===//
2398 // Quad-Precision Scalar Move Instructions:
2399
2400 // Copy Sign
Lei Huangecfede92018-03-19 19:22:52 +00002401 def XSCPSGNQP : X_VT5_VA5_VB5<63, 100, "xscpsgnqp",
2402 [(set f128:$vT,
2403 (fcopysign f128:$vB, f128:$vA))]>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002404
2405 // Absolute/Negative-Absolute/Negate
Lei Huangecfede92018-03-19 19:22:52 +00002406 def XSABSQP : X_VT5_XO5_VB5<63, 0, 804, "xsabsqp",
2407 [(set f128:$vT, (fabs f128:$vB))]>;
2408 def XSNABSQP : X_VT5_XO5_VB5<63, 8, 804, "xsnabsqp",
2409 [(set f128:$vT, (fneg (fabs f128:$vB)))]>;
2410 def XSNEGQP : X_VT5_XO5_VB5<63, 16, 804, "xsnegqp",
2411 [(set f128:$vT, (fneg f128:$vB))]>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002412
2413 //===--------------------------------------------------------------------===//
2414 // Quad-Precision Scalar Floating-Point Arithmetic Instructions:
2415
2416 // Add/Divide/Multiply/Subtract
Lei Huang6d1596a2018-03-19 18:52:20 +00002417 let isCommutable = 1 in {
2418 def XSADDQP : X_VT5_VA5_VB5 <63, 4, "xsaddqp",
2419 [(set f128:$vT, (fadd f128:$vA, f128:$vB))]>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002420 def XSADDQPO : X_VT5_VA5_VB5_Ro<63, 4, "xsaddqpo", []>;
Lei Huang6d1596a2018-03-19 18:52:20 +00002421 def XSMULQP : X_VT5_VA5_VB5 <63, 36, "xsmulqp",
2422 [(set f128:$vT, (fmul f128:$vA, f128:$vB))]>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002423 def XSMULQPO : X_VT5_VA5_VB5_Ro<63, 36, "xsmulqpo", []>;
Lei Huang6d1596a2018-03-19 18:52:20 +00002424 }
2425
2426 def XSSUBQP : X_VT5_VA5_VB5 <63, 516, "xssubqp" ,
2427 [(set f128:$vT, (fsub f128:$vA, f128:$vB))]>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002428 def XSSUBQPO : X_VT5_VA5_VB5_Ro<63, 516, "xssubqpo", []>;
Lei Huang6d1596a2018-03-19 18:52:20 +00002429 def XSDIVQP : X_VT5_VA5_VB5 <63, 548, "xsdivqp",
2430 [(set f128:$vT, (fdiv f128:$vA, f128:$vB))]>;
2431 def XSDIVQPO : X_VT5_VA5_VB5_Ro<63, 548, "xsdivqpo", []>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002432
2433 // Square-Root
Lei Huangecfede92018-03-19 19:22:52 +00002434 def XSSQRTQP : X_VT5_XO5_VB5 <63, 27, 804, "xssqrtqp",
2435 [(set f128:$vT, (fsqrt f128:$vB))]>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002436 def XSSQRTQPO : X_VT5_XO5_VB5_Ro<63, 27, 804, "xssqrtqpo", []>;
2437
2438 // (Negative) Multiply-{Add/Subtract}
Lei Huang09fda632018-04-04 16:43:50 +00002439 def XSMADDQP : X_VT5_VA5_VB5_FMA <63, 388, "xsmaddqp",
2440 [(set f128:$vT,
2441 (fma f128:$vA, f128:$vB,
2442 f128:$vTi))]>;
2443 def XSMADDQPO : X_VT5_VA5_VB5_FMA_Ro<63, 388, "xsmaddqpo" , []>;
2444 def XSMSUBQP : X_VT5_VA5_VB5_FMA <63, 420, "xsmsubqp" ,
2445 [(set f128:$vT,
2446 (fma f128:$vA, f128:$vB,
2447 (fneg f128:$vTi)))]>;
2448 def XSMSUBQPO : X_VT5_VA5_VB5_FMA_Ro<63, 420, "xsmsubqpo" , []>;
2449 def XSNMADDQP : X_VT5_VA5_VB5_FMA <63, 452, "xsnmaddqp",
2450 [(set f128:$vT,
2451 (fneg (fma f128:$vA, f128:$vB,
2452 f128:$vTi)))]>;
2453 def XSNMADDQPO: X_VT5_VA5_VB5_FMA_Ro<63, 452, "xsnmaddqpo", []>;
2454 def XSNMSUBQP : X_VT5_VA5_VB5_FMA <63, 484, "xsnmsubqp",
2455 [(set f128:$vT,
2456 (fneg (fma f128:$vA, f128:$vB,
2457 (fneg f128:$vTi))))]>;
2458 def XSNMSUBQPO: X_VT5_VA5_VB5_FMA_Ro<63, 484, "xsnmsubqpo", []>;
2459
2460 // Additional fnmsub patterns: -a*c + b == -(a*c - b)
2461 def : Pat<(fma (fneg f128:$A), f128:$C, f128:$B), (XSNMSUBQP $B, $C, $A)>;
2462 def : Pat<(fma f128:$A, (fneg f128:$C), f128:$B), (XSNMSUBQP $B, $C, $A)>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002463
Kit Barton93612ec2016-02-26 21:11:55 +00002464 //===--------------------------------------------------------------------===//
2465 // Quad/Double-Precision Compare Instructions:
2466
2467 // [PO BF // VRA VRB XO /]
2468 class X_BF3_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2469 list<dag> pattern>
2470 : XForm_17<opcode, xo, (outs crrc:$crD), (ins vrrc:$VA, vrrc:$VB),
2471 !strconcat(opc, " $crD, $VA, $VB"), IIC_FPCompare> {
2472 let Pattern = pattern;
2473 }
2474
2475 // QP Compare Ordered/Unordered
2476 def XSCMPOQP : X_BF3_VA5_VB5<63, 132, "xscmpoqp", []>;
2477 def XSCMPUQP : X_BF3_VA5_VB5<63, 644, "xscmpuqp", []>;
2478
2479 // DP/QP Compare Exponents
2480 def XSCMPEXPDP : XX3Form_1<60, 59,
2481 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002482 "xscmpexpdp $crD, $XA, $XB", IIC_FPCompare, []>,
2483 UseVSXReg;
Kit Barton93612ec2016-02-26 21:11:55 +00002484 def XSCMPEXPQP : X_BF3_VA5_VB5<63, 164, "xscmpexpqp", []>;
2485
2486 // DP Compare ==, >=, >, !=
2487 // Use vsrc for XT, because the entire register of XT is set.
2488 // XT.dword[1] = 0x0000_0000_0000_0000
2489 def XSCMPEQDP : XX3_XT5_XA5_XB5<60, 3, "xscmpeqdp", vsrc, vsfrc, vsfrc,
2490 IIC_FPCompare, []>;
2491 def XSCMPGEDP : XX3_XT5_XA5_XB5<60, 19, "xscmpgedp", vsrc, vsfrc, vsfrc,
2492 IIC_FPCompare, []>;
2493 def XSCMPGTDP : XX3_XT5_XA5_XB5<60, 11, "xscmpgtdp", vsrc, vsfrc, vsfrc,
2494 IIC_FPCompare, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002495
2496 //===--------------------------------------------------------------------===//
2497 // Quad-Precision Floating-Point Conversion Instructions:
2498
2499 // Convert DP -> QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002500 def XSCVDPQP : X_VT5_XO5_VB5_TyVB<63, 22, 836, "xscvdpqp", vfrc, []>;
Lei Huangbe0afb02018-03-26 17:46:25 +00002501 def : Pat<(f128 (fpextend f64:$src)), (f128 (XSCVDPQP $src))>;
Kit Barton93612ec2016-02-26 21:11:55 +00002502
2503 // Round & Convert QP -> DP (dword[1] is set to zero)
2504 def XSCVQPDP : X_VT5_XO5_VB5 <63, 20, 836, "xscvqpdp" , []>;
2505 def XSCVQPDPO : X_VT5_XO5_VB5_Ro<63, 20, 836, "xscvqpdpo", []>;
2506
2507 // Truncate & Convert QP -> (Un)Signed (D)Word (dword[1] is set to zero)
2508 def XSCVQPSDZ : X_VT5_XO5_VB5<63, 25, 836, "xscvqpsdz", []>;
2509 def XSCVQPSWZ : X_VT5_XO5_VB5<63, 9, 836, "xscvqpswz", []>;
2510 def XSCVQPUDZ : X_VT5_XO5_VB5<63, 17, 836, "xscvqpudz", []>;
2511 def XSCVQPUWZ : X_VT5_XO5_VB5<63, 1, 836, "xscvqpuwz", []>;
2512
2513 // Convert (Un)Signed DWord -> QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002514 def XSCVSDQP : X_VT5_XO5_VB5_TyVB<63, 10, 836, "xscvsdqp", vfrc, []>;
2515 def XSCVUDQP : X_VT5_XO5_VB5_TyVB<63, 2, 836, "xscvudqp", vfrc, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002516
Sean Fertilea435e072016-11-14 18:43:59 +00002517 let UseVSXReg = 1 in {
Kit Barton93612ec2016-02-26 21:11:55 +00002518 //===--------------------------------------------------------------------===//
2519 // Round to Floating-Point Integer Instructions
2520
2521 // (Round &) Convert DP <-> HP
2522 // Note! xscvdphp's src and dest register both use the left 64 bits, so we use
2523 // vsfrc for src and dest register. xscvhpdp's src only use the left 16 bits,
2524 // but we still use vsfrc for it.
2525 def XSCVDPHP : XX2_XT6_XO5_XB6<60, 17, 347, "xscvdphp", vsfrc, []>;
2526 def XSCVHPDP : XX2_XT6_XO5_XB6<60, 16, 347, "xscvhpdp", vsfrc, []>;
2527
2528 // Vector HP -> SP
2529 def XVCVHPSP : XX2_XT6_XO5_XB6<60, 24, 475, "xvcvhpsp", vsrc, []>;
Nemanja Ivanovicec4b0c32016-11-11 21:42:01 +00002530 def XVCVSPHP : XX2_XT6_XO5_XB6<60, 25, 475, "xvcvsphp", vsrc,
2531 [(set v4f32:$XT,
2532 (int_ppc_vsx_xvcvsphp v4f32:$XB))]>;
Kit Barton93612ec2016-02-26 21:11:55 +00002533
Sean Fertilea435e072016-11-14 18:43:59 +00002534 } // UseVSXReg = 1
2535
2536 // Pattern for matching Vector HP -> Vector SP intrinsic. Defined as a
Simon Pilgrim68168d12017-03-30 12:59:53 +00002537 // separate pattern so that it can convert the input register class from
Sean Fertilea435e072016-11-14 18:43:59 +00002538 // VRRC(v8i16) to VSRC.
2539 def : Pat<(v4f32 (int_ppc_vsx_xvcvhpsp v8i16:$A)),
2540 (v4f32 (XVCVHPSP (COPY_TO_REGCLASS $A, VSRC)))>;
2541
Kit Barton93612ec2016-02-26 21:11:55 +00002542 class Z23_VT5_R1_VB5_RMC2_EX1<bits<6> opcode, bits<8> xo, bit ex, string opc,
2543 list<dag> pattern>
2544 : Z23Form_1<opcode, xo,
2545 (outs vrrc:$vT), (ins u1imm:$r, vrrc:$vB, u2imm:$rmc),
2546 !strconcat(opc, " $r, $vT, $vB, $rmc"), IIC_VecFP, pattern> {
2547 let RC = ex;
2548 }
2549
2550 // Round to Quad-Precision Integer [with Inexact]
2551 def XSRQPI : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 0, "xsrqpi" , []>;
2552 def XSRQPIX : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 1, "xsrqpix", []>;
2553
2554 // Round Quad-Precision to Double-Extended Precision (fp80)
2555 def XSRQPXP : Z23_VT5_R1_VB5_RMC2_EX1<63, 37, 0, "xsrqpxp", []>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002556
2557 //===--------------------------------------------------------------------===//
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002558 // Insert/Extract Instructions
2559
2560 // Insert Exponent DP/QP
2561 // XT NOTE: XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU
2562 def XSIEXPDP : XX1Form <60, 918, (outs vsrc:$XT), (ins g8rc:$rA, g8rc:$rB),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002563 "xsiexpdp $XT, $rA, $rB", IIC_VecFP, []>, UseVSXReg;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002564 // vB NOTE: only vB.dword[0] is used, that's why we don't use
2565 // X_VT5_VA5_VB5 form
2566 def XSIEXPQP : XForm_18<63, 868, (outs vrrc:$vT), (ins vrrc:$vA, vsfrc:$vB),
2567 "xsiexpqp $vT, $vA, $vB", IIC_VecFP, []>;
2568
2569 // Extract Exponent/Significand DP/QP
2570 def XSXEXPDP : XX2_RT5_XO5_XB6<60, 0, 347, "xsxexpdp", []>;
2571 def XSXSIGDP : XX2_RT5_XO5_XB6<60, 1, 347, "xsxsigdp", []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002572
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002573 def XSXEXPQP : X_VT5_XO5_VB5 <63, 2, 804, "xsxexpqp", []>;
2574 def XSXSIGQP : X_VT5_XO5_VB5 <63, 18, 804, "xsxsigqp", []>;
2575
2576 // Vector Insert Word
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002577 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002578 // XB NOTE: Only XB.dword[1] is used, but we use vsrc on XB.
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002579 def XXINSERTW :
2580 XX2_RD6_UIM5_RS6<60, 181, (outs vsrc:$XT),
2581 (ins vsrc:$XTi, vsrc:$XB, u4imm:$UIM),
2582 "xxinsertw $XT, $XB, $UIM", IIC_VecFP,
Tony Jiang61ef1c52017-09-05 18:08:02 +00002583 [(set v4i32:$XT, (PPCvecinsert v4i32:$XTi, v4i32:$XB,
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002584 imm32SExt16:$UIM))]>,
2585 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002586
2587 // Vector Extract Unsigned Word
2588 def XXEXTRACTUW : XX2_RD6_UIM5_RS6<60, 165,
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002589 (outs vsfrc:$XT), (ins vsrc:$XB, u4imm:$UIMM),
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002590 "xxextractuw $XT, $XB, $UIMM", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002591 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002592
2593 // Vector Insert Exponent DP/SP
2594 def XVIEXPDP : XX3_XT5_XA5_XB5<60, 248, "xviexpdp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002595 IIC_VecFP, [(set v2f64: $XT,(int_ppc_vsx_xviexpdp v2i64:$XA, v2i64:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002596 def XVIEXPSP : XX3_XT5_XA5_XB5<60, 216, "xviexpsp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002597 IIC_VecFP, [(set v4f32: $XT,(int_ppc_vsx_xviexpsp v4i32:$XA, v4i32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002598
2599 // Vector Extract Exponent/Significand DP/SP
Sean Fertileadda5b22016-11-14 14:42:37 +00002600 def XVXEXPDP : XX2_XT6_XO5_XB6<60, 0, 475, "xvxexpdp", vsrc,
2601 [(set v2i64: $XT,
2602 (int_ppc_vsx_xvxexpdp v2f64:$XB))]>;
2603 def XVXEXPSP : XX2_XT6_XO5_XB6<60, 8, 475, "xvxexpsp", vsrc,
2604 [(set v4i32: $XT,
2605 (int_ppc_vsx_xvxexpsp v4f32:$XB))]>;
2606 def XVXSIGDP : XX2_XT6_XO5_XB6<60, 1, 475, "xvxsigdp", vsrc,
2607 [(set v2i64: $XT,
2608 (int_ppc_vsx_xvxsigdp v2f64:$XB))]>;
2609 def XVXSIGSP : XX2_XT6_XO5_XB6<60, 9, 475, "xvxsigsp", vsrc,
2610 [(set v4i32: $XT,
2611 (int_ppc_vsx_xvxsigsp v4f32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002612
Sean Fertile1c4109b2016-12-09 17:21:42 +00002613 let AddedComplexity = 400, Predicates = [HasP9Vector] in {
2614 // Extra patterns expanding to vector Extract Word/Insert Word
2615 def : Pat<(v4i32 (int_ppc_vsx_xxinsertw v4i32:$A, v2i64:$B, imm:$IMM)),
2616 (v4i32 (XXINSERTW $A, $B, imm:$IMM))>;
2617 def : Pat<(v2i64 (int_ppc_vsx_xxextractuw v2i64:$A, imm:$IMM)),
2618 (v2i64 (COPY_TO_REGCLASS (XXEXTRACTUW $A, imm:$IMM), VSRC))>;
2619 } // AddedComplexity = 400, HasP9Vector
2620
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002621 //===--------------------------------------------------------------------===//
2622
2623 // Test Data Class SP/DP/QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002624 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002625 def XSTSTDCSP : XX2_BF3_DCMX7_RS6<60, 298,
2626 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2627 "xststdcsp $BF, $XB, $DCMX", IIC_VecFP, []>;
2628 def XSTSTDCDP : XX2_BF3_DCMX7_RS6<60, 362,
2629 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2630 "xststdcdp $BF, $XB, $DCMX", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002631 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002632 def XSTSTDCQP : X_BF3_DCMX7_RS5 <63, 708,
2633 (outs crrc:$BF), (ins u7imm:$DCMX, vrrc:$vB),
2634 "xststdcqp $BF, $vB, $DCMX", IIC_VecFP, []>;
2635
2636 // Vector Test Data Class SP/DP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002637 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002638 def XVTSTDCSP : XX2_RD6_DCMX7_RS6<60, 13, 5,
2639 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002640 "xvtstdcsp $XT, $XB, $DCMX", IIC_VecFP,
2641 [(set v4i32: $XT,
2642 (int_ppc_vsx_xvtstdcsp v4f32:$XB, imm:$DCMX))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002643 def XVTSTDCDP : XX2_RD6_DCMX7_RS6<60, 15, 5,
2644 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002645 "xvtstdcdp $XT, $XB, $DCMX", IIC_VecFP,
2646 [(set v2i64: $XT,
2647 (int_ppc_vsx_xvtstdcdp v2f64:$XB, imm:$DCMX))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002648 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002649
2650 //===--------------------------------------------------------------------===//
2651
2652 // Maximum/Minimum Type-C/Type-J DP
2653 // XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU, so we use vsrc for XT
2654 def XSMAXCDP : XX3_XT5_XA5_XB5<60, 128, "xsmaxcdp", vsrc, vsfrc, vsfrc,
2655 IIC_VecFP, []>;
2656 def XSMAXJDP : XX3_XT5_XA5_XB5<60, 144, "xsmaxjdp", vsrc, vsfrc, vsfrc,
2657 IIC_VecFP, []>;
2658 def XSMINCDP : XX3_XT5_XA5_XB5<60, 136, "xsmincdp", vsrc, vsfrc, vsfrc,
2659 IIC_VecFP, []>;
2660 def XSMINJDP : XX3_XT5_XA5_XB5<60, 152, "xsminjdp", vsrc, vsfrc, vsfrc,
2661 IIC_VecFP, []>;
2662
2663 //===--------------------------------------------------------------------===//
2664
2665 // Vector Byte-Reverse H/W/D/Q Word
2666 def XXBRH : XX2_XT6_XO5_XB6<60, 7, 475, "xxbrh", vsrc, []>;
2667 def XXBRW : XX2_XT6_XO5_XB6<60, 15, 475, "xxbrw", vsrc, []>;
2668 def XXBRD : XX2_XT6_XO5_XB6<60, 23, 475, "xxbrd", vsrc, []>;
2669 def XXBRQ : XX2_XT6_XO5_XB6<60, 31, 475, "xxbrq", vsrc, []>;
2670
Tony Jiang1a8eec12017-06-12 18:24:36 +00002671 // Vector Reverse
2672 def : Pat<(v8i16 (PPCxxreverse v8i16 :$A)),
2673 (v8i16 (COPY_TO_REGCLASS (XXBRH (COPY_TO_REGCLASS $A, VSRC)), VRRC))>;
2674 def : Pat<(v4i32 (PPCxxreverse v4i32 :$A)),
2675 (v4i32 (XXBRW $A))>;
2676 def : Pat<(v2i64 (PPCxxreverse v2i64 :$A)),
2677 (v2i64 (XXBRD $A))>;
2678 def : Pat<(v1i128 (PPCxxreverse v1i128 :$A)),
2679 (v1i128 (COPY_TO_REGCLASS (XXBRQ (COPY_TO_REGCLASS $A, VSRC)), VRRC))>;
2680
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002681 // Vector Permute
2682 def XXPERM : XX3_XT5_XA5_XB5<60, 26, "xxperm" , vsrc, vsrc, vsrc,
2683 IIC_VecPerm, []>;
2684 def XXPERMR : XX3_XT5_XA5_XB5<60, 58, "xxpermr", vsrc, vsrc, vsrc,
2685 IIC_VecPerm, []>;
2686
2687 // Vector Splat Immediate Byte
2688 def XXSPLTIB : X_RD6_IMM8<60, 360, (outs vsrc:$XT), (ins u8imm:$IMM8),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002689 "xxspltib $XT, $IMM8", IIC_VecPerm, []>, UseVSXReg;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002690
2691 //===--------------------------------------------------------------------===//
Kit Bartonba532dc2016-03-08 03:49:13 +00002692 // Vector/Scalar Load/Store Instructions
2693
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002694 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2695 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Sean Fertile3c8c3852017-01-26 18:59:15 +00002696 let mayLoad = 1, mayStore = 0 in {
Kit Bartonba532dc2016-03-08 03:49:13 +00002697 // Load Vector
2698 def LXV : DQ_RD6_RS5_DQ12<61, 1, (outs vsrc:$XT), (ins memrix16:$src),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002699 "lxv $XT, $src", IIC_LdStLFD, []>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002700 // Load DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002701 def LXSD : DSForm_1<57, 2, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002702 "lxsd $vD, $src", IIC_LdStLFD, []>;
2703 // Load SP from src, convert it to DP, and place in dword[0]
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002704 def LXSSP : DSForm_1<57, 3, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002705 "lxssp $vD, $src", IIC_LdStLFD, []>;
2706
2707 // [PO T RA RB XO TX] almost equal to [PO S RA RB XO SX], but has different
2708 // "out" and "in" dag
2709 class X_XT6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2710 RegisterOperand vtype, list<dag> pattern>
Stefan Pintilie26d4f922018-03-26 17:39:18 +00002711 : XX1Form_memOp<opcode, xo, (outs vtype:$XT), (ins memrr:$src),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002712 !strconcat(opc, " $XT, $src"), IIC_LdStLFD, pattern>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002713
2714 // Load as Integer Byte/Halfword & Zero Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002715 def LXSIBZX : X_XT6_RA5_RB5<31, 781, "lxsibzx", vsfrc,
2716 [(set f64:$XT, (PPClxsizx xoaddr:$src, 1))]>;
2717 def LXSIHZX : X_XT6_RA5_RB5<31, 813, "lxsihzx", vsfrc,
2718 [(set f64:$XT, (PPClxsizx xoaddr:$src, 2))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002719
2720 // Load Vector Halfword*8/Byte*16 Indexed
2721 def LXVH8X : X_XT6_RA5_RB5<31, 812, "lxvh8x" , vsrc, []>;
2722 def LXVB16X : X_XT6_RA5_RB5<31, 876, "lxvb16x", vsrc, []>;
2723
2724 // Load Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002725 def LXVX : X_XT6_RA5_RB5<31, 268, "lxvx" , vsrc,
Zaara Syeda93297832017-05-24 17:50:37 +00002726 [(set v2f64:$XT, (load xaddr:$src))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002727 // Load Vector (Left-justified) with Length
Stefan Pintilie26d4f922018-03-26 17:39:18 +00002728 def LXVL : XX1Form_memOp<31, 269, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002729 "lxvl $XT, $src, $rB", IIC_LdStLoad,
2730 [(set v4i32:$XT, (int_ppc_vsx_lxvl addr:$src, i64:$rB))]>,
2731 UseVSXReg;
Stefan Pintilie26d4f922018-03-26 17:39:18 +00002732 def LXVLL : XX1Form_memOp<31,301, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002733 "lxvll $XT, $src, $rB", IIC_LdStLoad,
2734 [(set v4i32:$XT, (int_ppc_vsx_lxvll addr:$src, i64:$rB))]>,
2735 UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002736
2737 // Load Vector Word & Splat Indexed
2738 def LXVWSX : X_XT6_RA5_RB5<31, 364, "lxvwsx" , vsrc, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002739 } // mayLoad
Kit Bartonba532dc2016-03-08 03:49:13 +00002740
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002741 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2742 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Sean Fertile3c8c3852017-01-26 18:59:15 +00002743 let mayStore = 1, mayLoad = 0 in {
Kit Bartonba532dc2016-03-08 03:49:13 +00002744 // Store Vector
2745 def STXV : DQ_RD6_RS5_DQ12<61, 5, (outs), (ins vsrc:$XT, memrix16:$dst),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002746 "stxv $XT, $dst", IIC_LdStSTFD, []>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002747 // Store DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002748 def STXSD : DSForm_1<61, 2, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002749 "stxsd $vS, $dst", IIC_LdStSTFD, []>;
2750 // Convert DP of dword[0] to SP, and Store to dst
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002751 def STXSSP : DSForm_1<61, 3, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002752 "stxssp $vS, $dst", IIC_LdStSTFD, []>;
2753
2754 // [PO S RA RB XO SX]
2755 class X_XS6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2756 RegisterOperand vtype, list<dag> pattern>
Stefan Pintilie26d4f922018-03-26 17:39:18 +00002757 : XX1Form_memOp<opcode, xo, (outs), (ins vtype:$XT, memrr:$dst),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002758 !strconcat(opc, " $XT, $dst"), IIC_LdStSTFD, pattern>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002759
2760 // Store as Integer Byte/Halfword Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002761 def STXSIBX : X_XS6_RA5_RB5<31, 909, "stxsibx" , vsfrc,
2762 [(PPCstxsix f64:$XT, xoaddr:$dst, 1)]>;
2763 def STXSIHX : X_XS6_RA5_RB5<31, 941, "stxsihx" , vsfrc,
2764 [(PPCstxsix f64:$XT, xoaddr:$dst, 2)]>;
2765 let isCodeGenOnly = 1 in {
2766 def STXSIBXv : X_XS6_RA5_RB5<31, 909, "stxsibx" , vrrc, []>;
2767 def STXSIHXv : X_XS6_RA5_RB5<31, 941, "stxsihx" , vrrc, []>;
2768 }
Kit Bartonba532dc2016-03-08 03:49:13 +00002769
2770 // Store Vector Halfword*8/Byte*16 Indexed
2771 def STXVH8X : X_XS6_RA5_RB5<31, 940, "stxvh8x" , vsrc, []>;
2772 def STXVB16X : X_XS6_RA5_RB5<31, 1004, "stxvb16x", vsrc, []>;
2773
2774 // Store Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002775 def STXVX : X_XS6_RA5_RB5<31, 396, "stxvx" , vsrc,
Zaara Syeda93297832017-05-24 17:50:37 +00002776 [(store v2f64:$XT, xaddr:$dst)]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002777
2778 // Store Vector (Left-justified) with Length
Stefan Pintilie26d4f922018-03-26 17:39:18 +00002779 def STXVL : XX1Form_memOp<31, 397, (outs),
2780 (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2781 "stxvl $XT, $dst, $rB", IIC_LdStLoad,
2782 [(int_ppc_vsx_stxvl v4i32:$XT, addr:$dst,
2783 i64:$rB)]>,
2784 UseVSXReg;
2785 def STXVLL : XX1Form_memOp<31, 429, (outs),
2786 (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2787 "stxvll $XT, $dst, $rB", IIC_LdStLoad,
2788 [(int_ppc_vsx_stxvll v4i32:$XT, addr:$dst,
2789 i64:$rB)]>,
2790 UseVSXReg;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002791 } // mayStore
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002792
Lei Huang451ef4a2017-08-14 18:09:29 +00002793 let Predicates = [IsLittleEndian] in {
Lei Huangcd4f3852018-03-12 19:26:18 +00002794 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002795 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 3))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002796 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002797 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 2))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002798 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002799 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 1))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002800 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002801 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 0))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002802 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002803 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 3)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002804 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002805 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 2)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002806 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002807 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 1)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002808 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002809 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 0)), VSFRC))>;
2810 }
2811
2812 let Predicates = [IsBigEndian] in {
Lei Huangcd4f3852018-03-12 19:26:18 +00002813 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002814 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 0))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002815 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002816 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 1))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002817 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002818 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 2))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002819 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002820 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 3))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002821 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002822 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 0)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002823 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002824 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 1)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002825 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002826 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 2)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002827 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002828 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 3)), VSFRC))>;
2829 }
2830
Graham Yiu5cd044e2017-11-07 20:55:43 +00002831 // Alternate patterns for PPCmtvsrz where the output is v8i16 or v16i8 instead
2832 // of f64
2833 def : Pat<(v8i16 (PPCmtvsrz i32:$A)),
2834 (v8i16 (SUBREG_TO_REG (i64 1), (MTVSRWZ $A), sub_64))>;
2835 def : Pat<(v16i8 (PPCmtvsrz i32:$A)),
2836 (v16i8 (SUBREG_TO_REG (i64 1), (MTVSRWZ $A), sub_64))>;
2837
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002838 // Patterns for which instructions from ISA 3.0 are a better match
2839 let Predicates = [IsLittleEndian, HasP9Vector] in {
Lei Huangcd4f3852018-03-12 19:26:18 +00002840 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 0)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002841 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002842 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 1)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002843 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002844 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 2)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002845 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002846 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 3)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002847 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002848 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002849 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 12)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002850 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002851 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 8)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002852 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002853 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 4)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002854 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002855 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 0)))>;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002856 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
2857 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
2858 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
2859 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
2860 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
2861 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
2862 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
2863 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
2864 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
2865 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
2866 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
2867 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
2868 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
2869 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
2870 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
2871 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
2872 } // IsLittleEndian, HasP9Vector
2873
2874 let Predicates = [IsBigEndian, HasP9Vector] in {
Lei Huangcd4f3852018-03-12 19:26:18 +00002875 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 0)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002876 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002877 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 1)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002878 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002879 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 2)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002880 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002881 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 3)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002882 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002883 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002884 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 0)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002885 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002886 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 4)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002887 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002888 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 8)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002889 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002890 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 12)))>;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002891 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
2892 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
2893 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
2894 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
2895 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
2896 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
2897 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
2898 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
2899 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
2900 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
2901 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
2902 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
2903 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
2904 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
2905 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
2906 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
2907 } // IsLittleEndian, HasP9Vector
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002908
Zaara Syeda93297832017-05-24 17:50:37 +00002909 // D-Form Load/Store
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002910 def : Pat<(v4i32 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
2911 def : Pat<(v4f32 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
2912 def : Pat<(v2i64 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
2913 def : Pat<(v2f64 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
Lei Huang6d1596a2018-03-19 18:52:20 +00002914 def : Pat<(f128 (quadwOffsetLoad iqaddr:$src)),
2915 (COPY_TO_REGCLASS (LXV memrix16:$src), VRRC)>;
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002916 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x iqaddr:$src)), (LXV memrix16:$src)>;
2917 def : Pat<(v2f64 (int_ppc_vsx_lxvd2x iqaddr:$src)), (LXV memrix16:$src)>;
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002918
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002919 def : Pat<(quadwOffsetStore v4f32:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
2920 def : Pat<(quadwOffsetStore v4i32:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
2921 def : Pat<(quadwOffsetStore v2f64:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
Lei Huang6d1596a2018-03-19 18:52:20 +00002922 def : Pat<(quadwOffsetStore f128:$rS, iqaddr:$dst),
2923 (STXV (COPY_TO_REGCLASS $rS, VSRC), memrix16:$dst)>;
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002924 def : Pat<(quadwOffsetStore v2i64:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
2925 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, iqaddr:$dst),
Zaara Syeda93297832017-05-24 17:50:37 +00002926 (STXV $rS, memrix16:$dst)>;
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002927 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, iqaddr:$dst),
Zaara Syeda93297832017-05-24 17:50:37 +00002928 (STXV $rS, memrix16:$dst)>;
2929
2930
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002931 def : Pat<(v2f64 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
2932 def : Pat<(v2i64 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
2933 def : Pat<(v4f32 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
2934 def : Pat<(v4i32 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
2935 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x xoaddr:$src)), (LXVX xoaddr:$src)>;
2936 def : Pat<(v2f64 (int_ppc_vsx_lxvd2x xoaddr:$src)), (LXVX xoaddr:$src)>;
Lei Huang6d1596a2018-03-19 18:52:20 +00002937 def : Pat<(f128 (nonQuadwOffsetLoad xoaddr:$src)),
2938 (COPY_TO_REGCLASS (LXVX xoaddr:$src), VRRC)>;
2939 def : Pat<(nonQuadwOffsetStore f128:$rS, xoaddr:$dst),
2940 (STXVX (COPY_TO_REGCLASS $rS, VSRC), xoaddr:$dst)>;
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002941 def : Pat<(nonQuadwOffsetStore v2f64:$rS, xoaddr:$dst),
2942 (STXVX $rS, xoaddr:$dst)>;
2943 def : Pat<(nonQuadwOffsetStore v2i64:$rS, xoaddr:$dst),
2944 (STXVX $rS, xoaddr:$dst)>;
2945 def : Pat<(nonQuadwOffsetStore v4f32:$rS, xoaddr:$dst),
2946 (STXVX $rS, xoaddr:$dst)>;
2947 def : Pat<(nonQuadwOffsetStore v4i32:$rS, xoaddr:$dst),
2948 (STXVX $rS, xoaddr:$dst)>;
2949 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
2950 (STXVX $rS, xoaddr:$dst)>;
2951 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
2952 (STXVX $rS, xoaddr:$dst)>;
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002953 def : Pat<(v4i32 (scalar_to_vector (i32 (load xoaddr:$src)))),
2954 (v4i32 (LXVWSX xoaddr:$src))>;
2955 def : Pat<(v4f32 (scalar_to_vector (f32 (load xoaddr:$src)))),
2956 (v4f32 (LXVWSX xoaddr:$src))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002957 def : Pat<(v4f32 (scalar_to_vector
2958 (f32 (fpround (f64 (extloadf32 xoaddr:$src)))))),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002959 (v4f32 (LXVWSX xoaddr:$src))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002960
2961 // Build vectors from i8 loads
2962 def : Pat<(v16i8 (scalar_to_vector ScalarLoads.Li8)),
2963 (v16i8 (VSPLTBs 7, (LXSIBZX xoaddr:$src)))>;
2964 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.ZELi8)),
2965 (v8i16 (VSPLTHs 3, (LXSIBZX xoaddr:$src)))>;
2966 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi8)),
2967 (v4i32 (XXSPLTWs (LXSIBZX xoaddr:$src), 1))>;
2968 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi8i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002969 (v2i64 (XXPERMDIs (LXSIBZX xoaddr:$src), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002970 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi8)),
2971 (v4i32 (XXSPLTWs (VEXTSB2Ws (LXSIBZX xoaddr:$src)), 1))>;
2972 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi8i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002973 (v2i64 (XXPERMDIs (VEXTSB2Ds (LXSIBZX xoaddr:$src)), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002974
2975 // Build vectors from i16 loads
2976 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.Li16)),
2977 (v8i16 (VSPLTHs 3, (LXSIHZX xoaddr:$src)))>;
2978 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi16)),
2979 (v4i32 (XXSPLTWs (LXSIHZX xoaddr:$src), 1))>;
2980 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi16i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002981 (v2i64 (XXPERMDIs (LXSIHZX xoaddr:$src), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002982 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi16)),
2983 (v4i32 (XXSPLTWs (VEXTSH2Ws (LXSIHZX xoaddr:$src)), 1))>;
2984 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi16i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002985 (v2i64 (XXPERMDIs (VEXTSH2Ds (LXSIHZX xoaddr:$src)), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002986
2987 let Predicates = [IsBigEndian, HasP9Vector] in {
2988 // Scalar stores of i8
2989 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00002990 (STXSIBXv (v16i8 (VSLDOI $S, $S, 9)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002991 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00002992 (STXSIBXv (v16i8 (VSLDOI $S, $S, 10)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002993 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00002994 (STXSIBXv (v16i8 (VSLDOI $S, $S, 11)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002995 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00002996 (STXSIBXv (v16i8 (VSLDOI $S, $S, 12)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002997 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00002998 (STXSIBXv (v16i8 (VSLDOI $S, $S, 13)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002999 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003000 (STXSIBXv (v16i8 (VSLDOI $S, $S, 14)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003001 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003002 (STXSIBXv (v16i8 (VSLDOI $S, $S, 15)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003003 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
3004 (STXSIBXv $S, xoaddr:$dst)>;
3005 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003006 (STXSIBXv (v16i8 (VSLDOI $S, $S, 1)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003007 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003008 (STXSIBXv (v16i8 (VSLDOI $S, $S, 2)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003009 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003010 (STXSIBXv (v16i8 (VSLDOI $S, $S, 3)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003011 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003012 (STXSIBXv (v16i8 (VSLDOI $S, $S, 4)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003013 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003014 (STXSIBXv (v16i8 (VSLDOI $S, $S, 5)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003015 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003016 (STXSIBXv (v16i8 (VSLDOI $S, $S, 6)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003017 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003018 (STXSIBXv (v16i8 (VSLDOI $S, $S, 7)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003019 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003020 (STXSIBXv (v16i8 (VSLDOI $S, $S, 8)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003021
3022 // Scalar stores of i16
3023 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003024 (STXSIHXv (v16i8 (VSLDOI $S, $S, 10)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003025 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003026 (STXSIHXv (v16i8 (VSLDOI $S, $S, 12)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003027 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003028 (STXSIHXv (v16i8 (VSLDOI $S, $S, 14)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003029 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
3030 (STXSIHXv $S, xoaddr:$dst)>;
3031 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003032 (STXSIHXv (v16i8 (VSLDOI $S, $S, 2)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003033 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003034 (STXSIHXv (v16i8 (VSLDOI $S, $S, 4)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003035 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003036 (STXSIHXv (v16i8 (VSLDOI $S, $S, 6)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003037 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003038 (STXSIHXv (v16i8 (VSLDOI $S, $S, 8)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003039 } // IsBigEndian, HasP9Vector
3040
3041 let Predicates = [IsLittleEndian, HasP9Vector] in {
3042 // Scalar stores of i8
3043 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003044 (STXSIBXv (v16i8 (VSLDOI $S, $S, 8)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003045 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003046 (STXSIBXv (v16i8 (VSLDOI $S, $S, 7)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003047 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003048 (STXSIBXv (v16i8 (VSLDOI $S, $S, 6)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003049 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003050 (STXSIBXv (v16i8 (VSLDOI $S, $S, 5)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003051 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003052 (STXSIBXv (v16i8 (VSLDOI $S, $S, 4)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003053 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003054 (STXSIBXv (v16i8 (VSLDOI $S, $S, 3)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003055 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003056 (STXSIBXv (v16i8 (VSLDOI $S, $S, 2)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003057 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003058 (STXSIBXv (v16i8 (VSLDOI $S, $S, 1)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003059 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
3060 (STXSIBXv $S, xoaddr:$dst)>;
3061 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003062 (STXSIBXv (v16i8 (VSLDOI $S, $S, 15)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003063 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003064 (STXSIBXv (v16i8 (VSLDOI $S, $S, 14)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003065 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003066 (STXSIBXv (v16i8 (VSLDOI $S, $S, 13)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003067 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003068 (STXSIBXv (v16i8 (VSLDOI $S, $S, 12)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003069 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003070 (STXSIBXv (v16i8 (VSLDOI $S, $S, 11)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003071 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003072 (STXSIBXv (v16i8 (VSLDOI $S, $S, 10)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003073 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003074 (STXSIBXv (v16i8 (VSLDOI $S, $S, 9)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003075
3076 // Scalar stores of i16
3077 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003078 (STXSIHXv (v16i8 (VSLDOI $S, $S, 8)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003079 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003080 (STXSIHXv (v16i8 (VSLDOI $S, $S, 6)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003081 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003082 (STXSIHXv (v16i8 (VSLDOI $S, $S, 4)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003083 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003084 (STXSIHXv (v16i8 (VSLDOI $S, $S, 2)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003085 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
3086 (STXSIHXv $S, xoaddr:$dst)>;
3087 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003088 (STXSIHXv (v16i8 (VSLDOI $S, $S, 14)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003089 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003090 (STXSIHXv (v16i8 (VSLDOI $S, $S, 12)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003091 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
Lei Huangcd4f3852018-03-12 19:26:18 +00003092 (STXSIHXv (v16i8 (VSLDOI $S, $S, 10)), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003093 } // IsLittleEndian, HasP9Vector
3094
Sean Fertile1c4109b2016-12-09 17:21:42 +00003095
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003096 // Vector sign extensions
3097 def : Pat<(f64 (PPCVexts f64:$A, 1)),
3098 (f64 (COPY_TO_REGCLASS (VEXTSB2Ds $A), VSFRC))>;
3099 def : Pat<(f64 (PPCVexts f64:$A, 2)),
3100 (f64 (COPY_TO_REGCLASS (VEXTSH2Ds $A), VSFRC))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003101
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00003102 let isPseudo = 1 in {
3103 def DFLOADf32 : Pseudo<(outs vssrc:$XT), (ins memrix:$src),
3104 "#DFLOADf32",
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003105 [(set f32:$XT, (load ixaddr:$src))]>;
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00003106 def DFLOADf64 : Pseudo<(outs vsfrc:$XT), (ins memrix:$src),
3107 "#DFLOADf64",
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003108 [(set f64:$XT, (load ixaddr:$src))]>;
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00003109 def DFSTOREf32 : Pseudo<(outs), (ins vssrc:$XT, memrix:$dst),
3110 "#DFSTOREf32",
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003111 [(store f32:$XT, ixaddr:$dst)]>;
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00003112 def DFSTOREf64 : Pseudo<(outs), (ins vsfrc:$XT, memrix:$dst),
3113 "#DFSTOREf64",
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003114 [(store f64:$XT, ixaddr:$dst)]>;
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00003115 }
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003116 def : Pat<(f64 (extloadf32 ixaddr:$src)),
3117 (COPY_TO_REGCLASS (DFLOADf32 ixaddr:$src), VSFRC)>;
Lei Huangcd4f3852018-03-12 19:26:18 +00003118 def : Pat<(f32 (fpround (f64 (extloadf32 ixaddr:$src)))),
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003119 (f32 (DFLOADf32 ixaddr:$src))>;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00003120} // end HasP9Vector, AddedComplexity
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00003121
Zaara Syedafcd96972017-09-21 16:12:33 +00003122let Predicates = [HasP9Vector] in {
3123 let isPseudo = 1 in {
3124 let mayStore = 1 in {
Stefan Pintilie26d4f922018-03-26 17:39:18 +00003125 def SPILLTOVSR_STX : PseudoXFormMemOp<(outs),
3126 (ins spilltovsrrc:$XT, memrr:$dst),
3127 "#SPILLTOVSR_STX", []>;
Zaara Syedafcd96972017-09-21 16:12:33 +00003128 def SPILLTOVSR_ST : Pseudo<(outs), (ins spilltovsrrc:$XT, memrix:$dst),
3129 "#SPILLTOVSR_ST", []>;
3130 }
3131 let mayLoad = 1 in {
Stefan Pintilie26d4f922018-03-26 17:39:18 +00003132 def SPILLTOVSR_LDX : PseudoXFormMemOp<(outs spilltovsrrc:$XT),
3133 (ins memrr:$src),
3134 "#SPILLTOVSR_LDX", []>;
Zaara Syedafcd96972017-09-21 16:12:33 +00003135 def SPILLTOVSR_LD : Pseudo<(outs spilltovsrrc:$XT), (ins memrix:$src),
3136 "#SPILLTOVSR_LD", []>;
3137
3138 }
3139 }
3140}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003141// Integer extend helper dags 32 -> 64
3142def AnyExts {
3143 dag A = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32);
3144 dag B = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $B, sub_32);
3145 dag C = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $C, sub_32);
3146 dag D = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $D, sub_32);
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00003147}
3148
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003149def DblToFlt {
3150 dag A0 = (f32 (fpround (f64 (extractelt v2f64:$A, 0))));
3151 dag A1 = (f32 (fpround (f64 (extractelt v2f64:$A, 1))));
3152 dag B0 = (f32 (fpround (f64 (extractelt v2f64:$B, 0))));
3153 dag B1 = (f32 (fpround (f64 (extractelt v2f64:$B, 1))));
3154}
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003155
3156def ByteToWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00003157 dag LE_A0 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 0)), i8));
3158 dag LE_A1 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 4)), i8));
3159 dag LE_A2 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 8)), i8));
3160 dag LE_A3 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 12)), i8));
3161 dag BE_A0 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 3)), i8));
3162 dag BE_A1 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 7)), i8));
3163 dag BE_A2 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 11)), i8));
3164 dag BE_A3 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 15)), i8));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003165}
3166
3167def ByteToDWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00003168 dag LE_A0 = (i64 (sext_inreg
3169 (i64 (anyext (i32 (vector_extract v16i8:$A, 0)))), i8));
3170 dag LE_A1 = (i64 (sext_inreg
3171 (i64 (anyext (i32 (vector_extract v16i8:$A, 8)))), i8));
3172 dag BE_A0 = (i64 (sext_inreg
3173 (i64 (anyext (i32 (vector_extract v16i8:$A, 7)))), i8));
3174 dag BE_A1 = (i64 (sext_inreg
3175 (i64 (anyext (i32 (vector_extract v16i8:$A, 15)))), i8));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003176}
3177
3178def HWordToWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00003179 dag LE_A0 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 0)), i16));
3180 dag LE_A1 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 2)), i16));
3181 dag LE_A2 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 4)), i16));
3182 dag LE_A3 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 6)), i16));
3183 dag BE_A0 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 1)), i16));
3184 dag BE_A1 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 3)), i16));
3185 dag BE_A2 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 5)), i16));
3186 dag BE_A3 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 7)), i16));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003187}
3188
3189def HWordToDWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00003190 dag LE_A0 = (i64 (sext_inreg
3191 (i64 (anyext (i32 (vector_extract v8i16:$A, 0)))), i16));
3192 dag LE_A1 = (i64 (sext_inreg
3193 (i64 (anyext (i32 (vector_extract v8i16:$A, 4)))), i16));
3194 dag BE_A0 = (i64 (sext_inreg
3195 (i64 (anyext (i32 (vector_extract v8i16:$A, 3)))), i16));
3196 dag BE_A1 = (i64 (sext_inreg
3197 (i64 (anyext (i32 (vector_extract v8i16:$A, 7)))), i16));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003198}
3199
3200def WordToDWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00003201 dag LE_A0 = (i64 (sext (i32 (vector_extract v4i32:$A, 0))));
3202 dag LE_A1 = (i64 (sext (i32 (vector_extract v4i32:$A, 2))));
3203 dag BE_A0 = (i64 (sext (i32 (vector_extract v4i32:$A, 1))));
3204 dag BE_A1 = (i64 (sext (i32 (vector_extract v4i32:$A, 3))));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003205}
3206
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003207def FltToIntLoad {
3208 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (extloadf32 xoaddr:$A)))));
3209}
3210def FltToUIntLoad {
3211 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (extloadf32 xoaddr:$A)))));
3212}
3213def FltToLongLoad {
3214 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (extloadf32 xoaddr:$A)))));
3215}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003216def FltToLongLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003217 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (extloadf32 ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003218}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003219def FltToULongLoad {
3220 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (extloadf32 xoaddr:$A)))));
3221}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003222def FltToULongLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003223 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (extloadf32 ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003224}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003225def FltToLong {
Lei Huangcd4f3852018-03-12 19:26:18 +00003226 dag A = (i64 (PPCmfvsr (f64 (PPCfctidz (fpextend f32:$A)))));
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003227}
3228def FltToULong {
Lei Huangcd4f3852018-03-12 19:26:18 +00003229 dag A = (i64 (PPCmfvsr (f64 (PPCfctiduz (fpextend f32:$A)))));
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003230}
3231def DblToInt {
3232 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwz f64:$A))));
3233}
3234def DblToUInt {
3235 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwuz f64:$A))));
3236}
3237def DblToLong {
3238 dag A = (i64 (PPCmfvsr (f64 (PPCfctidz f64:$A))));
3239}
3240def DblToULong {
3241 dag A = (i64 (PPCmfvsr (f64 (PPCfctiduz f64:$A))));
3242}
3243def DblToIntLoad {
3244 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (load xoaddr:$A)))));
3245}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003246def DblToIntLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003247 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (load ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003248}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003249def DblToUIntLoad {
3250 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (load xoaddr:$A)))));
3251}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003252def DblToUIntLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003253 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (load ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003254}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003255def DblToLongLoad {
3256 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (load xoaddr:$A)))));
3257}
3258def DblToULongLoad {
3259 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (load xoaddr:$A)))));
3260}
3261
3262// FP merge dags (for f32 -> v4f32)
3263def MrgFP {
3264 dag AC = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $A, VSRC),
3265 (COPY_TO_REGCLASS $C, VSRC), 0));
3266 dag BD = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $B, VSRC),
3267 (COPY_TO_REGCLASS $D, VSRC), 0));
3268 dag ABhToFlt = (XVCVDPSP (XXPERMDI $A, $B, 0));
3269 dag ABlToFlt = (XVCVDPSP (XXPERMDI $A, $B, 3));
3270 dag BAhToFlt = (XVCVDPSP (XXPERMDI $B, $A, 0));
3271 dag BAlToFlt = (XVCVDPSP (XXPERMDI $B, $A, 3));
3272}
3273
3274// Patterns for BUILD_VECTOR nodes.
3275def NoP9Vector : Predicate<"!PPCSubTarget->hasP9Vector()">;
3276let AddedComplexity = 400 in {
3277
3278 let Predicates = [HasVSX] in {
3279 // Build vectors of floating point converted to i32.
3280 def : Pat<(v4i32 (build_vector DblToInt.A, DblToInt.A,
3281 DblToInt.A, DblToInt.A)),
3282 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPSXWS $A), VSRC), 1))>;
3283 def : Pat<(v4i32 (build_vector DblToUInt.A, DblToUInt.A,
3284 DblToUInt.A, DblToUInt.A)),
3285 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPUXWS $A), VSRC), 1))>;
3286 def : Pat<(v2i64 (build_vector DblToLong.A, DblToLong.A)),
3287 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC),
3288 (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC), 0))>;
3289 def : Pat<(v2i64 (build_vector DblToULong.A, DblToULong.A)),
3290 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC),
3291 (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC), 0))>;
3292 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
3293 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003294 (XSCVDPSXWSs (XFLOADf32 xoaddr:$A)), VSRC), 1))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003295 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
3296 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003297 (XSCVDPUXWSs (XFLOADf32 xoaddr:$A)), VSRC), 1))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003298 def : Pat<(v4f32 (build_vector f32:$A, f32:$A, f32:$A, f32:$A)),
3299 (v4f32 (XXSPLTW (v4f32 (XSCVDPSPN $A)), 0))>;
3300
3301 // Build vectors of floating point converted to i64.
3302 def : Pat<(v2i64 (build_vector FltToLong.A, FltToLong.A)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00003303 (v2i64 (XXPERMDIs
3304 (COPY_TO_REGCLASS (XSCVDPSXDSs $A), VSFRC), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003305 def : Pat<(v2i64 (build_vector FltToULong.A, FltToULong.A)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00003306 (v2i64 (XXPERMDIs
3307 (COPY_TO_REGCLASS (XSCVDPUXDSs $A), VSFRC), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003308 def : Pat<(v2i64 (scalar_to_vector DblToLongLoad.A)),
3309 (v2i64 (XVCVDPSXDS (LXVDSX xoaddr:$A)))>;
3310 def : Pat<(v2i64 (scalar_to_vector DblToULongLoad.A)),
3311 (v2i64 (XVCVDPUXDS (LXVDSX xoaddr:$A)))>;
3312 }
3313
3314 let Predicates = [HasVSX, NoP9Vector] in {
Tony Jiang438bf4a2017-11-20 14:38:30 +00003315 // Load-and-splat with fp-to-int conversion (using X-Form VSX/FP loads).
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003316 def : Pat<(v4i32 (scalar_to_vector DblToIntLoad.A)),
3317 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003318 (XSCVDPSXWS (XFLOADf64 xoaddr:$A)), VSRC), 1))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003319 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoad.A)),
3320 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003321 (XSCVDPUXWS (XFLOADf64 xoaddr:$A)), VSRC), 1))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003322 def : Pat<(v2i64 (scalar_to_vector FltToLongLoad.A)),
3323 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003324 (XFLOADf32 xoaddr:$A), VSFRC)), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003325 def : Pat<(v2i64 (scalar_to_vector FltToULongLoad.A)),
3326 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003327 (XFLOADf32 xoaddr:$A), VSFRC)), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003328 }
3329
3330 // Big endian, available on all targets with VSX
3331 let Predicates = [IsBigEndian, HasVSX] in {
3332 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
3333 (v2f64 (XXPERMDI
3334 (COPY_TO_REGCLASS $A, VSRC),
3335 (COPY_TO_REGCLASS $B, VSRC), 0))>;
3336
3337 def : Pat<(v4f32 (build_vector f32:$A, f32:$B, f32:$C, f32:$D)),
3338 (VMRGEW MrgFP.AC, MrgFP.BD)>;
3339 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
3340 DblToFlt.B0, DblToFlt.B1)),
3341 (v4f32 (VMRGEW MrgFP.ABhToFlt, MrgFP.ABlToFlt))>;
3342 }
3343
3344 let Predicates = [IsLittleEndian, HasVSX] in {
3345 // Little endian, available on all targets with VSX
3346 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
3347 (v2f64 (XXPERMDI
3348 (COPY_TO_REGCLASS $B, VSRC),
3349 (COPY_TO_REGCLASS $A, VSRC), 0))>;
3350
3351 def : Pat<(v4f32 (build_vector f32:$D, f32:$C, f32:$B, f32:$A)),
3352 (VMRGEW MrgFP.AC, MrgFP.BD)>;
3353 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
3354 DblToFlt.B0, DblToFlt.B1)),
3355 (v4f32 (VMRGEW MrgFP.BAhToFlt, MrgFP.BAlToFlt))>;
3356 }
3357
3358 let Predicates = [HasDirectMove] in {
3359 // Endianness-neutral constant splat on P8 and newer targets. The reason
3360 // for this pattern is that on targets with direct moves, we don't expand
3361 // BUILD_VECTOR nodes for v4i32.
3362 def : Pat<(v4i32 (build_vector immSExt5NonZero:$A, immSExt5NonZero:$A,
3363 immSExt5NonZero:$A, immSExt5NonZero:$A)),
3364 (v4i32 (VSPLTISW imm:$A))>;
3365 }
3366
3367 let Predicates = [IsBigEndian, HasDirectMove, NoP9Vector] in {
3368 // Big endian integer vectors using direct moves.
3369 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
3370 (v2i64 (XXPERMDI
3371 (COPY_TO_REGCLASS (MTVSRD $A), VSRC),
3372 (COPY_TO_REGCLASS (MTVSRD $B), VSRC), 0))>;
3373 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
3374 (VMRGOW (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC),
3375 (COPY_TO_REGCLASS (MTVSRWZ $C), VSRC), 0),
3376 (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC),
3377 (COPY_TO_REGCLASS (MTVSRWZ $D), VSRC), 0))>;
3378 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
3379 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
3380 }
3381
3382 let Predicates = [IsLittleEndian, HasDirectMove, NoP9Vector] in {
3383 // Little endian integer vectors using direct moves.
3384 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
3385 (v2i64 (XXPERMDI
3386 (COPY_TO_REGCLASS (MTVSRD $B), VSRC),
3387 (COPY_TO_REGCLASS (MTVSRD $A), VSRC), 0))>;
3388 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
3389 (VMRGOW (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $D), VSRC),
3390 (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC), 0),
3391 (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $C), VSRC),
3392 (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 0))>;
3393 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
3394 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
3395 }
3396
3397 let Predicates = [HasP9Vector] in {
3398 // Endianness-neutral patterns for const splats with ISA 3.0 instructions.
3399 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
3400 (v4i32 (MTVSRWS $A))>;
3401 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
3402 (v4i32 (MTVSRWS $A))>;
Nemanja Ivanovic552c8e92016-12-15 11:16:20 +00003403 def : Pat<(v16i8 (build_vector immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
3404 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
3405 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
3406 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
3407 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
3408 immAnyExt8:$A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003409 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB imm:$A), VSRC))>;
3410 def : Pat<(v16i8 immAllOnesV),
3411 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
3412 def : Pat<(v8i16 immAllOnesV),
3413 (v8i16 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
3414 def : Pat<(v4i32 immAllOnesV),
3415 (v4i32 (XXSPLTIB 255))>;
3416 def : Pat<(v2i64 immAllOnesV),
3417 (v2i64 (XXSPLTIB 255))>;
3418 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
3419 (v4i32 (XVCVSPSXWS (LXVWSX xoaddr:$A)))>;
3420 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
3421 (v4i32 (XVCVSPUXWS (LXVWSX xoaddr:$A)))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003422 def : Pat<(v4i32 (scalar_to_vector DblToIntLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003423 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003424 (XSCVDPSXWS (DFLOADf64 ixaddr:$A)), VSRC), 1))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003425 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003426 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003427 (XSCVDPUXWS (DFLOADf64 ixaddr:$A)), VSRC), 1))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003428 def : Pat<(v2i64 (scalar_to_vector FltToLongLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003429 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003430 (DFLOADf32 ixaddr:$A),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003431 VSFRC)), 0))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003432 def : Pat<(v2i64 (scalar_to_vector FltToULongLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003433 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003434 (DFLOADf32 ixaddr:$A),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003435 VSFRC)), 0))>;
3436 }
3437
3438 let Predicates = [IsISA3_0, HasDirectMove, IsBigEndian] in {
3439 def : Pat<(i64 (extractelt v2i64:$A, 1)),
3440 (i64 (MFVSRLD $A))>;
3441 // Better way to build integer vectors if we have MTVSRDD. Big endian.
3442 def : Pat<(v2i64 (build_vector i64:$rB, i64:$rA)),
3443 (v2i64 (MTVSRDD $rB, $rA))>;
3444 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
Lei Huangcd4f3852018-03-12 19:26:18 +00003445 (VMRGOW
3446 (v4i32 (COPY_TO_REGCLASS (MTVSRDD AnyExts.A, AnyExts.C), VSRC)),
3447 (v4i32
3448 (COPY_TO_REGCLASS (MTVSRDD AnyExts.B, AnyExts.D), VSRC)))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003449 }
3450
3451 let Predicates = [IsISA3_0, HasDirectMove, IsLittleEndian] in {
3452 def : Pat<(i64 (extractelt v2i64:$A, 0)),
3453 (i64 (MFVSRLD $A))>;
3454 // Better way to build integer vectors if we have MTVSRDD. Little endian.
3455 def : Pat<(v2i64 (build_vector i64:$rA, i64:$rB)),
3456 (v2i64 (MTVSRDD $rB, $rA))>;
3457 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
Lei Huangcd4f3852018-03-12 19:26:18 +00003458 (VMRGOW
3459 (v4i32 (COPY_TO_REGCLASS (MTVSRDD AnyExts.D, AnyExts.B), VSRC)),
3460 (v4i32
3461 (COPY_TO_REGCLASS (MTVSRDD AnyExts.C, AnyExts.A), VSRC)))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003462 }
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003463 // P9 Altivec instructions that can be used to build vectors.
3464 // Adding them to PPCInstrVSX.td rather than PPCAltivecVSX.td to compete
3465 // with complexities of existing build vector patterns in this file.
Tony Jiang9a91a182017-07-05 16:00:38 +00003466 let Predicates = [HasP9Altivec, IsLittleEndian] in {
3467 def : Pat<(v2i64 (build_vector WordToDWord.LE_A0, WordToDWord.LE_A1)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003468 (v2i64 (VEXTSW2D $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00003469 def : Pat<(v2i64 (build_vector HWordToDWord.LE_A0, HWordToDWord.LE_A1)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003470 (v2i64 (VEXTSH2D $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00003471 def : Pat<(v4i32 (build_vector HWordToWord.LE_A0, HWordToWord.LE_A1,
3472 HWordToWord.LE_A2, HWordToWord.LE_A3)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003473 (v4i32 (VEXTSH2W $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00003474 def : Pat<(v4i32 (build_vector ByteToWord.LE_A0, ByteToWord.LE_A1,
3475 ByteToWord.LE_A2, ByteToWord.LE_A3)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003476 (v4i32 (VEXTSB2W $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00003477 def : Pat<(v2i64 (build_vector ByteToDWord.LE_A0, ByteToDWord.LE_A1)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003478 (v2i64 (VEXTSB2D $A))>;
3479 }
Tony Jiang9a91a182017-07-05 16:00:38 +00003480
3481 let Predicates = [HasP9Altivec, IsBigEndian] in {
3482 def : Pat<(v2i64 (build_vector WordToDWord.BE_A0, WordToDWord.BE_A1)),
3483 (v2i64 (VEXTSW2D $A))>;
3484 def : Pat<(v2i64 (build_vector HWordToDWord.BE_A0, HWordToDWord.BE_A1)),
3485 (v2i64 (VEXTSH2D $A))>;
3486 def : Pat<(v4i32 (build_vector HWordToWord.BE_A0, HWordToWord.BE_A1,
3487 HWordToWord.BE_A2, HWordToWord.BE_A3)),
3488 (v4i32 (VEXTSH2W $A))>;
3489 def : Pat<(v4i32 (build_vector ByteToWord.BE_A0, ByteToWord.BE_A1,
3490 ByteToWord.BE_A2, ByteToWord.BE_A3)),
3491 (v4i32 (VEXTSB2W $A))>;
3492 def : Pat<(v2i64 (build_vector ByteToDWord.BE_A0, ByteToDWord.BE_A1)),
3493 (v2i64 (VEXTSB2D $A))>;
3494 }
3495
3496 let Predicates = [HasP9Altivec] in {
3497 def: Pat<(v2i64 (PPCSExtVElems v16i8:$A)),
3498 (v2i64 (VEXTSB2D $A))>;
3499 def: Pat<(v2i64 (PPCSExtVElems v8i16:$A)),
3500 (v2i64 (VEXTSH2D $A))>;
3501 def: Pat<(v2i64 (PPCSExtVElems v4i32:$A)),
3502 (v2i64 (VEXTSW2D $A))>;
3503 def: Pat<(v4i32 (PPCSExtVElems v16i8:$A)),
3504 (v4i32 (VEXTSB2W $A))>;
3505 def: Pat<(v4i32 (PPCSExtVElems v8i16:$A)),
3506 (v4i32 (VEXTSH2W $A))>;
3507 }
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00003508}