blob: 21e4a9d4bf01f45995e81b77de06dfa4b7cf0eb4 [file] [log] [blame]
Hal Finkel27774d92014-03-13 07:58:58 +00001//===- PPCInstrVSX.td - The PowerPC VSX Extension --*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file describes the VSX extension to the PowerPC instruction set.
11//
12//===----------------------------------------------------------------------===//
13
Bill Schmidtfe723b92015-04-27 19:57:34 +000014// *********************************** NOTE ***********************************
15// ** For POWER8 Little Endian, the VSX swap optimization relies on knowing **
16// ** which VMX and VSX instructions are lane-sensitive and which are not. **
17// ** A lane-sensitive instruction relies, implicitly or explicitly, on **
18// ** whether lanes are numbered from left to right. An instruction like **
19// ** VADDFP is not lane-sensitive, because each lane of the result vector **
20// ** relies only on the corresponding lane of the source vectors. However, **
21// ** an instruction like VMULESB is lane-sensitive, because "even" and **
22// ** "odd" lanes are different for big-endian and little-endian numbering. **
23// ** **
24// ** When adding new VMX and VSX instructions, please consider whether they **
25// ** are lane-sensitive. If so, they must be added to a switch statement **
26// ** in PPCVSXSwapRemoval::gatherVectorInstructions(). **
27// ****************************************************************************
28
Hal Finkel27774d92014-03-13 07:58:58 +000029def PPCRegVSRCAsmOperand : AsmOperandClass {
30 let Name = "RegVSRC"; let PredicateMethod = "isVSRegNumber";
31}
32def vsrc : RegisterOperand<VSRC> {
33 let ParserMatchClass = PPCRegVSRCAsmOperand;
34}
35
Hal Finkel19be5062014-03-29 05:29:01 +000036def PPCRegVSFRCAsmOperand : AsmOperandClass {
37 let Name = "RegVSFRC"; let PredicateMethod = "isVSRegNumber";
38}
39def vsfrc : RegisterOperand<VSFRC> {
40 let ParserMatchClass = PPCRegVSFRCAsmOperand;
41}
42
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +000043def PPCRegVSSRCAsmOperand : AsmOperandClass {
44 let Name = "RegVSSRC"; let PredicateMethod = "isVSRegNumber";
45}
46def vssrc : RegisterOperand<VSSRC> {
47 let ParserMatchClass = PPCRegVSSRCAsmOperand;
48}
49
Bill Schmidtfae5d712014-12-09 16:35:51 +000050// Little-endian-specific nodes.
51def SDT_PPClxvd2x : SDTypeProfile<1, 1, [
52 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
53]>;
54def SDT_PPCstxvd2x : SDTypeProfile<0, 2, [
55 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
56]>;
57def SDT_PPCxxswapd : SDTypeProfile<1, 1, [
58 SDTCisSameAs<0, 1>
59]>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000060def SDTVecConv : SDTypeProfile<1, 2, [
61 SDTCisVec<0>, SDTCisVec<1>, SDTCisPtrTy<2>
62]>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000063
64def PPClxvd2x : SDNode<"PPCISD::LXVD2X", SDT_PPClxvd2x,
Sean Fertile3c8c3852017-01-26 18:59:15 +000065 [SDNPHasChain, SDNPMayLoad, SDNPMemOperand]>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000066def PPCstxvd2x : SDNode<"PPCISD::STXVD2X", SDT_PPCstxvd2x,
67 [SDNPHasChain, SDNPMayStore]>;
68def PPCxxswapd : SDNode<"PPCISD::XXSWAPD", SDT_PPCxxswapd, [SDNPHasChain]>;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +000069def PPCmfvsr : SDNode<"PPCISD::MFVSR", SDTUnaryOp, []>;
70def PPCmtvsra : SDNode<"PPCISD::MTVSRA", SDTUnaryOp, []>;
71def PPCmtvsrz : SDNode<"PPCISD::MTVSRZ", SDTUnaryOp, []>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000072def PPCsvec2fp : SDNode<"PPCISD::SINT_VEC_TO_FP", SDTVecConv, []>;
73def PPCuvec2fp: SDNode<"PPCISD::UINT_VEC_TO_FP", SDTVecConv, []>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +000074def PPCswapNoChain : SDNode<"PPCISD::SWAP_NO_CHAIN", SDT_PPCxxswapd>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000075
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000076multiclass XX3Form_Rcr<bits<6> opcode, bits<7> xo, string asmbase,
77 string asmstr, InstrItinClass itin, Intrinsic Int,
78 ValueType OutTy, ValueType InTy> {
Hal Finkel27774d92014-03-13 07:58:58 +000079 let BaseName = asmbase in {
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000080 def NAME : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000081 !strconcat(asmbase, !strconcat(" ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000082 [(set OutTy:$XT, (Int InTy:$XA, InTy:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +000083 let Defs = [CR6] in
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000084 def o : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000085 !strconcat(asmbase, !strconcat(". ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000086 [(set InTy:$XT,
87 (InTy (PPCvcmp_o InTy:$XA, InTy:$XB, xo)))]>,
88 isDOT;
Hal Finkel27774d92014-03-13 07:58:58 +000089 }
90}
91
Nemanja Ivanovic11049f82016-10-04 06:59:23 +000092// Instruction form with a single input register for instructions such as
93// XXPERMDI. The reason for defining this is that specifying multiple chained
94// operands (such as loads) to an instruction will perform both chained
95// operations rather than coalescing them into a single register - even though
96// the source memory location is the same. This simply forces the instruction
97// to use the same register for both inputs.
98// For example, an output DAG such as this:
99// (XXPERMDI (LXSIBZX xoaddr:$src), (LXSIBZX xoaddr:$src ), 0))
100// would result in two load instructions emitted and used as separate inputs
101// to the XXPERMDI instruction.
102class XX3Form_2s<bits<6> opcode, bits<5> xo, dag OOL, dag IOL, string asmstr,
103 InstrItinClass itin, list<dag> pattern>
104 : XX3Form_2<opcode, xo, OOL, IOL, asmstr, itin, pattern> {
105 let XB = XA;
106}
107
Eric Christopher1b8e7632014-05-22 01:07:24 +0000108def HasVSX : Predicate<"PPCSubTarget->hasVSX()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000109def IsLittleEndian : Predicate<"PPCSubTarget->isLittleEndian()">;
110def IsBigEndian : Predicate<"!PPCSubTarget->isLittleEndian()">;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000111def HasOnlySwappingMemOps : Predicate<"!PPCSubTarget->hasP9Vector()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000112
Hal Finkel27774d92014-03-13 07:58:58 +0000113let Predicates = [HasVSX] in {
114let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000115let UseVSXReg = 1 in {
Craig Topperc50d64b2014-11-26 00:46:26 +0000116let hasSideEffects = 0 in { // VSX instructions don't have side effects.
Hal Finkel27774d92014-03-13 07:58:58 +0000117let Uses = [RM] in {
118
119 // Load indexed instructions
Sean Fertile3c8c3852017-01-26 18:59:15 +0000120 let mayLoad = 1, mayStore = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000121 let CodeSize = 3 in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000122 def LXSDX : XX1Form<31, 588,
Hal Finkel19be5062014-03-29 05:29:01 +0000123 (outs vsfrc:$XT), (ins memrr:$src),
Hal Finkel27774d92014-03-13 07:58:58 +0000124 "lxsdx $XT, $src", IIC_LdStLFD,
125 [(set f64:$XT, (load xoaddr:$src))]>;
126
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000127 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000128 def LXVD2X : XX1Form<31, 844,
Hal Finkel27774d92014-03-13 07:58:58 +0000129 (outs vsrc:$XT), (ins memrr:$src),
130 "lxvd2x $XT, $src", IIC_LdStLFD,
Bill Schmidt72954782014-11-12 04:19:40 +0000131 [(set v2f64:$XT, (int_ppc_vsx_lxvd2x xoaddr:$src))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000132
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000133 def LXVDSX : XX1Form<31, 332,
Hal Finkel27774d92014-03-13 07:58:58 +0000134 (outs vsrc:$XT), (ins memrr:$src),
135 "lxvdsx $XT, $src", IIC_LdStLFD, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000136
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000137 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000138 def LXVW4X : XX1Form<31, 780,
Hal Finkel27774d92014-03-13 07:58:58 +0000139 (outs vsrc:$XT), (ins memrr:$src),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000140 "lxvw4x $XT, $src", IIC_LdStLFD,
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +0000141 []>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000142 } // mayLoad
Hal Finkel27774d92014-03-13 07:58:58 +0000143
144 // Store indexed instructions
Sean Fertile3c8c3852017-01-26 18:59:15 +0000145 let mayStore = 1, mayLoad = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000146 let CodeSize = 3 in
Hal Finkel27774d92014-03-13 07:58:58 +0000147 def STXSDX : XX1Form<31, 716,
Hal Finkel19be5062014-03-29 05:29:01 +0000148 (outs), (ins vsfrc:$XT, memrr:$dst),
Hal Finkel27774d92014-03-13 07:58:58 +0000149 "stxsdx $XT, $dst", IIC_LdStSTFD,
150 [(store f64:$XT, xoaddr:$dst)]>;
151
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000152 let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000153 // The behaviour of this instruction is endianness-specific so we provide no
154 // pattern to match it without considering endianness.
Hal Finkel27774d92014-03-13 07:58:58 +0000155 def STXVD2X : XX1Form<31, 972,
156 (outs), (ins vsrc:$XT, memrr:$dst),
157 "stxvd2x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000158 []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000159
160 def STXVW4X : XX1Form<31, 908,
161 (outs), (ins vsrc:$XT, memrr:$dst),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000162 "stxvw4x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +0000163 []>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000164 }
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000165 } // mayStore
Hal Finkel27774d92014-03-13 07:58:58 +0000166
167 // Add/Mul Instructions
168 let isCommutable = 1 in {
169 def XSADDDP : XX3Form<60, 32,
Hal Finkel19be5062014-03-29 05:29:01 +0000170 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000171 "xsadddp $XT, $XA, $XB", IIC_VecFP,
172 [(set f64:$XT, (fadd f64:$XA, f64:$XB))]>;
173 def XSMULDP : XX3Form<60, 48,
Hal Finkel19be5062014-03-29 05:29:01 +0000174 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000175 "xsmuldp $XT, $XA, $XB", IIC_VecFP,
176 [(set f64:$XT, (fmul f64:$XA, f64:$XB))]>;
177
178 def XVADDDP : XX3Form<60, 96,
179 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
180 "xvadddp $XT, $XA, $XB", IIC_VecFP,
181 [(set v2f64:$XT, (fadd v2f64:$XA, v2f64:$XB))]>;
182
183 def XVADDSP : XX3Form<60, 64,
184 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
185 "xvaddsp $XT, $XA, $XB", IIC_VecFP,
186 [(set v4f32:$XT, (fadd v4f32:$XA, v4f32:$XB))]>;
187
188 def XVMULDP : XX3Form<60, 112,
189 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
190 "xvmuldp $XT, $XA, $XB", IIC_VecFP,
191 [(set v2f64:$XT, (fmul v2f64:$XA, v2f64:$XB))]>;
192
193 def XVMULSP : XX3Form<60, 80,
194 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
195 "xvmulsp $XT, $XA, $XB", IIC_VecFP,
196 [(set v4f32:$XT, (fmul v4f32:$XA, v4f32:$XB))]>;
197 }
198
199 // Subtract Instructions
200 def XSSUBDP : XX3Form<60, 40,
Hal Finkel19be5062014-03-29 05:29:01 +0000201 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000202 "xssubdp $XT, $XA, $XB", IIC_VecFP,
203 [(set f64:$XT, (fsub f64:$XA, f64:$XB))]>;
204
205 def XVSUBDP : XX3Form<60, 104,
206 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
207 "xvsubdp $XT, $XA, $XB", IIC_VecFP,
208 [(set v2f64:$XT, (fsub v2f64:$XA, v2f64:$XB))]>;
209 def XVSUBSP : XX3Form<60, 72,
210 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
211 "xvsubsp $XT, $XA, $XB", IIC_VecFP,
212 [(set v4f32:$XT, (fsub v4f32:$XA, v4f32:$XB))]>;
213
214 // FMA Instructions
Hal Finkel25e04542014-03-25 18:55:11 +0000215 let BaseName = "XSMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000216 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000217 def XSMADDADP : XX3Form<60, 33,
Hal Finkel19be5062014-03-29 05:29:01 +0000218 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000219 "xsmaddadp $XT, $XA, $XB", IIC_VecFP,
220 [(set f64:$XT, (fma f64:$XA, f64:$XB, f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000221 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
222 AltVSXFMARel;
223 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000224 def XSMADDMDP : XX3Form<60, 41,
Hal Finkel19be5062014-03-29 05:29:01 +0000225 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000226 "xsmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000227 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
228 AltVSXFMARel;
229 }
Hal Finkel27774d92014-03-13 07:58:58 +0000230
Hal Finkel25e04542014-03-25 18:55:11 +0000231 let BaseName = "XSMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000232 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000233 def XSMSUBADP : XX3Form<60, 49,
Hal Finkel19be5062014-03-29 05:29:01 +0000234 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000235 "xsmsubadp $XT, $XA, $XB", IIC_VecFP,
236 [(set f64:$XT, (fma f64:$XA, f64:$XB, (fneg f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000237 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
238 AltVSXFMARel;
239 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000240 def XSMSUBMDP : XX3Form<60, 57,
Hal Finkel19be5062014-03-29 05:29:01 +0000241 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000242 "xsmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000243 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
244 AltVSXFMARel;
245 }
Hal Finkel27774d92014-03-13 07:58:58 +0000246
Hal Finkel25e04542014-03-25 18:55:11 +0000247 let BaseName = "XSNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000248 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000249 def XSNMADDADP : XX3Form<60, 161,
Hal Finkel19be5062014-03-29 05:29:01 +0000250 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000251 "xsnmaddadp $XT, $XA, $XB", IIC_VecFP,
252 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000253 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
254 AltVSXFMARel;
255 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000256 def XSNMADDMDP : XX3Form<60, 169,
Hal Finkel19be5062014-03-29 05:29:01 +0000257 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000258 "xsnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000259 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
260 AltVSXFMARel;
261 }
Hal Finkel27774d92014-03-13 07:58:58 +0000262
Hal Finkel25e04542014-03-25 18:55:11 +0000263 let BaseName = "XSNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000264 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000265 def XSNMSUBADP : XX3Form<60, 177,
Hal Finkel19be5062014-03-29 05:29:01 +0000266 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000267 "xsnmsubadp $XT, $XA, $XB", IIC_VecFP,
268 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, (fneg f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000269 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
270 AltVSXFMARel;
271 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000272 def XSNMSUBMDP : XX3Form<60, 185,
Hal Finkel19be5062014-03-29 05:29:01 +0000273 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000274 "xsnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000275 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
276 AltVSXFMARel;
277 }
Hal Finkel27774d92014-03-13 07:58:58 +0000278
Hal Finkel25e04542014-03-25 18:55:11 +0000279 let BaseName = "XVMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000280 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000281 def XVMADDADP : XX3Form<60, 97,
282 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
283 "xvmaddadp $XT, $XA, $XB", IIC_VecFP,
284 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000285 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
286 AltVSXFMARel;
287 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000288 def XVMADDMDP : XX3Form<60, 105,
289 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
290 "xvmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000291 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
292 AltVSXFMARel;
293 }
Hal Finkel27774d92014-03-13 07:58:58 +0000294
Hal Finkel25e04542014-03-25 18:55:11 +0000295 let BaseName = "XVMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000296 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000297 def XVMADDASP : XX3Form<60, 65,
298 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
299 "xvmaddasp $XT, $XA, $XB", IIC_VecFP,
300 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000301 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
302 AltVSXFMARel;
303 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000304 def XVMADDMSP : XX3Form<60, 73,
305 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
306 "xvmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000307 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
308 AltVSXFMARel;
309 }
Hal Finkel27774d92014-03-13 07:58:58 +0000310
Hal Finkel25e04542014-03-25 18:55:11 +0000311 let BaseName = "XVMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000312 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000313 def XVMSUBADP : XX3Form<60, 113,
314 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
315 "xvmsubadp $XT, $XA, $XB", IIC_VecFP,
316 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000317 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
318 AltVSXFMARel;
319 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000320 def XVMSUBMDP : XX3Form<60, 121,
321 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
322 "xvmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000323 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
324 AltVSXFMARel;
325 }
Hal Finkel27774d92014-03-13 07:58:58 +0000326
Hal Finkel25e04542014-03-25 18:55:11 +0000327 let BaseName = "XVMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000328 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000329 def XVMSUBASP : XX3Form<60, 81,
330 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
331 "xvmsubasp $XT, $XA, $XB", IIC_VecFP,
332 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000333 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
334 AltVSXFMARel;
335 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000336 def XVMSUBMSP : XX3Form<60, 89,
337 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
338 "xvmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000339 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
340 AltVSXFMARel;
341 }
Hal Finkel27774d92014-03-13 07:58:58 +0000342
Hal Finkel25e04542014-03-25 18:55:11 +0000343 let BaseName = "XVNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000344 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000345 def XVNMADDADP : XX3Form<60, 225,
346 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
347 "xvnmaddadp $XT, $XA, $XB", IIC_VecFP,
348 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000349 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
350 AltVSXFMARel;
351 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000352 def XVNMADDMDP : XX3Form<60, 233,
353 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
354 "xvnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000355 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
356 AltVSXFMARel;
357 }
Hal Finkel27774d92014-03-13 07:58:58 +0000358
Hal Finkel25e04542014-03-25 18:55:11 +0000359 let BaseName = "XVNMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000360 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000361 def XVNMADDASP : XX3Form<60, 193,
362 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
363 "xvnmaddasp $XT, $XA, $XB", IIC_VecFP,
364 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000365 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
366 AltVSXFMARel;
367 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000368 def XVNMADDMSP : XX3Form<60, 201,
369 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
370 "xvnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000371 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
372 AltVSXFMARel;
373 }
Hal Finkel27774d92014-03-13 07:58:58 +0000374
Hal Finkel25e04542014-03-25 18:55:11 +0000375 let BaseName = "XVNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000376 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000377 def XVNMSUBADP : XX3Form<60, 241,
378 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
379 "xvnmsubadp $XT, $XA, $XB", IIC_VecFP,
380 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000381 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
382 AltVSXFMARel;
383 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000384 def XVNMSUBMDP : XX3Form<60, 249,
385 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
386 "xvnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000387 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
388 AltVSXFMARel;
389 }
Hal Finkel27774d92014-03-13 07:58:58 +0000390
Hal Finkel25e04542014-03-25 18:55:11 +0000391 let BaseName = "XVNMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000392 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000393 def XVNMSUBASP : XX3Form<60, 209,
394 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
395 "xvnmsubasp $XT, $XA, $XB", IIC_VecFP,
396 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000397 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
398 AltVSXFMARel;
399 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000400 def XVNMSUBMSP : XX3Form<60, 217,
401 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
402 "xvnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000403 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
404 AltVSXFMARel;
405 }
Hal Finkel27774d92014-03-13 07:58:58 +0000406
407 // Division Instructions
408 def XSDIVDP : XX3Form<60, 56,
Hal Finkel19be5062014-03-29 05:29:01 +0000409 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000410 "xsdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000411 [(set f64:$XT, (fdiv f64:$XA, f64:$XB))]>;
412 def XSSQRTDP : XX2Form<60, 75,
Hal Finkel19be5062014-03-29 05:29:01 +0000413 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000414 "xssqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000415 [(set f64:$XT, (fsqrt f64:$XB))]>;
416
417 def XSREDP : XX2Form<60, 90,
Hal Finkel19be5062014-03-29 05:29:01 +0000418 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000419 "xsredp $XT, $XB", IIC_VecFP,
420 [(set f64:$XT, (PPCfre f64:$XB))]>;
421 def XSRSQRTEDP : XX2Form<60, 74,
Hal Finkel19be5062014-03-29 05:29:01 +0000422 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000423 "xsrsqrtedp $XT, $XB", IIC_VecFP,
424 [(set f64:$XT, (PPCfrsqrte f64:$XB))]>;
425
426 def XSTDIVDP : XX3Form_1<60, 61,
Hal Finkel19be5062014-03-29 05:29:01 +0000427 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000428 "xstdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000429 def XSTSQRTDP : XX2Form_1<60, 106,
Hal Finkel19be5062014-03-29 05:29:01 +0000430 (outs crrc:$crD), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000431 "xstsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000432
433 def XVDIVDP : XX3Form<60, 120,
434 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000435 "xvdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000436 [(set v2f64:$XT, (fdiv v2f64:$XA, v2f64:$XB))]>;
437 def XVDIVSP : XX3Form<60, 88,
438 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000439 "xvdivsp $XT, $XA, $XB", IIC_FPDivS,
Hal Finkel27774d92014-03-13 07:58:58 +0000440 [(set v4f32:$XT, (fdiv v4f32:$XA, v4f32:$XB))]>;
441
442 def XVSQRTDP : XX2Form<60, 203,
443 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000444 "xvsqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000445 [(set v2f64:$XT, (fsqrt v2f64:$XB))]>;
446 def XVSQRTSP : XX2Form<60, 139,
447 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000448 "xvsqrtsp $XT, $XB", IIC_FPSqrtS,
Hal Finkel27774d92014-03-13 07:58:58 +0000449 [(set v4f32:$XT, (fsqrt v4f32:$XB))]>;
450
451 def XVTDIVDP : XX3Form_1<60, 125,
452 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000453 "xvtdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000454 def XVTDIVSP : XX3Form_1<60, 93,
455 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000456 "xvtdivsp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000457
458 def XVTSQRTDP : XX2Form_1<60, 234,
459 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000460 "xvtsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000461 def XVTSQRTSP : XX2Form_1<60, 170,
462 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000463 "xvtsqrtsp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000464
465 def XVREDP : XX2Form<60, 218,
466 (outs vsrc:$XT), (ins vsrc:$XB),
467 "xvredp $XT, $XB", IIC_VecFP,
468 [(set v2f64:$XT, (PPCfre v2f64:$XB))]>;
469 def XVRESP : XX2Form<60, 154,
470 (outs vsrc:$XT), (ins vsrc:$XB),
471 "xvresp $XT, $XB", IIC_VecFP,
472 [(set v4f32:$XT, (PPCfre v4f32:$XB))]>;
473
474 def XVRSQRTEDP : XX2Form<60, 202,
475 (outs vsrc:$XT), (ins vsrc:$XB),
476 "xvrsqrtedp $XT, $XB", IIC_VecFP,
477 [(set v2f64:$XT, (PPCfrsqrte v2f64:$XB))]>;
478 def XVRSQRTESP : XX2Form<60, 138,
479 (outs vsrc:$XT), (ins vsrc:$XB),
480 "xvrsqrtesp $XT, $XB", IIC_VecFP,
481 [(set v4f32:$XT, (PPCfrsqrte v4f32:$XB))]>;
482
483 // Compare Instructions
484 def XSCMPODP : XX3Form_1<60, 43,
Hal Finkel19be5062014-03-29 05:29:01 +0000485 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000486 "xscmpodp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000487 def XSCMPUDP : XX3Form_1<60, 35,
Hal Finkel19be5062014-03-29 05:29:01 +0000488 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000489 "xscmpudp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000490
491 defm XVCMPEQDP : XX3Form_Rcr<60, 99,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000492 "xvcmpeqdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000493 int_ppc_vsx_xvcmpeqdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000494 defm XVCMPEQSP : XX3Form_Rcr<60, 67,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000495 "xvcmpeqsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000496 int_ppc_vsx_xvcmpeqsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000497 defm XVCMPGEDP : XX3Form_Rcr<60, 115,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000498 "xvcmpgedp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000499 int_ppc_vsx_xvcmpgedp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000500 defm XVCMPGESP : XX3Form_Rcr<60, 83,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000501 "xvcmpgesp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000502 int_ppc_vsx_xvcmpgesp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000503 defm XVCMPGTDP : XX3Form_Rcr<60, 107,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000504 "xvcmpgtdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000505 int_ppc_vsx_xvcmpgtdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000506 defm XVCMPGTSP : XX3Form_Rcr<60, 75,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000507 "xvcmpgtsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000508 int_ppc_vsx_xvcmpgtsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000509
510 // Move Instructions
511 def XSABSDP : XX2Form<60, 345,
Hal Finkel19be5062014-03-29 05:29:01 +0000512 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000513 "xsabsdp $XT, $XB", IIC_VecFP,
514 [(set f64:$XT, (fabs f64:$XB))]>;
515 def XSNABSDP : XX2Form<60, 361,
Hal Finkel19be5062014-03-29 05:29:01 +0000516 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000517 "xsnabsdp $XT, $XB", IIC_VecFP,
518 [(set f64:$XT, (fneg (fabs f64:$XB)))]>;
519 def XSNEGDP : XX2Form<60, 377,
Hal Finkel19be5062014-03-29 05:29:01 +0000520 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000521 "xsnegdp $XT, $XB", IIC_VecFP,
522 [(set f64:$XT, (fneg f64:$XB))]>;
523 def XSCPSGNDP : XX3Form<60, 176,
Hal Finkel19be5062014-03-29 05:29:01 +0000524 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000525 "xscpsgndp $XT, $XA, $XB", IIC_VecFP,
526 [(set f64:$XT, (fcopysign f64:$XB, f64:$XA))]>;
527
528 def XVABSDP : XX2Form<60, 473,
529 (outs vsrc:$XT), (ins vsrc:$XB),
530 "xvabsdp $XT, $XB", IIC_VecFP,
531 [(set v2f64:$XT, (fabs v2f64:$XB))]>;
532
533 def XVABSSP : XX2Form<60, 409,
534 (outs vsrc:$XT), (ins vsrc:$XB),
535 "xvabssp $XT, $XB", IIC_VecFP,
536 [(set v4f32:$XT, (fabs v4f32:$XB))]>;
537
538 def XVCPSGNDP : XX3Form<60, 240,
539 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
540 "xvcpsgndp $XT, $XA, $XB", IIC_VecFP,
541 [(set v2f64:$XT, (fcopysign v2f64:$XB, v2f64:$XA))]>;
542 def XVCPSGNSP : XX3Form<60, 208,
543 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
544 "xvcpsgnsp $XT, $XA, $XB", IIC_VecFP,
545 [(set v4f32:$XT, (fcopysign v4f32:$XB, v4f32:$XA))]>;
546
547 def XVNABSDP : XX2Form<60, 489,
548 (outs vsrc:$XT), (ins vsrc:$XB),
549 "xvnabsdp $XT, $XB", IIC_VecFP,
550 [(set v2f64:$XT, (fneg (fabs v2f64:$XB)))]>;
551 def XVNABSSP : XX2Form<60, 425,
552 (outs vsrc:$XT), (ins vsrc:$XB),
553 "xvnabssp $XT, $XB", IIC_VecFP,
554 [(set v4f32:$XT, (fneg (fabs v4f32:$XB)))]>;
555
556 def XVNEGDP : XX2Form<60, 505,
557 (outs vsrc:$XT), (ins vsrc:$XB),
558 "xvnegdp $XT, $XB", IIC_VecFP,
559 [(set v2f64:$XT, (fneg v2f64:$XB))]>;
560 def XVNEGSP : XX2Form<60, 441,
561 (outs vsrc:$XT), (ins vsrc:$XB),
562 "xvnegsp $XT, $XB", IIC_VecFP,
563 [(set v4f32:$XT, (fneg v4f32:$XB))]>;
564
565 // Conversion Instructions
566 def XSCVDPSP : XX2Form<60, 265,
Hal Finkel19be5062014-03-29 05:29:01 +0000567 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000568 "xscvdpsp $XT, $XB", IIC_VecFP, []>;
569 def XSCVDPSXDS : XX2Form<60, 344,
Hal Finkel19be5062014-03-29 05:29:01 +0000570 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000571 "xscvdpsxds $XT, $XB", IIC_VecFP,
572 [(set f64:$XT, (PPCfctidz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000573 let isCodeGenOnly = 1 in
574 def XSCVDPSXDSs : XX2Form<60, 344,
575 (outs vssrc:$XT), (ins vssrc:$XB),
576 "xscvdpsxds $XT, $XB", IIC_VecFP,
577 [(set f32:$XT, (PPCfctidz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000578 def XSCVDPSXWS : XX2Form<60, 88,
Hal Finkel19be5062014-03-29 05:29:01 +0000579 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000580 "xscvdpsxws $XT, $XB", IIC_VecFP,
581 [(set f64:$XT, (PPCfctiwz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000582 let isCodeGenOnly = 1 in
583 def XSCVDPSXWSs : XX2Form<60, 88,
584 (outs vssrc:$XT), (ins vssrc:$XB),
585 "xscvdpsxws $XT, $XB", IIC_VecFP,
586 [(set f32:$XT, (PPCfctiwz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000587 def XSCVDPUXDS : XX2Form<60, 328,
Hal Finkel19be5062014-03-29 05:29:01 +0000588 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000589 "xscvdpuxds $XT, $XB", IIC_VecFP,
590 [(set f64:$XT, (PPCfctiduz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000591 let isCodeGenOnly = 1 in
592 def XSCVDPUXDSs : XX2Form<60, 328,
593 (outs vssrc:$XT), (ins vssrc:$XB),
594 "xscvdpuxds $XT, $XB", IIC_VecFP,
595 [(set f32:$XT, (PPCfctiduz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000596 def XSCVDPUXWS : XX2Form<60, 72,
Hal Finkel19be5062014-03-29 05:29:01 +0000597 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000598 "xscvdpuxws $XT, $XB", IIC_VecFP,
599 [(set f64:$XT, (PPCfctiwuz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000600 let isCodeGenOnly = 1 in
601 def XSCVDPUXWSs : XX2Form<60, 72,
602 (outs vssrc:$XT), (ins vssrc:$XB),
603 "xscvdpuxws $XT, $XB", IIC_VecFP,
604 [(set f32:$XT, (PPCfctiwuz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000605 def XSCVSPDP : XX2Form<60, 329,
Hal Finkel19be5062014-03-29 05:29:01 +0000606 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000607 "xscvspdp $XT, $XB", IIC_VecFP, []>;
608 def XSCVSXDDP : XX2Form<60, 376,
Hal Finkel19be5062014-03-29 05:29:01 +0000609 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000610 "xscvsxddp $XT, $XB", IIC_VecFP,
611 [(set f64:$XT, (PPCfcfid f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000612 def XSCVUXDDP : XX2Form<60, 360,
Hal Finkel19be5062014-03-29 05:29:01 +0000613 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000614 "xscvuxddp $XT, $XB", IIC_VecFP,
615 [(set f64:$XT, (PPCfcfidu f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000616
617 def XVCVDPSP : XX2Form<60, 393,
618 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000619 "xvcvdpsp $XT, $XB", IIC_VecFP,
620 [(set v4f32:$XT, (int_ppc_vsx_xvcvdpsp v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000621 def XVCVDPSXDS : XX2Form<60, 472,
622 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000623 "xvcvdpsxds $XT, $XB", IIC_VecFP,
624 [(set v2i64:$XT, (fp_to_sint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000625 def XVCVDPSXWS : XX2Form<60, 216,
626 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000627 "xvcvdpsxws $XT, $XB", IIC_VecFP,
628 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpsxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000629 def XVCVDPUXDS : XX2Form<60, 456,
630 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000631 "xvcvdpuxds $XT, $XB", IIC_VecFP,
632 [(set v2i64:$XT, (fp_to_uint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000633 def XVCVDPUXWS : XX2Form<60, 200,
634 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000635 "xvcvdpuxws $XT, $XB", IIC_VecFP,
636 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpuxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000637
638 def XVCVSPDP : XX2Form<60, 457,
639 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000640 "xvcvspdp $XT, $XB", IIC_VecFP,
641 [(set v2f64:$XT, (int_ppc_vsx_xvcvspdp v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000642 def XVCVSPSXDS : XX2Form<60, 408,
643 (outs vsrc:$XT), (ins vsrc:$XB),
644 "xvcvspsxds $XT, $XB", IIC_VecFP, []>;
645 def XVCVSPSXWS : XX2Form<60, 152,
646 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000647 "xvcvspsxws $XT, $XB", IIC_VecFP,
648 [(set v4i32:$XT, (fp_to_sint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000649 def XVCVSPUXDS : XX2Form<60, 392,
650 (outs vsrc:$XT), (ins vsrc:$XB),
651 "xvcvspuxds $XT, $XB", IIC_VecFP, []>;
652 def XVCVSPUXWS : XX2Form<60, 136,
653 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000654 "xvcvspuxws $XT, $XB", IIC_VecFP,
655 [(set v4i32:$XT, (fp_to_uint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000656 def XVCVSXDDP : XX2Form<60, 504,
657 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000658 "xvcvsxddp $XT, $XB", IIC_VecFP,
659 [(set v2f64:$XT, (sint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000660 def XVCVSXDSP : XX2Form<60, 440,
661 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000662 "xvcvsxdsp $XT, $XB", IIC_VecFP,
663 [(set v4f32:$XT, (int_ppc_vsx_xvcvsxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000664 def XVCVSXWDP : XX2Form<60, 248,
665 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000666 "xvcvsxwdp $XT, $XB", IIC_VecFP,
667 [(set v2f64:$XT, (int_ppc_vsx_xvcvsxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000668 def XVCVSXWSP : XX2Form<60, 184,
669 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic44513e52016-07-05 09:22:29 +0000670 "xvcvsxwsp $XT, $XB", IIC_VecFP,
671 [(set v4f32:$XT, (sint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000672 def XVCVUXDDP : XX2Form<60, 488,
673 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000674 "xvcvuxddp $XT, $XB", IIC_VecFP,
675 [(set v2f64:$XT, (uint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000676 def XVCVUXDSP : XX2Form<60, 424,
677 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000678 "xvcvuxdsp $XT, $XB", IIC_VecFP,
679 [(set v4f32:$XT, (int_ppc_vsx_xvcvuxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000680 def XVCVUXWDP : XX2Form<60, 232,
681 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000682 "xvcvuxwdp $XT, $XB", IIC_VecFP,
683 [(set v2f64:$XT, (int_ppc_vsx_xvcvuxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000684 def XVCVUXWSP : XX2Form<60, 168,
685 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000686 "xvcvuxwsp $XT, $XB", IIC_VecFP,
687 [(set v4f32:$XT, (uint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000688
689 // Rounding Instructions
690 def XSRDPI : XX2Form<60, 73,
Hal Finkel19be5062014-03-29 05:29:01 +0000691 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000692 "xsrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000693 [(set f64:$XT, (fround f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000694 def XSRDPIC : XX2Form<60, 107,
Hal Finkel19be5062014-03-29 05:29:01 +0000695 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000696 "xsrdpic $XT, $XB", IIC_VecFP,
697 [(set f64:$XT, (fnearbyint f64:$XB))]>;
698 def XSRDPIM : XX2Form<60, 121,
Hal Finkel19be5062014-03-29 05:29:01 +0000699 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000700 "xsrdpim $XT, $XB", IIC_VecFP,
701 [(set f64:$XT, (ffloor f64:$XB))]>;
702 def XSRDPIP : XX2Form<60, 105,
Hal Finkel19be5062014-03-29 05:29:01 +0000703 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000704 "xsrdpip $XT, $XB", IIC_VecFP,
705 [(set f64:$XT, (fceil f64:$XB))]>;
706 def XSRDPIZ : XX2Form<60, 89,
Hal Finkel19be5062014-03-29 05:29:01 +0000707 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000708 "xsrdpiz $XT, $XB", IIC_VecFP,
709 [(set f64:$XT, (ftrunc f64:$XB))]>;
710
711 def XVRDPI : XX2Form<60, 201,
712 (outs vsrc:$XT), (ins vsrc:$XB),
713 "xvrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000714 [(set v2f64:$XT, (fround v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000715 def XVRDPIC : XX2Form<60, 235,
716 (outs vsrc:$XT), (ins vsrc:$XB),
717 "xvrdpic $XT, $XB", IIC_VecFP,
718 [(set v2f64:$XT, (fnearbyint v2f64:$XB))]>;
719 def XVRDPIM : XX2Form<60, 249,
720 (outs vsrc:$XT), (ins vsrc:$XB),
721 "xvrdpim $XT, $XB", IIC_VecFP,
722 [(set v2f64:$XT, (ffloor v2f64:$XB))]>;
723 def XVRDPIP : XX2Form<60, 233,
724 (outs vsrc:$XT), (ins vsrc:$XB),
725 "xvrdpip $XT, $XB", IIC_VecFP,
726 [(set v2f64:$XT, (fceil v2f64:$XB))]>;
727 def XVRDPIZ : XX2Form<60, 217,
728 (outs vsrc:$XT), (ins vsrc:$XB),
729 "xvrdpiz $XT, $XB", IIC_VecFP,
730 [(set v2f64:$XT, (ftrunc v2f64:$XB))]>;
731
732 def XVRSPI : XX2Form<60, 137,
733 (outs vsrc:$XT), (ins vsrc:$XB),
734 "xvrspi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000735 [(set v4f32:$XT, (fround v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000736 def XVRSPIC : XX2Form<60, 171,
737 (outs vsrc:$XT), (ins vsrc:$XB),
738 "xvrspic $XT, $XB", IIC_VecFP,
739 [(set v4f32:$XT, (fnearbyint v4f32:$XB))]>;
740 def XVRSPIM : XX2Form<60, 185,
741 (outs vsrc:$XT), (ins vsrc:$XB),
742 "xvrspim $XT, $XB", IIC_VecFP,
743 [(set v4f32:$XT, (ffloor v4f32:$XB))]>;
744 def XVRSPIP : XX2Form<60, 169,
745 (outs vsrc:$XT), (ins vsrc:$XB),
746 "xvrspip $XT, $XB", IIC_VecFP,
747 [(set v4f32:$XT, (fceil v4f32:$XB))]>;
748 def XVRSPIZ : XX2Form<60, 153,
749 (outs vsrc:$XT), (ins vsrc:$XB),
750 "xvrspiz $XT, $XB", IIC_VecFP,
751 [(set v4f32:$XT, (ftrunc v4f32:$XB))]>;
752
753 // Max/Min Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000754 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000755 def XSMAXDP : XX3Form<60, 160,
Hal Finkel19be5062014-03-29 05:29:01 +0000756 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000757 "xsmaxdp $XT, $XA, $XB", IIC_VecFP,
758 [(set vsfrc:$XT,
759 (int_ppc_vsx_xsmaxdp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000760 def XSMINDP : XX3Form<60, 168,
Hal Finkel19be5062014-03-29 05:29:01 +0000761 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000762 "xsmindp $XT, $XA, $XB", IIC_VecFP,
763 [(set vsfrc:$XT,
764 (int_ppc_vsx_xsmindp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000765
766 def XVMAXDP : XX3Form<60, 224,
767 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000768 "xvmaxdp $XT, $XA, $XB", IIC_VecFP,
769 [(set vsrc:$XT,
770 (int_ppc_vsx_xvmaxdp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000771 def XVMINDP : XX3Form<60, 232,
772 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000773 "xvmindp $XT, $XA, $XB", IIC_VecFP,
774 [(set vsrc:$XT,
775 (int_ppc_vsx_xvmindp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000776
777 def XVMAXSP : XX3Form<60, 192,
778 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000779 "xvmaxsp $XT, $XA, $XB", IIC_VecFP,
780 [(set vsrc:$XT,
781 (int_ppc_vsx_xvmaxsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000782 def XVMINSP : XX3Form<60, 200,
783 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000784 "xvminsp $XT, $XA, $XB", IIC_VecFP,
785 [(set vsrc:$XT,
786 (int_ppc_vsx_xvminsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000787 } // isCommutable
Hal Finkel27774d92014-03-13 07:58:58 +0000788} // Uses = [RM]
789
790 // Logical Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000791 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000792 def XXLAND : XX3Form<60, 130,
793 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000794 "xxland $XT, $XA, $XB", IIC_VecGeneral,
795 [(set v4i32:$XT, (and v4i32:$XA, v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000796 def XXLANDC : XX3Form<60, 138,
797 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000798 "xxlandc $XT, $XA, $XB", IIC_VecGeneral,
799 [(set v4i32:$XT, (and v4i32:$XA,
800 (vnot_ppc v4i32:$XB)))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000801 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000802 def XXLNOR : XX3Form<60, 162,
803 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000804 "xxlnor $XT, $XA, $XB", IIC_VecGeneral,
805 [(set v4i32:$XT, (vnot_ppc (or v4i32:$XA,
806 v4i32:$XB)))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000807 def XXLOR : XX3Form<60, 146,
808 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000809 "xxlor $XT, $XA, $XB", IIC_VecGeneral,
810 [(set v4i32:$XT, (or v4i32:$XA, v4i32:$XB))]>;
Hal Finkel19be5062014-03-29 05:29:01 +0000811 let isCodeGenOnly = 1 in
812 def XXLORf: XX3Form<60, 146,
813 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
814 "xxlor $XT, $XA, $XB", IIC_VecGeneral, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000815 def XXLXOR : XX3Form<60, 154,
816 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000817 "xxlxor $XT, $XA, $XB", IIC_VecGeneral,
818 [(set v4i32:$XT, (xor v4i32:$XA, v4i32:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000819 } // isCommutable
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +0000820 let isCodeGenOnly = 1 in
821 def XXLXORz : XX3Form_Zero<60, 154, (outs vsrc:$XT), (ins),
822 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
823 [(set v4i32:$XT, (v4i32 immAllZerosV))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000824
Ehsan Amiric90b02c2016-10-24 17:31:09 +0000825 let isCodeGenOnly = 1 in {
826 def XXLXORdpz : XX3Form_SetZero<60, 154,
827 (outs vsfrc:$XT), (ins),
828 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
829 [(set f64:$XT, (fpimm0))]>;
830 def XXLXORspz : XX3Form_SetZero<60, 154,
831 (outs vssrc:$XT), (ins),
832 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
833 [(set f32:$XT, (fpimm0))]>;
834 }
835
Hal Finkel27774d92014-03-13 07:58:58 +0000836 // Permutation Instructions
837 def XXMRGHW : XX3Form<60, 18,
838 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
839 "xxmrghw $XT, $XA, $XB", IIC_VecPerm, []>;
840 def XXMRGLW : XX3Form<60, 50,
841 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
842 "xxmrglw $XT, $XA, $XB", IIC_VecPerm, []>;
843
844 def XXPERMDI : XX3Form_2<60, 10,
845 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$DM),
Tony Jiang60c247d2017-05-31 13:09:57 +0000846 "xxpermdi $XT, $XA, $XB, $DM", IIC_VecPerm,
847 [(set v2i64:$XT, (PPCxxpermdi v2i64:$XA, v2i64:$XB,
848 imm32SExt16:$DM))]>;
Nemanja Ivanovic15748f42016-12-06 11:47:14 +0000849 let isCodeGenOnly = 1 in
850 def XXPERMDIs : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vsfrc:$XA, u2imm:$DM),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000851 "xxpermdi $XT, $XA, $XA, $DM", IIC_VecPerm, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000852 def XXSEL : XX4Form<60, 3,
853 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, vsrc:$XC),
854 "xxsel $XT, $XA, $XB, $XC", IIC_VecPerm, []>;
855
856 def XXSLDWI : XX3Form_2<60, 2,
857 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$SHW),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +0000858 "xxsldwi $XT, $XA, $XB, $SHW", IIC_VecPerm,
859 [(set v4i32:$XT, (PPCvecshl v4i32:$XA, v4i32:$XB,
860 imm32SExt16:$SHW))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000861 def XXSPLTW : XX2Form_2<60, 164,
862 (outs vsrc:$XT), (ins vsrc:$XB, u2imm:$UIM),
Nemanja Ivanovic1a2b2f02016-05-04 16:04:02 +0000863 "xxspltw $XT, $XB, $UIM", IIC_VecPerm,
864 [(set v4i32:$XT,
865 (PPCxxsplt v4i32:$XB, imm32SExt16:$UIM))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000866 let isCodeGenOnly = 1 in
867 def XXSPLTWs : XX2Form_2<60, 164,
868 (outs vsrc:$XT), (ins vfrc:$XB, u2imm:$UIM),
869 "xxspltw $XT, $XB, $UIM", IIC_VecPerm, []>;
Craig Topperc50d64b2014-11-26 00:46:26 +0000870} // hasSideEffects
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000871} // UseVSXReg = 1
Hal Finkel27774d92014-03-13 07:58:58 +0000872
Bill Schmidt61e65232014-10-22 13:13:40 +0000873// SELECT_CC_* - Used to implement the SELECT_CC DAG operation. Expanded after
874// instruction selection into a branch sequence.
875let usesCustomInserter = 1, // Expanded after instruction selection.
876 PPC970_Single = 1 in {
877
878 def SELECT_CC_VSRC: Pseudo<(outs vsrc:$dst),
879 (ins crrc:$cond, vsrc:$T, vsrc:$F, i32imm:$BROPC),
880 "#SELECT_CC_VSRC",
881 []>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000882 def SELECT_VSRC: Pseudo<(outs vsrc:$dst),
883 (ins crbitrc:$cond, vsrc:$T, vsrc:$F),
884 "#SELECT_VSRC",
Bill Schmidt61e65232014-10-22 13:13:40 +0000885 [(set v2f64:$dst,
886 (select i1:$cond, v2f64:$T, v2f64:$F))]>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000887 def SELECT_CC_VSFRC: Pseudo<(outs f8rc:$dst),
888 (ins crrc:$cond, f8rc:$T, f8rc:$F,
889 i32imm:$BROPC), "#SELECT_CC_VSFRC",
890 []>;
891 def SELECT_VSFRC: Pseudo<(outs f8rc:$dst),
892 (ins crbitrc:$cond, f8rc:$T, f8rc:$F),
893 "#SELECT_VSFRC",
894 [(set f64:$dst,
895 (select i1:$cond, f64:$T, f64:$F))]>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000896 def SELECT_CC_VSSRC: Pseudo<(outs f4rc:$dst),
897 (ins crrc:$cond, f4rc:$T, f4rc:$F,
898 i32imm:$BROPC), "#SELECT_CC_VSSRC",
899 []>;
900 def SELECT_VSSRC: Pseudo<(outs f4rc:$dst),
901 (ins crbitrc:$cond, f4rc:$T, f4rc:$F),
902 "#SELECT_VSSRC",
903 [(set f32:$dst,
904 (select i1:$cond, f32:$T, f32:$F))]>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000905} // usesCustomInserter
906} // AddedComplexity
Bill Schmidt61e65232014-10-22 13:13:40 +0000907
Hal Finkel27774d92014-03-13 07:58:58 +0000908def : InstAlias<"xvmovdp $XT, $XB",
909 (XVCPSGNDP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
910def : InstAlias<"xvmovsp $XT, $XB",
911 (XVCPSGNSP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
912
913def : InstAlias<"xxspltd $XT, $XB, 0",
914 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 0)>;
915def : InstAlias<"xxspltd $XT, $XB, 1",
916 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 3)>;
917def : InstAlias<"xxmrghd $XT, $XA, $XB",
918 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 0)>;
919def : InstAlias<"xxmrgld $XT, $XA, $XB",
920 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 3)>;
921def : InstAlias<"xxswapd $XT, $XB",
922 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 2)>;
Nemanja Ivanovic15748f42016-12-06 11:47:14 +0000923def : InstAlias<"xxspltd $XT, $XB, 0",
924 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 0)>;
925def : InstAlias<"xxspltd $XT, $XB, 1",
926 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 3)>;
927def : InstAlias<"xxswapd $XT, $XB",
928 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 2)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000929
930let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000931
Nemanja Ivanovic6f22b412016-09-27 08:42:12 +0000932def : Pat<(v4i32 (vnot_ppc v4i32:$A)),
933 (v4i32 (XXLNOR $A, $A))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000934let Predicates = [IsBigEndian] in {
Hal Finkel27774d92014-03-13 07:58:58 +0000935def : Pat<(v2f64 (scalar_to_vector f64:$A)),
Hal Finkel19be5062014-03-29 05:29:01 +0000936 (v2f64 (SUBREG_TO_REG (i64 1), $A, sub_64))>;
Hal Finkel27774d92014-03-13 07:58:58 +0000937
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000938def : Pat<(f64 (extractelt v2f64:$S, 0)),
Hal Finkel19be5062014-03-29 05:29:01 +0000939 (f64 (EXTRACT_SUBREG $S, sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000940def : Pat<(f64 (extractelt v2f64:$S, 1)),
Hal Finkel19be5062014-03-29 05:29:01 +0000941 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000942}
943
944let Predicates = [IsLittleEndian] in {
945def : Pat<(v2f64 (scalar_to_vector f64:$A)),
946 (v2f64 (XXPERMDI (SUBREG_TO_REG (i64 1), $A, sub_64),
947 (SUBREG_TO_REG (i64 1), $A, sub_64), 0))>;
948
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000949def : Pat<(f64 (extractelt v2f64:$S, 0)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000950 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000951def : Pat<(f64 (extractelt v2f64:$S, 1)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000952 (f64 (EXTRACT_SUBREG $S, sub_64))>;
953}
Hal Finkel27774d92014-03-13 07:58:58 +0000954
955// Additional fnmsub patterns: -a*c + b == -(a*c - b)
956def : Pat<(fma (fneg f64:$A), f64:$C, f64:$B),
957 (XSNMSUBADP $B, $C, $A)>;
958def : Pat<(fma f64:$A, (fneg f64:$C), f64:$B),
959 (XSNMSUBADP $B, $C, $A)>;
960
961def : Pat<(fma (fneg v2f64:$A), v2f64:$C, v2f64:$B),
962 (XVNMSUBADP $B, $C, $A)>;
963def : Pat<(fma v2f64:$A, (fneg v2f64:$C), v2f64:$B),
964 (XVNMSUBADP $B, $C, $A)>;
965
966def : Pat<(fma (fneg v4f32:$A), v4f32:$C, v4f32:$B),
967 (XVNMSUBASP $B, $C, $A)>;
968def : Pat<(fma v4f32:$A, (fneg v4f32:$C), v4f32:$B),
969 (XVNMSUBASP $B, $C, $A)>;
970
Hal Finkel9e0baa62014-04-01 19:24:27 +0000971def : Pat<(v2f64 (bitconvert v4f32:$A)),
972 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000973def : Pat<(v2f64 (bitconvert v4i32:$A)),
974 (COPY_TO_REGCLASS $A, VSRC)>;
975def : Pat<(v2f64 (bitconvert v8i16:$A)),
976 (COPY_TO_REGCLASS $A, VSRC)>;
977def : Pat<(v2f64 (bitconvert v16i8:$A)),
978 (COPY_TO_REGCLASS $A, VSRC)>;
979
Hal Finkel9e0baa62014-04-01 19:24:27 +0000980def : Pat<(v4f32 (bitconvert v2f64:$A)),
981 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000982def : Pat<(v4i32 (bitconvert v2f64:$A)),
983 (COPY_TO_REGCLASS $A, VRRC)>;
984def : Pat<(v8i16 (bitconvert v2f64:$A)),
985 (COPY_TO_REGCLASS $A, VRRC)>;
986def : Pat<(v16i8 (bitconvert v2f64:$A)),
987 (COPY_TO_REGCLASS $A, VRRC)>;
988
Hal Finkel9e0baa62014-04-01 19:24:27 +0000989def : Pat<(v2i64 (bitconvert v4f32:$A)),
990 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +0000991def : Pat<(v2i64 (bitconvert v4i32:$A)),
992 (COPY_TO_REGCLASS $A, VSRC)>;
993def : Pat<(v2i64 (bitconvert v8i16:$A)),
994 (COPY_TO_REGCLASS $A, VSRC)>;
995def : Pat<(v2i64 (bitconvert v16i8:$A)),
996 (COPY_TO_REGCLASS $A, VSRC)>;
997
Hal Finkel9e0baa62014-04-01 19:24:27 +0000998def : Pat<(v4f32 (bitconvert v2i64:$A)),
999 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +00001000def : Pat<(v4i32 (bitconvert v2i64:$A)),
1001 (COPY_TO_REGCLASS $A, VRRC)>;
1002def : Pat<(v8i16 (bitconvert v2i64:$A)),
1003 (COPY_TO_REGCLASS $A, VRRC)>;
1004def : Pat<(v16i8 (bitconvert v2i64:$A)),
1005 (COPY_TO_REGCLASS $A, VRRC)>;
1006
Hal Finkel9281c9a2014-03-26 18:26:30 +00001007def : Pat<(v2f64 (bitconvert v2i64:$A)),
1008 (COPY_TO_REGCLASS $A, VRRC)>;
1009def : Pat<(v2i64 (bitconvert v2f64:$A)),
1010 (COPY_TO_REGCLASS $A, VRRC)>;
1011
Kit Bartond4eb73c2015-05-05 16:10:44 +00001012def : Pat<(v2f64 (bitconvert v1i128:$A)),
1013 (COPY_TO_REGCLASS $A, VRRC)>;
1014def : Pat<(v1i128 (bitconvert v2f64:$A)),
1015 (COPY_TO_REGCLASS $A, VRRC)>;
1016
Hal Finkel5c0d1452014-03-30 13:22:59 +00001017// sign extension patterns
1018// To extend "in place" from v2i32 to v2i64, we have input data like:
1019// | undef | i32 | undef | i32 |
1020// but xvcvsxwdp expects the input in big-Endian format:
1021// | i32 | undef | i32 | undef |
1022// so we need to shift everything to the left by one i32 (word) before
1023// the conversion.
1024def : Pat<(sext_inreg v2i64:$C, v2i32),
1025 (XVCVDPSXDS (XVCVSXWDP (XXSLDWI $C, $C, 1)))>;
1026def : Pat<(v2f64 (sint_to_fp (sext_inreg v2i64:$C, v2i32))),
1027 (XVCVSXWDP (XXSLDWI $C, $C, 1))>;
1028
Nemanja Ivanovic44513e52016-07-05 09:22:29 +00001029def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 0)),
1030 (v2f64 (XVCVSXWDP (v2i64 (XXMRGHW $C, $C))))>;
1031def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 1)),
1032 (v2f64 (XVCVSXWDP (v2i64 (XXMRGLW $C, $C))))>;
1033
1034def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 0)),
1035 (v2f64 (XVCVUXWDP (v2i64 (XXMRGHW $C, $C))))>;
1036def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 1)),
1037 (v2f64 (XVCVUXWDP (v2i64 (XXMRGLW $C, $C))))>;
1038
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001039// Loads.
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001040let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001041 def : Pat<(v2f64 (PPClxvd2x xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001042
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001043 // Stores.
1044 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
1045 (STXVD2X $rS, xoaddr:$dst)>;
Tony Jiang5f850cd2016-11-15 14:25:56 +00001046 def : Pat<(int_ppc_vsx_stxvd2x_be v2f64:$rS, xoaddr:$dst),
1047 (STXVD2X $rS, xoaddr:$dst)>;
1048 def : Pat<(int_ppc_vsx_stxvw4x_be v4i32:$rS, xoaddr:$dst),
1049 (STXVW4X $rS, xoaddr:$dst)>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001050 def : Pat<(PPCstxvd2x v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1051}
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001052let Predicates = [IsBigEndian, HasVSX, HasOnlySwappingMemOps] in {
1053 def : Pat<(v2f64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1054 def : Pat<(v2i64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1055 def : Pat<(v4i32 (load xoaddr:$src)), (LXVW4X xoaddr:$src)>;
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +00001056 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x xoaddr:$src)), (LXVW4X xoaddr:$src)>;
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001057 def : Pat<(store v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1058 def : Pat<(store v2i64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +00001059 def : Pat<(store v4i32:$XT, xoaddr:$dst), (STXVW4X $XT, xoaddr:$dst)>;
1060 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
1061 (STXVW4X $rS, xoaddr:$dst)>;
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001062}
Bill Schmidtfae5d712014-12-09 16:35:51 +00001063
1064// Permutes.
1065def : Pat<(v2f64 (PPCxxswapd v2f64:$src)), (XXPERMDI $src, $src, 2)>;
1066def : Pat<(v2i64 (PPCxxswapd v2i64:$src)), (XXPERMDI $src, $src, 2)>;
1067def : Pat<(v4f32 (PPCxxswapd v4f32:$src)), (XXPERMDI $src, $src, 2)>;
1068def : Pat<(v4i32 (PPCxxswapd v4i32:$src)), (XXPERMDI $src, $src, 2)>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001069def : Pat<(v2f64 (PPCswapNoChain v2f64:$src)), (XXPERMDI $src, $src, 2)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001070
Tony Jiang0a429f02017-05-24 23:48:29 +00001071// PPCvecshl XT, XA, XA, 2 can be selected to both XXSLDWI XT,XA,XA,2 and
1072// XXSWAPD XT,XA (i.e. XXPERMDI XT,XA,XA,2), the later one is more profitable.
1073def : Pat<(v4i32 (PPCvecshl v4i32:$src, v4i32:$src, 2)), (XXPERMDI $src, $src, 2)>;
1074
Bill Schmidt61e65232014-10-22 13:13:40 +00001075// Selects.
1076def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001077 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1078def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001079 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1080def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001081 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1082def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001083 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1084def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETEQ)),
1085 (SELECT_VSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1086def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001087 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1088def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001089 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1090def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001091 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1092def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001093 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1094def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETNE)),
1095 (SELECT_VSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1096
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001097def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001098 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1099def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001100 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1101def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001102 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1103def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001104 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1105def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETEQ)),
1106 (SELECT_VSFRC (CREQV $lhs, $rhs), $tval, $fval)>;
1107def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001108 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1109def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001110 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1111def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001112 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1113def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001114 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1115def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETNE)),
1116 (SELECT_VSFRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1117
Bill Schmidt76746922014-11-14 12:10:40 +00001118// Divides.
1119def : Pat<(int_ppc_vsx_xvdivsp v4f32:$A, v4f32:$B),
1120 (XVDIVSP $A, $B)>;
1121def : Pat<(int_ppc_vsx_xvdivdp v2f64:$A, v2f64:$B),
1122 (XVDIVDP $A, $B)>;
1123
Nemanja Ivanovic984a3612015-07-14 17:25:20 +00001124// Reciprocal estimate
1125def : Pat<(int_ppc_vsx_xvresp v4f32:$A),
1126 (XVRESP $A)>;
1127def : Pat<(int_ppc_vsx_xvredp v2f64:$A),
1128 (XVREDP $A)>;
1129
Nemanja Ivanovicd358b8f2015-07-05 06:03:51 +00001130// Recip. square root estimate
1131def : Pat<(int_ppc_vsx_xvrsqrtesp v4f32:$A),
1132 (XVRSQRTESP $A)>;
1133def : Pat<(int_ppc_vsx_xvrsqrtedp v2f64:$A),
1134 (XVRSQRTEDP $A)>;
1135
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001136let Predicates = [IsLittleEndian] in {
1137def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1138 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1139def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1140 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1141def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1142 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1143def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1144 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1145} // IsLittleEndian
1146
1147let Predicates = [IsBigEndian] in {
1148def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1149 (f64 (XSCVSXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1150def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1151 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1152def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1153 (f64 (XSCVUXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1154def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1155 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1156} // IsBigEndian
1157
Hal Finkel27774d92014-03-13 07:58:58 +00001158} // AddedComplexity
1159} // HasVSX
1160
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001161def ScalarLoads {
1162 dag Li8 = (i32 (extloadi8 xoaddr:$src));
1163 dag ZELi8 = (i32 (zextloadi8 xoaddr:$src));
1164 dag ZELi8i64 = (i64 (zextloadi8 xoaddr:$src));
1165 dag SELi8 = (i32 (sext_inreg (extloadi8 xoaddr:$src), i8));
1166 dag SELi8i64 = (i64 (sext_inreg (extloadi8 xoaddr:$src), i8));
1167
1168 dag Li16 = (i32 (extloadi16 xoaddr:$src));
1169 dag ZELi16 = (i32 (zextloadi16 xoaddr:$src));
1170 dag ZELi16i64 = (i64 (zextloadi16 xoaddr:$src));
1171 dag SELi16 = (i32 (sextloadi16 xoaddr:$src));
1172 dag SELi16i64 = (i64 (sextloadi16 xoaddr:$src));
1173
1174 dag Li32 = (i32 (load xoaddr:$src));
1175}
1176
Kit Barton298beb52015-02-18 16:21:46 +00001177// The following VSX instructions were introduced in Power ISA 2.07
1178/* FIXME: if the operands are v2i64, these patterns will not match.
1179 we should define new patterns or otherwise match the same patterns
1180 when the elements are larger than i32.
1181*/
1182def HasP8Vector : Predicate<"PPCSubTarget->hasP8Vector()">;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001183def HasDirectMove : Predicate<"PPCSubTarget->hasDirectMove()">;
Kit Barton298beb52015-02-18 16:21:46 +00001184let Predicates = [HasP8Vector] in {
1185let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001186 let isCommutable = 1, UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001187 def XXLEQV : XX3Form<60, 186,
1188 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1189 "xxleqv $XT, $XA, $XB", IIC_VecGeneral,
1190 [(set v4i32:$XT, (vnot_ppc (xor v4i32:$XA, v4i32:$XB)))]>;
1191 def XXLNAND : XX3Form<60, 178,
1192 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1193 "xxlnand $XT, $XA, $XB", IIC_VecGeneral,
1194 [(set v4i32:$XT, (vnot_ppc (and v4i32:$XA,
Kit Barton298beb52015-02-18 16:21:46 +00001195 v4i32:$XB)))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001196 } // isCommutable, UseVSXReg
Nemanja Ivanovicd9e4b4f2015-07-10 14:25:17 +00001197
Nemanja Ivanovic5655fb32015-07-10 12:38:08 +00001198 def : Pat<(int_ppc_vsx_xxleqv v4i32:$A, v4i32:$B),
1199 (XXLEQV $A, $B)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001200
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001201 let UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001202 def XXLORC : XX3Form<60, 170,
1203 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1204 "xxlorc $XT, $XA, $XB", IIC_VecGeneral,
1205 [(set v4i32:$XT, (or v4i32:$XA, (vnot_ppc v4i32:$XB)))]>;
1206
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001207 // VSX scalar loads introduced in ISA 2.07
Sean Fertile3c8c3852017-01-26 18:59:15 +00001208 let mayLoad = 1, mayStore = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001209 let CodeSize = 3 in
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001210 def LXSSPX : XX1Form<31, 524, (outs vssrc:$XT), (ins memrr:$src),
1211 "lxsspx $XT, $src", IIC_LdStLFD,
1212 [(set f32:$XT, (load xoaddr:$src))]>;
1213 def LXSIWAX : XX1Form<31, 76, (outs vsfrc:$XT), (ins memrr:$src),
1214 "lxsiwax $XT, $src", IIC_LdStLFD,
1215 [(set f64:$XT, (PPClfiwax xoaddr:$src))]>;
1216 def LXSIWZX : XX1Form<31, 12, (outs vsfrc:$XT), (ins memrr:$src),
1217 "lxsiwzx $XT, $src", IIC_LdStLFD,
1218 [(set f64:$XT, (PPClfiwzx xoaddr:$src))]>;
1219 } // mayLoad
1220
1221 // VSX scalar stores introduced in ISA 2.07
Sean Fertile3c8c3852017-01-26 18:59:15 +00001222 let mayStore = 1, mayLoad = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001223 let CodeSize = 3 in
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001224 def STXSSPX : XX1Form<31, 652, (outs), (ins vssrc:$XT, memrr:$dst),
1225 "stxsspx $XT, $dst", IIC_LdStSTFD,
1226 [(store f32:$XT, xoaddr:$dst)]>;
1227 def STXSIWX : XX1Form<31, 140, (outs), (ins vsfrc:$XT, memrr:$dst),
1228 "stxsiwx $XT, $dst", IIC_LdStSTFD,
1229 [(PPCstfiwx f64:$XT, xoaddr:$dst)]>;
1230 } // mayStore
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001231 } // UseVSXReg = 1
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001232
1233 def : Pat<(f64 (extloadf32 xoaddr:$src)),
1234 (COPY_TO_REGCLASS (LXSSPX xoaddr:$src), VSFRC)>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001235 def : Pat<(f32 (fpround (extloadf32 xoaddr:$src))),
1236 (f32 (LXSSPX xoaddr:$src))>;
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +00001237 def : Pat<(f64 (fpextend f32:$src)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001238 (COPY_TO_REGCLASS $src, VSFRC)>;
Hal Finkela2cdbce2015-08-30 22:12:50 +00001239
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001240 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001241 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1242 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001243 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1244 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001245 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1246 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001247 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1248 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETEQ)),
1249 (SELECT_VSSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1250 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001251 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1252 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001253 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1254 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001255 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1256 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001257 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1258 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETNE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001259 (SELECT_VSSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001260
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001261 let UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001262 // VSX Elementary Scalar FP arithmetic (SP)
1263 let isCommutable = 1 in {
1264 def XSADDSP : XX3Form<60, 0,
1265 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1266 "xsaddsp $XT, $XA, $XB", IIC_VecFP,
1267 [(set f32:$XT, (fadd f32:$XA, f32:$XB))]>;
1268 def XSMULSP : XX3Form<60, 16,
1269 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1270 "xsmulsp $XT, $XA, $XB", IIC_VecFP,
1271 [(set f32:$XT, (fmul f32:$XA, f32:$XB))]>;
1272 } // isCommutable
1273
1274 def XSDIVSP : XX3Form<60, 24,
1275 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1276 "xsdivsp $XT, $XA, $XB", IIC_FPDivS,
1277 [(set f32:$XT, (fdiv f32:$XA, f32:$XB))]>;
1278 def XSRESP : XX2Form<60, 26,
1279 (outs vssrc:$XT), (ins vssrc:$XB),
1280 "xsresp $XT, $XB", IIC_VecFP,
1281 [(set f32:$XT, (PPCfre f32:$XB))]>;
1282 def XSSQRTSP : XX2Form<60, 11,
1283 (outs vssrc:$XT), (ins vssrc:$XB),
1284 "xssqrtsp $XT, $XB", IIC_FPSqrtS,
1285 [(set f32:$XT, (fsqrt f32:$XB))]>;
1286 def XSRSQRTESP : XX2Form<60, 10,
1287 (outs vssrc:$XT), (ins vssrc:$XB),
1288 "xsrsqrtesp $XT, $XB", IIC_VecFP,
1289 [(set f32:$XT, (PPCfrsqrte f32:$XB))]>;
1290 def XSSUBSP : XX3Form<60, 8,
1291 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1292 "xssubsp $XT, $XA, $XB", IIC_VecFP,
1293 [(set f32:$XT, (fsub f32:$XA, f32:$XB))]>;
Nemanja Ivanovic376e1732015-05-29 17:13:25 +00001294
1295 // FMA Instructions
1296 let BaseName = "XSMADDASP" in {
1297 let isCommutable = 1 in
1298 def XSMADDASP : XX3Form<60, 1,
1299 (outs vssrc:$XT),
1300 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1301 "xsmaddasp $XT, $XA, $XB", IIC_VecFP,
1302 [(set f32:$XT, (fma f32:$XA, f32:$XB, f32:$XTi))]>,
1303 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1304 AltVSXFMARel;
1305 let IsVSXFMAAlt = 1 in
1306 def XSMADDMSP : XX3Form<60, 9,
1307 (outs vssrc:$XT),
1308 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1309 "xsmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1310 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1311 AltVSXFMARel;
1312 }
1313
1314 let BaseName = "XSMSUBASP" in {
1315 let isCommutable = 1 in
1316 def XSMSUBASP : XX3Form<60, 17,
1317 (outs vssrc:$XT),
1318 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1319 "xsmsubasp $XT, $XA, $XB", IIC_VecFP,
1320 [(set f32:$XT, (fma f32:$XA, f32:$XB,
1321 (fneg f32:$XTi)))]>,
1322 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1323 AltVSXFMARel;
1324 let IsVSXFMAAlt = 1 in
1325 def XSMSUBMSP : XX3Form<60, 25,
1326 (outs vssrc:$XT),
1327 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1328 "xsmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1329 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1330 AltVSXFMARel;
1331 }
1332
1333 let BaseName = "XSNMADDASP" in {
1334 let isCommutable = 1 in
1335 def XSNMADDASP : XX3Form<60, 129,
1336 (outs vssrc:$XT),
1337 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1338 "xsnmaddasp $XT, $XA, $XB", IIC_VecFP,
1339 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1340 f32:$XTi)))]>,
1341 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1342 AltVSXFMARel;
1343 let IsVSXFMAAlt = 1 in
1344 def XSNMADDMSP : XX3Form<60, 137,
1345 (outs vssrc:$XT),
1346 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1347 "xsnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1348 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1349 AltVSXFMARel;
1350 }
1351
1352 let BaseName = "XSNMSUBASP" in {
1353 let isCommutable = 1 in
1354 def XSNMSUBASP : XX3Form<60, 145,
1355 (outs vssrc:$XT),
1356 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1357 "xsnmsubasp $XT, $XA, $XB", IIC_VecFP,
1358 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1359 (fneg f32:$XTi))))]>,
1360 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1361 AltVSXFMARel;
1362 let IsVSXFMAAlt = 1 in
1363 def XSNMSUBMSP : XX3Form<60, 153,
1364 (outs vssrc:$XT),
1365 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1366 "xsnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1367 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1368 AltVSXFMARel;
1369 }
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001370
1371 // Single Precision Conversions (FP <-> INT)
1372 def XSCVSXDSP : XX2Form<60, 312,
1373 (outs vssrc:$XT), (ins vsfrc:$XB),
1374 "xscvsxdsp $XT, $XB", IIC_VecFP,
1375 [(set f32:$XT, (PPCfcfids f64:$XB))]>;
1376 def XSCVUXDSP : XX2Form<60, 296,
1377 (outs vssrc:$XT), (ins vsfrc:$XB),
1378 "xscvuxdsp $XT, $XB", IIC_VecFP,
1379 [(set f32:$XT, (PPCfcfidus f64:$XB))]>;
1380
1381 // Conversions between vector and scalar single precision
1382 def XSCVDPSPN : XX2Form<60, 267, (outs vsrc:$XT), (ins vssrc:$XB),
1383 "xscvdpspn $XT, $XB", IIC_VecFP, []>;
1384 def XSCVSPDPN : XX2Form<60, 331, (outs vssrc:$XT), (ins vsrc:$XB),
1385 "xscvspdpn $XT, $XB", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001386 } // UseVSXReg = 1
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001387
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001388 let Predicates = [IsLittleEndian] in {
1389 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1390 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1391 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1392 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1393 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1394 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1395 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1396 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1397 }
1398
1399 let Predicates = [IsBigEndian] in {
1400 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1401 (f32 (XSCVSXDSP (COPY_TO_REGCLASS $S, VSFRC)))>;
1402 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1403 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1404 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1405 (f32 (XSCVUXDSP (COPY_TO_REGCLASS $S, VSFRC)))>;
1406 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1407 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1408 }
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001409 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.Li32)),
1410 (v4i32 (XXSPLTWs (LXSIWAX xoaddr:$src), 1))>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001411} // AddedComplexity = 400
Kit Barton298beb52015-02-18 16:21:46 +00001412} // HasP8Vector
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001413
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001414let UseVSXReg = 1, AddedComplexity = 400 in {
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001415let Predicates = [HasDirectMove] in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001416 // VSX direct move instructions
1417 def MFVSRD : XX1_RS6_RD5_XO<31, 51, (outs g8rc:$rA), (ins vsfrc:$XT),
1418 "mfvsrd $rA, $XT", IIC_VecGeneral,
1419 [(set i64:$rA, (PPCmfvsr f64:$XT))]>,
1420 Requires<[In64BitMode]>;
Nemanja Ivanovicffcf0fb2017-03-15 16:04:53 +00001421 let isCodeGenOnly = 1 in
1422 def MFVRD : XX1_RS6_RD5_XO<31, 51, (outs g8rc:$rA), (ins vrrc:$XT),
1423 "mfvsrd $rA, $XT", IIC_VecGeneral,
1424 []>,
1425 Requires<[In64BitMode]>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001426 def MFVSRWZ : XX1_RS6_RD5_XO<31, 115, (outs gprc:$rA), (ins vsfrc:$XT),
1427 "mfvsrwz $rA, $XT", IIC_VecGeneral,
1428 [(set i32:$rA, (PPCmfvsr f64:$XT))]>;
1429 def MTVSRD : XX1_RS6_RD5_XO<31, 179, (outs vsfrc:$XT), (ins g8rc:$rA),
1430 "mtvsrd $XT, $rA", IIC_VecGeneral,
1431 [(set f64:$XT, (PPCmtvsra i64:$rA))]>,
1432 Requires<[In64BitMode]>;
1433 def MTVSRWA : XX1_RS6_RD5_XO<31, 211, (outs vsfrc:$XT), (ins gprc:$rA),
1434 "mtvsrwa $XT, $rA", IIC_VecGeneral,
1435 [(set f64:$XT, (PPCmtvsra i32:$rA))]>;
1436 def MTVSRWZ : XX1_RS6_RD5_XO<31, 243, (outs vsfrc:$XT), (ins gprc:$rA),
1437 "mtvsrwz $XT, $rA", IIC_VecGeneral,
1438 [(set f64:$XT, (PPCmtvsrz i32:$rA))]>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001439} // HasDirectMove
1440
1441let Predicates = [IsISA3_0, HasDirectMove] in {
1442 def MTVSRWS: XX1_RS6_RD5_XO<31, 403, (outs vsrc:$XT), (ins gprc:$rA),
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00001443 "mtvsrws $XT, $rA", IIC_VecGeneral, []>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001444
Guozhi Wei22e7da92017-05-11 22:17:35 +00001445 def MTVSRDD: XX1Form<31, 435, (outs vsrc:$XT), (ins g8rc_nox0:$rA, g8rc:$rB),
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001446 "mtvsrdd $XT, $rA, $rB", IIC_VecGeneral,
1447 []>, Requires<[In64BitMode]>;
1448
1449 def MFVSRLD: XX1_RS6_RD5_XO<31, 307, (outs g8rc:$rA), (ins vsrc:$XT),
1450 "mfvsrld $rA, $XT", IIC_VecGeneral,
1451 []>, Requires<[In64BitMode]>;
1452
1453} // IsISA3_0, HasDirectMove
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001454} // UseVSXReg = 1
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001455
Nemanja Ivanovicffcf0fb2017-03-15 16:04:53 +00001456// We want to parse this from asm, but we don't want to emit this as it would
1457// be emitted with a VSX reg. So leave Emit = 0 here.
1458def : InstAlias<"mfvrd $rA, $XT",
1459 (MFVRD g8rc:$rA, vrrc:$XT), 0>;
1460def : InstAlias<"mffprd $rA, $src",
1461 (MFVSRD g8rc:$rA, f8rc:$src)>;
1462
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001463/* Direct moves of various widths from GPR's into VSR's. Each move lines
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001464 the value up into element 0 (both BE and LE). Namely, entities smaller than
1465 a doubleword are shifted left and moved for BE. For LE, they're moved, then
1466 swapped to go into the least significant element of the VSR.
1467*/
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001468def MovesToVSR {
1469 dag BE_BYTE_0 =
1470 (MTVSRD
1471 (RLDICR
1472 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 56, 7));
1473 dag BE_HALF_0 =
1474 (MTVSRD
1475 (RLDICR
1476 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 48, 15));
1477 dag BE_WORD_0 =
1478 (MTVSRD
1479 (RLDICR
1480 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 32, 31));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001481 dag BE_DWORD_0 = (MTVSRD $A);
1482
1483 dag LE_MTVSRW = (MTVSRD (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001484 dag LE_WORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1485 LE_MTVSRW, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001486 dag LE_WORD_0 = (XXPERMDI LE_WORD_1, LE_WORD_1, 2);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001487 dag LE_DWORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1488 BE_DWORD_0, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001489 dag LE_DWORD_0 = (XXPERMDI LE_DWORD_1, LE_DWORD_1, 2);
1490}
1491
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001492/* Patterns for extracting elements out of vectors. Integer elements are
1493 extracted using direct move operations. Patterns for extracting elements
1494 whose indices are not available at compile time are also provided with
1495 various _VARIABLE_ patterns.
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001496 The numbering for the DAG's is for LE, but when used on BE, the correct
1497 LE element can just be used (i.e. LE_BYTE_2 == BE_BYTE_13).
1498*/
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001499def VectorExtractions {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001500 // Doubleword extraction
1501 dag LE_DWORD_0 =
1502 (MFVSRD
1503 (EXTRACT_SUBREG
1504 (XXPERMDI (COPY_TO_REGCLASS $S, VSRC),
1505 (COPY_TO_REGCLASS $S, VSRC), 2), sub_64));
1506 dag LE_DWORD_1 = (MFVSRD
1507 (EXTRACT_SUBREG
1508 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1509
1510 // Word extraction
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001511 dag LE_WORD_0 = (MFVSRWZ (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001512 dag LE_WORD_1 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 1), sub_64));
1513 dag LE_WORD_2 = (MFVSRWZ (EXTRACT_SUBREG
1514 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1515 dag LE_WORD_3 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 3), sub_64));
1516
1517 // Halfword extraction
1518 dag LE_HALF_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 48), sub_32));
1519 dag LE_HALF_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 48), sub_32));
1520 dag LE_HALF_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 48), sub_32));
1521 dag LE_HALF_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 48), sub_32));
1522 dag LE_HALF_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 48), sub_32));
1523 dag LE_HALF_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 48), sub_32));
1524 dag LE_HALF_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 48), sub_32));
1525 dag LE_HALF_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 48), sub_32));
1526
1527 // Byte extraction
1528 dag LE_BYTE_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 56), sub_32));
1529 dag LE_BYTE_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 56, 56), sub_32));
1530 dag LE_BYTE_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 56), sub_32));
1531 dag LE_BYTE_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 40, 56), sub_32));
1532 dag LE_BYTE_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 56), sub_32));
1533 dag LE_BYTE_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 24, 56), sub_32));
1534 dag LE_BYTE_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 56), sub_32));
1535 dag LE_BYTE_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 8, 56), sub_32));
1536 dag LE_BYTE_8 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 56), sub_32));
1537 dag LE_BYTE_9 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 56, 56), sub_32));
1538 dag LE_BYTE_10 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 56), sub_32));
1539 dag LE_BYTE_11 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 40, 56), sub_32));
1540 dag LE_BYTE_12 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 56), sub_32));
1541 dag LE_BYTE_13 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 24, 56), sub_32));
1542 dag LE_BYTE_14 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 56), sub_32));
1543 dag LE_BYTE_15 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 8, 56), sub_32));
1544
1545 /* Variable element number (BE and LE patterns must be specified separately)
1546 This is a rather involved process.
1547
1548 Conceptually, this is how the move is accomplished:
1549 1. Identify which doubleword contains the element
1550 2. Shift in the VMX register so that the correct doubleword is correctly
1551 lined up for the MFVSRD
1552 3. Perform the move so that the element (along with some extra stuff)
1553 is in the GPR
1554 4. Right shift within the GPR so that the element is right-justified
1555
1556 Of course, the index is an element number which has a different meaning
1557 on LE/BE so the patterns have to be specified separately.
1558
1559 Note: The final result will be the element right-justified with high
1560 order bits being arbitrarily defined (namely, whatever was in the
1561 vector register to the left of the value originally).
1562 */
1563
1564 /* LE variable byte
1565 Number 1. above:
1566 - For elements 0-7, we shift left by 8 bytes since they're on the right
1567 - For elements 8-15, we need not shift (shift left by zero bytes)
1568 This is accomplished by inverting the bits of the index and AND-ing
1569 with 0x8 (i.e. clearing all bits of the index and inverting bit 60).
1570 */
1571 dag LE_VBYTE_PERM_VEC = (LVSL ZERO8, (ANDC8 (LI8 8), $Idx));
1572
1573 // Number 2. above:
1574 // - Now that we set up the shift amount, we shift in the VMX register
1575 dag LE_VBYTE_PERMUTE = (VPERM $S, $S, LE_VBYTE_PERM_VEC);
1576
1577 // Number 3. above:
1578 // - The doubleword containing our element is moved to a GPR
1579 dag LE_MV_VBYTE = (MFVSRD
1580 (EXTRACT_SUBREG
1581 (v2i64 (COPY_TO_REGCLASS LE_VBYTE_PERMUTE, VSRC)),
1582 sub_64));
1583
1584 /* Number 4. above:
1585 - Truncate the element number to the range 0-7 (8-15 are symmetrical
1586 and out of range values are truncated accordingly)
1587 - Multiply by 8 as we need to shift right by the number of bits, not bytes
1588 - Shift right in the GPR by the calculated value
1589 */
1590 dag LE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 7), $Idx), 3, 60),
1591 sub_32);
1592 dag LE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD LE_MV_VBYTE, LE_VBYTE_SHIFT),
1593 sub_32);
1594
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001595 /* LE variable halfword
1596 Number 1. above:
1597 - For elements 0-3, we shift left by 8 since they're on the right
1598 - For elements 4-7, we need not shift (shift left by zero bytes)
1599 Similarly to the byte pattern, we invert the bits of the index, but we
1600 AND with 0x4 (i.e. clear all bits of the index and invert bit 61).
1601 Of course, the shift is still by 8 bytes, so we must multiply by 2.
1602 */
1603 dag LE_VHALF_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 4), $Idx), 1, 62));
1604
1605 // Number 2. above:
1606 // - Now that we set up the shift amount, we shift in the VMX register
1607 dag LE_VHALF_PERMUTE = (VPERM $S, $S, LE_VHALF_PERM_VEC);
1608
1609 // Number 3. above:
1610 // - The doubleword containing our element is moved to a GPR
1611 dag LE_MV_VHALF = (MFVSRD
1612 (EXTRACT_SUBREG
1613 (v2i64 (COPY_TO_REGCLASS LE_VHALF_PERMUTE, VSRC)),
1614 sub_64));
1615
1616 /* Number 4. above:
1617 - Truncate the element number to the range 0-3 (4-7 are symmetrical
1618 and out of range values are truncated accordingly)
1619 - Multiply by 16 as we need to shift right by the number of bits
1620 - Shift right in the GPR by the calculated value
1621 */
1622 dag LE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 3), $Idx), 4, 59),
1623 sub_32);
1624 dag LE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD LE_MV_VHALF, LE_VHALF_SHIFT),
1625 sub_32);
1626
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001627 /* LE variable word
1628 Number 1. above:
1629 - For elements 0-1, we shift left by 8 since they're on the right
1630 - For elements 2-3, we need not shift
1631 */
1632 dag LE_VWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 2), $Idx), 2, 61));
1633
1634 // Number 2. above:
1635 // - Now that we set up the shift amount, we shift in the VMX register
1636 dag LE_VWORD_PERMUTE = (VPERM $S, $S, LE_VWORD_PERM_VEC);
1637
1638 // Number 3. above:
1639 // - The doubleword containing our element is moved to a GPR
1640 dag LE_MV_VWORD = (MFVSRD
1641 (EXTRACT_SUBREG
1642 (v2i64 (COPY_TO_REGCLASS LE_VWORD_PERMUTE, VSRC)),
1643 sub_64));
1644
1645 /* Number 4. above:
1646 - Truncate the element number to the range 0-1 (2-3 are symmetrical
1647 and out of range values are truncated accordingly)
1648 - Multiply by 32 as we need to shift right by the number of bits
1649 - Shift right in the GPR by the calculated value
1650 */
1651 dag LE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 1), $Idx), 5, 58),
1652 sub_32);
1653 dag LE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD LE_MV_VWORD, LE_VWORD_SHIFT),
1654 sub_32);
1655
1656 /* LE variable doubleword
1657 Number 1. above:
1658 - For element 0, we shift left by 8 since it's on the right
1659 - For element 1, we need not shift
1660 */
1661 dag LE_VDWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 1), $Idx), 3, 60));
1662
1663 // Number 2. above:
1664 // - Now that we set up the shift amount, we shift in the VMX register
1665 dag LE_VDWORD_PERMUTE = (VPERM $S, $S, LE_VDWORD_PERM_VEC);
1666
1667 // Number 3. above:
1668 // - The doubleword containing our element is moved to a GPR
1669 // - Number 4. is not needed for the doubleword as the value is 64-bits
1670 dag LE_VARIABLE_DWORD =
1671 (MFVSRD (EXTRACT_SUBREG
1672 (v2i64 (COPY_TO_REGCLASS LE_VDWORD_PERMUTE, VSRC)),
1673 sub_64));
1674
1675 /* LE variable float
1676 - Shift the vector to line up the desired element to BE Word 0
1677 - Convert 32-bit float to a 64-bit single precision float
1678 */
1679 dag LE_VFLOAT_PERM_VEC = (LVSL ZERO8, (RLDICR (XOR8 (LI8 3), $Idx), 2, 61));
1680 dag LE_VFLOAT_PERMUTE = (VPERM $S, $S, LE_VFLOAT_PERM_VEC);
1681 dag LE_VARIABLE_FLOAT = (XSCVSPDPN LE_VFLOAT_PERMUTE);
1682
1683 /* LE variable double
1684 Same as the LE doubleword except there is no move.
1685 */
1686 dag LE_VDOUBLE_PERMUTE = (VPERM (COPY_TO_REGCLASS $S, VRRC),
1687 (COPY_TO_REGCLASS $S, VRRC),
1688 LE_VDWORD_PERM_VEC);
1689 dag LE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS LE_VDOUBLE_PERMUTE, VSRC);
1690
1691 /* BE variable byte
1692 The algorithm here is the same as the LE variable byte except:
1693 - The shift in the VMX register is by 0/8 for opposite element numbers so
1694 we simply AND the element number with 0x8
1695 - The order of elements after the move to GPR is reversed, so we invert
1696 the bits of the index prior to truncating to the range 0-7
1697 */
1698 dag BE_VBYTE_PERM_VEC = (LVSL ZERO8, (ANDIo8 $Idx, 8));
1699 dag BE_VBYTE_PERMUTE = (VPERM $S, $S, BE_VBYTE_PERM_VEC);
1700 dag BE_MV_VBYTE = (MFVSRD
1701 (EXTRACT_SUBREG
1702 (v2i64 (COPY_TO_REGCLASS BE_VBYTE_PERMUTE, VSRC)),
1703 sub_64));
1704 dag BE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 7), $Idx), 3, 60),
1705 sub_32);
1706 dag BE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD BE_MV_VBYTE, BE_VBYTE_SHIFT),
1707 sub_32);
1708
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001709 /* BE variable halfword
1710 The algorithm here is the same as the LE variable halfword except:
1711 - The shift in the VMX register is by 0/8 for opposite element numbers so
1712 we simply AND the element number with 0x4 and multiply by 2
1713 - The order of elements after the move to GPR is reversed, so we invert
1714 the bits of the index prior to truncating to the range 0-3
1715 */
1716 dag BE_VHALF_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 4), 1, 62));
1717 dag BE_VHALF_PERMUTE = (VPERM $S, $S, BE_VHALF_PERM_VEC);
1718 dag BE_MV_VHALF = (MFVSRD
1719 (EXTRACT_SUBREG
1720 (v2i64 (COPY_TO_REGCLASS BE_VHALF_PERMUTE, VSRC)),
1721 sub_64));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001722 dag BE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 3), $Idx), 4, 59),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001723 sub_32);
1724 dag BE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD BE_MV_VHALF, BE_VHALF_SHIFT),
1725 sub_32);
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001726
1727 /* BE variable word
1728 The algorithm is the same as the LE variable word except:
1729 - The shift in the VMX register happens for opposite element numbers
1730 - The order of elements after the move to GPR is reversed, so we invert
1731 the bits of the index prior to truncating to the range 0-1
1732 */
1733 dag BE_VWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 2), 2, 61));
1734 dag BE_VWORD_PERMUTE = (VPERM $S, $S, BE_VWORD_PERM_VEC);
1735 dag BE_MV_VWORD = (MFVSRD
1736 (EXTRACT_SUBREG
1737 (v2i64 (COPY_TO_REGCLASS BE_VWORD_PERMUTE, VSRC)),
1738 sub_64));
1739 dag BE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 1), $Idx), 5, 58),
1740 sub_32);
1741 dag BE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD BE_MV_VWORD, BE_VWORD_SHIFT),
1742 sub_32);
1743
1744 /* BE variable doubleword
1745 Same as the LE doubleword except we shift in the VMX register for opposite
1746 element indices.
1747 */
1748 dag BE_VDWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 1), 3, 60));
1749 dag BE_VDWORD_PERMUTE = (VPERM $S, $S, BE_VDWORD_PERM_VEC);
1750 dag BE_VARIABLE_DWORD =
1751 (MFVSRD (EXTRACT_SUBREG
1752 (v2i64 (COPY_TO_REGCLASS BE_VDWORD_PERMUTE, VSRC)),
1753 sub_64));
1754
1755 /* BE variable float
1756 - Shift the vector to line up the desired element to BE Word 0
1757 - Convert 32-bit float to a 64-bit single precision float
1758 */
1759 dag BE_VFLOAT_PERM_VEC = (LVSL ZERO8, (RLDICR $Idx, 2, 61));
1760 dag BE_VFLOAT_PERMUTE = (VPERM $S, $S, BE_VFLOAT_PERM_VEC);
1761 dag BE_VARIABLE_FLOAT = (XSCVSPDPN BE_VFLOAT_PERMUTE);
1762
1763 /* BE variable double
1764 Same as the BE doubleword except there is no move.
1765 */
1766 dag BE_VDOUBLE_PERMUTE = (VPERM (COPY_TO_REGCLASS $S, VRRC),
1767 (COPY_TO_REGCLASS $S, VRRC),
1768 BE_VDWORD_PERM_VEC);
1769 dag BE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS BE_VDOUBLE_PERMUTE, VSRC);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001770}
1771
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001772let AddedComplexity = 400 in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001773// v4f32 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001774let Predicates = [IsBigEndian, HasP8Vector] in {
1775 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1776 (v4f32 (XSCVDPSPN $A))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001777 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1778 (f32 (XSCVSPDPN $S))>;
1779 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
1780 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
1781 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001782 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001783 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
1784 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001785 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
1786 (f32 VectorExtractions.BE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001787} // IsBigEndian, HasP8Vector
1788
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001789// Variable index vector_extract for v2f64 does not require P8Vector
1790let Predicates = [IsBigEndian, HasVSX] in
1791 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
1792 (f64 VectorExtractions.BE_VARIABLE_DOUBLE)>;
1793
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001794let Predicates = [IsBigEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001795 // v16i8 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001796 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001797 (v16i8 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_BYTE_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001798 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001799 (v8i16 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_HALF_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001800 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001801 (v4i32 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_WORD_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001802 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001803 (v2i64 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_DWORD_0, sub_64))>;
1804 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001805 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001806 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001807 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001808 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001809 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001810 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001811 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001812 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001813 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001814 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001815 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001816 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001817 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001818 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001819 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001820 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001821 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001822 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001823 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001824 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001825 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001826 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001827 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001828 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001829 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001830 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001831 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001832 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001833 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001834 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001835 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001836 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001837 (i32 VectorExtractions.BE_VARIABLE_BYTE)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001838
1839 // v8i16 scalar <-> vector conversions (BE)
1840 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001841 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001842 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001843 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001844 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001845 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001846 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001847 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001848 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001849 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001850 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001851 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001852 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001853 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001854 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001855 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001856 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001857 (i32 VectorExtractions.BE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001858
1859 // v4i32 scalar <-> vector conversions (BE)
1860 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001861 (i32 VectorExtractions.LE_WORD_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001862 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001863 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001864 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001865 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001866 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001867 (i32 VectorExtractions.LE_WORD_0)>;
1868 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
1869 (i32 VectorExtractions.BE_VARIABLE_WORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001870
1871 // v2i64 scalar <-> vector conversions (BE)
1872 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001873 (i64 VectorExtractions.LE_DWORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001874 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001875 (i64 VectorExtractions.LE_DWORD_0)>;
1876 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
1877 (i64 VectorExtractions.BE_VARIABLE_DWORD)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001878} // IsBigEndian, HasDirectMove
1879
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001880// v4f32 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001881let Predicates = [IsLittleEndian, HasP8Vector] in {
1882 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1883 (v4f32 (XXSLDWI (XSCVDPSPN $A), (XSCVDPSPN $A), 1))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001884 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1885 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
1886 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001887 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001888 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
1889 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
1890 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
1891 (f32 (XSCVSPDPN $S))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001892 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
1893 (f32 VectorExtractions.LE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001894} // IsLittleEndian, HasP8Vector
1895
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001896// Variable index vector_extract for v2f64 does not require P8Vector
1897let Predicates = [IsLittleEndian, HasVSX] in
1898 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
1899 (f64 VectorExtractions.LE_VARIABLE_DOUBLE)>;
1900
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +00001901def : Pat<(v4i32 (int_ppc_vsx_lxvw4x_be xoaddr:$src)), (LXVW4X xoaddr:$src)>;
1902def : Pat<(v2f64 (int_ppc_vsx_lxvd2x_be xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Tony Jiang5f850cd2016-11-15 14:25:56 +00001903
Tony Jiangaa5a6a12017-07-05 16:55:00 +00001904// Variable index unsigned vector_extract on Power9
1905let Predicates = [HasP9Altivec, IsLittleEndian] in {
1906 def : Pat<(i64 (anyext (i32 (vector_extract v16i8:$S, i64:$Idx)))),
1907 (VEXTUBRX $Idx, $S)>;
1908
1909 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, i64:$Idx)))),
1910 (VEXTUHRX (RLWINM8 $Idx, 1, 28, 30), $S)>;
1911 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 0)))),
1912 (VEXTUHRX (LI8 0), $S)>;
1913 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 1)))),
1914 (VEXTUHRX (LI8 2), $S)>;
1915 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 2)))),
1916 (VEXTUHRX (LI8 4), $S)>;
1917 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 3)))),
1918 (VEXTUHRX (LI8 6), $S)>;
1919 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 4)))),
1920 (VEXTUHRX (LI8 8), $S)>;
1921 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 5)))),
1922 (VEXTUHRX (LI8 10), $S)>;
1923 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 6)))),
1924 (VEXTUHRX (LI8 12), $S)>;
1925 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 7)))),
1926 (VEXTUHRX (LI8 14), $S)>;
1927
1928 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
1929 (VEXTUWRX (RLWINM8 $Idx, 2, 28, 29), $S)>;
1930 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 0)))),
1931 (VEXTUWRX (LI8 0), $S)>;
1932 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 1)))),
1933 (VEXTUWRX (LI8 4), $S)>;
1934 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 2)))),
1935 (VEXTUWRX (LI8 8), $S)>;
1936 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 3)))),
1937 (VEXTUWRX (LI8 12), $S)>;
1938
1939 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
1940 (EXTSW (VEXTUWRX (RLWINM8 $Idx, 2, 28, 29), $S))>;
1941 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 0)))),
1942 (EXTSW (VEXTUWRX (LI8 0), $S))>;
1943 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 1)))),
1944 (EXTSW (VEXTUWRX (LI8 4), $S))>;
1945 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 2)))),
1946 (EXTSW (VEXTUWRX (LI8 8), $S))>;
1947 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 3)))),
1948 (EXTSW (VEXTUWRX (LI8 12), $S))>;
1949}
1950let Predicates = [HasP9Altivec, IsBigEndian] in {
1951 def : Pat<(i64 (anyext (i32 (vector_extract v16i8:$S, i64:$Idx)))),
1952 (VEXTUBLX $Idx, $S)>;
1953
1954 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, i64:$Idx)))),
1955 (VEXTUHLX (RLWINM8 $Idx, 1, 28, 30), $S)>;
1956 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 0)))),
1957 (VEXTUHLX (LI8 0), $S)>;
1958 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 1)))),
1959 (VEXTUHLX (LI8 2), $S)>;
1960 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 2)))),
1961 (VEXTUHLX (LI8 4), $S)>;
1962 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 3)))),
1963 (VEXTUHLX (LI8 6), $S)>;
1964 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 4)))),
1965 (VEXTUHLX (LI8 8), $S)>;
1966 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 5)))),
1967 (VEXTUHLX (LI8 10), $S)>;
1968 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 6)))),
1969 (VEXTUHLX (LI8 12), $S)>;
1970 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 7)))),
1971 (VEXTUHLX (LI8 14), $S)>;
1972
1973 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
1974 (VEXTUWLX (RLWINM8 $Idx, 2, 28, 29), $S)>;
1975 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 0)))),
1976 (VEXTUWLX (LI8 0), $S)>;
1977 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 1)))),
1978 (VEXTUWLX (LI8 4), $S)>;
1979 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 2)))),
1980 (VEXTUWLX (LI8 8), $S)>;
1981 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 3)))),
1982 (VEXTUWLX (LI8 12), $S)>;
1983
1984 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
1985 (EXTSW (VEXTUWLX (RLWINM8 $Idx, 2, 28, 29), $S))>;
1986 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 0)))),
1987 (EXTSW (VEXTUWLX (LI8 0), $S))>;
1988 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 1)))),
1989 (EXTSW (VEXTUWLX (LI8 4), $S))>;
1990 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 2)))),
1991 (EXTSW (VEXTUWLX (LI8 8), $S))>;
1992 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 3)))),
1993 (EXTSW (VEXTUWLX (LI8 12), $S))>;
1994}
1995
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001996let Predicates = [IsLittleEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001997 // v16i8 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001998 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001999 (v16i8 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002000 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002001 (v8i16 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002002 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002003 (v4i32 MovesToVSR.LE_WORD_0)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002004 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002005 (v2i64 MovesToVSR.LE_DWORD_0)>;
2006 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002007 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002008 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002009 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002010 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002011 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002012 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002013 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002014 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002015 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002016 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002017 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002018 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002019 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002020 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002021 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002022 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002023 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002024 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002025 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002026 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002027 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002028 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002029 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002030 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002031 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002032 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002033 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002034 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002035 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002036 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002037 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002038 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002039 (i32 VectorExtractions.LE_VARIABLE_BYTE)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002040
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002041 // v8i16 scalar <-> vector conversions (LE)
2042 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002043 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002044 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002045 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002046 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002047 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002048 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002049 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002050 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002051 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002052 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002053 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002054 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002055 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002056 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002057 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002058 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002059 (i32 VectorExtractions.LE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002060
2061 // v4i32 scalar <-> vector conversions (LE)
2062 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002063 (i32 VectorExtractions.LE_WORD_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002064 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002065 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002066 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002067 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002068 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002069 (i32 VectorExtractions.LE_WORD_3)>;
2070 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
2071 (i32 VectorExtractions.LE_VARIABLE_WORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002072
2073 // v2i64 scalar <-> vector conversions (LE)
2074 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002075 (i64 VectorExtractions.LE_DWORD_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002076 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002077 (i64 VectorExtractions.LE_DWORD_1)>;
2078 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
2079 (i64 VectorExtractions.LE_VARIABLE_DWORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002080} // IsLittleEndian, HasDirectMove
Nemanja Ivanovic89224762015-12-15 14:50:34 +00002081
2082let Predicates = [HasDirectMove, HasVSX] in {
2083// bitconvert f32 -> i32
2084// (convert to 32-bit fp single, shift right 1 word, move to GPR)
2085def : Pat<(i32 (bitconvert f32:$S)),
2086 (i32 (MFVSRWZ (EXTRACT_SUBREG
2087 (XXSLDWI (XSCVDPSPN $S),(XSCVDPSPN $S), 3),
2088 sub_64)))>;
2089// bitconvert i32 -> f32
2090// (move to FPR, shift left 1 word, convert to 64-bit fp single)
2091def : Pat<(f32 (bitconvert i32:$A)),
2092 (f32 (XSCVSPDPN
2093 (XXSLDWI MovesToVSR.LE_WORD_1, MovesToVSR.LE_WORD_1, 1)))>;
2094
2095// bitconvert f64 -> i64
2096// (move to GPR, nothing else needed)
2097def : Pat<(i64 (bitconvert f64:$S)),
2098 (i64 (MFVSRD $S))>;
2099
2100// bitconvert i64 -> f64
2101// (move to FPR, nothing else needed)
2102def : Pat<(f64 (bitconvert i64:$S)),
2103 (f64 (MTVSRD $S))>;
2104}
Kit Barton93612ec2016-02-26 21:11:55 +00002105
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002106// Materialize a zero-vector of long long
2107def : Pat<(v2i64 immAllZerosV),
2108 (v2i64 (XXLXORz))>;
2109}
2110
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002111def AlignValues {
2112 dag F32_TO_BE_WORD1 = (v4f32 (XXSLDWI (XSCVDPSPN $B), (XSCVDPSPN $B), 3));
2113 dag I32_TO_BE_WORD1 = (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC);
2114}
2115
Kit Barton93612ec2016-02-26 21:11:55 +00002116// The following VSX instructions were introduced in Power ISA 3.0
2117def HasP9Vector : Predicate<"PPCSubTarget->hasP9Vector()">;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002118let AddedComplexity = 400, Predicates = [HasP9Vector] in {
Kit Barton93612ec2016-02-26 21:11:55 +00002119
2120 // [PO VRT XO VRB XO /]
2121 class X_VT5_XO5_VB5<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2122 list<dag> pattern>
2123 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vrrc:$vB),
2124 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2125
2126 // [PO VRT XO VRB XO RO], Round to Odd version of [PO VRT XO VRB XO /]
2127 class X_VT5_XO5_VB5_Ro<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2128 list<dag> pattern>
2129 : X_VT5_XO5_VB5<opcode, xo2, xo, opc, pattern>, isDOT;
2130
2131 // [PO VRT XO VRB XO /], but the VRB is only used the left 64 bits (or less),
2132 // So we use different operand class for VRB
2133 class X_VT5_XO5_VB5_TyVB<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2134 RegisterOperand vbtype, list<dag> pattern>
2135 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vbtype:$vB),
2136 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2137
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002138 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002139 // [PO T XO B XO BX /]
2140 class XX2_RT5_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2141 list<dag> pattern>
2142 : XX2_RD5_XO5_RS6<opcode, xo2, xo, (outs g8rc:$rT), (ins vsfrc:$XB),
2143 !strconcat(opc, " $rT, $XB"), IIC_VecFP, pattern>;
2144
Kit Barton93612ec2016-02-26 21:11:55 +00002145 // [PO T XO B XO BX TX]
2146 class XX2_XT6_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2147 RegisterOperand vtype, list<dag> pattern>
2148 : XX2_RD6_XO5_RS6<opcode, xo2, xo, (outs vtype:$XT), (ins vtype:$XB),
2149 !strconcat(opc, " $XT, $XB"), IIC_VecFP, pattern>;
2150
2151 // [PO T A B XO AX BX TX], src and dest register use different operand class
2152 class XX3_XT5_XA5_XB5<bits<6> opcode, bits<8> xo, string opc,
2153 RegisterOperand xty, RegisterOperand aty, RegisterOperand bty,
2154 InstrItinClass itin, list<dag> pattern>
2155 : XX3Form<opcode, xo, (outs xty:$XT), (ins aty:$XA, bty:$XB),
2156 !strconcat(opc, " $XT, $XA, $XB"), itin, pattern>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002157 } // UseVSXReg = 1
Kit Barton93612ec2016-02-26 21:11:55 +00002158
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002159 // [PO VRT VRA VRB XO /]
2160 class X_VT5_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2161 list<dag> pattern>
2162 : XForm_1<opcode, xo, (outs vrrc:$vT), (ins vrrc:$vA, vrrc:$vB),
2163 !strconcat(opc, " $vT, $vA, $vB"), IIC_VecFP, pattern>;
2164
2165 // [PO VRT VRA VRB XO RO], Round to Odd version of [PO VRT VRA VRB XO /]
2166 class X_VT5_VA5_VB5_Ro<bits<6> opcode, bits<10> xo, string opc,
2167 list<dag> pattern>
2168 : X_VT5_VA5_VB5<opcode, xo, opc, pattern>, isDOT;
2169
2170 //===--------------------------------------------------------------------===//
2171 // Quad-Precision Scalar Move Instructions:
2172
2173 // Copy Sign
2174 def XSCPSGNQP : X_VT5_VA5_VB5<63, 100, "xscpsgnqp", []>;
2175
2176 // Absolute/Negative-Absolute/Negate
2177 def XSABSQP : X_VT5_XO5_VB5<63, 0, 804, "xsabsqp" , []>;
2178 def XSNABSQP : X_VT5_XO5_VB5<63, 8, 804, "xsnabsqp", []>;
2179 def XSNEGQP : X_VT5_XO5_VB5<63, 16, 804, "xsnegqp" , []>;
2180
2181 //===--------------------------------------------------------------------===//
2182 // Quad-Precision Scalar Floating-Point Arithmetic Instructions:
2183
2184 // Add/Divide/Multiply/Subtract
2185 def XSADDQP : X_VT5_VA5_VB5 <63, 4, "xsaddqp" , []>;
2186 def XSADDQPO : X_VT5_VA5_VB5_Ro<63, 4, "xsaddqpo", []>;
2187 def XSDIVQP : X_VT5_VA5_VB5 <63, 548, "xsdivqp" , []>;
2188 def XSDIVQPO : X_VT5_VA5_VB5_Ro<63, 548, "xsdivqpo", []>;
2189 def XSMULQP : X_VT5_VA5_VB5 <63, 36, "xsmulqp" , []>;
2190 def XSMULQPO : X_VT5_VA5_VB5_Ro<63, 36, "xsmulqpo", []>;
2191 def XSSUBQP : X_VT5_VA5_VB5 <63, 516, "xssubqp" , []>;
2192 def XSSUBQPO : X_VT5_VA5_VB5_Ro<63, 516, "xssubqpo", []>;
2193
2194 // Square-Root
2195 def XSSQRTQP : X_VT5_XO5_VB5 <63, 27, 804, "xssqrtqp" , []>;
2196 def XSSQRTQPO : X_VT5_XO5_VB5_Ro<63, 27, 804, "xssqrtqpo", []>;
2197
2198 // (Negative) Multiply-{Add/Subtract}
2199 def XSMADDQP : X_VT5_VA5_VB5 <63, 388, "xsmaddqp" , []>;
2200 def XSMADDQPO : X_VT5_VA5_VB5_Ro<63, 388, "xsmaddqpo" , []>;
2201 def XSMSUBQP : X_VT5_VA5_VB5 <63, 420, "xsmsubqp" , []>;
2202 def XSMSUBQPO : X_VT5_VA5_VB5_Ro<63, 420, "xsmsubqpo" , []>;
2203 def XSNMADDQP : X_VT5_VA5_VB5 <63, 452, "xsnmaddqp" , []>;
2204 def XSNMADDQPO: X_VT5_VA5_VB5_Ro<63, 452, "xsnmaddqpo", []>;
2205 def XSNMSUBQP : X_VT5_VA5_VB5 <63, 484, "xsnmsubqp" , []>;
2206 def XSNMSUBQPO: X_VT5_VA5_VB5_Ro<63, 484, "xsnmsubqpo", []>;
2207
Kit Barton93612ec2016-02-26 21:11:55 +00002208 //===--------------------------------------------------------------------===//
2209 // Quad/Double-Precision Compare Instructions:
2210
2211 // [PO BF // VRA VRB XO /]
2212 class X_BF3_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2213 list<dag> pattern>
2214 : XForm_17<opcode, xo, (outs crrc:$crD), (ins vrrc:$VA, vrrc:$VB),
2215 !strconcat(opc, " $crD, $VA, $VB"), IIC_FPCompare> {
2216 let Pattern = pattern;
2217 }
2218
2219 // QP Compare Ordered/Unordered
2220 def XSCMPOQP : X_BF3_VA5_VB5<63, 132, "xscmpoqp", []>;
2221 def XSCMPUQP : X_BF3_VA5_VB5<63, 644, "xscmpuqp", []>;
2222
2223 // DP/QP Compare Exponents
2224 def XSCMPEXPDP : XX3Form_1<60, 59,
2225 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002226 "xscmpexpdp $crD, $XA, $XB", IIC_FPCompare, []>,
2227 UseVSXReg;
Kit Barton93612ec2016-02-26 21:11:55 +00002228 def XSCMPEXPQP : X_BF3_VA5_VB5<63, 164, "xscmpexpqp", []>;
2229
2230 // DP Compare ==, >=, >, !=
2231 // Use vsrc for XT, because the entire register of XT is set.
2232 // XT.dword[1] = 0x0000_0000_0000_0000
2233 def XSCMPEQDP : XX3_XT5_XA5_XB5<60, 3, "xscmpeqdp", vsrc, vsfrc, vsfrc,
2234 IIC_FPCompare, []>;
2235 def XSCMPGEDP : XX3_XT5_XA5_XB5<60, 19, "xscmpgedp", vsrc, vsfrc, vsfrc,
2236 IIC_FPCompare, []>;
2237 def XSCMPGTDP : XX3_XT5_XA5_XB5<60, 11, "xscmpgtdp", vsrc, vsfrc, vsfrc,
2238 IIC_FPCompare, []>;
2239 def XSCMPNEDP : XX3_XT5_XA5_XB5<60, 27, "xscmpnedp", vsrc, vsfrc, vsfrc,
2240 IIC_FPCompare, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002241 let UseVSXReg = 1 in {
Kit Barton93612ec2016-02-26 21:11:55 +00002242 // Vector Compare Not Equal
2243 def XVCMPNEDP : XX3Form_Rc<60, 123,
2244 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2245 "xvcmpnedp $XT, $XA, $XB", IIC_VecFPCompare, []>;
2246 let Defs = [CR6] in
2247 def XVCMPNEDPo : XX3Form_Rc<60, 123,
2248 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2249 "xvcmpnedp. $XT, $XA, $XB", IIC_VecFPCompare, []>,
2250 isDOT;
2251 def XVCMPNESP : XX3Form_Rc<60, 91,
2252 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2253 "xvcmpnesp $XT, $XA, $XB", IIC_VecFPCompare, []>;
2254 let Defs = [CR6] in
2255 def XVCMPNESPo : XX3Form_Rc<60, 91,
2256 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2257 "xvcmpnesp. $XT, $XA, $XB", IIC_VecFPCompare, []>,
2258 isDOT;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002259 } // UseVSXReg = 1
Kit Barton93612ec2016-02-26 21:11:55 +00002260
2261 //===--------------------------------------------------------------------===//
2262 // Quad-Precision Floating-Point Conversion Instructions:
2263
2264 // Convert DP -> QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002265 def XSCVDPQP : X_VT5_XO5_VB5_TyVB<63, 22, 836, "xscvdpqp", vfrc, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002266
2267 // Round & Convert QP -> DP (dword[1] is set to zero)
2268 def XSCVQPDP : X_VT5_XO5_VB5 <63, 20, 836, "xscvqpdp" , []>;
2269 def XSCVQPDPO : X_VT5_XO5_VB5_Ro<63, 20, 836, "xscvqpdpo", []>;
2270
2271 // Truncate & Convert QP -> (Un)Signed (D)Word (dword[1] is set to zero)
2272 def XSCVQPSDZ : X_VT5_XO5_VB5<63, 25, 836, "xscvqpsdz", []>;
2273 def XSCVQPSWZ : X_VT5_XO5_VB5<63, 9, 836, "xscvqpswz", []>;
2274 def XSCVQPUDZ : X_VT5_XO5_VB5<63, 17, 836, "xscvqpudz", []>;
2275 def XSCVQPUWZ : X_VT5_XO5_VB5<63, 1, 836, "xscvqpuwz", []>;
2276
2277 // Convert (Un)Signed DWord -> QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002278 def XSCVSDQP : X_VT5_XO5_VB5_TyVB<63, 10, 836, "xscvsdqp", vfrc, []>;
2279 def XSCVUDQP : X_VT5_XO5_VB5_TyVB<63, 2, 836, "xscvudqp", vfrc, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002280
Sean Fertilea435e072016-11-14 18:43:59 +00002281 let UseVSXReg = 1 in {
Kit Barton93612ec2016-02-26 21:11:55 +00002282 //===--------------------------------------------------------------------===//
2283 // Round to Floating-Point Integer Instructions
2284
2285 // (Round &) Convert DP <-> HP
2286 // Note! xscvdphp's src and dest register both use the left 64 bits, so we use
2287 // vsfrc for src and dest register. xscvhpdp's src only use the left 16 bits,
2288 // but we still use vsfrc for it.
2289 def XSCVDPHP : XX2_XT6_XO5_XB6<60, 17, 347, "xscvdphp", vsfrc, []>;
2290 def XSCVHPDP : XX2_XT6_XO5_XB6<60, 16, 347, "xscvhpdp", vsfrc, []>;
2291
2292 // Vector HP -> SP
2293 def XVCVHPSP : XX2_XT6_XO5_XB6<60, 24, 475, "xvcvhpsp", vsrc, []>;
Nemanja Ivanovicec4b0c32016-11-11 21:42:01 +00002294 def XVCVSPHP : XX2_XT6_XO5_XB6<60, 25, 475, "xvcvsphp", vsrc,
2295 [(set v4f32:$XT,
2296 (int_ppc_vsx_xvcvsphp v4f32:$XB))]>;
Kit Barton93612ec2016-02-26 21:11:55 +00002297
Sean Fertilea435e072016-11-14 18:43:59 +00002298 } // UseVSXReg = 1
2299
2300 // Pattern for matching Vector HP -> Vector SP intrinsic. Defined as a
Simon Pilgrim68168d12017-03-30 12:59:53 +00002301 // separate pattern so that it can convert the input register class from
Sean Fertilea435e072016-11-14 18:43:59 +00002302 // VRRC(v8i16) to VSRC.
2303 def : Pat<(v4f32 (int_ppc_vsx_xvcvhpsp v8i16:$A)),
2304 (v4f32 (XVCVHPSP (COPY_TO_REGCLASS $A, VSRC)))>;
2305
Kit Barton93612ec2016-02-26 21:11:55 +00002306 class Z23_VT5_R1_VB5_RMC2_EX1<bits<6> opcode, bits<8> xo, bit ex, string opc,
2307 list<dag> pattern>
2308 : Z23Form_1<opcode, xo,
2309 (outs vrrc:$vT), (ins u1imm:$r, vrrc:$vB, u2imm:$rmc),
2310 !strconcat(opc, " $r, $vT, $vB, $rmc"), IIC_VecFP, pattern> {
2311 let RC = ex;
2312 }
2313
2314 // Round to Quad-Precision Integer [with Inexact]
2315 def XSRQPI : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 0, "xsrqpi" , []>;
2316 def XSRQPIX : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 1, "xsrqpix", []>;
2317
2318 // Round Quad-Precision to Double-Extended Precision (fp80)
2319 def XSRQPXP : Z23_VT5_R1_VB5_RMC2_EX1<63, 37, 0, "xsrqpxp", []>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002320
2321 //===--------------------------------------------------------------------===//
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002322 // Insert/Extract Instructions
2323
2324 // Insert Exponent DP/QP
2325 // XT NOTE: XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU
2326 def XSIEXPDP : XX1Form <60, 918, (outs vsrc:$XT), (ins g8rc:$rA, g8rc:$rB),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002327 "xsiexpdp $XT, $rA, $rB", IIC_VecFP, []>, UseVSXReg;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002328 // vB NOTE: only vB.dword[0] is used, that's why we don't use
2329 // X_VT5_VA5_VB5 form
2330 def XSIEXPQP : XForm_18<63, 868, (outs vrrc:$vT), (ins vrrc:$vA, vsfrc:$vB),
2331 "xsiexpqp $vT, $vA, $vB", IIC_VecFP, []>;
2332
2333 // Extract Exponent/Significand DP/QP
2334 def XSXEXPDP : XX2_RT5_XO5_XB6<60, 0, 347, "xsxexpdp", []>;
2335 def XSXSIGDP : XX2_RT5_XO5_XB6<60, 1, 347, "xsxsigdp", []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002336
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002337 def XSXEXPQP : X_VT5_XO5_VB5 <63, 2, 804, "xsxexpqp", []>;
2338 def XSXSIGQP : X_VT5_XO5_VB5 <63, 18, 804, "xsxsigqp", []>;
2339
2340 // Vector Insert Word
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002341 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002342 // XB NOTE: Only XB.dword[1] is used, but we use vsrc on XB.
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002343 def XXINSERTW :
2344 XX2_RD6_UIM5_RS6<60, 181, (outs vsrc:$XT),
2345 (ins vsrc:$XTi, vsrc:$XB, u4imm:$UIM),
2346 "xxinsertw $XT, $XB, $UIM", IIC_VecFP,
2347 [(set v4i32:$XT, (PPCxxinsert v4i32:$XTi, v4i32:$XB,
2348 imm32SExt16:$UIM))]>,
2349 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002350
2351 // Vector Extract Unsigned Word
2352 def XXEXTRACTUW : XX2_RD6_UIM5_RS6<60, 165,
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002353 (outs vsfrc:$XT), (ins vsrc:$XB, u4imm:$UIMM),
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002354 "xxextractuw $XT, $XB, $UIMM", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002355 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002356
2357 // Vector Insert Exponent DP/SP
2358 def XVIEXPDP : XX3_XT5_XA5_XB5<60, 248, "xviexpdp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002359 IIC_VecFP, [(set v2f64: $XT,(int_ppc_vsx_xviexpdp v2i64:$XA, v2i64:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002360 def XVIEXPSP : XX3_XT5_XA5_XB5<60, 216, "xviexpsp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002361 IIC_VecFP, [(set v4f32: $XT,(int_ppc_vsx_xviexpsp v4i32:$XA, v4i32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002362
2363 // Vector Extract Exponent/Significand DP/SP
Sean Fertileadda5b22016-11-14 14:42:37 +00002364 def XVXEXPDP : XX2_XT6_XO5_XB6<60, 0, 475, "xvxexpdp", vsrc,
2365 [(set v2i64: $XT,
2366 (int_ppc_vsx_xvxexpdp v2f64:$XB))]>;
2367 def XVXEXPSP : XX2_XT6_XO5_XB6<60, 8, 475, "xvxexpsp", vsrc,
2368 [(set v4i32: $XT,
2369 (int_ppc_vsx_xvxexpsp v4f32:$XB))]>;
2370 def XVXSIGDP : XX2_XT6_XO5_XB6<60, 1, 475, "xvxsigdp", vsrc,
2371 [(set v2i64: $XT,
2372 (int_ppc_vsx_xvxsigdp v2f64:$XB))]>;
2373 def XVXSIGSP : XX2_XT6_XO5_XB6<60, 9, 475, "xvxsigsp", vsrc,
2374 [(set v4i32: $XT,
2375 (int_ppc_vsx_xvxsigsp v4f32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002376
Sean Fertile1c4109b2016-12-09 17:21:42 +00002377 let AddedComplexity = 400, Predicates = [HasP9Vector] in {
2378 // Extra patterns expanding to vector Extract Word/Insert Word
2379 def : Pat<(v4i32 (int_ppc_vsx_xxinsertw v4i32:$A, v2i64:$B, imm:$IMM)),
2380 (v4i32 (XXINSERTW $A, $B, imm:$IMM))>;
2381 def : Pat<(v2i64 (int_ppc_vsx_xxextractuw v2i64:$A, imm:$IMM)),
2382 (v2i64 (COPY_TO_REGCLASS (XXEXTRACTUW $A, imm:$IMM), VSRC))>;
2383 } // AddedComplexity = 400, HasP9Vector
2384
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002385 //===--------------------------------------------------------------------===//
2386
2387 // Test Data Class SP/DP/QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002388 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002389 def XSTSTDCSP : XX2_BF3_DCMX7_RS6<60, 298,
2390 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2391 "xststdcsp $BF, $XB, $DCMX", IIC_VecFP, []>;
2392 def XSTSTDCDP : XX2_BF3_DCMX7_RS6<60, 362,
2393 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2394 "xststdcdp $BF, $XB, $DCMX", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002395 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002396 def XSTSTDCQP : X_BF3_DCMX7_RS5 <63, 708,
2397 (outs crrc:$BF), (ins u7imm:$DCMX, vrrc:$vB),
2398 "xststdcqp $BF, $vB, $DCMX", IIC_VecFP, []>;
2399
2400 // Vector Test Data Class SP/DP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002401 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002402 def XVTSTDCSP : XX2_RD6_DCMX7_RS6<60, 13, 5,
2403 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002404 "xvtstdcsp $XT, $XB, $DCMX", IIC_VecFP,
2405 [(set v4i32: $XT,
2406 (int_ppc_vsx_xvtstdcsp v4f32:$XB, imm:$DCMX))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002407 def XVTSTDCDP : XX2_RD6_DCMX7_RS6<60, 15, 5,
2408 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002409 "xvtstdcdp $XT, $XB, $DCMX", IIC_VecFP,
2410 [(set v2i64: $XT,
2411 (int_ppc_vsx_xvtstdcdp v2f64:$XB, imm:$DCMX))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002412 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002413
2414 //===--------------------------------------------------------------------===//
2415
2416 // Maximum/Minimum Type-C/Type-J DP
2417 // XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU, so we use vsrc for XT
2418 def XSMAXCDP : XX3_XT5_XA5_XB5<60, 128, "xsmaxcdp", vsrc, vsfrc, vsfrc,
2419 IIC_VecFP, []>;
2420 def XSMAXJDP : XX3_XT5_XA5_XB5<60, 144, "xsmaxjdp", vsrc, vsfrc, vsfrc,
2421 IIC_VecFP, []>;
2422 def XSMINCDP : XX3_XT5_XA5_XB5<60, 136, "xsmincdp", vsrc, vsfrc, vsfrc,
2423 IIC_VecFP, []>;
2424 def XSMINJDP : XX3_XT5_XA5_XB5<60, 152, "xsminjdp", vsrc, vsfrc, vsfrc,
2425 IIC_VecFP, []>;
2426
2427 //===--------------------------------------------------------------------===//
2428
2429 // Vector Byte-Reverse H/W/D/Q Word
2430 def XXBRH : XX2_XT6_XO5_XB6<60, 7, 475, "xxbrh", vsrc, []>;
2431 def XXBRW : XX2_XT6_XO5_XB6<60, 15, 475, "xxbrw", vsrc, []>;
2432 def XXBRD : XX2_XT6_XO5_XB6<60, 23, 475, "xxbrd", vsrc, []>;
2433 def XXBRQ : XX2_XT6_XO5_XB6<60, 31, 475, "xxbrq", vsrc, []>;
2434
Tony Jiang1a8eec12017-06-12 18:24:36 +00002435 // Vector Reverse
2436 def : Pat<(v8i16 (PPCxxreverse v8i16 :$A)),
2437 (v8i16 (COPY_TO_REGCLASS (XXBRH (COPY_TO_REGCLASS $A, VSRC)), VRRC))>;
2438 def : Pat<(v4i32 (PPCxxreverse v4i32 :$A)),
2439 (v4i32 (XXBRW $A))>;
2440 def : Pat<(v2i64 (PPCxxreverse v2i64 :$A)),
2441 (v2i64 (XXBRD $A))>;
2442 def : Pat<(v1i128 (PPCxxreverse v1i128 :$A)),
2443 (v1i128 (COPY_TO_REGCLASS (XXBRQ (COPY_TO_REGCLASS $A, VSRC)), VRRC))>;
2444
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002445 // Vector Permute
2446 def XXPERM : XX3_XT5_XA5_XB5<60, 26, "xxperm" , vsrc, vsrc, vsrc,
2447 IIC_VecPerm, []>;
2448 def XXPERMR : XX3_XT5_XA5_XB5<60, 58, "xxpermr", vsrc, vsrc, vsrc,
2449 IIC_VecPerm, []>;
2450
2451 // Vector Splat Immediate Byte
2452 def XXSPLTIB : X_RD6_IMM8<60, 360, (outs vsrc:$XT), (ins u8imm:$IMM8),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002453 "xxspltib $XT, $IMM8", IIC_VecPerm, []>, UseVSXReg;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002454
2455 //===--------------------------------------------------------------------===//
Kit Bartonba532dc2016-03-08 03:49:13 +00002456 // Vector/Scalar Load/Store Instructions
2457
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002458 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2459 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Sean Fertile3c8c3852017-01-26 18:59:15 +00002460 let mayLoad = 1, mayStore = 0 in {
Kit Bartonba532dc2016-03-08 03:49:13 +00002461 // Load Vector
2462 def LXV : DQ_RD6_RS5_DQ12<61, 1, (outs vsrc:$XT), (ins memrix16:$src),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002463 "lxv $XT, $src", IIC_LdStLFD, []>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002464 // Load DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002465 def LXSD : DSForm_1<57, 2, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002466 "lxsd $vD, $src", IIC_LdStLFD, []>;
2467 // Load SP from src, convert it to DP, and place in dword[0]
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002468 def LXSSP : DSForm_1<57, 3, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002469 "lxssp $vD, $src", IIC_LdStLFD, []>;
2470
2471 // [PO T RA RB XO TX] almost equal to [PO S RA RB XO SX], but has different
2472 // "out" and "in" dag
2473 class X_XT6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2474 RegisterOperand vtype, list<dag> pattern>
2475 : XX1Form<opcode, xo, (outs vtype:$XT), (ins memrr:$src),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002476 !strconcat(opc, " $XT, $src"), IIC_LdStLFD, pattern>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002477
2478 // Load as Integer Byte/Halfword & Zero Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002479 def LXSIBZX : X_XT6_RA5_RB5<31, 781, "lxsibzx", vsfrc,
2480 [(set f64:$XT, (PPClxsizx xoaddr:$src, 1))]>;
2481 def LXSIHZX : X_XT6_RA5_RB5<31, 813, "lxsihzx", vsfrc,
2482 [(set f64:$XT, (PPClxsizx xoaddr:$src, 2))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002483
2484 // Load Vector Halfword*8/Byte*16 Indexed
2485 def LXVH8X : X_XT6_RA5_RB5<31, 812, "lxvh8x" , vsrc, []>;
2486 def LXVB16X : X_XT6_RA5_RB5<31, 876, "lxvb16x", vsrc, []>;
2487
2488 // Load Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002489 def LXVX : X_XT6_RA5_RB5<31, 268, "lxvx" , vsrc,
Zaara Syeda93297832017-05-24 17:50:37 +00002490 [(set v2f64:$XT, (load xaddr:$src))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002491 // Load Vector (Left-justified) with Length
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002492 def LXVL : XX1Form<31, 269, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
2493 "lxvl $XT, $src, $rB", IIC_LdStLoad,
2494 [(set v4i32:$XT, (int_ppc_vsx_lxvl addr:$src, i64:$rB))]>,
2495 UseVSXReg;
2496 def LXVLL : XX1Form<31,301, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
2497 "lxvll $XT, $src, $rB", IIC_LdStLoad,
2498 [(set v4i32:$XT, (int_ppc_vsx_lxvll addr:$src, i64:$rB))]>,
2499 UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002500
2501 // Load Vector Word & Splat Indexed
2502 def LXVWSX : X_XT6_RA5_RB5<31, 364, "lxvwsx" , vsrc, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002503 } // mayLoad
Kit Bartonba532dc2016-03-08 03:49:13 +00002504
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002505 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2506 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Sean Fertile3c8c3852017-01-26 18:59:15 +00002507 let mayStore = 1, mayLoad = 0 in {
Kit Bartonba532dc2016-03-08 03:49:13 +00002508 // Store Vector
2509 def STXV : DQ_RD6_RS5_DQ12<61, 5, (outs), (ins vsrc:$XT, memrix16:$dst),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002510 "stxv $XT, $dst", IIC_LdStSTFD, []>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002511 // Store DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002512 def STXSD : DSForm_1<61, 2, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002513 "stxsd $vS, $dst", IIC_LdStSTFD, []>;
2514 // Convert DP of dword[0] to SP, and Store to dst
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002515 def STXSSP : DSForm_1<61, 3, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002516 "stxssp $vS, $dst", IIC_LdStSTFD, []>;
2517
2518 // [PO S RA RB XO SX]
2519 class X_XS6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2520 RegisterOperand vtype, list<dag> pattern>
2521 : XX1Form<opcode, xo, (outs), (ins vtype:$XT, memrr:$dst),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002522 !strconcat(opc, " $XT, $dst"), IIC_LdStSTFD, pattern>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002523
2524 // Store as Integer Byte/Halfword Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002525 def STXSIBX : X_XS6_RA5_RB5<31, 909, "stxsibx" , vsfrc,
2526 [(PPCstxsix f64:$XT, xoaddr:$dst, 1)]>;
2527 def STXSIHX : X_XS6_RA5_RB5<31, 941, "stxsihx" , vsfrc,
2528 [(PPCstxsix f64:$XT, xoaddr:$dst, 2)]>;
2529 let isCodeGenOnly = 1 in {
2530 def STXSIBXv : X_XS6_RA5_RB5<31, 909, "stxsibx" , vrrc, []>;
2531 def STXSIHXv : X_XS6_RA5_RB5<31, 941, "stxsihx" , vrrc, []>;
2532 }
Kit Bartonba532dc2016-03-08 03:49:13 +00002533
2534 // Store Vector Halfword*8/Byte*16 Indexed
2535 def STXVH8X : X_XS6_RA5_RB5<31, 940, "stxvh8x" , vsrc, []>;
2536 def STXVB16X : X_XS6_RA5_RB5<31, 1004, "stxvb16x", vsrc, []>;
2537
2538 // Store Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002539 def STXVX : X_XS6_RA5_RB5<31, 396, "stxvx" , vsrc,
Zaara Syeda93297832017-05-24 17:50:37 +00002540 [(store v2f64:$XT, xaddr:$dst)]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002541
2542 // Store Vector (Left-justified) with Length
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002543 def STXVL : XX1Form<31, 397, (outs), (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2544 "stxvl $XT, $dst, $rB", IIC_LdStLoad,
2545 [(int_ppc_vsx_stxvl v4i32:$XT, addr:$dst, i64:$rB)]>,
2546 UseVSXReg;
2547 def STXVLL : XX1Form<31, 429, (outs), (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2548 "stxvll $XT, $dst, $rB", IIC_LdStLoad,
2549 [(int_ppc_vsx_stxvll v4i32:$XT, addr:$dst, i64:$rB)]>,
2550 UseVSXReg;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002551 } // mayStore
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002552
Lei Huang451ef4a2017-08-14 18:09:29 +00002553 let Predicates = [IsLittleEndian] in {
2554 def: Pat<(f32 (PPCfcfids (PPCmtvsra (i32 (extractelt v4i32:$A, 0))))),
2555 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 3))))>;
2556 def: Pat<(f32 (PPCfcfids (PPCmtvsra (i32 (extractelt v4i32:$A, 1))))),
2557 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 2))))>;
2558 def: Pat<(f32 (PPCfcfids (PPCmtvsra (i32 (extractelt v4i32:$A, 2))))),
2559 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 1))))>;
2560 def: Pat<(f32 (PPCfcfids (PPCmtvsra (i32 (extractelt v4i32:$A, 3))))),
2561 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 0))))>;
2562 def: Pat<(f64 (PPCfcfid (PPCmtvsra (i32 (extractelt v4i32:$A, 0))))),
2563 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 3)), VSFRC))>;
2564 def: Pat<(f64 (PPCfcfid (PPCmtvsra (i32 (extractelt v4i32:$A, 1))))),
2565 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 2)), VSFRC))>;
2566 def: Pat<(f64 (PPCfcfid (PPCmtvsra (i32 (extractelt v4i32:$A, 2))))),
2567 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 1)), VSFRC))>;
2568 def: Pat<(f64 (PPCfcfid (PPCmtvsra (i32 (extractelt v4i32:$A, 3))))),
2569 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 0)), VSFRC))>;
2570 }
2571
2572 let Predicates = [IsBigEndian] in {
2573 def: Pat<(f32 (PPCfcfids (PPCmtvsra (i32 (extractelt v4i32:$A, 0))))),
2574 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 0))))>;
2575 def: Pat<(f32 (PPCfcfids (PPCmtvsra (i32 (extractelt v4i32:$A, 1))))),
2576 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 1))))>;
2577 def: Pat<(f32 (PPCfcfids (PPCmtvsra (i32 (extractelt v4i32:$A, 2))))),
2578 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 2))))>;
2579 def: Pat<(f32 (PPCfcfids (PPCmtvsra (i32 (extractelt v4i32:$A, 3))))),
2580 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 3))))>;
2581 def: Pat<(f64 (PPCfcfid (PPCmtvsra (i32 (extractelt v4i32:$A, 0))))),
2582 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 0)), VSFRC))>;
2583 def: Pat<(f64 (PPCfcfid (PPCmtvsra (i32 (extractelt v4i32:$A, 1))))),
2584 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 1)), VSFRC))>;
2585 def: Pat<(f64 (PPCfcfid (PPCmtvsra (i32 (extractelt v4i32:$A, 2))))),
2586 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 2)), VSFRC))>;
2587 def: Pat<(f64 (PPCfcfid (PPCmtvsra (i32 (extractelt v4i32:$A, 3))))),
2588 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 3)), VSFRC))>;
2589 }
2590
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002591 // Patterns for which instructions from ISA 3.0 are a better match
2592 let Predicates = [IsLittleEndian, HasP9Vector] in {
2593 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 0))))),
2594 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
2595 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 1))))),
2596 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
2597 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 2))))),
2598 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
2599 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 3))))),
2600 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
Lei Huang451ef4a2017-08-14 18:09:29 +00002601 def : Pat<(f64 (PPCfcfidu (PPCmtvsrz (i32 (extractelt v4i32:$A, 0))))),
2602 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 12)))>;
2603 def : Pat<(f64 (PPCfcfidu (PPCmtvsrz (i32 (extractelt v4i32:$A, 1))))),
2604 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 8)))>;
2605 def : Pat<(f64 (PPCfcfidu (PPCmtvsrz (i32 (extractelt v4i32:$A, 2))))),
2606 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 4)))>;
2607 def : Pat<(f64 (PPCfcfidu (PPCmtvsrz (i32 (extractelt v4i32:$A, 3))))),
2608 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 0)))>;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002609 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
2610 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
2611 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
2612 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
2613 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
2614 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
2615 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
2616 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
2617 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
2618 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
2619 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
2620 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
2621 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
2622 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
2623 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
2624 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
2625 } // IsLittleEndian, HasP9Vector
2626
2627 let Predicates = [IsBigEndian, HasP9Vector] in {
2628 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 0))))),
2629 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
2630 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 1))))),
2631 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
2632 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 2))))),
2633 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
2634 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 3))))),
2635 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
Lei Huang451ef4a2017-08-14 18:09:29 +00002636 def : Pat<(f64 (PPCfcfidu (PPCmtvsrz (i32 (extractelt v4i32:$A, 0))))),
2637 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 0)))>;
2638 def : Pat<(f64 (PPCfcfidu (PPCmtvsrz (i32 (extractelt v4i32:$A, 1))))),
2639 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 4)))>;
2640 def : Pat<(f64 (PPCfcfidu (PPCmtvsrz (i32 (extractelt v4i32:$A, 2))))),
2641 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 8)))>;
2642 def : Pat<(f64 (PPCfcfidu (PPCmtvsrz (i32 (extractelt v4i32:$A, 3))))),
2643 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 12)))>;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002644 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
2645 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
2646 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
2647 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
2648 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
2649 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
2650 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
2651 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
2652 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
2653 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
2654 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
2655 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
2656 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
2657 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
2658 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
2659 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
2660 } // IsLittleEndian, HasP9Vector
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002661
Zaara Syeda93297832017-05-24 17:50:37 +00002662 // D-Form Load/Store
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002663 def : Pat<(v4i32 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
2664 def : Pat<(v4f32 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
2665 def : Pat<(v2i64 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
2666 def : Pat<(v2f64 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
2667 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x iqaddr:$src)), (LXV memrix16:$src)>;
2668 def : Pat<(v2f64 (int_ppc_vsx_lxvd2x iqaddr:$src)), (LXV memrix16:$src)>;
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002669
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002670 def : Pat<(quadwOffsetStore v4f32:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
2671 def : Pat<(quadwOffsetStore v4i32:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
2672 def : Pat<(quadwOffsetStore v2f64:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
2673 def : Pat<(quadwOffsetStore v2i64:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
2674 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, iqaddr:$dst),
Zaara Syeda93297832017-05-24 17:50:37 +00002675 (STXV $rS, memrix16:$dst)>;
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002676 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, iqaddr:$dst),
Zaara Syeda93297832017-05-24 17:50:37 +00002677 (STXV $rS, memrix16:$dst)>;
2678
2679
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002680 def : Pat<(v2f64 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
2681 def : Pat<(v2i64 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
2682 def : Pat<(v4f32 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
2683 def : Pat<(v4i32 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
2684 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x xoaddr:$src)), (LXVX xoaddr:$src)>;
2685 def : Pat<(v2f64 (int_ppc_vsx_lxvd2x xoaddr:$src)), (LXVX xoaddr:$src)>;
2686 def : Pat<(nonQuadwOffsetStore v2f64:$rS, xoaddr:$dst),
2687 (STXVX $rS, xoaddr:$dst)>;
2688 def : Pat<(nonQuadwOffsetStore v2i64:$rS, xoaddr:$dst),
2689 (STXVX $rS, xoaddr:$dst)>;
2690 def : Pat<(nonQuadwOffsetStore v4f32:$rS, xoaddr:$dst),
2691 (STXVX $rS, xoaddr:$dst)>;
2692 def : Pat<(nonQuadwOffsetStore v4i32:$rS, xoaddr:$dst),
2693 (STXVX $rS, xoaddr:$dst)>;
2694 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
2695 (STXVX $rS, xoaddr:$dst)>;
2696 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
2697 (STXVX $rS, xoaddr:$dst)>;
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002698 def : Pat<(v4i32 (scalar_to_vector (i32 (load xoaddr:$src)))),
2699 (v4i32 (LXVWSX xoaddr:$src))>;
2700 def : Pat<(v4f32 (scalar_to_vector (f32 (load xoaddr:$src)))),
2701 (v4f32 (LXVWSX xoaddr:$src))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002702 def : Pat<(v4f32 (scalar_to_vector (f32 (fpround (extloadf32 xoaddr:$src))))),
2703 (v4f32 (LXVWSX xoaddr:$src))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002704
2705 // Build vectors from i8 loads
2706 def : Pat<(v16i8 (scalar_to_vector ScalarLoads.Li8)),
2707 (v16i8 (VSPLTBs 7, (LXSIBZX xoaddr:$src)))>;
2708 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.ZELi8)),
2709 (v8i16 (VSPLTHs 3, (LXSIBZX xoaddr:$src)))>;
2710 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi8)),
2711 (v4i32 (XXSPLTWs (LXSIBZX xoaddr:$src), 1))>;
2712 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi8i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002713 (v2i64 (XXPERMDIs (LXSIBZX xoaddr:$src), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002714 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi8)),
2715 (v4i32 (XXSPLTWs (VEXTSB2Ws (LXSIBZX xoaddr:$src)), 1))>;
2716 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi8i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002717 (v2i64 (XXPERMDIs (VEXTSB2Ds (LXSIBZX xoaddr:$src)), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002718
2719 // Build vectors from i16 loads
2720 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.Li16)),
2721 (v8i16 (VSPLTHs 3, (LXSIHZX xoaddr:$src)))>;
2722 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi16)),
2723 (v4i32 (XXSPLTWs (LXSIHZX xoaddr:$src), 1))>;
2724 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi16i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002725 (v2i64 (XXPERMDIs (LXSIHZX xoaddr:$src), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002726 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi16)),
2727 (v4i32 (XXSPLTWs (VEXTSH2Ws (LXSIHZX xoaddr:$src)), 1))>;
2728 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi16i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002729 (v2i64 (XXPERMDIs (VEXTSH2Ds (LXSIHZX xoaddr:$src)), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002730
2731 let Predicates = [IsBigEndian, HasP9Vector] in {
2732 // Scalar stores of i8
2733 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
2734 (STXSIBXv (VSLDOI $S, $S, 9), xoaddr:$dst)>;
2735 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
2736 (STXSIBXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2737 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
2738 (STXSIBXv (VSLDOI $S, $S, 11), xoaddr:$dst)>;
2739 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
2740 (STXSIBXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2741 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
2742 (STXSIBXv (VSLDOI $S, $S, 13), xoaddr:$dst)>;
2743 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
2744 (STXSIBXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2745 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
2746 (STXSIBXv (VSLDOI $S, $S, 15), xoaddr:$dst)>;
2747 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
2748 (STXSIBXv $S, xoaddr:$dst)>;
2749 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
2750 (STXSIBXv (VSLDOI $S, $S, 1), xoaddr:$dst)>;
2751 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
2752 (STXSIBXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2753 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
2754 (STXSIBXv (VSLDOI $S, $S, 3), xoaddr:$dst)>;
2755 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
2756 (STXSIBXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2757 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
2758 (STXSIBXv (VSLDOI $S, $S, 5), xoaddr:$dst)>;
2759 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
2760 (STXSIBXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2761 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
2762 (STXSIBXv (VSLDOI $S, $S, 7), xoaddr:$dst)>;
2763 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
2764 (STXSIBXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2765
2766 // Scalar stores of i16
2767 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
2768 (STXSIHXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2769 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
2770 (STXSIHXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2771 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
2772 (STXSIHXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2773 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
2774 (STXSIHXv $S, xoaddr:$dst)>;
2775 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
2776 (STXSIHXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2777 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
2778 (STXSIHXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2779 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
2780 (STXSIHXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2781 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
2782 (STXSIHXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2783 } // IsBigEndian, HasP9Vector
2784
2785 let Predicates = [IsLittleEndian, HasP9Vector] in {
2786 // Scalar stores of i8
2787 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
2788 (STXSIBXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2789 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
2790 (STXSIBXv (VSLDOI $S, $S, 7), xoaddr:$dst)>;
2791 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
2792 (STXSIBXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2793 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
2794 (STXSIBXv (VSLDOI $S, $S, 5), xoaddr:$dst)>;
2795 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
2796 (STXSIBXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2797 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
2798 (STXSIBXv (VSLDOI $S, $S, 3), xoaddr:$dst)>;
2799 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
2800 (STXSIBXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2801 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
2802 (STXSIBXv (VSLDOI $S, $S, 1), xoaddr:$dst)>;
2803 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
2804 (STXSIBXv $S, xoaddr:$dst)>;
2805 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
2806 (STXSIBXv (VSLDOI $S, $S, 15), xoaddr:$dst)>;
2807 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
2808 (STXSIBXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2809 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
2810 (STXSIBXv (VSLDOI $S, $S, 13), xoaddr:$dst)>;
2811 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
2812 (STXSIBXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2813 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
2814 (STXSIBXv (VSLDOI $S, $S, 11), xoaddr:$dst)>;
2815 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
2816 (STXSIBXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2817 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
2818 (STXSIBXv (VSLDOI $S, $S, 9), xoaddr:$dst)>;
2819
2820 // Scalar stores of i16
2821 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
2822 (STXSIHXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2823 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
2824 (STXSIHXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2825 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
2826 (STXSIHXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2827 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
2828 (STXSIHXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2829 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
2830 (STXSIHXv $S, xoaddr:$dst)>;
2831 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
2832 (STXSIHXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2833 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
2834 (STXSIHXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2835 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
2836 (STXSIHXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2837 } // IsLittleEndian, HasP9Vector
2838
Sean Fertile1c4109b2016-12-09 17:21:42 +00002839
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002840 // Vector sign extensions
2841 def : Pat<(f64 (PPCVexts f64:$A, 1)),
2842 (f64 (COPY_TO_REGCLASS (VEXTSB2Ds $A), VSFRC))>;
2843 def : Pat<(f64 (PPCVexts f64:$A, 2)),
2844 (f64 (COPY_TO_REGCLASS (VEXTSH2Ds $A), VSFRC))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002845
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002846 let isPseudo = 1 in {
2847 def DFLOADf32 : Pseudo<(outs vssrc:$XT), (ins memrix:$src),
2848 "#DFLOADf32",
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002849 [(set f32:$XT, (load ixaddr:$src))]>;
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002850 def DFLOADf64 : Pseudo<(outs vsfrc:$XT), (ins memrix:$src),
2851 "#DFLOADf64",
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002852 [(set f64:$XT, (load ixaddr:$src))]>;
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002853 def DFSTOREf32 : Pseudo<(outs), (ins vssrc:$XT, memrix:$dst),
2854 "#DFSTOREf32",
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002855 [(store f32:$XT, ixaddr:$dst)]>;
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002856 def DFSTOREf64 : Pseudo<(outs), (ins vsfrc:$XT, memrix:$dst),
2857 "#DFSTOREf64",
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002858 [(store f64:$XT, ixaddr:$dst)]>;
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002859 }
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002860 def : Pat<(f64 (extloadf32 ixaddr:$src)),
2861 (COPY_TO_REGCLASS (DFLOADf32 ixaddr:$src), VSFRC)>;
2862 def : Pat<(f32 (fpround (extloadf32 ixaddr:$src))),
2863 (f32 (DFLOADf32 ixaddr:$src))>;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002864} // end HasP9Vector, AddedComplexity
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002865
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002866// Integer extend helper dags 32 -> 64
2867def AnyExts {
2868 dag A = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32);
2869 dag B = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $B, sub_32);
2870 dag C = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $C, sub_32);
2871 dag D = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $D, sub_32);
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002872}
2873
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002874def DblToFlt {
2875 dag A0 = (f32 (fpround (f64 (extractelt v2f64:$A, 0))));
2876 dag A1 = (f32 (fpround (f64 (extractelt v2f64:$A, 1))));
2877 dag B0 = (f32 (fpround (f64 (extractelt v2f64:$B, 0))));
2878 dag B1 = (f32 (fpround (f64 (extractelt v2f64:$B, 1))));
2879}
Zaara Syeda79acbbe2017-06-08 17:14:36 +00002880
2881def ByteToWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00002882 dag LE_A0 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 0)), i8));
2883 dag LE_A1 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 4)), i8));
2884 dag LE_A2 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 8)), i8));
2885 dag LE_A3 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 12)), i8));
2886 dag BE_A0 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 3)), i8));
2887 dag BE_A1 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 7)), i8));
2888 dag BE_A2 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 11)), i8));
2889 dag BE_A3 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 15)), i8));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00002890}
2891
2892def ByteToDWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00002893 dag LE_A0 = (i64 (sext_inreg
2894 (i64 (anyext (i32 (vector_extract v16i8:$A, 0)))), i8));
2895 dag LE_A1 = (i64 (sext_inreg
2896 (i64 (anyext (i32 (vector_extract v16i8:$A, 8)))), i8));
2897 dag BE_A0 = (i64 (sext_inreg
2898 (i64 (anyext (i32 (vector_extract v16i8:$A, 7)))), i8));
2899 dag BE_A1 = (i64 (sext_inreg
2900 (i64 (anyext (i32 (vector_extract v16i8:$A, 15)))), i8));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00002901}
2902
2903def HWordToWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00002904 dag LE_A0 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 0)), i16));
2905 dag LE_A1 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 2)), i16));
2906 dag LE_A2 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 4)), i16));
2907 dag LE_A3 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 6)), i16));
2908 dag BE_A0 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 1)), i16));
2909 dag BE_A1 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 3)), i16));
2910 dag BE_A2 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 5)), i16));
2911 dag BE_A3 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 7)), i16));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00002912}
2913
2914def HWordToDWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00002915 dag LE_A0 = (i64 (sext_inreg
2916 (i64 (anyext (i32 (vector_extract v8i16:$A, 0)))), i16));
2917 dag LE_A1 = (i64 (sext_inreg
2918 (i64 (anyext (i32 (vector_extract v8i16:$A, 4)))), i16));
2919 dag BE_A0 = (i64 (sext_inreg
2920 (i64 (anyext (i32 (vector_extract v8i16:$A, 3)))), i16));
2921 dag BE_A1 = (i64 (sext_inreg
2922 (i64 (anyext (i32 (vector_extract v8i16:$A, 7)))), i16));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00002923}
2924
2925def WordToDWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00002926 dag LE_A0 = (i64 (sext (i32 (vector_extract v4i32:$A, 0))));
2927 dag LE_A1 = (i64 (sext (i32 (vector_extract v4i32:$A, 2))));
2928 dag BE_A0 = (i64 (sext (i32 (vector_extract v4i32:$A, 1))));
2929 dag BE_A1 = (i64 (sext (i32 (vector_extract v4i32:$A, 3))));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00002930}
2931
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002932def FltToIntLoad {
2933 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (extloadf32 xoaddr:$A)))));
2934}
2935def FltToUIntLoad {
2936 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (extloadf32 xoaddr:$A)))));
2937}
2938def FltToLongLoad {
2939 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (extloadf32 xoaddr:$A)))));
2940}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00002941def FltToLongLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002942 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (extloadf32 ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00002943}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002944def FltToULongLoad {
2945 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (extloadf32 xoaddr:$A)))));
2946}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00002947def FltToULongLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002948 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (extloadf32 ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00002949}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002950def FltToLong {
2951 dag A = (i64 (PPCmfvsr (PPCfctidz (fpextend f32:$A))));
2952}
2953def FltToULong {
2954 dag A = (i64 (PPCmfvsr (PPCfctiduz (fpextend f32:$A))));
2955}
2956def DblToInt {
2957 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwz f64:$A))));
2958}
2959def DblToUInt {
2960 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwuz f64:$A))));
2961}
2962def DblToLong {
2963 dag A = (i64 (PPCmfvsr (f64 (PPCfctidz f64:$A))));
2964}
2965def DblToULong {
2966 dag A = (i64 (PPCmfvsr (f64 (PPCfctiduz f64:$A))));
2967}
2968def DblToIntLoad {
2969 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (load xoaddr:$A)))));
2970}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00002971def DblToIntLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002972 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (load ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00002973}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002974def DblToUIntLoad {
2975 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (load xoaddr:$A)))));
2976}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00002977def DblToUIntLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00002978 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (load ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00002979}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002980def DblToLongLoad {
2981 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (load xoaddr:$A)))));
2982}
2983def DblToULongLoad {
2984 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (load xoaddr:$A)))));
2985}
2986
2987// FP merge dags (for f32 -> v4f32)
2988def MrgFP {
2989 dag AC = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $A, VSRC),
2990 (COPY_TO_REGCLASS $C, VSRC), 0));
2991 dag BD = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $B, VSRC),
2992 (COPY_TO_REGCLASS $D, VSRC), 0));
2993 dag ABhToFlt = (XVCVDPSP (XXPERMDI $A, $B, 0));
2994 dag ABlToFlt = (XVCVDPSP (XXPERMDI $A, $B, 3));
2995 dag BAhToFlt = (XVCVDPSP (XXPERMDI $B, $A, 0));
2996 dag BAlToFlt = (XVCVDPSP (XXPERMDI $B, $A, 3));
2997}
2998
2999// Patterns for BUILD_VECTOR nodes.
3000def NoP9Vector : Predicate<"!PPCSubTarget->hasP9Vector()">;
3001let AddedComplexity = 400 in {
3002
3003 let Predicates = [HasVSX] in {
3004 // Build vectors of floating point converted to i32.
3005 def : Pat<(v4i32 (build_vector DblToInt.A, DblToInt.A,
3006 DblToInt.A, DblToInt.A)),
3007 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPSXWS $A), VSRC), 1))>;
3008 def : Pat<(v4i32 (build_vector DblToUInt.A, DblToUInt.A,
3009 DblToUInt.A, DblToUInt.A)),
3010 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPUXWS $A), VSRC), 1))>;
3011 def : Pat<(v2i64 (build_vector DblToLong.A, DblToLong.A)),
3012 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC),
3013 (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC), 0))>;
3014 def : Pat<(v2i64 (build_vector DblToULong.A, DblToULong.A)),
3015 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC),
3016 (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC), 0))>;
3017 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
3018 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
3019 (XSCVDPSXWSs (LXSSPX xoaddr:$A)), VSRC), 1))>;
3020 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
3021 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
3022 (XSCVDPUXWSs (LXSSPX xoaddr:$A)), VSRC), 1))>;
3023 def : Pat<(v4f32 (build_vector f32:$A, f32:$A, f32:$A, f32:$A)),
3024 (v4f32 (XXSPLTW (v4f32 (XSCVDPSPN $A)), 0))>;
3025
3026 // Build vectors of floating point converted to i64.
3027 def : Pat<(v2i64 (build_vector FltToLong.A, FltToLong.A)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00003028 (v2i64 (XXPERMDIs
3029 (COPY_TO_REGCLASS (XSCVDPSXDSs $A), VSFRC), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003030 def : Pat<(v2i64 (build_vector FltToULong.A, FltToULong.A)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00003031 (v2i64 (XXPERMDIs
3032 (COPY_TO_REGCLASS (XSCVDPUXDSs $A), VSFRC), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003033 def : Pat<(v2i64 (scalar_to_vector DblToLongLoad.A)),
3034 (v2i64 (XVCVDPSXDS (LXVDSX xoaddr:$A)))>;
3035 def : Pat<(v2i64 (scalar_to_vector DblToULongLoad.A)),
3036 (v2i64 (XVCVDPUXDS (LXVDSX xoaddr:$A)))>;
3037 }
3038
3039 let Predicates = [HasVSX, NoP9Vector] in {
3040 // Load-and-splat with fp-to-int conversion (using X-Form VSX loads).
3041 def : Pat<(v4i32 (scalar_to_vector DblToIntLoad.A)),
3042 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
3043 (XSCVDPSXWS (LXSDX xoaddr:$A)), VSRC), 1))>;
3044 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoad.A)),
3045 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
3046 (XSCVDPUXWS (LXSDX xoaddr:$A)), VSRC), 1))>;
3047 def : Pat<(v2i64 (scalar_to_vector FltToLongLoad.A)),
3048 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
3049 (LXSSPX xoaddr:$A), VSFRC)), 0))>;
3050 def : Pat<(v2i64 (scalar_to_vector FltToULongLoad.A)),
3051 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
3052 (LXSSPX xoaddr:$A), VSFRC)), 0))>;
3053 }
3054
3055 // Big endian, available on all targets with VSX
3056 let Predicates = [IsBigEndian, HasVSX] in {
3057 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
3058 (v2f64 (XXPERMDI
3059 (COPY_TO_REGCLASS $A, VSRC),
3060 (COPY_TO_REGCLASS $B, VSRC), 0))>;
3061
3062 def : Pat<(v4f32 (build_vector f32:$A, f32:$B, f32:$C, f32:$D)),
3063 (VMRGEW MrgFP.AC, MrgFP.BD)>;
3064 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
3065 DblToFlt.B0, DblToFlt.B1)),
3066 (v4f32 (VMRGEW MrgFP.ABhToFlt, MrgFP.ABlToFlt))>;
3067 }
3068
3069 let Predicates = [IsLittleEndian, HasVSX] in {
3070 // Little endian, available on all targets with VSX
3071 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
3072 (v2f64 (XXPERMDI
3073 (COPY_TO_REGCLASS $B, VSRC),
3074 (COPY_TO_REGCLASS $A, VSRC), 0))>;
3075
3076 def : Pat<(v4f32 (build_vector f32:$D, f32:$C, f32:$B, f32:$A)),
3077 (VMRGEW MrgFP.AC, MrgFP.BD)>;
3078 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
3079 DblToFlt.B0, DblToFlt.B1)),
3080 (v4f32 (VMRGEW MrgFP.BAhToFlt, MrgFP.BAlToFlt))>;
3081 }
3082
3083 let Predicates = [HasDirectMove] in {
3084 // Endianness-neutral constant splat on P8 and newer targets. The reason
3085 // for this pattern is that on targets with direct moves, we don't expand
3086 // BUILD_VECTOR nodes for v4i32.
3087 def : Pat<(v4i32 (build_vector immSExt5NonZero:$A, immSExt5NonZero:$A,
3088 immSExt5NonZero:$A, immSExt5NonZero:$A)),
3089 (v4i32 (VSPLTISW imm:$A))>;
3090 }
3091
3092 let Predicates = [IsBigEndian, HasDirectMove, NoP9Vector] in {
3093 // Big endian integer vectors using direct moves.
3094 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
3095 (v2i64 (XXPERMDI
3096 (COPY_TO_REGCLASS (MTVSRD $A), VSRC),
3097 (COPY_TO_REGCLASS (MTVSRD $B), VSRC), 0))>;
3098 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
3099 (VMRGOW (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC),
3100 (COPY_TO_REGCLASS (MTVSRWZ $C), VSRC), 0),
3101 (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC),
3102 (COPY_TO_REGCLASS (MTVSRWZ $D), VSRC), 0))>;
3103 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
3104 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
3105 }
3106
3107 let Predicates = [IsLittleEndian, HasDirectMove, NoP9Vector] in {
3108 // Little endian integer vectors using direct moves.
3109 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
3110 (v2i64 (XXPERMDI
3111 (COPY_TO_REGCLASS (MTVSRD $B), VSRC),
3112 (COPY_TO_REGCLASS (MTVSRD $A), VSRC), 0))>;
3113 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
3114 (VMRGOW (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $D), VSRC),
3115 (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC), 0),
3116 (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $C), VSRC),
3117 (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 0))>;
3118 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
3119 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
3120 }
3121
3122 let Predicates = [HasP9Vector] in {
3123 // Endianness-neutral patterns for const splats with ISA 3.0 instructions.
3124 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
3125 (v4i32 (MTVSRWS $A))>;
3126 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
3127 (v4i32 (MTVSRWS $A))>;
Nemanja Ivanovic552c8e92016-12-15 11:16:20 +00003128 def : Pat<(v16i8 (build_vector immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
3129 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
3130 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
3131 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
3132 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
3133 immAnyExt8:$A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003134 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB imm:$A), VSRC))>;
3135 def : Pat<(v16i8 immAllOnesV),
3136 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
3137 def : Pat<(v8i16 immAllOnesV),
3138 (v8i16 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
3139 def : Pat<(v4i32 immAllOnesV),
3140 (v4i32 (XXSPLTIB 255))>;
3141 def : Pat<(v2i64 immAllOnesV),
3142 (v2i64 (XXSPLTIB 255))>;
3143 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
3144 (v4i32 (XVCVSPSXWS (LXVWSX xoaddr:$A)))>;
3145 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
3146 (v4i32 (XVCVSPUXWS (LXVWSX xoaddr:$A)))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003147 def : Pat<(v4i32 (scalar_to_vector DblToIntLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003148 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003149 (XSCVDPSXWS (DFLOADf64 ixaddr:$A)), VSRC), 1))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003150 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003151 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003152 (XSCVDPUXWS (DFLOADf64 ixaddr:$A)), VSRC), 1))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003153 def : Pat<(v2i64 (scalar_to_vector FltToLongLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003154 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003155 (DFLOADf32 ixaddr:$A),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003156 VSFRC)), 0))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003157 def : Pat<(v2i64 (scalar_to_vector FltToULongLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003158 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003159 (DFLOADf32 ixaddr:$A),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003160 VSFRC)), 0))>;
3161 }
3162
3163 let Predicates = [IsISA3_0, HasDirectMove, IsBigEndian] in {
3164 def : Pat<(i64 (extractelt v2i64:$A, 1)),
3165 (i64 (MFVSRLD $A))>;
3166 // Better way to build integer vectors if we have MTVSRDD. Big endian.
3167 def : Pat<(v2i64 (build_vector i64:$rB, i64:$rA)),
3168 (v2i64 (MTVSRDD $rB, $rA))>;
3169 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
3170 (VMRGOW (COPY_TO_REGCLASS (MTVSRDD AnyExts.A, AnyExts.C), VSRC),
3171 (COPY_TO_REGCLASS (MTVSRDD AnyExts.B, AnyExts.D), VSRC))>;
3172 }
3173
3174 let Predicates = [IsISA3_0, HasDirectMove, IsLittleEndian] in {
3175 def : Pat<(i64 (extractelt v2i64:$A, 0)),
3176 (i64 (MFVSRLD $A))>;
3177 // Better way to build integer vectors if we have MTVSRDD. Little endian.
3178 def : Pat<(v2i64 (build_vector i64:$rA, i64:$rB)),
3179 (v2i64 (MTVSRDD $rB, $rA))>;
3180 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
3181 (VMRGOW (COPY_TO_REGCLASS (MTVSRDD AnyExts.D, AnyExts.B), VSRC),
3182 (COPY_TO_REGCLASS (MTVSRDD AnyExts.C, AnyExts.A), VSRC))>;
3183 }
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003184 // P9 Altivec instructions that can be used to build vectors.
3185 // Adding them to PPCInstrVSX.td rather than PPCAltivecVSX.td to compete
3186 // with complexities of existing build vector patterns in this file.
Tony Jiang9a91a182017-07-05 16:00:38 +00003187 let Predicates = [HasP9Altivec, IsLittleEndian] in {
3188 def : Pat<(v2i64 (build_vector WordToDWord.LE_A0, WordToDWord.LE_A1)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003189 (v2i64 (VEXTSW2D $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00003190 def : Pat<(v2i64 (build_vector HWordToDWord.LE_A0, HWordToDWord.LE_A1)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003191 (v2i64 (VEXTSH2D $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00003192 def : Pat<(v4i32 (build_vector HWordToWord.LE_A0, HWordToWord.LE_A1,
3193 HWordToWord.LE_A2, HWordToWord.LE_A3)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003194 (v4i32 (VEXTSH2W $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00003195 def : Pat<(v4i32 (build_vector ByteToWord.LE_A0, ByteToWord.LE_A1,
3196 ByteToWord.LE_A2, ByteToWord.LE_A3)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003197 (v4i32 (VEXTSB2W $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00003198 def : Pat<(v2i64 (build_vector ByteToDWord.LE_A0, ByteToDWord.LE_A1)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003199 (v2i64 (VEXTSB2D $A))>;
3200 }
Tony Jiang9a91a182017-07-05 16:00:38 +00003201
3202 let Predicates = [HasP9Altivec, IsBigEndian] in {
3203 def : Pat<(v2i64 (build_vector WordToDWord.BE_A0, WordToDWord.BE_A1)),
3204 (v2i64 (VEXTSW2D $A))>;
3205 def : Pat<(v2i64 (build_vector HWordToDWord.BE_A0, HWordToDWord.BE_A1)),
3206 (v2i64 (VEXTSH2D $A))>;
3207 def : Pat<(v4i32 (build_vector HWordToWord.BE_A0, HWordToWord.BE_A1,
3208 HWordToWord.BE_A2, HWordToWord.BE_A3)),
3209 (v4i32 (VEXTSH2W $A))>;
3210 def : Pat<(v4i32 (build_vector ByteToWord.BE_A0, ByteToWord.BE_A1,
3211 ByteToWord.BE_A2, ByteToWord.BE_A3)),
3212 (v4i32 (VEXTSB2W $A))>;
3213 def : Pat<(v2i64 (build_vector ByteToDWord.BE_A0, ByteToDWord.BE_A1)),
3214 (v2i64 (VEXTSB2D $A))>;
3215 }
3216
3217 let Predicates = [HasP9Altivec] in {
3218 def: Pat<(v2i64 (PPCSExtVElems v16i8:$A)),
3219 (v2i64 (VEXTSB2D $A))>;
3220 def: Pat<(v2i64 (PPCSExtVElems v8i16:$A)),
3221 (v2i64 (VEXTSH2D $A))>;
3222 def: Pat<(v2i64 (PPCSExtVElems v4i32:$A)),
3223 (v2i64 (VEXTSW2D $A))>;
3224 def: Pat<(v4i32 (PPCSExtVElems v16i8:$A)),
3225 (v4i32 (VEXTSB2W $A))>;
3226 def: Pat<(v4i32 (PPCSExtVElems v8i16:$A)),
3227 (v4i32 (VEXTSH2W $A))>;
3228 }
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00003229}