blob: f203c67a651d0616a993d18223040d46e3417b0d [file] [log] [blame]
Hal Finkel27774d92014-03-13 07:58:58 +00001//===- PPCInstrVSX.td - The PowerPC VSX Extension --*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file describes the VSX extension to the PowerPC instruction set.
11//
12//===----------------------------------------------------------------------===//
13
Bill Schmidtfe723b92015-04-27 19:57:34 +000014// *********************************** NOTE ***********************************
15// ** For POWER8 Little Endian, the VSX swap optimization relies on knowing **
16// ** which VMX and VSX instructions are lane-sensitive and which are not. **
17// ** A lane-sensitive instruction relies, implicitly or explicitly, on **
18// ** whether lanes are numbered from left to right. An instruction like **
19// ** VADDFP is not lane-sensitive, because each lane of the result vector **
20// ** relies only on the corresponding lane of the source vectors. However, **
21// ** an instruction like VMULESB is lane-sensitive, because "even" and **
22// ** "odd" lanes are different for big-endian and little-endian numbering. **
23// ** **
24// ** When adding new VMX and VSX instructions, please consider whether they **
25// ** are lane-sensitive. If so, they must be added to a switch statement **
26// ** in PPCVSXSwapRemoval::gatherVectorInstructions(). **
27// ****************************************************************************
28
Hal Finkel27774d92014-03-13 07:58:58 +000029def PPCRegVSRCAsmOperand : AsmOperandClass {
30 let Name = "RegVSRC"; let PredicateMethod = "isVSRegNumber";
31}
32def vsrc : RegisterOperand<VSRC> {
33 let ParserMatchClass = PPCRegVSRCAsmOperand;
34}
35
Hal Finkel19be5062014-03-29 05:29:01 +000036def PPCRegVSFRCAsmOperand : AsmOperandClass {
37 let Name = "RegVSFRC"; let PredicateMethod = "isVSRegNumber";
38}
39def vsfrc : RegisterOperand<VSFRC> {
40 let ParserMatchClass = PPCRegVSFRCAsmOperand;
41}
42
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +000043def PPCRegVSSRCAsmOperand : AsmOperandClass {
44 let Name = "RegVSSRC"; let PredicateMethod = "isVSRegNumber";
45}
46def vssrc : RegisterOperand<VSSRC> {
47 let ParserMatchClass = PPCRegVSSRCAsmOperand;
48}
49
Bill Schmidtfae5d712014-12-09 16:35:51 +000050// Little-endian-specific nodes.
51def SDT_PPClxvd2x : SDTypeProfile<1, 1, [
52 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
53]>;
54def SDT_PPCstxvd2x : SDTypeProfile<0, 2, [
55 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
56]>;
57def SDT_PPCxxswapd : SDTypeProfile<1, 1, [
58 SDTCisSameAs<0, 1>
59]>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000060def SDTVecConv : SDTypeProfile<1, 2, [
61 SDTCisVec<0>, SDTCisVec<1>, SDTCisPtrTy<2>
62]>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000063
64def PPClxvd2x : SDNode<"PPCISD::LXVD2X", SDT_PPClxvd2x,
65 [SDNPHasChain, SDNPMayLoad]>;
66def PPCstxvd2x : SDNode<"PPCISD::STXVD2X", SDT_PPCstxvd2x,
67 [SDNPHasChain, SDNPMayStore]>;
68def PPCxxswapd : SDNode<"PPCISD::XXSWAPD", SDT_PPCxxswapd, [SDNPHasChain]>;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +000069def PPCmfvsr : SDNode<"PPCISD::MFVSR", SDTUnaryOp, []>;
70def PPCmtvsra : SDNode<"PPCISD::MTVSRA", SDTUnaryOp, []>;
71def PPCmtvsrz : SDNode<"PPCISD::MTVSRZ", SDTUnaryOp, []>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000072def PPCsvec2fp : SDNode<"PPCISD::SINT_VEC_TO_FP", SDTVecConv, []>;
73def PPCuvec2fp: SDNode<"PPCISD::UINT_VEC_TO_FP", SDTVecConv, []>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +000074def PPCswapNoChain : SDNode<"PPCISD::SWAP_NO_CHAIN", SDT_PPCxxswapd>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000075
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000076multiclass XX3Form_Rcr<bits<6> opcode, bits<7> xo, string asmbase,
77 string asmstr, InstrItinClass itin, Intrinsic Int,
78 ValueType OutTy, ValueType InTy> {
Hal Finkel27774d92014-03-13 07:58:58 +000079 let BaseName = asmbase in {
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000080 def NAME : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000081 !strconcat(asmbase, !strconcat(" ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000082 [(set OutTy:$XT, (Int InTy:$XA, InTy:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +000083 let Defs = [CR6] in
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000084 def o : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000085 !strconcat(asmbase, !strconcat(". ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000086 [(set InTy:$XT,
87 (InTy (PPCvcmp_o InTy:$XA, InTy:$XB, xo)))]>,
88 isDOT;
Hal Finkel27774d92014-03-13 07:58:58 +000089 }
90}
91
Nemanja Ivanovic11049f82016-10-04 06:59:23 +000092// Instruction form with a single input register for instructions such as
93// XXPERMDI. The reason for defining this is that specifying multiple chained
94// operands (such as loads) to an instruction will perform both chained
95// operations rather than coalescing them into a single register - even though
96// the source memory location is the same. This simply forces the instruction
97// to use the same register for both inputs.
98// For example, an output DAG such as this:
99// (XXPERMDI (LXSIBZX xoaddr:$src), (LXSIBZX xoaddr:$src ), 0))
100// would result in two load instructions emitted and used as separate inputs
101// to the XXPERMDI instruction.
102class XX3Form_2s<bits<6> opcode, bits<5> xo, dag OOL, dag IOL, string asmstr,
103 InstrItinClass itin, list<dag> pattern>
104 : XX3Form_2<opcode, xo, OOL, IOL, asmstr, itin, pattern> {
105 let XB = XA;
106}
107
Eric Christopher1b8e7632014-05-22 01:07:24 +0000108def HasVSX : Predicate<"PPCSubTarget->hasVSX()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000109def IsLittleEndian : Predicate<"PPCSubTarget->isLittleEndian()">;
110def IsBigEndian : Predicate<"!PPCSubTarget->isLittleEndian()">;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000111def HasOnlySwappingMemOps : Predicate<"!PPCSubTarget->hasP9Vector()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000112
Hal Finkel27774d92014-03-13 07:58:58 +0000113let Predicates = [HasVSX] in {
114let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000115let UseVSXReg = 1 in {
Craig Topperc50d64b2014-11-26 00:46:26 +0000116let hasSideEffects = 0 in { // VSX instructions don't have side effects.
Hal Finkel27774d92014-03-13 07:58:58 +0000117let Uses = [RM] in {
118
119 // Load indexed instructions
Hal Finkel6a778fb2015-03-11 23:28:38 +0000120 let mayLoad = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000121 let CodeSize = 3 in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000122 def LXSDX : XX1Form<31, 588,
Hal Finkel19be5062014-03-29 05:29:01 +0000123 (outs vsfrc:$XT), (ins memrr:$src),
Hal Finkel27774d92014-03-13 07:58:58 +0000124 "lxsdx $XT, $src", IIC_LdStLFD,
125 [(set f64:$XT, (load xoaddr:$src))]>;
126
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000127 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000128 def LXVD2X : XX1Form<31, 844,
Hal Finkel27774d92014-03-13 07:58:58 +0000129 (outs vsrc:$XT), (ins memrr:$src),
130 "lxvd2x $XT, $src", IIC_LdStLFD,
Bill Schmidt72954782014-11-12 04:19:40 +0000131 [(set v2f64:$XT, (int_ppc_vsx_lxvd2x xoaddr:$src))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000132
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000133 def LXVDSX : XX1Form<31, 332,
Hal Finkel27774d92014-03-13 07:58:58 +0000134 (outs vsrc:$XT), (ins memrr:$src),
135 "lxvdsx $XT, $src", IIC_LdStLFD, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000136
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000137 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000138 def LXVW4X : XX1Form<31, 780,
Hal Finkel27774d92014-03-13 07:58:58 +0000139 (outs vsrc:$XT), (ins memrr:$src),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000140 "lxvw4x $XT, $src", IIC_LdStLFD,
Nemanja Ivanovicb8e30d62016-11-22 19:02:07 +0000141 []>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000142 } // mayLoad
Hal Finkel27774d92014-03-13 07:58:58 +0000143
144 // Store indexed instructions
145 let mayStore = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000146 let CodeSize = 3 in
Hal Finkel27774d92014-03-13 07:58:58 +0000147 def STXSDX : XX1Form<31, 716,
Hal Finkel19be5062014-03-29 05:29:01 +0000148 (outs), (ins vsfrc:$XT, memrr:$dst),
Hal Finkel27774d92014-03-13 07:58:58 +0000149 "stxsdx $XT, $dst", IIC_LdStSTFD,
150 [(store f64:$XT, xoaddr:$dst)]>;
151
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000152 let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000153 // The behaviour of this instruction is endianness-specific so we provide no
154 // pattern to match it without considering endianness.
Hal Finkel27774d92014-03-13 07:58:58 +0000155 def STXVD2X : XX1Form<31, 972,
156 (outs), (ins vsrc:$XT, memrr:$dst),
157 "stxvd2x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000158 []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000159
160 def STXVW4X : XX1Form<31, 908,
161 (outs), (ins vsrc:$XT, memrr:$dst),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000162 "stxvw4x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovicb8e30d62016-11-22 19:02:07 +0000163 []>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000164 }
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000165 } // mayStore
Hal Finkel27774d92014-03-13 07:58:58 +0000166
167 // Add/Mul Instructions
168 let isCommutable = 1 in {
169 def XSADDDP : XX3Form<60, 32,
Hal Finkel19be5062014-03-29 05:29:01 +0000170 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000171 "xsadddp $XT, $XA, $XB", IIC_VecFP,
172 [(set f64:$XT, (fadd f64:$XA, f64:$XB))]>;
173 def XSMULDP : XX3Form<60, 48,
Hal Finkel19be5062014-03-29 05:29:01 +0000174 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000175 "xsmuldp $XT, $XA, $XB", IIC_VecFP,
176 [(set f64:$XT, (fmul f64:$XA, f64:$XB))]>;
177
178 def XVADDDP : XX3Form<60, 96,
179 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
180 "xvadddp $XT, $XA, $XB", IIC_VecFP,
181 [(set v2f64:$XT, (fadd v2f64:$XA, v2f64:$XB))]>;
182
183 def XVADDSP : XX3Form<60, 64,
184 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
185 "xvaddsp $XT, $XA, $XB", IIC_VecFP,
186 [(set v4f32:$XT, (fadd v4f32:$XA, v4f32:$XB))]>;
187
188 def XVMULDP : XX3Form<60, 112,
189 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
190 "xvmuldp $XT, $XA, $XB", IIC_VecFP,
191 [(set v2f64:$XT, (fmul v2f64:$XA, v2f64:$XB))]>;
192
193 def XVMULSP : XX3Form<60, 80,
194 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
195 "xvmulsp $XT, $XA, $XB", IIC_VecFP,
196 [(set v4f32:$XT, (fmul v4f32:$XA, v4f32:$XB))]>;
197 }
198
199 // Subtract Instructions
200 def XSSUBDP : XX3Form<60, 40,
Hal Finkel19be5062014-03-29 05:29:01 +0000201 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000202 "xssubdp $XT, $XA, $XB", IIC_VecFP,
203 [(set f64:$XT, (fsub f64:$XA, f64:$XB))]>;
204
205 def XVSUBDP : XX3Form<60, 104,
206 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
207 "xvsubdp $XT, $XA, $XB", IIC_VecFP,
208 [(set v2f64:$XT, (fsub v2f64:$XA, v2f64:$XB))]>;
209 def XVSUBSP : XX3Form<60, 72,
210 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
211 "xvsubsp $XT, $XA, $XB", IIC_VecFP,
212 [(set v4f32:$XT, (fsub v4f32:$XA, v4f32:$XB))]>;
213
214 // FMA Instructions
Hal Finkel25e04542014-03-25 18:55:11 +0000215 let BaseName = "XSMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000216 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000217 def XSMADDADP : XX3Form<60, 33,
Hal Finkel19be5062014-03-29 05:29:01 +0000218 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000219 "xsmaddadp $XT, $XA, $XB", IIC_VecFP,
220 [(set f64:$XT, (fma f64:$XA, f64:$XB, f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000221 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
222 AltVSXFMARel;
223 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000224 def XSMADDMDP : XX3Form<60, 41,
Hal Finkel19be5062014-03-29 05:29:01 +0000225 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000226 "xsmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000227 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
228 AltVSXFMARel;
229 }
Hal Finkel27774d92014-03-13 07:58:58 +0000230
Hal Finkel25e04542014-03-25 18:55:11 +0000231 let BaseName = "XSMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000232 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000233 def XSMSUBADP : XX3Form<60, 49,
Hal Finkel19be5062014-03-29 05:29:01 +0000234 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000235 "xsmsubadp $XT, $XA, $XB", IIC_VecFP,
236 [(set f64:$XT, (fma f64:$XA, f64:$XB, (fneg f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000237 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
238 AltVSXFMARel;
239 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000240 def XSMSUBMDP : XX3Form<60, 57,
Hal Finkel19be5062014-03-29 05:29:01 +0000241 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000242 "xsmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000243 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
244 AltVSXFMARel;
245 }
Hal Finkel27774d92014-03-13 07:58:58 +0000246
Hal Finkel25e04542014-03-25 18:55:11 +0000247 let BaseName = "XSNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000248 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000249 def XSNMADDADP : XX3Form<60, 161,
Hal Finkel19be5062014-03-29 05:29:01 +0000250 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000251 "xsnmaddadp $XT, $XA, $XB", IIC_VecFP,
252 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000253 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
254 AltVSXFMARel;
255 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000256 def XSNMADDMDP : XX3Form<60, 169,
Hal Finkel19be5062014-03-29 05:29:01 +0000257 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000258 "xsnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000259 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
260 AltVSXFMARel;
261 }
Hal Finkel27774d92014-03-13 07:58:58 +0000262
Hal Finkel25e04542014-03-25 18:55:11 +0000263 let BaseName = "XSNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000264 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000265 def XSNMSUBADP : XX3Form<60, 177,
Hal Finkel19be5062014-03-29 05:29:01 +0000266 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000267 "xsnmsubadp $XT, $XA, $XB", IIC_VecFP,
268 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, (fneg f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000269 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
270 AltVSXFMARel;
271 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000272 def XSNMSUBMDP : XX3Form<60, 185,
Hal Finkel19be5062014-03-29 05:29:01 +0000273 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000274 "xsnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000275 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
276 AltVSXFMARel;
277 }
Hal Finkel27774d92014-03-13 07:58:58 +0000278
Hal Finkel25e04542014-03-25 18:55:11 +0000279 let BaseName = "XVMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000280 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000281 def XVMADDADP : XX3Form<60, 97,
282 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
283 "xvmaddadp $XT, $XA, $XB", IIC_VecFP,
284 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000285 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
286 AltVSXFMARel;
287 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000288 def XVMADDMDP : XX3Form<60, 105,
289 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
290 "xvmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000291 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
292 AltVSXFMARel;
293 }
Hal Finkel27774d92014-03-13 07:58:58 +0000294
Hal Finkel25e04542014-03-25 18:55:11 +0000295 let BaseName = "XVMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000296 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000297 def XVMADDASP : XX3Form<60, 65,
298 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
299 "xvmaddasp $XT, $XA, $XB", IIC_VecFP,
300 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000301 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
302 AltVSXFMARel;
303 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000304 def XVMADDMSP : XX3Form<60, 73,
305 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
306 "xvmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000307 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
308 AltVSXFMARel;
309 }
Hal Finkel27774d92014-03-13 07:58:58 +0000310
Hal Finkel25e04542014-03-25 18:55:11 +0000311 let BaseName = "XVMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000312 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000313 def XVMSUBADP : XX3Form<60, 113,
314 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
315 "xvmsubadp $XT, $XA, $XB", IIC_VecFP,
316 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000317 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
318 AltVSXFMARel;
319 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000320 def XVMSUBMDP : XX3Form<60, 121,
321 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
322 "xvmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000323 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
324 AltVSXFMARel;
325 }
Hal Finkel27774d92014-03-13 07:58:58 +0000326
Hal Finkel25e04542014-03-25 18:55:11 +0000327 let BaseName = "XVMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000328 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000329 def XVMSUBASP : XX3Form<60, 81,
330 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
331 "xvmsubasp $XT, $XA, $XB", IIC_VecFP,
332 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000333 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
334 AltVSXFMARel;
335 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000336 def XVMSUBMSP : XX3Form<60, 89,
337 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
338 "xvmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000339 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
340 AltVSXFMARel;
341 }
Hal Finkel27774d92014-03-13 07:58:58 +0000342
Hal Finkel25e04542014-03-25 18:55:11 +0000343 let BaseName = "XVNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000344 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000345 def XVNMADDADP : XX3Form<60, 225,
346 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
347 "xvnmaddadp $XT, $XA, $XB", IIC_VecFP,
348 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000349 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
350 AltVSXFMARel;
351 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000352 def XVNMADDMDP : XX3Form<60, 233,
353 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
354 "xvnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000355 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
356 AltVSXFMARel;
357 }
Hal Finkel27774d92014-03-13 07:58:58 +0000358
Hal Finkel25e04542014-03-25 18:55:11 +0000359 let BaseName = "XVNMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000360 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000361 def XVNMADDASP : XX3Form<60, 193,
362 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
363 "xvnmaddasp $XT, $XA, $XB", IIC_VecFP,
364 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000365 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
366 AltVSXFMARel;
367 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000368 def XVNMADDMSP : XX3Form<60, 201,
369 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
370 "xvnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000371 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
372 AltVSXFMARel;
373 }
Hal Finkel27774d92014-03-13 07:58:58 +0000374
Hal Finkel25e04542014-03-25 18:55:11 +0000375 let BaseName = "XVNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000376 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000377 def XVNMSUBADP : XX3Form<60, 241,
378 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
379 "xvnmsubadp $XT, $XA, $XB", IIC_VecFP,
380 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000381 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
382 AltVSXFMARel;
383 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000384 def XVNMSUBMDP : XX3Form<60, 249,
385 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
386 "xvnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000387 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
388 AltVSXFMARel;
389 }
Hal Finkel27774d92014-03-13 07:58:58 +0000390
Hal Finkel25e04542014-03-25 18:55:11 +0000391 let BaseName = "XVNMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000392 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000393 def XVNMSUBASP : XX3Form<60, 209,
394 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
395 "xvnmsubasp $XT, $XA, $XB", IIC_VecFP,
396 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000397 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
398 AltVSXFMARel;
399 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000400 def XVNMSUBMSP : XX3Form<60, 217,
401 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
402 "xvnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000403 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
404 AltVSXFMARel;
405 }
Hal Finkel27774d92014-03-13 07:58:58 +0000406
407 // Division Instructions
408 def XSDIVDP : XX3Form<60, 56,
Hal Finkel19be5062014-03-29 05:29:01 +0000409 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000410 "xsdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000411 [(set f64:$XT, (fdiv f64:$XA, f64:$XB))]>;
412 def XSSQRTDP : XX2Form<60, 75,
Hal Finkel19be5062014-03-29 05:29:01 +0000413 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000414 "xssqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000415 [(set f64:$XT, (fsqrt f64:$XB))]>;
416
417 def XSREDP : XX2Form<60, 90,
Hal Finkel19be5062014-03-29 05:29:01 +0000418 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000419 "xsredp $XT, $XB", IIC_VecFP,
420 [(set f64:$XT, (PPCfre f64:$XB))]>;
421 def XSRSQRTEDP : XX2Form<60, 74,
Hal Finkel19be5062014-03-29 05:29:01 +0000422 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000423 "xsrsqrtedp $XT, $XB", IIC_VecFP,
424 [(set f64:$XT, (PPCfrsqrte f64:$XB))]>;
425
426 def XSTDIVDP : XX3Form_1<60, 61,
Hal Finkel19be5062014-03-29 05:29:01 +0000427 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000428 "xstdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000429 def XSTSQRTDP : XX2Form_1<60, 106,
Hal Finkel19be5062014-03-29 05:29:01 +0000430 (outs crrc:$crD), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000431 "xstsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000432
433 def XVDIVDP : XX3Form<60, 120,
434 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000435 "xvdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000436 [(set v2f64:$XT, (fdiv v2f64:$XA, v2f64:$XB))]>;
437 def XVDIVSP : XX3Form<60, 88,
438 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000439 "xvdivsp $XT, $XA, $XB", IIC_FPDivS,
Hal Finkel27774d92014-03-13 07:58:58 +0000440 [(set v4f32:$XT, (fdiv v4f32:$XA, v4f32:$XB))]>;
441
442 def XVSQRTDP : XX2Form<60, 203,
443 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000444 "xvsqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000445 [(set v2f64:$XT, (fsqrt v2f64:$XB))]>;
446 def XVSQRTSP : XX2Form<60, 139,
447 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000448 "xvsqrtsp $XT, $XB", IIC_FPSqrtS,
Hal Finkel27774d92014-03-13 07:58:58 +0000449 [(set v4f32:$XT, (fsqrt v4f32:$XB))]>;
450
451 def XVTDIVDP : XX3Form_1<60, 125,
452 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000453 "xvtdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000454 def XVTDIVSP : XX3Form_1<60, 93,
455 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000456 "xvtdivsp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000457
458 def XVTSQRTDP : XX2Form_1<60, 234,
459 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000460 "xvtsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000461 def XVTSQRTSP : XX2Form_1<60, 170,
462 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000463 "xvtsqrtsp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000464
465 def XVREDP : XX2Form<60, 218,
466 (outs vsrc:$XT), (ins vsrc:$XB),
467 "xvredp $XT, $XB", IIC_VecFP,
468 [(set v2f64:$XT, (PPCfre v2f64:$XB))]>;
469 def XVRESP : XX2Form<60, 154,
470 (outs vsrc:$XT), (ins vsrc:$XB),
471 "xvresp $XT, $XB", IIC_VecFP,
472 [(set v4f32:$XT, (PPCfre v4f32:$XB))]>;
473
474 def XVRSQRTEDP : XX2Form<60, 202,
475 (outs vsrc:$XT), (ins vsrc:$XB),
476 "xvrsqrtedp $XT, $XB", IIC_VecFP,
477 [(set v2f64:$XT, (PPCfrsqrte v2f64:$XB))]>;
478 def XVRSQRTESP : XX2Form<60, 138,
479 (outs vsrc:$XT), (ins vsrc:$XB),
480 "xvrsqrtesp $XT, $XB", IIC_VecFP,
481 [(set v4f32:$XT, (PPCfrsqrte v4f32:$XB))]>;
482
483 // Compare Instructions
484 def XSCMPODP : XX3Form_1<60, 43,
Hal Finkel19be5062014-03-29 05:29:01 +0000485 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000486 "xscmpodp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000487 def XSCMPUDP : XX3Form_1<60, 35,
Hal Finkel19be5062014-03-29 05:29:01 +0000488 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000489 "xscmpudp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000490
491 defm XVCMPEQDP : XX3Form_Rcr<60, 99,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000492 "xvcmpeqdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000493 int_ppc_vsx_xvcmpeqdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000494 defm XVCMPEQSP : XX3Form_Rcr<60, 67,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000495 "xvcmpeqsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000496 int_ppc_vsx_xvcmpeqsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000497 defm XVCMPGEDP : XX3Form_Rcr<60, 115,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000498 "xvcmpgedp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000499 int_ppc_vsx_xvcmpgedp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000500 defm XVCMPGESP : XX3Form_Rcr<60, 83,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000501 "xvcmpgesp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000502 int_ppc_vsx_xvcmpgesp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000503 defm XVCMPGTDP : XX3Form_Rcr<60, 107,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000504 "xvcmpgtdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000505 int_ppc_vsx_xvcmpgtdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000506 defm XVCMPGTSP : XX3Form_Rcr<60, 75,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000507 "xvcmpgtsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000508 int_ppc_vsx_xvcmpgtsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000509
510 // Move Instructions
511 def XSABSDP : XX2Form<60, 345,
Hal Finkel19be5062014-03-29 05:29:01 +0000512 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000513 "xsabsdp $XT, $XB", IIC_VecFP,
514 [(set f64:$XT, (fabs f64:$XB))]>;
515 def XSNABSDP : XX2Form<60, 361,
Hal Finkel19be5062014-03-29 05:29:01 +0000516 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000517 "xsnabsdp $XT, $XB", IIC_VecFP,
518 [(set f64:$XT, (fneg (fabs f64:$XB)))]>;
519 def XSNEGDP : XX2Form<60, 377,
Hal Finkel19be5062014-03-29 05:29:01 +0000520 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000521 "xsnegdp $XT, $XB", IIC_VecFP,
522 [(set f64:$XT, (fneg f64:$XB))]>;
523 def XSCPSGNDP : XX3Form<60, 176,
Hal Finkel19be5062014-03-29 05:29:01 +0000524 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000525 "xscpsgndp $XT, $XA, $XB", IIC_VecFP,
526 [(set f64:$XT, (fcopysign f64:$XB, f64:$XA))]>;
527
528 def XVABSDP : XX2Form<60, 473,
529 (outs vsrc:$XT), (ins vsrc:$XB),
530 "xvabsdp $XT, $XB", IIC_VecFP,
531 [(set v2f64:$XT, (fabs v2f64:$XB))]>;
532
533 def XVABSSP : XX2Form<60, 409,
534 (outs vsrc:$XT), (ins vsrc:$XB),
535 "xvabssp $XT, $XB", IIC_VecFP,
536 [(set v4f32:$XT, (fabs v4f32:$XB))]>;
537
538 def XVCPSGNDP : XX3Form<60, 240,
539 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
540 "xvcpsgndp $XT, $XA, $XB", IIC_VecFP,
541 [(set v2f64:$XT, (fcopysign v2f64:$XB, v2f64:$XA))]>;
542 def XVCPSGNSP : XX3Form<60, 208,
543 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
544 "xvcpsgnsp $XT, $XA, $XB", IIC_VecFP,
545 [(set v4f32:$XT, (fcopysign v4f32:$XB, v4f32:$XA))]>;
546
547 def XVNABSDP : XX2Form<60, 489,
548 (outs vsrc:$XT), (ins vsrc:$XB),
549 "xvnabsdp $XT, $XB", IIC_VecFP,
550 [(set v2f64:$XT, (fneg (fabs v2f64:$XB)))]>;
551 def XVNABSSP : XX2Form<60, 425,
552 (outs vsrc:$XT), (ins vsrc:$XB),
553 "xvnabssp $XT, $XB", IIC_VecFP,
554 [(set v4f32:$XT, (fneg (fabs v4f32:$XB)))]>;
555
556 def XVNEGDP : XX2Form<60, 505,
557 (outs vsrc:$XT), (ins vsrc:$XB),
558 "xvnegdp $XT, $XB", IIC_VecFP,
559 [(set v2f64:$XT, (fneg v2f64:$XB))]>;
560 def XVNEGSP : XX2Form<60, 441,
561 (outs vsrc:$XT), (ins vsrc:$XB),
562 "xvnegsp $XT, $XB", IIC_VecFP,
563 [(set v4f32:$XT, (fneg v4f32:$XB))]>;
564
565 // Conversion Instructions
566 def XSCVDPSP : XX2Form<60, 265,
Hal Finkel19be5062014-03-29 05:29:01 +0000567 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000568 "xscvdpsp $XT, $XB", IIC_VecFP, []>;
569 def XSCVDPSXDS : XX2Form<60, 344,
Hal Finkel19be5062014-03-29 05:29:01 +0000570 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000571 "xscvdpsxds $XT, $XB", IIC_VecFP,
572 [(set f64:$XT, (PPCfctidz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000573 let isCodeGenOnly = 1 in
574 def XSCVDPSXDSs : XX2Form<60, 344,
575 (outs vssrc:$XT), (ins vssrc:$XB),
576 "xscvdpsxds $XT, $XB", IIC_VecFP,
577 [(set f32:$XT, (PPCfctidz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000578 def XSCVDPSXWS : XX2Form<60, 88,
Hal Finkel19be5062014-03-29 05:29:01 +0000579 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000580 "xscvdpsxws $XT, $XB", IIC_VecFP,
581 [(set f64:$XT, (PPCfctiwz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000582 let isCodeGenOnly = 1 in
583 def XSCVDPSXWSs : XX2Form<60, 88,
584 (outs vssrc:$XT), (ins vssrc:$XB),
585 "xscvdpsxws $XT, $XB", IIC_VecFP,
586 [(set f32:$XT, (PPCfctiwz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000587 def XSCVDPUXDS : XX2Form<60, 328,
Hal Finkel19be5062014-03-29 05:29:01 +0000588 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000589 "xscvdpuxds $XT, $XB", IIC_VecFP,
590 [(set f64:$XT, (PPCfctiduz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000591 let isCodeGenOnly = 1 in
592 def XSCVDPUXDSs : XX2Form<60, 328,
593 (outs vssrc:$XT), (ins vssrc:$XB),
594 "xscvdpuxds $XT, $XB", IIC_VecFP,
595 [(set f32:$XT, (PPCfctiduz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000596 def XSCVDPUXWS : XX2Form<60, 72,
Hal Finkel19be5062014-03-29 05:29:01 +0000597 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000598 "xscvdpuxws $XT, $XB", IIC_VecFP,
599 [(set f64:$XT, (PPCfctiwuz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000600 let isCodeGenOnly = 1 in
601 def XSCVDPUXWSs : XX2Form<60, 72,
602 (outs vssrc:$XT), (ins vssrc:$XB),
603 "xscvdpuxws $XT, $XB", IIC_VecFP,
604 [(set f32:$XT, (PPCfctiwuz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000605 def XSCVSPDP : XX2Form<60, 329,
Hal Finkel19be5062014-03-29 05:29:01 +0000606 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000607 "xscvspdp $XT, $XB", IIC_VecFP, []>;
608 def XSCVSXDDP : XX2Form<60, 376,
Hal Finkel19be5062014-03-29 05:29:01 +0000609 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000610 "xscvsxddp $XT, $XB", IIC_VecFP,
611 [(set f64:$XT, (PPCfcfid f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000612 def XSCVUXDDP : XX2Form<60, 360,
Hal Finkel19be5062014-03-29 05:29:01 +0000613 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000614 "xscvuxddp $XT, $XB", IIC_VecFP,
615 [(set f64:$XT, (PPCfcfidu f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000616
617 def XVCVDPSP : XX2Form<60, 393,
618 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000619 "xvcvdpsp $XT, $XB", IIC_VecFP,
620 [(set v4f32:$XT, (int_ppc_vsx_xvcvdpsp v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000621 def XVCVDPSXDS : XX2Form<60, 472,
622 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000623 "xvcvdpsxds $XT, $XB", IIC_VecFP,
624 [(set v2i64:$XT, (fp_to_sint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000625 def XVCVDPSXWS : XX2Form<60, 216,
626 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000627 "xvcvdpsxws $XT, $XB", IIC_VecFP,
628 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpsxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000629 def XVCVDPUXDS : XX2Form<60, 456,
630 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000631 "xvcvdpuxds $XT, $XB", IIC_VecFP,
632 [(set v2i64:$XT, (fp_to_uint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000633 def XVCVDPUXWS : XX2Form<60, 200,
634 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000635 "xvcvdpuxws $XT, $XB", IIC_VecFP,
636 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpuxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000637
638 def XVCVSPDP : XX2Form<60, 457,
639 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000640 "xvcvspdp $XT, $XB", IIC_VecFP,
641 [(set v2f64:$XT, (int_ppc_vsx_xvcvspdp v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000642 def XVCVSPSXDS : XX2Form<60, 408,
643 (outs vsrc:$XT), (ins vsrc:$XB),
644 "xvcvspsxds $XT, $XB", IIC_VecFP, []>;
645 def XVCVSPSXWS : XX2Form<60, 152,
646 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000647 "xvcvspsxws $XT, $XB", IIC_VecFP,
648 [(set v4i32:$XT, (fp_to_sint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000649 def XVCVSPUXDS : XX2Form<60, 392,
650 (outs vsrc:$XT), (ins vsrc:$XB),
651 "xvcvspuxds $XT, $XB", IIC_VecFP, []>;
652 def XVCVSPUXWS : XX2Form<60, 136,
653 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000654 "xvcvspuxws $XT, $XB", IIC_VecFP,
655 [(set v4i32:$XT, (fp_to_uint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000656 def XVCVSXDDP : XX2Form<60, 504,
657 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000658 "xvcvsxddp $XT, $XB", IIC_VecFP,
659 [(set v2f64:$XT, (sint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000660 def XVCVSXDSP : XX2Form<60, 440,
661 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000662 "xvcvsxdsp $XT, $XB", IIC_VecFP,
663 [(set v4f32:$XT, (int_ppc_vsx_xvcvsxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000664 def XVCVSXWDP : XX2Form<60, 248,
665 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000666 "xvcvsxwdp $XT, $XB", IIC_VecFP,
667 [(set v2f64:$XT, (int_ppc_vsx_xvcvsxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000668 def XVCVSXWSP : XX2Form<60, 184,
669 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic44513e52016-07-05 09:22:29 +0000670 "xvcvsxwsp $XT, $XB", IIC_VecFP,
671 [(set v4f32:$XT, (sint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000672 def XVCVUXDDP : XX2Form<60, 488,
673 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000674 "xvcvuxddp $XT, $XB", IIC_VecFP,
675 [(set v2f64:$XT, (uint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000676 def XVCVUXDSP : XX2Form<60, 424,
677 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000678 "xvcvuxdsp $XT, $XB", IIC_VecFP,
679 [(set v4f32:$XT, (int_ppc_vsx_xvcvuxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000680 def XVCVUXWDP : XX2Form<60, 232,
681 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000682 "xvcvuxwdp $XT, $XB", IIC_VecFP,
683 [(set v2f64:$XT, (int_ppc_vsx_xvcvuxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000684 def XVCVUXWSP : XX2Form<60, 168,
685 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000686 "xvcvuxwsp $XT, $XB", IIC_VecFP,
687 [(set v4f32:$XT, (uint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000688
689 // Rounding Instructions
690 def XSRDPI : XX2Form<60, 73,
Hal Finkel19be5062014-03-29 05:29:01 +0000691 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000692 "xsrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000693 [(set f64:$XT, (fround f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000694 def XSRDPIC : XX2Form<60, 107,
Hal Finkel19be5062014-03-29 05:29:01 +0000695 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000696 "xsrdpic $XT, $XB", IIC_VecFP,
697 [(set f64:$XT, (fnearbyint f64:$XB))]>;
698 def XSRDPIM : XX2Form<60, 121,
Hal Finkel19be5062014-03-29 05:29:01 +0000699 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000700 "xsrdpim $XT, $XB", IIC_VecFP,
701 [(set f64:$XT, (ffloor f64:$XB))]>;
702 def XSRDPIP : XX2Form<60, 105,
Hal Finkel19be5062014-03-29 05:29:01 +0000703 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000704 "xsrdpip $XT, $XB", IIC_VecFP,
705 [(set f64:$XT, (fceil f64:$XB))]>;
706 def XSRDPIZ : XX2Form<60, 89,
Hal Finkel19be5062014-03-29 05:29:01 +0000707 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000708 "xsrdpiz $XT, $XB", IIC_VecFP,
709 [(set f64:$XT, (ftrunc f64:$XB))]>;
710
711 def XVRDPI : XX2Form<60, 201,
712 (outs vsrc:$XT), (ins vsrc:$XB),
713 "xvrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000714 [(set v2f64:$XT, (fround v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000715 def XVRDPIC : XX2Form<60, 235,
716 (outs vsrc:$XT), (ins vsrc:$XB),
717 "xvrdpic $XT, $XB", IIC_VecFP,
718 [(set v2f64:$XT, (fnearbyint v2f64:$XB))]>;
719 def XVRDPIM : XX2Form<60, 249,
720 (outs vsrc:$XT), (ins vsrc:$XB),
721 "xvrdpim $XT, $XB", IIC_VecFP,
722 [(set v2f64:$XT, (ffloor v2f64:$XB))]>;
723 def XVRDPIP : XX2Form<60, 233,
724 (outs vsrc:$XT), (ins vsrc:$XB),
725 "xvrdpip $XT, $XB", IIC_VecFP,
726 [(set v2f64:$XT, (fceil v2f64:$XB))]>;
727 def XVRDPIZ : XX2Form<60, 217,
728 (outs vsrc:$XT), (ins vsrc:$XB),
729 "xvrdpiz $XT, $XB", IIC_VecFP,
730 [(set v2f64:$XT, (ftrunc v2f64:$XB))]>;
731
732 def XVRSPI : XX2Form<60, 137,
733 (outs vsrc:$XT), (ins vsrc:$XB),
734 "xvrspi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000735 [(set v4f32:$XT, (fround v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000736 def XVRSPIC : XX2Form<60, 171,
737 (outs vsrc:$XT), (ins vsrc:$XB),
738 "xvrspic $XT, $XB", IIC_VecFP,
739 [(set v4f32:$XT, (fnearbyint v4f32:$XB))]>;
740 def XVRSPIM : XX2Form<60, 185,
741 (outs vsrc:$XT), (ins vsrc:$XB),
742 "xvrspim $XT, $XB", IIC_VecFP,
743 [(set v4f32:$XT, (ffloor v4f32:$XB))]>;
744 def XVRSPIP : XX2Form<60, 169,
745 (outs vsrc:$XT), (ins vsrc:$XB),
746 "xvrspip $XT, $XB", IIC_VecFP,
747 [(set v4f32:$XT, (fceil v4f32:$XB))]>;
748 def XVRSPIZ : XX2Form<60, 153,
749 (outs vsrc:$XT), (ins vsrc:$XB),
750 "xvrspiz $XT, $XB", IIC_VecFP,
751 [(set v4f32:$XT, (ftrunc v4f32:$XB))]>;
752
753 // Max/Min Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000754 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000755 def XSMAXDP : XX3Form<60, 160,
Hal Finkel19be5062014-03-29 05:29:01 +0000756 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000757 "xsmaxdp $XT, $XA, $XB", IIC_VecFP,
758 [(set vsfrc:$XT,
759 (int_ppc_vsx_xsmaxdp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000760 def XSMINDP : XX3Form<60, 168,
Hal Finkel19be5062014-03-29 05:29:01 +0000761 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000762 "xsmindp $XT, $XA, $XB", IIC_VecFP,
763 [(set vsfrc:$XT,
764 (int_ppc_vsx_xsmindp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000765
766 def XVMAXDP : XX3Form<60, 224,
767 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000768 "xvmaxdp $XT, $XA, $XB", IIC_VecFP,
769 [(set vsrc:$XT,
770 (int_ppc_vsx_xvmaxdp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000771 def XVMINDP : XX3Form<60, 232,
772 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000773 "xvmindp $XT, $XA, $XB", IIC_VecFP,
774 [(set vsrc:$XT,
775 (int_ppc_vsx_xvmindp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000776
777 def XVMAXSP : XX3Form<60, 192,
778 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000779 "xvmaxsp $XT, $XA, $XB", IIC_VecFP,
780 [(set vsrc:$XT,
781 (int_ppc_vsx_xvmaxsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000782 def XVMINSP : XX3Form<60, 200,
783 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000784 "xvminsp $XT, $XA, $XB", IIC_VecFP,
785 [(set vsrc:$XT,
786 (int_ppc_vsx_xvminsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000787 } // isCommutable
Hal Finkel27774d92014-03-13 07:58:58 +0000788} // Uses = [RM]
789
790 // Logical Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000791 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000792 def XXLAND : XX3Form<60, 130,
793 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000794 "xxland $XT, $XA, $XB", IIC_VecGeneral,
795 [(set v4i32:$XT, (and v4i32:$XA, v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000796 def XXLANDC : XX3Form<60, 138,
797 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000798 "xxlandc $XT, $XA, $XB", IIC_VecGeneral,
799 [(set v4i32:$XT, (and v4i32:$XA,
800 (vnot_ppc v4i32:$XB)))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000801 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000802 def XXLNOR : XX3Form<60, 162,
803 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000804 "xxlnor $XT, $XA, $XB", IIC_VecGeneral,
805 [(set v4i32:$XT, (vnot_ppc (or v4i32:$XA,
806 v4i32:$XB)))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000807 def XXLOR : XX3Form<60, 146,
808 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000809 "xxlor $XT, $XA, $XB", IIC_VecGeneral,
810 [(set v4i32:$XT, (or v4i32:$XA, v4i32:$XB))]>;
Hal Finkel19be5062014-03-29 05:29:01 +0000811 let isCodeGenOnly = 1 in
812 def XXLORf: XX3Form<60, 146,
813 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
814 "xxlor $XT, $XA, $XB", IIC_VecGeneral, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000815 def XXLXOR : XX3Form<60, 154,
816 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000817 "xxlxor $XT, $XA, $XB", IIC_VecGeneral,
818 [(set v4i32:$XT, (xor v4i32:$XA, v4i32:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000819 } // isCommutable
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +0000820 let isCodeGenOnly = 1 in
821 def XXLXORz : XX3Form_Zero<60, 154, (outs vsrc:$XT), (ins),
822 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
823 [(set v4i32:$XT, (v4i32 immAllZerosV))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000824
Ehsan Amiric90b02c2016-10-24 17:31:09 +0000825 let isCodeGenOnly = 1 in {
826 def XXLXORdpz : XX3Form_SetZero<60, 154,
827 (outs vsfrc:$XT), (ins),
828 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
829 [(set f64:$XT, (fpimm0))]>;
830 def XXLXORspz : XX3Form_SetZero<60, 154,
831 (outs vssrc:$XT), (ins),
832 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
833 [(set f32:$XT, (fpimm0))]>;
834 }
835
Hal Finkel27774d92014-03-13 07:58:58 +0000836 // Permutation Instructions
837 def XXMRGHW : XX3Form<60, 18,
838 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
839 "xxmrghw $XT, $XA, $XB", IIC_VecPerm, []>;
840 def XXMRGLW : XX3Form<60, 50,
841 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
842 "xxmrglw $XT, $XA, $XB", IIC_VecPerm, []>;
843
844 def XXPERMDI : XX3Form_2<60, 10,
845 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$DM),
846 "xxpermdi $XT, $XA, $XB, $DM", IIC_VecPerm, []>;
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +0000847 let isCodeGenOnly = 1 in {
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000848 def XXPERMDIs : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vfrc:$XA, u2imm:$DM),
849 "xxpermdi $XT, $XA, $XA, $DM", IIC_VecPerm, []>;
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +0000850 let D = 0 in
851 def XXSPLTD0s : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vfrc:$XA),
852 "xxspltd $XT, $XA, 0", IIC_VecPerm, []>;
853 let D = 1 in
854 def XXSPLTD1s : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vfrc:$XA),
855 "xxspltd $XT, $XA, 1", IIC_VecPerm, []>;
856 let D = 2 in
857 def XXSWAPDs : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vfrc:$XA),
858 "xxswapd $XT, $XA", IIC_VecPerm, []>;
859 }
Hal Finkel27774d92014-03-13 07:58:58 +0000860 def XXSEL : XX4Form<60, 3,
861 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, vsrc:$XC),
862 "xxsel $XT, $XA, $XB, $XC", IIC_VecPerm, []>;
863
864 def XXSLDWI : XX3Form_2<60, 2,
865 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$SHW),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +0000866 "xxsldwi $XT, $XA, $XB, $SHW", IIC_VecPerm,
867 [(set v4i32:$XT, (PPCvecshl v4i32:$XA, v4i32:$XB,
868 imm32SExt16:$SHW))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000869 def XXSPLTW : XX2Form_2<60, 164,
870 (outs vsrc:$XT), (ins vsrc:$XB, u2imm:$UIM),
Nemanja Ivanovic1a2b2f02016-05-04 16:04:02 +0000871 "xxspltw $XT, $XB, $UIM", IIC_VecPerm,
872 [(set v4i32:$XT,
873 (PPCxxsplt v4i32:$XB, imm32SExt16:$UIM))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000874 let isCodeGenOnly = 1 in
875 def XXSPLTWs : XX2Form_2<60, 164,
876 (outs vsrc:$XT), (ins vfrc:$XB, u2imm:$UIM),
877 "xxspltw $XT, $XB, $UIM", IIC_VecPerm, []>;
Craig Topperc50d64b2014-11-26 00:46:26 +0000878} // hasSideEffects
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000879} // UseVSXReg = 1
Hal Finkel27774d92014-03-13 07:58:58 +0000880
Bill Schmidt61e65232014-10-22 13:13:40 +0000881// SELECT_CC_* - Used to implement the SELECT_CC DAG operation. Expanded after
882// instruction selection into a branch sequence.
883let usesCustomInserter = 1, // Expanded after instruction selection.
884 PPC970_Single = 1 in {
885
886 def SELECT_CC_VSRC: Pseudo<(outs vsrc:$dst),
887 (ins crrc:$cond, vsrc:$T, vsrc:$F, i32imm:$BROPC),
888 "#SELECT_CC_VSRC",
889 []>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000890 def SELECT_VSRC: Pseudo<(outs vsrc:$dst),
891 (ins crbitrc:$cond, vsrc:$T, vsrc:$F),
892 "#SELECT_VSRC",
Bill Schmidt61e65232014-10-22 13:13:40 +0000893 [(set v2f64:$dst,
894 (select i1:$cond, v2f64:$T, v2f64:$F))]>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000895 def SELECT_CC_VSFRC: Pseudo<(outs f8rc:$dst),
896 (ins crrc:$cond, f8rc:$T, f8rc:$F,
897 i32imm:$BROPC), "#SELECT_CC_VSFRC",
898 []>;
899 def SELECT_VSFRC: Pseudo<(outs f8rc:$dst),
900 (ins crbitrc:$cond, f8rc:$T, f8rc:$F),
901 "#SELECT_VSFRC",
902 [(set f64:$dst,
903 (select i1:$cond, f64:$T, f64:$F))]>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000904 def SELECT_CC_VSSRC: Pseudo<(outs f4rc:$dst),
905 (ins crrc:$cond, f4rc:$T, f4rc:$F,
906 i32imm:$BROPC), "#SELECT_CC_VSSRC",
907 []>;
908 def SELECT_VSSRC: Pseudo<(outs f4rc:$dst),
909 (ins crbitrc:$cond, f4rc:$T, f4rc:$F),
910 "#SELECT_VSSRC",
911 [(set f32:$dst,
912 (select i1:$cond, f32:$T, f32:$F))]>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000913} // usesCustomInserter
914} // AddedComplexity
Bill Schmidt61e65232014-10-22 13:13:40 +0000915
Hal Finkel27774d92014-03-13 07:58:58 +0000916def : InstAlias<"xvmovdp $XT, $XB",
917 (XVCPSGNDP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
918def : InstAlias<"xvmovsp $XT, $XB",
919 (XVCPSGNSP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
920
921def : InstAlias<"xxspltd $XT, $XB, 0",
922 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 0)>;
923def : InstAlias<"xxspltd $XT, $XB, 1",
924 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 3)>;
925def : InstAlias<"xxmrghd $XT, $XA, $XB",
926 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 0)>;
927def : InstAlias<"xxmrgld $XT, $XA, $XB",
928 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 3)>;
929def : InstAlias<"xxswapd $XT, $XB",
930 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 2)>;
931
932let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000933
Nemanja Ivanovic6f22b412016-09-27 08:42:12 +0000934def : Pat<(v4i32 (vnot_ppc v4i32:$A)),
935 (v4i32 (XXLNOR $A, $A))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000936let Predicates = [IsBigEndian] in {
Hal Finkel27774d92014-03-13 07:58:58 +0000937def : Pat<(v2f64 (scalar_to_vector f64:$A)),
Hal Finkel19be5062014-03-29 05:29:01 +0000938 (v2f64 (SUBREG_TO_REG (i64 1), $A, sub_64))>;
Hal Finkel27774d92014-03-13 07:58:58 +0000939
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000940def : Pat<(f64 (extractelt v2f64:$S, 0)),
Hal Finkel19be5062014-03-29 05:29:01 +0000941 (f64 (EXTRACT_SUBREG $S, sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000942def : Pat<(f64 (extractelt v2f64:$S, 1)),
Hal Finkel19be5062014-03-29 05:29:01 +0000943 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000944}
945
946let Predicates = [IsLittleEndian] in {
947def : Pat<(v2f64 (scalar_to_vector f64:$A)),
948 (v2f64 (XXPERMDI (SUBREG_TO_REG (i64 1), $A, sub_64),
949 (SUBREG_TO_REG (i64 1), $A, sub_64), 0))>;
950
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000951def : Pat<(f64 (extractelt v2f64:$S, 0)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000952 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000953def : Pat<(f64 (extractelt v2f64:$S, 1)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000954 (f64 (EXTRACT_SUBREG $S, sub_64))>;
955}
Hal Finkel27774d92014-03-13 07:58:58 +0000956
957// Additional fnmsub patterns: -a*c + b == -(a*c - b)
958def : Pat<(fma (fneg f64:$A), f64:$C, f64:$B),
959 (XSNMSUBADP $B, $C, $A)>;
960def : Pat<(fma f64:$A, (fneg f64:$C), f64:$B),
961 (XSNMSUBADP $B, $C, $A)>;
962
963def : Pat<(fma (fneg v2f64:$A), v2f64:$C, v2f64:$B),
964 (XVNMSUBADP $B, $C, $A)>;
965def : Pat<(fma v2f64:$A, (fneg v2f64:$C), v2f64:$B),
966 (XVNMSUBADP $B, $C, $A)>;
967
968def : Pat<(fma (fneg v4f32:$A), v4f32:$C, v4f32:$B),
969 (XVNMSUBASP $B, $C, $A)>;
970def : Pat<(fma v4f32:$A, (fneg v4f32:$C), v4f32:$B),
971 (XVNMSUBASP $B, $C, $A)>;
972
Hal Finkel9e0baa62014-04-01 19:24:27 +0000973def : Pat<(v2f64 (bitconvert v4f32:$A)),
974 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000975def : Pat<(v2f64 (bitconvert v4i32:$A)),
976 (COPY_TO_REGCLASS $A, VSRC)>;
977def : Pat<(v2f64 (bitconvert v8i16:$A)),
978 (COPY_TO_REGCLASS $A, VSRC)>;
979def : Pat<(v2f64 (bitconvert v16i8:$A)),
980 (COPY_TO_REGCLASS $A, VSRC)>;
981
Hal Finkel9e0baa62014-04-01 19:24:27 +0000982def : Pat<(v4f32 (bitconvert v2f64:$A)),
983 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000984def : Pat<(v4i32 (bitconvert v2f64:$A)),
985 (COPY_TO_REGCLASS $A, VRRC)>;
986def : Pat<(v8i16 (bitconvert v2f64:$A)),
987 (COPY_TO_REGCLASS $A, VRRC)>;
988def : Pat<(v16i8 (bitconvert v2f64:$A)),
989 (COPY_TO_REGCLASS $A, VRRC)>;
990
Hal Finkel9e0baa62014-04-01 19:24:27 +0000991def : Pat<(v2i64 (bitconvert v4f32:$A)),
992 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +0000993def : Pat<(v2i64 (bitconvert v4i32:$A)),
994 (COPY_TO_REGCLASS $A, VSRC)>;
995def : Pat<(v2i64 (bitconvert v8i16:$A)),
996 (COPY_TO_REGCLASS $A, VSRC)>;
997def : Pat<(v2i64 (bitconvert v16i8:$A)),
998 (COPY_TO_REGCLASS $A, VSRC)>;
999
Hal Finkel9e0baa62014-04-01 19:24:27 +00001000def : Pat<(v4f32 (bitconvert v2i64:$A)),
1001 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +00001002def : Pat<(v4i32 (bitconvert v2i64:$A)),
1003 (COPY_TO_REGCLASS $A, VRRC)>;
1004def : Pat<(v8i16 (bitconvert v2i64:$A)),
1005 (COPY_TO_REGCLASS $A, VRRC)>;
1006def : Pat<(v16i8 (bitconvert v2i64:$A)),
1007 (COPY_TO_REGCLASS $A, VRRC)>;
1008
Hal Finkel9281c9a2014-03-26 18:26:30 +00001009def : Pat<(v2f64 (bitconvert v2i64:$A)),
1010 (COPY_TO_REGCLASS $A, VRRC)>;
1011def : Pat<(v2i64 (bitconvert v2f64:$A)),
1012 (COPY_TO_REGCLASS $A, VRRC)>;
1013
Kit Bartond4eb73c2015-05-05 16:10:44 +00001014def : Pat<(v2f64 (bitconvert v1i128:$A)),
1015 (COPY_TO_REGCLASS $A, VRRC)>;
1016def : Pat<(v1i128 (bitconvert v2f64:$A)),
1017 (COPY_TO_REGCLASS $A, VRRC)>;
1018
Hal Finkel5c0d1452014-03-30 13:22:59 +00001019// sign extension patterns
1020// To extend "in place" from v2i32 to v2i64, we have input data like:
1021// | undef | i32 | undef | i32 |
1022// but xvcvsxwdp expects the input in big-Endian format:
1023// | i32 | undef | i32 | undef |
1024// so we need to shift everything to the left by one i32 (word) before
1025// the conversion.
1026def : Pat<(sext_inreg v2i64:$C, v2i32),
1027 (XVCVDPSXDS (XVCVSXWDP (XXSLDWI $C, $C, 1)))>;
1028def : Pat<(v2f64 (sint_to_fp (sext_inreg v2i64:$C, v2i32))),
1029 (XVCVSXWDP (XXSLDWI $C, $C, 1))>;
1030
Nemanja Ivanovic44513e52016-07-05 09:22:29 +00001031def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 0)),
1032 (v2f64 (XVCVSXWDP (v2i64 (XXMRGHW $C, $C))))>;
1033def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 1)),
1034 (v2f64 (XVCVSXWDP (v2i64 (XXMRGLW $C, $C))))>;
1035
1036def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 0)),
1037 (v2f64 (XVCVUXWDP (v2i64 (XXMRGHW $C, $C))))>;
1038def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 1)),
1039 (v2f64 (XVCVUXWDP (v2i64 (XXMRGLW $C, $C))))>;
1040
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001041// Loads.
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001042let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001043 def : Pat<(v2f64 (PPClxvd2x xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001044
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001045 // Stores.
1046 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
1047 (STXVD2X $rS, xoaddr:$dst)>;
Tony Jiang5f850cd2016-11-15 14:25:56 +00001048 def : Pat<(int_ppc_vsx_stxvd2x_be v2f64:$rS, xoaddr:$dst),
1049 (STXVD2X $rS, xoaddr:$dst)>;
1050 def : Pat<(int_ppc_vsx_stxvw4x_be v4i32:$rS, xoaddr:$dst),
1051 (STXVW4X $rS, xoaddr:$dst)>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001052 def : Pat<(PPCstxvd2x v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1053}
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001054let Predicates = [IsBigEndian, HasVSX, HasOnlySwappingMemOps] in {
1055 def : Pat<(v2f64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1056 def : Pat<(v2i64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1057 def : Pat<(v4i32 (load xoaddr:$src)), (LXVW4X xoaddr:$src)>;
Nemanja Ivanovicb8e30d62016-11-22 19:02:07 +00001058 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x xoaddr:$src)), (LXVW4X xoaddr:$src)>;
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001059 def : Pat<(store v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1060 def : Pat<(store v2i64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
Nemanja Ivanovicb8e30d62016-11-22 19:02:07 +00001061 def : Pat<(store v4i32:$XT, xoaddr:$dst), (STXVW4X $XT, xoaddr:$dst)>;
1062 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
1063 (STXVW4X $rS, xoaddr:$dst)>;
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001064}
Bill Schmidtfae5d712014-12-09 16:35:51 +00001065
1066// Permutes.
1067def : Pat<(v2f64 (PPCxxswapd v2f64:$src)), (XXPERMDI $src, $src, 2)>;
1068def : Pat<(v2i64 (PPCxxswapd v2i64:$src)), (XXPERMDI $src, $src, 2)>;
1069def : Pat<(v4f32 (PPCxxswapd v4f32:$src)), (XXPERMDI $src, $src, 2)>;
1070def : Pat<(v4i32 (PPCxxswapd v4i32:$src)), (XXPERMDI $src, $src, 2)>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001071def : Pat<(v2f64 (PPCswapNoChain v2f64:$src)), (XXPERMDI $src, $src, 2)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001072
Bill Schmidt61e65232014-10-22 13:13:40 +00001073// Selects.
1074def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001075 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1076def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001077 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1078def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001079 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1080def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001081 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1082def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETEQ)),
1083 (SELECT_VSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1084def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001085 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1086def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001087 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1088def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001089 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1090def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001091 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1092def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETNE)),
1093 (SELECT_VSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1094
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001095def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001096 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1097def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001098 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1099def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001100 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1101def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001102 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1103def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETEQ)),
1104 (SELECT_VSFRC (CREQV $lhs, $rhs), $tval, $fval)>;
1105def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001106 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1107def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001108 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1109def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001110 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1111def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001112 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1113def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETNE)),
1114 (SELECT_VSFRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1115
Bill Schmidt76746922014-11-14 12:10:40 +00001116// Divides.
1117def : Pat<(int_ppc_vsx_xvdivsp v4f32:$A, v4f32:$B),
1118 (XVDIVSP $A, $B)>;
1119def : Pat<(int_ppc_vsx_xvdivdp v2f64:$A, v2f64:$B),
1120 (XVDIVDP $A, $B)>;
1121
Nemanja Ivanovic984a3612015-07-14 17:25:20 +00001122// Reciprocal estimate
1123def : Pat<(int_ppc_vsx_xvresp v4f32:$A),
1124 (XVRESP $A)>;
1125def : Pat<(int_ppc_vsx_xvredp v2f64:$A),
1126 (XVREDP $A)>;
1127
Nemanja Ivanovicd358b8f2015-07-05 06:03:51 +00001128// Recip. square root estimate
1129def : Pat<(int_ppc_vsx_xvrsqrtesp v4f32:$A),
1130 (XVRSQRTESP $A)>;
1131def : Pat<(int_ppc_vsx_xvrsqrtedp v2f64:$A),
1132 (XVRSQRTEDP $A)>;
1133
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001134let Predicates = [IsLittleEndian] in {
1135def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1136 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1137def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1138 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1139def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1140 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1141def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1142 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1143} // IsLittleEndian
1144
1145let Predicates = [IsBigEndian] in {
1146def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1147 (f64 (XSCVSXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1148def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1149 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1150def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1151 (f64 (XSCVUXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1152def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1153 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1154} // IsBigEndian
1155
Hal Finkel27774d92014-03-13 07:58:58 +00001156} // AddedComplexity
1157} // HasVSX
1158
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001159def ScalarLoads {
1160 dag Li8 = (i32 (extloadi8 xoaddr:$src));
1161 dag ZELi8 = (i32 (zextloadi8 xoaddr:$src));
1162 dag ZELi8i64 = (i64 (zextloadi8 xoaddr:$src));
1163 dag SELi8 = (i32 (sext_inreg (extloadi8 xoaddr:$src), i8));
1164 dag SELi8i64 = (i64 (sext_inreg (extloadi8 xoaddr:$src), i8));
1165
1166 dag Li16 = (i32 (extloadi16 xoaddr:$src));
1167 dag ZELi16 = (i32 (zextloadi16 xoaddr:$src));
1168 dag ZELi16i64 = (i64 (zextloadi16 xoaddr:$src));
1169 dag SELi16 = (i32 (sextloadi16 xoaddr:$src));
1170 dag SELi16i64 = (i64 (sextloadi16 xoaddr:$src));
1171
1172 dag Li32 = (i32 (load xoaddr:$src));
1173}
1174
Kit Barton298beb52015-02-18 16:21:46 +00001175// The following VSX instructions were introduced in Power ISA 2.07
1176/* FIXME: if the operands are v2i64, these patterns will not match.
1177 we should define new patterns or otherwise match the same patterns
1178 when the elements are larger than i32.
1179*/
1180def HasP8Vector : Predicate<"PPCSubTarget->hasP8Vector()">;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001181def HasDirectMove : Predicate<"PPCSubTarget->hasDirectMove()">;
Kit Barton298beb52015-02-18 16:21:46 +00001182let Predicates = [HasP8Vector] in {
1183let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001184 let isCommutable = 1, UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001185 def XXLEQV : XX3Form<60, 186,
1186 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1187 "xxleqv $XT, $XA, $XB", IIC_VecGeneral,
1188 [(set v4i32:$XT, (vnot_ppc (xor v4i32:$XA, v4i32:$XB)))]>;
1189 def XXLNAND : XX3Form<60, 178,
1190 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1191 "xxlnand $XT, $XA, $XB", IIC_VecGeneral,
1192 [(set v4i32:$XT, (vnot_ppc (and v4i32:$XA,
Kit Barton298beb52015-02-18 16:21:46 +00001193 v4i32:$XB)))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001194 } // isCommutable, UseVSXReg
Nemanja Ivanovicd9e4b4f2015-07-10 14:25:17 +00001195
Nemanja Ivanovic5655fb32015-07-10 12:38:08 +00001196 def : Pat<(int_ppc_vsx_xxleqv v4i32:$A, v4i32:$B),
1197 (XXLEQV $A, $B)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001198
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001199 let UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001200 def XXLORC : XX3Form<60, 170,
1201 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1202 "xxlorc $XT, $XA, $XB", IIC_VecGeneral,
1203 [(set v4i32:$XT, (or v4i32:$XA, (vnot_ppc v4i32:$XB)))]>;
1204
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001205 // VSX scalar loads introduced in ISA 2.07
1206 let mayLoad = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001207 let CodeSize = 3 in
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001208 def LXSSPX : XX1Form<31, 524, (outs vssrc:$XT), (ins memrr:$src),
1209 "lxsspx $XT, $src", IIC_LdStLFD,
1210 [(set f32:$XT, (load xoaddr:$src))]>;
1211 def LXSIWAX : XX1Form<31, 76, (outs vsfrc:$XT), (ins memrr:$src),
1212 "lxsiwax $XT, $src", IIC_LdStLFD,
1213 [(set f64:$XT, (PPClfiwax xoaddr:$src))]>;
1214 def LXSIWZX : XX1Form<31, 12, (outs vsfrc:$XT), (ins memrr:$src),
1215 "lxsiwzx $XT, $src", IIC_LdStLFD,
1216 [(set f64:$XT, (PPClfiwzx xoaddr:$src))]>;
1217 } // mayLoad
1218
1219 // VSX scalar stores introduced in ISA 2.07
1220 let mayStore = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001221 let CodeSize = 3 in
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001222 def STXSSPX : XX1Form<31, 652, (outs), (ins vssrc:$XT, memrr:$dst),
1223 "stxsspx $XT, $dst", IIC_LdStSTFD,
1224 [(store f32:$XT, xoaddr:$dst)]>;
1225 def STXSIWX : XX1Form<31, 140, (outs), (ins vsfrc:$XT, memrr:$dst),
1226 "stxsiwx $XT, $dst", IIC_LdStSTFD,
1227 [(PPCstfiwx f64:$XT, xoaddr:$dst)]>;
1228 } // mayStore
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001229 } // UseVSXReg = 1
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001230
1231 def : Pat<(f64 (extloadf32 xoaddr:$src)),
1232 (COPY_TO_REGCLASS (LXSSPX xoaddr:$src), VSFRC)>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001233 def : Pat<(f32 (fpround (extloadf32 xoaddr:$src))),
1234 (f32 (LXSSPX xoaddr:$src))>;
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +00001235 def : Pat<(f64 (fpextend f32:$src)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001236 (COPY_TO_REGCLASS $src, VSFRC)>;
Hal Finkela2cdbce2015-08-30 22:12:50 +00001237
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001238 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001239 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1240 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001241 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1242 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001243 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1244 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001245 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1246 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETEQ)),
1247 (SELECT_VSSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1248 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001249 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1250 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001251 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1252 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001253 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1254 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001255 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1256 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETNE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001257 (SELECT_VSSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001258
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001259 let UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001260 // VSX Elementary Scalar FP arithmetic (SP)
1261 let isCommutable = 1 in {
1262 def XSADDSP : XX3Form<60, 0,
1263 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1264 "xsaddsp $XT, $XA, $XB", IIC_VecFP,
1265 [(set f32:$XT, (fadd f32:$XA, f32:$XB))]>;
1266 def XSMULSP : XX3Form<60, 16,
1267 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1268 "xsmulsp $XT, $XA, $XB", IIC_VecFP,
1269 [(set f32:$XT, (fmul f32:$XA, f32:$XB))]>;
1270 } // isCommutable
1271
1272 def XSDIVSP : XX3Form<60, 24,
1273 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1274 "xsdivsp $XT, $XA, $XB", IIC_FPDivS,
1275 [(set f32:$XT, (fdiv f32:$XA, f32:$XB))]>;
1276 def XSRESP : XX2Form<60, 26,
1277 (outs vssrc:$XT), (ins vssrc:$XB),
1278 "xsresp $XT, $XB", IIC_VecFP,
1279 [(set f32:$XT, (PPCfre f32:$XB))]>;
1280 def XSSQRTSP : XX2Form<60, 11,
1281 (outs vssrc:$XT), (ins vssrc:$XB),
1282 "xssqrtsp $XT, $XB", IIC_FPSqrtS,
1283 [(set f32:$XT, (fsqrt f32:$XB))]>;
1284 def XSRSQRTESP : XX2Form<60, 10,
1285 (outs vssrc:$XT), (ins vssrc:$XB),
1286 "xsrsqrtesp $XT, $XB", IIC_VecFP,
1287 [(set f32:$XT, (PPCfrsqrte f32:$XB))]>;
1288 def XSSUBSP : XX3Form<60, 8,
1289 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1290 "xssubsp $XT, $XA, $XB", IIC_VecFP,
1291 [(set f32:$XT, (fsub f32:$XA, f32:$XB))]>;
Nemanja Ivanovic376e1732015-05-29 17:13:25 +00001292
1293 // FMA Instructions
1294 let BaseName = "XSMADDASP" in {
1295 let isCommutable = 1 in
1296 def XSMADDASP : XX3Form<60, 1,
1297 (outs vssrc:$XT),
1298 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1299 "xsmaddasp $XT, $XA, $XB", IIC_VecFP,
1300 [(set f32:$XT, (fma f32:$XA, f32:$XB, f32:$XTi))]>,
1301 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1302 AltVSXFMARel;
1303 let IsVSXFMAAlt = 1 in
1304 def XSMADDMSP : XX3Form<60, 9,
1305 (outs vssrc:$XT),
1306 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1307 "xsmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1308 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1309 AltVSXFMARel;
1310 }
1311
1312 let BaseName = "XSMSUBASP" in {
1313 let isCommutable = 1 in
1314 def XSMSUBASP : XX3Form<60, 17,
1315 (outs vssrc:$XT),
1316 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1317 "xsmsubasp $XT, $XA, $XB", IIC_VecFP,
1318 [(set f32:$XT, (fma f32:$XA, f32:$XB,
1319 (fneg f32:$XTi)))]>,
1320 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1321 AltVSXFMARel;
1322 let IsVSXFMAAlt = 1 in
1323 def XSMSUBMSP : XX3Form<60, 25,
1324 (outs vssrc:$XT),
1325 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1326 "xsmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1327 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1328 AltVSXFMARel;
1329 }
1330
1331 let BaseName = "XSNMADDASP" in {
1332 let isCommutable = 1 in
1333 def XSNMADDASP : XX3Form<60, 129,
1334 (outs vssrc:$XT),
1335 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1336 "xsnmaddasp $XT, $XA, $XB", IIC_VecFP,
1337 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1338 f32:$XTi)))]>,
1339 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1340 AltVSXFMARel;
1341 let IsVSXFMAAlt = 1 in
1342 def XSNMADDMSP : XX3Form<60, 137,
1343 (outs vssrc:$XT),
1344 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1345 "xsnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1346 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1347 AltVSXFMARel;
1348 }
1349
1350 let BaseName = "XSNMSUBASP" in {
1351 let isCommutable = 1 in
1352 def XSNMSUBASP : XX3Form<60, 145,
1353 (outs vssrc:$XT),
1354 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1355 "xsnmsubasp $XT, $XA, $XB", IIC_VecFP,
1356 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1357 (fneg f32:$XTi))))]>,
1358 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1359 AltVSXFMARel;
1360 let IsVSXFMAAlt = 1 in
1361 def XSNMSUBMSP : XX3Form<60, 153,
1362 (outs vssrc:$XT),
1363 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1364 "xsnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1365 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1366 AltVSXFMARel;
1367 }
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001368
1369 // Single Precision Conversions (FP <-> INT)
1370 def XSCVSXDSP : XX2Form<60, 312,
1371 (outs vssrc:$XT), (ins vsfrc:$XB),
1372 "xscvsxdsp $XT, $XB", IIC_VecFP,
1373 [(set f32:$XT, (PPCfcfids f64:$XB))]>;
1374 def XSCVUXDSP : XX2Form<60, 296,
1375 (outs vssrc:$XT), (ins vsfrc:$XB),
1376 "xscvuxdsp $XT, $XB", IIC_VecFP,
1377 [(set f32:$XT, (PPCfcfidus f64:$XB))]>;
1378
1379 // Conversions between vector and scalar single precision
1380 def XSCVDPSPN : XX2Form<60, 267, (outs vsrc:$XT), (ins vssrc:$XB),
1381 "xscvdpspn $XT, $XB", IIC_VecFP, []>;
1382 def XSCVSPDPN : XX2Form<60, 331, (outs vssrc:$XT), (ins vsrc:$XB),
1383 "xscvspdpn $XT, $XB", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001384 } // UseVSXReg = 1
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001385
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001386 let Predicates = [IsLittleEndian] in {
1387 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1388 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1389 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1390 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1391 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1392 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1393 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1394 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1395 }
1396
1397 let Predicates = [IsBigEndian] in {
1398 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1399 (f32 (XSCVSXDSP (COPY_TO_REGCLASS $S, VSFRC)))>;
1400 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1401 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1402 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1403 (f32 (XSCVUXDSP (COPY_TO_REGCLASS $S, VSFRC)))>;
1404 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1405 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1406 }
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001407 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.Li32)),
1408 (v4i32 (XXSPLTWs (LXSIWAX xoaddr:$src), 1))>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001409} // AddedComplexity = 400
Kit Barton298beb52015-02-18 16:21:46 +00001410} // HasP8Vector
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001411
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001412let UseVSXReg = 1, AddedComplexity = 400 in {
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001413let Predicates = [HasDirectMove] in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001414 // VSX direct move instructions
1415 def MFVSRD : XX1_RS6_RD5_XO<31, 51, (outs g8rc:$rA), (ins vsfrc:$XT),
1416 "mfvsrd $rA, $XT", IIC_VecGeneral,
1417 [(set i64:$rA, (PPCmfvsr f64:$XT))]>,
1418 Requires<[In64BitMode]>;
1419 def MFVSRWZ : XX1_RS6_RD5_XO<31, 115, (outs gprc:$rA), (ins vsfrc:$XT),
1420 "mfvsrwz $rA, $XT", IIC_VecGeneral,
1421 [(set i32:$rA, (PPCmfvsr f64:$XT))]>;
1422 def MTVSRD : XX1_RS6_RD5_XO<31, 179, (outs vsfrc:$XT), (ins g8rc:$rA),
1423 "mtvsrd $XT, $rA", IIC_VecGeneral,
1424 [(set f64:$XT, (PPCmtvsra i64:$rA))]>,
1425 Requires<[In64BitMode]>;
1426 def MTVSRWA : XX1_RS6_RD5_XO<31, 211, (outs vsfrc:$XT), (ins gprc:$rA),
1427 "mtvsrwa $XT, $rA", IIC_VecGeneral,
1428 [(set f64:$XT, (PPCmtvsra i32:$rA))]>;
1429 def MTVSRWZ : XX1_RS6_RD5_XO<31, 243, (outs vsfrc:$XT), (ins gprc:$rA),
1430 "mtvsrwz $XT, $rA", IIC_VecGeneral,
1431 [(set f64:$XT, (PPCmtvsrz i32:$rA))]>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001432} // HasDirectMove
1433
1434let Predicates = [IsISA3_0, HasDirectMove] in {
1435 def MTVSRWS: XX1_RS6_RD5_XO<31, 403, (outs vsrc:$XT), (ins gprc:$rA),
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00001436 "mtvsrws $XT, $rA", IIC_VecGeneral, []>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001437
1438 def MTVSRDD: XX1Form<31, 435, (outs vsrc:$XT), (ins g8rc:$rA, g8rc:$rB),
1439 "mtvsrdd $XT, $rA, $rB", IIC_VecGeneral,
1440 []>, Requires<[In64BitMode]>;
1441
1442 def MFVSRLD: XX1_RS6_RD5_XO<31, 307, (outs g8rc:$rA), (ins vsrc:$XT),
1443 "mfvsrld $rA, $XT", IIC_VecGeneral,
1444 []>, Requires<[In64BitMode]>;
1445
1446} // IsISA3_0, HasDirectMove
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001447} // UseVSXReg = 1
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001448
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001449/* Direct moves of various widths from GPR's into VSR's. Each move lines
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001450 the value up into element 0 (both BE and LE). Namely, entities smaller than
1451 a doubleword are shifted left and moved for BE. For LE, they're moved, then
1452 swapped to go into the least significant element of the VSR.
1453*/
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001454def MovesToVSR {
1455 dag BE_BYTE_0 =
1456 (MTVSRD
1457 (RLDICR
1458 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 56, 7));
1459 dag BE_HALF_0 =
1460 (MTVSRD
1461 (RLDICR
1462 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 48, 15));
1463 dag BE_WORD_0 =
1464 (MTVSRD
1465 (RLDICR
1466 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 32, 31));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001467 dag BE_DWORD_0 = (MTVSRD $A);
1468
1469 dag LE_MTVSRW = (MTVSRD (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001470 dag LE_WORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1471 LE_MTVSRW, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001472 dag LE_WORD_0 = (XXPERMDI LE_WORD_1, LE_WORD_1, 2);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001473 dag LE_DWORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1474 BE_DWORD_0, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001475 dag LE_DWORD_0 = (XXPERMDI LE_DWORD_1, LE_DWORD_1, 2);
1476}
1477
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001478/* Patterns for extracting elements out of vectors. Integer elements are
1479 extracted using direct move operations. Patterns for extracting elements
1480 whose indices are not available at compile time are also provided with
1481 various _VARIABLE_ patterns.
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001482 The numbering for the DAG's is for LE, but when used on BE, the correct
1483 LE element can just be used (i.e. LE_BYTE_2 == BE_BYTE_13).
1484*/
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001485def VectorExtractions {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001486 // Doubleword extraction
1487 dag LE_DWORD_0 =
1488 (MFVSRD
1489 (EXTRACT_SUBREG
1490 (XXPERMDI (COPY_TO_REGCLASS $S, VSRC),
1491 (COPY_TO_REGCLASS $S, VSRC), 2), sub_64));
1492 dag LE_DWORD_1 = (MFVSRD
1493 (EXTRACT_SUBREG
1494 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1495
1496 // Word extraction
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001497 dag LE_WORD_0 = (MFVSRWZ (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001498 dag LE_WORD_1 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 1), sub_64));
1499 dag LE_WORD_2 = (MFVSRWZ (EXTRACT_SUBREG
1500 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1501 dag LE_WORD_3 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 3), sub_64));
1502
1503 // Halfword extraction
1504 dag LE_HALF_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 48), sub_32));
1505 dag LE_HALF_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 48), sub_32));
1506 dag LE_HALF_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 48), sub_32));
1507 dag LE_HALF_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 48), sub_32));
1508 dag LE_HALF_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 48), sub_32));
1509 dag LE_HALF_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 48), sub_32));
1510 dag LE_HALF_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 48), sub_32));
1511 dag LE_HALF_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 48), sub_32));
1512
1513 // Byte extraction
1514 dag LE_BYTE_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 56), sub_32));
1515 dag LE_BYTE_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 56, 56), sub_32));
1516 dag LE_BYTE_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 56), sub_32));
1517 dag LE_BYTE_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 40, 56), sub_32));
1518 dag LE_BYTE_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 56), sub_32));
1519 dag LE_BYTE_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 24, 56), sub_32));
1520 dag LE_BYTE_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 56), sub_32));
1521 dag LE_BYTE_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 8, 56), sub_32));
1522 dag LE_BYTE_8 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 56), sub_32));
1523 dag LE_BYTE_9 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 56, 56), sub_32));
1524 dag LE_BYTE_10 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 56), sub_32));
1525 dag LE_BYTE_11 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 40, 56), sub_32));
1526 dag LE_BYTE_12 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 56), sub_32));
1527 dag LE_BYTE_13 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 24, 56), sub_32));
1528 dag LE_BYTE_14 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 56), sub_32));
1529 dag LE_BYTE_15 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 8, 56), sub_32));
1530
1531 /* Variable element number (BE and LE patterns must be specified separately)
1532 This is a rather involved process.
1533
1534 Conceptually, this is how the move is accomplished:
1535 1. Identify which doubleword contains the element
1536 2. Shift in the VMX register so that the correct doubleword is correctly
1537 lined up for the MFVSRD
1538 3. Perform the move so that the element (along with some extra stuff)
1539 is in the GPR
1540 4. Right shift within the GPR so that the element is right-justified
1541
1542 Of course, the index is an element number which has a different meaning
1543 on LE/BE so the patterns have to be specified separately.
1544
1545 Note: The final result will be the element right-justified with high
1546 order bits being arbitrarily defined (namely, whatever was in the
1547 vector register to the left of the value originally).
1548 */
1549
1550 /* LE variable byte
1551 Number 1. above:
1552 - For elements 0-7, we shift left by 8 bytes since they're on the right
1553 - For elements 8-15, we need not shift (shift left by zero bytes)
1554 This is accomplished by inverting the bits of the index and AND-ing
1555 with 0x8 (i.e. clearing all bits of the index and inverting bit 60).
1556 */
1557 dag LE_VBYTE_PERM_VEC = (LVSL ZERO8, (ANDC8 (LI8 8), $Idx));
1558
1559 // Number 2. above:
1560 // - Now that we set up the shift amount, we shift in the VMX register
1561 dag LE_VBYTE_PERMUTE = (VPERM $S, $S, LE_VBYTE_PERM_VEC);
1562
1563 // Number 3. above:
1564 // - The doubleword containing our element is moved to a GPR
1565 dag LE_MV_VBYTE = (MFVSRD
1566 (EXTRACT_SUBREG
1567 (v2i64 (COPY_TO_REGCLASS LE_VBYTE_PERMUTE, VSRC)),
1568 sub_64));
1569
1570 /* Number 4. above:
1571 - Truncate the element number to the range 0-7 (8-15 are symmetrical
1572 and out of range values are truncated accordingly)
1573 - Multiply by 8 as we need to shift right by the number of bits, not bytes
1574 - Shift right in the GPR by the calculated value
1575 */
1576 dag LE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 7), $Idx), 3, 60),
1577 sub_32);
1578 dag LE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD LE_MV_VBYTE, LE_VBYTE_SHIFT),
1579 sub_32);
1580
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001581 /* LE variable halfword
1582 Number 1. above:
1583 - For elements 0-3, we shift left by 8 since they're on the right
1584 - For elements 4-7, we need not shift (shift left by zero bytes)
1585 Similarly to the byte pattern, we invert the bits of the index, but we
1586 AND with 0x4 (i.e. clear all bits of the index and invert bit 61).
1587 Of course, the shift is still by 8 bytes, so we must multiply by 2.
1588 */
1589 dag LE_VHALF_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 4), $Idx), 1, 62));
1590
1591 // Number 2. above:
1592 // - Now that we set up the shift amount, we shift in the VMX register
1593 dag LE_VHALF_PERMUTE = (VPERM $S, $S, LE_VHALF_PERM_VEC);
1594
1595 // Number 3. above:
1596 // - The doubleword containing our element is moved to a GPR
1597 dag LE_MV_VHALF = (MFVSRD
1598 (EXTRACT_SUBREG
1599 (v2i64 (COPY_TO_REGCLASS LE_VHALF_PERMUTE, VSRC)),
1600 sub_64));
1601
1602 /* Number 4. above:
1603 - Truncate the element number to the range 0-3 (4-7 are symmetrical
1604 and out of range values are truncated accordingly)
1605 - Multiply by 16 as we need to shift right by the number of bits
1606 - Shift right in the GPR by the calculated value
1607 */
1608 dag LE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 3), $Idx), 4, 59),
1609 sub_32);
1610 dag LE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD LE_MV_VHALF, LE_VHALF_SHIFT),
1611 sub_32);
1612
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001613 /* LE variable word
1614 Number 1. above:
1615 - For elements 0-1, we shift left by 8 since they're on the right
1616 - For elements 2-3, we need not shift
1617 */
1618 dag LE_VWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 2), $Idx), 2, 61));
1619
1620 // Number 2. above:
1621 // - Now that we set up the shift amount, we shift in the VMX register
1622 dag LE_VWORD_PERMUTE = (VPERM $S, $S, LE_VWORD_PERM_VEC);
1623
1624 // Number 3. above:
1625 // - The doubleword containing our element is moved to a GPR
1626 dag LE_MV_VWORD = (MFVSRD
1627 (EXTRACT_SUBREG
1628 (v2i64 (COPY_TO_REGCLASS LE_VWORD_PERMUTE, VSRC)),
1629 sub_64));
1630
1631 /* Number 4. above:
1632 - Truncate the element number to the range 0-1 (2-3 are symmetrical
1633 and out of range values are truncated accordingly)
1634 - Multiply by 32 as we need to shift right by the number of bits
1635 - Shift right in the GPR by the calculated value
1636 */
1637 dag LE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 1), $Idx), 5, 58),
1638 sub_32);
1639 dag LE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD LE_MV_VWORD, LE_VWORD_SHIFT),
1640 sub_32);
1641
1642 /* LE variable doubleword
1643 Number 1. above:
1644 - For element 0, we shift left by 8 since it's on the right
1645 - For element 1, we need not shift
1646 */
1647 dag LE_VDWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 1), $Idx), 3, 60));
1648
1649 // Number 2. above:
1650 // - Now that we set up the shift amount, we shift in the VMX register
1651 dag LE_VDWORD_PERMUTE = (VPERM $S, $S, LE_VDWORD_PERM_VEC);
1652
1653 // Number 3. above:
1654 // - The doubleword containing our element is moved to a GPR
1655 // - Number 4. is not needed for the doubleword as the value is 64-bits
1656 dag LE_VARIABLE_DWORD =
1657 (MFVSRD (EXTRACT_SUBREG
1658 (v2i64 (COPY_TO_REGCLASS LE_VDWORD_PERMUTE, VSRC)),
1659 sub_64));
1660
1661 /* LE variable float
1662 - Shift the vector to line up the desired element to BE Word 0
1663 - Convert 32-bit float to a 64-bit single precision float
1664 */
1665 dag LE_VFLOAT_PERM_VEC = (LVSL ZERO8, (RLDICR (XOR8 (LI8 3), $Idx), 2, 61));
1666 dag LE_VFLOAT_PERMUTE = (VPERM $S, $S, LE_VFLOAT_PERM_VEC);
1667 dag LE_VARIABLE_FLOAT = (XSCVSPDPN LE_VFLOAT_PERMUTE);
1668
1669 /* LE variable double
1670 Same as the LE doubleword except there is no move.
1671 */
1672 dag LE_VDOUBLE_PERMUTE = (VPERM (COPY_TO_REGCLASS $S, VRRC),
1673 (COPY_TO_REGCLASS $S, VRRC),
1674 LE_VDWORD_PERM_VEC);
1675 dag LE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS LE_VDOUBLE_PERMUTE, VSRC);
1676
1677 /* BE variable byte
1678 The algorithm here is the same as the LE variable byte except:
1679 - The shift in the VMX register is by 0/8 for opposite element numbers so
1680 we simply AND the element number with 0x8
1681 - The order of elements after the move to GPR is reversed, so we invert
1682 the bits of the index prior to truncating to the range 0-7
1683 */
1684 dag BE_VBYTE_PERM_VEC = (LVSL ZERO8, (ANDIo8 $Idx, 8));
1685 dag BE_VBYTE_PERMUTE = (VPERM $S, $S, BE_VBYTE_PERM_VEC);
1686 dag BE_MV_VBYTE = (MFVSRD
1687 (EXTRACT_SUBREG
1688 (v2i64 (COPY_TO_REGCLASS BE_VBYTE_PERMUTE, VSRC)),
1689 sub_64));
1690 dag BE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 7), $Idx), 3, 60),
1691 sub_32);
1692 dag BE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD BE_MV_VBYTE, BE_VBYTE_SHIFT),
1693 sub_32);
1694
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001695 /* BE variable halfword
1696 The algorithm here is the same as the LE variable halfword except:
1697 - The shift in the VMX register is by 0/8 for opposite element numbers so
1698 we simply AND the element number with 0x4 and multiply by 2
1699 - The order of elements after the move to GPR is reversed, so we invert
1700 the bits of the index prior to truncating to the range 0-3
1701 */
1702 dag BE_VHALF_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 4), 1, 62));
1703 dag BE_VHALF_PERMUTE = (VPERM $S, $S, BE_VHALF_PERM_VEC);
1704 dag BE_MV_VHALF = (MFVSRD
1705 (EXTRACT_SUBREG
1706 (v2i64 (COPY_TO_REGCLASS BE_VHALF_PERMUTE, VSRC)),
1707 sub_64));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001708 dag BE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 3), $Idx), 4, 59),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001709 sub_32);
1710 dag BE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD BE_MV_VHALF, BE_VHALF_SHIFT),
1711 sub_32);
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001712
1713 /* BE variable word
1714 The algorithm is the same as the LE variable word except:
1715 - The shift in the VMX register happens for opposite element numbers
1716 - The order of elements after the move to GPR is reversed, so we invert
1717 the bits of the index prior to truncating to the range 0-1
1718 */
1719 dag BE_VWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 2), 2, 61));
1720 dag BE_VWORD_PERMUTE = (VPERM $S, $S, BE_VWORD_PERM_VEC);
1721 dag BE_MV_VWORD = (MFVSRD
1722 (EXTRACT_SUBREG
1723 (v2i64 (COPY_TO_REGCLASS BE_VWORD_PERMUTE, VSRC)),
1724 sub_64));
1725 dag BE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 1), $Idx), 5, 58),
1726 sub_32);
1727 dag BE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD BE_MV_VWORD, BE_VWORD_SHIFT),
1728 sub_32);
1729
1730 /* BE variable doubleword
1731 Same as the LE doubleword except we shift in the VMX register for opposite
1732 element indices.
1733 */
1734 dag BE_VDWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 1), 3, 60));
1735 dag BE_VDWORD_PERMUTE = (VPERM $S, $S, BE_VDWORD_PERM_VEC);
1736 dag BE_VARIABLE_DWORD =
1737 (MFVSRD (EXTRACT_SUBREG
1738 (v2i64 (COPY_TO_REGCLASS BE_VDWORD_PERMUTE, VSRC)),
1739 sub_64));
1740
1741 /* BE variable float
1742 - Shift the vector to line up the desired element to BE Word 0
1743 - Convert 32-bit float to a 64-bit single precision float
1744 */
1745 dag BE_VFLOAT_PERM_VEC = (LVSL ZERO8, (RLDICR $Idx, 2, 61));
1746 dag BE_VFLOAT_PERMUTE = (VPERM $S, $S, BE_VFLOAT_PERM_VEC);
1747 dag BE_VARIABLE_FLOAT = (XSCVSPDPN BE_VFLOAT_PERMUTE);
1748
1749 /* BE variable double
1750 Same as the BE doubleword except there is no move.
1751 */
1752 dag BE_VDOUBLE_PERMUTE = (VPERM (COPY_TO_REGCLASS $S, VRRC),
1753 (COPY_TO_REGCLASS $S, VRRC),
1754 BE_VDWORD_PERM_VEC);
1755 dag BE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS BE_VDOUBLE_PERMUTE, VSRC);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001756}
1757
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001758let AddedComplexity = 400 in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001759// v4f32 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001760let Predicates = [IsBigEndian, HasP8Vector] in {
1761 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1762 (v4f32 (XSCVDPSPN $A))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001763 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1764 (f32 (XSCVSPDPN $S))>;
1765 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
1766 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
1767 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001768 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001769 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
1770 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001771 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
1772 (f32 VectorExtractions.BE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001773} // IsBigEndian, HasP8Vector
1774
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001775// Variable index vector_extract for v2f64 does not require P8Vector
1776let Predicates = [IsBigEndian, HasVSX] in
1777 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
1778 (f64 VectorExtractions.BE_VARIABLE_DOUBLE)>;
1779
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001780let Predicates = [IsBigEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001781 // v16i8 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001782 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001783 (v16i8 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_BYTE_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001784 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001785 (v8i16 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_HALF_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001786 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001787 (v4i32 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_WORD_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001788 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001789 (v2i64 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_DWORD_0, sub_64))>;
1790 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001791 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001792 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001793 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001794 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001795 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001796 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001797 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001798 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001799 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001800 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001801 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001802 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001803 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001804 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001805 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001806 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001807 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001808 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001809 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001810 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001811 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001812 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001813 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001814 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001815 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001816 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001817 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001818 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001819 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001820 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001821 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001822 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001823 (i32 VectorExtractions.BE_VARIABLE_BYTE)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001824
1825 // v8i16 scalar <-> vector conversions (BE)
1826 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001827 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001828 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001829 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001830 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001831 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001832 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001833 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001834 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001835 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001836 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001837 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001838 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001839 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001840 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001841 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001842 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001843 (i32 VectorExtractions.BE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001844
1845 // v4i32 scalar <-> vector conversions (BE)
1846 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001847 (i32 VectorExtractions.LE_WORD_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001848 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001849 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001850 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001851 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001852 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001853 (i32 VectorExtractions.LE_WORD_0)>;
1854 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
1855 (i32 VectorExtractions.BE_VARIABLE_WORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001856
1857 // v2i64 scalar <-> vector conversions (BE)
1858 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001859 (i64 VectorExtractions.LE_DWORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001860 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001861 (i64 VectorExtractions.LE_DWORD_0)>;
1862 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
1863 (i64 VectorExtractions.BE_VARIABLE_DWORD)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001864} // IsBigEndian, HasDirectMove
1865
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001866// v4f32 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001867let Predicates = [IsLittleEndian, HasP8Vector] in {
1868 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1869 (v4f32 (XXSLDWI (XSCVDPSPN $A), (XSCVDPSPN $A), 1))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001870 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1871 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
1872 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001873 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001874 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
1875 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
1876 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
1877 (f32 (XSCVSPDPN $S))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001878 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
1879 (f32 VectorExtractions.LE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001880} // IsLittleEndian, HasP8Vector
1881
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001882// Variable index vector_extract for v2f64 does not require P8Vector
1883let Predicates = [IsLittleEndian, HasVSX] in
1884 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
1885 (f64 VectorExtractions.LE_VARIABLE_DOUBLE)>;
1886
Nemanja Ivanovicb8e30d62016-11-22 19:02:07 +00001887def : Pat<(v4i32 (int_ppc_vsx_lxvw4x_be xoaddr:$src)), (LXVW4X xoaddr:$src)>;
1888def : Pat<(v2f64 (int_ppc_vsx_lxvd2x_be xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Tony Jiang5f850cd2016-11-15 14:25:56 +00001889
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001890let Predicates = [IsLittleEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001891 // v16i8 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001892 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001893 (v16i8 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001894 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001895 (v8i16 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001896 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001897 (v4i32 MovesToVSR.LE_WORD_0)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001898 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001899 (v2i64 MovesToVSR.LE_DWORD_0)>;
1900 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001901 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001902 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001903 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001904 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001905 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001906 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001907 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001908 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001909 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001910 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001911 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001912 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001913 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001914 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001915 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001916 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001917 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001918 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001919 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001920 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001921 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001922 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001923 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001924 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001925 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001926 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001927 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001928 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001929 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001930 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001931 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001932 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001933 (i32 VectorExtractions.LE_VARIABLE_BYTE)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001934
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001935 // v8i16 scalar <-> vector conversions (LE)
1936 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001937 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001938 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001939 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001940 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001941 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001942 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001943 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001944 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001945 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001946 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001947 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001948 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001949 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001950 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001951 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001952 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001953 (i32 VectorExtractions.LE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001954
1955 // v4i32 scalar <-> vector conversions (LE)
1956 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001957 (i32 VectorExtractions.LE_WORD_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001958 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001959 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001960 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001961 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001962 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001963 (i32 VectorExtractions.LE_WORD_3)>;
1964 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
1965 (i32 VectorExtractions.LE_VARIABLE_WORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001966
1967 // v2i64 scalar <-> vector conversions (LE)
1968 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001969 (i64 VectorExtractions.LE_DWORD_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001970 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001971 (i64 VectorExtractions.LE_DWORD_1)>;
1972 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
1973 (i64 VectorExtractions.LE_VARIABLE_DWORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001974} // IsLittleEndian, HasDirectMove
Nemanja Ivanovic89224762015-12-15 14:50:34 +00001975
1976let Predicates = [HasDirectMove, HasVSX] in {
1977// bitconvert f32 -> i32
1978// (convert to 32-bit fp single, shift right 1 word, move to GPR)
1979def : Pat<(i32 (bitconvert f32:$S)),
1980 (i32 (MFVSRWZ (EXTRACT_SUBREG
1981 (XXSLDWI (XSCVDPSPN $S),(XSCVDPSPN $S), 3),
1982 sub_64)))>;
1983// bitconvert i32 -> f32
1984// (move to FPR, shift left 1 word, convert to 64-bit fp single)
1985def : Pat<(f32 (bitconvert i32:$A)),
1986 (f32 (XSCVSPDPN
1987 (XXSLDWI MovesToVSR.LE_WORD_1, MovesToVSR.LE_WORD_1, 1)))>;
1988
1989// bitconvert f64 -> i64
1990// (move to GPR, nothing else needed)
1991def : Pat<(i64 (bitconvert f64:$S)),
1992 (i64 (MFVSRD $S))>;
1993
1994// bitconvert i64 -> f64
1995// (move to FPR, nothing else needed)
1996def : Pat<(f64 (bitconvert i64:$S)),
1997 (f64 (MTVSRD $S))>;
1998}
Kit Barton93612ec2016-02-26 21:11:55 +00001999
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002000// Materialize a zero-vector of long long
2001def : Pat<(v2i64 immAllZerosV),
2002 (v2i64 (XXLXORz))>;
2003}
2004
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002005def AlignValues {
2006 dag F32_TO_BE_WORD1 = (v4f32 (XXSLDWI (XSCVDPSPN $B), (XSCVDPSPN $B), 3));
2007 dag I32_TO_BE_WORD1 = (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC);
2008}
2009
Kit Barton93612ec2016-02-26 21:11:55 +00002010// The following VSX instructions were introduced in Power ISA 3.0
2011def HasP9Vector : Predicate<"PPCSubTarget->hasP9Vector()">;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002012let AddedComplexity = 400, Predicates = [HasP9Vector] in {
Kit Barton93612ec2016-02-26 21:11:55 +00002013
2014 // [PO VRT XO VRB XO /]
2015 class X_VT5_XO5_VB5<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2016 list<dag> pattern>
2017 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vrrc:$vB),
2018 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2019
2020 // [PO VRT XO VRB XO RO], Round to Odd version of [PO VRT XO VRB XO /]
2021 class X_VT5_XO5_VB5_Ro<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2022 list<dag> pattern>
2023 : X_VT5_XO5_VB5<opcode, xo2, xo, opc, pattern>, isDOT;
2024
2025 // [PO VRT XO VRB XO /], but the VRB is only used the left 64 bits (or less),
2026 // So we use different operand class for VRB
2027 class X_VT5_XO5_VB5_TyVB<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2028 RegisterOperand vbtype, list<dag> pattern>
2029 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vbtype:$vB),
2030 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2031
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002032 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002033 // [PO T XO B XO BX /]
2034 class XX2_RT5_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2035 list<dag> pattern>
2036 : XX2_RD5_XO5_RS6<opcode, xo2, xo, (outs g8rc:$rT), (ins vsfrc:$XB),
2037 !strconcat(opc, " $rT, $XB"), IIC_VecFP, pattern>;
2038
Kit Barton93612ec2016-02-26 21:11:55 +00002039 // [PO T XO B XO BX TX]
2040 class XX2_XT6_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2041 RegisterOperand vtype, list<dag> pattern>
2042 : XX2_RD6_XO5_RS6<opcode, xo2, xo, (outs vtype:$XT), (ins vtype:$XB),
2043 !strconcat(opc, " $XT, $XB"), IIC_VecFP, pattern>;
2044
2045 // [PO T A B XO AX BX TX], src and dest register use different operand class
2046 class XX3_XT5_XA5_XB5<bits<6> opcode, bits<8> xo, string opc,
2047 RegisterOperand xty, RegisterOperand aty, RegisterOperand bty,
2048 InstrItinClass itin, list<dag> pattern>
2049 : XX3Form<opcode, xo, (outs xty:$XT), (ins aty:$XA, bty:$XB),
2050 !strconcat(opc, " $XT, $XA, $XB"), itin, pattern>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002051 } // UseVSXReg = 1
Kit Barton93612ec2016-02-26 21:11:55 +00002052
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002053 // [PO VRT VRA VRB XO /]
2054 class X_VT5_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2055 list<dag> pattern>
2056 : XForm_1<opcode, xo, (outs vrrc:$vT), (ins vrrc:$vA, vrrc:$vB),
2057 !strconcat(opc, " $vT, $vA, $vB"), IIC_VecFP, pattern>;
2058
2059 // [PO VRT VRA VRB XO RO], Round to Odd version of [PO VRT VRA VRB XO /]
2060 class X_VT5_VA5_VB5_Ro<bits<6> opcode, bits<10> xo, string opc,
2061 list<dag> pattern>
2062 : X_VT5_VA5_VB5<opcode, xo, opc, pattern>, isDOT;
2063
2064 //===--------------------------------------------------------------------===//
2065 // Quad-Precision Scalar Move Instructions:
2066
2067 // Copy Sign
2068 def XSCPSGNQP : X_VT5_VA5_VB5<63, 100, "xscpsgnqp", []>;
2069
2070 // Absolute/Negative-Absolute/Negate
2071 def XSABSQP : X_VT5_XO5_VB5<63, 0, 804, "xsabsqp" , []>;
2072 def XSNABSQP : X_VT5_XO5_VB5<63, 8, 804, "xsnabsqp", []>;
2073 def XSNEGQP : X_VT5_XO5_VB5<63, 16, 804, "xsnegqp" , []>;
2074
2075 //===--------------------------------------------------------------------===//
2076 // Quad-Precision Scalar Floating-Point Arithmetic Instructions:
2077
2078 // Add/Divide/Multiply/Subtract
2079 def XSADDQP : X_VT5_VA5_VB5 <63, 4, "xsaddqp" , []>;
2080 def XSADDQPO : X_VT5_VA5_VB5_Ro<63, 4, "xsaddqpo", []>;
2081 def XSDIVQP : X_VT5_VA5_VB5 <63, 548, "xsdivqp" , []>;
2082 def XSDIVQPO : X_VT5_VA5_VB5_Ro<63, 548, "xsdivqpo", []>;
2083 def XSMULQP : X_VT5_VA5_VB5 <63, 36, "xsmulqp" , []>;
2084 def XSMULQPO : X_VT5_VA5_VB5_Ro<63, 36, "xsmulqpo", []>;
2085 def XSSUBQP : X_VT5_VA5_VB5 <63, 516, "xssubqp" , []>;
2086 def XSSUBQPO : X_VT5_VA5_VB5_Ro<63, 516, "xssubqpo", []>;
2087
2088 // Square-Root
2089 def XSSQRTQP : X_VT5_XO5_VB5 <63, 27, 804, "xssqrtqp" , []>;
2090 def XSSQRTQPO : X_VT5_XO5_VB5_Ro<63, 27, 804, "xssqrtqpo", []>;
2091
2092 // (Negative) Multiply-{Add/Subtract}
2093 def XSMADDQP : X_VT5_VA5_VB5 <63, 388, "xsmaddqp" , []>;
2094 def XSMADDQPO : X_VT5_VA5_VB5_Ro<63, 388, "xsmaddqpo" , []>;
2095 def XSMSUBQP : X_VT5_VA5_VB5 <63, 420, "xsmsubqp" , []>;
2096 def XSMSUBQPO : X_VT5_VA5_VB5_Ro<63, 420, "xsmsubqpo" , []>;
2097 def XSNMADDQP : X_VT5_VA5_VB5 <63, 452, "xsnmaddqp" , []>;
2098 def XSNMADDQPO: X_VT5_VA5_VB5_Ro<63, 452, "xsnmaddqpo", []>;
2099 def XSNMSUBQP : X_VT5_VA5_VB5 <63, 484, "xsnmsubqp" , []>;
2100 def XSNMSUBQPO: X_VT5_VA5_VB5_Ro<63, 484, "xsnmsubqpo", []>;
2101
Kit Barton93612ec2016-02-26 21:11:55 +00002102 //===--------------------------------------------------------------------===//
2103 // Quad/Double-Precision Compare Instructions:
2104
2105 // [PO BF // VRA VRB XO /]
2106 class X_BF3_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2107 list<dag> pattern>
2108 : XForm_17<opcode, xo, (outs crrc:$crD), (ins vrrc:$VA, vrrc:$VB),
2109 !strconcat(opc, " $crD, $VA, $VB"), IIC_FPCompare> {
2110 let Pattern = pattern;
2111 }
2112
2113 // QP Compare Ordered/Unordered
2114 def XSCMPOQP : X_BF3_VA5_VB5<63, 132, "xscmpoqp", []>;
2115 def XSCMPUQP : X_BF3_VA5_VB5<63, 644, "xscmpuqp", []>;
2116
2117 // DP/QP Compare Exponents
2118 def XSCMPEXPDP : XX3Form_1<60, 59,
2119 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002120 "xscmpexpdp $crD, $XA, $XB", IIC_FPCompare, []>,
2121 UseVSXReg;
Kit Barton93612ec2016-02-26 21:11:55 +00002122 def XSCMPEXPQP : X_BF3_VA5_VB5<63, 164, "xscmpexpqp", []>;
2123
2124 // DP Compare ==, >=, >, !=
2125 // Use vsrc for XT, because the entire register of XT is set.
2126 // XT.dword[1] = 0x0000_0000_0000_0000
2127 def XSCMPEQDP : XX3_XT5_XA5_XB5<60, 3, "xscmpeqdp", vsrc, vsfrc, vsfrc,
2128 IIC_FPCompare, []>;
2129 def XSCMPGEDP : XX3_XT5_XA5_XB5<60, 19, "xscmpgedp", vsrc, vsfrc, vsfrc,
2130 IIC_FPCompare, []>;
2131 def XSCMPGTDP : XX3_XT5_XA5_XB5<60, 11, "xscmpgtdp", vsrc, vsfrc, vsfrc,
2132 IIC_FPCompare, []>;
2133 def XSCMPNEDP : XX3_XT5_XA5_XB5<60, 27, "xscmpnedp", vsrc, vsfrc, vsfrc,
2134 IIC_FPCompare, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002135 let UseVSXReg = 1 in {
Kit Barton93612ec2016-02-26 21:11:55 +00002136 // Vector Compare Not Equal
2137 def XVCMPNEDP : XX3Form_Rc<60, 123,
2138 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2139 "xvcmpnedp $XT, $XA, $XB", IIC_VecFPCompare, []>;
2140 let Defs = [CR6] in
2141 def XVCMPNEDPo : XX3Form_Rc<60, 123,
2142 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2143 "xvcmpnedp. $XT, $XA, $XB", IIC_VecFPCompare, []>,
2144 isDOT;
2145 def XVCMPNESP : XX3Form_Rc<60, 91,
2146 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2147 "xvcmpnesp $XT, $XA, $XB", IIC_VecFPCompare, []>;
2148 let Defs = [CR6] in
2149 def XVCMPNESPo : XX3Form_Rc<60, 91,
2150 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2151 "xvcmpnesp. $XT, $XA, $XB", IIC_VecFPCompare, []>,
2152 isDOT;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002153 } // UseVSXReg = 1
Kit Barton93612ec2016-02-26 21:11:55 +00002154
2155 //===--------------------------------------------------------------------===//
2156 // Quad-Precision Floating-Point Conversion Instructions:
2157
2158 // Convert DP -> QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002159 def XSCVDPQP : X_VT5_XO5_VB5_TyVB<63, 22, 836, "xscvdpqp", vfrc, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002160
2161 // Round & Convert QP -> DP (dword[1] is set to zero)
2162 def XSCVQPDP : X_VT5_XO5_VB5 <63, 20, 836, "xscvqpdp" , []>;
2163 def XSCVQPDPO : X_VT5_XO5_VB5_Ro<63, 20, 836, "xscvqpdpo", []>;
2164
2165 // Truncate & Convert QP -> (Un)Signed (D)Word (dword[1] is set to zero)
2166 def XSCVQPSDZ : X_VT5_XO5_VB5<63, 25, 836, "xscvqpsdz", []>;
2167 def XSCVQPSWZ : X_VT5_XO5_VB5<63, 9, 836, "xscvqpswz", []>;
2168 def XSCVQPUDZ : X_VT5_XO5_VB5<63, 17, 836, "xscvqpudz", []>;
2169 def XSCVQPUWZ : X_VT5_XO5_VB5<63, 1, 836, "xscvqpuwz", []>;
2170
2171 // Convert (Un)Signed DWord -> QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002172 def XSCVSDQP : X_VT5_XO5_VB5_TyVB<63, 10, 836, "xscvsdqp", vfrc, []>;
2173 def XSCVUDQP : X_VT5_XO5_VB5_TyVB<63, 2, 836, "xscvudqp", vfrc, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002174
Sean Fertilea435e072016-11-14 18:43:59 +00002175 let UseVSXReg = 1 in {
Kit Barton93612ec2016-02-26 21:11:55 +00002176 //===--------------------------------------------------------------------===//
2177 // Round to Floating-Point Integer Instructions
2178
2179 // (Round &) Convert DP <-> HP
2180 // Note! xscvdphp's src and dest register both use the left 64 bits, so we use
2181 // vsfrc for src and dest register. xscvhpdp's src only use the left 16 bits,
2182 // but we still use vsfrc for it.
2183 def XSCVDPHP : XX2_XT6_XO5_XB6<60, 17, 347, "xscvdphp", vsfrc, []>;
2184 def XSCVHPDP : XX2_XT6_XO5_XB6<60, 16, 347, "xscvhpdp", vsfrc, []>;
2185
2186 // Vector HP -> SP
2187 def XVCVHPSP : XX2_XT6_XO5_XB6<60, 24, 475, "xvcvhpsp", vsrc, []>;
Nemanja Ivanovicec4b0c32016-11-11 21:42:01 +00002188 def XVCVSPHP : XX2_XT6_XO5_XB6<60, 25, 475, "xvcvsphp", vsrc,
2189 [(set v4f32:$XT,
2190 (int_ppc_vsx_xvcvsphp v4f32:$XB))]>;
Kit Barton93612ec2016-02-26 21:11:55 +00002191
Sean Fertilea435e072016-11-14 18:43:59 +00002192 } // UseVSXReg = 1
2193
2194 // Pattern for matching Vector HP -> Vector SP intrinsic. Defined as a
2195 // seperate pattern so that it can convert the input register class from
2196 // VRRC(v8i16) to VSRC.
2197 def : Pat<(v4f32 (int_ppc_vsx_xvcvhpsp v8i16:$A)),
2198 (v4f32 (XVCVHPSP (COPY_TO_REGCLASS $A, VSRC)))>;
2199
Kit Barton93612ec2016-02-26 21:11:55 +00002200 class Z23_VT5_R1_VB5_RMC2_EX1<bits<6> opcode, bits<8> xo, bit ex, string opc,
2201 list<dag> pattern>
2202 : Z23Form_1<opcode, xo,
2203 (outs vrrc:$vT), (ins u1imm:$r, vrrc:$vB, u2imm:$rmc),
2204 !strconcat(opc, " $r, $vT, $vB, $rmc"), IIC_VecFP, pattern> {
2205 let RC = ex;
2206 }
2207
2208 // Round to Quad-Precision Integer [with Inexact]
2209 def XSRQPI : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 0, "xsrqpi" , []>;
2210 def XSRQPIX : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 1, "xsrqpix", []>;
2211
2212 // Round Quad-Precision to Double-Extended Precision (fp80)
2213 def XSRQPXP : Z23_VT5_R1_VB5_RMC2_EX1<63, 37, 0, "xsrqpxp", []>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002214
2215 //===--------------------------------------------------------------------===//
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002216 // Insert/Extract Instructions
2217
2218 // Insert Exponent DP/QP
2219 // XT NOTE: XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU
2220 def XSIEXPDP : XX1Form <60, 918, (outs vsrc:$XT), (ins g8rc:$rA, g8rc:$rB),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002221 "xsiexpdp $XT, $rA, $rB", IIC_VecFP, []>, UseVSXReg;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002222 // vB NOTE: only vB.dword[0] is used, that's why we don't use
2223 // X_VT5_VA5_VB5 form
2224 def XSIEXPQP : XForm_18<63, 868, (outs vrrc:$vT), (ins vrrc:$vA, vsfrc:$vB),
2225 "xsiexpqp $vT, $vA, $vB", IIC_VecFP, []>;
2226
2227 // Extract Exponent/Significand DP/QP
2228 def XSXEXPDP : XX2_RT5_XO5_XB6<60, 0, 347, "xsxexpdp", []>;
2229 def XSXSIGDP : XX2_RT5_XO5_XB6<60, 1, 347, "xsxsigdp", []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002230
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002231 def XSXEXPQP : X_VT5_XO5_VB5 <63, 2, 804, "xsxexpqp", []>;
2232 def XSXSIGQP : X_VT5_XO5_VB5 <63, 18, 804, "xsxsigqp", []>;
2233
2234 // Vector Insert Word
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002235 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002236 // XB NOTE: Only XB.dword[1] is used, but we use vsrc on XB.
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002237 def XXINSERTW :
2238 XX2_RD6_UIM5_RS6<60, 181, (outs vsrc:$XT),
2239 (ins vsrc:$XTi, vsrc:$XB, u4imm:$UIM),
2240 "xxinsertw $XT, $XB, $UIM", IIC_VecFP,
2241 [(set v4i32:$XT, (PPCxxinsert v4i32:$XTi, v4i32:$XB,
2242 imm32SExt16:$UIM))]>,
2243 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002244
2245 // Vector Extract Unsigned Word
2246 def XXEXTRACTUW : XX2_RD6_UIM5_RS6<60, 165,
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002247 (outs vsfrc:$XT), (ins vsrc:$XB, u4imm:$UIMM),
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002248 "xxextractuw $XT, $XB, $UIMM", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002249 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002250
2251 // Vector Insert Exponent DP/SP
2252 def XVIEXPDP : XX3_XT5_XA5_XB5<60, 248, "xviexpdp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002253 IIC_VecFP, [(set v2f64: $XT,(int_ppc_vsx_xviexpdp v2i64:$XA, v2i64:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002254 def XVIEXPSP : XX3_XT5_XA5_XB5<60, 216, "xviexpsp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002255 IIC_VecFP, [(set v4f32: $XT,(int_ppc_vsx_xviexpsp v4i32:$XA, v4i32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002256
2257 // Vector Extract Exponent/Significand DP/SP
Sean Fertileadda5b22016-11-14 14:42:37 +00002258 def XVXEXPDP : XX2_XT6_XO5_XB6<60, 0, 475, "xvxexpdp", vsrc,
2259 [(set v2i64: $XT,
2260 (int_ppc_vsx_xvxexpdp v2f64:$XB))]>;
2261 def XVXEXPSP : XX2_XT6_XO5_XB6<60, 8, 475, "xvxexpsp", vsrc,
2262 [(set v4i32: $XT,
2263 (int_ppc_vsx_xvxexpsp v4f32:$XB))]>;
2264 def XVXSIGDP : XX2_XT6_XO5_XB6<60, 1, 475, "xvxsigdp", vsrc,
2265 [(set v2i64: $XT,
2266 (int_ppc_vsx_xvxsigdp v2f64:$XB))]>;
2267 def XVXSIGSP : XX2_XT6_XO5_XB6<60, 9, 475, "xvxsigsp", vsrc,
2268 [(set v4i32: $XT,
2269 (int_ppc_vsx_xvxsigsp v4f32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002270
2271 //===--------------------------------------------------------------------===//
2272
2273 // Test Data Class SP/DP/QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002274 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002275 def XSTSTDCSP : XX2_BF3_DCMX7_RS6<60, 298,
2276 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2277 "xststdcsp $BF, $XB, $DCMX", IIC_VecFP, []>;
2278 def XSTSTDCDP : XX2_BF3_DCMX7_RS6<60, 362,
2279 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2280 "xststdcdp $BF, $XB, $DCMX", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002281 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002282 def XSTSTDCQP : X_BF3_DCMX7_RS5 <63, 708,
2283 (outs crrc:$BF), (ins u7imm:$DCMX, vrrc:$vB),
2284 "xststdcqp $BF, $vB, $DCMX", IIC_VecFP, []>;
2285
2286 // Vector Test Data Class SP/DP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002287 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002288 def XVTSTDCSP : XX2_RD6_DCMX7_RS6<60, 13, 5,
2289 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002290 "xvtstdcsp $XT, $XB, $DCMX", IIC_VecFP,
2291 [(set v4i32: $XT,
2292 (int_ppc_vsx_xvtstdcsp v4f32:$XB, imm:$DCMX))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002293 def XVTSTDCDP : XX2_RD6_DCMX7_RS6<60, 15, 5,
2294 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002295 "xvtstdcdp $XT, $XB, $DCMX", IIC_VecFP,
2296 [(set v2i64: $XT,
2297 (int_ppc_vsx_xvtstdcdp v2f64:$XB, imm:$DCMX))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002298 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002299
2300 //===--------------------------------------------------------------------===//
2301
2302 // Maximum/Minimum Type-C/Type-J DP
2303 // XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU, so we use vsrc for XT
2304 def XSMAXCDP : XX3_XT5_XA5_XB5<60, 128, "xsmaxcdp", vsrc, vsfrc, vsfrc,
2305 IIC_VecFP, []>;
2306 def XSMAXJDP : XX3_XT5_XA5_XB5<60, 144, "xsmaxjdp", vsrc, vsfrc, vsfrc,
2307 IIC_VecFP, []>;
2308 def XSMINCDP : XX3_XT5_XA5_XB5<60, 136, "xsmincdp", vsrc, vsfrc, vsfrc,
2309 IIC_VecFP, []>;
2310 def XSMINJDP : XX3_XT5_XA5_XB5<60, 152, "xsminjdp", vsrc, vsfrc, vsfrc,
2311 IIC_VecFP, []>;
2312
2313 //===--------------------------------------------------------------------===//
2314
2315 // Vector Byte-Reverse H/W/D/Q Word
2316 def XXBRH : XX2_XT6_XO5_XB6<60, 7, 475, "xxbrh", vsrc, []>;
2317 def XXBRW : XX2_XT6_XO5_XB6<60, 15, 475, "xxbrw", vsrc, []>;
2318 def XXBRD : XX2_XT6_XO5_XB6<60, 23, 475, "xxbrd", vsrc, []>;
2319 def XXBRQ : XX2_XT6_XO5_XB6<60, 31, 475, "xxbrq", vsrc, []>;
2320
2321 // Vector Permute
2322 def XXPERM : XX3_XT5_XA5_XB5<60, 26, "xxperm" , vsrc, vsrc, vsrc,
2323 IIC_VecPerm, []>;
2324 def XXPERMR : XX3_XT5_XA5_XB5<60, 58, "xxpermr", vsrc, vsrc, vsrc,
2325 IIC_VecPerm, []>;
2326
2327 // Vector Splat Immediate Byte
2328 def XXSPLTIB : X_RD6_IMM8<60, 360, (outs vsrc:$XT), (ins u8imm:$IMM8),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002329 "xxspltib $XT, $IMM8", IIC_VecPerm, []>, UseVSXReg;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002330
2331 //===--------------------------------------------------------------------===//
Kit Bartonba532dc2016-03-08 03:49:13 +00002332 // Vector/Scalar Load/Store Instructions
2333
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002334 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2335 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Kit Bartonba532dc2016-03-08 03:49:13 +00002336 let mayLoad = 1 in {
2337 // Load Vector
2338 def LXV : DQ_RD6_RS5_DQ12<61, 1, (outs vsrc:$XT), (ins memrix16:$src),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002339 "lxv $XT, $src", IIC_LdStLFD, []>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002340 // Load DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002341 def LXSD : DSForm_1<57, 2, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002342 "lxsd $vD, $src", IIC_LdStLFD, []>;
2343 // Load SP from src, convert it to DP, and place in dword[0]
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002344 def LXSSP : DSForm_1<57, 3, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002345 "lxssp $vD, $src", IIC_LdStLFD, []>;
2346
2347 // [PO T RA RB XO TX] almost equal to [PO S RA RB XO SX], but has different
2348 // "out" and "in" dag
2349 class X_XT6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2350 RegisterOperand vtype, list<dag> pattern>
2351 : XX1Form<opcode, xo, (outs vtype:$XT), (ins memrr:$src),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002352 !strconcat(opc, " $XT, $src"), IIC_LdStLFD, pattern>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002353
2354 // Load as Integer Byte/Halfword & Zero Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002355 def LXSIBZX : X_XT6_RA5_RB5<31, 781, "lxsibzx", vsfrc,
2356 [(set f64:$XT, (PPClxsizx xoaddr:$src, 1))]>;
2357 def LXSIHZX : X_XT6_RA5_RB5<31, 813, "lxsihzx", vsfrc,
2358 [(set f64:$XT, (PPClxsizx xoaddr:$src, 2))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002359
2360 // Load Vector Halfword*8/Byte*16 Indexed
2361 def LXVH8X : X_XT6_RA5_RB5<31, 812, "lxvh8x" , vsrc, []>;
2362 def LXVB16X : X_XT6_RA5_RB5<31, 876, "lxvb16x", vsrc, []>;
2363
2364 // Load Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002365 def LXVX : X_XT6_RA5_RB5<31, 268, "lxvx" , vsrc,
2366 [(set v2f64:$XT, (load xoaddr:$src))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002367
2368 // Load Vector (Left-justified) with Length
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002369 def LXVL : XX1Form<31, 269, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
2370 "lxvl $XT, $src, $rB", IIC_LdStLoad,
2371 [(set v4i32:$XT, (int_ppc_vsx_lxvl addr:$src, i64:$rB))]>,
2372 UseVSXReg;
2373 def LXVLL : XX1Form<31,301, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
2374 "lxvll $XT, $src, $rB", IIC_LdStLoad,
2375 [(set v4i32:$XT, (int_ppc_vsx_lxvll addr:$src, i64:$rB))]>,
2376 UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002377
2378 // Load Vector Word & Splat Indexed
2379 def LXVWSX : X_XT6_RA5_RB5<31, 364, "lxvwsx" , vsrc, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002380 } // mayLoad
Kit Bartonba532dc2016-03-08 03:49:13 +00002381
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002382 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2383 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Kit Bartonba532dc2016-03-08 03:49:13 +00002384 let mayStore = 1 in {
2385 // Store Vector
2386 def STXV : DQ_RD6_RS5_DQ12<61, 5, (outs), (ins vsrc:$XT, memrix16:$dst),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002387 "stxv $XT, $dst", IIC_LdStSTFD, []>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002388 // Store DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002389 def STXSD : DSForm_1<61, 2, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002390 "stxsd $vS, $dst", IIC_LdStSTFD, []>;
2391 // Convert DP of dword[0] to SP, and Store to dst
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002392 def STXSSP : DSForm_1<61, 3, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002393 "stxssp $vS, $dst", IIC_LdStSTFD, []>;
2394
2395 // [PO S RA RB XO SX]
2396 class X_XS6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2397 RegisterOperand vtype, list<dag> pattern>
2398 : XX1Form<opcode, xo, (outs), (ins vtype:$XT, memrr:$dst),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002399 !strconcat(opc, " $XT, $dst"), IIC_LdStSTFD, pattern>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002400
2401 // Store as Integer Byte/Halfword Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002402 def STXSIBX : X_XS6_RA5_RB5<31, 909, "stxsibx" , vsfrc,
2403 [(PPCstxsix f64:$XT, xoaddr:$dst, 1)]>;
2404 def STXSIHX : X_XS6_RA5_RB5<31, 941, "stxsihx" , vsfrc,
2405 [(PPCstxsix f64:$XT, xoaddr:$dst, 2)]>;
2406 let isCodeGenOnly = 1 in {
2407 def STXSIBXv : X_XS6_RA5_RB5<31, 909, "stxsibx" , vrrc, []>;
2408 def STXSIHXv : X_XS6_RA5_RB5<31, 941, "stxsihx" , vrrc, []>;
2409 }
Kit Bartonba532dc2016-03-08 03:49:13 +00002410
2411 // Store Vector Halfword*8/Byte*16 Indexed
2412 def STXVH8X : X_XS6_RA5_RB5<31, 940, "stxvh8x" , vsrc, []>;
2413 def STXVB16X : X_XS6_RA5_RB5<31, 1004, "stxvb16x", vsrc, []>;
2414
2415 // Store Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002416 def STXVX : X_XS6_RA5_RB5<31, 396, "stxvx" , vsrc,
2417 [(store v2f64:$XT, xoaddr:$dst)]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002418
2419 // Store Vector (Left-justified) with Length
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002420 def STXVL : XX1Form<31, 397, (outs), (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2421 "stxvl $XT, $dst, $rB", IIC_LdStLoad,
2422 [(int_ppc_vsx_stxvl v4i32:$XT, addr:$dst, i64:$rB)]>,
2423 UseVSXReg;
2424 def STXVLL : XX1Form<31, 429, (outs), (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2425 "stxvll $XT, $dst, $rB", IIC_LdStLoad,
2426 [(int_ppc_vsx_stxvll v4i32:$XT, addr:$dst, i64:$rB)]>,
2427 UseVSXReg;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002428 } // mayStore
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002429
2430 // Patterns for which instructions from ISA 3.0 are a better match
2431 let Predicates = [IsLittleEndian, HasP9Vector] in {
2432 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 0))))),
2433 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
2434 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 1))))),
2435 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
2436 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 2))))),
2437 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
2438 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 3))))),
2439 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
2440 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
2441 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
2442 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
2443 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
2444 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
2445 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
2446 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
2447 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
2448 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
2449 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
2450 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
2451 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
2452 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
2453 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
2454 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
2455 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
2456 } // IsLittleEndian, HasP9Vector
2457
2458 let Predicates = [IsBigEndian, HasP9Vector] in {
2459 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 0))))),
2460 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
2461 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 1))))),
2462 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
2463 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 2))))),
2464 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
2465 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 3))))),
2466 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
2467 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
2468 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
2469 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
2470 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
2471 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
2472 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
2473 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
2474 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
2475 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
2476 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
2477 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
2478 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
2479 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
2480 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
2481 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
2482 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
2483 } // IsLittleEndian, HasP9Vector
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002484
2485 def : Pat<(v2f64 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2486 def : Pat<(v2i64 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2487 def : Pat<(v4f32 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2488 def : Pat<(v4i32 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2489 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x xoaddr:$src)), (LXVX xoaddr:$src)>;
2490 def : Pat<(v2f64 (int_ppc_vsx_lxvd2x xoaddr:$src)), (LXVX xoaddr:$src)>;
2491 def : Pat<(store v2f64:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2492 def : Pat<(store v2i64:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2493 def : Pat<(store v4f32:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2494 def : Pat<(store v4i32:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2495 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
2496 (STXVX $rS, xoaddr:$dst)>;
2497 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
2498 (STXVX $rS, xoaddr:$dst)>;
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002499
2500 def : Pat<(v4i32 (scalar_to_vector (i32 (load xoaddr:$src)))),
2501 (v4i32 (LXVWSX xoaddr:$src))>;
2502 def : Pat<(v4f32 (scalar_to_vector (f32 (load xoaddr:$src)))),
2503 (v4f32 (LXVWSX xoaddr:$src))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002504 def : Pat<(v4f32 (scalar_to_vector (f32 (fpround (extloadf32 xoaddr:$src))))),
2505 (v4f32 (LXVWSX xoaddr:$src))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002506
2507 // Build vectors from i8 loads
2508 def : Pat<(v16i8 (scalar_to_vector ScalarLoads.Li8)),
2509 (v16i8 (VSPLTBs 7, (LXSIBZX xoaddr:$src)))>;
2510 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.ZELi8)),
2511 (v8i16 (VSPLTHs 3, (LXSIBZX xoaddr:$src)))>;
2512 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi8)),
2513 (v4i32 (XXSPLTWs (LXSIBZX xoaddr:$src), 1))>;
2514 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi8i64)),
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +00002515 (v2i64 (XXSPLTD0s (LXSIBZX xoaddr:$src)))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002516 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi8)),
2517 (v4i32 (XXSPLTWs (VEXTSB2Ws (LXSIBZX xoaddr:$src)), 1))>;
2518 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi8i64)),
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +00002519 (v2i64 (XXSPLTD0s (VEXTSB2Ds (LXSIBZX xoaddr:$src))))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002520
2521 // Build vectors from i16 loads
2522 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.Li16)),
2523 (v8i16 (VSPLTHs 3, (LXSIHZX xoaddr:$src)))>;
2524 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi16)),
2525 (v4i32 (XXSPLTWs (LXSIHZX xoaddr:$src), 1))>;
2526 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi16i64)),
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +00002527 (v2i64 (XXSPLTD0s (LXSIHZX xoaddr:$src)))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002528 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi16)),
2529 (v4i32 (XXSPLTWs (VEXTSH2Ws (LXSIHZX xoaddr:$src)), 1))>;
2530 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi16i64)),
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +00002531 (v2i64 (XXSPLTD0s (VEXTSH2Ds (LXSIHZX xoaddr:$src))))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002532
2533 let Predicates = [IsBigEndian, HasP9Vector] in {
2534 // Scalar stores of i8
2535 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
2536 (STXSIBXv (VSLDOI $S, $S, 9), xoaddr:$dst)>;
2537 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
2538 (STXSIBXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2539 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
2540 (STXSIBXv (VSLDOI $S, $S, 11), xoaddr:$dst)>;
2541 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
2542 (STXSIBXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2543 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
2544 (STXSIBXv (VSLDOI $S, $S, 13), xoaddr:$dst)>;
2545 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
2546 (STXSIBXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2547 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
2548 (STXSIBXv (VSLDOI $S, $S, 15), xoaddr:$dst)>;
2549 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
2550 (STXSIBXv $S, xoaddr:$dst)>;
2551 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
2552 (STXSIBXv (VSLDOI $S, $S, 1), xoaddr:$dst)>;
2553 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
2554 (STXSIBXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2555 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
2556 (STXSIBXv (VSLDOI $S, $S, 3), xoaddr:$dst)>;
2557 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
2558 (STXSIBXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2559 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
2560 (STXSIBXv (VSLDOI $S, $S, 5), xoaddr:$dst)>;
2561 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
2562 (STXSIBXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2563 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
2564 (STXSIBXv (VSLDOI $S, $S, 7), xoaddr:$dst)>;
2565 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
2566 (STXSIBXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2567
2568 // Scalar stores of i16
2569 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
2570 (STXSIHXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2571 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
2572 (STXSIHXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2573 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
2574 (STXSIHXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2575 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
2576 (STXSIHXv $S, xoaddr:$dst)>;
2577 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
2578 (STXSIHXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2579 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
2580 (STXSIHXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2581 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
2582 (STXSIHXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2583 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
2584 (STXSIHXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2585 } // IsBigEndian, HasP9Vector
2586
2587 let Predicates = [IsLittleEndian, HasP9Vector] in {
2588 // Scalar stores of i8
2589 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
2590 (STXSIBXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2591 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
2592 (STXSIBXv (VSLDOI $S, $S, 7), xoaddr:$dst)>;
2593 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
2594 (STXSIBXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2595 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
2596 (STXSIBXv (VSLDOI $S, $S, 5), xoaddr:$dst)>;
2597 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
2598 (STXSIBXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2599 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
2600 (STXSIBXv (VSLDOI $S, $S, 3), xoaddr:$dst)>;
2601 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
2602 (STXSIBXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2603 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
2604 (STXSIBXv (VSLDOI $S, $S, 1), xoaddr:$dst)>;
2605 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
2606 (STXSIBXv $S, xoaddr:$dst)>;
2607 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
2608 (STXSIBXv (VSLDOI $S, $S, 15), xoaddr:$dst)>;
2609 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
2610 (STXSIBXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2611 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
2612 (STXSIBXv (VSLDOI $S, $S, 13), xoaddr:$dst)>;
2613 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
2614 (STXSIBXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2615 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
2616 (STXSIBXv (VSLDOI $S, $S, 11), xoaddr:$dst)>;
2617 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
2618 (STXSIBXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2619 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
2620 (STXSIBXv (VSLDOI $S, $S, 9), xoaddr:$dst)>;
2621
2622 // Scalar stores of i16
2623 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
2624 (STXSIHXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2625 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
2626 (STXSIHXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2627 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
2628 (STXSIHXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2629 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
2630 (STXSIHXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2631 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
2632 (STXSIHXv $S, xoaddr:$dst)>;
2633 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
2634 (STXSIHXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2635 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
2636 (STXSIHXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2637 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
2638 (STXSIHXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2639 } // IsLittleEndian, HasP9Vector
2640
2641 // Vector sign extensions
2642 def : Pat<(f64 (PPCVexts f64:$A, 1)),
2643 (f64 (COPY_TO_REGCLASS (VEXTSB2Ds $A), VSFRC))>;
2644 def : Pat<(f64 (PPCVexts f64:$A, 2)),
2645 (f64 (COPY_TO_REGCLASS (VEXTSH2Ds $A), VSFRC))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002646
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002647 let isPseudo = 1 in {
2648 def DFLOADf32 : Pseudo<(outs vssrc:$XT), (ins memrix:$src),
2649 "#DFLOADf32",
2650 [(set f32:$XT, (load iaddr:$src))]>;
2651 def DFLOADf64 : Pseudo<(outs vsfrc:$XT), (ins memrix:$src),
2652 "#DFLOADf64",
2653 [(set f64:$XT, (load iaddr:$src))]>;
2654 def DFSTOREf32 : Pseudo<(outs), (ins vssrc:$XT, memrix:$dst),
2655 "#DFSTOREf32",
2656 [(store f32:$XT, iaddr:$dst)]>;
2657 def DFSTOREf64 : Pseudo<(outs), (ins vsfrc:$XT, memrix:$dst),
2658 "#DFSTOREf64",
2659 [(store f64:$XT, iaddr:$dst)]>;
2660 }
2661 def : Pat<(f64 (extloadf32 iaddr:$src)),
2662 (COPY_TO_REGCLASS (DFLOADf32 iaddr:$src), VSFRC)>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002663 def : Pat<(f32 (fpround (extloadf32 iaddr:$src))),
2664 (f32 (DFLOADf32 iaddr:$src))>;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002665} // end HasP9Vector, AddedComplexity
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002666
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002667// Integer extend helper dags 32 -> 64
2668def AnyExts {
2669 dag A = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32);
2670 dag B = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $B, sub_32);
2671 dag C = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $C, sub_32);
2672 dag D = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $D, sub_32);
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002673}
2674
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002675def DblToFlt {
2676 dag A0 = (f32 (fpround (f64 (extractelt v2f64:$A, 0))));
2677 dag A1 = (f32 (fpround (f64 (extractelt v2f64:$A, 1))));
2678 dag B0 = (f32 (fpround (f64 (extractelt v2f64:$B, 0))));
2679 dag B1 = (f32 (fpround (f64 (extractelt v2f64:$B, 1))));
2680}
2681def FltToIntLoad {
2682 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (extloadf32 xoaddr:$A)))));
2683}
2684def FltToUIntLoad {
2685 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (extloadf32 xoaddr:$A)))));
2686}
2687def FltToLongLoad {
2688 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (extloadf32 xoaddr:$A)))));
2689}
2690def FltToULongLoad {
2691 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (extloadf32 xoaddr:$A)))));
2692}
2693def FltToLong {
2694 dag A = (i64 (PPCmfvsr (PPCfctidz (fpextend f32:$A))));
2695}
2696def FltToULong {
2697 dag A = (i64 (PPCmfvsr (PPCfctiduz (fpextend f32:$A))));
2698}
2699def DblToInt {
2700 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwz f64:$A))));
2701}
2702def DblToUInt {
2703 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwuz f64:$A))));
2704}
2705def DblToLong {
2706 dag A = (i64 (PPCmfvsr (f64 (PPCfctidz f64:$A))));
2707}
2708def DblToULong {
2709 dag A = (i64 (PPCmfvsr (f64 (PPCfctiduz f64:$A))));
2710}
2711def DblToIntLoad {
2712 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (load xoaddr:$A)))));
2713}
2714def DblToUIntLoad {
2715 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (load xoaddr:$A)))));
2716}
2717def DblToLongLoad {
2718 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (load xoaddr:$A)))));
2719}
2720def DblToULongLoad {
2721 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (load xoaddr:$A)))));
2722}
2723
2724// FP merge dags (for f32 -> v4f32)
2725def MrgFP {
2726 dag AC = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $A, VSRC),
2727 (COPY_TO_REGCLASS $C, VSRC), 0));
2728 dag BD = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $B, VSRC),
2729 (COPY_TO_REGCLASS $D, VSRC), 0));
2730 dag ABhToFlt = (XVCVDPSP (XXPERMDI $A, $B, 0));
2731 dag ABlToFlt = (XVCVDPSP (XXPERMDI $A, $B, 3));
2732 dag BAhToFlt = (XVCVDPSP (XXPERMDI $B, $A, 0));
2733 dag BAlToFlt = (XVCVDPSP (XXPERMDI $B, $A, 3));
2734}
2735
2736// Patterns for BUILD_VECTOR nodes.
2737def NoP9Vector : Predicate<"!PPCSubTarget->hasP9Vector()">;
2738let AddedComplexity = 400 in {
2739
2740 let Predicates = [HasVSX] in {
2741 // Build vectors of floating point converted to i32.
2742 def : Pat<(v4i32 (build_vector DblToInt.A, DblToInt.A,
2743 DblToInt.A, DblToInt.A)),
2744 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPSXWS $A), VSRC), 1))>;
2745 def : Pat<(v4i32 (build_vector DblToUInt.A, DblToUInt.A,
2746 DblToUInt.A, DblToUInt.A)),
2747 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPUXWS $A), VSRC), 1))>;
2748 def : Pat<(v2i64 (build_vector DblToLong.A, DblToLong.A)),
2749 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC),
2750 (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC), 0))>;
2751 def : Pat<(v2i64 (build_vector DblToULong.A, DblToULong.A)),
2752 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC),
2753 (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC), 0))>;
2754 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
2755 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2756 (XSCVDPSXWSs (LXSSPX xoaddr:$A)), VSRC), 1))>;
2757 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
2758 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2759 (XSCVDPUXWSs (LXSSPX xoaddr:$A)), VSRC), 1))>;
2760 def : Pat<(v4f32 (build_vector f32:$A, f32:$A, f32:$A, f32:$A)),
2761 (v4f32 (XXSPLTW (v4f32 (XSCVDPSPN $A)), 0))>;
2762
2763 // Build vectors of floating point converted to i64.
2764 def : Pat<(v2i64 (build_vector FltToLong.A, FltToLong.A)),
2765 (v2i64 (XXPERMDIs (COPY_TO_REGCLASS (XSCVDPSXDSs $A), VSFRC), 0))>;
2766 def : Pat<(v2i64 (build_vector FltToULong.A, FltToULong.A)),
2767 (v2i64 (XXPERMDIs (COPY_TO_REGCLASS (XSCVDPUXDSs $A), VSFRC), 0))>;
2768 def : Pat<(v2i64 (scalar_to_vector DblToLongLoad.A)),
2769 (v2i64 (XVCVDPSXDS (LXVDSX xoaddr:$A)))>;
2770 def : Pat<(v2i64 (scalar_to_vector DblToULongLoad.A)),
2771 (v2i64 (XVCVDPUXDS (LXVDSX xoaddr:$A)))>;
2772 }
2773
2774 let Predicates = [HasVSX, NoP9Vector] in {
2775 // Load-and-splat with fp-to-int conversion (using X-Form VSX loads).
2776 def : Pat<(v4i32 (scalar_to_vector DblToIntLoad.A)),
2777 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2778 (XSCVDPSXWS (LXSDX xoaddr:$A)), VSRC), 1))>;
2779 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoad.A)),
2780 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2781 (XSCVDPUXWS (LXSDX xoaddr:$A)), VSRC), 1))>;
2782 def : Pat<(v2i64 (scalar_to_vector FltToLongLoad.A)),
2783 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
2784 (LXSSPX xoaddr:$A), VSFRC)), 0))>;
2785 def : Pat<(v2i64 (scalar_to_vector FltToULongLoad.A)),
2786 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
2787 (LXSSPX xoaddr:$A), VSFRC)), 0))>;
2788 }
2789
2790 // Big endian, available on all targets with VSX
2791 let Predicates = [IsBigEndian, HasVSX] in {
2792 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
2793 (v2f64 (XXPERMDI
2794 (COPY_TO_REGCLASS $A, VSRC),
2795 (COPY_TO_REGCLASS $B, VSRC), 0))>;
2796
2797 def : Pat<(v4f32 (build_vector f32:$A, f32:$B, f32:$C, f32:$D)),
2798 (VMRGEW MrgFP.AC, MrgFP.BD)>;
2799 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
2800 DblToFlt.B0, DblToFlt.B1)),
2801 (v4f32 (VMRGEW MrgFP.ABhToFlt, MrgFP.ABlToFlt))>;
2802 }
2803
2804 let Predicates = [IsLittleEndian, HasVSX] in {
2805 // Little endian, available on all targets with VSX
2806 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
2807 (v2f64 (XXPERMDI
2808 (COPY_TO_REGCLASS $B, VSRC),
2809 (COPY_TO_REGCLASS $A, VSRC), 0))>;
2810
2811 def : Pat<(v4f32 (build_vector f32:$D, f32:$C, f32:$B, f32:$A)),
2812 (VMRGEW MrgFP.AC, MrgFP.BD)>;
2813 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
2814 DblToFlt.B0, DblToFlt.B1)),
2815 (v4f32 (VMRGEW MrgFP.BAhToFlt, MrgFP.BAlToFlt))>;
2816 }
2817
2818 let Predicates = [HasDirectMove] in {
2819 // Endianness-neutral constant splat on P8 and newer targets. The reason
2820 // for this pattern is that on targets with direct moves, we don't expand
2821 // BUILD_VECTOR nodes for v4i32.
2822 def : Pat<(v4i32 (build_vector immSExt5NonZero:$A, immSExt5NonZero:$A,
2823 immSExt5NonZero:$A, immSExt5NonZero:$A)),
2824 (v4i32 (VSPLTISW imm:$A))>;
2825 }
2826
2827 let Predicates = [IsBigEndian, HasDirectMove, NoP9Vector] in {
2828 // Big endian integer vectors using direct moves.
2829 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
2830 (v2i64 (XXPERMDI
2831 (COPY_TO_REGCLASS (MTVSRD $A), VSRC),
2832 (COPY_TO_REGCLASS (MTVSRD $B), VSRC), 0))>;
2833 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2834 (VMRGOW (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC),
2835 (COPY_TO_REGCLASS (MTVSRWZ $C), VSRC), 0),
2836 (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC),
2837 (COPY_TO_REGCLASS (MTVSRWZ $D), VSRC), 0))>;
2838 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
2839 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
2840 }
2841
2842 let Predicates = [IsLittleEndian, HasDirectMove, NoP9Vector] in {
2843 // Little endian integer vectors using direct moves.
2844 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
2845 (v2i64 (XXPERMDI
2846 (COPY_TO_REGCLASS (MTVSRD $B), VSRC),
2847 (COPY_TO_REGCLASS (MTVSRD $A), VSRC), 0))>;
2848 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2849 (VMRGOW (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $D), VSRC),
2850 (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC), 0),
2851 (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $C), VSRC),
2852 (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 0))>;
2853 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
2854 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
2855 }
2856
2857 let Predicates = [HasP9Vector] in {
2858 // Endianness-neutral patterns for const splats with ISA 3.0 instructions.
2859 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
2860 (v4i32 (MTVSRWS $A))>;
2861 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
2862 (v4i32 (MTVSRWS $A))>;
2863 def : Pat<(v16i8 (build_vector immSExt8:$A, immSExt8:$A, immSExt8:$A,
2864 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2865 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2866 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2867 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2868 immSExt8:$A)),
2869 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB imm:$A), VSRC))>;
2870 def : Pat<(v16i8 immAllOnesV),
2871 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
2872 def : Pat<(v8i16 immAllOnesV),
2873 (v8i16 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
2874 def : Pat<(v4i32 immAllOnesV),
2875 (v4i32 (XXSPLTIB 255))>;
2876 def : Pat<(v2i64 immAllOnesV),
2877 (v2i64 (XXSPLTIB 255))>;
2878 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
2879 (v4i32 (XVCVSPSXWS (LXVWSX xoaddr:$A)))>;
2880 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
2881 (v4i32 (XVCVSPUXWS (LXVWSX xoaddr:$A)))>;
2882 def : Pat<(v4i32 (scalar_to_vector DblToIntLoad.A)),
2883 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2884 (XSCVDPSXWS (DFLOADf64 iaddr:$A)), VSRC), 1))>;
2885 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoad.A)),
2886 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2887 (XSCVDPUXWS (DFLOADf64 iaddr:$A)), VSRC), 1))>;
2888 def : Pat<(v2i64 (scalar_to_vector FltToLongLoad.A)),
2889 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
2890 (DFLOADf32 iaddr:$A),
2891 VSFRC)), 0))>;
2892 def : Pat<(v2i64 (scalar_to_vector FltToULongLoad.A)),
2893 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
2894 (DFLOADf32 iaddr:$A),
2895 VSFRC)), 0))>;
2896 }
2897
2898 let Predicates = [IsISA3_0, HasDirectMove, IsBigEndian] in {
2899 def : Pat<(i64 (extractelt v2i64:$A, 1)),
2900 (i64 (MFVSRLD $A))>;
2901 // Better way to build integer vectors if we have MTVSRDD. Big endian.
2902 def : Pat<(v2i64 (build_vector i64:$rB, i64:$rA)),
2903 (v2i64 (MTVSRDD $rB, $rA))>;
2904 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2905 (VMRGOW (COPY_TO_REGCLASS (MTVSRDD AnyExts.A, AnyExts.C), VSRC),
2906 (COPY_TO_REGCLASS (MTVSRDD AnyExts.B, AnyExts.D), VSRC))>;
2907 }
2908
2909 let Predicates = [IsISA3_0, HasDirectMove, IsLittleEndian] in {
2910 def : Pat<(i64 (extractelt v2i64:$A, 0)),
2911 (i64 (MFVSRLD $A))>;
2912 // Better way to build integer vectors if we have MTVSRDD. Little endian.
2913 def : Pat<(v2i64 (build_vector i64:$rA, i64:$rB)),
2914 (v2i64 (MTVSRDD $rB, $rA))>;
2915 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2916 (VMRGOW (COPY_TO_REGCLASS (MTVSRDD AnyExts.D, AnyExts.B), VSRC),
2917 (COPY_TO_REGCLASS (MTVSRDD AnyExts.C, AnyExts.A), VSRC))>;
2918 }
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002919}