blob: e5d375a2450ccfa0e48db7e3d70d7c5325a96480 [file] [log] [blame]
Hal Finkel27774d92014-03-13 07:58:58 +00001//===- PPCInstrVSX.td - The PowerPC VSX Extension --*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file describes the VSX extension to the PowerPC instruction set.
11//
12//===----------------------------------------------------------------------===//
13
Bill Schmidtfe723b92015-04-27 19:57:34 +000014// *********************************** NOTE ***********************************
15// ** For POWER8 Little Endian, the VSX swap optimization relies on knowing **
16// ** which VMX and VSX instructions are lane-sensitive and which are not. **
17// ** A lane-sensitive instruction relies, implicitly or explicitly, on **
18// ** whether lanes are numbered from left to right. An instruction like **
19// ** VADDFP is not lane-sensitive, because each lane of the result vector **
20// ** relies only on the corresponding lane of the source vectors. However, **
21// ** an instruction like VMULESB is lane-sensitive, because "even" and **
22// ** "odd" lanes are different for big-endian and little-endian numbering. **
23// ** **
24// ** When adding new VMX and VSX instructions, please consider whether they **
25// ** are lane-sensitive. If so, they must be added to a switch statement **
26// ** in PPCVSXSwapRemoval::gatherVectorInstructions(). **
27// ****************************************************************************
28
Hal Finkel27774d92014-03-13 07:58:58 +000029def PPCRegVSRCAsmOperand : AsmOperandClass {
30 let Name = "RegVSRC"; let PredicateMethod = "isVSRegNumber";
31}
32def vsrc : RegisterOperand<VSRC> {
33 let ParserMatchClass = PPCRegVSRCAsmOperand;
34}
35
Hal Finkel19be5062014-03-29 05:29:01 +000036def PPCRegVSFRCAsmOperand : AsmOperandClass {
37 let Name = "RegVSFRC"; let PredicateMethod = "isVSRegNumber";
38}
39def vsfrc : RegisterOperand<VSFRC> {
40 let ParserMatchClass = PPCRegVSFRCAsmOperand;
41}
42
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +000043def PPCRegVSSRCAsmOperand : AsmOperandClass {
44 let Name = "RegVSSRC"; let PredicateMethod = "isVSRegNumber";
45}
46def vssrc : RegisterOperand<VSSRC> {
47 let ParserMatchClass = PPCRegVSSRCAsmOperand;
48}
49
Bill Schmidtfae5d712014-12-09 16:35:51 +000050// Little-endian-specific nodes.
51def SDT_PPClxvd2x : SDTypeProfile<1, 1, [
52 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
53]>;
54def SDT_PPCstxvd2x : SDTypeProfile<0, 2, [
55 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
56]>;
57def SDT_PPCxxswapd : SDTypeProfile<1, 1, [
58 SDTCisSameAs<0, 1>
59]>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000060def SDTVecConv : SDTypeProfile<1, 2, [
61 SDTCisVec<0>, SDTCisVec<1>, SDTCisPtrTy<2>
62]>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000063
64def PPClxvd2x : SDNode<"PPCISD::LXVD2X", SDT_PPClxvd2x,
65 [SDNPHasChain, SDNPMayLoad]>;
66def PPCstxvd2x : SDNode<"PPCISD::STXVD2X", SDT_PPCstxvd2x,
67 [SDNPHasChain, SDNPMayStore]>;
68def PPCxxswapd : SDNode<"PPCISD::XXSWAPD", SDT_PPCxxswapd, [SDNPHasChain]>;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +000069def PPCmfvsr : SDNode<"PPCISD::MFVSR", SDTUnaryOp, []>;
70def PPCmtvsra : SDNode<"PPCISD::MTVSRA", SDTUnaryOp, []>;
71def PPCmtvsrz : SDNode<"PPCISD::MTVSRZ", SDTUnaryOp, []>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000072def PPCsvec2fp : SDNode<"PPCISD::SINT_VEC_TO_FP", SDTVecConv, []>;
73def PPCuvec2fp: SDNode<"PPCISD::UINT_VEC_TO_FP", SDTVecConv, []>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +000074def PPCswapNoChain : SDNode<"PPCISD::SWAP_NO_CHAIN", SDT_PPCxxswapd>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000075
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000076multiclass XX3Form_Rcr<bits<6> opcode, bits<7> xo, string asmbase,
77 string asmstr, InstrItinClass itin, Intrinsic Int,
78 ValueType OutTy, ValueType InTy> {
Hal Finkel27774d92014-03-13 07:58:58 +000079 let BaseName = asmbase in {
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000080 def NAME : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000081 !strconcat(asmbase, !strconcat(" ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000082 [(set OutTy:$XT, (Int InTy:$XA, InTy:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +000083 let Defs = [CR6] in
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000084 def o : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000085 !strconcat(asmbase, !strconcat(". ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000086 [(set InTy:$XT,
87 (InTy (PPCvcmp_o InTy:$XA, InTy:$XB, xo)))]>,
88 isDOT;
Hal Finkel27774d92014-03-13 07:58:58 +000089 }
90}
91
Nemanja Ivanovic11049f82016-10-04 06:59:23 +000092// Instruction form with a single input register for instructions such as
93// XXPERMDI. The reason for defining this is that specifying multiple chained
94// operands (such as loads) to an instruction will perform both chained
95// operations rather than coalescing them into a single register - even though
96// the source memory location is the same. This simply forces the instruction
97// to use the same register for both inputs.
98// For example, an output DAG such as this:
99// (XXPERMDI (LXSIBZX xoaddr:$src), (LXSIBZX xoaddr:$src ), 0))
100// would result in two load instructions emitted and used as separate inputs
101// to the XXPERMDI instruction.
102class XX3Form_2s<bits<6> opcode, bits<5> xo, dag OOL, dag IOL, string asmstr,
103 InstrItinClass itin, list<dag> pattern>
104 : XX3Form_2<opcode, xo, OOL, IOL, asmstr, itin, pattern> {
105 let XB = XA;
106}
107
Eric Christopher1b8e7632014-05-22 01:07:24 +0000108def HasVSX : Predicate<"PPCSubTarget->hasVSX()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000109def IsLittleEndian : Predicate<"PPCSubTarget->isLittleEndian()">;
110def IsBigEndian : Predicate<"!PPCSubTarget->isLittleEndian()">;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000111def HasOnlySwappingMemOps : Predicate<"!PPCSubTarget->hasP9Vector()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000112
Hal Finkel27774d92014-03-13 07:58:58 +0000113let Predicates = [HasVSX] in {
114let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000115let UseVSXReg = 1 in {
Craig Topperc50d64b2014-11-26 00:46:26 +0000116let hasSideEffects = 0 in { // VSX instructions don't have side effects.
Hal Finkel27774d92014-03-13 07:58:58 +0000117let Uses = [RM] in {
118
119 // Load indexed instructions
Hal Finkel6a778fb2015-03-11 23:28:38 +0000120 let mayLoad = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000121 let CodeSize = 3 in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000122 def LXSDX : XX1Form<31, 588,
Hal Finkel19be5062014-03-29 05:29:01 +0000123 (outs vsfrc:$XT), (ins memrr:$src),
Hal Finkel27774d92014-03-13 07:58:58 +0000124 "lxsdx $XT, $src", IIC_LdStLFD,
125 [(set f64:$XT, (load xoaddr:$src))]>;
126
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000127 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000128 def LXVD2X : XX1Form<31, 844,
Hal Finkel27774d92014-03-13 07:58:58 +0000129 (outs vsrc:$XT), (ins memrr:$src),
130 "lxvd2x $XT, $src", IIC_LdStLFD,
Bill Schmidt72954782014-11-12 04:19:40 +0000131 [(set v2f64:$XT, (int_ppc_vsx_lxvd2x xoaddr:$src))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000132
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000133 def LXVDSX : XX1Form<31, 332,
Hal Finkel27774d92014-03-13 07:58:58 +0000134 (outs vsrc:$XT), (ins memrr:$src),
135 "lxvdsx $XT, $src", IIC_LdStLFD, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000136
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000137 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000138 def LXVW4X : XX1Form<31, 780,
Hal Finkel27774d92014-03-13 07:58:58 +0000139 (outs vsrc:$XT), (ins memrr:$src),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000140 "lxvw4x $XT, $src", IIC_LdStLFD,
Nemanja Ivanovicf57f1502016-11-29 23:00:33 +0000141 [(set v4i32:$XT, (int_ppc_vsx_lxvw4x xoaddr:$src))]>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000142 } // mayLoad
Hal Finkel27774d92014-03-13 07:58:58 +0000143
144 // Store indexed instructions
145 let mayStore = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000146 let CodeSize = 3 in
Hal Finkel27774d92014-03-13 07:58:58 +0000147 def STXSDX : XX1Form<31, 716,
Hal Finkel19be5062014-03-29 05:29:01 +0000148 (outs), (ins vsfrc:$XT, memrr:$dst),
Hal Finkel27774d92014-03-13 07:58:58 +0000149 "stxsdx $XT, $dst", IIC_LdStSTFD,
150 [(store f64:$XT, xoaddr:$dst)]>;
151
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000152 let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000153 // The behaviour of this instruction is endianness-specific so we provide no
154 // pattern to match it without considering endianness.
Hal Finkel27774d92014-03-13 07:58:58 +0000155 def STXVD2X : XX1Form<31, 972,
156 (outs), (ins vsrc:$XT, memrr:$dst),
157 "stxvd2x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000158 []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000159
160 def STXVW4X : XX1Form<31, 908,
161 (outs), (ins vsrc:$XT, memrr:$dst),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000162 "stxvw4x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovicf57f1502016-11-29 23:00:33 +0000163 [(store v4i32:$XT, xoaddr:$dst)]>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000164 }
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000165 } // mayStore
Hal Finkel27774d92014-03-13 07:58:58 +0000166
167 // Add/Mul Instructions
168 let isCommutable = 1 in {
169 def XSADDDP : XX3Form<60, 32,
Hal Finkel19be5062014-03-29 05:29:01 +0000170 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000171 "xsadddp $XT, $XA, $XB", IIC_VecFP,
172 [(set f64:$XT, (fadd f64:$XA, f64:$XB))]>;
173 def XSMULDP : XX3Form<60, 48,
Hal Finkel19be5062014-03-29 05:29:01 +0000174 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000175 "xsmuldp $XT, $XA, $XB", IIC_VecFP,
176 [(set f64:$XT, (fmul f64:$XA, f64:$XB))]>;
177
178 def XVADDDP : XX3Form<60, 96,
179 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
180 "xvadddp $XT, $XA, $XB", IIC_VecFP,
181 [(set v2f64:$XT, (fadd v2f64:$XA, v2f64:$XB))]>;
182
183 def XVADDSP : XX3Form<60, 64,
184 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
185 "xvaddsp $XT, $XA, $XB", IIC_VecFP,
186 [(set v4f32:$XT, (fadd v4f32:$XA, v4f32:$XB))]>;
187
188 def XVMULDP : XX3Form<60, 112,
189 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
190 "xvmuldp $XT, $XA, $XB", IIC_VecFP,
191 [(set v2f64:$XT, (fmul v2f64:$XA, v2f64:$XB))]>;
192
193 def XVMULSP : XX3Form<60, 80,
194 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
195 "xvmulsp $XT, $XA, $XB", IIC_VecFP,
196 [(set v4f32:$XT, (fmul v4f32:$XA, v4f32:$XB))]>;
197 }
198
199 // Subtract Instructions
200 def XSSUBDP : XX3Form<60, 40,
Hal Finkel19be5062014-03-29 05:29:01 +0000201 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000202 "xssubdp $XT, $XA, $XB", IIC_VecFP,
203 [(set f64:$XT, (fsub f64:$XA, f64:$XB))]>;
204
205 def XVSUBDP : XX3Form<60, 104,
206 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
207 "xvsubdp $XT, $XA, $XB", IIC_VecFP,
208 [(set v2f64:$XT, (fsub v2f64:$XA, v2f64:$XB))]>;
209 def XVSUBSP : XX3Form<60, 72,
210 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
211 "xvsubsp $XT, $XA, $XB", IIC_VecFP,
212 [(set v4f32:$XT, (fsub v4f32:$XA, v4f32:$XB))]>;
213
214 // FMA Instructions
Hal Finkel25e04542014-03-25 18:55:11 +0000215 let BaseName = "XSMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000216 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000217 def XSMADDADP : XX3Form<60, 33,
Hal Finkel19be5062014-03-29 05:29:01 +0000218 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000219 "xsmaddadp $XT, $XA, $XB", IIC_VecFP,
220 [(set f64:$XT, (fma f64:$XA, f64:$XB, f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000221 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
222 AltVSXFMARel;
223 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000224 def XSMADDMDP : XX3Form<60, 41,
Hal Finkel19be5062014-03-29 05:29:01 +0000225 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000226 "xsmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000227 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
228 AltVSXFMARel;
229 }
Hal Finkel27774d92014-03-13 07:58:58 +0000230
Hal Finkel25e04542014-03-25 18:55:11 +0000231 let BaseName = "XSMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000232 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000233 def XSMSUBADP : XX3Form<60, 49,
Hal Finkel19be5062014-03-29 05:29:01 +0000234 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000235 "xsmsubadp $XT, $XA, $XB", IIC_VecFP,
236 [(set f64:$XT, (fma f64:$XA, f64:$XB, (fneg f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000237 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
238 AltVSXFMARel;
239 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000240 def XSMSUBMDP : XX3Form<60, 57,
Hal Finkel19be5062014-03-29 05:29:01 +0000241 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000242 "xsmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000243 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
244 AltVSXFMARel;
245 }
Hal Finkel27774d92014-03-13 07:58:58 +0000246
Hal Finkel25e04542014-03-25 18:55:11 +0000247 let BaseName = "XSNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000248 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000249 def XSNMADDADP : XX3Form<60, 161,
Hal Finkel19be5062014-03-29 05:29:01 +0000250 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000251 "xsnmaddadp $XT, $XA, $XB", IIC_VecFP,
252 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000253 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
254 AltVSXFMARel;
255 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000256 def XSNMADDMDP : XX3Form<60, 169,
Hal Finkel19be5062014-03-29 05:29:01 +0000257 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000258 "xsnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000259 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
260 AltVSXFMARel;
261 }
Hal Finkel27774d92014-03-13 07:58:58 +0000262
Hal Finkel25e04542014-03-25 18:55:11 +0000263 let BaseName = "XSNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000264 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000265 def XSNMSUBADP : XX3Form<60, 177,
Hal Finkel19be5062014-03-29 05:29:01 +0000266 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000267 "xsnmsubadp $XT, $XA, $XB", IIC_VecFP,
268 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, (fneg f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000269 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
270 AltVSXFMARel;
271 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000272 def XSNMSUBMDP : XX3Form<60, 185,
Hal Finkel19be5062014-03-29 05:29:01 +0000273 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000274 "xsnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000275 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
276 AltVSXFMARel;
277 }
Hal Finkel27774d92014-03-13 07:58:58 +0000278
Hal Finkel25e04542014-03-25 18:55:11 +0000279 let BaseName = "XVMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000280 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000281 def XVMADDADP : XX3Form<60, 97,
282 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
283 "xvmaddadp $XT, $XA, $XB", IIC_VecFP,
284 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000285 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
286 AltVSXFMARel;
287 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000288 def XVMADDMDP : XX3Form<60, 105,
289 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
290 "xvmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000291 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
292 AltVSXFMARel;
293 }
Hal Finkel27774d92014-03-13 07:58:58 +0000294
Hal Finkel25e04542014-03-25 18:55:11 +0000295 let BaseName = "XVMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000296 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000297 def XVMADDASP : XX3Form<60, 65,
298 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
299 "xvmaddasp $XT, $XA, $XB", IIC_VecFP,
300 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000301 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
302 AltVSXFMARel;
303 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000304 def XVMADDMSP : XX3Form<60, 73,
305 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
306 "xvmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000307 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
308 AltVSXFMARel;
309 }
Hal Finkel27774d92014-03-13 07:58:58 +0000310
Hal Finkel25e04542014-03-25 18:55:11 +0000311 let BaseName = "XVMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000312 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000313 def XVMSUBADP : XX3Form<60, 113,
314 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
315 "xvmsubadp $XT, $XA, $XB", IIC_VecFP,
316 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000317 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
318 AltVSXFMARel;
319 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000320 def XVMSUBMDP : XX3Form<60, 121,
321 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
322 "xvmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000323 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
324 AltVSXFMARel;
325 }
Hal Finkel27774d92014-03-13 07:58:58 +0000326
Hal Finkel25e04542014-03-25 18:55:11 +0000327 let BaseName = "XVMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000328 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000329 def XVMSUBASP : XX3Form<60, 81,
330 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
331 "xvmsubasp $XT, $XA, $XB", IIC_VecFP,
332 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000333 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
334 AltVSXFMARel;
335 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000336 def XVMSUBMSP : XX3Form<60, 89,
337 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
338 "xvmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000339 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
340 AltVSXFMARel;
341 }
Hal Finkel27774d92014-03-13 07:58:58 +0000342
Hal Finkel25e04542014-03-25 18:55:11 +0000343 let BaseName = "XVNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000344 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000345 def XVNMADDADP : XX3Form<60, 225,
346 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
347 "xvnmaddadp $XT, $XA, $XB", IIC_VecFP,
348 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000349 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
350 AltVSXFMARel;
351 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000352 def XVNMADDMDP : XX3Form<60, 233,
353 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
354 "xvnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000355 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
356 AltVSXFMARel;
357 }
Hal Finkel27774d92014-03-13 07:58:58 +0000358
Hal Finkel25e04542014-03-25 18:55:11 +0000359 let BaseName = "XVNMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000360 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000361 def XVNMADDASP : XX3Form<60, 193,
362 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
363 "xvnmaddasp $XT, $XA, $XB", IIC_VecFP,
364 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000365 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
366 AltVSXFMARel;
367 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000368 def XVNMADDMSP : XX3Form<60, 201,
369 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
370 "xvnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000371 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
372 AltVSXFMARel;
373 }
Hal Finkel27774d92014-03-13 07:58:58 +0000374
Hal Finkel25e04542014-03-25 18:55:11 +0000375 let BaseName = "XVNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000376 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000377 def XVNMSUBADP : XX3Form<60, 241,
378 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
379 "xvnmsubadp $XT, $XA, $XB", IIC_VecFP,
380 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000381 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
382 AltVSXFMARel;
383 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000384 def XVNMSUBMDP : XX3Form<60, 249,
385 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
386 "xvnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000387 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
388 AltVSXFMARel;
389 }
Hal Finkel27774d92014-03-13 07:58:58 +0000390
Hal Finkel25e04542014-03-25 18:55:11 +0000391 let BaseName = "XVNMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000392 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000393 def XVNMSUBASP : XX3Form<60, 209,
394 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
395 "xvnmsubasp $XT, $XA, $XB", IIC_VecFP,
396 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000397 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
398 AltVSXFMARel;
399 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000400 def XVNMSUBMSP : XX3Form<60, 217,
401 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
402 "xvnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000403 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
404 AltVSXFMARel;
405 }
Hal Finkel27774d92014-03-13 07:58:58 +0000406
407 // Division Instructions
408 def XSDIVDP : XX3Form<60, 56,
Hal Finkel19be5062014-03-29 05:29:01 +0000409 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000410 "xsdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000411 [(set f64:$XT, (fdiv f64:$XA, f64:$XB))]>;
412 def XSSQRTDP : XX2Form<60, 75,
Hal Finkel19be5062014-03-29 05:29:01 +0000413 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000414 "xssqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000415 [(set f64:$XT, (fsqrt f64:$XB))]>;
416
417 def XSREDP : XX2Form<60, 90,
Hal Finkel19be5062014-03-29 05:29:01 +0000418 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000419 "xsredp $XT, $XB", IIC_VecFP,
420 [(set f64:$XT, (PPCfre f64:$XB))]>;
421 def XSRSQRTEDP : XX2Form<60, 74,
Hal Finkel19be5062014-03-29 05:29:01 +0000422 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000423 "xsrsqrtedp $XT, $XB", IIC_VecFP,
424 [(set f64:$XT, (PPCfrsqrte f64:$XB))]>;
425
426 def XSTDIVDP : XX3Form_1<60, 61,
Hal Finkel19be5062014-03-29 05:29:01 +0000427 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000428 "xstdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000429 def XSTSQRTDP : XX2Form_1<60, 106,
Hal Finkel19be5062014-03-29 05:29:01 +0000430 (outs crrc:$crD), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000431 "xstsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000432
433 def XVDIVDP : XX3Form<60, 120,
434 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000435 "xvdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000436 [(set v2f64:$XT, (fdiv v2f64:$XA, v2f64:$XB))]>;
437 def XVDIVSP : XX3Form<60, 88,
438 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000439 "xvdivsp $XT, $XA, $XB", IIC_FPDivS,
Hal Finkel27774d92014-03-13 07:58:58 +0000440 [(set v4f32:$XT, (fdiv v4f32:$XA, v4f32:$XB))]>;
441
442 def XVSQRTDP : XX2Form<60, 203,
443 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000444 "xvsqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000445 [(set v2f64:$XT, (fsqrt v2f64:$XB))]>;
446 def XVSQRTSP : XX2Form<60, 139,
447 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000448 "xvsqrtsp $XT, $XB", IIC_FPSqrtS,
Hal Finkel27774d92014-03-13 07:58:58 +0000449 [(set v4f32:$XT, (fsqrt v4f32:$XB))]>;
450
451 def XVTDIVDP : XX3Form_1<60, 125,
452 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000453 "xvtdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000454 def XVTDIVSP : XX3Form_1<60, 93,
455 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000456 "xvtdivsp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000457
458 def XVTSQRTDP : XX2Form_1<60, 234,
459 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000460 "xvtsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000461 def XVTSQRTSP : XX2Form_1<60, 170,
462 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000463 "xvtsqrtsp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000464
465 def XVREDP : XX2Form<60, 218,
466 (outs vsrc:$XT), (ins vsrc:$XB),
467 "xvredp $XT, $XB", IIC_VecFP,
468 [(set v2f64:$XT, (PPCfre v2f64:$XB))]>;
469 def XVRESP : XX2Form<60, 154,
470 (outs vsrc:$XT), (ins vsrc:$XB),
471 "xvresp $XT, $XB", IIC_VecFP,
472 [(set v4f32:$XT, (PPCfre v4f32:$XB))]>;
473
474 def XVRSQRTEDP : XX2Form<60, 202,
475 (outs vsrc:$XT), (ins vsrc:$XB),
476 "xvrsqrtedp $XT, $XB", IIC_VecFP,
477 [(set v2f64:$XT, (PPCfrsqrte v2f64:$XB))]>;
478 def XVRSQRTESP : XX2Form<60, 138,
479 (outs vsrc:$XT), (ins vsrc:$XB),
480 "xvrsqrtesp $XT, $XB", IIC_VecFP,
481 [(set v4f32:$XT, (PPCfrsqrte v4f32:$XB))]>;
482
483 // Compare Instructions
484 def XSCMPODP : XX3Form_1<60, 43,
Hal Finkel19be5062014-03-29 05:29:01 +0000485 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000486 "xscmpodp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000487 def XSCMPUDP : XX3Form_1<60, 35,
Hal Finkel19be5062014-03-29 05:29:01 +0000488 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000489 "xscmpudp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000490
491 defm XVCMPEQDP : XX3Form_Rcr<60, 99,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000492 "xvcmpeqdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000493 int_ppc_vsx_xvcmpeqdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000494 defm XVCMPEQSP : XX3Form_Rcr<60, 67,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000495 "xvcmpeqsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000496 int_ppc_vsx_xvcmpeqsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000497 defm XVCMPGEDP : XX3Form_Rcr<60, 115,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000498 "xvcmpgedp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000499 int_ppc_vsx_xvcmpgedp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000500 defm XVCMPGESP : XX3Form_Rcr<60, 83,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000501 "xvcmpgesp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000502 int_ppc_vsx_xvcmpgesp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000503 defm XVCMPGTDP : XX3Form_Rcr<60, 107,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000504 "xvcmpgtdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000505 int_ppc_vsx_xvcmpgtdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000506 defm XVCMPGTSP : XX3Form_Rcr<60, 75,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000507 "xvcmpgtsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000508 int_ppc_vsx_xvcmpgtsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000509
510 // Move Instructions
511 def XSABSDP : XX2Form<60, 345,
Hal Finkel19be5062014-03-29 05:29:01 +0000512 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000513 "xsabsdp $XT, $XB", IIC_VecFP,
514 [(set f64:$XT, (fabs f64:$XB))]>;
515 def XSNABSDP : XX2Form<60, 361,
Hal Finkel19be5062014-03-29 05:29:01 +0000516 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000517 "xsnabsdp $XT, $XB", IIC_VecFP,
518 [(set f64:$XT, (fneg (fabs f64:$XB)))]>;
519 def XSNEGDP : XX2Form<60, 377,
Hal Finkel19be5062014-03-29 05:29:01 +0000520 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000521 "xsnegdp $XT, $XB", IIC_VecFP,
522 [(set f64:$XT, (fneg f64:$XB))]>;
523 def XSCPSGNDP : XX3Form<60, 176,
Hal Finkel19be5062014-03-29 05:29:01 +0000524 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000525 "xscpsgndp $XT, $XA, $XB", IIC_VecFP,
526 [(set f64:$XT, (fcopysign f64:$XB, f64:$XA))]>;
527
528 def XVABSDP : XX2Form<60, 473,
529 (outs vsrc:$XT), (ins vsrc:$XB),
530 "xvabsdp $XT, $XB", IIC_VecFP,
531 [(set v2f64:$XT, (fabs v2f64:$XB))]>;
532
533 def XVABSSP : XX2Form<60, 409,
534 (outs vsrc:$XT), (ins vsrc:$XB),
535 "xvabssp $XT, $XB", IIC_VecFP,
536 [(set v4f32:$XT, (fabs v4f32:$XB))]>;
537
538 def XVCPSGNDP : XX3Form<60, 240,
539 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
540 "xvcpsgndp $XT, $XA, $XB", IIC_VecFP,
541 [(set v2f64:$XT, (fcopysign v2f64:$XB, v2f64:$XA))]>;
542 def XVCPSGNSP : XX3Form<60, 208,
543 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
544 "xvcpsgnsp $XT, $XA, $XB", IIC_VecFP,
545 [(set v4f32:$XT, (fcopysign v4f32:$XB, v4f32:$XA))]>;
546
547 def XVNABSDP : XX2Form<60, 489,
548 (outs vsrc:$XT), (ins vsrc:$XB),
549 "xvnabsdp $XT, $XB", IIC_VecFP,
550 [(set v2f64:$XT, (fneg (fabs v2f64:$XB)))]>;
551 def XVNABSSP : XX2Form<60, 425,
552 (outs vsrc:$XT), (ins vsrc:$XB),
553 "xvnabssp $XT, $XB", IIC_VecFP,
554 [(set v4f32:$XT, (fneg (fabs v4f32:$XB)))]>;
555
556 def XVNEGDP : XX2Form<60, 505,
557 (outs vsrc:$XT), (ins vsrc:$XB),
558 "xvnegdp $XT, $XB", IIC_VecFP,
559 [(set v2f64:$XT, (fneg v2f64:$XB))]>;
560 def XVNEGSP : XX2Form<60, 441,
561 (outs vsrc:$XT), (ins vsrc:$XB),
562 "xvnegsp $XT, $XB", IIC_VecFP,
563 [(set v4f32:$XT, (fneg v4f32:$XB))]>;
564
565 // Conversion Instructions
566 def XSCVDPSP : XX2Form<60, 265,
Hal Finkel19be5062014-03-29 05:29:01 +0000567 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000568 "xscvdpsp $XT, $XB", IIC_VecFP, []>;
569 def XSCVDPSXDS : XX2Form<60, 344,
Hal Finkel19be5062014-03-29 05:29:01 +0000570 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000571 "xscvdpsxds $XT, $XB", IIC_VecFP,
572 [(set f64:$XT, (PPCfctidz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000573 let isCodeGenOnly = 1 in
574 def XSCVDPSXDSs : XX2Form<60, 344,
575 (outs vssrc:$XT), (ins vssrc:$XB),
576 "xscvdpsxds $XT, $XB", IIC_VecFP,
577 [(set f32:$XT, (PPCfctidz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000578 def XSCVDPSXWS : XX2Form<60, 88,
Hal Finkel19be5062014-03-29 05:29:01 +0000579 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000580 "xscvdpsxws $XT, $XB", IIC_VecFP,
581 [(set f64:$XT, (PPCfctiwz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000582 let isCodeGenOnly = 1 in
583 def XSCVDPSXWSs : XX2Form<60, 88,
584 (outs vssrc:$XT), (ins vssrc:$XB),
585 "xscvdpsxws $XT, $XB", IIC_VecFP,
586 [(set f32:$XT, (PPCfctiwz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000587 def XSCVDPUXDS : XX2Form<60, 328,
Hal Finkel19be5062014-03-29 05:29:01 +0000588 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000589 "xscvdpuxds $XT, $XB", IIC_VecFP,
590 [(set f64:$XT, (PPCfctiduz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000591 let isCodeGenOnly = 1 in
592 def XSCVDPUXDSs : XX2Form<60, 328,
593 (outs vssrc:$XT), (ins vssrc:$XB),
594 "xscvdpuxds $XT, $XB", IIC_VecFP,
595 [(set f32:$XT, (PPCfctiduz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000596 def XSCVDPUXWS : XX2Form<60, 72,
Hal Finkel19be5062014-03-29 05:29:01 +0000597 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000598 "xscvdpuxws $XT, $XB", IIC_VecFP,
599 [(set f64:$XT, (PPCfctiwuz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000600 let isCodeGenOnly = 1 in
601 def XSCVDPUXWSs : XX2Form<60, 72,
602 (outs vssrc:$XT), (ins vssrc:$XB),
603 "xscvdpuxws $XT, $XB", IIC_VecFP,
604 [(set f32:$XT, (PPCfctiwuz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000605 def XSCVSPDP : XX2Form<60, 329,
Hal Finkel19be5062014-03-29 05:29:01 +0000606 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000607 "xscvspdp $XT, $XB", IIC_VecFP, []>;
608 def XSCVSXDDP : XX2Form<60, 376,
Hal Finkel19be5062014-03-29 05:29:01 +0000609 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000610 "xscvsxddp $XT, $XB", IIC_VecFP,
611 [(set f64:$XT, (PPCfcfid f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000612 def XSCVUXDDP : XX2Form<60, 360,
Hal Finkel19be5062014-03-29 05:29:01 +0000613 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000614 "xscvuxddp $XT, $XB", IIC_VecFP,
615 [(set f64:$XT, (PPCfcfidu f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000616
617 def XVCVDPSP : XX2Form<60, 393,
618 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000619 "xvcvdpsp $XT, $XB", IIC_VecFP,
620 [(set v4f32:$XT, (int_ppc_vsx_xvcvdpsp v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000621 def XVCVDPSXDS : XX2Form<60, 472,
622 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000623 "xvcvdpsxds $XT, $XB", IIC_VecFP,
624 [(set v2i64:$XT, (fp_to_sint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000625 def XVCVDPSXWS : XX2Form<60, 216,
626 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000627 "xvcvdpsxws $XT, $XB", IIC_VecFP,
628 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpsxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000629 def XVCVDPUXDS : XX2Form<60, 456,
630 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000631 "xvcvdpuxds $XT, $XB", IIC_VecFP,
632 [(set v2i64:$XT, (fp_to_uint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000633 def XVCVDPUXWS : XX2Form<60, 200,
634 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000635 "xvcvdpuxws $XT, $XB", IIC_VecFP,
636 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpuxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000637
638 def XVCVSPDP : XX2Form<60, 457,
639 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000640 "xvcvspdp $XT, $XB", IIC_VecFP,
641 [(set v2f64:$XT, (int_ppc_vsx_xvcvspdp v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000642 def XVCVSPSXDS : XX2Form<60, 408,
643 (outs vsrc:$XT), (ins vsrc:$XB),
644 "xvcvspsxds $XT, $XB", IIC_VecFP, []>;
645 def XVCVSPSXWS : XX2Form<60, 152,
646 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000647 "xvcvspsxws $XT, $XB", IIC_VecFP,
648 [(set v4i32:$XT, (fp_to_sint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000649 def XVCVSPUXDS : XX2Form<60, 392,
650 (outs vsrc:$XT), (ins vsrc:$XB),
651 "xvcvspuxds $XT, $XB", IIC_VecFP, []>;
652 def XVCVSPUXWS : XX2Form<60, 136,
653 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000654 "xvcvspuxws $XT, $XB", IIC_VecFP,
655 [(set v4i32:$XT, (fp_to_uint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000656 def XVCVSXDDP : XX2Form<60, 504,
657 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000658 "xvcvsxddp $XT, $XB", IIC_VecFP,
659 [(set v2f64:$XT, (sint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000660 def XVCVSXDSP : XX2Form<60, 440,
661 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000662 "xvcvsxdsp $XT, $XB", IIC_VecFP,
663 [(set v4f32:$XT, (int_ppc_vsx_xvcvsxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000664 def XVCVSXWDP : XX2Form<60, 248,
665 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000666 "xvcvsxwdp $XT, $XB", IIC_VecFP,
667 [(set v2f64:$XT, (int_ppc_vsx_xvcvsxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000668 def XVCVSXWSP : XX2Form<60, 184,
669 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic44513e52016-07-05 09:22:29 +0000670 "xvcvsxwsp $XT, $XB", IIC_VecFP,
671 [(set v4f32:$XT, (sint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000672 def XVCVUXDDP : XX2Form<60, 488,
673 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000674 "xvcvuxddp $XT, $XB", IIC_VecFP,
675 [(set v2f64:$XT, (uint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000676 def XVCVUXDSP : XX2Form<60, 424,
677 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000678 "xvcvuxdsp $XT, $XB", IIC_VecFP,
679 [(set v4f32:$XT, (int_ppc_vsx_xvcvuxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000680 def XVCVUXWDP : XX2Form<60, 232,
681 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000682 "xvcvuxwdp $XT, $XB", IIC_VecFP,
683 [(set v2f64:$XT, (int_ppc_vsx_xvcvuxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000684 def XVCVUXWSP : XX2Form<60, 168,
685 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000686 "xvcvuxwsp $XT, $XB", IIC_VecFP,
687 [(set v4f32:$XT, (uint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000688
689 // Rounding Instructions
690 def XSRDPI : XX2Form<60, 73,
Hal Finkel19be5062014-03-29 05:29:01 +0000691 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000692 "xsrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000693 [(set f64:$XT, (fround f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000694 def XSRDPIC : XX2Form<60, 107,
Hal Finkel19be5062014-03-29 05:29:01 +0000695 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000696 "xsrdpic $XT, $XB", IIC_VecFP,
697 [(set f64:$XT, (fnearbyint f64:$XB))]>;
698 def XSRDPIM : XX2Form<60, 121,
Hal Finkel19be5062014-03-29 05:29:01 +0000699 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000700 "xsrdpim $XT, $XB", IIC_VecFP,
701 [(set f64:$XT, (ffloor f64:$XB))]>;
702 def XSRDPIP : XX2Form<60, 105,
Hal Finkel19be5062014-03-29 05:29:01 +0000703 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000704 "xsrdpip $XT, $XB", IIC_VecFP,
705 [(set f64:$XT, (fceil f64:$XB))]>;
706 def XSRDPIZ : XX2Form<60, 89,
Hal Finkel19be5062014-03-29 05:29:01 +0000707 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000708 "xsrdpiz $XT, $XB", IIC_VecFP,
709 [(set f64:$XT, (ftrunc f64:$XB))]>;
710
711 def XVRDPI : XX2Form<60, 201,
712 (outs vsrc:$XT), (ins vsrc:$XB),
713 "xvrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000714 [(set v2f64:$XT, (fround v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000715 def XVRDPIC : XX2Form<60, 235,
716 (outs vsrc:$XT), (ins vsrc:$XB),
717 "xvrdpic $XT, $XB", IIC_VecFP,
718 [(set v2f64:$XT, (fnearbyint v2f64:$XB))]>;
719 def XVRDPIM : XX2Form<60, 249,
720 (outs vsrc:$XT), (ins vsrc:$XB),
721 "xvrdpim $XT, $XB", IIC_VecFP,
722 [(set v2f64:$XT, (ffloor v2f64:$XB))]>;
723 def XVRDPIP : XX2Form<60, 233,
724 (outs vsrc:$XT), (ins vsrc:$XB),
725 "xvrdpip $XT, $XB", IIC_VecFP,
726 [(set v2f64:$XT, (fceil v2f64:$XB))]>;
727 def XVRDPIZ : XX2Form<60, 217,
728 (outs vsrc:$XT), (ins vsrc:$XB),
729 "xvrdpiz $XT, $XB", IIC_VecFP,
730 [(set v2f64:$XT, (ftrunc v2f64:$XB))]>;
731
732 def XVRSPI : XX2Form<60, 137,
733 (outs vsrc:$XT), (ins vsrc:$XB),
734 "xvrspi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000735 [(set v4f32:$XT, (fround v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000736 def XVRSPIC : XX2Form<60, 171,
737 (outs vsrc:$XT), (ins vsrc:$XB),
738 "xvrspic $XT, $XB", IIC_VecFP,
739 [(set v4f32:$XT, (fnearbyint v4f32:$XB))]>;
740 def XVRSPIM : XX2Form<60, 185,
741 (outs vsrc:$XT), (ins vsrc:$XB),
742 "xvrspim $XT, $XB", IIC_VecFP,
743 [(set v4f32:$XT, (ffloor v4f32:$XB))]>;
744 def XVRSPIP : XX2Form<60, 169,
745 (outs vsrc:$XT), (ins vsrc:$XB),
746 "xvrspip $XT, $XB", IIC_VecFP,
747 [(set v4f32:$XT, (fceil v4f32:$XB))]>;
748 def XVRSPIZ : XX2Form<60, 153,
749 (outs vsrc:$XT), (ins vsrc:$XB),
750 "xvrspiz $XT, $XB", IIC_VecFP,
751 [(set v4f32:$XT, (ftrunc v4f32:$XB))]>;
752
753 // Max/Min Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000754 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000755 def XSMAXDP : XX3Form<60, 160,
Hal Finkel19be5062014-03-29 05:29:01 +0000756 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000757 "xsmaxdp $XT, $XA, $XB", IIC_VecFP,
758 [(set vsfrc:$XT,
759 (int_ppc_vsx_xsmaxdp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000760 def XSMINDP : XX3Form<60, 168,
Hal Finkel19be5062014-03-29 05:29:01 +0000761 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000762 "xsmindp $XT, $XA, $XB", IIC_VecFP,
763 [(set vsfrc:$XT,
764 (int_ppc_vsx_xsmindp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000765
766 def XVMAXDP : XX3Form<60, 224,
767 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000768 "xvmaxdp $XT, $XA, $XB", IIC_VecFP,
769 [(set vsrc:$XT,
770 (int_ppc_vsx_xvmaxdp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000771 def XVMINDP : XX3Form<60, 232,
772 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000773 "xvmindp $XT, $XA, $XB", IIC_VecFP,
774 [(set vsrc:$XT,
775 (int_ppc_vsx_xvmindp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000776
777 def XVMAXSP : XX3Form<60, 192,
778 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000779 "xvmaxsp $XT, $XA, $XB", IIC_VecFP,
780 [(set vsrc:$XT,
781 (int_ppc_vsx_xvmaxsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000782 def XVMINSP : XX3Form<60, 200,
783 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000784 "xvminsp $XT, $XA, $XB", IIC_VecFP,
785 [(set vsrc:$XT,
786 (int_ppc_vsx_xvminsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000787 } // isCommutable
Hal Finkel27774d92014-03-13 07:58:58 +0000788} // Uses = [RM]
789
790 // Logical Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000791 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000792 def XXLAND : XX3Form<60, 130,
793 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000794 "xxland $XT, $XA, $XB", IIC_VecGeneral,
795 [(set v4i32:$XT, (and v4i32:$XA, v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000796 def XXLANDC : XX3Form<60, 138,
797 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000798 "xxlandc $XT, $XA, $XB", IIC_VecGeneral,
799 [(set v4i32:$XT, (and v4i32:$XA,
800 (vnot_ppc v4i32:$XB)))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000801 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000802 def XXLNOR : XX3Form<60, 162,
803 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000804 "xxlnor $XT, $XA, $XB", IIC_VecGeneral,
805 [(set v4i32:$XT, (vnot_ppc (or v4i32:$XA,
806 v4i32:$XB)))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000807 def XXLOR : XX3Form<60, 146,
808 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000809 "xxlor $XT, $XA, $XB", IIC_VecGeneral,
810 [(set v4i32:$XT, (or v4i32:$XA, v4i32:$XB))]>;
Hal Finkel19be5062014-03-29 05:29:01 +0000811 let isCodeGenOnly = 1 in
812 def XXLORf: XX3Form<60, 146,
813 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
814 "xxlor $XT, $XA, $XB", IIC_VecGeneral, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000815 def XXLXOR : XX3Form<60, 154,
816 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000817 "xxlxor $XT, $XA, $XB", IIC_VecGeneral,
818 [(set v4i32:$XT, (xor v4i32:$XA, v4i32:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000819 } // isCommutable
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +0000820 let isCodeGenOnly = 1 in
821 def XXLXORz : XX3Form_Zero<60, 154, (outs vsrc:$XT), (ins),
822 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
823 [(set v4i32:$XT, (v4i32 immAllZerosV))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000824
Ehsan Amiric90b02c2016-10-24 17:31:09 +0000825 let isCodeGenOnly = 1 in {
826 def XXLXORdpz : XX3Form_SetZero<60, 154,
827 (outs vsfrc:$XT), (ins),
828 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
829 [(set f64:$XT, (fpimm0))]>;
830 def XXLXORspz : XX3Form_SetZero<60, 154,
831 (outs vssrc:$XT), (ins),
832 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
833 [(set f32:$XT, (fpimm0))]>;
834 }
835
Hal Finkel27774d92014-03-13 07:58:58 +0000836 // Permutation Instructions
837 def XXMRGHW : XX3Form<60, 18,
838 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
839 "xxmrghw $XT, $XA, $XB", IIC_VecPerm, []>;
840 def XXMRGLW : XX3Form<60, 50,
841 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
842 "xxmrglw $XT, $XA, $XB", IIC_VecPerm, []>;
843
844 def XXPERMDI : XX3Form_2<60, 10,
845 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$DM),
846 "xxpermdi $XT, $XA, $XB, $DM", IIC_VecPerm, []>;
Nemanja Ivanovic15748f42016-12-06 11:47:14 +0000847 let isCodeGenOnly = 1 in
848 def XXPERMDIs : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vsfrc:$XA, u2imm:$DM),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000849 "xxpermdi $XT, $XA, $XA, $DM", IIC_VecPerm, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000850 def XXSEL : XX4Form<60, 3,
851 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, vsrc:$XC),
852 "xxsel $XT, $XA, $XB, $XC", IIC_VecPerm, []>;
853
854 def XXSLDWI : XX3Form_2<60, 2,
855 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$SHW),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +0000856 "xxsldwi $XT, $XA, $XB, $SHW", IIC_VecPerm,
857 [(set v4i32:$XT, (PPCvecshl v4i32:$XA, v4i32:$XB,
858 imm32SExt16:$SHW))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000859 def XXSPLTW : XX2Form_2<60, 164,
860 (outs vsrc:$XT), (ins vsrc:$XB, u2imm:$UIM),
Nemanja Ivanovic1a2b2f02016-05-04 16:04:02 +0000861 "xxspltw $XT, $XB, $UIM", IIC_VecPerm,
862 [(set v4i32:$XT,
863 (PPCxxsplt v4i32:$XB, imm32SExt16:$UIM))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000864 let isCodeGenOnly = 1 in
865 def XXSPLTWs : XX2Form_2<60, 164,
866 (outs vsrc:$XT), (ins vfrc:$XB, u2imm:$UIM),
867 "xxspltw $XT, $XB, $UIM", IIC_VecPerm, []>;
Craig Topperc50d64b2014-11-26 00:46:26 +0000868} // hasSideEffects
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000869} // UseVSXReg = 1
Hal Finkel27774d92014-03-13 07:58:58 +0000870
Bill Schmidt61e65232014-10-22 13:13:40 +0000871// SELECT_CC_* - Used to implement the SELECT_CC DAG operation. Expanded after
872// instruction selection into a branch sequence.
873let usesCustomInserter = 1, // Expanded after instruction selection.
874 PPC970_Single = 1 in {
875
876 def SELECT_CC_VSRC: Pseudo<(outs vsrc:$dst),
877 (ins crrc:$cond, vsrc:$T, vsrc:$F, i32imm:$BROPC),
878 "#SELECT_CC_VSRC",
879 []>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000880 def SELECT_VSRC: Pseudo<(outs vsrc:$dst),
881 (ins crbitrc:$cond, vsrc:$T, vsrc:$F),
882 "#SELECT_VSRC",
Bill Schmidt61e65232014-10-22 13:13:40 +0000883 [(set v2f64:$dst,
884 (select i1:$cond, v2f64:$T, v2f64:$F))]>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000885 def SELECT_CC_VSFRC: Pseudo<(outs f8rc:$dst),
886 (ins crrc:$cond, f8rc:$T, f8rc:$F,
887 i32imm:$BROPC), "#SELECT_CC_VSFRC",
888 []>;
889 def SELECT_VSFRC: Pseudo<(outs f8rc:$dst),
890 (ins crbitrc:$cond, f8rc:$T, f8rc:$F),
891 "#SELECT_VSFRC",
892 [(set f64:$dst,
893 (select i1:$cond, f64:$T, f64:$F))]>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000894 def SELECT_CC_VSSRC: Pseudo<(outs f4rc:$dst),
895 (ins crrc:$cond, f4rc:$T, f4rc:$F,
896 i32imm:$BROPC), "#SELECT_CC_VSSRC",
897 []>;
898 def SELECT_VSSRC: Pseudo<(outs f4rc:$dst),
899 (ins crbitrc:$cond, f4rc:$T, f4rc:$F),
900 "#SELECT_VSSRC",
901 [(set f32:$dst,
902 (select i1:$cond, f32:$T, f32:$F))]>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000903} // usesCustomInserter
904} // AddedComplexity
Bill Schmidt61e65232014-10-22 13:13:40 +0000905
Hal Finkel27774d92014-03-13 07:58:58 +0000906def : InstAlias<"xvmovdp $XT, $XB",
907 (XVCPSGNDP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
908def : InstAlias<"xvmovsp $XT, $XB",
909 (XVCPSGNSP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
910
911def : InstAlias<"xxspltd $XT, $XB, 0",
912 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 0)>;
913def : InstAlias<"xxspltd $XT, $XB, 1",
914 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 3)>;
915def : InstAlias<"xxmrghd $XT, $XA, $XB",
916 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 0)>;
917def : InstAlias<"xxmrgld $XT, $XA, $XB",
918 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 3)>;
919def : InstAlias<"xxswapd $XT, $XB",
920 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 2)>;
Nemanja Ivanovic15748f42016-12-06 11:47:14 +0000921def : InstAlias<"xxspltd $XT, $XB, 0",
922 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 0)>;
923def : InstAlias<"xxspltd $XT, $XB, 1",
924 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 3)>;
925def : InstAlias<"xxswapd $XT, $XB",
926 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 2)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000927
928let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000929
Nemanja Ivanovic6f22b412016-09-27 08:42:12 +0000930def : Pat<(v4i32 (vnot_ppc v4i32:$A)),
931 (v4i32 (XXLNOR $A, $A))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000932let Predicates = [IsBigEndian] in {
Hal Finkel27774d92014-03-13 07:58:58 +0000933def : Pat<(v2f64 (scalar_to_vector f64:$A)),
Hal Finkel19be5062014-03-29 05:29:01 +0000934 (v2f64 (SUBREG_TO_REG (i64 1), $A, sub_64))>;
Hal Finkel27774d92014-03-13 07:58:58 +0000935
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000936def : Pat<(f64 (extractelt v2f64:$S, 0)),
Hal Finkel19be5062014-03-29 05:29:01 +0000937 (f64 (EXTRACT_SUBREG $S, sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000938def : Pat<(f64 (extractelt v2f64:$S, 1)),
Hal Finkel19be5062014-03-29 05:29:01 +0000939 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000940}
941
942let Predicates = [IsLittleEndian] in {
943def : Pat<(v2f64 (scalar_to_vector f64:$A)),
944 (v2f64 (XXPERMDI (SUBREG_TO_REG (i64 1), $A, sub_64),
945 (SUBREG_TO_REG (i64 1), $A, sub_64), 0))>;
946
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000947def : Pat<(f64 (extractelt v2f64:$S, 0)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000948 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000949def : Pat<(f64 (extractelt v2f64:$S, 1)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000950 (f64 (EXTRACT_SUBREG $S, sub_64))>;
951}
Hal Finkel27774d92014-03-13 07:58:58 +0000952
953// Additional fnmsub patterns: -a*c + b == -(a*c - b)
954def : Pat<(fma (fneg f64:$A), f64:$C, f64:$B),
955 (XSNMSUBADP $B, $C, $A)>;
956def : Pat<(fma f64:$A, (fneg f64:$C), f64:$B),
957 (XSNMSUBADP $B, $C, $A)>;
958
959def : Pat<(fma (fneg v2f64:$A), v2f64:$C, v2f64:$B),
960 (XVNMSUBADP $B, $C, $A)>;
961def : Pat<(fma v2f64:$A, (fneg v2f64:$C), v2f64:$B),
962 (XVNMSUBADP $B, $C, $A)>;
963
964def : Pat<(fma (fneg v4f32:$A), v4f32:$C, v4f32:$B),
965 (XVNMSUBASP $B, $C, $A)>;
966def : Pat<(fma v4f32:$A, (fneg v4f32:$C), v4f32:$B),
967 (XVNMSUBASP $B, $C, $A)>;
968
Hal Finkel9e0baa62014-04-01 19:24:27 +0000969def : Pat<(v2f64 (bitconvert v4f32:$A)),
970 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000971def : Pat<(v2f64 (bitconvert v4i32:$A)),
972 (COPY_TO_REGCLASS $A, VSRC)>;
973def : Pat<(v2f64 (bitconvert v8i16:$A)),
974 (COPY_TO_REGCLASS $A, VSRC)>;
975def : Pat<(v2f64 (bitconvert v16i8:$A)),
976 (COPY_TO_REGCLASS $A, VSRC)>;
977
Hal Finkel9e0baa62014-04-01 19:24:27 +0000978def : Pat<(v4f32 (bitconvert v2f64:$A)),
979 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000980def : Pat<(v4i32 (bitconvert v2f64:$A)),
981 (COPY_TO_REGCLASS $A, VRRC)>;
982def : Pat<(v8i16 (bitconvert v2f64:$A)),
983 (COPY_TO_REGCLASS $A, VRRC)>;
984def : Pat<(v16i8 (bitconvert v2f64:$A)),
985 (COPY_TO_REGCLASS $A, VRRC)>;
986
Hal Finkel9e0baa62014-04-01 19:24:27 +0000987def : Pat<(v2i64 (bitconvert v4f32:$A)),
988 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +0000989def : Pat<(v2i64 (bitconvert v4i32:$A)),
990 (COPY_TO_REGCLASS $A, VSRC)>;
991def : Pat<(v2i64 (bitconvert v8i16:$A)),
992 (COPY_TO_REGCLASS $A, VSRC)>;
993def : Pat<(v2i64 (bitconvert v16i8:$A)),
994 (COPY_TO_REGCLASS $A, VSRC)>;
995
Hal Finkel9e0baa62014-04-01 19:24:27 +0000996def : Pat<(v4f32 (bitconvert v2i64:$A)),
997 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +0000998def : Pat<(v4i32 (bitconvert v2i64:$A)),
999 (COPY_TO_REGCLASS $A, VRRC)>;
1000def : Pat<(v8i16 (bitconvert v2i64:$A)),
1001 (COPY_TO_REGCLASS $A, VRRC)>;
1002def : Pat<(v16i8 (bitconvert v2i64:$A)),
1003 (COPY_TO_REGCLASS $A, VRRC)>;
1004
Hal Finkel9281c9a2014-03-26 18:26:30 +00001005def : Pat<(v2f64 (bitconvert v2i64:$A)),
1006 (COPY_TO_REGCLASS $A, VRRC)>;
1007def : Pat<(v2i64 (bitconvert v2f64:$A)),
1008 (COPY_TO_REGCLASS $A, VRRC)>;
1009
Kit Bartond4eb73c2015-05-05 16:10:44 +00001010def : Pat<(v2f64 (bitconvert v1i128:$A)),
1011 (COPY_TO_REGCLASS $A, VRRC)>;
1012def : Pat<(v1i128 (bitconvert v2f64:$A)),
1013 (COPY_TO_REGCLASS $A, VRRC)>;
1014
Hal Finkel5c0d1452014-03-30 13:22:59 +00001015// sign extension patterns
1016// To extend "in place" from v2i32 to v2i64, we have input data like:
1017// | undef | i32 | undef | i32 |
1018// but xvcvsxwdp expects the input in big-Endian format:
1019// | i32 | undef | i32 | undef |
1020// so we need to shift everything to the left by one i32 (word) before
1021// the conversion.
1022def : Pat<(sext_inreg v2i64:$C, v2i32),
1023 (XVCVDPSXDS (XVCVSXWDP (XXSLDWI $C, $C, 1)))>;
1024def : Pat<(v2f64 (sint_to_fp (sext_inreg v2i64:$C, v2i32))),
1025 (XVCVSXWDP (XXSLDWI $C, $C, 1))>;
1026
Nemanja Ivanovic44513e52016-07-05 09:22:29 +00001027def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 0)),
1028 (v2f64 (XVCVSXWDP (v2i64 (XXMRGHW $C, $C))))>;
1029def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 1)),
1030 (v2f64 (XVCVSXWDP (v2i64 (XXMRGLW $C, $C))))>;
1031
1032def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 0)),
1033 (v2f64 (XVCVUXWDP (v2i64 (XXMRGHW $C, $C))))>;
1034def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 1)),
1035 (v2f64 (XVCVUXWDP (v2i64 (XXMRGLW $C, $C))))>;
1036
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001037// Loads.
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001038let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001039 def : Pat<(v2f64 (PPClxvd2x xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001040
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001041 // Stores.
1042 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
1043 (STXVD2X $rS, xoaddr:$dst)>;
Nemanja Ivanovicf57f1502016-11-29 23:00:33 +00001044 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
1045 (STXVW4X $rS, xoaddr:$dst)>;
Tony Jiang5f850cd2016-11-15 14:25:56 +00001046 def : Pat<(int_ppc_vsx_stxvd2x_be v2f64:$rS, xoaddr:$dst),
1047 (STXVD2X $rS, xoaddr:$dst)>;
1048 def : Pat<(int_ppc_vsx_stxvw4x_be v4i32:$rS, xoaddr:$dst),
1049 (STXVW4X $rS, xoaddr:$dst)>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001050 def : Pat<(PPCstxvd2x v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1051}
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001052let Predicates = [IsBigEndian, HasVSX, HasOnlySwappingMemOps] in {
1053 def : Pat<(v2f64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1054 def : Pat<(v2i64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1055 def : Pat<(v4i32 (load xoaddr:$src)), (LXVW4X xoaddr:$src)>;
1056 def : Pat<(store v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1057 def : Pat<(store v2i64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1058}
Bill Schmidtfae5d712014-12-09 16:35:51 +00001059
1060// Permutes.
1061def : Pat<(v2f64 (PPCxxswapd v2f64:$src)), (XXPERMDI $src, $src, 2)>;
1062def : Pat<(v2i64 (PPCxxswapd v2i64:$src)), (XXPERMDI $src, $src, 2)>;
1063def : Pat<(v4f32 (PPCxxswapd v4f32:$src)), (XXPERMDI $src, $src, 2)>;
1064def : Pat<(v4i32 (PPCxxswapd v4i32:$src)), (XXPERMDI $src, $src, 2)>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001065def : Pat<(v2f64 (PPCswapNoChain v2f64:$src)), (XXPERMDI $src, $src, 2)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001066
Bill Schmidt61e65232014-10-22 13:13:40 +00001067// Selects.
1068def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001069 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1070def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001071 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1072def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001073 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1074def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001075 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1076def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETEQ)),
1077 (SELECT_VSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1078def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001079 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1080def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001081 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1082def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001083 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1084def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001085 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1086def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETNE)),
1087 (SELECT_VSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1088
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001089def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001090 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1091def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001092 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1093def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001094 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1095def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001096 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1097def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETEQ)),
1098 (SELECT_VSFRC (CREQV $lhs, $rhs), $tval, $fval)>;
1099def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001100 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1101def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001102 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1103def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001104 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1105def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001106 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1107def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETNE)),
1108 (SELECT_VSFRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1109
Bill Schmidt76746922014-11-14 12:10:40 +00001110// Divides.
1111def : Pat<(int_ppc_vsx_xvdivsp v4f32:$A, v4f32:$B),
1112 (XVDIVSP $A, $B)>;
1113def : Pat<(int_ppc_vsx_xvdivdp v2f64:$A, v2f64:$B),
1114 (XVDIVDP $A, $B)>;
1115
Nemanja Ivanovic984a3612015-07-14 17:25:20 +00001116// Reciprocal estimate
1117def : Pat<(int_ppc_vsx_xvresp v4f32:$A),
1118 (XVRESP $A)>;
1119def : Pat<(int_ppc_vsx_xvredp v2f64:$A),
1120 (XVREDP $A)>;
1121
Nemanja Ivanovicd358b8f2015-07-05 06:03:51 +00001122// Recip. square root estimate
1123def : Pat<(int_ppc_vsx_xvrsqrtesp v4f32:$A),
1124 (XVRSQRTESP $A)>;
1125def : Pat<(int_ppc_vsx_xvrsqrtedp v2f64:$A),
1126 (XVRSQRTEDP $A)>;
1127
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001128let Predicates = [IsLittleEndian] in {
1129def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1130 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1131def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1132 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1133def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1134 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1135def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1136 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1137} // IsLittleEndian
1138
1139let Predicates = [IsBigEndian] in {
1140def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1141 (f64 (XSCVSXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1142def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1143 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1144def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1145 (f64 (XSCVUXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1146def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1147 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1148} // IsBigEndian
1149
Hal Finkel27774d92014-03-13 07:58:58 +00001150} // AddedComplexity
1151} // HasVSX
1152
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001153def ScalarLoads {
1154 dag Li8 = (i32 (extloadi8 xoaddr:$src));
1155 dag ZELi8 = (i32 (zextloadi8 xoaddr:$src));
1156 dag ZELi8i64 = (i64 (zextloadi8 xoaddr:$src));
1157 dag SELi8 = (i32 (sext_inreg (extloadi8 xoaddr:$src), i8));
1158 dag SELi8i64 = (i64 (sext_inreg (extloadi8 xoaddr:$src), i8));
1159
1160 dag Li16 = (i32 (extloadi16 xoaddr:$src));
1161 dag ZELi16 = (i32 (zextloadi16 xoaddr:$src));
1162 dag ZELi16i64 = (i64 (zextloadi16 xoaddr:$src));
1163 dag SELi16 = (i32 (sextloadi16 xoaddr:$src));
1164 dag SELi16i64 = (i64 (sextloadi16 xoaddr:$src));
1165
1166 dag Li32 = (i32 (load xoaddr:$src));
1167}
1168
Kit Barton298beb52015-02-18 16:21:46 +00001169// The following VSX instructions were introduced in Power ISA 2.07
1170/* FIXME: if the operands are v2i64, these patterns will not match.
1171 we should define new patterns or otherwise match the same patterns
1172 when the elements are larger than i32.
1173*/
1174def HasP8Vector : Predicate<"PPCSubTarget->hasP8Vector()">;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001175def HasDirectMove : Predicate<"PPCSubTarget->hasDirectMove()">;
Kit Barton298beb52015-02-18 16:21:46 +00001176let Predicates = [HasP8Vector] in {
1177let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001178 let isCommutable = 1, UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001179 def XXLEQV : XX3Form<60, 186,
1180 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1181 "xxleqv $XT, $XA, $XB", IIC_VecGeneral,
1182 [(set v4i32:$XT, (vnot_ppc (xor v4i32:$XA, v4i32:$XB)))]>;
1183 def XXLNAND : XX3Form<60, 178,
1184 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1185 "xxlnand $XT, $XA, $XB", IIC_VecGeneral,
1186 [(set v4i32:$XT, (vnot_ppc (and v4i32:$XA,
Kit Barton298beb52015-02-18 16:21:46 +00001187 v4i32:$XB)))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001188 } // isCommutable, UseVSXReg
Nemanja Ivanovicd9e4b4f2015-07-10 14:25:17 +00001189
Nemanja Ivanovic5655fb32015-07-10 12:38:08 +00001190 def : Pat<(int_ppc_vsx_xxleqv v4i32:$A, v4i32:$B),
1191 (XXLEQV $A, $B)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001192
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001193 let UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001194 def XXLORC : XX3Form<60, 170,
1195 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1196 "xxlorc $XT, $XA, $XB", IIC_VecGeneral,
1197 [(set v4i32:$XT, (or v4i32:$XA, (vnot_ppc v4i32:$XB)))]>;
1198
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001199 // VSX scalar loads introduced in ISA 2.07
1200 let mayLoad = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001201 let CodeSize = 3 in
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001202 def LXSSPX : XX1Form<31, 524, (outs vssrc:$XT), (ins memrr:$src),
1203 "lxsspx $XT, $src", IIC_LdStLFD,
1204 [(set f32:$XT, (load xoaddr:$src))]>;
1205 def LXSIWAX : XX1Form<31, 76, (outs vsfrc:$XT), (ins memrr:$src),
1206 "lxsiwax $XT, $src", IIC_LdStLFD,
1207 [(set f64:$XT, (PPClfiwax xoaddr:$src))]>;
1208 def LXSIWZX : XX1Form<31, 12, (outs vsfrc:$XT), (ins memrr:$src),
1209 "lxsiwzx $XT, $src", IIC_LdStLFD,
1210 [(set f64:$XT, (PPClfiwzx xoaddr:$src))]>;
1211 } // mayLoad
1212
1213 // VSX scalar stores introduced in ISA 2.07
1214 let mayStore = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001215 let CodeSize = 3 in
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001216 def STXSSPX : XX1Form<31, 652, (outs), (ins vssrc:$XT, memrr:$dst),
1217 "stxsspx $XT, $dst", IIC_LdStSTFD,
1218 [(store f32:$XT, xoaddr:$dst)]>;
1219 def STXSIWX : XX1Form<31, 140, (outs), (ins vsfrc:$XT, memrr:$dst),
1220 "stxsiwx $XT, $dst", IIC_LdStSTFD,
1221 [(PPCstfiwx f64:$XT, xoaddr:$dst)]>;
1222 } // mayStore
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001223 } // UseVSXReg = 1
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001224
1225 def : Pat<(f64 (extloadf32 xoaddr:$src)),
1226 (COPY_TO_REGCLASS (LXSSPX xoaddr:$src), VSFRC)>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001227 def : Pat<(f32 (fpround (extloadf32 xoaddr:$src))),
1228 (f32 (LXSSPX xoaddr:$src))>;
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +00001229 def : Pat<(f64 (fpextend f32:$src)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001230 (COPY_TO_REGCLASS $src, VSFRC)>;
Hal Finkela2cdbce2015-08-30 22:12:50 +00001231
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001232 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001233 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1234 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001235 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1236 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001237 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1238 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001239 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1240 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETEQ)),
1241 (SELECT_VSSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1242 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001243 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1244 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001245 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1246 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001247 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1248 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001249 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1250 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETNE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001251 (SELECT_VSSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001252
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001253 let UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001254 // VSX Elementary Scalar FP arithmetic (SP)
1255 let isCommutable = 1 in {
1256 def XSADDSP : XX3Form<60, 0,
1257 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1258 "xsaddsp $XT, $XA, $XB", IIC_VecFP,
1259 [(set f32:$XT, (fadd f32:$XA, f32:$XB))]>;
1260 def XSMULSP : XX3Form<60, 16,
1261 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1262 "xsmulsp $XT, $XA, $XB", IIC_VecFP,
1263 [(set f32:$XT, (fmul f32:$XA, f32:$XB))]>;
1264 } // isCommutable
1265
1266 def XSDIVSP : XX3Form<60, 24,
1267 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1268 "xsdivsp $XT, $XA, $XB", IIC_FPDivS,
1269 [(set f32:$XT, (fdiv f32:$XA, f32:$XB))]>;
1270 def XSRESP : XX2Form<60, 26,
1271 (outs vssrc:$XT), (ins vssrc:$XB),
1272 "xsresp $XT, $XB", IIC_VecFP,
1273 [(set f32:$XT, (PPCfre f32:$XB))]>;
1274 def XSSQRTSP : XX2Form<60, 11,
1275 (outs vssrc:$XT), (ins vssrc:$XB),
1276 "xssqrtsp $XT, $XB", IIC_FPSqrtS,
1277 [(set f32:$XT, (fsqrt f32:$XB))]>;
1278 def XSRSQRTESP : XX2Form<60, 10,
1279 (outs vssrc:$XT), (ins vssrc:$XB),
1280 "xsrsqrtesp $XT, $XB", IIC_VecFP,
1281 [(set f32:$XT, (PPCfrsqrte f32:$XB))]>;
1282 def XSSUBSP : XX3Form<60, 8,
1283 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1284 "xssubsp $XT, $XA, $XB", IIC_VecFP,
1285 [(set f32:$XT, (fsub f32:$XA, f32:$XB))]>;
Nemanja Ivanovic376e1732015-05-29 17:13:25 +00001286
1287 // FMA Instructions
1288 let BaseName = "XSMADDASP" in {
1289 let isCommutable = 1 in
1290 def XSMADDASP : XX3Form<60, 1,
1291 (outs vssrc:$XT),
1292 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1293 "xsmaddasp $XT, $XA, $XB", IIC_VecFP,
1294 [(set f32:$XT, (fma f32:$XA, f32:$XB, f32:$XTi))]>,
1295 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1296 AltVSXFMARel;
1297 let IsVSXFMAAlt = 1 in
1298 def XSMADDMSP : XX3Form<60, 9,
1299 (outs vssrc:$XT),
1300 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1301 "xsmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1302 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1303 AltVSXFMARel;
1304 }
1305
1306 let BaseName = "XSMSUBASP" in {
1307 let isCommutable = 1 in
1308 def XSMSUBASP : XX3Form<60, 17,
1309 (outs vssrc:$XT),
1310 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1311 "xsmsubasp $XT, $XA, $XB", IIC_VecFP,
1312 [(set f32:$XT, (fma f32:$XA, f32:$XB,
1313 (fneg f32:$XTi)))]>,
1314 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1315 AltVSXFMARel;
1316 let IsVSXFMAAlt = 1 in
1317 def XSMSUBMSP : XX3Form<60, 25,
1318 (outs vssrc:$XT),
1319 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1320 "xsmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1321 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1322 AltVSXFMARel;
1323 }
1324
1325 let BaseName = "XSNMADDASP" in {
1326 let isCommutable = 1 in
1327 def XSNMADDASP : XX3Form<60, 129,
1328 (outs vssrc:$XT),
1329 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1330 "xsnmaddasp $XT, $XA, $XB", IIC_VecFP,
1331 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1332 f32:$XTi)))]>,
1333 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1334 AltVSXFMARel;
1335 let IsVSXFMAAlt = 1 in
1336 def XSNMADDMSP : XX3Form<60, 137,
1337 (outs vssrc:$XT),
1338 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1339 "xsnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1340 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1341 AltVSXFMARel;
1342 }
1343
1344 let BaseName = "XSNMSUBASP" in {
1345 let isCommutable = 1 in
1346 def XSNMSUBASP : XX3Form<60, 145,
1347 (outs vssrc:$XT),
1348 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1349 "xsnmsubasp $XT, $XA, $XB", IIC_VecFP,
1350 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1351 (fneg f32:$XTi))))]>,
1352 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1353 AltVSXFMARel;
1354 let IsVSXFMAAlt = 1 in
1355 def XSNMSUBMSP : XX3Form<60, 153,
1356 (outs vssrc:$XT),
1357 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1358 "xsnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1359 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1360 AltVSXFMARel;
1361 }
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001362
1363 // Single Precision Conversions (FP <-> INT)
1364 def XSCVSXDSP : XX2Form<60, 312,
1365 (outs vssrc:$XT), (ins vsfrc:$XB),
1366 "xscvsxdsp $XT, $XB", IIC_VecFP,
1367 [(set f32:$XT, (PPCfcfids f64:$XB))]>;
1368 def XSCVUXDSP : XX2Form<60, 296,
1369 (outs vssrc:$XT), (ins vsfrc:$XB),
1370 "xscvuxdsp $XT, $XB", IIC_VecFP,
1371 [(set f32:$XT, (PPCfcfidus f64:$XB))]>;
1372
1373 // Conversions between vector and scalar single precision
1374 def XSCVDPSPN : XX2Form<60, 267, (outs vsrc:$XT), (ins vssrc:$XB),
1375 "xscvdpspn $XT, $XB", IIC_VecFP, []>;
1376 def XSCVSPDPN : XX2Form<60, 331, (outs vssrc:$XT), (ins vsrc:$XB),
1377 "xscvspdpn $XT, $XB", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001378 } // UseVSXReg = 1
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001379
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001380 let Predicates = [IsLittleEndian] in {
1381 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1382 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1383 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1384 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1385 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1386 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1387 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1388 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1389 }
1390
1391 let Predicates = [IsBigEndian] in {
1392 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1393 (f32 (XSCVSXDSP (COPY_TO_REGCLASS $S, VSFRC)))>;
1394 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1395 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1396 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1397 (f32 (XSCVUXDSP (COPY_TO_REGCLASS $S, VSFRC)))>;
1398 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1399 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1400 }
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001401 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.Li32)),
1402 (v4i32 (XXSPLTWs (LXSIWAX xoaddr:$src), 1))>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001403} // AddedComplexity = 400
Kit Barton298beb52015-02-18 16:21:46 +00001404} // HasP8Vector
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001405
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001406let UseVSXReg = 1, AddedComplexity = 400 in {
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001407let Predicates = [HasDirectMove] in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001408 // VSX direct move instructions
1409 def MFVSRD : XX1_RS6_RD5_XO<31, 51, (outs g8rc:$rA), (ins vsfrc:$XT),
1410 "mfvsrd $rA, $XT", IIC_VecGeneral,
1411 [(set i64:$rA, (PPCmfvsr f64:$XT))]>,
1412 Requires<[In64BitMode]>;
1413 def MFVSRWZ : XX1_RS6_RD5_XO<31, 115, (outs gprc:$rA), (ins vsfrc:$XT),
1414 "mfvsrwz $rA, $XT", IIC_VecGeneral,
1415 [(set i32:$rA, (PPCmfvsr f64:$XT))]>;
1416 def MTVSRD : XX1_RS6_RD5_XO<31, 179, (outs vsfrc:$XT), (ins g8rc:$rA),
1417 "mtvsrd $XT, $rA", IIC_VecGeneral,
1418 [(set f64:$XT, (PPCmtvsra i64:$rA))]>,
1419 Requires<[In64BitMode]>;
1420 def MTVSRWA : XX1_RS6_RD5_XO<31, 211, (outs vsfrc:$XT), (ins gprc:$rA),
1421 "mtvsrwa $XT, $rA", IIC_VecGeneral,
1422 [(set f64:$XT, (PPCmtvsra i32:$rA))]>;
1423 def MTVSRWZ : XX1_RS6_RD5_XO<31, 243, (outs vsfrc:$XT), (ins gprc:$rA),
1424 "mtvsrwz $XT, $rA", IIC_VecGeneral,
1425 [(set f64:$XT, (PPCmtvsrz i32:$rA))]>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001426} // HasDirectMove
1427
1428let Predicates = [IsISA3_0, HasDirectMove] in {
1429 def MTVSRWS: XX1_RS6_RD5_XO<31, 403, (outs vsrc:$XT), (ins gprc:$rA),
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00001430 "mtvsrws $XT, $rA", IIC_VecGeneral, []>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001431
1432 def MTVSRDD: XX1Form<31, 435, (outs vsrc:$XT), (ins g8rc:$rA, g8rc:$rB),
1433 "mtvsrdd $XT, $rA, $rB", IIC_VecGeneral,
1434 []>, Requires<[In64BitMode]>;
1435
1436 def MFVSRLD: XX1_RS6_RD5_XO<31, 307, (outs g8rc:$rA), (ins vsrc:$XT),
1437 "mfvsrld $rA, $XT", IIC_VecGeneral,
1438 []>, Requires<[In64BitMode]>;
1439
1440} // IsISA3_0, HasDirectMove
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001441} // UseVSXReg = 1
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001442
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001443/* Direct moves of various widths from GPR's into VSR's. Each move lines
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001444 the value up into element 0 (both BE and LE). Namely, entities smaller than
1445 a doubleword are shifted left and moved for BE. For LE, they're moved, then
1446 swapped to go into the least significant element of the VSR.
1447*/
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001448def MovesToVSR {
1449 dag BE_BYTE_0 =
1450 (MTVSRD
1451 (RLDICR
1452 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 56, 7));
1453 dag BE_HALF_0 =
1454 (MTVSRD
1455 (RLDICR
1456 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 48, 15));
1457 dag BE_WORD_0 =
1458 (MTVSRD
1459 (RLDICR
1460 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 32, 31));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001461 dag BE_DWORD_0 = (MTVSRD $A);
1462
1463 dag LE_MTVSRW = (MTVSRD (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001464 dag LE_WORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1465 LE_MTVSRW, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001466 dag LE_WORD_0 = (XXPERMDI LE_WORD_1, LE_WORD_1, 2);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001467 dag LE_DWORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1468 BE_DWORD_0, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001469 dag LE_DWORD_0 = (XXPERMDI LE_DWORD_1, LE_DWORD_1, 2);
1470}
1471
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001472/* Patterns for extracting elements out of vectors. Integer elements are
1473 extracted using direct move operations. Patterns for extracting elements
1474 whose indices are not available at compile time are also provided with
1475 various _VARIABLE_ patterns.
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001476 The numbering for the DAG's is for LE, but when used on BE, the correct
1477 LE element can just be used (i.e. LE_BYTE_2 == BE_BYTE_13).
1478*/
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001479def VectorExtractions {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001480 // Doubleword extraction
1481 dag LE_DWORD_0 =
1482 (MFVSRD
1483 (EXTRACT_SUBREG
1484 (XXPERMDI (COPY_TO_REGCLASS $S, VSRC),
1485 (COPY_TO_REGCLASS $S, VSRC), 2), sub_64));
1486 dag LE_DWORD_1 = (MFVSRD
1487 (EXTRACT_SUBREG
1488 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1489
1490 // Word extraction
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001491 dag LE_WORD_0 = (MFVSRWZ (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001492 dag LE_WORD_1 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 1), sub_64));
1493 dag LE_WORD_2 = (MFVSRWZ (EXTRACT_SUBREG
1494 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1495 dag LE_WORD_3 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 3), sub_64));
1496
1497 // Halfword extraction
1498 dag LE_HALF_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 48), sub_32));
1499 dag LE_HALF_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 48), sub_32));
1500 dag LE_HALF_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 48), sub_32));
1501 dag LE_HALF_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 48), sub_32));
1502 dag LE_HALF_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 48), sub_32));
1503 dag LE_HALF_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 48), sub_32));
1504 dag LE_HALF_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 48), sub_32));
1505 dag LE_HALF_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 48), sub_32));
1506
1507 // Byte extraction
1508 dag LE_BYTE_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 56), sub_32));
1509 dag LE_BYTE_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 56, 56), sub_32));
1510 dag LE_BYTE_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 56), sub_32));
1511 dag LE_BYTE_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 40, 56), sub_32));
1512 dag LE_BYTE_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 56), sub_32));
1513 dag LE_BYTE_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 24, 56), sub_32));
1514 dag LE_BYTE_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 56), sub_32));
1515 dag LE_BYTE_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 8, 56), sub_32));
1516 dag LE_BYTE_8 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 56), sub_32));
1517 dag LE_BYTE_9 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 56, 56), sub_32));
1518 dag LE_BYTE_10 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 56), sub_32));
1519 dag LE_BYTE_11 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 40, 56), sub_32));
1520 dag LE_BYTE_12 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 56), sub_32));
1521 dag LE_BYTE_13 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 24, 56), sub_32));
1522 dag LE_BYTE_14 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 56), sub_32));
1523 dag LE_BYTE_15 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 8, 56), sub_32));
1524
1525 /* Variable element number (BE and LE patterns must be specified separately)
1526 This is a rather involved process.
1527
1528 Conceptually, this is how the move is accomplished:
1529 1. Identify which doubleword contains the element
1530 2. Shift in the VMX register so that the correct doubleword is correctly
1531 lined up for the MFVSRD
1532 3. Perform the move so that the element (along with some extra stuff)
1533 is in the GPR
1534 4. Right shift within the GPR so that the element is right-justified
1535
1536 Of course, the index is an element number which has a different meaning
1537 on LE/BE so the patterns have to be specified separately.
1538
1539 Note: The final result will be the element right-justified with high
1540 order bits being arbitrarily defined (namely, whatever was in the
1541 vector register to the left of the value originally).
1542 */
1543
1544 /* LE variable byte
1545 Number 1. above:
1546 - For elements 0-7, we shift left by 8 bytes since they're on the right
1547 - For elements 8-15, we need not shift (shift left by zero bytes)
1548 This is accomplished by inverting the bits of the index and AND-ing
1549 with 0x8 (i.e. clearing all bits of the index and inverting bit 60).
1550 */
1551 dag LE_VBYTE_PERM_VEC = (LVSL ZERO8, (ANDC8 (LI8 8), $Idx));
1552
1553 // Number 2. above:
1554 // - Now that we set up the shift amount, we shift in the VMX register
1555 dag LE_VBYTE_PERMUTE = (VPERM $S, $S, LE_VBYTE_PERM_VEC);
1556
1557 // Number 3. above:
1558 // - The doubleword containing our element is moved to a GPR
1559 dag LE_MV_VBYTE = (MFVSRD
1560 (EXTRACT_SUBREG
1561 (v2i64 (COPY_TO_REGCLASS LE_VBYTE_PERMUTE, VSRC)),
1562 sub_64));
1563
1564 /* Number 4. above:
1565 - Truncate the element number to the range 0-7 (8-15 are symmetrical
1566 and out of range values are truncated accordingly)
1567 - Multiply by 8 as we need to shift right by the number of bits, not bytes
1568 - Shift right in the GPR by the calculated value
1569 */
1570 dag LE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 7), $Idx), 3, 60),
1571 sub_32);
1572 dag LE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD LE_MV_VBYTE, LE_VBYTE_SHIFT),
1573 sub_32);
1574
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001575 /* LE variable halfword
1576 Number 1. above:
1577 - For elements 0-3, we shift left by 8 since they're on the right
1578 - For elements 4-7, we need not shift (shift left by zero bytes)
1579 Similarly to the byte pattern, we invert the bits of the index, but we
1580 AND with 0x4 (i.e. clear all bits of the index and invert bit 61).
1581 Of course, the shift is still by 8 bytes, so we must multiply by 2.
1582 */
1583 dag LE_VHALF_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 4), $Idx), 1, 62));
1584
1585 // Number 2. above:
1586 // - Now that we set up the shift amount, we shift in the VMX register
1587 dag LE_VHALF_PERMUTE = (VPERM $S, $S, LE_VHALF_PERM_VEC);
1588
1589 // Number 3. above:
1590 // - The doubleword containing our element is moved to a GPR
1591 dag LE_MV_VHALF = (MFVSRD
1592 (EXTRACT_SUBREG
1593 (v2i64 (COPY_TO_REGCLASS LE_VHALF_PERMUTE, VSRC)),
1594 sub_64));
1595
1596 /* Number 4. above:
1597 - Truncate the element number to the range 0-3 (4-7 are symmetrical
1598 and out of range values are truncated accordingly)
1599 - Multiply by 16 as we need to shift right by the number of bits
1600 - Shift right in the GPR by the calculated value
1601 */
1602 dag LE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 3), $Idx), 4, 59),
1603 sub_32);
1604 dag LE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD LE_MV_VHALF, LE_VHALF_SHIFT),
1605 sub_32);
1606
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001607 /* LE variable word
1608 Number 1. above:
1609 - For elements 0-1, we shift left by 8 since they're on the right
1610 - For elements 2-3, we need not shift
1611 */
1612 dag LE_VWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 2), $Idx), 2, 61));
1613
1614 // Number 2. above:
1615 // - Now that we set up the shift amount, we shift in the VMX register
1616 dag LE_VWORD_PERMUTE = (VPERM $S, $S, LE_VWORD_PERM_VEC);
1617
1618 // Number 3. above:
1619 // - The doubleword containing our element is moved to a GPR
1620 dag LE_MV_VWORD = (MFVSRD
1621 (EXTRACT_SUBREG
1622 (v2i64 (COPY_TO_REGCLASS LE_VWORD_PERMUTE, VSRC)),
1623 sub_64));
1624
1625 /* Number 4. above:
1626 - Truncate the element number to the range 0-1 (2-3 are symmetrical
1627 and out of range values are truncated accordingly)
1628 - Multiply by 32 as we need to shift right by the number of bits
1629 - Shift right in the GPR by the calculated value
1630 */
1631 dag LE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 1), $Idx), 5, 58),
1632 sub_32);
1633 dag LE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD LE_MV_VWORD, LE_VWORD_SHIFT),
1634 sub_32);
1635
1636 /* LE variable doubleword
1637 Number 1. above:
1638 - For element 0, we shift left by 8 since it's on the right
1639 - For element 1, we need not shift
1640 */
1641 dag LE_VDWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 1), $Idx), 3, 60));
1642
1643 // Number 2. above:
1644 // - Now that we set up the shift amount, we shift in the VMX register
1645 dag LE_VDWORD_PERMUTE = (VPERM $S, $S, LE_VDWORD_PERM_VEC);
1646
1647 // Number 3. above:
1648 // - The doubleword containing our element is moved to a GPR
1649 // - Number 4. is not needed for the doubleword as the value is 64-bits
1650 dag LE_VARIABLE_DWORD =
1651 (MFVSRD (EXTRACT_SUBREG
1652 (v2i64 (COPY_TO_REGCLASS LE_VDWORD_PERMUTE, VSRC)),
1653 sub_64));
1654
1655 /* LE variable float
1656 - Shift the vector to line up the desired element to BE Word 0
1657 - Convert 32-bit float to a 64-bit single precision float
1658 */
1659 dag LE_VFLOAT_PERM_VEC = (LVSL ZERO8, (RLDICR (XOR8 (LI8 3), $Idx), 2, 61));
1660 dag LE_VFLOAT_PERMUTE = (VPERM $S, $S, LE_VFLOAT_PERM_VEC);
1661 dag LE_VARIABLE_FLOAT = (XSCVSPDPN LE_VFLOAT_PERMUTE);
1662
1663 /* LE variable double
1664 Same as the LE doubleword except there is no move.
1665 */
1666 dag LE_VDOUBLE_PERMUTE = (VPERM (COPY_TO_REGCLASS $S, VRRC),
1667 (COPY_TO_REGCLASS $S, VRRC),
1668 LE_VDWORD_PERM_VEC);
1669 dag LE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS LE_VDOUBLE_PERMUTE, VSRC);
1670
1671 /* BE variable byte
1672 The algorithm here is the same as the LE variable byte except:
1673 - The shift in the VMX register is by 0/8 for opposite element numbers so
1674 we simply AND the element number with 0x8
1675 - The order of elements after the move to GPR is reversed, so we invert
1676 the bits of the index prior to truncating to the range 0-7
1677 */
1678 dag BE_VBYTE_PERM_VEC = (LVSL ZERO8, (ANDIo8 $Idx, 8));
1679 dag BE_VBYTE_PERMUTE = (VPERM $S, $S, BE_VBYTE_PERM_VEC);
1680 dag BE_MV_VBYTE = (MFVSRD
1681 (EXTRACT_SUBREG
1682 (v2i64 (COPY_TO_REGCLASS BE_VBYTE_PERMUTE, VSRC)),
1683 sub_64));
1684 dag BE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 7), $Idx), 3, 60),
1685 sub_32);
1686 dag BE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD BE_MV_VBYTE, BE_VBYTE_SHIFT),
1687 sub_32);
1688
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001689 /* BE variable halfword
1690 The algorithm here is the same as the LE variable halfword except:
1691 - The shift in the VMX register is by 0/8 for opposite element numbers so
1692 we simply AND the element number with 0x4 and multiply by 2
1693 - The order of elements after the move to GPR is reversed, so we invert
1694 the bits of the index prior to truncating to the range 0-3
1695 */
1696 dag BE_VHALF_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 4), 1, 62));
1697 dag BE_VHALF_PERMUTE = (VPERM $S, $S, BE_VHALF_PERM_VEC);
1698 dag BE_MV_VHALF = (MFVSRD
1699 (EXTRACT_SUBREG
1700 (v2i64 (COPY_TO_REGCLASS BE_VHALF_PERMUTE, VSRC)),
1701 sub_64));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001702 dag BE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 3), $Idx), 4, 59),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001703 sub_32);
1704 dag BE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD BE_MV_VHALF, BE_VHALF_SHIFT),
1705 sub_32);
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001706
1707 /* BE variable word
1708 The algorithm is the same as the LE variable word except:
1709 - The shift in the VMX register happens for opposite element numbers
1710 - The order of elements after the move to GPR is reversed, so we invert
1711 the bits of the index prior to truncating to the range 0-1
1712 */
1713 dag BE_VWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 2), 2, 61));
1714 dag BE_VWORD_PERMUTE = (VPERM $S, $S, BE_VWORD_PERM_VEC);
1715 dag BE_MV_VWORD = (MFVSRD
1716 (EXTRACT_SUBREG
1717 (v2i64 (COPY_TO_REGCLASS BE_VWORD_PERMUTE, VSRC)),
1718 sub_64));
1719 dag BE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 1), $Idx), 5, 58),
1720 sub_32);
1721 dag BE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD BE_MV_VWORD, BE_VWORD_SHIFT),
1722 sub_32);
1723
1724 /* BE variable doubleword
1725 Same as the LE doubleword except we shift in the VMX register for opposite
1726 element indices.
1727 */
1728 dag BE_VDWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 1), 3, 60));
1729 dag BE_VDWORD_PERMUTE = (VPERM $S, $S, BE_VDWORD_PERM_VEC);
1730 dag BE_VARIABLE_DWORD =
1731 (MFVSRD (EXTRACT_SUBREG
1732 (v2i64 (COPY_TO_REGCLASS BE_VDWORD_PERMUTE, VSRC)),
1733 sub_64));
1734
1735 /* BE variable float
1736 - Shift the vector to line up the desired element to BE Word 0
1737 - Convert 32-bit float to a 64-bit single precision float
1738 */
1739 dag BE_VFLOAT_PERM_VEC = (LVSL ZERO8, (RLDICR $Idx, 2, 61));
1740 dag BE_VFLOAT_PERMUTE = (VPERM $S, $S, BE_VFLOAT_PERM_VEC);
1741 dag BE_VARIABLE_FLOAT = (XSCVSPDPN BE_VFLOAT_PERMUTE);
1742
1743 /* BE variable double
1744 Same as the BE doubleword except there is no move.
1745 */
1746 dag BE_VDOUBLE_PERMUTE = (VPERM (COPY_TO_REGCLASS $S, VRRC),
1747 (COPY_TO_REGCLASS $S, VRRC),
1748 BE_VDWORD_PERM_VEC);
1749 dag BE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS BE_VDOUBLE_PERMUTE, VSRC);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001750}
1751
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001752let AddedComplexity = 400 in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001753// v4f32 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001754let Predicates = [IsBigEndian, HasP8Vector] in {
1755 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1756 (v4f32 (XSCVDPSPN $A))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001757 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1758 (f32 (XSCVSPDPN $S))>;
1759 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
1760 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
1761 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001762 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001763 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
1764 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001765 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
1766 (f32 VectorExtractions.BE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001767} // IsBigEndian, HasP8Vector
1768
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001769// Variable index vector_extract for v2f64 does not require P8Vector
1770let Predicates = [IsBigEndian, HasVSX] in
1771 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
1772 (f64 VectorExtractions.BE_VARIABLE_DOUBLE)>;
1773
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001774let Predicates = [IsBigEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001775 // v16i8 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001776 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001777 (v16i8 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_BYTE_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001778 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001779 (v8i16 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_HALF_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001780 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001781 (v4i32 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_WORD_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001782 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001783 (v2i64 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_DWORD_0, sub_64))>;
1784 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001785 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001786 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001787 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001788 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001789 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001790 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001791 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001792 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001793 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001794 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001795 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001796 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001797 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001798 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001799 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001800 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001801 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001802 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001803 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001804 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001805 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001806 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001807 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001808 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001809 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001810 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001811 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001812 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001813 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001814 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001815 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001816 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001817 (i32 VectorExtractions.BE_VARIABLE_BYTE)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001818
1819 // v8i16 scalar <-> vector conversions (BE)
1820 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001821 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001822 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001823 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001824 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001825 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001826 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001827 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001828 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001829 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001830 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001831 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001832 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001833 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001834 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001835 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001836 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001837 (i32 VectorExtractions.BE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001838
1839 // v4i32 scalar <-> vector conversions (BE)
1840 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001841 (i32 VectorExtractions.LE_WORD_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001842 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001843 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001844 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001845 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001846 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001847 (i32 VectorExtractions.LE_WORD_0)>;
1848 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
1849 (i32 VectorExtractions.BE_VARIABLE_WORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001850
1851 // v2i64 scalar <-> vector conversions (BE)
1852 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001853 (i64 VectorExtractions.LE_DWORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001854 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001855 (i64 VectorExtractions.LE_DWORD_0)>;
1856 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
1857 (i64 VectorExtractions.BE_VARIABLE_DWORD)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001858} // IsBigEndian, HasDirectMove
1859
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001860// v4f32 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001861let Predicates = [IsLittleEndian, HasP8Vector] in {
1862 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1863 (v4f32 (XXSLDWI (XSCVDPSPN $A), (XSCVDPSPN $A), 1))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001864 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1865 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
1866 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001867 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001868 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
1869 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
1870 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
1871 (f32 (XSCVSPDPN $S))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001872 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
1873 (f32 VectorExtractions.LE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001874} // IsLittleEndian, HasP8Vector
1875
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001876// Variable index vector_extract for v2f64 does not require P8Vector
1877let Predicates = [IsLittleEndian, HasVSX] in
1878 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
1879 (f64 VectorExtractions.LE_VARIABLE_DOUBLE)>;
1880
Nemanja Ivanovicf57f1502016-11-29 23:00:33 +00001881 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x_be xoaddr:$src)), (LXVW4X xoaddr:$src)>;
1882 def : Pat<(v2f64 (int_ppc_vsx_lxvd2x_be xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Tony Jiang5f850cd2016-11-15 14:25:56 +00001883
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001884let Predicates = [IsLittleEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001885 // v16i8 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001886 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001887 (v16i8 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001888 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001889 (v8i16 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001890 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001891 (v4i32 MovesToVSR.LE_WORD_0)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001892 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001893 (v2i64 MovesToVSR.LE_DWORD_0)>;
1894 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001895 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001896 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001897 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001898 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001899 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001900 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001901 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001902 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001903 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001904 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001905 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001906 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001907 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001908 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001909 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001910 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001911 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001912 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001913 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001914 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001915 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001916 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001917 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001918 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001919 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001920 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001921 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001922 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001923 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001924 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001925 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001926 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001927 (i32 VectorExtractions.LE_VARIABLE_BYTE)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001928
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001929 // v8i16 scalar <-> vector conversions (LE)
1930 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001931 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001932 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001933 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001934 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001935 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001936 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001937 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001938 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001939 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001940 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001941 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001942 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001943 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001944 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001945 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001946 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001947 (i32 VectorExtractions.LE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001948
1949 // v4i32 scalar <-> vector conversions (LE)
1950 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001951 (i32 VectorExtractions.LE_WORD_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001952 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001953 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001954 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001955 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001956 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001957 (i32 VectorExtractions.LE_WORD_3)>;
1958 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
1959 (i32 VectorExtractions.LE_VARIABLE_WORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001960
1961 // v2i64 scalar <-> vector conversions (LE)
1962 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001963 (i64 VectorExtractions.LE_DWORD_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001964 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001965 (i64 VectorExtractions.LE_DWORD_1)>;
1966 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
1967 (i64 VectorExtractions.LE_VARIABLE_DWORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001968} // IsLittleEndian, HasDirectMove
Nemanja Ivanovic89224762015-12-15 14:50:34 +00001969
1970let Predicates = [HasDirectMove, HasVSX] in {
1971// bitconvert f32 -> i32
1972// (convert to 32-bit fp single, shift right 1 word, move to GPR)
1973def : Pat<(i32 (bitconvert f32:$S)),
1974 (i32 (MFVSRWZ (EXTRACT_SUBREG
1975 (XXSLDWI (XSCVDPSPN $S),(XSCVDPSPN $S), 3),
1976 sub_64)))>;
1977// bitconvert i32 -> f32
1978// (move to FPR, shift left 1 word, convert to 64-bit fp single)
1979def : Pat<(f32 (bitconvert i32:$A)),
1980 (f32 (XSCVSPDPN
1981 (XXSLDWI MovesToVSR.LE_WORD_1, MovesToVSR.LE_WORD_1, 1)))>;
1982
1983// bitconvert f64 -> i64
1984// (move to GPR, nothing else needed)
1985def : Pat<(i64 (bitconvert f64:$S)),
1986 (i64 (MFVSRD $S))>;
1987
1988// bitconvert i64 -> f64
1989// (move to FPR, nothing else needed)
1990def : Pat<(f64 (bitconvert i64:$S)),
1991 (f64 (MTVSRD $S))>;
1992}
Kit Barton93612ec2016-02-26 21:11:55 +00001993
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001994// Materialize a zero-vector of long long
1995def : Pat<(v2i64 immAllZerosV),
1996 (v2i64 (XXLXORz))>;
1997}
1998
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00001999def AlignValues {
2000 dag F32_TO_BE_WORD1 = (v4f32 (XXSLDWI (XSCVDPSPN $B), (XSCVDPSPN $B), 3));
2001 dag I32_TO_BE_WORD1 = (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC);
2002}
2003
Kit Barton93612ec2016-02-26 21:11:55 +00002004// The following VSX instructions were introduced in Power ISA 3.0
2005def HasP9Vector : Predicate<"PPCSubTarget->hasP9Vector()">;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002006let AddedComplexity = 400, Predicates = [HasP9Vector] in {
Kit Barton93612ec2016-02-26 21:11:55 +00002007
2008 // [PO VRT XO VRB XO /]
2009 class X_VT5_XO5_VB5<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2010 list<dag> pattern>
2011 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vrrc:$vB),
2012 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2013
2014 // [PO VRT XO VRB XO RO], Round to Odd version of [PO VRT XO VRB XO /]
2015 class X_VT5_XO5_VB5_Ro<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2016 list<dag> pattern>
2017 : X_VT5_XO5_VB5<opcode, xo2, xo, opc, pattern>, isDOT;
2018
2019 // [PO VRT XO VRB XO /], but the VRB is only used the left 64 bits (or less),
2020 // So we use different operand class for VRB
2021 class X_VT5_XO5_VB5_TyVB<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2022 RegisterOperand vbtype, list<dag> pattern>
2023 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vbtype:$vB),
2024 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2025
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002026 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002027 // [PO T XO B XO BX /]
2028 class XX2_RT5_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2029 list<dag> pattern>
2030 : XX2_RD5_XO5_RS6<opcode, xo2, xo, (outs g8rc:$rT), (ins vsfrc:$XB),
2031 !strconcat(opc, " $rT, $XB"), IIC_VecFP, pattern>;
2032
Kit Barton93612ec2016-02-26 21:11:55 +00002033 // [PO T XO B XO BX TX]
2034 class XX2_XT6_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2035 RegisterOperand vtype, list<dag> pattern>
2036 : XX2_RD6_XO5_RS6<opcode, xo2, xo, (outs vtype:$XT), (ins vtype:$XB),
2037 !strconcat(opc, " $XT, $XB"), IIC_VecFP, pattern>;
2038
2039 // [PO T A B XO AX BX TX], src and dest register use different operand class
2040 class XX3_XT5_XA5_XB5<bits<6> opcode, bits<8> xo, string opc,
2041 RegisterOperand xty, RegisterOperand aty, RegisterOperand bty,
2042 InstrItinClass itin, list<dag> pattern>
2043 : XX3Form<opcode, xo, (outs xty:$XT), (ins aty:$XA, bty:$XB),
2044 !strconcat(opc, " $XT, $XA, $XB"), itin, pattern>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002045 } // UseVSXReg = 1
Kit Barton93612ec2016-02-26 21:11:55 +00002046
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002047 // [PO VRT VRA VRB XO /]
2048 class X_VT5_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2049 list<dag> pattern>
2050 : XForm_1<opcode, xo, (outs vrrc:$vT), (ins vrrc:$vA, vrrc:$vB),
2051 !strconcat(opc, " $vT, $vA, $vB"), IIC_VecFP, pattern>;
2052
2053 // [PO VRT VRA VRB XO RO], Round to Odd version of [PO VRT VRA VRB XO /]
2054 class X_VT5_VA5_VB5_Ro<bits<6> opcode, bits<10> xo, string opc,
2055 list<dag> pattern>
2056 : X_VT5_VA5_VB5<opcode, xo, opc, pattern>, isDOT;
2057
2058 //===--------------------------------------------------------------------===//
2059 // Quad-Precision Scalar Move Instructions:
2060
2061 // Copy Sign
2062 def XSCPSGNQP : X_VT5_VA5_VB5<63, 100, "xscpsgnqp", []>;
2063
2064 // Absolute/Negative-Absolute/Negate
2065 def XSABSQP : X_VT5_XO5_VB5<63, 0, 804, "xsabsqp" , []>;
2066 def XSNABSQP : X_VT5_XO5_VB5<63, 8, 804, "xsnabsqp", []>;
2067 def XSNEGQP : X_VT5_XO5_VB5<63, 16, 804, "xsnegqp" , []>;
2068
2069 //===--------------------------------------------------------------------===//
2070 // Quad-Precision Scalar Floating-Point Arithmetic Instructions:
2071
2072 // Add/Divide/Multiply/Subtract
2073 def XSADDQP : X_VT5_VA5_VB5 <63, 4, "xsaddqp" , []>;
2074 def XSADDQPO : X_VT5_VA5_VB5_Ro<63, 4, "xsaddqpo", []>;
2075 def XSDIVQP : X_VT5_VA5_VB5 <63, 548, "xsdivqp" , []>;
2076 def XSDIVQPO : X_VT5_VA5_VB5_Ro<63, 548, "xsdivqpo", []>;
2077 def XSMULQP : X_VT5_VA5_VB5 <63, 36, "xsmulqp" , []>;
2078 def XSMULQPO : X_VT5_VA5_VB5_Ro<63, 36, "xsmulqpo", []>;
2079 def XSSUBQP : X_VT5_VA5_VB5 <63, 516, "xssubqp" , []>;
2080 def XSSUBQPO : X_VT5_VA5_VB5_Ro<63, 516, "xssubqpo", []>;
2081
2082 // Square-Root
2083 def XSSQRTQP : X_VT5_XO5_VB5 <63, 27, 804, "xssqrtqp" , []>;
2084 def XSSQRTQPO : X_VT5_XO5_VB5_Ro<63, 27, 804, "xssqrtqpo", []>;
2085
2086 // (Negative) Multiply-{Add/Subtract}
2087 def XSMADDQP : X_VT5_VA5_VB5 <63, 388, "xsmaddqp" , []>;
2088 def XSMADDQPO : X_VT5_VA5_VB5_Ro<63, 388, "xsmaddqpo" , []>;
2089 def XSMSUBQP : X_VT5_VA5_VB5 <63, 420, "xsmsubqp" , []>;
2090 def XSMSUBQPO : X_VT5_VA5_VB5_Ro<63, 420, "xsmsubqpo" , []>;
2091 def XSNMADDQP : X_VT5_VA5_VB5 <63, 452, "xsnmaddqp" , []>;
2092 def XSNMADDQPO: X_VT5_VA5_VB5_Ro<63, 452, "xsnmaddqpo", []>;
2093 def XSNMSUBQP : X_VT5_VA5_VB5 <63, 484, "xsnmsubqp" , []>;
2094 def XSNMSUBQPO: X_VT5_VA5_VB5_Ro<63, 484, "xsnmsubqpo", []>;
2095
Kit Barton93612ec2016-02-26 21:11:55 +00002096 //===--------------------------------------------------------------------===//
2097 // Quad/Double-Precision Compare Instructions:
2098
2099 // [PO BF // VRA VRB XO /]
2100 class X_BF3_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2101 list<dag> pattern>
2102 : XForm_17<opcode, xo, (outs crrc:$crD), (ins vrrc:$VA, vrrc:$VB),
2103 !strconcat(opc, " $crD, $VA, $VB"), IIC_FPCompare> {
2104 let Pattern = pattern;
2105 }
2106
2107 // QP Compare Ordered/Unordered
2108 def XSCMPOQP : X_BF3_VA5_VB5<63, 132, "xscmpoqp", []>;
2109 def XSCMPUQP : X_BF3_VA5_VB5<63, 644, "xscmpuqp", []>;
2110
2111 // DP/QP Compare Exponents
2112 def XSCMPEXPDP : XX3Form_1<60, 59,
2113 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002114 "xscmpexpdp $crD, $XA, $XB", IIC_FPCompare, []>,
2115 UseVSXReg;
Kit Barton93612ec2016-02-26 21:11:55 +00002116 def XSCMPEXPQP : X_BF3_VA5_VB5<63, 164, "xscmpexpqp", []>;
2117
2118 // DP Compare ==, >=, >, !=
2119 // Use vsrc for XT, because the entire register of XT is set.
2120 // XT.dword[1] = 0x0000_0000_0000_0000
2121 def XSCMPEQDP : XX3_XT5_XA5_XB5<60, 3, "xscmpeqdp", vsrc, vsfrc, vsfrc,
2122 IIC_FPCompare, []>;
2123 def XSCMPGEDP : XX3_XT5_XA5_XB5<60, 19, "xscmpgedp", vsrc, vsfrc, vsfrc,
2124 IIC_FPCompare, []>;
2125 def XSCMPGTDP : XX3_XT5_XA5_XB5<60, 11, "xscmpgtdp", vsrc, vsfrc, vsfrc,
2126 IIC_FPCompare, []>;
2127 def XSCMPNEDP : XX3_XT5_XA5_XB5<60, 27, "xscmpnedp", vsrc, vsfrc, vsfrc,
2128 IIC_FPCompare, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002129 let UseVSXReg = 1 in {
Kit Barton93612ec2016-02-26 21:11:55 +00002130 // Vector Compare Not Equal
2131 def XVCMPNEDP : XX3Form_Rc<60, 123,
2132 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2133 "xvcmpnedp $XT, $XA, $XB", IIC_VecFPCompare, []>;
2134 let Defs = [CR6] in
2135 def XVCMPNEDPo : XX3Form_Rc<60, 123,
2136 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2137 "xvcmpnedp. $XT, $XA, $XB", IIC_VecFPCompare, []>,
2138 isDOT;
2139 def XVCMPNESP : XX3Form_Rc<60, 91,
2140 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2141 "xvcmpnesp $XT, $XA, $XB", IIC_VecFPCompare, []>;
2142 let Defs = [CR6] in
2143 def XVCMPNESPo : XX3Form_Rc<60, 91,
2144 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2145 "xvcmpnesp. $XT, $XA, $XB", IIC_VecFPCompare, []>,
2146 isDOT;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002147 } // UseVSXReg = 1
Kit Barton93612ec2016-02-26 21:11:55 +00002148
2149 //===--------------------------------------------------------------------===//
2150 // Quad-Precision Floating-Point Conversion Instructions:
2151
2152 // Convert DP -> QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002153 def XSCVDPQP : X_VT5_XO5_VB5_TyVB<63, 22, 836, "xscvdpqp", vfrc, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002154
2155 // Round & Convert QP -> DP (dword[1] is set to zero)
2156 def XSCVQPDP : X_VT5_XO5_VB5 <63, 20, 836, "xscvqpdp" , []>;
2157 def XSCVQPDPO : X_VT5_XO5_VB5_Ro<63, 20, 836, "xscvqpdpo", []>;
2158
2159 // Truncate & Convert QP -> (Un)Signed (D)Word (dword[1] is set to zero)
2160 def XSCVQPSDZ : X_VT5_XO5_VB5<63, 25, 836, "xscvqpsdz", []>;
2161 def XSCVQPSWZ : X_VT5_XO5_VB5<63, 9, 836, "xscvqpswz", []>;
2162 def XSCVQPUDZ : X_VT5_XO5_VB5<63, 17, 836, "xscvqpudz", []>;
2163 def XSCVQPUWZ : X_VT5_XO5_VB5<63, 1, 836, "xscvqpuwz", []>;
2164
2165 // Convert (Un)Signed DWord -> QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002166 def XSCVSDQP : X_VT5_XO5_VB5_TyVB<63, 10, 836, "xscvsdqp", vfrc, []>;
2167 def XSCVUDQP : X_VT5_XO5_VB5_TyVB<63, 2, 836, "xscvudqp", vfrc, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002168
Sean Fertilea435e072016-11-14 18:43:59 +00002169 let UseVSXReg = 1 in {
Kit Barton93612ec2016-02-26 21:11:55 +00002170 //===--------------------------------------------------------------------===//
2171 // Round to Floating-Point Integer Instructions
2172
2173 // (Round &) Convert DP <-> HP
2174 // Note! xscvdphp's src and dest register both use the left 64 bits, so we use
2175 // vsfrc for src and dest register. xscvhpdp's src only use the left 16 bits,
2176 // but we still use vsfrc for it.
2177 def XSCVDPHP : XX2_XT6_XO5_XB6<60, 17, 347, "xscvdphp", vsfrc, []>;
2178 def XSCVHPDP : XX2_XT6_XO5_XB6<60, 16, 347, "xscvhpdp", vsfrc, []>;
2179
2180 // Vector HP -> SP
2181 def XVCVHPSP : XX2_XT6_XO5_XB6<60, 24, 475, "xvcvhpsp", vsrc, []>;
Nemanja Ivanovicec4b0c32016-11-11 21:42:01 +00002182 def XVCVSPHP : XX2_XT6_XO5_XB6<60, 25, 475, "xvcvsphp", vsrc,
2183 [(set v4f32:$XT,
2184 (int_ppc_vsx_xvcvsphp v4f32:$XB))]>;
Kit Barton93612ec2016-02-26 21:11:55 +00002185
Sean Fertilea435e072016-11-14 18:43:59 +00002186 } // UseVSXReg = 1
2187
2188 // Pattern for matching Vector HP -> Vector SP intrinsic. Defined as a
2189 // seperate pattern so that it can convert the input register class from
2190 // VRRC(v8i16) to VSRC.
2191 def : Pat<(v4f32 (int_ppc_vsx_xvcvhpsp v8i16:$A)),
2192 (v4f32 (XVCVHPSP (COPY_TO_REGCLASS $A, VSRC)))>;
2193
Kit Barton93612ec2016-02-26 21:11:55 +00002194 class Z23_VT5_R1_VB5_RMC2_EX1<bits<6> opcode, bits<8> xo, bit ex, string opc,
2195 list<dag> pattern>
2196 : Z23Form_1<opcode, xo,
2197 (outs vrrc:$vT), (ins u1imm:$r, vrrc:$vB, u2imm:$rmc),
2198 !strconcat(opc, " $r, $vT, $vB, $rmc"), IIC_VecFP, pattern> {
2199 let RC = ex;
2200 }
2201
2202 // Round to Quad-Precision Integer [with Inexact]
2203 def XSRQPI : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 0, "xsrqpi" , []>;
2204 def XSRQPIX : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 1, "xsrqpix", []>;
2205
2206 // Round Quad-Precision to Double-Extended Precision (fp80)
2207 def XSRQPXP : Z23_VT5_R1_VB5_RMC2_EX1<63, 37, 0, "xsrqpxp", []>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002208
2209 //===--------------------------------------------------------------------===//
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002210 // Insert/Extract Instructions
2211
2212 // Insert Exponent DP/QP
2213 // XT NOTE: XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU
2214 def XSIEXPDP : XX1Form <60, 918, (outs vsrc:$XT), (ins g8rc:$rA, g8rc:$rB),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002215 "xsiexpdp $XT, $rA, $rB", IIC_VecFP, []>, UseVSXReg;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002216 // vB NOTE: only vB.dword[0] is used, that's why we don't use
2217 // X_VT5_VA5_VB5 form
2218 def XSIEXPQP : XForm_18<63, 868, (outs vrrc:$vT), (ins vrrc:$vA, vsfrc:$vB),
2219 "xsiexpqp $vT, $vA, $vB", IIC_VecFP, []>;
2220
2221 // Extract Exponent/Significand DP/QP
2222 def XSXEXPDP : XX2_RT5_XO5_XB6<60, 0, 347, "xsxexpdp", []>;
2223 def XSXSIGDP : XX2_RT5_XO5_XB6<60, 1, 347, "xsxsigdp", []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002224
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002225 def XSXEXPQP : X_VT5_XO5_VB5 <63, 2, 804, "xsxexpqp", []>;
2226 def XSXSIGQP : X_VT5_XO5_VB5 <63, 18, 804, "xsxsigqp", []>;
2227
2228 // Vector Insert Word
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002229 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002230 // XB NOTE: Only XB.dword[1] is used, but we use vsrc on XB.
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002231 def XXINSERTW :
2232 XX2_RD6_UIM5_RS6<60, 181, (outs vsrc:$XT),
2233 (ins vsrc:$XTi, vsrc:$XB, u4imm:$UIM),
2234 "xxinsertw $XT, $XB, $UIM", IIC_VecFP,
2235 [(set v4i32:$XT, (PPCxxinsert v4i32:$XTi, v4i32:$XB,
2236 imm32SExt16:$UIM))]>,
2237 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002238
2239 // Vector Extract Unsigned Word
2240 def XXEXTRACTUW : XX2_RD6_UIM5_RS6<60, 165,
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002241 (outs vsfrc:$XT), (ins vsrc:$XB, u4imm:$UIMM),
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002242 "xxextractuw $XT, $XB, $UIMM", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002243 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002244
2245 // Vector Insert Exponent DP/SP
2246 def XVIEXPDP : XX3_XT5_XA5_XB5<60, 248, "xviexpdp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002247 IIC_VecFP, [(set v2f64: $XT,(int_ppc_vsx_xviexpdp v2i64:$XA, v2i64:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002248 def XVIEXPSP : XX3_XT5_XA5_XB5<60, 216, "xviexpsp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002249 IIC_VecFP, [(set v4f32: $XT,(int_ppc_vsx_xviexpsp v4i32:$XA, v4i32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002250
2251 // Vector Extract Exponent/Significand DP/SP
Sean Fertileadda5b22016-11-14 14:42:37 +00002252 def XVXEXPDP : XX2_XT6_XO5_XB6<60, 0, 475, "xvxexpdp", vsrc,
2253 [(set v2i64: $XT,
2254 (int_ppc_vsx_xvxexpdp v2f64:$XB))]>;
2255 def XVXEXPSP : XX2_XT6_XO5_XB6<60, 8, 475, "xvxexpsp", vsrc,
2256 [(set v4i32: $XT,
2257 (int_ppc_vsx_xvxexpsp v4f32:$XB))]>;
2258 def XVXSIGDP : XX2_XT6_XO5_XB6<60, 1, 475, "xvxsigdp", vsrc,
2259 [(set v2i64: $XT,
2260 (int_ppc_vsx_xvxsigdp v2f64:$XB))]>;
2261 def XVXSIGSP : XX2_XT6_XO5_XB6<60, 9, 475, "xvxsigsp", vsrc,
2262 [(set v4i32: $XT,
2263 (int_ppc_vsx_xvxsigsp v4f32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002264
2265 //===--------------------------------------------------------------------===//
2266
2267 // Test Data Class SP/DP/QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002268 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002269 def XSTSTDCSP : XX2_BF3_DCMX7_RS6<60, 298,
2270 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2271 "xststdcsp $BF, $XB, $DCMX", IIC_VecFP, []>;
2272 def XSTSTDCDP : XX2_BF3_DCMX7_RS6<60, 362,
2273 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2274 "xststdcdp $BF, $XB, $DCMX", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002275 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002276 def XSTSTDCQP : X_BF3_DCMX7_RS5 <63, 708,
2277 (outs crrc:$BF), (ins u7imm:$DCMX, vrrc:$vB),
2278 "xststdcqp $BF, $vB, $DCMX", IIC_VecFP, []>;
2279
2280 // Vector Test Data Class SP/DP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002281 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002282 def XVTSTDCSP : XX2_RD6_DCMX7_RS6<60, 13, 5,
2283 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002284 "xvtstdcsp $XT, $XB, $DCMX", IIC_VecFP,
2285 [(set v4i32: $XT,
2286 (int_ppc_vsx_xvtstdcsp v4f32:$XB, imm:$DCMX))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002287 def XVTSTDCDP : XX2_RD6_DCMX7_RS6<60, 15, 5,
2288 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002289 "xvtstdcdp $XT, $XB, $DCMX", IIC_VecFP,
2290 [(set v2i64: $XT,
2291 (int_ppc_vsx_xvtstdcdp v2f64:$XB, imm:$DCMX))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002292 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002293
2294 //===--------------------------------------------------------------------===//
2295
2296 // Maximum/Minimum Type-C/Type-J DP
2297 // XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU, so we use vsrc for XT
2298 def XSMAXCDP : XX3_XT5_XA5_XB5<60, 128, "xsmaxcdp", vsrc, vsfrc, vsfrc,
2299 IIC_VecFP, []>;
2300 def XSMAXJDP : XX3_XT5_XA5_XB5<60, 144, "xsmaxjdp", vsrc, vsfrc, vsfrc,
2301 IIC_VecFP, []>;
2302 def XSMINCDP : XX3_XT5_XA5_XB5<60, 136, "xsmincdp", vsrc, vsfrc, vsfrc,
2303 IIC_VecFP, []>;
2304 def XSMINJDP : XX3_XT5_XA5_XB5<60, 152, "xsminjdp", vsrc, vsfrc, vsfrc,
2305 IIC_VecFP, []>;
2306
2307 //===--------------------------------------------------------------------===//
2308
2309 // Vector Byte-Reverse H/W/D/Q Word
2310 def XXBRH : XX2_XT6_XO5_XB6<60, 7, 475, "xxbrh", vsrc, []>;
2311 def XXBRW : XX2_XT6_XO5_XB6<60, 15, 475, "xxbrw", vsrc, []>;
2312 def XXBRD : XX2_XT6_XO5_XB6<60, 23, 475, "xxbrd", vsrc, []>;
2313 def XXBRQ : XX2_XT6_XO5_XB6<60, 31, 475, "xxbrq", vsrc, []>;
2314
2315 // Vector Permute
2316 def XXPERM : XX3_XT5_XA5_XB5<60, 26, "xxperm" , vsrc, vsrc, vsrc,
2317 IIC_VecPerm, []>;
2318 def XXPERMR : XX3_XT5_XA5_XB5<60, 58, "xxpermr", vsrc, vsrc, vsrc,
2319 IIC_VecPerm, []>;
2320
2321 // Vector Splat Immediate Byte
2322 def XXSPLTIB : X_RD6_IMM8<60, 360, (outs vsrc:$XT), (ins u8imm:$IMM8),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002323 "xxspltib $XT, $IMM8", IIC_VecPerm, []>, UseVSXReg;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002324
2325 //===--------------------------------------------------------------------===//
Kit Bartonba532dc2016-03-08 03:49:13 +00002326 // Vector/Scalar Load/Store Instructions
2327
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002328 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2329 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Kit Bartonba532dc2016-03-08 03:49:13 +00002330 let mayLoad = 1 in {
2331 // Load Vector
2332 def LXV : DQ_RD6_RS5_DQ12<61, 1, (outs vsrc:$XT), (ins memrix16:$src),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002333 "lxv $XT, $src", IIC_LdStLFD, []>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002334 // Load DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002335 def LXSD : DSForm_1<57, 2, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002336 "lxsd $vD, $src", IIC_LdStLFD, []>;
2337 // Load SP from src, convert it to DP, and place in dword[0]
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002338 def LXSSP : DSForm_1<57, 3, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002339 "lxssp $vD, $src", IIC_LdStLFD, []>;
2340
2341 // [PO T RA RB XO TX] almost equal to [PO S RA RB XO SX], but has different
2342 // "out" and "in" dag
2343 class X_XT6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2344 RegisterOperand vtype, list<dag> pattern>
2345 : XX1Form<opcode, xo, (outs vtype:$XT), (ins memrr:$src),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002346 !strconcat(opc, " $XT, $src"), IIC_LdStLFD, pattern>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002347
2348 // Load as Integer Byte/Halfword & Zero Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002349 def LXSIBZX : X_XT6_RA5_RB5<31, 781, "lxsibzx", vsfrc,
2350 [(set f64:$XT, (PPClxsizx xoaddr:$src, 1))]>;
2351 def LXSIHZX : X_XT6_RA5_RB5<31, 813, "lxsihzx", vsfrc,
2352 [(set f64:$XT, (PPClxsizx xoaddr:$src, 2))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002353
2354 // Load Vector Halfword*8/Byte*16 Indexed
2355 def LXVH8X : X_XT6_RA5_RB5<31, 812, "lxvh8x" , vsrc, []>;
2356 def LXVB16X : X_XT6_RA5_RB5<31, 876, "lxvb16x", vsrc, []>;
2357
2358 // Load Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002359 def LXVX : X_XT6_RA5_RB5<31, 268, "lxvx" , vsrc,
2360 [(set v2f64:$XT, (load xoaddr:$src))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002361
2362 // Load Vector (Left-justified) with Length
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002363 def LXVL : XX1Form<31, 269, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
2364 "lxvl $XT, $src, $rB", IIC_LdStLoad,
2365 [(set v4i32:$XT, (int_ppc_vsx_lxvl addr:$src, i64:$rB))]>,
2366 UseVSXReg;
2367 def LXVLL : XX1Form<31,301, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
2368 "lxvll $XT, $src, $rB", IIC_LdStLoad,
2369 [(set v4i32:$XT, (int_ppc_vsx_lxvll addr:$src, i64:$rB))]>,
2370 UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002371
2372 // Load Vector Word & Splat Indexed
2373 def LXVWSX : X_XT6_RA5_RB5<31, 364, "lxvwsx" , vsrc, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002374 } // mayLoad
Kit Bartonba532dc2016-03-08 03:49:13 +00002375
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002376 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2377 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Kit Bartonba532dc2016-03-08 03:49:13 +00002378 let mayStore = 1 in {
2379 // Store Vector
2380 def STXV : DQ_RD6_RS5_DQ12<61, 5, (outs), (ins vsrc:$XT, memrix16:$dst),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002381 "stxv $XT, $dst", IIC_LdStSTFD, []>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002382 // Store DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002383 def STXSD : DSForm_1<61, 2, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002384 "stxsd $vS, $dst", IIC_LdStSTFD, []>;
2385 // Convert DP of dword[0] to SP, and Store to dst
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002386 def STXSSP : DSForm_1<61, 3, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002387 "stxssp $vS, $dst", IIC_LdStSTFD, []>;
2388
2389 // [PO S RA RB XO SX]
2390 class X_XS6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2391 RegisterOperand vtype, list<dag> pattern>
2392 : XX1Form<opcode, xo, (outs), (ins vtype:$XT, memrr:$dst),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002393 !strconcat(opc, " $XT, $dst"), IIC_LdStSTFD, pattern>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002394
2395 // Store as Integer Byte/Halfword Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002396 def STXSIBX : X_XS6_RA5_RB5<31, 909, "stxsibx" , vsfrc,
2397 [(PPCstxsix f64:$XT, xoaddr:$dst, 1)]>;
2398 def STXSIHX : X_XS6_RA5_RB5<31, 941, "stxsihx" , vsfrc,
2399 [(PPCstxsix f64:$XT, xoaddr:$dst, 2)]>;
2400 let isCodeGenOnly = 1 in {
2401 def STXSIBXv : X_XS6_RA5_RB5<31, 909, "stxsibx" , vrrc, []>;
2402 def STXSIHXv : X_XS6_RA5_RB5<31, 941, "stxsihx" , vrrc, []>;
2403 }
Kit Bartonba532dc2016-03-08 03:49:13 +00002404
2405 // Store Vector Halfword*8/Byte*16 Indexed
2406 def STXVH8X : X_XS6_RA5_RB5<31, 940, "stxvh8x" , vsrc, []>;
2407 def STXVB16X : X_XS6_RA5_RB5<31, 1004, "stxvb16x", vsrc, []>;
2408
2409 // Store Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002410 def STXVX : X_XS6_RA5_RB5<31, 396, "stxvx" , vsrc,
2411 [(store v2f64:$XT, xoaddr:$dst)]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002412
2413 // Store Vector (Left-justified) with Length
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002414 def STXVL : XX1Form<31, 397, (outs), (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2415 "stxvl $XT, $dst, $rB", IIC_LdStLoad,
2416 [(int_ppc_vsx_stxvl v4i32:$XT, addr:$dst, i64:$rB)]>,
2417 UseVSXReg;
2418 def STXVLL : XX1Form<31, 429, (outs), (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2419 "stxvll $XT, $dst, $rB", IIC_LdStLoad,
2420 [(int_ppc_vsx_stxvll v4i32:$XT, addr:$dst, i64:$rB)]>,
2421 UseVSXReg;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002422 } // mayStore
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002423
2424 // Patterns for which instructions from ISA 3.0 are a better match
2425 let Predicates = [IsLittleEndian, HasP9Vector] in {
2426 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 0))))),
2427 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
2428 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 1))))),
2429 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
2430 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 2))))),
2431 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
2432 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 3))))),
2433 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
2434 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
2435 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
2436 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
2437 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
2438 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
2439 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
2440 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
2441 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
2442 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
2443 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
2444 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
2445 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
2446 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
2447 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
2448 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
2449 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
2450 } // IsLittleEndian, HasP9Vector
2451
2452 let Predicates = [IsBigEndian, HasP9Vector] in {
2453 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 0))))),
2454 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
2455 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 1))))),
2456 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
2457 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 2))))),
2458 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
2459 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 3))))),
2460 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
2461 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
2462 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
2463 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
2464 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
2465 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
2466 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
2467 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
2468 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
2469 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
2470 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
2471 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
2472 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
2473 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
2474 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
2475 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
2476 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
2477 } // IsLittleEndian, HasP9Vector
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002478
2479 def : Pat<(v2f64 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2480 def : Pat<(v2i64 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2481 def : Pat<(v4f32 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2482 def : Pat<(v4i32 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2483 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x xoaddr:$src)), (LXVX xoaddr:$src)>;
2484 def : Pat<(v2f64 (int_ppc_vsx_lxvd2x xoaddr:$src)), (LXVX xoaddr:$src)>;
2485 def : Pat<(store v2f64:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2486 def : Pat<(store v2i64:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2487 def : Pat<(store v4f32:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2488 def : Pat<(store v4i32:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2489 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
2490 (STXVX $rS, xoaddr:$dst)>;
2491 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
2492 (STXVX $rS, xoaddr:$dst)>;
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002493
2494 def : Pat<(v4i32 (scalar_to_vector (i32 (load xoaddr:$src)))),
2495 (v4i32 (LXVWSX xoaddr:$src))>;
2496 def : Pat<(v4f32 (scalar_to_vector (f32 (load xoaddr:$src)))),
2497 (v4f32 (LXVWSX xoaddr:$src))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002498 def : Pat<(v4f32 (scalar_to_vector (f32 (fpround (extloadf32 xoaddr:$src))))),
2499 (v4f32 (LXVWSX xoaddr:$src))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002500
2501 // Build vectors from i8 loads
2502 def : Pat<(v16i8 (scalar_to_vector ScalarLoads.Li8)),
2503 (v16i8 (VSPLTBs 7, (LXSIBZX xoaddr:$src)))>;
2504 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.ZELi8)),
2505 (v8i16 (VSPLTHs 3, (LXSIBZX xoaddr:$src)))>;
2506 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi8)),
2507 (v4i32 (XXSPLTWs (LXSIBZX xoaddr:$src), 1))>;
2508 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi8i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002509 (v2i64 (XXPERMDIs (LXSIBZX xoaddr:$src), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002510 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi8)),
2511 (v4i32 (XXSPLTWs (VEXTSB2Ws (LXSIBZX xoaddr:$src)), 1))>;
2512 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi8i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002513 (v2i64 (XXPERMDIs (VEXTSB2Ds (LXSIBZX xoaddr:$src)), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002514
2515 // Build vectors from i16 loads
2516 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.Li16)),
2517 (v8i16 (VSPLTHs 3, (LXSIHZX xoaddr:$src)))>;
2518 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi16)),
2519 (v4i32 (XXSPLTWs (LXSIHZX xoaddr:$src), 1))>;
2520 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi16i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002521 (v2i64 (XXPERMDIs (LXSIHZX xoaddr:$src), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002522 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi16)),
2523 (v4i32 (XXSPLTWs (VEXTSH2Ws (LXSIHZX xoaddr:$src)), 1))>;
2524 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi16i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002525 (v2i64 (XXPERMDIs (VEXTSH2Ds (LXSIHZX xoaddr:$src)), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002526
2527 let Predicates = [IsBigEndian, HasP9Vector] in {
2528 // Scalar stores of i8
2529 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
2530 (STXSIBXv (VSLDOI $S, $S, 9), xoaddr:$dst)>;
2531 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
2532 (STXSIBXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2533 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
2534 (STXSIBXv (VSLDOI $S, $S, 11), xoaddr:$dst)>;
2535 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
2536 (STXSIBXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2537 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
2538 (STXSIBXv (VSLDOI $S, $S, 13), xoaddr:$dst)>;
2539 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
2540 (STXSIBXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2541 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
2542 (STXSIBXv (VSLDOI $S, $S, 15), xoaddr:$dst)>;
2543 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
2544 (STXSIBXv $S, xoaddr:$dst)>;
2545 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
2546 (STXSIBXv (VSLDOI $S, $S, 1), xoaddr:$dst)>;
2547 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
2548 (STXSIBXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2549 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
2550 (STXSIBXv (VSLDOI $S, $S, 3), xoaddr:$dst)>;
2551 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
2552 (STXSIBXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2553 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
2554 (STXSIBXv (VSLDOI $S, $S, 5), xoaddr:$dst)>;
2555 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
2556 (STXSIBXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2557 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
2558 (STXSIBXv (VSLDOI $S, $S, 7), xoaddr:$dst)>;
2559 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
2560 (STXSIBXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2561
2562 // Scalar stores of i16
2563 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
2564 (STXSIHXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2565 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
2566 (STXSIHXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2567 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
2568 (STXSIHXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2569 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
2570 (STXSIHXv $S, xoaddr:$dst)>;
2571 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
2572 (STXSIHXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2573 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
2574 (STXSIHXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2575 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
2576 (STXSIHXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2577 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
2578 (STXSIHXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2579 } // IsBigEndian, HasP9Vector
2580
2581 let Predicates = [IsLittleEndian, HasP9Vector] in {
2582 // Scalar stores of i8
2583 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
2584 (STXSIBXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2585 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
2586 (STXSIBXv (VSLDOI $S, $S, 7), xoaddr:$dst)>;
2587 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
2588 (STXSIBXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2589 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
2590 (STXSIBXv (VSLDOI $S, $S, 5), xoaddr:$dst)>;
2591 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
2592 (STXSIBXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2593 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
2594 (STXSIBXv (VSLDOI $S, $S, 3), xoaddr:$dst)>;
2595 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
2596 (STXSIBXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2597 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
2598 (STXSIBXv (VSLDOI $S, $S, 1), xoaddr:$dst)>;
2599 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
2600 (STXSIBXv $S, xoaddr:$dst)>;
2601 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
2602 (STXSIBXv (VSLDOI $S, $S, 15), xoaddr:$dst)>;
2603 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
2604 (STXSIBXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2605 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
2606 (STXSIBXv (VSLDOI $S, $S, 13), xoaddr:$dst)>;
2607 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
2608 (STXSIBXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2609 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
2610 (STXSIBXv (VSLDOI $S, $S, 11), xoaddr:$dst)>;
2611 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
2612 (STXSIBXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2613 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
2614 (STXSIBXv (VSLDOI $S, $S, 9), xoaddr:$dst)>;
2615
2616 // Scalar stores of i16
2617 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
2618 (STXSIHXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2619 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
2620 (STXSIHXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2621 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
2622 (STXSIHXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2623 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
2624 (STXSIHXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2625 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
2626 (STXSIHXv $S, xoaddr:$dst)>;
2627 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
2628 (STXSIHXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2629 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
2630 (STXSIHXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2631 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
2632 (STXSIHXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2633 } // IsLittleEndian, HasP9Vector
2634
2635 // Vector sign extensions
2636 def : Pat<(f64 (PPCVexts f64:$A, 1)),
2637 (f64 (COPY_TO_REGCLASS (VEXTSB2Ds $A), VSFRC))>;
2638 def : Pat<(f64 (PPCVexts f64:$A, 2)),
2639 (f64 (COPY_TO_REGCLASS (VEXTSH2Ds $A), VSFRC))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002640
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002641 let isPseudo = 1 in {
2642 def DFLOADf32 : Pseudo<(outs vssrc:$XT), (ins memrix:$src),
2643 "#DFLOADf32",
2644 [(set f32:$XT, (load iaddr:$src))]>;
2645 def DFLOADf64 : Pseudo<(outs vsfrc:$XT), (ins memrix:$src),
2646 "#DFLOADf64",
2647 [(set f64:$XT, (load iaddr:$src))]>;
2648 def DFSTOREf32 : Pseudo<(outs), (ins vssrc:$XT, memrix:$dst),
2649 "#DFSTOREf32",
2650 [(store f32:$XT, iaddr:$dst)]>;
2651 def DFSTOREf64 : Pseudo<(outs), (ins vsfrc:$XT, memrix:$dst),
2652 "#DFSTOREf64",
2653 [(store f64:$XT, iaddr:$dst)]>;
2654 }
2655 def : Pat<(f64 (extloadf32 iaddr:$src)),
2656 (COPY_TO_REGCLASS (DFLOADf32 iaddr:$src), VSFRC)>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002657 def : Pat<(f32 (fpround (extloadf32 iaddr:$src))),
2658 (f32 (DFLOADf32 iaddr:$src))>;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002659} // end HasP9Vector, AddedComplexity
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002660
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002661// Integer extend helper dags 32 -> 64
2662def AnyExts {
2663 dag A = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32);
2664 dag B = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $B, sub_32);
2665 dag C = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $C, sub_32);
2666 dag D = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $D, sub_32);
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002667}
2668
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002669def DblToFlt {
2670 dag A0 = (f32 (fpround (f64 (extractelt v2f64:$A, 0))));
2671 dag A1 = (f32 (fpround (f64 (extractelt v2f64:$A, 1))));
2672 dag B0 = (f32 (fpround (f64 (extractelt v2f64:$B, 0))));
2673 dag B1 = (f32 (fpround (f64 (extractelt v2f64:$B, 1))));
2674}
2675def FltToIntLoad {
2676 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (extloadf32 xoaddr:$A)))));
2677}
2678def FltToUIntLoad {
2679 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (extloadf32 xoaddr:$A)))));
2680}
2681def FltToLongLoad {
2682 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (extloadf32 xoaddr:$A)))));
2683}
2684def FltToULongLoad {
2685 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (extloadf32 xoaddr:$A)))));
2686}
2687def FltToLong {
2688 dag A = (i64 (PPCmfvsr (PPCfctidz (fpextend f32:$A))));
2689}
2690def FltToULong {
2691 dag A = (i64 (PPCmfvsr (PPCfctiduz (fpextend f32:$A))));
2692}
2693def DblToInt {
2694 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwz f64:$A))));
2695}
2696def DblToUInt {
2697 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwuz f64:$A))));
2698}
2699def DblToLong {
2700 dag A = (i64 (PPCmfvsr (f64 (PPCfctidz f64:$A))));
2701}
2702def DblToULong {
2703 dag A = (i64 (PPCmfvsr (f64 (PPCfctiduz f64:$A))));
2704}
2705def DblToIntLoad {
2706 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (load xoaddr:$A)))));
2707}
2708def DblToUIntLoad {
2709 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (load xoaddr:$A)))));
2710}
2711def DblToLongLoad {
2712 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (load xoaddr:$A)))));
2713}
2714def DblToULongLoad {
2715 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (load xoaddr:$A)))));
2716}
2717
2718// FP merge dags (for f32 -> v4f32)
2719def MrgFP {
2720 dag AC = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $A, VSRC),
2721 (COPY_TO_REGCLASS $C, VSRC), 0));
2722 dag BD = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $B, VSRC),
2723 (COPY_TO_REGCLASS $D, VSRC), 0));
2724 dag ABhToFlt = (XVCVDPSP (XXPERMDI $A, $B, 0));
2725 dag ABlToFlt = (XVCVDPSP (XXPERMDI $A, $B, 3));
2726 dag BAhToFlt = (XVCVDPSP (XXPERMDI $B, $A, 0));
2727 dag BAlToFlt = (XVCVDPSP (XXPERMDI $B, $A, 3));
2728}
2729
2730// Patterns for BUILD_VECTOR nodes.
2731def NoP9Vector : Predicate<"!PPCSubTarget->hasP9Vector()">;
2732let AddedComplexity = 400 in {
2733
2734 let Predicates = [HasVSX] in {
2735 // Build vectors of floating point converted to i32.
2736 def : Pat<(v4i32 (build_vector DblToInt.A, DblToInt.A,
2737 DblToInt.A, DblToInt.A)),
2738 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPSXWS $A), VSRC), 1))>;
2739 def : Pat<(v4i32 (build_vector DblToUInt.A, DblToUInt.A,
2740 DblToUInt.A, DblToUInt.A)),
2741 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPUXWS $A), VSRC), 1))>;
2742 def : Pat<(v2i64 (build_vector DblToLong.A, DblToLong.A)),
2743 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC),
2744 (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC), 0))>;
2745 def : Pat<(v2i64 (build_vector DblToULong.A, DblToULong.A)),
2746 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC),
2747 (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC), 0))>;
2748 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
2749 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2750 (XSCVDPSXWSs (LXSSPX xoaddr:$A)), VSRC), 1))>;
2751 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
2752 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2753 (XSCVDPUXWSs (LXSSPX xoaddr:$A)), VSRC), 1))>;
2754 def : Pat<(v4f32 (build_vector f32:$A, f32:$A, f32:$A, f32:$A)),
2755 (v4f32 (XXSPLTW (v4f32 (XSCVDPSPN $A)), 0))>;
2756
2757 // Build vectors of floating point converted to i64.
2758 def : Pat<(v2i64 (build_vector FltToLong.A, FltToLong.A)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002759 (v2i64 (XXPERMDIs
2760 (COPY_TO_REGCLASS (XSCVDPSXDSs $A), VSFRC), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002761 def : Pat<(v2i64 (build_vector FltToULong.A, FltToULong.A)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00002762 (v2i64 (XXPERMDIs
2763 (COPY_TO_REGCLASS (XSCVDPUXDSs $A), VSFRC), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002764 def : Pat<(v2i64 (scalar_to_vector DblToLongLoad.A)),
2765 (v2i64 (XVCVDPSXDS (LXVDSX xoaddr:$A)))>;
2766 def : Pat<(v2i64 (scalar_to_vector DblToULongLoad.A)),
2767 (v2i64 (XVCVDPUXDS (LXVDSX xoaddr:$A)))>;
2768 }
2769
2770 let Predicates = [HasVSX, NoP9Vector] in {
2771 // Load-and-splat with fp-to-int conversion (using X-Form VSX loads).
2772 def : Pat<(v4i32 (scalar_to_vector DblToIntLoad.A)),
2773 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2774 (XSCVDPSXWS (LXSDX xoaddr:$A)), VSRC), 1))>;
2775 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoad.A)),
2776 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2777 (XSCVDPUXWS (LXSDX xoaddr:$A)), VSRC), 1))>;
2778 def : Pat<(v2i64 (scalar_to_vector FltToLongLoad.A)),
2779 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
2780 (LXSSPX xoaddr:$A), VSFRC)), 0))>;
2781 def : Pat<(v2i64 (scalar_to_vector FltToULongLoad.A)),
2782 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
2783 (LXSSPX xoaddr:$A), VSFRC)), 0))>;
2784 }
2785
2786 // Big endian, available on all targets with VSX
2787 let Predicates = [IsBigEndian, HasVSX] in {
2788 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
2789 (v2f64 (XXPERMDI
2790 (COPY_TO_REGCLASS $A, VSRC),
2791 (COPY_TO_REGCLASS $B, VSRC), 0))>;
2792
2793 def : Pat<(v4f32 (build_vector f32:$A, f32:$B, f32:$C, f32:$D)),
2794 (VMRGEW MrgFP.AC, MrgFP.BD)>;
2795 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
2796 DblToFlt.B0, DblToFlt.B1)),
2797 (v4f32 (VMRGEW MrgFP.ABhToFlt, MrgFP.ABlToFlt))>;
2798 }
2799
2800 let Predicates = [IsLittleEndian, HasVSX] in {
2801 // Little endian, available on all targets with VSX
2802 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
2803 (v2f64 (XXPERMDI
2804 (COPY_TO_REGCLASS $B, VSRC),
2805 (COPY_TO_REGCLASS $A, VSRC), 0))>;
2806
2807 def : Pat<(v4f32 (build_vector f32:$D, f32:$C, f32:$B, f32:$A)),
2808 (VMRGEW MrgFP.AC, MrgFP.BD)>;
2809 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
2810 DblToFlt.B0, DblToFlt.B1)),
2811 (v4f32 (VMRGEW MrgFP.BAhToFlt, MrgFP.BAlToFlt))>;
2812 }
2813
2814 let Predicates = [HasDirectMove] in {
2815 // Endianness-neutral constant splat on P8 and newer targets. The reason
2816 // for this pattern is that on targets with direct moves, we don't expand
2817 // BUILD_VECTOR nodes for v4i32.
2818 def : Pat<(v4i32 (build_vector immSExt5NonZero:$A, immSExt5NonZero:$A,
2819 immSExt5NonZero:$A, immSExt5NonZero:$A)),
2820 (v4i32 (VSPLTISW imm:$A))>;
2821 }
2822
2823 let Predicates = [IsBigEndian, HasDirectMove, NoP9Vector] in {
2824 // Big endian integer vectors using direct moves.
2825 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
2826 (v2i64 (XXPERMDI
2827 (COPY_TO_REGCLASS (MTVSRD $A), VSRC),
2828 (COPY_TO_REGCLASS (MTVSRD $B), VSRC), 0))>;
2829 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2830 (VMRGOW (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC),
2831 (COPY_TO_REGCLASS (MTVSRWZ $C), VSRC), 0),
2832 (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC),
2833 (COPY_TO_REGCLASS (MTVSRWZ $D), VSRC), 0))>;
2834 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
2835 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
2836 }
2837
2838 let Predicates = [IsLittleEndian, HasDirectMove, NoP9Vector] in {
2839 // Little endian integer vectors using direct moves.
2840 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
2841 (v2i64 (XXPERMDI
2842 (COPY_TO_REGCLASS (MTVSRD $B), VSRC),
2843 (COPY_TO_REGCLASS (MTVSRD $A), VSRC), 0))>;
2844 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2845 (VMRGOW (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $D), VSRC),
2846 (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC), 0),
2847 (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $C), VSRC),
2848 (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 0))>;
2849 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
2850 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
2851 }
2852
2853 let Predicates = [HasP9Vector] in {
2854 // Endianness-neutral patterns for const splats with ISA 3.0 instructions.
2855 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
2856 (v4i32 (MTVSRWS $A))>;
2857 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
2858 (v4i32 (MTVSRWS $A))>;
2859 def : Pat<(v16i8 (build_vector immSExt8:$A, immSExt8:$A, immSExt8:$A,
2860 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2861 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2862 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2863 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2864 immSExt8:$A)),
2865 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB imm:$A), VSRC))>;
2866 def : Pat<(v16i8 immAllOnesV),
2867 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
2868 def : Pat<(v8i16 immAllOnesV),
2869 (v8i16 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
2870 def : Pat<(v4i32 immAllOnesV),
2871 (v4i32 (XXSPLTIB 255))>;
2872 def : Pat<(v2i64 immAllOnesV),
2873 (v2i64 (XXSPLTIB 255))>;
2874 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
2875 (v4i32 (XVCVSPSXWS (LXVWSX xoaddr:$A)))>;
2876 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
2877 (v4i32 (XVCVSPUXWS (LXVWSX xoaddr:$A)))>;
2878 def : Pat<(v4i32 (scalar_to_vector DblToIntLoad.A)),
2879 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2880 (XSCVDPSXWS (DFLOADf64 iaddr:$A)), VSRC), 1))>;
2881 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoad.A)),
2882 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2883 (XSCVDPUXWS (DFLOADf64 iaddr:$A)), VSRC), 1))>;
2884 def : Pat<(v2i64 (scalar_to_vector FltToLongLoad.A)),
2885 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
2886 (DFLOADf32 iaddr:$A),
2887 VSFRC)), 0))>;
2888 def : Pat<(v2i64 (scalar_to_vector FltToULongLoad.A)),
2889 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
2890 (DFLOADf32 iaddr:$A),
2891 VSFRC)), 0))>;
2892 }
2893
2894 let Predicates = [IsISA3_0, HasDirectMove, IsBigEndian] in {
2895 def : Pat<(i64 (extractelt v2i64:$A, 1)),
2896 (i64 (MFVSRLD $A))>;
2897 // Better way to build integer vectors if we have MTVSRDD. Big endian.
2898 def : Pat<(v2i64 (build_vector i64:$rB, i64:$rA)),
2899 (v2i64 (MTVSRDD $rB, $rA))>;
2900 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2901 (VMRGOW (COPY_TO_REGCLASS (MTVSRDD AnyExts.A, AnyExts.C), VSRC),
2902 (COPY_TO_REGCLASS (MTVSRDD AnyExts.B, AnyExts.D), VSRC))>;
2903 }
2904
2905 let Predicates = [IsISA3_0, HasDirectMove, IsLittleEndian] in {
2906 def : Pat<(i64 (extractelt v2i64:$A, 0)),
2907 (i64 (MFVSRLD $A))>;
2908 // Better way to build integer vectors if we have MTVSRDD. Little endian.
2909 def : Pat<(v2i64 (build_vector i64:$rA, i64:$rB)),
2910 (v2i64 (MTVSRDD $rB, $rA))>;
2911 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2912 (VMRGOW (COPY_TO_REGCLASS (MTVSRDD AnyExts.D, AnyExts.B), VSRC),
2913 (COPY_TO_REGCLASS (MTVSRDD AnyExts.C, AnyExts.A), VSRC))>;
2914 }
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002915}