blob: b0c1bcc40ca89f2360a0b6d30c5947d40a896209 [file] [log] [blame]
Hal Finkel27774d92014-03-13 07:58:58 +00001//===- PPCInstrVSX.td - The PowerPC VSX Extension --*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file describes the VSX extension to the PowerPC instruction set.
11//
12//===----------------------------------------------------------------------===//
13
Bill Schmidtfe723b92015-04-27 19:57:34 +000014// *********************************** NOTE ***********************************
15// ** For POWER8 Little Endian, the VSX swap optimization relies on knowing **
16// ** which VMX and VSX instructions are lane-sensitive and which are not. **
17// ** A lane-sensitive instruction relies, implicitly or explicitly, on **
18// ** whether lanes are numbered from left to right. An instruction like **
19// ** VADDFP is not lane-sensitive, because each lane of the result vector **
20// ** relies only on the corresponding lane of the source vectors. However, **
21// ** an instruction like VMULESB is lane-sensitive, because "even" and **
22// ** "odd" lanes are different for big-endian and little-endian numbering. **
23// ** **
24// ** When adding new VMX and VSX instructions, please consider whether they **
25// ** are lane-sensitive. If so, they must be added to a switch statement **
26// ** in PPCVSXSwapRemoval::gatherVectorInstructions(). **
27// ****************************************************************************
28
Hal Finkel27774d92014-03-13 07:58:58 +000029def PPCRegVSRCAsmOperand : AsmOperandClass {
30 let Name = "RegVSRC"; let PredicateMethod = "isVSRegNumber";
31}
32def vsrc : RegisterOperand<VSRC> {
33 let ParserMatchClass = PPCRegVSRCAsmOperand;
34}
35
Hal Finkel19be5062014-03-29 05:29:01 +000036def PPCRegVSFRCAsmOperand : AsmOperandClass {
37 let Name = "RegVSFRC"; let PredicateMethod = "isVSRegNumber";
38}
39def vsfrc : RegisterOperand<VSFRC> {
40 let ParserMatchClass = PPCRegVSFRCAsmOperand;
41}
42
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +000043def PPCRegVSSRCAsmOperand : AsmOperandClass {
44 let Name = "RegVSSRC"; let PredicateMethod = "isVSRegNumber";
45}
46def vssrc : RegisterOperand<VSSRC> {
47 let ParserMatchClass = PPCRegVSSRCAsmOperand;
48}
49
Bill Schmidtfae5d712014-12-09 16:35:51 +000050// Little-endian-specific nodes.
51def SDT_PPClxvd2x : SDTypeProfile<1, 1, [
52 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
53]>;
54def SDT_PPCstxvd2x : SDTypeProfile<0, 2, [
55 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
56]>;
57def SDT_PPCxxswapd : SDTypeProfile<1, 1, [
58 SDTCisSameAs<0, 1>
59]>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000060def SDTVecConv : SDTypeProfile<1, 2, [
61 SDTCisVec<0>, SDTCisVec<1>, SDTCisPtrTy<2>
62]>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000063
64def PPClxvd2x : SDNode<"PPCISD::LXVD2X", SDT_PPClxvd2x,
65 [SDNPHasChain, SDNPMayLoad]>;
66def PPCstxvd2x : SDNode<"PPCISD::STXVD2X", SDT_PPCstxvd2x,
67 [SDNPHasChain, SDNPMayStore]>;
68def PPCxxswapd : SDNode<"PPCISD::XXSWAPD", SDT_PPCxxswapd, [SDNPHasChain]>;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +000069def PPCmfvsr : SDNode<"PPCISD::MFVSR", SDTUnaryOp, []>;
70def PPCmtvsra : SDNode<"PPCISD::MTVSRA", SDTUnaryOp, []>;
71def PPCmtvsrz : SDNode<"PPCISD::MTVSRZ", SDTUnaryOp, []>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000072def PPCsvec2fp : SDNode<"PPCISD::SINT_VEC_TO_FP", SDTVecConv, []>;
73def PPCuvec2fp: SDNode<"PPCISD::UINT_VEC_TO_FP", SDTVecConv, []>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +000074def PPCswapNoChain : SDNode<"PPCISD::SWAP_NO_CHAIN", SDT_PPCxxswapd>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000075
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000076multiclass XX3Form_Rcr<bits<6> opcode, bits<7> xo, string asmbase,
77 string asmstr, InstrItinClass itin, Intrinsic Int,
78 ValueType OutTy, ValueType InTy> {
Hal Finkel27774d92014-03-13 07:58:58 +000079 let BaseName = asmbase in {
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000080 def NAME : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000081 !strconcat(asmbase, !strconcat(" ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000082 [(set OutTy:$XT, (Int InTy:$XA, InTy:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +000083 let Defs = [CR6] in
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000084 def o : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000085 !strconcat(asmbase, !strconcat(". ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000086 [(set InTy:$XT,
87 (InTy (PPCvcmp_o InTy:$XA, InTy:$XB, xo)))]>,
88 isDOT;
Hal Finkel27774d92014-03-13 07:58:58 +000089 }
90}
91
Nemanja Ivanovic11049f82016-10-04 06:59:23 +000092// Instruction form with a single input register for instructions such as
93// XXPERMDI. The reason for defining this is that specifying multiple chained
94// operands (such as loads) to an instruction will perform both chained
95// operations rather than coalescing them into a single register - even though
96// the source memory location is the same. This simply forces the instruction
97// to use the same register for both inputs.
98// For example, an output DAG such as this:
99// (XXPERMDI (LXSIBZX xoaddr:$src), (LXSIBZX xoaddr:$src ), 0))
100// would result in two load instructions emitted and used as separate inputs
101// to the XXPERMDI instruction.
102class XX3Form_2s<bits<6> opcode, bits<5> xo, dag OOL, dag IOL, string asmstr,
103 InstrItinClass itin, list<dag> pattern>
104 : XX3Form_2<opcode, xo, OOL, IOL, asmstr, itin, pattern> {
105 let XB = XA;
106}
107
Eric Christopher1b8e7632014-05-22 01:07:24 +0000108def HasVSX : Predicate<"PPCSubTarget->hasVSX()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000109def IsLittleEndian : Predicate<"PPCSubTarget->isLittleEndian()">;
110def IsBigEndian : Predicate<"!PPCSubTarget->isLittleEndian()">;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000111def HasOnlySwappingMemOps : Predicate<"!PPCSubTarget->hasP9Vector()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000112
Hal Finkel27774d92014-03-13 07:58:58 +0000113let Predicates = [HasVSX] in {
114let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000115let UseVSXReg = 1 in {
Craig Topperc50d64b2014-11-26 00:46:26 +0000116let hasSideEffects = 0 in { // VSX instructions don't have side effects.
Hal Finkel27774d92014-03-13 07:58:58 +0000117let Uses = [RM] in {
118
119 // Load indexed instructions
Hal Finkel6a778fb2015-03-11 23:28:38 +0000120 let mayLoad = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000121 let CodeSize = 3 in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000122 def LXSDX : XX1Form<31, 588,
Hal Finkel19be5062014-03-29 05:29:01 +0000123 (outs vsfrc:$XT), (ins memrr:$src),
Hal Finkel27774d92014-03-13 07:58:58 +0000124 "lxsdx $XT, $src", IIC_LdStLFD,
125 [(set f64:$XT, (load xoaddr:$src))]>;
126
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000127 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000128 def LXVD2X : XX1Form<31, 844,
Hal Finkel27774d92014-03-13 07:58:58 +0000129 (outs vsrc:$XT), (ins memrr:$src),
130 "lxvd2x $XT, $src", IIC_LdStLFD,
Bill Schmidt72954782014-11-12 04:19:40 +0000131 [(set v2f64:$XT, (int_ppc_vsx_lxvd2x xoaddr:$src))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000132
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000133 def LXVDSX : XX1Form<31, 332,
Hal Finkel27774d92014-03-13 07:58:58 +0000134 (outs vsrc:$XT), (ins memrr:$src),
135 "lxvdsx $XT, $src", IIC_LdStLFD, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000136
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000137 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Bill Schmidtcb34fd02014-10-09 17:51:35 +0000138 def LXVW4X : XX1Form<31, 780,
Hal Finkel27774d92014-03-13 07:58:58 +0000139 (outs vsrc:$XT), (ins memrr:$src),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000140 "lxvw4x $XT, $src", IIC_LdStLFD,
Nemanja Ivanovicf57f1502016-11-29 23:00:33 +0000141 [(set v4i32:$XT, (int_ppc_vsx_lxvw4x xoaddr:$src))]>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000142 } // mayLoad
Hal Finkel27774d92014-03-13 07:58:58 +0000143
144 // Store indexed instructions
145 let mayStore = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000146 let CodeSize = 3 in
Hal Finkel27774d92014-03-13 07:58:58 +0000147 def STXSDX : XX1Form<31, 716,
Hal Finkel19be5062014-03-29 05:29:01 +0000148 (outs), (ins vsfrc:$XT, memrr:$dst),
Hal Finkel27774d92014-03-13 07:58:58 +0000149 "stxsdx $XT, $dst", IIC_LdStSTFD,
150 [(store f64:$XT, xoaddr:$dst)]>;
151
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000152 let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000153 // The behaviour of this instruction is endianness-specific so we provide no
154 // pattern to match it without considering endianness.
Hal Finkel27774d92014-03-13 07:58:58 +0000155 def STXVD2X : XX1Form<31, 972,
156 (outs), (ins vsrc:$XT, memrr:$dst),
157 "stxvd2x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000158 []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000159
160 def STXVW4X : XX1Form<31, 908,
161 (outs), (ins vsrc:$XT, memrr:$dst),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000162 "stxvw4x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovicf57f1502016-11-29 23:00:33 +0000163 [(store v4i32:$XT, xoaddr:$dst)]>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000164 }
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000165 } // mayStore
Hal Finkel27774d92014-03-13 07:58:58 +0000166
167 // Add/Mul Instructions
168 let isCommutable = 1 in {
169 def XSADDDP : XX3Form<60, 32,
Hal Finkel19be5062014-03-29 05:29:01 +0000170 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000171 "xsadddp $XT, $XA, $XB", IIC_VecFP,
172 [(set f64:$XT, (fadd f64:$XA, f64:$XB))]>;
173 def XSMULDP : XX3Form<60, 48,
Hal Finkel19be5062014-03-29 05:29:01 +0000174 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000175 "xsmuldp $XT, $XA, $XB", IIC_VecFP,
176 [(set f64:$XT, (fmul f64:$XA, f64:$XB))]>;
177
178 def XVADDDP : XX3Form<60, 96,
179 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
180 "xvadddp $XT, $XA, $XB", IIC_VecFP,
181 [(set v2f64:$XT, (fadd v2f64:$XA, v2f64:$XB))]>;
182
183 def XVADDSP : XX3Form<60, 64,
184 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
185 "xvaddsp $XT, $XA, $XB", IIC_VecFP,
186 [(set v4f32:$XT, (fadd v4f32:$XA, v4f32:$XB))]>;
187
188 def XVMULDP : XX3Form<60, 112,
189 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
190 "xvmuldp $XT, $XA, $XB", IIC_VecFP,
191 [(set v2f64:$XT, (fmul v2f64:$XA, v2f64:$XB))]>;
192
193 def XVMULSP : XX3Form<60, 80,
194 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
195 "xvmulsp $XT, $XA, $XB", IIC_VecFP,
196 [(set v4f32:$XT, (fmul v4f32:$XA, v4f32:$XB))]>;
197 }
198
199 // Subtract Instructions
200 def XSSUBDP : XX3Form<60, 40,
Hal Finkel19be5062014-03-29 05:29:01 +0000201 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000202 "xssubdp $XT, $XA, $XB", IIC_VecFP,
203 [(set f64:$XT, (fsub f64:$XA, f64:$XB))]>;
204
205 def XVSUBDP : XX3Form<60, 104,
206 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
207 "xvsubdp $XT, $XA, $XB", IIC_VecFP,
208 [(set v2f64:$XT, (fsub v2f64:$XA, v2f64:$XB))]>;
209 def XVSUBSP : XX3Form<60, 72,
210 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
211 "xvsubsp $XT, $XA, $XB", IIC_VecFP,
212 [(set v4f32:$XT, (fsub v4f32:$XA, v4f32:$XB))]>;
213
214 // FMA Instructions
Hal Finkel25e04542014-03-25 18:55:11 +0000215 let BaseName = "XSMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000216 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000217 def XSMADDADP : XX3Form<60, 33,
Hal Finkel19be5062014-03-29 05:29:01 +0000218 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000219 "xsmaddadp $XT, $XA, $XB", IIC_VecFP,
220 [(set f64:$XT, (fma f64:$XA, f64:$XB, f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000221 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
222 AltVSXFMARel;
223 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000224 def XSMADDMDP : XX3Form<60, 41,
Hal Finkel19be5062014-03-29 05:29:01 +0000225 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000226 "xsmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000227 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
228 AltVSXFMARel;
229 }
Hal Finkel27774d92014-03-13 07:58:58 +0000230
Hal Finkel25e04542014-03-25 18:55:11 +0000231 let BaseName = "XSMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000232 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000233 def XSMSUBADP : XX3Form<60, 49,
Hal Finkel19be5062014-03-29 05:29:01 +0000234 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000235 "xsmsubadp $XT, $XA, $XB", IIC_VecFP,
236 [(set f64:$XT, (fma f64:$XA, f64:$XB, (fneg f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000237 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
238 AltVSXFMARel;
239 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000240 def XSMSUBMDP : XX3Form<60, 57,
Hal Finkel19be5062014-03-29 05:29:01 +0000241 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000242 "xsmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000243 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
244 AltVSXFMARel;
245 }
Hal Finkel27774d92014-03-13 07:58:58 +0000246
Hal Finkel25e04542014-03-25 18:55:11 +0000247 let BaseName = "XSNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000248 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000249 def XSNMADDADP : XX3Form<60, 161,
Hal Finkel19be5062014-03-29 05:29:01 +0000250 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000251 "xsnmaddadp $XT, $XA, $XB", IIC_VecFP,
252 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000253 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
254 AltVSXFMARel;
255 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000256 def XSNMADDMDP : XX3Form<60, 169,
Hal Finkel19be5062014-03-29 05:29:01 +0000257 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000258 "xsnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000259 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
260 AltVSXFMARel;
261 }
Hal Finkel27774d92014-03-13 07:58:58 +0000262
Hal Finkel25e04542014-03-25 18:55:11 +0000263 let BaseName = "XSNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000264 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000265 def XSNMSUBADP : XX3Form<60, 177,
Hal Finkel19be5062014-03-29 05:29:01 +0000266 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000267 "xsnmsubadp $XT, $XA, $XB", IIC_VecFP,
268 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, (fneg f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000269 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
270 AltVSXFMARel;
271 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000272 def XSNMSUBMDP : XX3Form<60, 185,
Hal Finkel19be5062014-03-29 05:29:01 +0000273 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000274 "xsnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000275 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
276 AltVSXFMARel;
277 }
Hal Finkel27774d92014-03-13 07:58:58 +0000278
Hal Finkel25e04542014-03-25 18:55:11 +0000279 let BaseName = "XVMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000280 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000281 def XVMADDADP : XX3Form<60, 97,
282 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
283 "xvmaddadp $XT, $XA, $XB", IIC_VecFP,
284 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000285 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
286 AltVSXFMARel;
287 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000288 def XVMADDMDP : XX3Form<60, 105,
289 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
290 "xvmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000291 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
292 AltVSXFMARel;
293 }
Hal Finkel27774d92014-03-13 07:58:58 +0000294
Hal Finkel25e04542014-03-25 18:55:11 +0000295 let BaseName = "XVMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000296 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000297 def XVMADDASP : XX3Form<60, 65,
298 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
299 "xvmaddasp $XT, $XA, $XB", IIC_VecFP,
300 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000301 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
302 AltVSXFMARel;
303 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000304 def XVMADDMSP : XX3Form<60, 73,
305 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
306 "xvmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000307 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
308 AltVSXFMARel;
309 }
Hal Finkel27774d92014-03-13 07:58:58 +0000310
Hal Finkel25e04542014-03-25 18:55:11 +0000311 let BaseName = "XVMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000312 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000313 def XVMSUBADP : XX3Form<60, 113,
314 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
315 "xvmsubadp $XT, $XA, $XB", IIC_VecFP,
316 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000317 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
318 AltVSXFMARel;
319 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000320 def XVMSUBMDP : XX3Form<60, 121,
321 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
322 "xvmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000323 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
324 AltVSXFMARel;
325 }
Hal Finkel27774d92014-03-13 07:58:58 +0000326
Hal Finkel25e04542014-03-25 18:55:11 +0000327 let BaseName = "XVMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000328 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000329 def XVMSUBASP : XX3Form<60, 81,
330 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
331 "xvmsubasp $XT, $XA, $XB", IIC_VecFP,
332 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000333 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
334 AltVSXFMARel;
335 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000336 def XVMSUBMSP : XX3Form<60, 89,
337 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
338 "xvmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000339 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
340 AltVSXFMARel;
341 }
Hal Finkel27774d92014-03-13 07:58:58 +0000342
Hal Finkel25e04542014-03-25 18:55:11 +0000343 let BaseName = "XVNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000344 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000345 def XVNMADDADP : XX3Form<60, 225,
346 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
347 "xvnmaddadp $XT, $XA, $XB", IIC_VecFP,
348 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000349 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
350 AltVSXFMARel;
351 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000352 def XVNMADDMDP : XX3Form<60, 233,
353 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
354 "xvnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000355 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
356 AltVSXFMARel;
357 }
Hal Finkel27774d92014-03-13 07:58:58 +0000358
Hal Finkel25e04542014-03-25 18:55:11 +0000359 let BaseName = "XVNMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000360 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000361 def XVNMADDASP : XX3Form<60, 193,
362 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
363 "xvnmaddasp $XT, $XA, $XB", IIC_VecFP,
364 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000365 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
366 AltVSXFMARel;
367 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000368 def XVNMADDMSP : XX3Form<60, 201,
369 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
370 "xvnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000371 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
372 AltVSXFMARel;
373 }
Hal Finkel27774d92014-03-13 07:58:58 +0000374
Hal Finkel25e04542014-03-25 18:55:11 +0000375 let BaseName = "XVNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000376 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000377 def XVNMSUBADP : XX3Form<60, 241,
378 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
379 "xvnmsubadp $XT, $XA, $XB", IIC_VecFP,
380 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000381 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
382 AltVSXFMARel;
383 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000384 def XVNMSUBMDP : XX3Form<60, 249,
385 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
386 "xvnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000387 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
388 AltVSXFMARel;
389 }
Hal Finkel27774d92014-03-13 07:58:58 +0000390
Hal Finkel25e04542014-03-25 18:55:11 +0000391 let BaseName = "XVNMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000392 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000393 def XVNMSUBASP : XX3Form<60, 209,
394 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
395 "xvnmsubasp $XT, $XA, $XB", IIC_VecFP,
396 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000397 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
398 AltVSXFMARel;
399 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000400 def XVNMSUBMSP : XX3Form<60, 217,
401 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
402 "xvnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000403 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
404 AltVSXFMARel;
405 }
Hal Finkel27774d92014-03-13 07:58:58 +0000406
407 // Division Instructions
408 def XSDIVDP : XX3Form<60, 56,
Hal Finkel19be5062014-03-29 05:29:01 +0000409 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000410 "xsdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000411 [(set f64:$XT, (fdiv f64:$XA, f64:$XB))]>;
412 def XSSQRTDP : XX2Form<60, 75,
Hal Finkel19be5062014-03-29 05:29:01 +0000413 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000414 "xssqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000415 [(set f64:$XT, (fsqrt f64:$XB))]>;
416
417 def XSREDP : XX2Form<60, 90,
Hal Finkel19be5062014-03-29 05:29:01 +0000418 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000419 "xsredp $XT, $XB", IIC_VecFP,
420 [(set f64:$XT, (PPCfre f64:$XB))]>;
421 def XSRSQRTEDP : XX2Form<60, 74,
Hal Finkel19be5062014-03-29 05:29:01 +0000422 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000423 "xsrsqrtedp $XT, $XB", IIC_VecFP,
424 [(set f64:$XT, (PPCfrsqrte f64:$XB))]>;
425
426 def XSTDIVDP : XX3Form_1<60, 61,
Hal Finkel19be5062014-03-29 05:29:01 +0000427 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000428 "xstdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000429 def XSTSQRTDP : XX2Form_1<60, 106,
Hal Finkel19be5062014-03-29 05:29:01 +0000430 (outs crrc:$crD), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000431 "xstsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000432
433 def XVDIVDP : XX3Form<60, 120,
434 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000435 "xvdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000436 [(set v2f64:$XT, (fdiv v2f64:$XA, v2f64:$XB))]>;
437 def XVDIVSP : XX3Form<60, 88,
438 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000439 "xvdivsp $XT, $XA, $XB", IIC_FPDivS,
Hal Finkel27774d92014-03-13 07:58:58 +0000440 [(set v4f32:$XT, (fdiv v4f32:$XA, v4f32:$XB))]>;
441
442 def XVSQRTDP : XX2Form<60, 203,
443 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000444 "xvsqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000445 [(set v2f64:$XT, (fsqrt v2f64:$XB))]>;
446 def XVSQRTSP : XX2Form<60, 139,
447 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000448 "xvsqrtsp $XT, $XB", IIC_FPSqrtS,
Hal Finkel27774d92014-03-13 07:58:58 +0000449 [(set v4f32:$XT, (fsqrt v4f32:$XB))]>;
450
451 def XVTDIVDP : XX3Form_1<60, 125,
452 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000453 "xvtdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000454 def XVTDIVSP : XX3Form_1<60, 93,
455 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000456 "xvtdivsp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000457
458 def XVTSQRTDP : XX2Form_1<60, 234,
459 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000460 "xvtsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000461 def XVTSQRTSP : XX2Form_1<60, 170,
462 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000463 "xvtsqrtsp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000464
465 def XVREDP : XX2Form<60, 218,
466 (outs vsrc:$XT), (ins vsrc:$XB),
467 "xvredp $XT, $XB", IIC_VecFP,
468 [(set v2f64:$XT, (PPCfre v2f64:$XB))]>;
469 def XVRESP : XX2Form<60, 154,
470 (outs vsrc:$XT), (ins vsrc:$XB),
471 "xvresp $XT, $XB", IIC_VecFP,
472 [(set v4f32:$XT, (PPCfre v4f32:$XB))]>;
473
474 def XVRSQRTEDP : XX2Form<60, 202,
475 (outs vsrc:$XT), (ins vsrc:$XB),
476 "xvrsqrtedp $XT, $XB", IIC_VecFP,
477 [(set v2f64:$XT, (PPCfrsqrte v2f64:$XB))]>;
478 def XVRSQRTESP : XX2Form<60, 138,
479 (outs vsrc:$XT), (ins vsrc:$XB),
480 "xvrsqrtesp $XT, $XB", IIC_VecFP,
481 [(set v4f32:$XT, (PPCfrsqrte v4f32:$XB))]>;
482
483 // Compare Instructions
484 def XSCMPODP : XX3Form_1<60, 43,
Hal Finkel19be5062014-03-29 05:29:01 +0000485 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000486 "xscmpodp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000487 def XSCMPUDP : XX3Form_1<60, 35,
Hal Finkel19be5062014-03-29 05:29:01 +0000488 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000489 "xscmpudp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000490
491 defm XVCMPEQDP : XX3Form_Rcr<60, 99,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000492 "xvcmpeqdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000493 int_ppc_vsx_xvcmpeqdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000494 defm XVCMPEQSP : XX3Form_Rcr<60, 67,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000495 "xvcmpeqsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000496 int_ppc_vsx_xvcmpeqsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000497 defm XVCMPGEDP : XX3Form_Rcr<60, 115,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000498 "xvcmpgedp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000499 int_ppc_vsx_xvcmpgedp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000500 defm XVCMPGESP : XX3Form_Rcr<60, 83,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000501 "xvcmpgesp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000502 int_ppc_vsx_xvcmpgesp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000503 defm XVCMPGTDP : XX3Form_Rcr<60, 107,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000504 "xvcmpgtdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000505 int_ppc_vsx_xvcmpgtdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000506 defm XVCMPGTSP : XX3Form_Rcr<60, 75,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000507 "xvcmpgtsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000508 int_ppc_vsx_xvcmpgtsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000509
510 // Move Instructions
511 def XSABSDP : XX2Form<60, 345,
Hal Finkel19be5062014-03-29 05:29:01 +0000512 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000513 "xsabsdp $XT, $XB", IIC_VecFP,
514 [(set f64:$XT, (fabs f64:$XB))]>;
515 def XSNABSDP : XX2Form<60, 361,
Hal Finkel19be5062014-03-29 05:29:01 +0000516 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000517 "xsnabsdp $XT, $XB", IIC_VecFP,
518 [(set f64:$XT, (fneg (fabs f64:$XB)))]>;
519 def XSNEGDP : XX2Form<60, 377,
Hal Finkel19be5062014-03-29 05:29:01 +0000520 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000521 "xsnegdp $XT, $XB", IIC_VecFP,
522 [(set f64:$XT, (fneg f64:$XB))]>;
523 def XSCPSGNDP : XX3Form<60, 176,
Hal Finkel19be5062014-03-29 05:29:01 +0000524 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000525 "xscpsgndp $XT, $XA, $XB", IIC_VecFP,
526 [(set f64:$XT, (fcopysign f64:$XB, f64:$XA))]>;
527
528 def XVABSDP : XX2Form<60, 473,
529 (outs vsrc:$XT), (ins vsrc:$XB),
530 "xvabsdp $XT, $XB", IIC_VecFP,
531 [(set v2f64:$XT, (fabs v2f64:$XB))]>;
532
533 def XVABSSP : XX2Form<60, 409,
534 (outs vsrc:$XT), (ins vsrc:$XB),
535 "xvabssp $XT, $XB", IIC_VecFP,
536 [(set v4f32:$XT, (fabs v4f32:$XB))]>;
537
538 def XVCPSGNDP : XX3Form<60, 240,
539 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
540 "xvcpsgndp $XT, $XA, $XB", IIC_VecFP,
541 [(set v2f64:$XT, (fcopysign v2f64:$XB, v2f64:$XA))]>;
542 def XVCPSGNSP : XX3Form<60, 208,
543 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
544 "xvcpsgnsp $XT, $XA, $XB", IIC_VecFP,
545 [(set v4f32:$XT, (fcopysign v4f32:$XB, v4f32:$XA))]>;
546
547 def XVNABSDP : XX2Form<60, 489,
548 (outs vsrc:$XT), (ins vsrc:$XB),
549 "xvnabsdp $XT, $XB", IIC_VecFP,
550 [(set v2f64:$XT, (fneg (fabs v2f64:$XB)))]>;
551 def XVNABSSP : XX2Form<60, 425,
552 (outs vsrc:$XT), (ins vsrc:$XB),
553 "xvnabssp $XT, $XB", IIC_VecFP,
554 [(set v4f32:$XT, (fneg (fabs v4f32:$XB)))]>;
555
556 def XVNEGDP : XX2Form<60, 505,
557 (outs vsrc:$XT), (ins vsrc:$XB),
558 "xvnegdp $XT, $XB", IIC_VecFP,
559 [(set v2f64:$XT, (fneg v2f64:$XB))]>;
560 def XVNEGSP : XX2Form<60, 441,
561 (outs vsrc:$XT), (ins vsrc:$XB),
562 "xvnegsp $XT, $XB", IIC_VecFP,
563 [(set v4f32:$XT, (fneg v4f32:$XB))]>;
564
565 // Conversion Instructions
566 def XSCVDPSP : XX2Form<60, 265,
Hal Finkel19be5062014-03-29 05:29:01 +0000567 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000568 "xscvdpsp $XT, $XB", IIC_VecFP, []>;
569 def XSCVDPSXDS : XX2Form<60, 344,
Hal Finkel19be5062014-03-29 05:29:01 +0000570 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000571 "xscvdpsxds $XT, $XB", IIC_VecFP,
572 [(set f64:$XT, (PPCfctidz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000573 let isCodeGenOnly = 1 in
574 def XSCVDPSXDSs : XX2Form<60, 344,
575 (outs vssrc:$XT), (ins vssrc:$XB),
576 "xscvdpsxds $XT, $XB", IIC_VecFP,
577 [(set f32:$XT, (PPCfctidz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000578 def XSCVDPSXWS : XX2Form<60, 88,
Hal Finkel19be5062014-03-29 05:29:01 +0000579 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000580 "xscvdpsxws $XT, $XB", IIC_VecFP,
581 [(set f64:$XT, (PPCfctiwz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000582 let isCodeGenOnly = 1 in
583 def XSCVDPSXWSs : XX2Form<60, 88,
584 (outs vssrc:$XT), (ins vssrc:$XB),
585 "xscvdpsxws $XT, $XB", IIC_VecFP,
586 [(set f32:$XT, (PPCfctiwz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000587 def XSCVDPUXDS : XX2Form<60, 328,
Hal Finkel19be5062014-03-29 05:29:01 +0000588 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000589 "xscvdpuxds $XT, $XB", IIC_VecFP,
590 [(set f64:$XT, (PPCfctiduz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000591 let isCodeGenOnly = 1 in
592 def XSCVDPUXDSs : XX2Form<60, 328,
593 (outs vssrc:$XT), (ins vssrc:$XB),
594 "xscvdpuxds $XT, $XB", IIC_VecFP,
595 [(set f32:$XT, (PPCfctiduz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000596 def XSCVDPUXWS : XX2Form<60, 72,
Hal Finkel19be5062014-03-29 05:29:01 +0000597 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000598 "xscvdpuxws $XT, $XB", IIC_VecFP,
599 [(set f64:$XT, (PPCfctiwuz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000600 let isCodeGenOnly = 1 in
601 def XSCVDPUXWSs : XX2Form<60, 72,
602 (outs vssrc:$XT), (ins vssrc:$XB),
603 "xscvdpuxws $XT, $XB", IIC_VecFP,
604 [(set f32:$XT, (PPCfctiwuz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000605 def XSCVSPDP : XX2Form<60, 329,
Hal Finkel19be5062014-03-29 05:29:01 +0000606 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000607 "xscvspdp $XT, $XB", IIC_VecFP, []>;
608 def XSCVSXDDP : XX2Form<60, 376,
Hal Finkel19be5062014-03-29 05:29:01 +0000609 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000610 "xscvsxddp $XT, $XB", IIC_VecFP,
611 [(set f64:$XT, (PPCfcfid f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000612 def XSCVUXDDP : XX2Form<60, 360,
Hal Finkel19be5062014-03-29 05:29:01 +0000613 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000614 "xscvuxddp $XT, $XB", IIC_VecFP,
615 [(set f64:$XT, (PPCfcfidu f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000616
617 def XVCVDPSP : XX2Form<60, 393,
618 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000619 "xvcvdpsp $XT, $XB", IIC_VecFP,
620 [(set v4f32:$XT, (int_ppc_vsx_xvcvdpsp v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000621 def XVCVDPSXDS : XX2Form<60, 472,
622 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000623 "xvcvdpsxds $XT, $XB", IIC_VecFP,
624 [(set v2i64:$XT, (fp_to_sint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000625 def XVCVDPSXWS : XX2Form<60, 216,
626 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000627 "xvcvdpsxws $XT, $XB", IIC_VecFP,
628 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpsxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000629 def XVCVDPUXDS : XX2Form<60, 456,
630 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000631 "xvcvdpuxds $XT, $XB", IIC_VecFP,
632 [(set v2i64:$XT, (fp_to_uint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000633 def XVCVDPUXWS : XX2Form<60, 200,
634 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000635 "xvcvdpuxws $XT, $XB", IIC_VecFP,
636 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpuxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000637
638 def XVCVSPDP : XX2Form<60, 457,
639 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000640 "xvcvspdp $XT, $XB", IIC_VecFP,
641 [(set v2f64:$XT, (int_ppc_vsx_xvcvspdp v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000642 def XVCVSPSXDS : XX2Form<60, 408,
643 (outs vsrc:$XT), (ins vsrc:$XB),
644 "xvcvspsxds $XT, $XB", IIC_VecFP, []>;
645 def XVCVSPSXWS : XX2Form<60, 152,
646 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000647 "xvcvspsxws $XT, $XB", IIC_VecFP,
648 [(set v4i32:$XT, (fp_to_sint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000649 def XVCVSPUXDS : XX2Form<60, 392,
650 (outs vsrc:$XT), (ins vsrc:$XB),
651 "xvcvspuxds $XT, $XB", IIC_VecFP, []>;
652 def XVCVSPUXWS : XX2Form<60, 136,
653 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000654 "xvcvspuxws $XT, $XB", IIC_VecFP,
655 [(set v4i32:$XT, (fp_to_uint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000656 def XVCVSXDDP : XX2Form<60, 504,
657 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000658 "xvcvsxddp $XT, $XB", IIC_VecFP,
659 [(set v2f64:$XT, (sint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000660 def XVCVSXDSP : XX2Form<60, 440,
661 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000662 "xvcvsxdsp $XT, $XB", IIC_VecFP,
663 [(set v4f32:$XT, (int_ppc_vsx_xvcvsxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000664 def XVCVSXWDP : XX2Form<60, 248,
665 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000666 "xvcvsxwdp $XT, $XB", IIC_VecFP,
667 [(set v2f64:$XT, (int_ppc_vsx_xvcvsxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000668 def XVCVSXWSP : XX2Form<60, 184,
669 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic44513e52016-07-05 09:22:29 +0000670 "xvcvsxwsp $XT, $XB", IIC_VecFP,
671 [(set v4f32:$XT, (sint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000672 def XVCVUXDDP : XX2Form<60, 488,
673 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000674 "xvcvuxddp $XT, $XB", IIC_VecFP,
675 [(set v2f64:$XT, (uint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000676 def XVCVUXDSP : XX2Form<60, 424,
677 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000678 "xvcvuxdsp $XT, $XB", IIC_VecFP,
679 [(set v4f32:$XT, (int_ppc_vsx_xvcvuxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000680 def XVCVUXWDP : XX2Form<60, 232,
681 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000682 "xvcvuxwdp $XT, $XB", IIC_VecFP,
683 [(set v2f64:$XT, (int_ppc_vsx_xvcvuxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000684 def XVCVUXWSP : XX2Form<60, 168,
685 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000686 "xvcvuxwsp $XT, $XB", IIC_VecFP,
687 [(set v4f32:$XT, (uint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000688
689 // Rounding Instructions
690 def XSRDPI : XX2Form<60, 73,
Hal Finkel19be5062014-03-29 05:29:01 +0000691 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000692 "xsrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000693 [(set f64:$XT, (fround f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000694 def XSRDPIC : XX2Form<60, 107,
Hal Finkel19be5062014-03-29 05:29:01 +0000695 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000696 "xsrdpic $XT, $XB", IIC_VecFP,
697 [(set f64:$XT, (fnearbyint f64:$XB))]>;
698 def XSRDPIM : XX2Form<60, 121,
Hal Finkel19be5062014-03-29 05:29:01 +0000699 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000700 "xsrdpim $XT, $XB", IIC_VecFP,
701 [(set f64:$XT, (ffloor f64:$XB))]>;
702 def XSRDPIP : XX2Form<60, 105,
Hal Finkel19be5062014-03-29 05:29:01 +0000703 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000704 "xsrdpip $XT, $XB", IIC_VecFP,
705 [(set f64:$XT, (fceil f64:$XB))]>;
706 def XSRDPIZ : XX2Form<60, 89,
Hal Finkel19be5062014-03-29 05:29:01 +0000707 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000708 "xsrdpiz $XT, $XB", IIC_VecFP,
709 [(set f64:$XT, (ftrunc f64:$XB))]>;
710
711 def XVRDPI : XX2Form<60, 201,
712 (outs vsrc:$XT), (ins vsrc:$XB),
713 "xvrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000714 [(set v2f64:$XT, (fround v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000715 def XVRDPIC : XX2Form<60, 235,
716 (outs vsrc:$XT), (ins vsrc:$XB),
717 "xvrdpic $XT, $XB", IIC_VecFP,
718 [(set v2f64:$XT, (fnearbyint v2f64:$XB))]>;
719 def XVRDPIM : XX2Form<60, 249,
720 (outs vsrc:$XT), (ins vsrc:$XB),
721 "xvrdpim $XT, $XB", IIC_VecFP,
722 [(set v2f64:$XT, (ffloor v2f64:$XB))]>;
723 def XVRDPIP : XX2Form<60, 233,
724 (outs vsrc:$XT), (ins vsrc:$XB),
725 "xvrdpip $XT, $XB", IIC_VecFP,
726 [(set v2f64:$XT, (fceil v2f64:$XB))]>;
727 def XVRDPIZ : XX2Form<60, 217,
728 (outs vsrc:$XT), (ins vsrc:$XB),
729 "xvrdpiz $XT, $XB", IIC_VecFP,
730 [(set v2f64:$XT, (ftrunc v2f64:$XB))]>;
731
732 def XVRSPI : XX2Form<60, 137,
733 (outs vsrc:$XT), (ins vsrc:$XB),
734 "xvrspi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000735 [(set v4f32:$XT, (fround v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000736 def XVRSPIC : XX2Form<60, 171,
737 (outs vsrc:$XT), (ins vsrc:$XB),
738 "xvrspic $XT, $XB", IIC_VecFP,
739 [(set v4f32:$XT, (fnearbyint v4f32:$XB))]>;
740 def XVRSPIM : XX2Form<60, 185,
741 (outs vsrc:$XT), (ins vsrc:$XB),
742 "xvrspim $XT, $XB", IIC_VecFP,
743 [(set v4f32:$XT, (ffloor v4f32:$XB))]>;
744 def XVRSPIP : XX2Form<60, 169,
745 (outs vsrc:$XT), (ins vsrc:$XB),
746 "xvrspip $XT, $XB", IIC_VecFP,
747 [(set v4f32:$XT, (fceil v4f32:$XB))]>;
748 def XVRSPIZ : XX2Form<60, 153,
749 (outs vsrc:$XT), (ins vsrc:$XB),
750 "xvrspiz $XT, $XB", IIC_VecFP,
751 [(set v4f32:$XT, (ftrunc v4f32:$XB))]>;
752
753 // Max/Min Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000754 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000755 def XSMAXDP : XX3Form<60, 160,
Hal Finkel19be5062014-03-29 05:29:01 +0000756 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000757 "xsmaxdp $XT, $XA, $XB", IIC_VecFP,
758 [(set vsfrc:$XT,
759 (int_ppc_vsx_xsmaxdp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000760 def XSMINDP : XX3Form<60, 168,
Hal Finkel19be5062014-03-29 05:29:01 +0000761 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000762 "xsmindp $XT, $XA, $XB", IIC_VecFP,
763 [(set vsfrc:$XT,
764 (int_ppc_vsx_xsmindp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000765
766 def XVMAXDP : XX3Form<60, 224,
767 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000768 "xvmaxdp $XT, $XA, $XB", IIC_VecFP,
769 [(set vsrc:$XT,
770 (int_ppc_vsx_xvmaxdp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000771 def XVMINDP : XX3Form<60, 232,
772 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000773 "xvmindp $XT, $XA, $XB", IIC_VecFP,
774 [(set vsrc:$XT,
775 (int_ppc_vsx_xvmindp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000776
777 def XVMAXSP : XX3Form<60, 192,
778 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000779 "xvmaxsp $XT, $XA, $XB", IIC_VecFP,
780 [(set vsrc:$XT,
781 (int_ppc_vsx_xvmaxsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000782 def XVMINSP : XX3Form<60, 200,
783 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000784 "xvminsp $XT, $XA, $XB", IIC_VecFP,
785 [(set vsrc:$XT,
786 (int_ppc_vsx_xvminsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000787 } // isCommutable
Hal Finkel27774d92014-03-13 07:58:58 +0000788} // Uses = [RM]
789
790 // Logical Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000791 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000792 def XXLAND : XX3Form<60, 130,
793 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000794 "xxland $XT, $XA, $XB", IIC_VecGeneral,
795 [(set v4i32:$XT, (and v4i32:$XA, v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000796 def XXLANDC : XX3Form<60, 138,
797 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000798 "xxlandc $XT, $XA, $XB", IIC_VecGeneral,
799 [(set v4i32:$XT, (and v4i32:$XA,
800 (vnot_ppc v4i32:$XB)))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000801 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000802 def XXLNOR : XX3Form<60, 162,
803 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000804 "xxlnor $XT, $XA, $XB", IIC_VecGeneral,
805 [(set v4i32:$XT, (vnot_ppc (or v4i32:$XA,
806 v4i32:$XB)))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000807 def XXLOR : XX3Form<60, 146,
808 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000809 "xxlor $XT, $XA, $XB", IIC_VecGeneral,
810 [(set v4i32:$XT, (or v4i32:$XA, v4i32:$XB))]>;
Hal Finkel19be5062014-03-29 05:29:01 +0000811 let isCodeGenOnly = 1 in
812 def XXLORf: XX3Form<60, 146,
813 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
814 "xxlor $XT, $XA, $XB", IIC_VecGeneral, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000815 def XXLXOR : XX3Form<60, 154,
816 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000817 "xxlxor $XT, $XA, $XB", IIC_VecGeneral,
818 [(set v4i32:$XT, (xor v4i32:$XA, v4i32:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000819 } // isCommutable
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +0000820 let isCodeGenOnly = 1 in
821 def XXLXORz : XX3Form_Zero<60, 154, (outs vsrc:$XT), (ins),
822 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
823 [(set v4i32:$XT, (v4i32 immAllZerosV))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000824
Ehsan Amiric90b02c2016-10-24 17:31:09 +0000825 let isCodeGenOnly = 1 in {
826 def XXLXORdpz : XX3Form_SetZero<60, 154,
827 (outs vsfrc:$XT), (ins),
828 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
829 [(set f64:$XT, (fpimm0))]>;
830 def XXLXORspz : XX3Form_SetZero<60, 154,
831 (outs vssrc:$XT), (ins),
832 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
833 [(set f32:$XT, (fpimm0))]>;
834 }
835
Hal Finkel27774d92014-03-13 07:58:58 +0000836 // Permutation Instructions
837 def XXMRGHW : XX3Form<60, 18,
838 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
839 "xxmrghw $XT, $XA, $XB", IIC_VecPerm, []>;
840 def XXMRGLW : XX3Form<60, 50,
841 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
842 "xxmrglw $XT, $XA, $XB", IIC_VecPerm, []>;
843
844 def XXPERMDI : XX3Form_2<60, 10,
845 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$DM),
846 "xxpermdi $XT, $XA, $XB, $DM", IIC_VecPerm, []>;
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +0000847 let isCodeGenOnly = 1 in {
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000848 def XXPERMDIs : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vfrc:$XA, u2imm:$DM),
849 "xxpermdi $XT, $XA, $XA, $DM", IIC_VecPerm, []>;
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +0000850 let D = 0 in
851 def XXSPLTD0s : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vfrc:$XA),
852 "xxspltd $XT, $XA, 0", IIC_VecPerm, []>;
853 let D = 1 in
854 def XXSPLTD1s : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vfrc:$XA),
855 "xxspltd $XT, $XA, 1", IIC_VecPerm, []>;
856 let D = 2 in
857 def XXSWAPDs : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vfrc:$XA),
858 "xxswapd $XT, $XA", IIC_VecPerm, []>;
859 }
Hal Finkel27774d92014-03-13 07:58:58 +0000860 def XXSEL : XX4Form<60, 3,
861 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, vsrc:$XC),
862 "xxsel $XT, $XA, $XB, $XC", IIC_VecPerm, []>;
863
864 def XXSLDWI : XX3Form_2<60, 2,
865 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$SHW),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +0000866 "xxsldwi $XT, $XA, $XB, $SHW", IIC_VecPerm,
867 [(set v4i32:$XT, (PPCvecshl v4i32:$XA, v4i32:$XB,
868 imm32SExt16:$SHW))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000869 def XXSPLTW : XX2Form_2<60, 164,
870 (outs vsrc:$XT), (ins vsrc:$XB, u2imm:$UIM),
Nemanja Ivanovic1a2b2f02016-05-04 16:04:02 +0000871 "xxspltw $XT, $XB, $UIM", IIC_VecPerm,
872 [(set v4i32:$XT,
873 (PPCxxsplt v4i32:$XB, imm32SExt16:$UIM))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000874 let isCodeGenOnly = 1 in
875 def XXSPLTWs : XX2Form_2<60, 164,
876 (outs vsrc:$XT), (ins vfrc:$XB, u2imm:$UIM),
877 "xxspltw $XT, $XB, $UIM", IIC_VecPerm, []>;
Craig Topperc50d64b2014-11-26 00:46:26 +0000878} // hasSideEffects
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000879} // UseVSXReg = 1
Hal Finkel27774d92014-03-13 07:58:58 +0000880
Bill Schmidt61e65232014-10-22 13:13:40 +0000881// SELECT_CC_* - Used to implement the SELECT_CC DAG operation. Expanded after
882// instruction selection into a branch sequence.
883let usesCustomInserter = 1, // Expanded after instruction selection.
884 PPC970_Single = 1 in {
885
886 def SELECT_CC_VSRC: Pseudo<(outs vsrc:$dst),
887 (ins crrc:$cond, vsrc:$T, vsrc:$F, i32imm:$BROPC),
888 "#SELECT_CC_VSRC",
889 []>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000890 def SELECT_VSRC: Pseudo<(outs vsrc:$dst),
891 (ins crbitrc:$cond, vsrc:$T, vsrc:$F),
892 "#SELECT_VSRC",
Bill Schmidt61e65232014-10-22 13:13:40 +0000893 [(set v2f64:$dst,
894 (select i1:$cond, v2f64:$T, v2f64:$F))]>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000895 def SELECT_CC_VSFRC: Pseudo<(outs f8rc:$dst),
896 (ins crrc:$cond, f8rc:$T, f8rc:$F,
897 i32imm:$BROPC), "#SELECT_CC_VSFRC",
898 []>;
899 def SELECT_VSFRC: Pseudo<(outs f8rc:$dst),
900 (ins crbitrc:$cond, f8rc:$T, f8rc:$F),
901 "#SELECT_VSFRC",
902 [(set f64:$dst,
903 (select i1:$cond, f64:$T, f64:$F))]>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000904 def SELECT_CC_VSSRC: Pseudo<(outs f4rc:$dst),
905 (ins crrc:$cond, f4rc:$T, f4rc:$F,
906 i32imm:$BROPC), "#SELECT_CC_VSSRC",
907 []>;
908 def SELECT_VSSRC: Pseudo<(outs f4rc:$dst),
909 (ins crbitrc:$cond, f4rc:$T, f4rc:$F),
910 "#SELECT_VSSRC",
911 [(set f32:$dst,
912 (select i1:$cond, f32:$T, f32:$F))]>;
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000913} // usesCustomInserter
914} // AddedComplexity
Bill Schmidt61e65232014-10-22 13:13:40 +0000915
Hal Finkel27774d92014-03-13 07:58:58 +0000916def : InstAlias<"xvmovdp $XT, $XB",
917 (XVCPSGNDP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
918def : InstAlias<"xvmovsp $XT, $XB",
919 (XVCPSGNSP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
920
921def : InstAlias<"xxspltd $XT, $XB, 0",
922 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 0)>;
923def : InstAlias<"xxspltd $XT, $XB, 1",
924 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 3)>;
925def : InstAlias<"xxmrghd $XT, $XA, $XB",
926 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 0)>;
927def : InstAlias<"xxmrgld $XT, $XA, $XB",
928 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 3)>;
929def : InstAlias<"xxswapd $XT, $XB",
930 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 2)>;
931
932let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000933
Nemanja Ivanovic6f22b412016-09-27 08:42:12 +0000934def : Pat<(v4i32 (vnot_ppc v4i32:$A)),
935 (v4i32 (XXLNOR $A, $A))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000936let Predicates = [IsBigEndian] in {
Hal Finkel27774d92014-03-13 07:58:58 +0000937def : Pat<(v2f64 (scalar_to_vector f64:$A)),
Hal Finkel19be5062014-03-29 05:29:01 +0000938 (v2f64 (SUBREG_TO_REG (i64 1), $A, sub_64))>;
Hal Finkel27774d92014-03-13 07:58:58 +0000939
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000940def : Pat<(f64 (extractelt v2f64:$S, 0)),
Hal Finkel19be5062014-03-29 05:29:01 +0000941 (f64 (EXTRACT_SUBREG $S, sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000942def : Pat<(f64 (extractelt v2f64:$S, 1)),
Hal Finkel19be5062014-03-29 05:29:01 +0000943 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000944}
945
946let Predicates = [IsLittleEndian] in {
947def : Pat<(v2f64 (scalar_to_vector f64:$A)),
948 (v2f64 (XXPERMDI (SUBREG_TO_REG (i64 1), $A, sub_64),
949 (SUBREG_TO_REG (i64 1), $A, sub_64), 0))>;
950
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000951def : Pat<(f64 (extractelt v2f64:$S, 0)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000952 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000953def : Pat<(f64 (extractelt v2f64:$S, 1)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000954 (f64 (EXTRACT_SUBREG $S, sub_64))>;
955}
Hal Finkel27774d92014-03-13 07:58:58 +0000956
957// Additional fnmsub patterns: -a*c + b == -(a*c - b)
958def : Pat<(fma (fneg f64:$A), f64:$C, f64:$B),
959 (XSNMSUBADP $B, $C, $A)>;
960def : Pat<(fma f64:$A, (fneg f64:$C), f64:$B),
961 (XSNMSUBADP $B, $C, $A)>;
962
963def : Pat<(fma (fneg v2f64:$A), v2f64:$C, v2f64:$B),
964 (XVNMSUBADP $B, $C, $A)>;
965def : Pat<(fma v2f64:$A, (fneg v2f64:$C), v2f64:$B),
966 (XVNMSUBADP $B, $C, $A)>;
967
968def : Pat<(fma (fneg v4f32:$A), v4f32:$C, v4f32:$B),
969 (XVNMSUBASP $B, $C, $A)>;
970def : Pat<(fma v4f32:$A, (fneg v4f32:$C), v4f32:$B),
971 (XVNMSUBASP $B, $C, $A)>;
972
Hal Finkel9e0baa62014-04-01 19:24:27 +0000973def : Pat<(v2f64 (bitconvert v4f32:$A)),
974 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000975def : Pat<(v2f64 (bitconvert v4i32:$A)),
976 (COPY_TO_REGCLASS $A, VSRC)>;
977def : Pat<(v2f64 (bitconvert v8i16:$A)),
978 (COPY_TO_REGCLASS $A, VSRC)>;
979def : Pat<(v2f64 (bitconvert v16i8:$A)),
980 (COPY_TO_REGCLASS $A, VSRC)>;
981
Hal Finkel9e0baa62014-04-01 19:24:27 +0000982def : Pat<(v4f32 (bitconvert v2f64:$A)),
983 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000984def : Pat<(v4i32 (bitconvert v2f64:$A)),
985 (COPY_TO_REGCLASS $A, VRRC)>;
986def : Pat<(v8i16 (bitconvert v2f64:$A)),
987 (COPY_TO_REGCLASS $A, VRRC)>;
988def : Pat<(v16i8 (bitconvert v2f64:$A)),
989 (COPY_TO_REGCLASS $A, VRRC)>;
990
Hal Finkel9e0baa62014-04-01 19:24:27 +0000991def : Pat<(v2i64 (bitconvert v4f32:$A)),
992 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +0000993def : Pat<(v2i64 (bitconvert v4i32:$A)),
994 (COPY_TO_REGCLASS $A, VSRC)>;
995def : Pat<(v2i64 (bitconvert v8i16:$A)),
996 (COPY_TO_REGCLASS $A, VSRC)>;
997def : Pat<(v2i64 (bitconvert v16i8:$A)),
998 (COPY_TO_REGCLASS $A, VSRC)>;
999
Hal Finkel9e0baa62014-04-01 19:24:27 +00001000def : Pat<(v4f32 (bitconvert v2i64:$A)),
1001 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +00001002def : Pat<(v4i32 (bitconvert v2i64:$A)),
1003 (COPY_TO_REGCLASS $A, VRRC)>;
1004def : Pat<(v8i16 (bitconvert v2i64:$A)),
1005 (COPY_TO_REGCLASS $A, VRRC)>;
1006def : Pat<(v16i8 (bitconvert v2i64:$A)),
1007 (COPY_TO_REGCLASS $A, VRRC)>;
1008
Hal Finkel9281c9a2014-03-26 18:26:30 +00001009def : Pat<(v2f64 (bitconvert v2i64:$A)),
1010 (COPY_TO_REGCLASS $A, VRRC)>;
1011def : Pat<(v2i64 (bitconvert v2f64:$A)),
1012 (COPY_TO_REGCLASS $A, VRRC)>;
1013
Kit Bartond4eb73c2015-05-05 16:10:44 +00001014def : Pat<(v2f64 (bitconvert v1i128:$A)),
1015 (COPY_TO_REGCLASS $A, VRRC)>;
1016def : Pat<(v1i128 (bitconvert v2f64:$A)),
1017 (COPY_TO_REGCLASS $A, VRRC)>;
1018
Hal Finkel5c0d1452014-03-30 13:22:59 +00001019// sign extension patterns
1020// To extend "in place" from v2i32 to v2i64, we have input data like:
1021// | undef | i32 | undef | i32 |
1022// but xvcvsxwdp expects the input in big-Endian format:
1023// | i32 | undef | i32 | undef |
1024// so we need to shift everything to the left by one i32 (word) before
1025// the conversion.
1026def : Pat<(sext_inreg v2i64:$C, v2i32),
1027 (XVCVDPSXDS (XVCVSXWDP (XXSLDWI $C, $C, 1)))>;
1028def : Pat<(v2f64 (sint_to_fp (sext_inreg v2i64:$C, v2i32))),
1029 (XVCVSXWDP (XXSLDWI $C, $C, 1))>;
1030
Nemanja Ivanovic44513e52016-07-05 09:22:29 +00001031def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 0)),
1032 (v2f64 (XVCVSXWDP (v2i64 (XXMRGHW $C, $C))))>;
1033def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 1)),
1034 (v2f64 (XVCVSXWDP (v2i64 (XXMRGLW $C, $C))))>;
1035
1036def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 0)),
1037 (v2f64 (XVCVUXWDP (v2i64 (XXMRGHW $C, $C))))>;
1038def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 1)),
1039 (v2f64 (XVCVUXWDP (v2i64 (XXMRGLW $C, $C))))>;
1040
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001041// Loads.
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001042let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001043 def : Pat<(v2f64 (PPClxvd2x xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001044
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001045 // Stores.
1046 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
1047 (STXVD2X $rS, xoaddr:$dst)>;
Nemanja Ivanovicf57f1502016-11-29 23:00:33 +00001048 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
1049 (STXVW4X $rS, xoaddr:$dst)>;
Tony Jiang5f850cd2016-11-15 14:25:56 +00001050 def : Pat<(int_ppc_vsx_stxvd2x_be v2f64:$rS, xoaddr:$dst),
1051 (STXVD2X $rS, xoaddr:$dst)>;
1052 def : Pat<(int_ppc_vsx_stxvw4x_be v4i32:$rS, xoaddr:$dst),
1053 (STXVW4X $rS, xoaddr:$dst)>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001054 def : Pat<(PPCstxvd2x v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1055}
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001056let Predicates = [IsBigEndian, HasVSX, HasOnlySwappingMemOps] in {
1057 def : Pat<(v2f64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1058 def : Pat<(v2i64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1059 def : Pat<(v4i32 (load xoaddr:$src)), (LXVW4X xoaddr:$src)>;
1060 def : Pat<(store v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1061 def : Pat<(store v2i64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1062}
Bill Schmidtfae5d712014-12-09 16:35:51 +00001063
1064// Permutes.
1065def : Pat<(v2f64 (PPCxxswapd v2f64:$src)), (XXPERMDI $src, $src, 2)>;
1066def : Pat<(v2i64 (PPCxxswapd v2i64:$src)), (XXPERMDI $src, $src, 2)>;
1067def : Pat<(v4f32 (PPCxxswapd v4f32:$src)), (XXPERMDI $src, $src, 2)>;
1068def : Pat<(v4i32 (PPCxxswapd v4i32:$src)), (XXPERMDI $src, $src, 2)>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001069def : Pat<(v2f64 (PPCswapNoChain v2f64:$src)), (XXPERMDI $src, $src, 2)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001070
Bill Schmidt61e65232014-10-22 13:13:40 +00001071// Selects.
1072def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001073 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1074def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001075 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1076def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001077 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1078def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001079 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1080def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETEQ)),
1081 (SELECT_VSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1082def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001083 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1084def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001085 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1086def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001087 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1088def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001089 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1090def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETNE)),
1091 (SELECT_VSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1092
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001093def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001094 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1095def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001096 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1097def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001098 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1099def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001100 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1101def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETEQ)),
1102 (SELECT_VSFRC (CREQV $lhs, $rhs), $tval, $fval)>;
1103def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001104 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1105def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001106 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1107def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001108 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1109def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001110 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1111def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETNE)),
1112 (SELECT_VSFRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1113
Bill Schmidt76746922014-11-14 12:10:40 +00001114// Divides.
1115def : Pat<(int_ppc_vsx_xvdivsp v4f32:$A, v4f32:$B),
1116 (XVDIVSP $A, $B)>;
1117def : Pat<(int_ppc_vsx_xvdivdp v2f64:$A, v2f64:$B),
1118 (XVDIVDP $A, $B)>;
1119
Nemanja Ivanovic984a3612015-07-14 17:25:20 +00001120// Reciprocal estimate
1121def : Pat<(int_ppc_vsx_xvresp v4f32:$A),
1122 (XVRESP $A)>;
1123def : Pat<(int_ppc_vsx_xvredp v2f64:$A),
1124 (XVREDP $A)>;
1125
Nemanja Ivanovicd358b8f2015-07-05 06:03:51 +00001126// Recip. square root estimate
1127def : Pat<(int_ppc_vsx_xvrsqrtesp v4f32:$A),
1128 (XVRSQRTESP $A)>;
1129def : Pat<(int_ppc_vsx_xvrsqrtedp v2f64:$A),
1130 (XVRSQRTEDP $A)>;
1131
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001132let Predicates = [IsLittleEndian] in {
1133def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1134 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1135def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1136 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1137def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1138 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1139def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1140 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1141} // IsLittleEndian
1142
1143let Predicates = [IsBigEndian] in {
1144def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1145 (f64 (XSCVSXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1146def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1147 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1148def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1149 (f64 (XSCVUXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1150def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1151 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1152} // IsBigEndian
1153
Hal Finkel27774d92014-03-13 07:58:58 +00001154} // AddedComplexity
1155} // HasVSX
1156
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001157def ScalarLoads {
1158 dag Li8 = (i32 (extloadi8 xoaddr:$src));
1159 dag ZELi8 = (i32 (zextloadi8 xoaddr:$src));
1160 dag ZELi8i64 = (i64 (zextloadi8 xoaddr:$src));
1161 dag SELi8 = (i32 (sext_inreg (extloadi8 xoaddr:$src), i8));
1162 dag SELi8i64 = (i64 (sext_inreg (extloadi8 xoaddr:$src), i8));
1163
1164 dag Li16 = (i32 (extloadi16 xoaddr:$src));
1165 dag ZELi16 = (i32 (zextloadi16 xoaddr:$src));
1166 dag ZELi16i64 = (i64 (zextloadi16 xoaddr:$src));
1167 dag SELi16 = (i32 (sextloadi16 xoaddr:$src));
1168 dag SELi16i64 = (i64 (sextloadi16 xoaddr:$src));
1169
1170 dag Li32 = (i32 (load xoaddr:$src));
1171}
1172
Kit Barton298beb52015-02-18 16:21:46 +00001173// The following VSX instructions were introduced in Power ISA 2.07
1174/* FIXME: if the operands are v2i64, these patterns will not match.
1175 we should define new patterns or otherwise match the same patterns
1176 when the elements are larger than i32.
1177*/
1178def HasP8Vector : Predicate<"PPCSubTarget->hasP8Vector()">;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001179def HasDirectMove : Predicate<"PPCSubTarget->hasDirectMove()">;
Kit Barton298beb52015-02-18 16:21:46 +00001180let Predicates = [HasP8Vector] in {
1181let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001182 let isCommutable = 1, UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001183 def XXLEQV : XX3Form<60, 186,
1184 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1185 "xxleqv $XT, $XA, $XB", IIC_VecGeneral,
1186 [(set v4i32:$XT, (vnot_ppc (xor v4i32:$XA, v4i32:$XB)))]>;
1187 def XXLNAND : XX3Form<60, 178,
1188 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1189 "xxlnand $XT, $XA, $XB", IIC_VecGeneral,
1190 [(set v4i32:$XT, (vnot_ppc (and v4i32:$XA,
Kit Barton298beb52015-02-18 16:21:46 +00001191 v4i32:$XB)))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001192 } // isCommutable, UseVSXReg
Nemanja Ivanovicd9e4b4f2015-07-10 14:25:17 +00001193
Nemanja Ivanovic5655fb32015-07-10 12:38:08 +00001194 def : Pat<(int_ppc_vsx_xxleqv v4i32:$A, v4i32:$B),
1195 (XXLEQV $A, $B)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001196
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001197 let UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001198 def XXLORC : XX3Form<60, 170,
1199 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1200 "xxlorc $XT, $XA, $XB", IIC_VecGeneral,
1201 [(set v4i32:$XT, (or v4i32:$XA, (vnot_ppc v4i32:$XB)))]>;
1202
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001203 // VSX scalar loads introduced in ISA 2.07
1204 let mayLoad = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001205 let CodeSize = 3 in
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001206 def LXSSPX : XX1Form<31, 524, (outs vssrc:$XT), (ins memrr:$src),
1207 "lxsspx $XT, $src", IIC_LdStLFD,
1208 [(set f32:$XT, (load xoaddr:$src))]>;
1209 def LXSIWAX : XX1Form<31, 76, (outs vsfrc:$XT), (ins memrr:$src),
1210 "lxsiwax $XT, $src", IIC_LdStLFD,
1211 [(set f64:$XT, (PPClfiwax xoaddr:$src))]>;
1212 def LXSIWZX : XX1Form<31, 12, (outs vsfrc:$XT), (ins memrr:$src),
1213 "lxsiwzx $XT, $src", IIC_LdStLFD,
1214 [(set f64:$XT, (PPClfiwzx xoaddr:$src))]>;
1215 } // mayLoad
1216
1217 // VSX scalar stores introduced in ISA 2.07
1218 let mayStore = 1 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001219 let CodeSize = 3 in
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001220 def STXSSPX : XX1Form<31, 652, (outs), (ins vssrc:$XT, memrr:$dst),
1221 "stxsspx $XT, $dst", IIC_LdStSTFD,
1222 [(store f32:$XT, xoaddr:$dst)]>;
1223 def STXSIWX : XX1Form<31, 140, (outs), (ins vsfrc:$XT, memrr:$dst),
1224 "stxsiwx $XT, $dst", IIC_LdStSTFD,
1225 [(PPCstfiwx f64:$XT, xoaddr:$dst)]>;
1226 } // mayStore
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001227 } // UseVSXReg = 1
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001228
1229 def : Pat<(f64 (extloadf32 xoaddr:$src)),
1230 (COPY_TO_REGCLASS (LXSSPX xoaddr:$src), VSFRC)>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001231 def : Pat<(f32 (fpround (extloadf32 xoaddr:$src))),
1232 (f32 (LXSSPX xoaddr:$src))>;
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +00001233 def : Pat<(f64 (fpextend f32:$src)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001234 (COPY_TO_REGCLASS $src, VSFRC)>;
Hal Finkela2cdbce2015-08-30 22:12:50 +00001235
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001236 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001237 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1238 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001239 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1240 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001241 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1242 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001243 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1244 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETEQ)),
1245 (SELECT_VSSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1246 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001247 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1248 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001249 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1250 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001251 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1252 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001253 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1254 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETNE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001255 (SELECT_VSSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001256
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001257 let UseVSXReg = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001258 // VSX Elementary Scalar FP arithmetic (SP)
1259 let isCommutable = 1 in {
1260 def XSADDSP : XX3Form<60, 0,
1261 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1262 "xsaddsp $XT, $XA, $XB", IIC_VecFP,
1263 [(set f32:$XT, (fadd f32:$XA, f32:$XB))]>;
1264 def XSMULSP : XX3Form<60, 16,
1265 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1266 "xsmulsp $XT, $XA, $XB", IIC_VecFP,
1267 [(set f32:$XT, (fmul f32:$XA, f32:$XB))]>;
1268 } // isCommutable
1269
1270 def XSDIVSP : XX3Form<60, 24,
1271 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1272 "xsdivsp $XT, $XA, $XB", IIC_FPDivS,
1273 [(set f32:$XT, (fdiv f32:$XA, f32:$XB))]>;
1274 def XSRESP : XX2Form<60, 26,
1275 (outs vssrc:$XT), (ins vssrc:$XB),
1276 "xsresp $XT, $XB", IIC_VecFP,
1277 [(set f32:$XT, (PPCfre f32:$XB))]>;
1278 def XSSQRTSP : XX2Form<60, 11,
1279 (outs vssrc:$XT), (ins vssrc:$XB),
1280 "xssqrtsp $XT, $XB", IIC_FPSqrtS,
1281 [(set f32:$XT, (fsqrt f32:$XB))]>;
1282 def XSRSQRTESP : XX2Form<60, 10,
1283 (outs vssrc:$XT), (ins vssrc:$XB),
1284 "xsrsqrtesp $XT, $XB", IIC_VecFP,
1285 [(set f32:$XT, (PPCfrsqrte f32:$XB))]>;
1286 def XSSUBSP : XX3Form<60, 8,
1287 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1288 "xssubsp $XT, $XA, $XB", IIC_VecFP,
1289 [(set f32:$XT, (fsub f32:$XA, f32:$XB))]>;
Nemanja Ivanovic376e1732015-05-29 17:13:25 +00001290
1291 // FMA Instructions
1292 let BaseName = "XSMADDASP" in {
1293 let isCommutable = 1 in
1294 def XSMADDASP : XX3Form<60, 1,
1295 (outs vssrc:$XT),
1296 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1297 "xsmaddasp $XT, $XA, $XB", IIC_VecFP,
1298 [(set f32:$XT, (fma f32:$XA, f32:$XB, f32:$XTi))]>,
1299 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1300 AltVSXFMARel;
1301 let IsVSXFMAAlt = 1 in
1302 def XSMADDMSP : XX3Form<60, 9,
1303 (outs vssrc:$XT),
1304 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1305 "xsmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1306 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1307 AltVSXFMARel;
1308 }
1309
1310 let BaseName = "XSMSUBASP" in {
1311 let isCommutable = 1 in
1312 def XSMSUBASP : XX3Form<60, 17,
1313 (outs vssrc:$XT),
1314 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1315 "xsmsubasp $XT, $XA, $XB", IIC_VecFP,
1316 [(set f32:$XT, (fma f32:$XA, f32:$XB,
1317 (fneg f32:$XTi)))]>,
1318 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1319 AltVSXFMARel;
1320 let IsVSXFMAAlt = 1 in
1321 def XSMSUBMSP : XX3Form<60, 25,
1322 (outs vssrc:$XT),
1323 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1324 "xsmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1325 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1326 AltVSXFMARel;
1327 }
1328
1329 let BaseName = "XSNMADDASP" in {
1330 let isCommutable = 1 in
1331 def XSNMADDASP : XX3Form<60, 129,
1332 (outs vssrc:$XT),
1333 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1334 "xsnmaddasp $XT, $XA, $XB", IIC_VecFP,
1335 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1336 f32:$XTi)))]>,
1337 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1338 AltVSXFMARel;
1339 let IsVSXFMAAlt = 1 in
1340 def XSNMADDMSP : XX3Form<60, 137,
1341 (outs vssrc:$XT),
1342 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1343 "xsnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1344 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1345 AltVSXFMARel;
1346 }
1347
1348 let BaseName = "XSNMSUBASP" in {
1349 let isCommutable = 1 in
1350 def XSNMSUBASP : XX3Form<60, 145,
1351 (outs vssrc:$XT),
1352 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1353 "xsnmsubasp $XT, $XA, $XB", IIC_VecFP,
1354 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1355 (fneg f32:$XTi))))]>,
1356 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1357 AltVSXFMARel;
1358 let IsVSXFMAAlt = 1 in
1359 def XSNMSUBMSP : XX3Form<60, 153,
1360 (outs vssrc:$XT),
1361 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1362 "xsnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1363 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1364 AltVSXFMARel;
1365 }
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001366
1367 // Single Precision Conversions (FP <-> INT)
1368 def XSCVSXDSP : XX2Form<60, 312,
1369 (outs vssrc:$XT), (ins vsfrc:$XB),
1370 "xscvsxdsp $XT, $XB", IIC_VecFP,
1371 [(set f32:$XT, (PPCfcfids f64:$XB))]>;
1372 def XSCVUXDSP : XX2Form<60, 296,
1373 (outs vssrc:$XT), (ins vsfrc:$XB),
1374 "xscvuxdsp $XT, $XB", IIC_VecFP,
1375 [(set f32:$XT, (PPCfcfidus f64:$XB))]>;
1376
1377 // Conversions between vector and scalar single precision
1378 def XSCVDPSPN : XX2Form<60, 267, (outs vsrc:$XT), (ins vssrc:$XB),
1379 "xscvdpspn $XT, $XB", IIC_VecFP, []>;
1380 def XSCVSPDPN : XX2Form<60, 331, (outs vssrc:$XT), (ins vsrc:$XB),
1381 "xscvspdpn $XT, $XB", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001382 } // UseVSXReg = 1
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001383
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001384 let Predicates = [IsLittleEndian] in {
1385 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1386 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1387 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1388 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1389 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1390 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1391 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1392 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1393 }
1394
1395 let Predicates = [IsBigEndian] in {
1396 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1397 (f32 (XSCVSXDSP (COPY_TO_REGCLASS $S, VSFRC)))>;
1398 def : Pat<(f32 (PPCfcfids (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1399 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1400 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1401 (f32 (XSCVUXDSP (COPY_TO_REGCLASS $S, VSFRC)))>;
1402 def : Pat<(f32 (PPCfcfidus (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1403 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1404 }
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001405 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.Li32)),
1406 (v4i32 (XXSPLTWs (LXSIWAX xoaddr:$src), 1))>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001407} // AddedComplexity = 400
Kit Barton298beb52015-02-18 16:21:46 +00001408} // HasP8Vector
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001409
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001410let UseVSXReg = 1, AddedComplexity = 400 in {
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001411let Predicates = [HasDirectMove] in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001412 // VSX direct move instructions
1413 def MFVSRD : XX1_RS6_RD5_XO<31, 51, (outs g8rc:$rA), (ins vsfrc:$XT),
1414 "mfvsrd $rA, $XT", IIC_VecGeneral,
1415 [(set i64:$rA, (PPCmfvsr f64:$XT))]>,
1416 Requires<[In64BitMode]>;
1417 def MFVSRWZ : XX1_RS6_RD5_XO<31, 115, (outs gprc:$rA), (ins vsfrc:$XT),
1418 "mfvsrwz $rA, $XT", IIC_VecGeneral,
1419 [(set i32:$rA, (PPCmfvsr f64:$XT))]>;
1420 def MTVSRD : XX1_RS6_RD5_XO<31, 179, (outs vsfrc:$XT), (ins g8rc:$rA),
1421 "mtvsrd $XT, $rA", IIC_VecGeneral,
1422 [(set f64:$XT, (PPCmtvsra i64:$rA))]>,
1423 Requires<[In64BitMode]>;
1424 def MTVSRWA : XX1_RS6_RD5_XO<31, 211, (outs vsfrc:$XT), (ins gprc:$rA),
1425 "mtvsrwa $XT, $rA", IIC_VecGeneral,
1426 [(set f64:$XT, (PPCmtvsra i32:$rA))]>;
1427 def MTVSRWZ : XX1_RS6_RD5_XO<31, 243, (outs vsfrc:$XT), (ins gprc:$rA),
1428 "mtvsrwz $XT, $rA", IIC_VecGeneral,
1429 [(set f64:$XT, (PPCmtvsrz i32:$rA))]>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001430} // HasDirectMove
1431
1432let Predicates = [IsISA3_0, HasDirectMove] in {
1433 def MTVSRWS: XX1_RS6_RD5_XO<31, 403, (outs vsrc:$XT), (ins gprc:$rA),
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00001434 "mtvsrws $XT, $rA", IIC_VecGeneral, []>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001435
1436 def MTVSRDD: XX1Form<31, 435, (outs vsrc:$XT), (ins g8rc:$rA, g8rc:$rB),
1437 "mtvsrdd $XT, $rA, $rB", IIC_VecGeneral,
1438 []>, Requires<[In64BitMode]>;
1439
1440 def MFVSRLD: XX1_RS6_RD5_XO<31, 307, (outs g8rc:$rA), (ins vsrc:$XT),
1441 "mfvsrld $rA, $XT", IIC_VecGeneral,
1442 []>, Requires<[In64BitMode]>;
1443
1444} // IsISA3_0, HasDirectMove
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001445} // UseVSXReg = 1
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001446
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001447/* Direct moves of various widths from GPR's into VSR's. Each move lines
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001448 the value up into element 0 (both BE and LE). Namely, entities smaller than
1449 a doubleword are shifted left and moved for BE. For LE, they're moved, then
1450 swapped to go into the least significant element of the VSR.
1451*/
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001452def MovesToVSR {
1453 dag BE_BYTE_0 =
1454 (MTVSRD
1455 (RLDICR
1456 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 56, 7));
1457 dag BE_HALF_0 =
1458 (MTVSRD
1459 (RLDICR
1460 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 48, 15));
1461 dag BE_WORD_0 =
1462 (MTVSRD
1463 (RLDICR
1464 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 32, 31));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001465 dag BE_DWORD_0 = (MTVSRD $A);
1466
1467 dag LE_MTVSRW = (MTVSRD (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001468 dag LE_WORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1469 LE_MTVSRW, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001470 dag LE_WORD_0 = (XXPERMDI LE_WORD_1, LE_WORD_1, 2);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001471 dag LE_DWORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1472 BE_DWORD_0, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001473 dag LE_DWORD_0 = (XXPERMDI LE_DWORD_1, LE_DWORD_1, 2);
1474}
1475
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001476/* Patterns for extracting elements out of vectors. Integer elements are
1477 extracted using direct move operations. Patterns for extracting elements
1478 whose indices are not available at compile time are also provided with
1479 various _VARIABLE_ patterns.
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001480 The numbering for the DAG's is for LE, but when used on BE, the correct
1481 LE element can just be used (i.e. LE_BYTE_2 == BE_BYTE_13).
1482*/
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001483def VectorExtractions {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001484 // Doubleword extraction
1485 dag LE_DWORD_0 =
1486 (MFVSRD
1487 (EXTRACT_SUBREG
1488 (XXPERMDI (COPY_TO_REGCLASS $S, VSRC),
1489 (COPY_TO_REGCLASS $S, VSRC), 2), sub_64));
1490 dag LE_DWORD_1 = (MFVSRD
1491 (EXTRACT_SUBREG
1492 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1493
1494 // Word extraction
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001495 dag LE_WORD_0 = (MFVSRWZ (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001496 dag LE_WORD_1 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 1), sub_64));
1497 dag LE_WORD_2 = (MFVSRWZ (EXTRACT_SUBREG
1498 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1499 dag LE_WORD_3 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 3), sub_64));
1500
1501 // Halfword extraction
1502 dag LE_HALF_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 48), sub_32));
1503 dag LE_HALF_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 48), sub_32));
1504 dag LE_HALF_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 48), sub_32));
1505 dag LE_HALF_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 48), sub_32));
1506 dag LE_HALF_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 48), sub_32));
1507 dag LE_HALF_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 48), sub_32));
1508 dag LE_HALF_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 48), sub_32));
1509 dag LE_HALF_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 48), sub_32));
1510
1511 // Byte extraction
1512 dag LE_BYTE_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 56), sub_32));
1513 dag LE_BYTE_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 56, 56), sub_32));
1514 dag LE_BYTE_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 56), sub_32));
1515 dag LE_BYTE_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 40, 56), sub_32));
1516 dag LE_BYTE_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 56), sub_32));
1517 dag LE_BYTE_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 24, 56), sub_32));
1518 dag LE_BYTE_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 56), sub_32));
1519 dag LE_BYTE_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 8, 56), sub_32));
1520 dag LE_BYTE_8 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 56), sub_32));
1521 dag LE_BYTE_9 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 56, 56), sub_32));
1522 dag LE_BYTE_10 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 56), sub_32));
1523 dag LE_BYTE_11 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 40, 56), sub_32));
1524 dag LE_BYTE_12 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 56), sub_32));
1525 dag LE_BYTE_13 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 24, 56), sub_32));
1526 dag LE_BYTE_14 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 56), sub_32));
1527 dag LE_BYTE_15 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 8, 56), sub_32));
1528
1529 /* Variable element number (BE and LE patterns must be specified separately)
1530 This is a rather involved process.
1531
1532 Conceptually, this is how the move is accomplished:
1533 1. Identify which doubleword contains the element
1534 2. Shift in the VMX register so that the correct doubleword is correctly
1535 lined up for the MFVSRD
1536 3. Perform the move so that the element (along with some extra stuff)
1537 is in the GPR
1538 4. Right shift within the GPR so that the element is right-justified
1539
1540 Of course, the index is an element number which has a different meaning
1541 on LE/BE so the patterns have to be specified separately.
1542
1543 Note: The final result will be the element right-justified with high
1544 order bits being arbitrarily defined (namely, whatever was in the
1545 vector register to the left of the value originally).
1546 */
1547
1548 /* LE variable byte
1549 Number 1. above:
1550 - For elements 0-7, we shift left by 8 bytes since they're on the right
1551 - For elements 8-15, we need not shift (shift left by zero bytes)
1552 This is accomplished by inverting the bits of the index and AND-ing
1553 with 0x8 (i.e. clearing all bits of the index and inverting bit 60).
1554 */
1555 dag LE_VBYTE_PERM_VEC = (LVSL ZERO8, (ANDC8 (LI8 8), $Idx));
1556
1557 // Number 2. above:
1558 // - Now that we set up the shift amount, we shift in the VMX register
1559 dag LE_VBYTE_PERMUTE = (VPERM $S, $S, LE_VBYTE_PERM_VEC);
1560
1561 // Number 3. above:
1562 // - The doubleword containing our element is moved to a GPR
1563 dag LE_MV_VBYTE = (MFVSRD
1564 (EXTRACT_SUBREG
1565 (v2i64 (COPY_TO_REGCLASS LE_VBYTE_PERMUTE, VSRC)),
1566 sub_64));
1567
1568 /* Number 4. above:
1569 - Truncate the element number to the range 0-7 (8-15 are symmetrical
1570 and out of range values are truncated accordingly)
1571 - Multiply by 8 as we need to shift right by the number of bits, not bytes
1572 - Shift right in the GPR by the calculated value
1573 */
1574 dag LE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 7), $Idx), 3, 60),
1575 sub_32);
1576 dag LE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD LE_MV_VBYTE, LE_VBYTE_SHIFT),
1577 sub_32);
1578
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001579 /* LE variable halfword
1580 Number 1. above:
1581 - For elements 0-3, we shift left by 8 since they're on the right
1582 - For elements 4-7, we need not shift (shift left by zero bytes)
1583 Similarly to the byte pattern, we invert the bits of the index, but we
1584 AND with 0x4 (i.e. clear all bits of the index and invert bit 61).
1585 Of course, the shift is still by 8 bytes, so we must multiply by 2.
1586 */
1587 dag LE_VHALF_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 4), $Idx), 1, 62));
1588
1589 // Number 2. above:
1590 // - Now that we set up the shift amount, we shift in the VMX register
1591 dag LE_VHALF_PERMUTE = (VPERM $S, $S, LE_VHALF_PERM_VEC);
1592
1593 // Number 3. above:
1594 // - The doubleword containing our element is moved to a GPR
1595 dag LE_MV_VHALF = (MFVSRD
1596 (EXTRACT_SUBREG
1597 (v2i64 (COPY_TO_REGCLASS LE_VHALF_PERMUTE, VSRC)),
1598 sub_64));
1599
1600 /* Number 4. above:
1601 - Truncate the element number to the range 0-3 (4-7 are symmetrical
1602 and out of range values are truncated accordingly)
1603 - Multiply by 16 as we need to shift right by the number of bits
1604 - Shift right in the GPR by the calculated value
1605 */
1606 dag LE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 3), $Idx), 4, 59),
1607 sub_32);
1608 dag LE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD LE_MV_VHALF, LE_VHALF_SHIFT),
1609 sub_32);
1610
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001611 /* LE variable word
1612 Number 1. above:
1613 - For elements 0-1, we shift left by 8 since they're on the right
1614 - For elements 2-3, we need not shift
1615 */
1616 dag LE_VWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 2), $Idx), 2, 61));
1617
1618 // Number 2. above:
1619 // - Now that we set up the shift amount, we shift in the VMX register
1620 dag LE_VWORD_PERMUTE = (VPERM $S, $S, LE_VWORD_PERM_VEC);
1621
1622 // Number 3. above:
1623 // - The doubleword containing our element is moved to a GPR
1624 dag LE_MV_VWORD = (MFVSRD
1625 (EXTRACT_SUBREG
1626 (v2i64 (COPY_TO_REGCLASS LE_VWORD_PERMUTE, VSRC)),
1627 sub_64));
1628
1629 /* Number 4. above:
1630 - Truncate the element number to the range 0-1 (2-3 are symmetrical
1631 and out of range values are truncated accordingly)
1632 - Multiply by 32 as we need to shift right by the number of bits
1633 - Shift right in the GPR by the calculated value
1634 */
1635 dag LE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 1), $Idx), 5, 58),
1636 sub_32);
1637 dag LE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD LE_MV_VWORD, LE_VWORD_SHIFT),
1638 sub_32);
1639
1640 /* LE variable doubleword
1641 Number 1. above:
1642 - For element 0, we shift left by 8 since it's on the right
1643 - For element 1, we need not shift
1644 */
1645 dag LE_VDWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDC8 (LI8 1), $Idx), 3, 60));
1646
1647 // Number 2. above:
1648 // - Now that we set up the shift amount, we shift in the VMX register
1649 dag LE_VDWORD_PERMUTE = (VPERM $S, $S, LE_VDWORD_PERM_VEC);
1650
1651 // Number 3. above:
1652 // - The doubleword containing our element is moved to a GPR
1653 // - Number 4. is not needed for the doubleword as the value is 64-bits
1654 dag LE_VARIABLE_DWORD =
1655 (MFVSRD (EXTRACT_SUBREG
1656 (v2i64 (COPY_TO_REGCLASS LE_VDWORD_PERMUTE, VSRC)),
1657 sub_64));
1658
1659 /* LE variable float
1660 - Shift the vector to line up the desired element to BE Word 0
1661 - Convert 32-bit float to a 64-bit single precision float
1662 */
1663 dag LE_VFLOAT_PERM_VEC = (LVSL ZERO8, (RLDICR (XOR8 (LI8 3), $Idx), 2, 61));
1664 dag LE_VFLOAT_PERMUTE = (VPERM $S, $S, LE_VFLOAT_PERM_VEC);
1665 dag LE_VARIABLE_FLOAT = (XSCVSPDPN LE_VFLOAT_PERMUTE);
1666
1667 /* LE variable double
1668 Same as the LE doubleword except there is no move.
1669 */
1670 dag LE_VDOUBLE_PERMUTE = (VPERM (COPY_TO_REGCLASS $S, VRRC),
1671 (COPY_TO_REGCLASS $S, VRRC),
1672 LE_VDWORD_PERM_VEC);
1673 dag LE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS LE_VDOUBLE_PERMUTE, VSRC);
1674
1675 /* BE variable byte
1676 The algorithm here is the same as the LE variable byte except:
1677 - The shift in the VMX register is by 0/8 for opposite element numbers so
1678 we simply AND the element number with 0x8
1679 - The order of elements after the move to GPR is reversed, so we invert
1680 the bits of the index prior to truncating to the range 0-7
1681 */
1682 dag BE_VBYTE_PERM_VEC = (LVSL ZERO8, (ANDIo8 $Idx, 8));
1683 dag BE_VBYTE_PERMUTE = (VPERM $S, $S, BE_VBYTE_PERM_VEC);
1684 dag BE_MV_VBYTE = (MFVSRD
1685 (EXTRACT_SUBREG
1686 (v2i64 (COPY_TO_REGCLASS BE_VBYTE_PERMUTE, VSRC)),
1687 sub_64));
1688 dag BE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 7), $Idx), 3, 60),
1689 sub_32);
1690 dag BE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD BE_MV_VBYTE, BE_VBYTE_SHIFT),
1691 sub_32);
1692
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001693 /* BE variable halfword
1694 The algorithm here is the same as the LE variable halfword except:
1695 - The shift in the VMX register is by 0/8 for opposite element numbers so
1696 we simply AND the element number with 0x4 and multiply by 2
1697 - The order of elements after the move to GPR is reversed, so we invert
1698 the bits of the index prior to truncating to the range 0-3
1699 */
1700 dag BE_VHALF_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 4), 1, 62));
1701 dag BE_VHALF_PERMUTE = (VPERM $S, $S, BE_VHALF_PERM_VEC);
1702 dag BE_MV_VHALF = (MFVSRD
1703 (EXTRACT_SUBREG
1704 (v2i64 (COPY_TO_REGCLASS BE_VHALF_PERMUTE, VSRC)),
1705 sub_64));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001706 dag BE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 3), $Idx), 4, 59),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001707 sub_32);
1708 dag BE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD BE_MV_VHALF, BE_VHALF_SHIFT),
1709 sub_32);
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001710
1711 /* BE variable word
1712 The algorithm is the same as the LE variable word except:
1713 - The shift in the VMX register happens for opposite element numbers
1714 - The order of elements after the move to GPR is reversed, so we invert
1715 the bits of the index prior to truncating to the range 0-1
1716 */
1717 dag BE_VWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 2), 2, 61));
1718 dag BE_VWORD_PERMUTE = (VPERM $S, $S, BE_VWORD_PERM_VEC);
1719 dag BE_MV_VWORD = (MFVSRD
1720 (EXTRACT_SUBREG
1721 (v2i64 (COPY_TO_REGCLASS BE_VWORD_PERMUTE, VSRC)),
1722 sub_64));
1723 dag BE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 1), $Idx), 5, 58),
1724 sub_32);
1725 dag BE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD BE_MV_VWORD, BE_VWORD_SHIFT),
1726 sub_32);
1727
1728 /* BE variable doubleword
1729 Same as the LE doubleword except we shift in the VMX register for opposite
1730 element indices.
1731 */
1732 dag BE_VDWORD_PERM_VEC = (LVSL ZERO8, (RLDICR (ANDIo8 $Idx, 1), 3, 60));
1733 dag BE_VDWORD_PERMUTE = (VPERM $S, $S, BE_VDWORD_PERM_VEC);
1734 dag BE_VARIABLE_DWORD =
1735 (MFVSRD (EXTRACT_SUBREG
1736 (v2i64 (COPY_TO_REGCLASS BE_VDWORD_PERMUTE, VSRC)),
1737 sub_64));
1738
1739 /* BE variable float
1740 - Shift the vector to line up the desired element to BE Word 0
1741 - Convert 32-bit float to a 64-bit single precision float
1742 */
1743 dag BE_VFLOAT_PERM_VEC = (LVSL ZERO8, (RLDICR $Idx, 2, 61));
1744 dag BE_VFLOAT_PERMUTE = (VPERM $S, $S, BE_VFLOAT_PERM_VEC);
1745 dag BE_VARIABLE_FLOAT = (XSCVSPDPN BE_VFLOAT_PERMUTE);
1746
1747 /* BE variable double
1748 Same as the BE doubleword except there is no move.
1749 */
1750 dag BE_VDOUBLE_PERMUTE = (VPERM (COPY_TO_REGCLASS $S, VRRC),
1751 (COPY_TO_REGCLASS $S, VRRC),
1752 BE_VDWORD_PERM_VEC);
1753 dag BE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS BE_VDOUBLE_PERMUTE, VSRC);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001754}
1755
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001756let AddedComplexity = 400 in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001757// v4f32 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001758let Predicates = [IsBigEndian, HasP8Vector] in {
1759 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1760 (v4f32 (XSCVDPSPN $A))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001761 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1762 (f32 (XSCVSPDPN $S))>;
1763 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
1764 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
1765 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001766 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001767 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
1768 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001769 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
1770 (f32 VectorExtractions.BE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001771} // IsBigEndian, HasP8Vector
1772
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001773// Variable index vector_extract for v2f64 does not require P8Vector
1774let Predicates = [IsBigEndian, HasVSX] in
1775 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
1776 (f64 VectorExtractions.BE_VARIABLE_DOUBLE)>;
1777
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001778let Predicates = [IsBigEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001779 // v16i8 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001780 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001781 (v16i8 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_BYTE_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001782 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001783 (v8i16 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_HALF_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001784 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001785 (v4i32 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_WORD_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001786 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001787 (v2i64 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_DWORD_0, sub_64))>;
1788 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001789 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001790 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001791 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001792 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001793 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001794 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001795 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001796 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001797 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001798 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001799 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001800 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001801 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001802 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001803 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001804 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001805 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001806 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001807 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001808 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001809 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001810 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001811 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001812 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001813 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001814 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001815 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001816 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001817 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001818 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001819 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001820 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001821 (i32 VectorExtractions.BE_VARIABLE_BYTE)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001822
1823 // v8i16 scalar <-> vector conversions (BE)
1824 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001825 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001826 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001827 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001828 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001829 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001830 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001831 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001832 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001833 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001834 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001835 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001836 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001837 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001838 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001839 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001840 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001841 (i32 VectorExtractions.BE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001842
1843 // v4i32 scalar <-> vector conversions (BE)
1844 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001845 (i32 VectorExtractions.LE_WORD_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001846 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001847 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001848 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001849 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001850 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001851 (i32 VectorExtractions.LE_WORD_0)>;
1852 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
1853 (i32 VectorExtractions.BE_VARIABLE_WORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001854
1855 // v2i64 scalar <-> vector conversions (BE)
1856 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001857 (i64 VectorExtractions.LE_DWORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001858 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001859 (i64 VectorExtractions.LE_DWORD_0)>;
1860 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
1861 (i64 VectorExtractions.BE_VARIABLE_DWORD)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001862} // IsBigEndian, HasDirectMove
1863
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001864// v4f32 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001865let Predicates = [IsLittleEndian, HasP8Vector] in {
1866 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1867 (v4f32 (XXSLDWI (XSCVDPSPN $A), (XSCVDPSPN $A), 1))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001868 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1869 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
1870 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001871 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001872 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
1873 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
1874 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
1875 (f32 (XSCVSPDPN $S))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001876 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
1877 (f32 VectorExtractions.LE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001878} // IsLittleEndian, HasP8Vector
1879
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001880// Variable index vector_extract for v2f64 does not require P8Vector
1881let Predicates = [IsLittleEndian, HasVSX] in
1882 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
1883 (f64 VectorExtractions.LE_VARIABLE_DOUBLE)>;
1884
Nemanja Ivanovicf57f1502016-11-29 23:00:33 +00001885 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x_be xoaddr:$src)), (LXVW4X xoaddr:$src)>;
1886 def : Pat<(v2f64 (int_ppc_vsx_lxvd2x_be xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Tony Jiang5f850cd2016-11-15 14:25:56 +00001887
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001888let Predicates = [IsLittleEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001889 // v16i8 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001890 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001891 (v16i8 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001892 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001893 (v8i16 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001894 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001895 (v4i32 MovesToVSR.LE_WORD_0)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001896 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001897 (v2i64 MovesToVSR.LE_DWORD_0)>;
1898 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001899 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001900 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001901 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001902 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001903 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001904 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001905 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001906 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001907 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001908 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001909 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001910 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001911 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001912 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001913 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001914 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001915 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001916 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001917 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001918 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001919 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001920 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001921 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001922 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001923 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001924 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001925 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001926 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001927 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001928 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001929 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001930 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001931 (i32 VectorExtractions.LE_VARIABLE_BYTE)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001932
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001933 // v8i16 scalar <-> vector conversions (LE)
1934 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001935 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001936 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001937 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001938 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001939 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001940 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001941 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001942 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001943 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001944 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001945 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001946 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001947 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001948 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001949 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001950 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001951 (i32 VectorExtractions.LE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001952
1953 // v4i32 scalar <-> vector conversions (LE)
1954 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001955 (i32 VectorExtractions.LE_WORD_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001956 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001957 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001958 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001959 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001960 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001961 (i32 VectorExtractions.LE_WORD_3)>;
1962 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
1963 (i32 VectorExtractions.LE_VARIABLE_WORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001964
1965 // v2i64 scalar <-> vector conversions (LE)
1966 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001967 (i64 VectorExtractions.LE_DWORD_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001968 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001969 (i64 VectorExtractions.LE_DWORD_1)>;
1970 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
1971 (i64 VectorExtractions.LE_VARIABLE_DWORD)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001972} // IsLittleEndian, HasDirectMove
Nemanja Ivanovic89224762015-12-15 14:50:34 +00001973
1974let Predicates = [HasDirectMove, HasVSX] in {
1975// bitconvert f32 -> i32
1976// (convert to 32-bit fp single, shift right 1 word, move to GPR)
1977def : Pat<(i32 (bitconvert f32:$S)),
1978 (i32 (MFVSRWZ (EXTRACT_SUBREG
1979 (XXSLDWI (XSCVDPSPN $S),(XSCVDPSPN $S), 3),
1980 sub_64)))>;
1981// bitconvert i32 -> f32
1982// (move to FPR, shift left 1 word, convert to 64-bit fp single)
1983def : Pat<(f32 (bitconvert i32:$A)),
1984 (f32 (XSCVSPDPN
1985 (XXSLDWI MovesToVSR.LE_WORD_1, MovesToVSR.LE_WORD_1, 1)))>;
1986
1987// bitconvert f64 -> i64
1988// (move to GPR, nothing else needed)
1989def : Pat<(i64 (bitconvert f64:$S)),
1990 (i64 (MFVSRD $S))>;
1991
1992// bitconvert i64 -> f64
1993// (move to FPR, nothing else needed)
1994def : Pat<(f64 (bitconvert i64:$S)),
1995 (f64 (MTVSRD $S))>;
1996}
Kit Barton93612ec2016-02-26 21:11:55 +00001997
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001998// Materialize a zero-vector of long long
1999def : Pat<(v2i64 immAllZerosV),
2000 (v2i64 (XXLXORz))>;
2001}
2002
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002003def AlignValues {
2004 dag F32_TO_BE_WORD1 = (v4f32 (XXSLDWI (XSCVDPSPN $B), (XSCVDPSPN $B), 3));
2005 dag I32_TO_BE_WORD1 = (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC);
2006}
2007
Kit Barton93612ec2016-02-26 21:11:55 +00002008// The following VSX instructions were introduced in Power ISA 3.0
2009def HasP9Vector : Predicate<"PPCSubTarget->hasP9Vector()">;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002010let AddedComplexity = 400, Predicates = [HasP9Vector] in {
Kit Barton93612ec2016-02-26 21:11:55 +00002011
2012 // [PO VRT XO VRB XO /]
2013 class X_VT5_XO5_VB5<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2014 list<dag> pattern>
2015 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vrrc:$vB),
2016 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2017
2018 // [PO VRT XO VRB XO RO], Round to Odd version of [PO VRT XO VRB XO /]
2019 class X_VT5_XO5_VB5_Ro<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2020 list<dag> pattern>
2021 : X_VT5_XO5_VB5<opcode, xo2, xo, opc, pattern>, isDOT;
2022
2023 // [PO VRT XO VRB XO /], but the VRB is only used the left 64 bits (or less),
2024 // So we use different operand class for VRB
2025 class X_VT5_XO5_VB5_TyVB<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2026 RegisterOperand vbtype, list<dag> pattern>
2027 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vbtype:$vB),
2028 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2029
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002030 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002031 // [PO T XO B XO BX /]
2032 class XX2_RT5_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2033 list<dag> pattern>
2034 : XX2_RD5_XO5_RS6<opcode, xo2, xo, (outs g8rc:$rT), (ins vsfrc:$XB),
2035 !strconcat(opc, " $rT, $XB"), IIC_VecFP, pattern>;
2036
Kit Barton93612ec2016-02-26 21:11:55 +00002037 // [PO T XO B XO BX TX]
2038 class XX2_XT6_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2039 RegisterOperand vtype, list<dag> pattern>
2040 : XX2_RD6_XO5_RS6<opcode, xo2, xo, (outs vtype:$XT), (ins vtype:$XB),
2041 !strconcat(opc, " $XT, $XB"), IIC_VecFP, pattern>;
2042
2043 // [PO T A B XO AX BX TX], src and dest register use different operand class
2044 class XX3_XT5_XA5_XB5<bits<6> opcode, bits<8> xo, string opc,
2045 RegisterOperand xty, RegisterOperand aty, RegisterOperand bty,
2046 InstrItinClass itin, list<dag> pattern>
2047 : XX3Form<opcode, xo, (outs xty:$XT), (ins aty:$XA, bty:$XB),
2048 !strconcat(opc, " $XT, $XA, $XB"), itin, pattern>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002049 } // UseVSXReg = 1
Kit Barton93612ec2016-02-26 21:11:55 +00002050
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002051 // [PO VRT VRA VRB XO /]
2052 class X_VT5_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2053 list<dag> pattern>
2054 : XForm_1<opcode, xo, (outs vrrc:$vT), (ins vrrc:$vA, vrrc:$vB),
2055 !strconcat(opc, " $vT, $vA, $vB"), IIC_VecFP, pattern>;
2056
2057 // [PO VRT VRA VRB XO RO], Round to Odd version of [PO VRT VRA VRB XO /]
2058 class X_VT5_VA5_VB5_Ro<bits<6> opcode, bits<10> xo, string opc,
2059 list<dag> pattern>
2060 : X_VT5_VA5_VB5<opcode, xo, opc, pattern>, isDOT;
2061
2062 //===--------------------------------------------------------------------===//
2063 // Quad-Precision Scalar Move Instructions:
2064
2065 // Copy Sign
2066 def XSCPSGNQP : X_VT5_VA5_VB5<63, 100, "xscpsgnqp", []>;
2067
2068 // Absolute/Negative-Absolute/Negate
2069 def XSABSQP : X_VT5_XO5_VB5<63, 0, 804, "xsabsqp" , []>;
2070 def XSNABSQP : X_VT5_XO5_VB5<63, 8, 804, "xsnabsqp", []>;
2071 def XSNEGQP : X_VT5_XO5_VB5<63, 16, 804, "xsnegqp" , []>;
2072
2073 //===--------------------------------------------------------------------===//
2074 // Quad-Precision Scalar Floating-Point Arithmetic Instructions:
2075
2076 // Add/Divide/Multiply/Subtract
2077 def XSADDQP : X_VT5_VA5_VB5 <63, 4, "xsaddqp" , []>;
2078 def XSADDQPO : X_VT5_VA5_VB5_Ro<63, 4, "xsaddqpo", []>;
2079 def XSDIVQP : X_VT5_VA5_VB5 <63, 548, "xsdivqp" , []>;
2080 def XSDIVQPO : X_VT5_VA5_VB5_Ro<63, 548, "xsdivqpo", []>;
2081 def XSMULQP : X_VT5_VA5_VB5 <63, 36, "xsmulqp" , []>;
2082 def XSMULQPO : X_VT5_VA5_VB5_Ro<63, 36, "xsmulqpo", []>;
2083 def XSSUBQP : X_VT5_VA5_VB5 <63, 516, "xssubqp" , []>;
2084 def XSSUBQPO : X_VT5_VA5_VB5_Ro<63, 516, "xssubqpo", []>;
2085
2086 // Square-Root
2087 def XSSQRTQP : X_VT5_XO5_VB5 <63, 27, 804, "xssqrtqp" , []>;
2088 def XSSQRTQPO : X_VT5_XO5_VB5_Ro<63, 27, 804, "xssqrtqpo", []>;
2089
2090 // (Negative) Multiply-{Add/Subtract}
2091 def XSMADDQP : X_VT5_VA5_VB5 <63, 388, "xsmaddqp" , []>;
2092 def XSMADDQPO : X_VT5_VA5_VB5_Ro<63, 388, "xsmaddqpo" , []>;
2093 def XSMSUBQP : X_VT5_VA5_VB5 <63, 420, "xsmsubqp" , []>;
2094 def XSMSUBQPO : X_VT5_VA5_VB5_Ro<63, 420, "xsmsubqpo" , []>;
2095 def XSNMADDQP : X_VT5_VA5_VB5 <63, 452, "xsnmaddqp" , []>;
2096 def XSNMADDQPO: X_VT5_VA5_VB5_Ro<63, 452, "xsnmaddqpo", []>;
2097 def XSNMSUBQP : X_VT5_VA5_VB5 <63, 484, "xsnmsubqp" , []>;
2098 def XSNMSUBQPO: X_VT5_VA5_VB5_Ro<63, 484, "xsnmsubqpo", []>;
2099
Kit Barton93612ec2016-02-26 21:11:55 +00002100 //===--------------------------------------------------------------------===//
2101 // Quad/Double-Precision Compare Instructions:
2102
2103 // [PO BF // VRA VRB XO /]
2104 class X_BF3_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2105 list<dag> pattern>
2106 : XForm_17<opcode, xo, (outs crrc:$crD), (ins vrrc:$VA, vrrc:$VB),
2107 !strconcat(opc, " $crD, $VA, $VB"), IIC_FPCompare> {
2108 let Pattern = pattern;
2109 }
2110
2111 // QP Compare Ordered/Unordered
2112 def XSCMPOQP : X_BF3_VA5_VB5<63, 132, "xscmpoqp", []>;
2113 def XSCMPUQP : X_BF3_VA5_VB5<63, 644, "xscmpuqp", []>;
2114
2115 // DP/QP Compare Exponents
2116 def XSCMPEXPDP : XX3Form_1<60, 59,
2117 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002118 "xscmpexpdp $crD, $XA, $XB", IIC_FPCompare, []>,
2119 UseVSXReg;
Kit Barton93612ec2016-02-26 21:11:55 +00002120 def XSCMPEXPQP : X_BF3_VA5_VB5<63, 164, "xscmpexpqp", []>;
2121
2122 // DP Compare ==, >=, >, !=
2123 // Use vsrc for XT, because the entire register of XT is set.
2124 // XT.dword[1] = 0x0000_0000_0000_0000
2125 def XSCMPEQDP : XX3_XT5_XA5_XB5<60, 3, "xscmpeqdp", vsrc, vsfrc, vsfrc,
2126 IIC_FPCompare, []>;
2127 def XSCMPGEDP : XX3_XT5_XA5_XB5<60, 19, "xscmpgedp", vsrc, vsfrc, vsfrc,
2128 IIC_FPCompare, []>;
2129 def XSCMPGTDP : XX3_XT5_XA5_XB5<60, 11, "xscmpgtdp", vsrc, vsfrc, vsfrc,
2130 IIC_FPCompare, []>;
2131 def XSCMPNEDP : XX3_XT5_XA5_XB5<60, 27, "xscmpnedp", vsrc, vsfrc, vsfrc,
2132 IIC_FPCompare, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002133 let UseVSXReg = 1 in {
Kit Barton93612ec2016-02-26 21:11:55 +00002134 // Vector Compare Not Equal
2135 def XVCMPNEDP : XX3Form_Rc<60, 123,
2136 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2137 "xvcmpnedp $XT, $XA, $XB", IIC_VecFPCompare, []>;
2138 let Defs = [CR6] in
2139 def XVCMPNEDPo : XX3Form_Rc<60, 123,
2140 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2141 "xvcmpnedp. $XT, $XA, $XB", IIC_VecFPCompare, []>,
2142 isDOT;
2143 def XVCMPNESP : XX3Form_Rc<60, 91,
2144 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2145 "xvcmpnesp $XT, $XA, $XB", IIC_VecFPCompare, []>;
2146 let Defs = [CR6] in
2147 def XVCMPNESPo : XX3Form_Rc<60, 91,
2148 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
2149 "xvcmpnesp. $XT, $XA, $XB", IIC_VecFPCompare, []>,
2150 isDOT;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002151 } // UseVSXReg = 1
Kit Barton93612ec2016-02-26 21:11:55 +00002152
2153 //===--------------------------------------------------------------------===//
2154 // Quad-Precision Floating-Point Conversion Instructions:
2155
2156 // Convert DP -> QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002157 def XSCVDPQP : X_VT5_XO5_VB5_TyVB<63, 22, 836, "xscvdpqp", vfrc, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002158
2159 // Round & Convert QP -> DP (dword[1] is set to zero)
2160 def XSCVQPDP : X_VT5_XO5_VB5 <63, 20, 836, "xscvqpdp" , []>;
2161 def XSCVQPDPO : X_VT5_XO5_VB5_Ro<63, 20, 836, "xscvqpdpo", []>;
2162
2163 // Truncate & Convert QP -> (Un)Signed (D)Word (dword[1] is set to zero)
2164 def XSCVQPSDZ : X_VT5_XO5_VB5<63, 25, 836, "xscvqpsdz", []>;
2165 def XSCVQPSWZ : X_VT5_XO5_VB5<63, 9, 836, "xscvqpswz", []>;
2166 def XSCVQPUDZ : X_VT5_XO5_VB5<63, 17, 836, "xscvqpudz", []>;
2167 def XSCVQPUWZ : X_VT5_XO5_VB5<63, 1, 836, "xscvqpuwz", []>;
2168
2169 // Convert (Un)Signed DWord -> QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002170 def XSCVSDQP : X_VT5_XO5_VB5_TyVB<63, 10, 836, "xscvsdqp", vfrc, []>;
2171 def XSCVUDQP : X_VT5_XO5_VB5_TyVB<63, 2, 836, "xscvudqp", vfrc, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002172
Sean Fertilea435e072016-11-14 18:43:59 +00002173 let UseVSXReg = 1 in {
Kit Barton93612ec2016-02-26 21:11:55 +00002174 //===--------------------------------------------------------------------===//
2175 // Round to Floating-Point Integer Instructions
2176
2177 // (Round &) Convert DP <-> HP
2178 // Note! xscvdphp's src and dest register both use the left 64 bits, so we use
2179 // vsfrc for src and dest register. xscvhpdp's src only use the left 16 bits,
2180 // but we still use vsfrc for it.
2181 def XSCVDPHP : XX2_XT6_XO5_XB6<60, 17, 347, "xscvdphp", vsfrc, []>;
2182 def XSCVHPDP : XX2_XT6_XO5_XB6<60, 16, 347, "xscvhpdp", vsfrc, []>;
2183
2184 // Vector HP -> SP
2185 def XVCVHPSP : XX2_XT6_XO5_XB6<60, 24, 475, "xvcvhpsp", vsrc, []>;
Nemanja Ivanovicec4b0c32016-11-11 21:42:01 +00002186 def XVCVSPHP : XX2_XT6_XO5_XB6<60, 25, 475, "xvcvsphp", vsrc,
2187 [(set v4f32:$XT,
2188 (int_ppc_vsx_xvcvsphp v4f32:$XB))]>;
Kit Barton93612ec2016-02-26 21:11:55 +00002189
Sean Fertilea435e072016-11-14 18:43:59 +00002190 } // UseVSXReg = 1
2191
2192 // Pattern for matching Vector HP -> Vector SP intrinsic. Defined as a
2193 // seperate pattern so that it can convert the input register class from
2194 // VRRC(v8i16) to VSRC.
2195 def : Pat<(v4f32 (int_ppc_vsx_xvcvhpsp v8i16:$A)),
2196 (v4f32 (XVCVHPSP (COPY_TO_REGCLASS $A, VSRC)))>;
2197
Kit Barton93612ec2016-02-26 21:11:55 +00002198 class Z23_VT5_R1_VB5_RMC2_EX1<bits<6> opcode, bits<8> xo, bit ex, string opc,
2199 list<dag> pattern>
2200 : Z23Form_1<opcode, xo,
2201 (outs vrrc:$vT), (ins u1imm:$r, vrrc:$vB, u2imm:$rmc),
2202 !strconcat(opc, " $r, $vT, $vB, $rmc"), IIC_VecFP, pattern> {
2203 let RC = ex;
2204 }
2205
2206 // Round to Quad-Precision Integer [with Inexact]
2207 def XSRQPI : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 0, "xsrqpi" , []>;
2208 def XSRQPIX : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 1, "xsrqpix", []>;
2209
2210 // Round Quad-Precision to Double-Extended Precision (fp80)
2211 def XSRQPXP : Z23_VT5_R1_VB5_RMC2_EX1<63, 37, 0, "xsrqpxp", []>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002212
2213 //===--------------------------------------------------------------------===//
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002214 // Insert/Extract Instructions
2215
2216 // Insert Exponent DP/QP
2217 // XT NOTE: XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU
2218 def XSIEXPDP : XX1Form <60, 918, (outs vsrc:$XT), (ins g8rc:$rA, g8rc:$rB),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002219 "xsiexpdp $XT, $rA, $rB", IIC_VecFP, []>, UseVSXReg;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002220 // vB NOTE: only vB.dword[0] is used, that's why we don't use
2221 // X_VT5_VA5_VB5 form
2222 def XSIEXPQP : XForm_18<63, 868, (outs vrrc:$vT), (ins vrrc:$vA, vsfrc:$vB),
2223 "xsiexpqp $vT, $vA, $vB", IIC_VecFP, []>;
2224
2225 // Extract Exponent/Significand DP/QP
2226 def XSXEXPDP : XX2_RT5_XO5_XB6<60, 0, 347, "xsxexpdp", []>;
2227 def XSXSIGDP : XX2_RT5_XO5_XB6<60, 1, 347, "xsxsigdp", []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002228
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002229 def XSXEXPQP : X_VT5_XO5_VB5 <63, 2, 804, "xsxexpqp", []>;
2230 def XSXSIGQP : X_VT5_XO5_VB5 <63, 18, 804, "xsxsigqp", []>;
2231
2232 // Vector Insert Word
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002233 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002234 // XB NOTE: Only XB.dword[1] is used, but we use vsrc on XB.
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002235 def XXINSERTW :
2236 XX2_RD6_UIM5_RS6<60, 181, (outs vsrc:$XT),
2237 (ins vsrc:$XTi, vsrc:$XB, u4imm:$UIM),
2238 "xxinsertw $XT, $XB, $UIM", IIC_VecFP,
2239 [(set v4i32:$XT, (PPCxxinsert v4i32:$XTi, v4i32:$XB,
2240 imm32SExt16:$UIM))]>,
2241 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002242
2243 // Vector Extract Unsigned Word
2244 def XXEXTRACTUW : XX2_RD6_UIM5_RS6<60, 165,
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002245 (outs vsfrc:$XT), (ins vsrc:$XB, u4imm:$UIMM),
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002246 "xxextractuw $XT, $XB, $UIMM", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002247 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002248
2249 // Vector Insert Exponent DP/SP
2250 def XVIEXPDP : XX3_XT5_XA5_XB5<60, 248, "xviexpdp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002251 IIC_VecFP, [(set v2f64: $XT,(int_ppc_vsx_xviexpdp v2i64:$XA, v2i64:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002252 def XVIEXPSP : XX3_XT5_XA5_XB5<60, 216, "xviexpsp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002253 IIC_VecFP, [(set v4f32: $XT,(int_ppc_vsx_xviexpsp v4i32:$XA, v4i32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002254
2255 // Vector Extract Exponent/Significand DP/SP
Sean Fertileadda5b22016-11-14 14:42:37 +00002256 def XVXEXPDP : XX2_XT6_XO5_XB6<60, 0, 475, "xvxexpdp", vsrc,
2257 [(set v2i64: $XT,
2258 (int_ppc_vsx_xvxexpdp v2f64:$XB))]>;
2259 def XVXEXPSP : XX2_XT6_XO5_XB6<60, 8, 475, "xvxexpsp", vsrc,
2260 [(set v4i32: $XT,
2261 (int_ppc_vsx_xvxexpsp v4f32:$XB))]>;
2262 def XVXSIGDP : XX2_XT6_XO5_XB6<60, 1, 475, "xvxsigdp", vsrc,
2263 [(set v2i64: $XT,
2264 (int_ppc_vsx_xvxsigdp v2f64:$XB))]>;
2265 def XVXSIGSP : XX2_XT6_XO5_XB6<60, 9, 475, "xvxsigsp", vsrc,
2266 [(set v4i32: $XT,
2267 (int_ppc_vsx_xvxsigsp v4f32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002268
2269 //===--------------------------------------------------------------------===//
2270
2271 // Test Data Class SP/DP/QP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002272 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002273 def XSTSTDCSP : XX2_BF3_DCMX7_RS6<60, 298,
2274 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2275 "xststdcsp $BF, $XB, $DCMX", IIC_VecFP, []>;
2276 def XSTSTDCDP : XX2_BF3_DCMX7_RS6<60, 362,
2277 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2278 "xststdcdp $BF, $XB, $DCMX", IIC_VecFP, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002279 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002280 def XSTSTDCQP : X_BF3_DCMX7_RS5 <63, 708,
2281 (outs crrc:$BF), (ins u7imm:$DCMX, vrrc:$vB),
2282 "xststdcqp $BF, $vB, $DCMX", IIC_VecFP, []>;
2283
2284 // Vector Test Data Class SP/DP
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002285 let UseVSXReg = 1 in {
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002286 def XVTSTDCSP : XX2_RD6_DCMX7_RS6<60, 13, 5,
2287 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002288 "xvtstdcsp $XT, $XB, $DCMX", IIC_VecFP,
2289 [(set v4i32: $XT,
2290 (int_ppc_vsx_xvtstdcsp v4f32:$XB, imm:$DCMX))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002291 def XVTSTDCDP : XX2_RD6_DCMX7_RS6<60, 15, 5,
2292 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002293 "xvtstdcdp $XT, $XB, $DCMX", IIC_VecFP,
2294 [(set v2i64: $XT,
2295 (int_ppc_vsx_xvtstdcdp v2f64:$XB, imm:$DCMX))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002296 } // UseVSXReg = 1
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002297
2298 //===--------------------------------------------------------------------===//
2299
2300 // Maximum/Minimum Type-C/Type-J DP
2301 // XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU, so we use vsrc for XT
2302 def XSMAXCDP : XX3_XT5_XA5_XB5<60, 128, "xsmaxcdp", vsrc, vsfrc, vsfrc,
2303 IIC_VecFP, []>;
2304 def XSMAXJDP : XX3_XT5_XA5_XB5<60, 144, "xsmaxjdp", vsrc, vsfrc, vsfrc,
2305 IIC_VecFP, []>;
2306 def XSMINCDP : XX3_XT5_XA5_XB5<60, 136, "xsmincdp", vsrc, vsfrc, vsfrc,
2307 IIC_VecFP, []>;
2308 def XSMINJDP : XX3_XT5_XA5_XB5<60, 152, "xsminjdp", vsrc, vsfrc, vsfrc,
2309 IIC_VecFP, []>;
2310
2311 //===--------------------------------------------------------------------===//
2312
2313 // Vector Byte-Reverse H/W/D/Q Word
2314 def XXBRH : XX2_XT6_XO5_XB6<60, 7, 475, "xxbrh", vsrc, []>;
2315 def XXBRW : XX2_XT6_XO5_XB6<60, 15, 475, "xxbrw", vsrc, []>;
2316 def XXBRD : XX2_XT6_XO5_XB6<60, 23, 475, "xxbrd", vsrc, []>;
2317 def XXBRQ : XX2_XT6_XO5_XB6<60, 31, 475, "xxbrq", vsrc, []>;
2318
2319 // Vector Permute
2320 def XXPERM : XX3_XT5_XA5_XB5<60, 26, "xxperm" , vsrc, vsrc, vsrc,
2321 IIC_VecPerm, []>;
2322 def XXPERMR : XX3_XT5_XA5_XB5<60, 58, "xxpermr", vsrc, vsrc, vsrc,
2323 IIC_VecPerm, []>;
2324
2325 // Vector Splat Immediate Byte
2326 def XXSPLTIB : X_RD6_IMM8<60, 360, (outs vsrc:$XT), (ins u8imm:$IMM8),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002327 "xxspltib $XT, $IMM8", IIC_VecPerm, []>, UseVSXReg;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002328
2329 //===--------------------------------------------------------------------===//
Kit Bartonba532dc2016-03-08 03:49:13 +00002330 // Vector/Scalar Load/Store Instructions
2331
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002332 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2333 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Kit Bartonba532dc2016-03-08 03:49:13 +00002334 let mayLoad = 1 in {
2335 // Load Vector
2336 def LXV : DQ_RD6_RS5_DQ12<61, 1, (outs vsrc:$XT), (ins memrix16:$src),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002337 "lxv $XT, $src", IIC_LdStLFD, []>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002338 // Load DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002339 def LXSD : DSForm_1<57, 2, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002340 "lxsd $vD, $src", IIC_LdStLFD, []>;
2341 // Load SP from src, convert it to DP, and place in dword[0]
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002342 def LXSSP : DSForm_1<57, 3, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002343 "lxssp $vD, $src", IIC_LdStLFD, []>;
2344
2345 // [PO T RA RB XO TX] almost equal to [PO S RA RB XO SX], but has different
2346 // "out" and "in" dag
2347 class X_XT6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2348 RegisterOperand vtype, list<dag> pattern>
2349 : XX1Form<opcode, xo, (outs vtype:$XT), (ins memrr:$src),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002350 !strconcat(opc, " $XT, $src"), IIC_LdStLFD, pattern>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002351
2352 // Load as Integer Byte/Halfword & Zero Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002353 def LXSIBZX : X_XT6_RA5_RB5<31, 781, "lxsibzx", vsfrc,
2354 [(set f64:$XT, (PPClxsizx xoaddr:$src, 1))]>;
2355 def LXSIHZX : X_XT6_RA5_RB5<31, 813, "lxsihzx", vsfrc,
2356 [(set f64:$XT, (PPClxsizx xoaddr:$src, 2))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002357
2358 // Load Vector Halfword*8/Byte*16 Indexed
2359 def LXVH8X : X_XT6_RA5_RB5<31, 812, "lxvh8x" , vsrc, []>;
2360 def LXVB16X : X_XT6_RA5_RB5<31, 876, "lxvb16x", vsrc, []>;
2361
2362 // Load Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002363 def LXVX : X_XT6_RA5_RB5<31, 268, "lxvx" , vsrc,
2364 [(set v2f64:$XT, (load xoaddr:$src))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002365
2366 // Load Vector (Left-justified) with Length
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002367 def LXVL : XX1Form<31, 269, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
2368 "lxvl $XT, $src, $rB", IIC_LdStLoad,
2369 [(set v4i32:$XT, (int_ppc_vsx_lxvl addr:$src, i64:$rB))]>,
2370 UseVSXReg;
2371 def LXVLL : XX1Form<31,301, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
2372 "lxvll $XT, $src, $rB", IIC_LdStLoad,
2373 [(set v4i32:$XT, (int_ppc_vsx_lxvll addr:$src, i64:$rB))]>,
2374 UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002375
2376 // Load Vector Word & Splat Indexed
2377 def LXVWSX : X_XT6_RA5_RB5<31, 364, "lxvwsx" , vsrc, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002378 } // mayLoad
Kit Bartonba532dc2016-03-08 03:49:13 +00002379
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002380 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2381 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Kit Bartonba532dc2016-03-08 03:49:13 +00002382 let mayStore = 1 in {
2383 // Store Vector
2384 def STXV : DQ_RD6_RS5_DQ12<61, 5, (outs), (ins vsrc:$XT, memrix16:$dst),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002385 "stxv $XT, $dst", IIC_LdStSTFD, []>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002386 // Store DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002387 def STXSD : DSForm_1<61, 2, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002388 "stxsd $vS, $dst", IIC_LdStSTFD, []>;
2389 // Convert DP of dword[0] to SP, and Store to dst
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002390 def STXSSP : DSForm_1<61, 3, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002391 "stxssp $vS, $dst", IIC_LdStSTFD, []>;
2392
2393 // [PO S RA RB XO SX]
2394 class X_XS6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2395 RegisterOperand vtype, list<dag> pattern>
2396 : XX1Form<opcode, xo, (outs), (ins vtype:$XT, memrr:$dst),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002397 !strconcat(opc, " $XT, $dst"), IIC_LdStSTFD, pattern>, UseVSXReg;
Kit Bartonba532dc2016-03-08 03:49:13 +00002398
2399 // Store as Integer Byte/Halfword Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002400 def STXSIBX : X_XS6_RA5_RB5<31, 909, "stxsibx" , vsfrc,
2401 [(PPCstxsix f64:$XT, xoaddr:$dst, 1)]>;
2402 def STXSIHX : X_XS6_RA5_RB5<31, 941, "stxsihx" , vsfrc,
2403 [(PPCstxsix f64:$XT, xoaddr:$dst, 2)]>;
2404 let isCodeGenOnly = 1 in {
2405 def STXSIBXv : X_XS6_RA5_RB5<31, 909, "stxsibx" , vrrc, []>;
2406 def STXSIHXv : X_XS6_RA5_RB5<31, 941, "stxsihx" , vrrc, []>;
2407 }
Kit Bartonba532dc2016-03-08 03:49:13 +00002408
2409 // Store Vector Halfword*8/Byte*16 Indexed
2410 def STXVH8X : X_XS6_RA5_RB5<31, 940, "stxvh8x" , vsrc, []>;
2411 def STXVB16X : X_XS6_RA5_RB5<31, 1004, "stxvb16x", vsrc, []>;
2412
2413 // Store Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002414 def STXVX : X_XS6_RA5_RB5<31, 396, "stxvx" , vsrc,
2415 [(store v2f64:$XT, xoaddr:$dst)]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002416
2417 // Store Vector (Left-justified) with Length
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002418 def STXVL : XX1Form<31, 397, (outs), (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2419 "stxvl $XT, $dst, $rB", IIC_LdStLoad,
2420 [(int_ppc_vsx_stxvl v4i32:$XT, addr:$dst, i64:$rB)]>,
2421 UseVSXReg;
2422 def STXVLL : XX1Form<31, 429, (outs), (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2423 "stxvll $XT, $dst, $rB", IIC_LdStLoad,
2424 [(int_ppc_vsx_stxvll v4i32:$XT, addr:$dst, i64:$rB)]>,
2425 UseVSXReg;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002426 } // mayStore
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002427
2428 // Patterns for which instructions from ISA 3.0 are a better match
2429 let Predicates = [IsLittleEndian, HasP9Vector] in {
2430 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 0))))),
2431 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
2432 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 1))))),
2433 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
2434 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 2))))),
2435 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
2436 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 3))))),
2437 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
2438 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
2439 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
2440 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
2441 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
2442 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
2443 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
2444 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
2445 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
2446 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
2447 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
2448 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
2449 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
2450 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
2451 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
2452 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
2453 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
2454 } // IsLittleEndian, HasP9Vector
2455
2456 let Predicates = [IsBigEndian, HasP9Vector] in {
2457 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 0))))),
2458 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
2459 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 1))))),
2460 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
2461 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 2))))),
2462 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
2463 def : Pat<(f32 (PPCfcfidus (PPCmtvsrz (i32 (extractelt v4i32:$A, 3))))),
2464 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
2465 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
2466 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
2467 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
2468 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
2469 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
2470 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
2471 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
2472 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
2473 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
2474 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
2475 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
2476 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
2477 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
2478 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
2479 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
2480 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
2481 } // IsLittleEndian, HasP9Vector
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002482
2483 def : Pat<(v2f64 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2484 def : Pat<(v2i64 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2485 def : Pat<(v4f32 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2486 def : Pat<(v4i32 (load xoaddr:$src)), (LXVX xoaddr:$src)>;
2487 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x xoaddr:$src)), (LXVX xoaddr:$src)>;
2488 def : Pat<(v2f64 (int_ppc_vsx_lxvd2x xoaddr:$src)), (LXVX xoaddr:$src)>;
2489 def : Pat<(store v2f64:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2490 def : Pat<(store v2i64:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2491 def : Pat<(store v4f32:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2492 def : Pat<(store v4i32:$rS, xoaddr:$dst), (STXVX $rS, xoaddr:$dst)>;
2493 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
2494 (STXVX $rS, xoaddr:$dst)>;
2495 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
2496 (STXVX $rS, xoaddr:$dst)>;
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002497
2498 def : Pat<(v4i32 (scalar_to_vector (i32 (load xoaddr:$src)))),
2499 (v4i32 (LXVWSX xoaddr:$src))>;
2500 def : Pat<(v4f32 (scalar_to_vector (f32 (load xoaddr:$src)))),
2501 (v4f32 (LXVWSX xoaddr:$src))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002502 def : Pat<(v4f32 (scalar_to_vector (f32 (fpround (extloadf32 xoaddr:$src))))),
2503 (v4f32 (LXVWSX xoaddr:$src))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002504
2505 // Build vectors from i8 loads
2506 def : Pat<(v16i8 (scalar_to_vector ScalarLoads.Li8)),
2507 (v16i8 (VSPLTBs 7, (LXSIBZX xoaddr:$src)))>;
2508 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.ZELi8)),
2509 (v8i16 (VSPLTHs 3, (LXSIBZX xoaddr:$src)))>;
2510 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi8)),
2511 (v4i32 (XXSPLTWs (LXSIBZX xoaddr:$src), 1))>;
2512 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi8i64)),
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +00002513 (v2i64 (XXSPLTD0s (LXSIBZX xoaddr:$src)))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002514 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi8)),
2515 (v4i32 (XXSPLTWs (VEXTSB2Ws (LXSIBZX xoaddr:$src)), 1))>;
2516 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi8i64)),
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +00002517 (v2i64 (XXSPLTD0s (VEXTSB2Ds (LXSIBZX xoaddr:$src))))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002518
2519 // Build vectors from i16 loads
2520 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.Li16)),
2521 (v8i16 (VSPLTHs 3, (LXSIHZX xoaddr:$src)))>;
2522 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi16)),
2523 (v4i32 (XXSPLTWs (LXSIHZX xoaddr:$src), 1))>;
2524 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi16i64)),
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +00002525 (v2i64 (XXSPLTD0s (LXSIHZX xoaddr:$src)))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002526 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi16)),
2527 (v4i32 (XXSPLTWs (VEXTSH2Ws (LXSIHZX xoaddr:$src)), 1))>;
2528 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi16i64)),
Nemanja Ivanovic10fc3cf2016-11-23 15:51:52 +00002529 (v2i64 (XXSPLTD0s (VEXTSH2Ds (LXSIHZX xoaddr:$src))))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002530
2531 let Predicates = [IsBigEndian, HasP9Vector] in {
2532 // Scalar stores of i8
2533 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
2534 (STXSIBXv (VSLDOI $S, $S, 9), xoaddr:$dst)>;
2535 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
2536 (STXSIBXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2537 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
2538 (STXSIBXv (VSLDOI $S, $S, 11), xoaddr:$dst)>;
2539 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
2540 (STXSIBXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2541 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
2542 (STXSIBXv (VSLDOI $S, $S, 13), xoaddr:$dst)>;
2543 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
2544 (STXSIBXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2545 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
2546 (STXSIBXv (VSLDOI $S, $S, 15), xoaddr:$dst)>;
2547 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
2548 (STXSIBXv $S, xoaddr:$dst)>;
2549 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
2550 (STXSIBXv (VSLDOI $S, $S, 1), xoaddr:$dst)>;
2551 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
2552 (STXSIBXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2553 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
2554 (STXSIBXv (VSLDOI $S, $S, 3), xoaddr:$dst)>;
2555 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
2556 (STXSIBXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2557 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
2558 (STXSIBXv (VSLDOI $S, $S, 5), xoaddr:$dst)>;
2559 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
2560 (STXSIBXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2561 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
2562 (STXSIBXv (VSLDOI $S, $S, 7), xoaddr:$dst)>;
2563 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
2564 (STXSIBXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2565
2566 // Scalar stores of i16
2567 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
2568 (STXSIHXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2569 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
2570 (STXSIHXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2571 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
2572 (STXSIHXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2573 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
2574 (STXSIHXv $S, xoaddr:$dst)>;
2575 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
2576 (STXSIHXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2577 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
2578 (STXSIHXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2579 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
2580 (STXSIHXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2581 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
2582 (STXSIHXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2583 } // IsBigEndian, HasP9Vector
2584
2585 let Predicates = [IsLittleEndian, HasP9Vector] in {
2586 // Scalar stores of i8
2587 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
2588 (STXSIBXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2589 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
2590 (STXSIBXv (VSLDOI $S, $S, 7), xoaddr:$dst)>;
2591 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
2592 (STXSIBXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2593 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
2594 (STXSIBXv (VSLDOI $S, $S, 5), xoaddr:$dst)>;
2595 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
2596 (STXSIBXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2597 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
2598 (STXSIBXv (VSLDOI $S, $S, 3), xoaddr:$dst)>;
2599 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
2600 (STXSIBXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2601 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
2602 (STXSIBXv (VSLDOI $S, $S, 1), xoaddr:$dst)>;
2603 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
2604 (STXSIBXv $S, xoaddr:$dst)>;
2605 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
2606 (STXSIBXv (VSLDOI $S, $S, 15), xoaddr:$dst)>;
2607 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
2608 (STXSIBXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2609 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
2610 (STXSIBXv (VSLDOI $S, $S, 13), xoaddr:$dst)>;
2611 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
2612 (STXSIBXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2613 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
2614 (STXSIBXv (VSLDOI $S, $S, 11), xoaddr:$dst)>;
2615 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
2616 (STXSIBXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2617 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
2618 (STXSIBXv (VSLDOI $S, $S, 9), xoaddr:$dst)>;
2619
2620 // Scalar stores of i16
2621 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
2622 (STXSIHXv (VSLDOI $S, $S, 8), xoaddr:$dst)>;
2623 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
2624 (STXSIHXv (VSLDOI $S, $S, 6), xoaddr:$dst)>;
2625 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
2626 (STXSIHXv (VSLDOI $S, $S, 4), xoaddr:$dst)>;
2627 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
2628 (STXSIHXv (VSLDOI $S, $S, 2), xoaddr:$dst)>;
2629 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
2630 (STXSIHXv $S, xoaddr:$dst)>;
2631 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
2632 (STXSIHXv (VSLDOI $S, $S, 14), xoaddr:$dst)>;
2633 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
2634 (STXSIHXv (VSLDOI $S, $S, 12), xoaddr:$dst)>;
2635 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
2636 (STXSIHXv (VSLDOI $S, $S, 10), xoaddr:$dst)>;
2637 } // IsLittleEndian, HasP9Vector
2638
2639 // Vector sign extensions
2640 def : Pat<(f64 (PPCVexts f64:$A, 1)),
2641 (f64 (COPY_TO_REGCLASS (VEXTSB2Ds $A), VSFRC))>;
2642 def : Pat<(f64 (PPCVexts f64:$A, 2)),
2643 (f64 (COPY_TO_REGCLASS (VEXTSH2Ds $A), VSFRC))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002644
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002645 let isPseudo = 1 in {
2646 def DFLOADf32 : Pseudo<(outs vssrc:$XT), (ins memrix:$src),
2647 "#DFLOADf32",
2648 [(set f32:$XT, (load iaddr:$src))]>;
2649 def DFLOADf64 : Pseudo<(outs vsfrc:$XT), (ins memrix:$src),
2650 "#DFLOADf64",
2651 [(set f64:$XT, (load iaddr:$src))]>;
2652 def DFSTOREf32 : Pseudo<(outs), (ins vssrc:$XT, memrix:$dst),
2653 "#DFSTOREf32",
2654 [(store f32:$XT, iaddr:$dst)]>;
2655 def DFSTOREf64 : Pseudo<(outs), (ins vsfrc:$XT, memrix:$dst),
2656 "#DFSTOREf64",
2657 [(store f64:$XT, iaddr:$dst)]>;
2658 }
2659 def : Pat<(f64 (extloadf32 iaddr:$src)),
2660 (COPY_TO_REGCLASS (DFLOADf32 iaddr:$src), VSFRC)>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002661 def : Pat<(f32 (fpround (extloadf32 iaddr:$src))),
2662 (f32 (DFLOADf32 iaddr:$src))>;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002663} // end HasP9Vector, AddedComplexity
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002664
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002665// Integer extend helper dags 32 -> 64
2666def AnyExts {
2667 dag A = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32);
2668 dag B = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $B, sub_32);
2669 dag C = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $C, sub_32);
2670 dag D = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $D, sub_32);
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002671}
2672
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002673def DblToFlt {
2674 dag A0 = (f32 (fpround (f64 (extractelt v2f64:$A, 0))));
2675 dag A1 = (f32 (fpround (f64 (extractelt v2f64:$A, 1))));
2676 dag B0 = (f32 (fpround (f64 (extractelt v2f64:$B, 0))));
2677 dag B1 = (f32 (fpround (f64 (extractelt v2f64:$B, 1))));
2678}
2679def FltToIntLoad {
2680 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (extloadf32 xoaddr:$A)))));
2681}
2682def FltToUIntLoad {
2683 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (extloadf32 xoaddr:$A)))));
2684}
2685def FltToLongLoad {
2686 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (extloadf32 xoaddr:$A)))));
2687}
2688def FltToULongLoad {
2689 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (extloadf32 xoaddr:$A)))));
2690}
2691def FltToLong {
2692 dag A = (i64 (PPCmfvsr (PPCfctidz (fpextend f32:$A))));
2693}
2694def FltToULong {
2695 dag A = (i64 (PPCmfvsr (PPCfctiduz (fpextend f32:$A))));
2696}
2697def DblToInt {
2698 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwz f64:$A))));
2699}
2700def DblToUInt {
2701 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwuz f64:$A))));
2702}
2703def DblToLong {
2704 dag A = (i64 (PPCmfvsr (f64 (PPCfctidz f64:$A))));
2705}
2706def DblToULong {
2707 dag A = (i64 (PPCmfvsr (f64 (PPCfctiduz f64:$A))));
2708}
2709def DblToIntLoad {
2710 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (load xoaddr:$A)))));
2711}
2712def DblToUIntLoad {
2713 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (load xoaddr:$A)))));
2714}
2715def DblToLongLoad {
2716 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (load xoaddr:$A)))));
2717}
2718def DblToULongLoad {
2719 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (load xoaddr:$A)))));
2720}
2721
2722// FP merge dags (for f32 -> v4f32)
2723def MrgFP {
2724 dag AC = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $A, VSRC),
2725 (COPY_TO_REGCLASS $C, VSRC), 0));
2726 dag BD = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $B, VSRC),
2727 (COPY_TO_REGCLASS $D, VSRC), 0));
2728 dag ABhToFlt = (XVCVDPSP (XXPERMDI $A, $B, 0));
2729 dag ABlToFlt = (XVCVDPSP (XXPERMDI $A, $B, 3));
2730 dag BAhToFlt = (XVCVDPSP (XXPERMDI $B, $A, 0));
2731 dag BAlToFlt = (XVCVDPSP (XXPERMDI $B, $A, 3));
2732}
2733
2734// Patterns for BUILD_VECTOR nodes.
2735def NoP9Vector : Predicate<"!PPCSubTarget->hasP9Vector()">;
2736let AddedComplexity = 400 in {
2737
2738 let Predicates = [HasVSX] in {
2739 // Build vectors of floating point converted to i32.
2740 def : Pat<(v4i32 (build_vector DblToInt.A, DblToInt.A,
2741 DblToInt.A, DblToInt.A)),
2742 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPSXWS $A), VSRC), 1))>;
2743 def : Pat<(v4i32 (build_vector DblToUInt.A, DblToUInt.A,
2744 DblToUInt.A, DblToUInt.A)),
2745 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPUXWS $A), VSRC), 1))>;
2746 def : Pat<(v2i64 (build_vector DblToLong.A, DblToLong.A)),
2747 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC),
2748 (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC), 0))>;
2749 def : Pat<(v2i64 (build_vector DblToULong.A, DblToULong.A)),
2750 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC),
2751 (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC), 0))>;
2752 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
2753 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2754 (XSCVDPSXWSs (LXSSPX xoaddr:$A)), VSRC), 1))>;
2755 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
2756 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2757 (XSCVDPUXWSs (LXSSPX xoaddr:$A)), VSRC), 1))>;
2758 def : Pat<(v4f32 (build_vector f32:$A, f32:$A, f32:$A, f32:$A)),
2759 (v4f32 (XXSPLTW (v4f32 (XSCVDPSPN $A)), 0))>;
2760
2761 // Build vectors of floating point converted to i64.
2762 def : Pat<(v2i64 (build_vector FltToLong.A, FltToLong.A)),
2763 (v2i64 (XXPERMDIs (COPY_TO_REGCLASS (XSCVDPSXDSs $A), VSFRC), 0))>;
2764 def : Pat<(v2i64 (build_vector FltToULong.A, FltToULong.A)),
2765 (v2i64 (XXPERMDIs (COPY_TO_REGCLASS (XSCVDPUXDSs $A), VSFRC), 0))>;
2766 def : Pat<(v2i64 (scalar_to_vector DblToLongLoad.A)),
2767 (v2i64 (XVCVDPSXDS (LXVDSX xoaddr:$A)))>;
2768 def : Pat<(v2i64 (scalar_to_vector DblToULongLoad.A)),
2769 (v2i64 (XVCVDPUXDS (LXVDSX xoaddr:$A)))>;
2770 }
2771
2772 let Predicates = [HasVSX, NoP9Vector] in {
2773 // Load-and-splat with fp-to-int conversion (using X-Form VSX loads).
2774 def : Pat<(v4i32 (scalar_to_vector DblToIntLoad.A)),
2775 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2776 (XSCVDPSXWS (LXSDX xoaddr:$A)), VSRC), 1))>;
2777 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoad.A)),
2778 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2779 (XSCVDPUXWS (LXSDX xoaddr:$A)), VSRC), 1))>;
2780 def : Pat<(v2i64 (scalar_to_vector FltToLongLoad.A)),
2781 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
2782 (LXSSPX xoaddr:$A), VSFRC)), 0))>;
2783 def : Pat<(v2i64 (scalar_to_vector FltToULongLoad.A)),
2784 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
2785 (LXSSPX xoaddr:$A), VSFRC)), 0))>;
2786 }
2787
2788 // Big endian, available on all targets with VSX
2789 let Predicates = [IsBigEndian, HasVSX] in {
2790 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
2791 (v2f64 (XXPERMDI
2792 (COPY_TO_REGCLASS $A, VSRC),
2793 (COPY_TO_REGCLASS $B, VSRC), 0))>;
2794
2795 def : Pat<(v4f32 (build_vector f32:$A, f32:$B, f32:$C, f32:$D)),
2796 (VMRGEW MrgFP.AC, MrgFP.BD)>;
2797 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
2798 DblToFlt.B0, DblToFlt.B1)),
2799 (v4f32 (VMRGEW MrgFP.ABhToFlt, MrgFP.ABlToFlt))>;
2800 }
2801
2802 let Predicates = [IsLittleEndian, HasVSX] in {
2803 // Little endian, available on all targets with VSX
2804 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
2805 (v2f64 (XXPERMDI
2806 (COPY_TO_REGCLASS $B, VSRC),
2807 (COPY_TO_REGCLASS $A, VSRC), 0))>;
2808
2809 def : Pat<(v4f32 (build_vector f32:$D, f32:$C, f32:$B, f32:$A)),
2810 (VMRGEW MrgFP.AC, MrgFP.BD)>;
2811 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
2812 DblToFlt.B0, DblToFlt.B1)),
2813 (v4f32 (VMRGEW MrgFP.BAhToFlt, MrgFP.BAlToFlt))>;
2814 }
2815
2816 let Predicates = [HasDirectMove] in {
2817 // Endianness-neutral constant splat on P8 and newer targets. The reason
2818 // for this pattern is that on targets with direct moves, we don't expand
2819 // BUILD_VECTOR nodes for v4i32.
2820 def : Pat<(v4i32 (build_vector immSExt5NonZero:$A, immSExt5NonZero:$A,
2821 immSExt5NonZero:$A, immSExt5NonZero:$A)),
2822 (v4i32 (VSPLTISW imm:$A))>;
2823 }
2824
2825 let Predicates = [IsBigEndian, HasDirectMove, NoP9Vector] in {
2826 // Big endian integer vectors using direct moves.
2827 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
2828 (v2i64 (XXPERMDI
2829 (COPY_TO_REGCLASS (MTVSRD $A), VSRC),
2830 (COPY_TO_REGCLASS (MTVSRD $B), VSRC), 0))>;
2831 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2832 (VMRGOW (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC),
2833 (COPY_TO_REGCLASS (MTVSRWZ $C), VSRC), 0),
2834 (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC),
2835 (COPY_TO_REGCLASS (MTVSRWZ $D), VSRC), 0))>;
2836 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
2837 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
2838 }
2839
2840 let Predicates = [IsLittleEndian, HasDirectMove, NoP9Vector] in {
2841 // Little endian integer vectors using direct moves.
2842 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
2843 (v2i64 (XXPERMDI
2844 (COPY_TO_REGCLASS (MTVSRD $B), VSRC),
2845 (COPY_TO_REGCLASS (MTVSRD $A), VSRC), 0))>;
2846 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2847 (VMRGOW (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $D), VSRC),
2848 (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC), 0),
2849 (XXPERMDI (COPY_TO_REGCLASS (MTVSRWZ $C), VSRC),
2850 (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 0))>;
2851 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
2852 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
2853 }
2854
2855 let Predicates = [HasP9Vector] in {
2856 // Endianness-neutral patterns for const splats with ISA 3.0 instructions.
2857 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
2858 (v4i32 (MTVSRWS $A))>;
2859 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
2860 (v4i32 (MTVSRWS $A))>;
2861 def : Pat<(v16i8 (build_vector immSExt8:$A, immSExt8:$A, immSExt8:$A,
2862 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2863 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2864 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2865 immSExt8:$A, immSExt8:$A, immSExt8:$A,
2866 immSExt8:$A)),
2867 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB imm:$A), VSRC))>;
2868 def : Pat<(v16i8 immAllOnesV),
2869 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
2870 def : Pat<(v8i16 immAllOnesV),
2871 (v8i16 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
2872 def : Pat<(v4i32 immAllOnesV),
2873 (v4i32 (XXSPLTIB 255))>;
2874 def : Pat<(v2i64 immAllOnesV),
2875 (v2i64 (XXSPLTIB 255))>;
2876 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
2877 (v4i32 (XVCVSPSXWS (LXVWSX xoaddr:$A)))>;
2878 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
2879 (v4i32 (XVCVSPUXWS (LXVWSX xoaddr:$A)))>;
2880 def : Pat<(v4i32 (scalar_to_vector DblToIntLoad.A)),
2881 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2882 (XSCVDPSXWS (DFLOADf64 iaddr:$A)), VSRC), 1))>;
2883 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoad.A)),
2884 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
2885 (XSCVDPUXWS (DFLOADf64 iaddr:$A)), VSRC), 1))>;
2886 def : Pat<(v2i64 (scalar_to_vector FltToLongLoad.A)),
2887 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
2888 (DFLOADf32 iaddr:$A),
2889 VSFRC)), 0))>;
2890 def : Pat<(v2i64 (scalar_to_vector FltToULongLoad.A)),
2891 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
2892 (DFLOADf32 iaddr:$A),
2893 VSFRC)), 0))>;
2894 }
2895
2896 let Predicates = [IsISA3_0, HasDirectMove, IsBigEndian] in {
2897 def : Pat<(i64 (extractelt v2i64:$A, 1)),
2898 (i64 (MFVSRLD $A))>;
2899 // Better way to build integer vectors if we have MTVSRDD. Big endian.
2900 def : Pat<(v2i64 (build_vector i64:$rB, i64:$rA)),
2901 (v2i64 (MTVSRDD $rB, $rA))>;
2902 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2903 (VMRGOW (COPY_TO_REGCLASS (MTVSRDD AnyExts.A, AnyExts.C), VSRC),
2904 (COPY_TO_REGCLASS (MTVSRDD AnyExts.B, AnyExts.D), VSRC))>;
2905 }
2906
2907 let Predicates = [IsISA3_0, HasDirectMove, IsLittleEndian] in {
2908 def : Pat<(i64 (extractelt v2i64:$A, 0)),
2909 (i64 (MFVSRLD $A))>;
2910 // Better way to build integer vectors if we have MTVSRDD. Little endian.
2911 def : Pat<(v2i64 (build_vector i64:$rA, i64:$rB)),
2912 (v2i64 (MTVSRDD $rB, $rA))>;
2913 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
2914 (VMRGOW (COPY_TO_REGCLASS (MTVSRDD AnyExts.D, AnyExts.B), VSRC),
2915 (COPY_TO_REGCLASS (MTVSRDD AnyExts.C, AnyExts.A), VSRC))>;
2916 }
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00002917}