blob: d874f30c7e8a2d3b4106efd8bb131f30c72cc3a1 [file] [log] [blame]
Hal Finkel27774d92014-03-13 07:58:58 +00001//===- PPCInstrVSX.td - The PowerPC VSX Extension --*- tablegen -*-===//
2//
Chandler Carruth2946cd72019-01-19 08:50:56 +00003// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Hal Finkel27774d92014-03-13 07:58:58 +00006//
7//===----------------------------------------------------------------------===//
8//
9// This file describes the VSX extension to the PowerPC instruction set.
10//
11//===----------------------------------------------------------------------===//
12
Bill Schmidtfe723b92015-04-27 19:57:34 +000013// *********************************** NOTE ***********************************
14// ** For POWER8 Little Endian, the VSX swap optimization relies on knowing **
15// ** which VMX and VSX instructions are lane-sensitive and which are not. **
16// ** A lane-sensitive instruction relies, implicitly or explicitly, on **
17// ** whether lanes are numbered from left to right. An instruction like **
18// ** VADDFP is not lane-sensitive, because each lane of the result vector **
19// ** relies only on the corresponding lane of the source vectors. However, **
20// ** an instruction like VMULESB is lane-sensitive, because "even" and **
21// ** "odd" lanes are different for big-endian and little-endian numbering. **
22// ** **
23// ** When adding new VMX and VSX instructions, please consider whether they **
24// ** are lane-sensitive. If so, they must be added to a switch statement **
25// ** in PPCVSXSwapRemoval::gatherVectorInstructions(). **
26// ****************************************************************************
27
Hal Finkel27774d92014-03-13 07:58:58 +000028def PPCRegVSRCAsmOperand : AsmOperandClass {
29 let Name = "RegVSRC"; let PredicateMethod = "isVSRegNumber";
30}
31def vsrc : RegisterOperand<VSRC> {
32 let ParserMatchClass = PPCRegVSRCAsmOperand;
33}
34
Hal Finkel19be5062014-03-29 05:29:01 +000035def PPCRegVSFRCAsmOperand : AsmOperandClass {
36 let Name = "RegVSFRC"; let PredicateMethod = "isVSRegNumber";
37}
38def vsfrc : RegisterOperand<VSFRC> {
39 let ParserMatchClass = PPCRegVSFRCAsmOperand;
40}
41
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +000042def PPCRegVSSRCAsmOperand : AsmOperandClass {
43 let Name = "RegVSSRC"; let PredicateMethod = "isVSRegNumber";
44}
45def vssrc : RegisterOperand<VSSRC> {
46 let ParserMatchClass = PPCRegVSSRCAsmOperand;
47}
48
Zaara Syedafcd96972017-09-21 16:12:33 +000049def PPCRegSPILLTOVSRRCAsmOperand : AsmOperandClass {
50 let Name = "RegSPILLTOVSRRC"; let PredicateMethod = "isVSRegNumber";
51}
52
53def spilltovsrrc : RegisterOperand<SPILLTOVSRRC> {
54 let ParserMatchClass = PPCRegSPILLTOVSRRCAsmOperand;
55}
Bill Schmidtfae5d712014-12-09 16:35:51 +000056// Little-endian-specific nodes.
57def SDT_PPClxvd2x : SDTypeProfile<1, 1, [
58 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
59]>;
60def SDT_PPCstxvd2x : SDTypeProfile<0, 2, [
61 SDTCisVT<0, v2f64>, SDTCisPtrTy<1>
62]>;
63def SDT_PPCxxswapd : SDTypeProfile<1, 1, [
64 SDTCisSameAs<0, 1>
65]>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000066def SDTVecConv : SDTypeProfile<1, 2, [
67 SDTCisVec<0>, SDTCisVec<1>, SDTCisPtrTy<2>
68]>;
Kewen Lin3dac12522018-12-18 03:16:43 +000069def SDTVabsd : SDTypeProfile<1, 3, [
70 SDTCisVec<0>, SDTCisSameAs<0, 1>, SDTCisSameAs<0, 2>, SDTCisVT<3, i32>
71]>;
72
Bill Schmidtfae5d712014-12-09 16:35:51 +000073
74def PPClxvd2x : SDNode<"PPCISD::LXVD2X", SDT_PPClxvd2x,
Sean Fertile3c8c3852017-01-26 18:59:15 +000075 [SDNPHasChain, SDNPMayLoad, SDNPMemOperand]>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000076def PPCstxvd2x : SDNode<"PPCISD::STXVD2X", SDT_PPCstxvd2x,
77 [SDNPHasChain, SDNPMayStore]>;
78def PPCxxswapd : SDNode<"PPCISD::XXSWAPD", SDT_PPCxxswapd, [SDNPHasChain]>;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +000079def PPCmfvsr : SDNode<"PPCISD::MFVSR", SDTUnaryOp, []>;
80def PPCmtvsra : SDNode<"PPCISD::MTVSRA", SDTUnaryOp, []>;
81def PPCmtvsrz : SDNode<"PPCISD::MTVSRZ", SDTUnaryOp, []>;
Nemanja Ivanovic44513e52016-07-05 09:22:29 +000082def PPCsvec2fp : SDNode<"PPCISD::SINT_VEC_TO_FP", SDTVecConv, []>;
83def PPCuvec2fp: SDNode<"PPCISD::UINT_VEC_TO_FP", SDTVecConv, []>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +000084def PPCswapNoChain : SDNode<"PPCISD::SWAP_NO_CHAIN", SDT_PPCxxswapd>;
Kewen Lin3dac12522018-12-18 03:16:43 +000085def PPCvabsd : SDNode<"PPCISD::VABSD", SDTVabsd, []>;
Bill Schmidtfae5d712014-12-09 16:35:51 +000086
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000087multiclass XX3Form_Rcr<bits<6> opcode, bits<7> xo, string asmbase,
88 string asmstr, InstrItinClass itin, Intrinsic Int,
89 ValueType OutTy, ValueType InTy> {
Hal Finkel27774d92014-03-13 07:58:58 +000090 let BaseName = asmbase in {
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000091 def NAME : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000092 !strconcat(asmbase, !strconcat(" ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000093 [(set OutTy:$XT, (Int InTy:$XA, InTy:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +000094 let Defs = [CR6] in
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000095 def o : XX3Form_Rc<opcode, xo, (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +000096 !strconcat(asmbase, !strconcat(". ", asmstr)), itin,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +000097 [(set InTy:$XT,
98 (InTy (PPCvcmp_o InTy:$XA, InTy:$XB, xo)))]>,
99 isDOT;
Hal Finkel27774d92014-03-13 07:58:58 +0000100 }
101}
102
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000103// Instruction form with a single input register for instructions such as
104// XXPERMDI. The reason for defining this is that specifying multiple chained
105// operands (such as loads) to an instruction will perform both chained
106// operations rather than coalescing them into a single register - even though
107// the source memory location is the same. This simply forces the instruction
108// to use the same register for both inputs.
109// For example, an output DAG such as this:
110// (XXPERMDI (LXSIBZX xoaddr:$src), (LXSIBZX xoaddr:$src ), 0))
111// would result in two load instructions emitted and used as separate inputs
112// to the XXPERMDI instruction.
113class XX3Form_2s<bits<6> opcode, bits<5> xo, dag OOL, dag IOL, string asmstr,
114 InstrItinClass itin, list<dag> pattern>
115 : XX3Form_2<opcode, xo, OOL, IOL, asmstr, itin, pattern> {
116 let XB = XA;
117}
118
Eric Christopher1b8e7632014-05-22 01:07:24 +0000119def HasVSX : Predicate<"PPCSubTarget->hasVSX()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000120def IsLittleEndian : Predicate<"PPCSubTarget->isLittleEndian()">;
121def IsBigEndian : Predicate<"!PPCSubTarget->isLittleEndian()">;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000122def HasOnlySwappingMemOps : Predicate<"!PPCSubTarget->hasP9Vector()">;
Bill Schmidtfae5d712014-12-09 16:35:51 +0000123
Hal Finkel27774d92014-03-13 07:58:58 +0000124let Predicates = [HasVSX] in {
125let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Craig Topperc50d64b2014-11-26 00:46:26 +0000126let hasSideEffects = 0 in { // VSX instructions don't have side effects.
Hal Finkel27774d92014-03-13 07:58:58 +0000127let Uses = [RM] in {
128
129 // Load indexed instructions
Sean Fertile3c8c3852017-01-26 18:59:15 +0000130 let mayLoad = 1, mayStore = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000131 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000132 def LXSDX : XX1Form_memOp<31, 588,
Hal Finkel19be5062014-03-29 05:29:01 +0000133 (outs vsfrc:$XT), (ins memrr:$src),
Hal Finkel27774d92014-03-13 07:58:58 +0000134 "lxsdx $XT, $src", IIC_LdStLFD,
Lei Huangf4ec6782018-05-24 03:20:28 +0000135 []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000136
Tony Jiang438bf4a2017-11-20 14:38:30 +0000137 // Pseudo instruction XFLOADf64 will be expanded to LXSDX or LFDX later
Jinsong Jic7b43b92018-12-13 15:12:57 +0000138 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000139 def XFLOADf64 : PseudoXFormMemOp<(outs vsfrc:$XT), (ins memrr:$src),
Tony Jiang438bf4a2017-11-20 14:38:30 +0000140 "#XFLOADf64",
141 [(set f64:$XT, (load xoaddr:$src))]>;
142
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000143 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000144 def LXVD2X : XX1Form_memOp<31, 844,
Hal Finkel27774d92014-03-13 07:58:58 +0000145 (outs vsrc:$XT), (ins memrr:$src),
146 "lxvd2x $XT, $src", IIC_LdStLFD,
Bill Schmidt72954782014-11-12 04:19:40 +0000147 [(set v2f64:$XT, (int_ppc_vsx_lxvd2x xoaddr:$src))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000148
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000149 def LXVDSX : XX1Form_memOp<31, 332,
Hal Finkel27774d92014-03-13 07:58:58 +0000150 (outs vsrc:$XT), (ins memrr:$src),
151 "lxvdsx $XT, $src", IIC_LdStLFD, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000152
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000153 let Predicates = [HasVSX, HasOnlySwappingMemOps] in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000154 def LXVW4X : XX1Form_memOp<31, 780,
Hal Finkel27774d92014-03-13 07:58:58 +0000155 (outs vsrc:$XT), (ins memrr:$src),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000156 "lxvw4x $XT, $src", IIC_LdStLFD,
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +0000157 []>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000158 } // mayLoad
Hal Finkel27774d92014-03-13 07:58:58 +0000159
160 // Store indexed instructions
Sean Fertile3c8c3852017-01-26 18:59:15 +0000161 let mayStore = 1, mayLoad = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +0000162 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000163 def STXSDX : XX1Form_memOp<31, 716,
Hal Finkel19be5062014-03-29 05:29:01 +0000164 (outs), (ins vsfrc:$XT, memrr:$dst),
Hal Finkel27774d92014-03-13 07:58:58 +0000165 "stxsdx $XT, $dst", IIC_LdStSTFD,
Lei Huangf4ec6782018-05-24 03:20:28 +0000166 []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000167
Tony Jiang438bf4a2017-11-20 14:38:30 +0000168 // Pseudo instruction XFSTOREf64 will be expanded to STXSDX or STFDX later
Jinsong Jic7b43b92018-12-13 15:12:57 +0000169 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000170 def XFSTOREf64 : PseudoXFormMemOp<(outs), (ins vsfrc:$XT, memrr:$dst),
Tony Jiang438bf4a2017-11-20 14:38:30 +0000171 "#XFSTOREf64",
172 [(store f64:$XT, xoaddr:$dst)]>;
173
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000174 let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000175 // The behaviour of this instruction is endianness-specific so we provide no
176 // pattern to match it without considering endianness.
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000177 def STXVD2X : XX1Form_memOp<31, 972,
Hal Finkel27774d92014-03-13 07:58:58 +0000178 (outs), (ins vsrc:$XT, memrr:$dst),
179 "stxvd2x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +0000180 []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000181
Stefan Pintilie26d4f922018-03-26 17:39:18 +0000182 def STXVW4X : XX1Form_memOp<31, 908,
Hal Finkel27774d92014-03-13 07:58:58 +0000183 (outs), (ins vsrc:$XT, memrr:$dst),
Bill Schmidt2d1128a2014-10-17 15:13:38 +0000184 "stxvw4x $XT, $dst", IIC_LdStSTFD,
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +0000185 []>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +0000186 }
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000187 } // mayStore
Hal Finkel27774d92014-03-13 07:58:58 +0000188
189 // Add/Mul Instructions
190 let isCommutable = 1 in {
191 def XSADDDP : XX3Form<60, 32,
Hal Finkel19be5062014-03-29 05:29:01 +0000192 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000193 "xsadddp $XT, $XA, $XB", IIC_VecFP,
194 [(set f64:$XT, (fadd f64:$XA, f64:$XB))]>;
195 def XSMULDP : XX3Form<60, 48,
Hal Finkel19be5062014-03-29 05:29:01 +0000196 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000197 "xsmuldp $XT, $XA, $XB", IIC_VecFP,
198 [(set f64:$XT, (fmul f64:$XA, f64:$XB))]>;
199
200 def XVADDDP : XX3Form<60, 96,
201 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
202 "xvadddp $XT, $XA, $XB", IIC_VecFP,
203 [(set v2f64:$XT, (fadd v2f64:$XA, v2f64:$XB))]>;
204
205 def XVADDSP : XX3Form<60, 64,
206 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
207 "xvaddsp $XT, $XA, $XB", IIC_VecFP,
208 [(set v4f32:$XT, (fadd v4f32:$XA, v4f32:$XB))]>;
209
210 def XVMULDP : XX3Form<60, 112,
211 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
212 "xvmuldp $XT, $XA, $XB", IIC_VecFP,
213 [(set v2f64:$XT, (fmul v2f64:$XA, v2f64:$XB))]>;
214
215 def XVMULSP : XX3Form<60, 80,
216 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
217 "xvmulsp $XT, $XA, $XB", IIC_VecFP,
218 [(set v4f32:$XT, (fmul v4f32:$XA, v4f32:$XB))]>;
219 }
220
221 // Subtract Instructions
222 def XSSUBDP : XX3Form<60, 40,
Hal Finkel19be5062014-03-29 05:29:01 +0000223 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000224 "xssubdp $XT, $XA, $XB", IIC_VecFP,
225 [(set f64:$XT, (fsub f64:$XA, f64:$XB))]>;
226
227 def XVSUBDP : XX3Form<60, 104,
228 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
229 "xvsubdp $XT, $XA, $XB", IIC_VecFP,
230 [(set v2f64:$XT, (fsub v2f64:$XA, v2f64:$XB))]>;
231 def XVSUBSP : XX3Form<60, 72,
232 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
233 "xvsubsp $XT, $XA, $XB", IIC_VecFP,
234 [(set v4f32:$XT, (fsub v4f32:$XA, v4f32:$XB))]>;
235
236 // FMA Instructions
Hal Finkel25e04542014-03-25 18:55:11 +0000237 let BaseName = "XSMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000238 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000239 def XSMADDADP : XX3Form<60, 33,
Hal Finkel19be5062014-03-29 05:29:01 +0000240 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000241 "xsmaddadp $XT, $XA, $XB", IIC_VecFP,
242 [(set f64:$XT, (fma f64:$XA, f64:$XB, f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000243 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
244 AltVSXFMARel;
245 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000246 def XSMADDMDP : XX3Form<60, 41,
Hal Finkel19be5062014-03-29 05:29:01 +0000247 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000248 "xsmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000249 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
250 AltVSXFMARel;
251 }
Hal Finkel27774d92014-03-13 07:58:58 +0000252
Hal Finkel25e04542014-03-25 18:55:11 +0000253 let BaseName = "XSMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000254 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000255 def XSMSUBADP : XX3Form<60, 49,
Hal Finkel19be5062014-03-29 05:29:01 +0000256 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000257 "xsmsubadp $XT, $XA, $XB", IIC_VecFP,
258 [(set f64:$XT, (fma f64:$XA, f64:$XB, (fneg f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000259 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
260 AltVSXFMARel;
261 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000262 def XSMSUBMDP : XX3Form<60, 57,
Hal Finkel19be5062014-03-29 05:29:01 +0000263 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000264 "xsmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000265 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
266 AltVSXFMARel;
267 }
Hal Finkel27774d92014-03-13 07:58:58 +0000268
Hal Finkel25e04542014-03-25 18:55:11 +0000269 let BaseName = "XSNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000270 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000271 def XSNMADDADP : XX3Form<60, 161,
Hal Finkel19be5062014-03-29 05:29:01 +0000272 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000273 "xsnmaddadp $XT, $XA, $XB", IIC_VecFP,
274 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000275 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
276 AltVSXFMARel;
277 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000278 def XSNMADDMDP : XX3Form<60, 169,
Hal Finkel19be5062014-03-29 05:29:01 +0000279 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000280 "xsnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000281 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
282 AltVSXFMARel;
283 }
Hal Finkel27774d92014-03-13 07:58:58 +0000284
Hal Finkel25e04542014-03-25 18:55:11 +0000285 let BaseName = "XSNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000286 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000287 def XSNMSUBADP : XX3Form<60, 177,
Hal Finkel19be5062014-03-29 05:29:01 +0000288 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000289 "xsnmsubadp $XT, $XA, $XB", IIC_VecFP,
290 [(set f64:$XT, (fneg (fma f64:$XA, f64:$XB, (fneg f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000291 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
292 AltVSXFMARel;
293 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000294 def XSNMSUBMDP : XX3Form<60, 185,
Hal Finkel19be5062014-03-29 05:29:01 +0000295 (outs vsfrc:$XT), (ins vsfrc:$XTi, vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000296 "xsnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000297 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
298 AltVSXFMARel;
299 }
Hal Finkel27774d92014-03-13 07:58:58 +0000300
Hal Finkel25e04542014-03-25 18:55:11 +0000301 let BaseName = "XVMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000302 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000303 def XVMADDADP : XX3Form<60, 97,
304 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
305 "xvmaddadp $XT, $XA, $XB", IIC_VecFP,
306 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000307 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
308 AltVSXFMARel;
309 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000310 def XVMADDMDP : XX3Form<60, 105,
311 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
312 "xvmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000313 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
314 AltVSXFMARel;
315 }
Hal Finkel27774d92014-03-13 07:58:58 +0000316
Hal Finkel25e04542014-03-25 18:55:11 +0000317 let BaseName = "XVMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000318 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000319 def XVMADDASP : XX3Form<60, 65,
320 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
321 "xvmaddasp $XT, $XA, $XB", IIC_VecFP,
322 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000323 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
324 AltVSXFMARel;
325 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000326 def XVMADDMSP : XX3Form<60, 73,
327 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
328 "xvmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000329 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
330 AltVSXFMARel;
331 }
Hal Finkel27774d92014-03-13 07:58:58 +0000332
Hal Finkel25e04542014-03-25 18:55:11 +0000333 let BaseName = "XVMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000334 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000335 def XVMSUBADP : XX3Form<60, 113,
336 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
337 "xvmsubadp $XT, $XA, $XB", IIC_VecFP,
338 [(set v2f64:$XT, (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000339 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
340 AltVSXFMARel;
341 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000342 def XVMSUBMDP : XX3Form<60, 121,
343 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
344 "xvmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000345 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
346 AltVSXFMARel;
347 }
Hal Finkel27774d92014-03-13 07:58:58 +0000348
Hal Finkel25e04542014-03-25 18:55:11 +0000349 let BaseName = "XVMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000350 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000351 def XVMSUBASP : XX3Form<60, 81,
352 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
353 "xvmsubasp $XT, $XA, $XB", IIC_VecFP,
354 [(set v4f32:$XT, (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000355 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
356 AltVSXFMARel;
357 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000358 def XVMSUBMSP : XX3Form<60, 89,
359 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
360 "xvmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000361 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
362 AltVSXFMARel;
363 }
Hal Finkel27774d92014-03-13 07:58:58 +0000364
Hal Finkel25e04542014-03-25 18:55:11 +0000365 let BaseName = "XVNMADDADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000366 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000367 def XVNMADDADP : XX3Form<60, 225,
368 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
369 "xvnmaddadp $XT, $XA, $XB", IIC_VecFP,
370 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, v2f64:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000371 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
372 AltVSXFMARel;
373 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000374 def XVNMADDMDP : XX3Form<60, 233,
375 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
376 "xvnmaddmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000377 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
378 AltVSXFMARel;
379 }
Hal Finkel27774d92014-03-13 07:58:58 +0000380
Hal Finkel25e04542014-03-25 18:55:11 +0000381 let BaseName = "XVNMADDASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000382 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000383 def XVNMADDASP : XX3Form<60, 193,
384 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
385 "xvnmaddasp $XT, $XA, $XB", IIC_VecFP,
386 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, v4f32:$XTi)))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000387 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
388 AltVSXFMARel;
389 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000390 def XVNMADDMSP : XX3Form<60, 201,
391 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
392 "xvnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000393 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
394 AltVSXFMARel;
395 }
Hal Finkel27774d92014-03-13 07:58:58 +0000396
Hal Finkel25e04542014-03-25 18:55:11 +0000397 let BaseName = "XVNMSUBADP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000398 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000399 def XVNMSUBADP : XX3Form<60, 241,
400 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
401 "xvnmsubadp $XT, $XA, $XB", IIC_VecFP,
402 [(set v2f64:$XT, (fneg (fma v2f64:$XA, v2f64:$XB, (fneg v2f64:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000403 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
404 AltVSXFMARel;
405 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000406 def XVNMSUBMDP : XX3Form<60, 249,
407 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
408 "xvnmsubmdp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000409 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
410 AltVSXFMARel;
411 }
Hal Finkel27774d92014-03-13 07:58:58 +0000412
Hal Finkel25e04542014-03-25 18:55:11 +0000413 let BaseName = "XVNMSUBASP" in {
Hal Finkele01d3212014-03-24 15:07:28 +0000414 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000415 def XVNMSUBASP : XX3Form<60, 209,
416 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
417 "xvnmsubasp $XT, $XA, $XB", IIC_VecFP,
418 [(set v4f32:$XT, (fneg (fma v4f32:$XA, v4f32:$XB, (fneg v4f32:$XTi))))]>,
Hal Finkel25e04542014-03-25 18:55:11 +0000419 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
420 AltVSXFMARel;
421 let IsVSXFMAAlt = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000422 def XVNMSUBMSP : XX3Form<60, 217,
423 (outs vsrc:$XT), (ins vsrc:$XTi, vsrc:$XA, vsrc:$XB),
424 "xvnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
Hal Finkel25e04542014-03-25 18:55:11 +0000425 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
426 AltVSXFMARel;
427 }
Hal Finkel27774d92014-03-13 07:58:58 +0000428
429 // Division Instructions
430 def XSDIVDP : XX3Form<60, 56,
Hal Finkel19be5062014-03-29 05:29:01 +0000431 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000432 "xsdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000433 [(set f64:$XT, (fdiv f64:$XA, f64:$XB))]>;
434 def XSSQRTDP : XX2Form<60, 75,
Hal Finkel19be5062014-03-29 05:29:01 +0000435 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000436 "xssqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000437 [(set f64:$XT, (fsqrt f64:$XB))]>;
438
439 def XSREDP : XX2Form<60, 90,
Hal Finkel19be5062014-03-29 05:29:01 +0000440 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000441 "xsredp $XT, $XB", IIC_VecFP,
442 [(set f64:$XT, (PPCfre f64:$XB))]>;
443 def XSRSQRTEDP : XX2Form<60, 74,
Hal Finkel19be5062014-03-29 05:29:01 +0000444 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000445 "xsrsqrtedp $XT, $XB", IIC_VecFP,
446 [(set f64:$XT, (PPCfrsqrte f64:$XB))]>;
447
448 def XSTDIVDP : XX3Form_1<60, 61,
Hal Finkel19be5062014-03-29 05:29:01 +0000449 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000450 "xstdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000451 def XSTSQRTDP : XX2Form_1<60, 106,
Hal Finkel19be5062014-03-29 05:29:01 +0000452 (outs crrc:$crD), (ins vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000453 "xstsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000454
455 def XVDIVDP : XX3Form<60, 120,
456 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000457 "xvdivdp $XT, $XA, $XB", IIC_FPDivD,
Hal Finkel27774d92014-03-13 07:58:58 +0000458 [(set v2f64:$XT, (fdiv v2f64:$XA, v2f64:$XB))]>;
459 def XVDIVSP : XX3Form<60, 88,
460 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000461 "xvdivsp $XT, $XA, $XB", IIC_FPDivS,
Hal Finkel27774d92014-03-13 07:58:58 +0000462 [(set v4f32:$XT, (fdiv v4f32:$XA, v4f32:$XB))]>;
463
464 def XVSQRTDP : XX2Form<60, 203,
465 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000466 "xvsqrtdp $XT, $XB", IIC_FPSqrtD,
Hal Finkel27774d92014-03-13 07:58:58 +0000467 [(set v2f64:$XT, (fsqrt v2f64:$XB))]>;
468 def XVSQRTSP : XX2Form<60, 139,
469 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000470 "xvsqrtsp $XT, $XB", IIC_FPSqrtS,
Hal Finkel27774d92014-03-13 07:58:58 +0000471 [(set v4f32:$XT, (fsqrt v4f32:$XB))]>;
472
473 def XVTDIVDP : XX3Form_1<60, 125,
474 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000475 "xvtdivdp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000476 def XVTDIVSP : XX3Form_1<60, 93,
477 (outs crrc:$crD), (ins vsrc:$XA, vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000478 "xvtdivsp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000479
480 def XVTSQRTDP : XX2Form_1<60, 234,
481 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000482 "xvtsqrtdp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000483 def XVTSQRTSP : XX2Form_1<60, 170,
484 (outs crrc:$crD), (ins vsrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000485 "xvtsqrtsp $crD, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000486
487 def XVREDP : XX2Form<60, 218,
488 (outs vsrc:$XT), (ins vsrc:$XB),
489 "xvredp $XT, $XB", IIC_VecFP,
490 [(set v2f64:$XT, (PPCfre v2f64:$XB))]>;
491 def XVRESP : XX2Form<60, 154,
492 (outs vsrc:$XT), (ins vsrc:$XB),
493 "xvresp $XT, $XB", IIC_VecFP,
494 [(set v4f32:$XT, (PPCfre v4f32:$XB))]>;
495
496 def XVRSQRTEDP : XX2Form<60, 202,
497 (outs vsrc:$XT), (ins vsrc:$XB),
498 "xvrsqrtedp $XT, $XB", IIC_VecFP,
499 [(set v2f64:$XT, (PPCfrsqrte v2f64:$XB))]>;
500 def XVRSQRTESP : XX2Form<60, 138,
501 (outs vsrc:$XT), (ins vsrc:$XB),
502 "xvrsqrtesp $XT, $XB", IIC_VecFP,
503 [(set v4f32:$XT, (PPCfrsqrte v4f32:$XB))]>;
504
505 // Compare Instructions
506 def XSCMPODP : XX3Form_1<60, 43,
Hal Finkel19be5062014-03-29 05:29:01 +0000507 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000508 "xscmpodp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000509 def XSCMPUDP : XX3Form_1<60, 35,
Hal Finkel19be5062014-03-29 05:29:01 +0000510 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkele8fba982014-03-29 13:20:31 +0000511 "xscmpudp $crD, $XA, $XB", IIC_FPCompare, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000512
513 defm XVCMPEQDP : XX3Form_Rcr<60, 99,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000514 "xvcmpeqdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000515 int_ppc_vsx_xvcmpeqdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000516 defm XVCMPEQSP : XX3Form_Rcr<60, 67,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000517 "xvcmpeqsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000518 int_ppc_vsx_xvcmpeqsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000519 defm XVCMPGEDP : XX3Form_Rcr<60, 115,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000520 "xvcmpgedp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000521 int_ppc_vsx_xvcmpgedp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000522 defm XVCMPGESP : XX3Form_Rcr<60, 83,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000523 "xvcmpgesp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000524 int_ppc_vsx_xvcmpgesp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000525 defm XVCMPGTDP : XX3Form_Rcr<60, 107,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000526 "xvcmpgtdp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000527 int_ppc_vsx_xvcmpgtdp, v2i64, v2f64>;
Hal Finkel27774d92014-03-13 07:58:58 +0000528 defm XVCMPGTSP : XX3Form_Rcr<60, 75,
Nemanja Ivanovicf502a422015-06-26 19:26:53 +0000529 "xvcmpgtsp", "$XT, $XA, $XB", IIC_VecFPCompare,
Nemanja Ivanovic2c84b292015-09-29 17:41:53 +0000530 int_ppc_vsx_xvcmpgtsp, v4i32, v4f32>;
Hal Finkel27774d92014-03-13 07:58:58 +0000531
532 // Move Instructions
533 def XSABSDP : XX2Form<60, 345,
Hal Finkel19be5062014-03-29 05:29:01 +0000534 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000535 "xsabsdp $XT, $XB", IIC_VecFP,
536 [(set f64:$XT, (fabs f64:$XB))]>;
537 def XSNABSDP : XX2Form<60, 361,
Hal Finkel19be5062014-03-29 05:29:01 +0000538 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000539 "xsnabsdp $XT, $XB", IIC_VecFP,
540 [(set f64:$XT, (fneg (fabs f64:$XB)))]>;
541 def XSNEGDP : XX2Form<60, 377,
Hal Finkel19be5062014-03-29 05:29:01 +0000542 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000543 "xsnegdp $XT, $XB", IIC_VecFP,
544 [(set f64:$XT, (fneg f64:$XB))]>;
545 def XSCPSGNDP : XX3Form<60, 176,
Hal Finkel19be5062014-03-29 05:29:01 +0000546 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000547 "xscpsgndp $XT, $XA, $XB", IIC_VecFP,
548 [(set f64:$XT, (fcopysign f64:$XB, f64:$XA))]>;
549
550 def XVABSDP : XX2Form<60, 473,
551 (outs vsrc:$XT), (ins vsrc:$XB),
552 "xvabsdp $XT, $XB", IIC_VecFP,
553 [(set v2f64:$XT, (fabs v2f64:$XB))]>;
554
555 def XVABSSP : XX2Form<60, 409,
556 (outs vsrc:$XT), (ins vsrc:$XB),
557 "xvabssp $XT, $XB", IIC_VecFP,
558 [(set v4f32:$XT, (fabs v4f32:$XB))]>;
559
560 def XVCPSGNDP : XX3Form<60, 240,
561 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
562 "xvcpsgndp $XT, $XA, $XB", IIC_VecFP,
563 [(set v2f64:$XT, (fcopysign v2f64:$XB, v2f64:$XA))]>;
564 def XVCPSGNSP : XX3Form<60, 208,
565 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
566 "xvcpsgnsp $XT, $XA, $XB", IIC_VecFP,
567 [(set v4f32:$XT, (fcopysign v4f32:$XB, v4f32:$XA))]>;
568
569 def XVNABSDP : XX2Form<60, 489,
570 (outs vsrc:$XT), (ins vsrc:$XB),
571 "xvnabsdp $XT, $XB", IIC_VecFP,
572 [(set v2f64:$XT, (fneg (fabs v2f64:$XB)))]>;
573 def XVNABSSP : XX2Form<60, 425,
574 (outs vsrc:$XT), (ins vsrc:$XB),
575 "xvnabssp $XT, $XB", IIC_VecFP,
576 [(set v4f32:$XT, (fneg (fabs v4f32:$XB)))]>;
577
578 def XVNEGDP : XX2Form<60, 505,
579 (outs vsrc:$XT), (ins vsrc:$XB),
580 "xvnegdp $XT, $XB", IIC_VecFP,
581 [(set v2f64:$XT, (fneg v2f64:$XB))]>;
582 def XVNEGSP : XX2Form<60, 441,
583 (outs vsrc:$XT), (ins vsrc:$XB),
584 "xvnegsp $XT, $XB", IIC_VecFP,
585 [(set v4f32:$XT, (fneg v4f32:$XB))]>;
586
587 // Conversion Instructions
588 def XSCVDPSP : XX2Form<60, 265,
Hal Finkel19be5062014-03-29 05:29:01 +0000589 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000590 "xscvdpsp $XT, $XB", IIC_VecFP, []>;
591 def XSCVDPSXDS : XX2Form<60, 344,
Hal Finkel19be5062014-03-29 05:29:01 +0000592 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000593 "xscvdpsxds $XT, $XB", IIC_VecFP,
594 [(set f64:$XT, (PPCfctidz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000595 let isCodeGenOnly = 1 in
596 def XSCVDPSXDSs : XX2Form<60, 344,
597 (outs vssrc:$XT), (ins vssrc:$XB),
598 "xscvdpsxds $XT, $XB", IIC_VecFP,
599 [(set f32:$XT, (PPCfctidz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000600 def XSCVDPSXWS : XX2Form<60, 88,
Hal Finkel19be5062014-03-29 05:29:01 +0000601 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000602 "xscvdpsxws $XT, $XB", IIC_VecFP,
603 [(set f64:$XT, (PPCfctiwz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000604 let isCodeGenOnly = 1 in
605 def XSCVDPSXWSs : XX2Form<60, 88,
606 (outs vssrc:$XT), (ins vssrc:$XB),
607 "xscvdpsxws $XT, $XB", IIC_VecFP,
608 [(set f32:$XT, (PPCfctiwz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000609 def XSCVDPUXDS : XX2Form<60, 328,
Hal Finkel19be5062014-03-29 05:29:01 +0000610 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000611 "xscvdpuxds $XT, $XB", IIC_VecFP,
612 [(set f64:$XT, (PPCfctiduz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000613 let isCodeGenOnly = 1 in
614 def XSCVDPUXDSs : XX2Form<60, 328,
615 (outs vssrc:$XT), (ins vssrc:$XB),
616 "xscvdpuxds $XT, $XB", IIC_VecFP,
617 [(set f32:$XT, (PPCfctiduz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000618 def XSCVDPUXWS : XX2Form<60, 72,
Hal Finkel19be5062014-03-29 05:29:01 +0000619 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000620 "xscvdpuxws $XT, $XB", IIC_VecFP,
621 [(set f64:$XT, (PPCfctiwuz f64:$XB))]>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000622 let isCodeGenOnly = 1 in
623 def XSCVDPUXWSs : XX2Form<60, 72,
624 (outs vssrc:$XT), (ins vssrc:$XB),
625 "xscvdpuxws $XT, $XB", IIC_VecFP,
626 [(set f32:$XT, (PPCfctiwuz f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000627 def XSCVSPDP : XX2Form<60, 329,
Hal Finkel19be5062014-03-29 05:29:01 +0000628 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000629 "xscvspdp $XT, $XB", IIC_VecFP, []>;
630 def XSCVSXDDP : XX2Form<60, 376,
Hal Finkel19be5062014-03-29 05:29:01 +0000631 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000632 "xscvsxddp $XT, $XB", IIC_VecFP,
633 [(set f64:$XT, (PPCfcfid f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000634 def XSCVUXDDP : XX2Form<60, 360,
Hal Finkel19be5062014-03-29 05:29:01 +0000635 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel4a912252014-03-23 05:35:00 +0000636 "xscvuxddp $XT, $XB", IIC_VecFP,
637 [(set f64:$XT, (PPCfcfidu f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000638
639 def XVCVDPSP : XX2Form<60, 393,
640 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000641 "xvcvdpsp $XT, $XB", IIC_VecFP,
642 [(set v4f32:$XT, (int_ppc_vsx_xvcvdpsp v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000643 def XVCVDPSXDS : XX2Form<60, 472,
644 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000645 "xvcvdpsxds $XT, $XB", IIC_VecFP,
646 [(set v2i64:$XT, (fp_to_sint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000647 def XVCVDPSXWS : XX2Form<60, 216,
648 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000649 "xvcvdpsxws $XT, $XB", IIC_VecFP,
650 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpsxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000651 def XVCVDPUXDS : XX2Form<60, 456,
652 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000653 "xvcvdpuxds $XT, $XB", IIC_VecFP,
654 [(set v2i64:$XT, (fp_to_uint v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000655 def XVCVDPUXWS : XX2Form<60, 200,
656 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000657 "xvcvdpuxws $XT, $XB", IIC_VecFP,
658 [(set v4i32:$XT, (int_ppc_vsx_xvcvdpuxws v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000659
660 def XVCVSPDP : XX2Form<60, 457,
661 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000662 "xvcvspdp $XT, $XB", IIC_VecFP,
663 [(set v2f64:$XT, (int_ppc_vsx_xvcvspdp v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000664 def XVCVSPSXDS : XX2Form<60, 408,
665 (outs vsrc:$XT), (ins vsrc:$XB),
666 "xvcvspsxds $XT, $XB", IIC_VecFP, []>;
667 def XVCVSPSXWS : XX2Form<60, 152,
668 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000669 "xvcvspsxws $XT, $XB", IIC_VecFP,
670 [(set v4i32:$XT, (fp_to_sint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000671 def XVCVSPUXDS : XX2Form<60, 392,
672 (outs vsrc:$XT), (ins vsrc:$XB),
673 "xvcvspuxds $XT, $XB", IIC_VecFP, []>;
674 def XVCVSPUXWS : XX2Form<60, 136,
675 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000676 "xvcvspuxws $XT, $XB", IIC_VecFP,
677 [(set v4i32:$XT, (fp_to_uint v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000678 def XVCVSXDDP : XX2Form<60, 504,
679 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000680 "xvcvsxddp $XT, $XB", IIC_VecFP,
681 [(set v2f64:$XT, (sint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000682 def XVCVSXDSP : XX2Form<60, 440,
683 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000684 "xvcvsxdsp $XT, $XB", IIC_VecFP,
685 [(set v4f32:$XT, (int_ppc_vsx_xvcvsxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000686 def XVCVSXWDP : XX2Form<60, 248,
687 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000688 "xvcvsxwdp $XT, $XB", IIC_VecFP,
689 [(set v2f64:$XT, (int_ppc_vsx_xvcvsxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000690 def XVCVSXWSP : XX2Form<60, 184,
691 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic44513e52016-07-05 09:22:29 +0000692 "xvcvsxwsp $XT, $XB", IIC_VecFP,
693 [(set v4f32:$XT, (sint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000694 def XVCVUXDDP : XX2Form<60, 488,
695 (outs vsrc:$XT), (ins vsrc:$XB),
Hal Finkel7279f4b2014-03-26 19:13:54 +0000696 "xvcvuxddp $XT, $XB", IIC_VecFP,
697 [(set v2f64:$XT, (uint_to_fp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000698 def XVCVUXDSP : XX2Form<60, 424,
699 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000700 "xvcvuxdsp $XT, $XB", IIC_VecFP,
701 [(set v4f32:$XT, (int_ppc_vsx_xvcvuxdsp v2i64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000702 def XVCVUXWDP : XX2Form<60, 232,
703 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovic2efc3cb2016-11-11 14:41:19 +0000704 "xvcvuxwdp $XT, $XB", IIC_VecFP,
705 [(set v2f64:$XT, (int_ppc_vsx_xvcvuxwdp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000706 def XVCVUXWSP : XX2Form<60, 168,
707 (outs vsrc:$XT), (ins vsrc:$XB),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +0000708 "xvcvuxwsp $XT, $XB", IIC_VecFP,
709 [(set v4f32:$XT, (uint_to_fp v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000710
711 // Rounding Instructions
712 def XSRDPI : XX2Form<60, 73,
Hal Finkel19be5062014-03-29 05:29:01 +0000713 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000714 "xsrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000715 [(set f64:$XT, (fround f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000716 def XSRDPIC : XX2Form<60, 107,
Hal Finkel19be5062014-03-29 05:29:01 +0000717 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000718 "xsrdpic $XT, $XB", IIC_VecFP,
719 [(set f64:$XT, (fnearbyint f64:$XB))]>;
720 def XSRDPIM : XX2Form<60, 121,
Hal Finkel19be5062014-03-29 05:29:01 +0000721 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000722 "xsrdpim $XT, $XB", IIC_VecFP,
723 [(set f64:$XT, (ffloor f64:$XB))]>;
724 def XSRDPIP : XX2Form<60, 105,
Hal Finkel19be5062014-03-29 05:29:01 +0000725 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000726 "xsrdpip $XT, $XB", IIC_VecFP,
727 [(set f64:$XT, (fceil f64:$XB))]>;
728 def XSRDPIZ : XX2Form<60, 89,
Hal Finkel19be5062014-03-29 05:29:01 +0000729 (outs vsfrc:$XT), (ins vsfrc:$XB),
Hal Finkel27774d92014-03-13 07:58:58 +0000730 "xsrdpiz $XT, $XB", IIC_VecFP,
731 [(set f64:$XT, (ftrunc f64:$XB))]>;
732
733 def XVRDPI : XX2Form<60, 201,
734 (outs vsrc:$XT), (ins vsrc:$XB),
735 "xvrdpi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000736 [(set v2f64:$XT, (fround v2f64:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000737 def XVRDPIC : XX2Form<60, 235,
738 (outs vsrc:$XT), (ins vsrc:$XB),
739 "xvrdpic $XT, $XB", IIC_VecFP,
740 [(set v2f64:$XT, (fnearbyint v2f64:$XB))]>;
741 def XVRDPIM : XX2Form<60, 249,
742 (outs vsrc:$XT), (ins vsrc:$XB),
743 "xvrdpim $XT, $XB", IIC_VecFP,
744 [(set v2f64:$XT, (ffloor v2f64:$XB))]>;
745 def XVRDPIP : XX2Form<60, 233,
746 (outs vsrc:$XT), (ins vsrc:$XB),
747 "xvrdpip $XT, $XB", IIC_VecFP,
748 [(set v2f64:$XT, (fceil v2f64:$XB))]>;
749 def XVRDPIZ : XX2Form<60, 217,
750 (outs vsrc:$XT), (ins vsrc:$XB),
751 "xvrdpiz $XT, $XB", IIC_VecFP,
752 [(set v2f64:$XT, (ftrunc v2f64:$XB))]>;
753
754 def XVRSPI : XX2Form<60, 137,
755 (outs vsrc:$XT), (ins vsrc:$XB),
756 "xvrspi $XT, $XB", IIC_VecFP,
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +0000757 [(set v4f32:$XT, (fround v4f32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000758 def XVRSPIC : XX2Form<60, 171,
759 (outs vsrc:$XT), (ins vsrc:$XB),
760 "xvrspic $XT, $XB", IIC_VecFP,
761 [(set v4f32:$XT, (fnearbyint v4f32:$XB))]>;
762 def XVRSPIM : XX2Form<60, 185,
763 (outs vsrc:$XT), (ins vsrc:$XB),
764 "xvrspim $XT, $XB", IIC_VecFP,
765 [(set v4f32:$XT, (ffloor v4f32:$XB))]>;
766 def XVRSPIP : XX2Form<60, 169,
767 (outs vsrc:$XT), (ins vsrc:$XB),
768 "xvrspip $XT, $XB", IIC_VecFP,
769 [(set v4f32:$XT, (fceil v4f32:$XB))]>;
770 def XVRSPIZ : XX2Form<60, 153,
771 (outs vsrc:$XT), (ins vsrc:$XB),
772 "xvrspiz $XT, $XB", IIC_VecFP,
773 [(set v4f32:$XT, (ftrunc v4f32:$XB))]>;
774
775 // Max/Min Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000776 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000777 def XSMAXDP : XX3Form<60, 160,
Hal Finkel19be5062014-03-29 05:29:01 +0000778 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000779 "xsmaxdp $XT, $XA, $XB", IIC_VecFP,
780 [(set vsfrc:$XT,
781 (int_ppc_vsx_xsmaxdp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000782 def XSMINDP : XX3Form<60, 168,
Hal Finkel19be5062014-03-29 05:29:01 +0000783 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000784 "xsmindp $XT, $XA, $XB", IIC_VecFP,
785 [(set vsfrc:$XT,
786 (int_ppc_vsx_xsmindp vsfrc:$XA, vsfrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000787
788 def XVMAXDP : XX3Form<60, 224,
789 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000790 "xvmaxdp $XT, $XA, $XB", IIC_VecFP,
791 [(set vsrc:$XT,
792 (int_ppc_vsx_xvmaxdp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000793 def XVMINDP : XX3Form<60, 232,
794 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000795 "xvmindp $XT, $XA, $XB", IIC_VecFP,
796 [(set vsrc:$XT,
797 (int_ppc_vsx_xvmindp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000798
799 def XVMAXSP : XX3Form<60, 192,
800 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000801 "xvmaxsp $XT, $XA, $XB", IIC_VecFP,
802 [(set vsrc:$XT,
803 (int_ppc_vsx_xvmaxsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000804 def XVMINSP : XX3Form<60, 200,
805 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Bill Schmidt1ca69fa2014-10-31 19:19:07 +0000806 "xvminsp $XT, $XA, $XB", IIC_VecFP,
807 [(set vsrc:$XT,
808 (int_ppc_vsx_xvminsp vsrc:$XA, vsrc:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000809 } // isCommutable
Hal Finkel27774d92014-03-13 07:58:58 +0000810} // Uses = [RM]
811
812 // Logical Instructions
Hal Finkele01d3212014-03-24 15:07:28 +0000813 let isCommutable = 1 in
Hal Finkel27774d92014-03-13 07:58:58 +0000814 def XXLAND : XX3Form<60, 130,
815 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000816 "xxland $XT, $XA, $XB", IIC_VecGeneral,
817 [(set v4i32:$XT, (and v4i32:$XA, v4i32:$XB))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000818 def XXLANDC : XX3Form<60, 138,
819 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000820 "xxlandc $XT, $XA, $XB", IIC_VecGeneral,
821 [(set v4i32:$XT, (and v4i32:$XA,
822 (vnot_ppc v4i32:$XB)))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000823 let isCommutable = 1 in {
Hal Finkel27774d92014-03-13 07:58:58 +0000824 def XXLNOR : XX3Form<60, 162,
825 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000826 "xxlnor $XT, $XA, $XB", IIC_VecGeneral,
827 [(set v4i32:$XT, (vnot_ppc (or v4i32:$XA,
828 v4i32:$XB)))]>;
Hal Finkel27774d92014-03-13 07:58:58 +0000829 def XXLOR : XX3Form<60, 146,
830 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000831 "xxlor $XT, $XA, $XB", IIC_VecGeneral,
832 [(set v4i32:$XT, (or v4i32:$XA, v4i32:$XB))]>;
Hal Finkel19be5062014-03-29 05:29:01 +0000833 let isCodeGenOnly = 1 in
834 def XXLORf: XX3Form<60, 146,
835 (outs vsfrc:$XT), (ins vsfrc:$XA, vsfrc:$XB),
836 "xxlor $XT, $XA, $XB", IIC_VecGeneral, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000837 def XXLXOR : XX3Form<60, 154,
838 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
Hal Finkelbd4de9d2014-03-26 04:55:40 +0000839 "xxlxor $XT, $XA, $XB", IIC_VecGeneral,
840 [(set v4i32:$XT, (xor v4i32:$XA, v4i32:$XB))]>;
Hal Finkele01d3212014-03-24 15:07:28 +0000841 } // isCommutable
Jinsong Ji9dc2c1d2019-03-12 18:27:09 +0000842
843 let isCodeGenOnly = 1, isMoveImm = 1, isAsCheapAsAMove = 1,
844 isReMaterializable = 1 in {
845 def XXLXORz : XX3Form_Zero<60, 154, (outs vsrc:$XT), (ins),
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +0000846 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
847 [(set v4i32:$XT, (v4i32 immAllZerosV))]>;
Ehsan Amiric90b02c2016-10-24 17:31:09 +0000848 def XXLXORdpz : XX3Form_SetZero<60, 154,
849 (outs vsfrc:$XT), (ins),
850 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
851 [(set f64:$XT, (fpimm0))]>;
852 def XXLXORspz : XX3Form_SetZero<60, 154,
853 (outs vssrc:$XT), (ins),
854 "xxlxor $XT, $XT, $XT", IIC_VecGeneral,
855 [(set f32:$XT, (fpimm0))]>;
856 }
857
Hal Finkel27774d92014-03-13 07:58:58 +0000858 // Permutation Instructions
859 def XXMRGHW : XX3Form<60, 18,
860 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
861 "xxmrghw $XT, $XA, $XB", IIC_VecPerm, []>;
862 def XXMRGLW : XX3Form<60, 50,
863 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
864 "xxmrglw $XT, $XA, $XB", IIC_VecPerm, []>;
865
866 def XXPERMDI : XX3Form_2<60, 10,
867 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$DM),
Tony Jiang60c247d2017-05-31 13:09:57 +0000868 "xxpermdi $XT, $XA, $XB, $DM", IIC_VecPerm,
869 [(set v2i64:$XT, (PPCxxpermdi v2i64:$XA, v2i64:$XB,
870 imm32SExt16:$DM))]>;
Nemanja Ivanovic15748f42016-12-06 11:47:14 +0000871 let isCodeGenOnly = 1 in
872 def XXPERMDIs : XX3Form_2s<60, 10, (outs vsrc:$XT), (ins vsfrc:$XA, u2imm:$DM),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000873 "xxpermdi $XT, $XA, $XA, $DM", IIC_VecPerm, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000874 def XXSEL : XX4Form<60, 3,
875 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, vsrc:$XC),
Nemanja Ivanovic5d06f172018-08-27 13:20:42 +0000876 "xxsel $XT, $XA, $XB, $XC", IIC_VecPerm, []>;
Hal Finkel27774d92014-03-13 07:58:58 +0000877
878 def XXSLDWI : XX3Form_2<60, 2,
879 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB, u2imm:$SHW),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +0000880 "xxsldwi $XT, $XA, $XB, $SHW", IIC_VecPerm,
881 [(set v4i32:$XT, (PPCvecshl v4i32:$XA, v4i32:$XB,
882 imm32SExt16:$SHW))]>;
Zaara Syedab2595b92018-08-08 15:20:43 +0000883
884 let isCodeGenOnly = 1 in
885 def XXSLDWIs : XX3Form_2s<60, 2,
886 (outs vsrc:$XT), (ins vsfrc:$XA, u2imm:$SHW),
887 "xxsldwi $XT, $XA, $XA, $SHW", IIC_VecPerm, []>;
888
Hal Finkel27774d92014-03-13 07:58:58 +0000889 def XXSPLTW : XX2Form_2<60, 164,
890 (outs vsrc:$XT), (ins vsrc:$XB, u2imm:$UIM),
Nemanja Ivanovic1a2b2f02016-05-04 16:04:02 +0000891 "xxspltw $XT, $XB, $UIM", IIC_VecPerm,
892 [(set v4i32:$XT,
893 (PPCxxsplt v4i32:$XB, imm32SExt16:$UIM))]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000894 let isCodeGenOnly = 1 in
895 def XXSPLTWs : XX2Form_2<60, 164,
Stefan Pintiliee1d79a82019-03-26 20:28:21 +0000896 (outs vsrc:$XT), (ins vsfrc:$XB, u2imm:$UIM),
Nemanja Ivanovic11049f82016-10-04 06:59:23 +0000897 "xxspltw $XT, $XB, $UIM", IIC_VecPerm, []>;
Zaara Syedab2595b92018-08-08 15:20:43 +0000898
Craig Topperc50d64b2014-11-26 00:46:26 +0000899} // hasSideEffects
Hal Finkel27774d92014-03-13 07:58:58 +0000900
Bill Schmidt61e65232014-10-22 13:13:40 +0000901// SELECT_CC_* - Used to implement the SELECT_CC DAG operation. Expanded after
902// instruction selection into a branch sequence.
Jinsong Jic7b43b92018-12-13 15:12:57 +0000903let PPC970_Single = 1 in {
Bill Schmidt61e65232014-10-22 13:13:40 +0000904
Jinsong Jic7b43b92018-12-13 15:12:57 +0000905 def SELECT_CC_VSRC: PPCCustomInserterPseudo<(outs vsrc:$dst),
Bill Schmidt61e65232014-10-22 13:13:40 +0000906 (ins crrc:$cond, vsrc:$T, vsrc:$F, i32imm:$BROPC),
907 "#SELECT_CC_VSRC",
908 []>;
Jinsong Jic7b43b92018-12-13 15:12:57 +0000909 def SELECT_VSRC: PPCCustomInserterPseudo<(outs vsrc:$dst),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000910 (ins crbitrc:$cond, vsrc:$T, vsrc:$F),
911 "#SELECT_VSRC",
Bill Schmidt61e65232014-10-22 13:13:40 +0000912 [(set v2f64:$dst,
913 (select i1:$cond, v2f64:$T, v2f64:$F))]>;
Jinsong Jic7b43b92018-12-13 15:12:57 +0000914 def SELECT_CC_VSFRC: PPCCustomInserterPseudo<(outs f8rc:$dst),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000915 (ins crrc:$cond, f8rc:$T, f8rc:$F,
916 i32imm:$BROPC), "#SELECT_CC_VSFRC",
917 []>;
Jinsong Jic7b43b92018-12-13 15:12:57 +0000918 def SELECT_VSFRC: PPCCustomInserterPseudo<(outs f8rc:$dst),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000919 (ins crbitrc:$cond, f8rc:$T, f8rc:$F),
920 "#SELECT_VSFRC",
921 [(set f64:$dst,
922 (select i1:$cond, f64:$T, f64:$F))]>;
Jinsong Jic7b43b92018-12-13 15:12:57 +0000923 def SELECT_CC_VSSRC: PPCCustomInserterPseudo<(outs f4rc:$dst),
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000924 (ins crrc:$cond, f4rc:$T, f4rc:$F,
925 i32imm:$BROPC), "#SELECT_CC_VSSRC",
926 []>;
Jinsong Jic7b43b92018-12-13 15:12:57 +0000927 def SELECT_VSSRC: PPCCustomInserterPseudo<(outs f4rc:$dst),
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +0000928 (ins crbitrc:$cond, f4rc:$T, f4rc:$F),
929 "#SELECT_VSSRC",
930 [(set f32:$dst,
931 (select i1:$cond, f32:$T, f32:$F))]>;
Jinsong Jic7b43b92018-12-13 15:12:57 +0000932}
Bill Schmidt9c54bbd2014-10-22 16:58:20 +0000933} // AddedComplexity
Bill Schmidt61e65232014-10-22 13:13:40 +0000934
Hal Finkel27774d92014-03-13 07:58:58 +0000935def : InstAlias<"xvmovdp $XT, $XB",
936 (XVCPSGNDP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
937def : InstAlias<"xvmovsp $XT, $XB",
938 (XVCPSGNSP vsrc:$XT, vsrc:$XB, vsrc:$XB)>;
939
940def : InstAlias<"xxspltd $XT, $XB, 0",
941 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 0)>;
942def : InstAlias<"xxspltd $XT, $XB, 1",
943 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 3)>;
944def : InstAlias<"xxmrghd $XT, $XA, $XB",
945 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 0)>;
946def : InstAlias<"xxmrgld $XT, $XA, $XB",
947 (XXPERMDI vsrc:$XT, vsrc:$XA, vsrc:$XB, 3)>;
948def : InstAlias<"xxswapd $XT, $XB",
949 (XXPERMDI vsrc:$XT, vsrc:$XB, vsrc:$XB, 2)>;
Nemanja Ivanovic15748f42016-12-06 11:47:14 +0000950def : InstAlias<"xxspltd $XT, $XB, 0",
951 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 0)>;
952def : InstAlias<"xxspltd $XT, $XB, 1",
953 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 3)>;
954def : InstAlias<"xxswapd $XT, $XB",
955 (XXPERMDIs vsrc:$XT, vsfrc:$XB, 2)>;
Hal Finkel27774d92014-03-13 07:58:58 +0000956
957let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000958
Nemanja Ivanovic6f22b412016-09-27 08:42:12 +0000959def : Pat<(v4i32 (vnot_ppc v4i32:$A)),
960 (v4i32 (XXLNOR $A, $A))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000961let Predicates = [IsBigEndian] in {
Hal Finkel27774d92014-03-13 07:58:58 +0000962def : Pat<(v2f64 (scalar_to_vector f64:$A)),
Hal Finkel19be5062014-03-29 05:29:01 +0000963 (v2f64 (SUBREG_TO_REG (i64 1), $A, sub_64))>;
Hal Finkel27774d92014-03-13 07:58:58 +0000964
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000965def : Pat<(f64 (extractelt v2f64:$S, 0)),
Hal Finkel19be5062014-03-29 05:29:01 +0000966 (f64 (EXTRACT_SUBREG $S, sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000967def : Pat<(f64 (extractelt v2f64:$S, 1)),
Hal Finkel19be5062014-03-29 05:29:01 +0000968 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000969}
970
971let Predicates = [IsLittleEndian] in {
972def : Pat<(v2f64 (scalar_to_vector f64:$A)),
973 (v2f64 (XXPERMDI (SUBREG_TO_REG (i64 1), $A, sub_64),
974 (SUBREG_TO_REG (i64 1), $A, sub_64), 0))>;
975
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000976def : Pat<(f64 (extractelt v2f64:$S, 0)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000977 (f64 (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64))>;
Matt Arsenaultfbd9bbf2015-12-11 19:20:16 +0000978def : Pat<(f64 (extractelt v2f64:$S, 1)),
Bill Schmidt10f6eb92014-12-09 16:43:32 +0000979 (f64 (EXTRACT_SUBREG $S, sub_64))>;
980}
Hal Finkel27774d92014-03-13 07:58:58 +0000981
982// Additional fnmsub patterns: -a*c + b == -(a*c - b)
983def : Pat<(fma (fneg f64:$A), f64:$C, f64:$B),
984 (XSNMSUBADP $B, $C, $A)>;
985def : Pat<(fma f64:$A, (fneg f64:$C), f64:$B),
986 (XSNMSUBADP $B, $C, $A)>;
987
988def : Pat<(fma (fneg v2f64:$A), v2f64:$C, v2f64:$B),
989 (XVNMSUBADP $B, $C, $A)>;
990def : Pat<(fma v2f64:$A, (fneg v2f64:$C), v2f64:$B),
991 (XVNMSUBADP $B, $C, $A)>;
992
993def : Pat<(fma (fneg v4f32:$A), v4f32:$C, v4f32:$B),
994 (XVNMSUBASP $B, $C, $A)>;
995def : Pat<(fma v4f32:$A, (fneg v4f32:$C), v4f32:$B),
996 (XVNMSUBASP $B, $C, $A)>;
997
Hal Finkel9e0baa62014-04-01 19:24:27 +0000998def : Pat<(v2f64 (bitconvert v4f32:$A)),
999 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +00001000def : Pat<(v2f64 (bitconvert v4i32:$A)),
1001 (COPY_TO_REGCLASS $A, VSRC)>;
1002def : Pat<(v2f64 (bitconvert v8i16:$A)),
1003 (COPY_TO_REGCLASS $A, VSRC)>;
1004def : Pat<(v2f64 (bitconvert v16i8:$A)),
1005 (COPY_TO_REGCLASS $A, VSRC)>;
1006
Hal Finkel9e0baa62014-04-01 19:24:27 +00001007def : Pat<(v4f32 (bitconvert v2f64:$A)),
1008 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkel27774d92014-03-13 07:58:58 +00001009def : Pat<(v4i32 (bitconvert v2f64:$A)),
1010 (COPY_TO_REGCLASS $A, VRRC)>;
1011def : Pat<(v8i16 (bitconvert v2f64:$A)),
1012 (COPY_TO_REGCLASS $A, VRRC)>;
1013def : Pat<(v16i8 (bitconvert v2f64:$A)),
1014 (COPY_TO_REGCLASS $A, VRRC)>;
1015
Hal Finkel9e0baa62014-04-01 19:24:27 +00001016def : Pat<(v2i64 (bitconvert v4f32:$A)),
1017 (COPY_TO_REGCLASS $A, VSRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +00001018def : Pat<(v2i64 (bitconvert v4i32:$A)),
1019 (COPY_TO_REGCLASS $A, VSRC)>;
1020def : Pat<(v2i64 (bitconvert v8i16:$A)),
1021 (COPY_TO_REGCLASS $A, VSRC)>;
1022def : Pat<(v2i64 (bitconvert v16i8:$A)),
1023 (COPY_TO_REGCLASS $A, VSRC)>;
1024
Hal Finkel9e0baa62014-04-01 19:24:27 +00001025def : Pat<(v4f32 (bitconvert v2i64:$A)),
1026 (COPY_TO_REGCLASS $A, VRRC)>;
Hal Finkela6c8b512014-03-26 16:12:58 +00001027def : Pat<(v4i32 (bitconvert v2i64:$A)),
1028 (COPY_TO_REGCLASS $A, VRRC)>;
1029def : Pat<(v8i16 (bitconvert v2i64:$A)),
1030 (COPY_TO_REGCLASS $A, VRRC)>;
1031def : Pat<(v16i8 (bitconvert v2i64:$A)),
1032 (COPY_TO_REGCLASS $A, VRRC)>;
1033
Hal Finkel9281c9a2014-03-26 18:26:30 +00001034def : Pat<(v2f64 (bitconvert v2i64:$A)),
1035 (COPY_TO_REGCLASS $A, VRRC)>;
1036def : Pat<(v2i64 (bitconvert v2f64:$A)),
1037 (COPY_TO_REGCLASS $A, VRRC)>;
1038
Kit Bartond4eb73c2015-05-05 16:10:44 +00001039def : Pat<(v2f64 (bitconvert v1i128:$A)),
1040 (COPY_TO_REGCLASS $A, VRRC)>;
1041def : Pat<(v1i128 (bitconvert v2f64:$A)),
1042 (COPY_TO_REGCLASS $A, VRRC)>;
1043
Stefan Pintilie927e8bf2018-10-23 17:11:36 +00001044def : Pat<(v2i64 (bitconvert f128:$A)),
1045 (COPY_TO_REGCLASS $A, VRRC)>;
1046def : Pat<(v4i32 (bitconvert f128:$A)),
1047 (COPY_TO_REGCLASS $A, VRRC)>;
1048def : Pat<(v8i16 (bitconvert f128:$A)),
1049 (COPY_TO_REGCLASS $A, VRRC)>;
1050def : Pat<(v16i8 (bitconvert f128:$A)),
1051 (COPY_TO_REGCLASS $A, VRRC)>;
1052
Nemanja Ivanovic44513e52016-07-05 09:22:29 +00001053def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 0)),
1054 (v2f64 (XVCVSXWDP (v2i64 (XXMRGHW $C, $C))))>;
1055def : Pat<(v2f64 (PPCsvec2fp v4i32:$C, 1)),
1056 (v2f64 (XVCVSXWDP (v2i64 (XXMRGLW $C, $C))))>;
1057
1058def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 0)),
1059 (v2f64 (XVCVUXWDP (v2i64 (XXMRGHW $C, $C))))>;
1060def : Pat<(v2f64 (PPCuvec2fp v4i32:$C, 1)),
1061 (v2f64 (XVCVUXWDP (v2i64 (XXMRGLW $C, $C))))>;
1062
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001063// Loads.
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001064let Predicates = [HasVSX, HasOnlySwappingMemOps] in {
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001065 def : Pat<(v2f64 (PPClxvd2x xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001066
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001067 // Stores.
1068 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
1069 (STXVD2X $rS, xoaddr:$dst)>;
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00001070 def : Pat<(PPCstxvd2x v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1071}
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001072let Predicates = [IsBigEndian, HasVSX, HasOnlySwappingMemOps] in {
1073 def : Pat<(v2f64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1074 def : Pat<(v2i64 (load xoaddr:$src)), (LXVD2X xoaddr:$src)>;
1075 def : Pat<(v4i32 (load xoaddr:$src)), (LXVW4X xoaddr:$src)>;
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +00001076 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x xoaddr:$src)), (LXVW4X xoaddr:$src)>;
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001077 def : Pat<(store v2f64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
1078 def : Pat<(store v2i64:$rS, xoaddr:$dst), (STXVD2X $rS, xoaddr:$dst)>;
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +00001079 def : Pat<(store v4i32:$XT, xoaddr:$dst), (STXVW4X $XT, xoaddr:$dst)>;
1080 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
1081 (STXVW4X $rS, xoaddr:$dst)>;
Nemanja Ivanovice78ffed2016-09-22 10:32:03 +00001082}
Bill Schmidtfae5d712014-12-09 16:35:51 +00001083
1084// Permutes.
1085def : Pat<(v2f64 (PPCxxswapd v2f64:$src)), (XXPERMDI $src, $src, 2)>;
1086def : Pat<(v2i64 (PPCxxswapd v2i64:$src)), (XXPERMDI $src, $src, 2)>;
1087def : Pat<(v4f32 (PPCxxswapd v4f32:$src)), (XXPERMDI $src, $src, 2)>;
1088def : Pat<(v4i32 (PPCxxswapd v4i32:$src)), (XXPERMDI $src, $src, 2)>;
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001089def : Pat<(v2f64 (PPCswapNoChain v2f64:$src)), (XXPERMDI $src, $src, 2)>;
Bill Schmidt2d1128a2014-10-17 15:13:38 +00001090
Tony Jiang0a429f02017-05-24 23:48:29 +00001091// PPCvecshl XT, XA, XA, 2 can be selected to both XXSLDWI XT,XA,XA,2 and
1092// XXSWAPD XT,XA (i.e. XXPERMDI XT,XA,XA,2), the later one is more profitable.
1093def : Pat<(v4i32 (PPCvecshl v4i32:$src, v4i32:$src, 2)), (XXPERMDI $src, $src, 2)>;
1094
Bill Schmidt61e65232014-10-22 13:13:40 +00001095// Selects.
1096def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001097 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1098def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001099 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1100def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001101 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1102def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETULE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001103 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1104def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETEQ)),
1105 (SELECT_VSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1106def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001107 (SELECT_VSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1108def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGE)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001109 (SELECT_VSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1110def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001111 (SELECT_VSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1112def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETUGT)),
Bill Schmidt61e65232014-10-22 13:13:40 +00001113 (SELECT_VSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1114def : Pat<(v2f64 (selectcc i1:$lhs, i1:$rhs, v2f64:$tval, v2f64:$fval, SETNE)),
1115 (SELECT_VSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1116
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001117def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001118 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1119def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001120 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1121def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001122 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1123def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETULE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001124 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1125def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETEQ)),
1126 (SELECT_VSFRC (CREQV $lhs, $rhs), $tval, $fval)>;
1127def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001128 (SELECT_VSFRC (CRORC $rhs, $lhs), $tval, $fval)>;
1129def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGE)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001130 (SELECT_VSFRC (CRORC $lhs, $rhs), $tval, $fval)>;
1131def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001132 (SELECT_VSFRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1133def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETUGT)),
Bill Schmidt9c54bbd2014-10-22 16:58:20 +00001134 (SELECT_VSFRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1135def : Pat<(f64 (selectcc i1:$lhs, i1:$rhs, f64:$tval, f64:$fval, SETNE)),
1136 (SELECT_VSFRC (CRXOR $lhs, $rhs), $tval, $fval)>;
1137
Bill Schmidt76746922014-11-14 12:10:40 +00001138// Divides.
1139def : Pat<(int_ppc_vsx_xvdivsp v4f32:$A, v4f32:$B),
1140 (XVDIVSP $A, $B)>;
1141def : Pat<(int_ppc_vsx_xvdivdp v2f64:$A, v2f64:$B),
1142 (XVDIVDP $A, $B)>;
1143
Nemanja Ivanovic984a3612015-07-14 17:25:20 +00001144// Reciprocal estimate
1145def : Pat<(int_ppc_vsx_xvresp v4f32:$A),
1146 (XVRESP $A)>;
1147def : Pat<(int_ppc_vsx_xvredp v2f64:$A),
1148 (XVREDP $A)>;
1149
Nemanja Ivanovicd358b8f2015-07-05 06:03:51 +00001150// Recip. square root estimate
1151def : Pat<(int_ppc_vsx_xvrsqrtesp v4f32:$A),
1152 (XVRSQRTESP $A)>;
1153def : Pat<(int_ppc_vsx_xvrsqrtedp v2f64:$A),
1154 (XVRSQRTEDP $A)>;
1155
Zi Xuan Wu6a3c2792018-11-14 02:34:45 +00001156// Vector selection
1157def : Pat<(v16i8 (vselect v16i8:$vA, v16i8:$vB, v16i8:$vC)),
1158 (COPY_TO_REGCLASS
1159 (XXSEL (COPY_TO_REGCLASS $vC, VSRC),
1160 (COPY_TO_REGCLASS $vB, VSRC),
1161 (COPY_TO_REGCLASS $vA, VSRC)), VRRC)>;
1162def : Pat<(v8i16 (vselect v8i16:$vA, v8i16:$vB, v8i16:$vC)),
1163 (COPY_TO_REGCLASS
1164 (XXSEL (COPY_TO_REGCLASS $vC, VSRC),
1165 (COPY_TO_REGCLASS $vB, VSRC),
1166 (COPY_TO_REGCLASS $vA, VSRC)), VRRC)>;
1167def : Pat<(vselect v4i32:$vA, v4i32:$vB, v4i32:$vC),
1168 (XXSEL $vC, $vB, $vA)>;
1169def : Pat<(vselect v2i64:$vA, v2i64:$vB, v2i64:$vC),
1170 (XXSEL $vC, $vB, $vA)>;
1171def : Pat<(vselect v4i32:$vA, v4f32:$vB, v4f32:$vC),
1172 (XXSEL $vC, $vB, $vA)>;
1173def : Pat<(vselect v2i64:$vA, v2f64:$vB, v2f64:$vC),
1174 (XXSEL $vC, $vB, $vA)>;
1175
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001176let Predicates = [IsLittleEndian] in {
1177def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1178 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1179def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1180 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1181def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1182 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1183def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1184 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (f64 (COPY_TO_REGCLASS $S, VSRC)), VSFRC)))>;
1185} // IsLittleEndian
1186
1187let Predicates = [IsBigEndian] in {
1188def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1189 (f64 (XSCVSXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1190def : Pat<(f64 (PPCfcfid (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1191 (f64 (XSCVSXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1192def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 0))))),
1193 (f64 (XSCVUXDDP (COPY_TO_REGCLASS $S, VSFRC)))>;
1194def : Pat<(f64 (PPCfcfidu (PPCmtvsra (i64 (vector_extract v2i64:$S, 1))))),
1195 (f64 (XSCVUXDDP (COPY_TO_REGCLASS (XXPERMDI $S, $S, 2), VSFRC)))>;
1196} // IsBigEndian
1197
Hal Finkel27774d92014-03-13 07:58:58 +00001198} // AddedComplexity
1199} // HasVSX
1200
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00001201def ScalarLoads {
1202 dag Li8 = (i32 (extloadi8 xoaddr:$src));
1203 dag ZELi8 = (i32 (zextloadi8 xoaddr:$src));
1204 dag ZELi8i64 = (i64 (zextloadi8 xoaddr:$src));
1205 dag SELi8 = (i32 (sext_inreg (extloadi8 xoaddr:$src), i8));
1206 dag SELi8i64 = (i64 (sext_inreg (extloadi8 xoaddr:$src), i8));
1207
1208 dag Li16 = (i32 (extloadi16 xoaddr:$src));
1209 dag ZELi16 = (i32 (zextloadi16 xoaddr:$src));
1210 dag ZELi16i64 = (i64 (zextloadi16 xoaddr:$src));
1211 dag SELi16 = (i32 (sextloadi16 xoaddr:$src));
1212 dag SELi16i64 = (i64 (sextloadi16 xoaddr:$src));
1213
1214 dag Li32 = (i32 (load xoaddr:$src));
1215}
1216
Nemanja Ivanovic0f7715a2018-12-29 13:40:48 +00001217def DWToSPExtractConv {
1218 dag El0US1 = (f32 (PPCfcfidus
1219 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S1, 0))))));
1220 dag El1US1 = (f32 (PPCfcfidus
1221 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S1, 1))))));
1222 dag El0US2 = (f32 (PPCfcfidus
1223 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S2, 0))))));
1224 dag El1US2 = (f32 (PPCfcfidus
1225 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S2, 1))))));
1226 dag El0SS1 = (f32 (PPCfcfids
1227 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S1, 0))))));
1228 dag El1SS1 = (f32 (PPCfcfids
1229 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S1, 1))))));
1230 dag El0SS2 = (f32 (PPCfcfids
1231 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S2, 0))))));
1232 dag El1SS2 = (f32 (PPCfcfids
1233 (f64 (PPCmtvsra (i64 (vector_extract v2i64:$S2, 1))))));
1234 dag BVU = (v4f32 (build_vector El0US1, El1US1, El0US2, El1US2));
1235 dag BVS = (v4f32 (build_vector El0SS1, El1SS1, El0SS2, El1SS2));
1236}
1237
Kit Barton298beb52015-02-18 16:21:46 +00001238// The following VSX instructions were introduced in Power ISA 2.07
1239/* FIXME: if the operands are v2i64, these patterns will not match.
1240 we should define new patterns or otherwise match the same patterns
1241 when the elements are larger than i32.
1242*/
1243def HasP8Vector : Predicate<"PPCSubTarget->hasP8Vector()">;
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001244def HasDirectMove : Predicate<"PPCSubTarget->hasDirectMove()">;
Lei Huangc29229a2018-05-08 17:36:40 +00001245def NoP9Vector : Predicate<"!PPCSubTarget->hasP9Vector()">;
Kit Barton298beb52015-02-18 16:21:46 +00001246let Predicates = [HasP8Vector] in {
1247let AddedComplexity = 400 in { // Prefer VSX patterns over non-VSX patterns.
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00001248 let isCommutable = 1 in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001249 def XXLEQV : XX3Form<60, 186,
1250 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1251 "xxleqv $XT, $XA, $XB", IIC_VecGeneral,
1252 [(set v4i32:$XT, (vnot_ppc (xor v4i32:$XA, v4i32:$XB)))]>;
1253 def XXLNAND : XX3Form<60, 178,
1254 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1255 "xxlnand $XT, $XA, $XB", IIC_VecGeneral,
1256 [(set v4i32:$XT, (vnot_ppc (and v4i32:$XA,
Kit Barton298beb52015-02-18 16:21:46 +00001257 v4i32:$XB)))]>;
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00001258 } // isCommutable
Nemanja Ivanovicd9e4b4f2015-07-10 14:25:17 +00001259
Nemanja Ivanovic5655fb32015-07-10 12:38:08 +00001260 def : Pat<(int_ppc_vsx_xxleqv v4i32:$A, v4i32:$B),
1261 (XXLEQV $A, $B)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001262
1263 def XXLORC : XX3Form<60, 170,
1264 (outs vsrc:$XT), (ins vsrc:$XA, vsrc:$XB),
1265 "xxlorc $XT, $XA, $XB", IIC_VecGeneral,
1266 [(set v4i32:$XT, (or v4i32:$XA, (vnot_ppc v4i32:$XB)))]>;
1267
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001268 // VSX scalar loads introduced in ISA 2.07
Sean Fertile3c8c3852017-01-26 18:59:15 +00001269 let mayLoad = 1, mayStore = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001270 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001271 def LXSSPX : XX1Form_memOp<31, 524, (outs vssrc:$XT), (ins memrr:$src),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001272 "lxsspx $XT, $src", IIC_LdStLFD, []>;
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001273 def LXSIWAX : XX1Form_memOp<31, 76, (outs vsfrc:$XT), (ins memrr:$src),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001274 "lxsiwax $XT, $src", IIC_LdStLFD, []>;
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001275 def LXSIWZX : XX1Form_memOp<31, 12, (outs vsfrc:$XT), (ins memrr:$src),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001276 "lxsiwzx $XT, $src", IIC_LdStLFD, []>;
1277
Jinsong Jic7b43b92018-12-13 15:12:57 +00001278 // Pseudo instruction XFLOADf32 will be expanded to LXSSPX or LFSX later
1279 let CodeSize = 3 in
1280 def XFLOADf32 : PseudoXFormMemOp<(outs vssrc:$XT), (ins memrr:$src),
1281 "#XFLOADf32",
1282 [(set f32:$XT, (load xoaddr:$src))]>;
1283 // Pseudo instruction LIWAX will be expanded to LXSIWAX or LFIWAX later
1284 def LIWAX : PseudoXFormMemOp<(outs vsfrc:$XT), (ins memrr:$src),
1285 "#LIWAX",
1286 [(set f64:$XT, (PPClfiwax xoaddr:$src))]>;
1287 // Pseudo instruction LIWZX will be expanded to LXSIWZX or LFIWZX later
1288 def LIWZX : PseudoXFormMemOp<(outs vsfrc:$XT), (ins memrr:$src),
1289 "#LIWZX",
1290 [(set f64:$XT, (PPClfiwzx xoaddr:$src))]>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001291 } // mayLoad
1292
1293 // VSX scalar stores introduced in ISA 2.07
Sean Fertile3c8c3852017-01-26 18:59:15 +00001294 let mayStore = 1, mayLoad = 0 in {
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00001295 let CodeSize = 3 in
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001296 def STXSSPX : XX1Form_memOp<31, 652, (outs), (ins vssrc:$XT, memrr:$dst),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001297 "stxsspx $XT, $dst", IIC_LdStSTFD, []>;
Stefan Pintilie26d4f922018-03-26 17:39:18 +00001298 def STXSIWX : XX1Form_memOp<31, 140, (outs), (ins vsfrc:$XT, memrr:$dst),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001299 "stxsiwx $XT, $dst", IIC_LdStSTFD, []>;
1300
Jinsong Jic7b43b92018-12-13 15:12:57 +00001301 // Pseudo instruction XFSTOREf32 will be expanded to STXSSPX or STFSX later
1302 let CodeSize = 3 in
1303 def XFSTOREf32 : PseudoXFormMemOp<(outs), (ins vssrc:$XT, memrr:$dst),
1304 "#XFSTOREf32",
1305 [(store f32:$XT, xoaddr:$dst)]>;
1306 // Pseudo instruction STIWX will be expanded to STXSIWX or STFIWX later
1307 def STIWX : PseudoXFormMemOp<(outs), (ins vsfrc:$XT, memrr:$dst),
1308 "#STIWX",
1309 [(PPCstfiwx f64:$XT, xoaddr:$dst)]>;
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001310 } // mayStore
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001311
1312 def : Pat<(f64 (extloadf32 xoaddr:$src)),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001313 (COPY_TO_REGCLASS (XFLOADf32 xoaddr:$src), VSFRC)>;
Lei Huangcd4f3852018-03-12 19:26:18 +00001314 def : Pat<(f32 (fpround (f64 (extloadf32 xoaddr:$src)))),
Tony Jiang438bf4a2017-11-20 14:38:30 +00001315 (f32 (XFLOADf32 xoaddr:$src))>;
Michael Kuperstein2bc3d4d2016-08-18 20:08:15 +00001316 def : Pat<(f64 (fpextend f32:$src)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001317 (COPY_TO_REGCLASS $src, VSFRC)>;
Hal Finkela2cdbce2015-08-30 22:12:50 +00001318
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001319 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001320 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1321 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001322 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1323 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETLE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001324 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1325 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETULE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001326 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1327 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETEQ)),
1328 (SELECT_VSSRC (CREQV $lhs, $rhs), $tval, $fval)>;
1329 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001330 (SELECT_VSSRC (CRORC $rhs, $lhs), $tval, $fval)>;
1331 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGE)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001332 (SELECT_VSSRC (CRORC $lhs, $rhs), $tval, $fval)>;
1333 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETGT)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001334 (SELECT_VSSRC (CRANDC $rhs, $lhs), $tval, $fval)>;
1335 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETUGT)),
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001336 (SELECT_VSSRC (CRANDC $lhs, $rhs), $tval, $fval)>;
1337 def : Pat<(f32 (selectcc i1:$lhs, i1:$rhs, f32:$tval, f32:$fval, SETNE)),
Hal Finkela2cdbce2015-08-30 22:12:50 +00001338 (SELECT_VSSRC (CRXOR $lhs, $rhs), $tval, $fval)>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001339
1340 // VSX Elementary Scalar FP arithmetic (SP)
1341 let isCommutable = 1 in {
1342 def XSADDSP : XX3Form<60, 0,
1343 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1344 "xsaddsp $XT, $XA, $XB", IIC_VecFP,
1345 [(set f32:$XT, (fadd f32:$XA, f32:$XB))]>;
1346 def XSMULSP : XX3Form<60, 16,
1347 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1348 "xsmulsp $XT, $XA, $XB", IIC_VecFP,
1349 [(set f32:$XT, (fmul f32:$XA, f32:$XB))]>;
1350 } // isCommutable
1351
1352 def XSDIVSP : XX3Form<60, 24,
1353 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1354 "xsdivsp $XT, $XA, $XB", IIC_FPDivS,
1355 [(set f32:$XT, (fdiv f32:$XA, f32:$XB))]>;
1356 def XSRESP : XX2Form<60, 26,
1357 (outs vssrc:$XT), (ins vssrc:$XB),
1358 "xsresp $XT, $XB", IIC_VecFP,
1359 [(set f32:$XT, (PPCfre f32:$XB))]>;
Lei Huang6270ab62018-07-04 21:59:16 +00001360 def XSRSP : XX2Form<60, 281,
1361 (outs vssrc:$XT), (ins vsfrc:$XB),
1362 "xsrsp $XT, $XB", IIC_VecFP, []>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001363 def XSSQRTSP : XX2Form<60, 11,
1364 (outs vssrc:$XT), (ins vssrc:$XB),
1365 "xssqrtsp $XT, $XB", IIC_FPSqrtS,
1366 [(set f32:$XT, (fsqrt f32:$XB))]>;
1367 def XSRSQRTESP : XX2Form<60, 10,
1368 (outs vssrc:$XT), (ins vssrc:$XB),
1369 "xsrsqrtesp $XT, $XB", IIC_VecFP,
1370 [(set f32:$XT, (PPCfrsqrte f32:$XB))]>;
1371 def XSSUBSP : XX3Form<60, 8,
1372 (outs vssrc:$XT), (ins vssrc:$XA, vssrc:$XB),
1373 "xssubsp $XT, $XA, $XB", IIC_VecFP,
1374 [(set f32:$XT, (fsub f32:$XA, f32:$XB))]>;
Nemanja Ivanovic376e1732015-05-29 17:13:25 +00001375
1376 // FMA Instructions
1377 let BaseName = "XSMADDASP" in {
1378 let isCommutable = 1 in
1379 def XSMADDASP : XX3Form<60, 1,
1380 (outs vssrc:$XT),
1381 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1382 "xsmaddasp $XT, $XA, $XB", IIC_VecFP,
1383 [(set f32:$XT, (fma f32:$XA, f32:$XB, f32:$XTi))]>,
1384 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1385 AltVSXFMARel;
1386 let IsVSXFMAAlt = 1 in
1387 def XSMADDMSP : XX3Form<60, 9,
1388 (outs vssrc:$XT),
1389 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1390 "xsmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1391 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1392 AltVSXFMARel;
1393 }
1394
1395 let BaseName = "XSMSUBASP" in {
1396 let isCommutable = 1 in
1397 def XSMSUBASP : XX3Form<60, 17,
1398 (outs vssrc:$XT),
1399 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1400 "xsmsubasp $XT, $XA, $XB", IIC_VecFP,
1401 [(set f32:$XT, (fma f32:$XA, f32:$XB,
1402 (fneg f32:$XTi)))]>,
1403 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1404 AltVSXFMARel;
1405 let IsVSXFMAAlt = 1 in
1406 def XSMSUBMSP : XX3Form<60, 25,
1407 (outs vssrc:$XT),
1408 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1409 "xsmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1410 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1411 AltVSXFMARel;
1412 }
1413
1414 let BaseName = "XSNMADDASP" in {
1415 let isCommutable = 1 in
1416 def XSNMADDASP : XX3Form<60, 129,
1417 (outs vssrc:$XT),
1418 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1419 "xsnmaddasp $XT, $XA, $XB", IIC_VecFP,
1420 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1421 f32:$XTi)))]>,
1422 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1423 AltVSXFMARel;
1424 let IsVSXFMAAlt = 1 in
1425 def XSNMADDMSP : XX3Form<60, 137,
1426 (outs vssrc:$XT),
1427 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1428 "xsnmaddmsp $XT, $XA, $XB", IIC_VecFP, []>,
1429 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1430 AltVSXFMARel;
1431 }
1432
1433 let BaseName = "XSNMSUBASP" in {
1434 let isCommutable = 1 in
1435 def XSNMSUBASP : XX3Form<60, 145,
1436 (outs vssrc:$XT),
1437 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1438 "xsnmsubasp $XT, $XA, $XB", IIC_VecFP,
1439 [(set f32:$XT, (fneg (fma f32:$XA, f32:$XB,
1440 (fneg f32:$XTi))))]>,
1441 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1442 AltVSXFMARel;
1443 let IsVSXFMAAlt = 1 in
1444 def XSNMSUBMSP : XX3Form<60, 153,
1445 (outs vssrc:$XT),
1446 (ins vssrc:$XTi, vssrc:$XA, vssrc:$XB),
1447 "xsnmsubmsp $XT, $XA, $XB", IIC_VecFP, []>,
1448 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">,
1449 AltVSXFMARel;
1450 }
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001451
1452 // Single Precision Conversions (FP <-> INT)
1453 def XSCVSXDSP : XX2Form<60, 312,
1454 (outs vssrc:$XT), (ins vsfrc:$XB),
1455 "xscvsxdsp $XT, $XB", IIC_VecFP,
1456 [(set f32:$XT, (PPCfcfids f64:$XB))]>;
1457 def XSCVUXDSP : XX2Form<60, 296,
1458 (outs vssrc:$XT), (ins vsfrc:$XB),
1459 "xscvuxdsp $XT, $XB", IIC_VecFP,
1460 [(set f32:$XT, (PPCfcfidus f64:$XB))]>;
1461
1462 // Conversions between vector and scalar single precision
1463 def XSCVDPSPN : XX2Form<60, 267, (outs vsrc:$XT), (ins vssrc:$XB),
1464 "xscvdpspn $XT, $XB", IIC_VecFP, []>;
1465 def XSCVSPDPN : XX2Form<60, 331, (outs vssrc:$XT), (ins vsrc:$XB),
1466 "xscvspdpn $XT, $XB", IIC_VecFP, []>;
1467
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001468 let Predicates = [IsLittleEndian] in {
Nemanja Ivanovic0f7715a2018-12-29 13:40:48 +00001469 def : Pat<DWToSPExtractConv.El0SS1,
1470 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S1, $S1, 2), VSFRC)))>;
1471 def : Pat<DWToSPExtractConv.El1SS1,
Lei Huangcd4f3852018-03-12 19:26:18 +00001472 (f32 (XSCVSXDSP (COPY_TO_REGCLASS
Nemanja Ivanovic0f7715a2018-12-29 13:40:48 +00001473 (f64 (COPY_TO_REGCLASS $S1, VSRC)), VSFRC)))>;
1474 def : Pat<DWToSPExtractConv.El0US1,
1475 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S1, $S1, 2), VSFRC)))>;
1476 def : Pat<DWToSPExtractConv.El1US1,
Lei Huangcd4f3852018-03-12 19:26:18 +00001477 (f32 (XSCVUXDSP (COPY_TO_REGCLASS
Nemanja Ivanovic0f7715a2018-12-29 13:40:48 +00001478 (f64 (COPY_TO_REGCLASS $S1, VSRC)), VSFRC)))>;
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001479 }
1480
1481 let Predicates = [IsBigEndian] in {
Nemanja Ivanovic0f7715a2018-12-29 13:40:48 +00001482 def : Pat<DWToSPExtractConv.El0SS1,
1483 (f32 (XSCVSXDSP (COPY_TO_REGCLASS $S1, VSFRC)))>;
1484 def : Pat<DWToSPExtractConv.El1SS1,
1485 (f32 (XSCVSXDSP (COPY_TO_REGCLASS (XXPERMDI $S1, $S1, 2), VSFRC)))>;
1486 def : Pat<DWToSPExtractConv.El0US1,
1487 (f32 (XSCVUXDSP (COPY_TO_REGCLASS $S1, VSFRC)))>;
1488 def : Pat<DWToSPExtractConv.El1US1,
1489 (f32 (XSCVUXDSP (COPY_TO_REGCLASS (XXPERMDI $S1, $S1, 2), VSFRC)))>;
Nemanja Ivanovicd3c284f2016-07-18 15:30:00 +00001490 }
Lei Huangc29229a2018-05-08 17:36:40 +00001491
1492 // Instructions for converting float to i64 feeding a store.
1493 let Predicates = [NoP9Vector] in {
1494 def : Pat<(PPCstore_scal_int_from_vsr
1495 (f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), xoaddr:$dst, 8),
1496 (STXSDX (XSCVDPSXDS f64:$src), xoaddr:$dst)>;
1497 def : Pat<(PPCstore_scal_int_from_vsr
1498 (f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), xoaddr:$dst, 8),
1499 (STXSDX (XSCVDPUXDS f64:$src), xoaddr:$dst)>;
1500 }
1501
1502 // Instructions for converting float to i32 feeding a store.
1503 def : Pat<(PPCstore_scal_int_from_vsr
1504 (f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), xoaddr:$dst, 4),
1505 (STIWX (XSCVDPSXWS f64:$src), xoaddr:$dst)>;
1506 def : Pat<(PPCstore_scal_int_from_vsr
1507 (f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), xoaddr:$dst, 4),
1508 (STIWX (XSCVDPUXWS f64:$src), xoaddr:$dst)>;
1509
Nemanja Ivanovicf3c94b12015-05-07 18:24:05 +00001510} // AddedComplexity = 400
Kit Barton298beb52015-02-18 16:21:46 +00001511} // HasP8Vector
Nemanja Ivanovicc38b5312015-04-11 10:40:42 +00001512
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00001513let AddedComplexity = 400 in {
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001514let Predicates = [HasDirectMove] in {
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001515 // VSX direct move instructions
1516 def MFVSRD : XX1_RS6_RD5_XO<31, 51, (outs g8rc:$rA), (ins vsfrc:$XT),
1517 "mfvsrd $rA, $XT", IIC_VecGeneral,
1518 [(set i64:$rA, (PPCmfvsr f64:$XT))]>,
1519 Requires<[In64BitMode]>;
Nemanja Ivanovicffcf0fb2017-03-15 16:04:53 +00001520 let isCodeGenOnly = 1 in
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00001521 def MFVRD : XX1_RS6_RD5_XO<31, 51, (outs g8rc:$rA), (ins vsrc:$XT),
Nemanja Ivanovicffcf0fb2017-03-15 16:04:53 +00001522 "mfvsrd $rA, $XT", IIC_VecGeneral,
1523 []>,
1524 Requires<[In64BitMode]>;
Nemanja Ivanovicf02def62015-05-21 19:32:49 +00001525 def MFVSRWZ : XX1_RS6_RD5_XO<31, 115, (outs gprc:$rA), (ins vsfrc:$XT),
1526 "mfvsrwz $rA, $XT", IIC_VecGeneral,
1527 [(set i32:$rA, (PPCmfvsr f64:$XT))]>;
1528 def MTVSRD : XX1_RS6_RD5_XO<31, 179, (outs vsfrc:$XT), (ins g8rc:$rA),
1529 "mtvsrd $XT, $rA", IIC_VecGeneral,
1530 [(set f64:$XT, (PPCmtvsra i64:$rA))]>,
1531 Requires<[In64BitMode]>;
1532 def MTVSRWA : XX1_RS6_RD5_XO<31, 211, (outs vsfrc:$XT), (ins gprc:$rA),
1533 "mtvsrwa $XT, $rA", IIC_VecGeneral,
1534 [(set f64:$XT, (PPCmtvsra i32:$rA))]>;
1535 def MTVSRWZ : XX1_RS6_RD5_XO<31, 243, (outs vsfrc:$XT), (ins gprc:$rA),
1536 "mtvsrwz $XT, $rA", IIC_VecGeneral,
1537 [(set f64:$XT, (PPCmtvsrz i32:$rA))]>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001538} // HasDirectMove
1539
1540let Predicates = [IsISA3_0, HasDirectMove] in {
1541 def MTVSRWS: XX1_RS6_RD5_XO<31, 403, (outs vsrc:$XT), (ins gprc:$rA),
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00001542 "mtvsrws $XT, $rA", IIC_VecGeneral, []>;
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001543
Guozhi Wei22e7da92017-05-11 22:17:35 +00001544 def MTVSRDD: XX1Form<31, 435, (outs vsrc:$XT), (ins g8rc_nox0:$rA, g8rc:$rB),
Ehsan Amiri99b017a2016-03-31 17:47:17 +00001545 "mtvsrdd $XT, $rA, $rB", IIC_VecGeneral,
1546 []>, Requires<[In64BitMode]>;
1547
1548 def MFVSRLD: XX1_RS6_RD5_XO<31, 307, (outs g8rc:$rA), (ins vsrc:$XT),
1549 "mfvsrld $rA, $XT", IIC_VecGeneral,
1550 []>, Requires<[In64BitMode]>;
1551
1552} // IsISA3_0, HasDirectMove
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00001553} // AddedComplexity = 400
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001554
Nemanja Ivanovicffcf0fb2017-03-15 16:04:53 +00001555// We want to parse this from asm, but we don't want to emit this as it would
1556// be emitted with a VSX reg. So leave Emit = 0 here.
1557def : InstAlias<"mfvrd $rA, $XT",
1558 (MFVRD g8rc:$rA, vrrc:$XT), 0>;
1559def : InstAlias<"mffprd $rA, $src",
1560 (MFVSRD g8rc:$rA, f8rc:$src)>;
1561
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001562/* Direct moves of various widths from GPR's into VSR's. Each move lines
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001563 the value up into element 0 (both BE and LE). Namely, entities smaller than
1564 a doubleword are shifted left and moved for BE. For LE, they're moved, then
1565 swapped to go into the least significant element of the VSR.
1566*/
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001567def MovesToVSR {
1568 dag BE_BYTE_0 =
1569 (MTVSRD
1570 (RLDICR
1571 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 56, 7));
1572 dag BE_HALF_0 =
1573 (MTVSRD
1574 (RLDICR
1575 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 48, 15));
1576 dag BE_WORD_0 =
1577 (MTVSRD
1578 (RLDICR
1579 (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32), 32, 31));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001580 dag BE_DWORD_0 = (MTVSRD $A);
1581
1582 dag LE_MTVSRW = (MTVSRD (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001583 dag LE_WORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1584 LE_MTVSRW, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001585 dag LE_WORD_0 = (XXPERMDI LE_WORD_1, LE_WORD_1, 2);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001586 dag LE_DWORD_1 = (v2i64 (INSERT_SUBREG (v2i64 (IMPLICIT_DEF)),
1587 BE_DWORD_0, sub_64));
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001588 dag LE_DWORD_0 = (XXPERMDI LE_DWORD_1, LE_DWORD_1, 2);
1589}
1590
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001591/* Patterns for extracting elements out of vectors. Integer elements are
1592 extracted using direct move operations. Patterns for extracting elements
1593 whose indices are not available at compile time are also provided with
1594 various _VARIABLE_ patterns.
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001595 The numbering for the DAG's is for LE, but when used on BE, the correct
1596 LE element can just be used (i.e. LE_BYTE_2 == BE_BYTE_13).
1597*/
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001598def VectorExtractions {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001599 // Doubleword extraction
1600 dag LE_DWORD_0 =
1601 (MFVSRD
1602 (EXTRACT_SUBREG
1603 (XXPERMDI (COPY_TO_REGCLASS $S, VSRC),
1604 (COPY_TO_REGCLASS $S, VSRC), 2), sub_64));
1605 dag LE_DWORD_1 = (MFVSRD
1606 (EXTRACT_SUBREG
1607 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1608
1609 // Word extraction
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001610 dag LE_WORD_0 = (MFVSRWZ (EXTRACT_SUBREG (XXPERMDI $S, $S, 2), sub_64));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001611 dag LE_WORD_1 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 1), sub_64));
1612 dag LE_WORD_2 = (MFVSRWZ (EXTRACT_SUBREG
1613 (v2i64 (COPY_TO_REGCLASS $S, VSRC)), sub_64));
1614 dag LE_WORD_3 = (MFVSRWZ (EXTRACT_SUBREG (XXSLDWI $S, $S, 3), sub_64));
1615
1616 // Halfword extraction
1617 dag LE_HALF_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 48), sub_32));
1618 dag LE_HALF_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 48), sub_32));
1619 dag LE_HALF_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 48), sub_32));
1620 dag LE_HALF_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 48), sub_32));
1621 dag LE_HALF_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 48), sub_32));
1622 dag LE_HALF_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 48), sub_32));
1623 dag LE_HALF_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 48), sub_32));
1624 dag LE_HALF_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 48), sub_32));
1625
1626 // Byte extraction
1627 dag LE_BYTE_0 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 0, 56), sub_32));
1628 dag LE_BYTE_1 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 56, 56), sub_32));
1629 dag LE_BYTE_2 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 48, 56), sub_32));
1630 dag LE_BYTE_3 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 40, 56), sub_32));
1631 dag LE_BYTE_4 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 32, 56), sub_32));
1632 dag LE_BYTE_5 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 24, 56), sub_32));
1633 dag LE_BYTE_6 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 16, 56), sub_32));
1634 dag LE_BYTE_7 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_0, 8, 56), sub_32));
1635 dag LE_BYTE_8 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 0, 56), sub_32));
1636 dag LE_BYTE_9 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 56, 56), sub_32));
1637 dag LE_BYTE_10 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 48, 56), sub_32));
1638 dag LE_BYTE_11 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 40, 56), sub_32));
1639 dag LE_BYTE_12 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 32, 56), sub_32));
1640 dag LE_BYTE_13 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 24, 56), sub_32));
1641 dag LE_BYTE_14 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 16, 56), sub_32));
1642 dag LE_BYTE_15 = (i32 (EXTRACT_SUBREG (RLDICL LE_DWORD_1, 8, 56), sub_32));
1643
1644 /* Variable element number (BE and LE patterns must be specified separately)
1645 This is a rather involved process.
1646
1647 Conceptually, this is how the move is accomplished:
1648 1. Identify which doubleword contains the element
1649 2. Shift in the VMX register so that the correct doubleword is correctly
1650 lined up for the MFVSRD
1651 3. Perform the move so that the element (along with some extra stuff)
1652 is in the GPR
1653 4. Right shift within the GPR so that the element is right-justified
1654
1655 Of course, the index is an element number which has a different meaning
1656 on LE/BE so the patterns have to be specified separately.
1657
1658 Note: The final result will be the element right-justified with high
1659 order bits being arbitrarily defined (namely, whatever was in the
1660 vector register to the left of the value originally).
1661 */
1662
1663 /* LE variable byte
1664 Number 1. above:
1665 - For elements 0-7, we shift left by 8 bytes since they're on the right
1666 - For elements 8-15, we need not shift (shift left by zero bytes)
1667 This is accomplished by inverting the bits of the index and AND-ing
1668 with 0x8 (i.e. clearing all bits of the index and inverting bit 60).
1669 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001670 dag LE_VBYTE_PERM_VEC = (v16i8 (LVSL ZERO8, (ANDC8 (LI8 8), $Idx)));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001671
1672 // Number 2. above:
1673 // - Now that we set up the shift amount, we shift in the VMX register
Lei Huangcd4f3852018-03-12 19:26:18 +00001674 dag LE_VBYTE_PERMUTE = (v16i8 (VPERM $S, $S, LE_VBYTE_PERM_VEC));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001675
1676 // Number 3. above:
1677 // - The doubleword containing our element is moved to a GPR
1678 dag LE_MV_VBYTE = (MFVSRD
1679 (EXTRACT_SUBREG
1680 (v2i64 (COPY_TO_REGCLASS LE_VBYTE_PERMUTE, VSRC)),
1681 sub_64));
1682
1683 /* Number 4. above:
1684 - Truncate the element number to the range 0-7 (8-15 are symmetrical
1685 and out of range values are truncated accordingly)
1686 - Multiply by 8 as we need to shift right by the number of bits, not bytes
1687 - Shift right in the GPR by the calculated value
1688 */
1689 dag LE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 7), $Idx), 3, 60),
1690 sub_32);
1691 dag LE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD LE_MV_VBYTE, LE_VBYTE_SHIFT),
1692 sub_32);
1693
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001694 /* LE variable halfword
1695 Number 1. above:
1696 - For elements 0-3, we shift left by 8 since they're on the right
1697 - For elements 4-7, we need not shift (shift left by zero bytes)
1698 Similarly to the byte pattern, we invert the bits of the index, but we
1699 AND with 0x4 (i.e. clear all bits of the index and invert bit 61).
1700 Of course, the shift is still by 8 bytes, so we must multiply by 2.
1701 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001702 dag LE_VHALF_PERM_VEC =
1703 (v16i8 (LVSL ZERO8, (RLDICR (ANDC8 (LI8 4), $Idx), 1, 62)));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001704
1705 // Number 2. above:
1706 // - Now that we set up the shift amount, we shift in the VMX register
Lei Huangcd4f3852018-03-12 19:26:18 +00001707 dag LE_VHALF_PERMUTE = (v16i8 (VPERM $S, $S, LE_VHALF_PERM_VEC));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001708
1709 // Number 3. above:
1710 // - The doubleword containing our element is moved to a GPR
1711 dag LE_MV_VHALF = (MFVSRD
1712 (EXTRACT_SUBREG
1713 (v2i64 (COPY_TO_REGCLASS LE_VHALF_PERMUTE, VSRC)),
1714 sub_64));
1715
1716 /* Number 4. above:
1717 - Truncate the element number to the range 0-3 (4-7 are symmetrical
1718 and out of range values are truncated accordingly)
1719 - Multiply by 16 as we need to shift right by the number of bits
1720 - Shift right in the GPR by the calculated value
1721 */
1722 dag LE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 3), $Idx), 4, 59),
1723 sub_32);
1724 dag LE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD LE_MV_VHALF, LE_VHALF_SHIFT),
1725 sub_32);
1726
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001727 /* LE variable word
1728 Number 1. above:
1729 - For elements 0-1, we shift left by 8 since they're on the right
1730 - For elements 2-3, we need not shift
1731 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001732 dag LE_VWORD_PERM_VEC = (v16i8 (LVSL ZERO8,
1733 (RLDICR (ANDC8 (LI8 2), $Idx), 2, 61)));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001734
1735 // Number 2. above:
1736 // - Now that we set up the shift amount, we shift in the VMX register
Lei Huangcd4f3852018-03-12 19:26:18 +00001737 dag LE_VWORD_PERMUTE = (v16i8 (VPERM $S, $S, LE_VWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001738
1739 // Number 3. above:
1740 // - The doubleword containing our element is moved to a GPR
1741 dag LE_MV_VWORD = (MFVSRD
1742 (EXTRACT_SUBREG
1743 (v2i64 (COPY_TO_REGCLASS LE_VWORD_PERMUTE, VSRC)),
1744 sub_64));
1745
1746 /* Number 4. above:
1747 - Truncate the element number to the range 0-1 (2-3 are symmetrical
1748 and out of range values are truncated accordingly)
1749 - Multiply by 32 as we need to shift right by the number of bits
1750 - Shift right in the GPR by the calculated value
1751 */
1752 dag LE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (AND8 (LI8 1), $Idx), 5, 58),
1753 sub_32);
1754 dag LE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD LE_MV_VWORD, LE_VWORD_SHIFT),
1755 sub_32);
1756
1757 /* LE variable doubleword
1758 Number 1. above:
1759 - For element 0, we shift left by 8 since it's on the right
1760 - For element 1, we need not shift
1761 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001762 dag LE_VDWORD_PERM_VEC = (v16i8 (LVSL ZERO8,
1763 (RLDICR (ANDC8 (LI8 1), $Idx), 3, 60)));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001764
1765 // Number 2. above:
1766 // - Now that we set up the shift amount, we shift in the VMX register
Lei Huangcd4f3852018-03-12 19:26:18 +00001767 dag LE_VDWORD_PERMUTE = (v16i8 (VPERM $S, $S, LE_VDWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001768
1769 // Number 3. above:
1770 // - The doubleword containing our element is moved to a GPR
1771 // - Number 4. is not needed for the doubleword as the value is 64-bits
1772 dag LE_VARIABLE_DWORD =
1773 (MFVSRD (EXTRACT_SUBREG
1774 (v2i64 (COPY_TO_REGCLASS LE_VDWORD_PERMUTE, VSRC)),
1775 sub_64));
1776
1777 /* LE variable float
1778 - Shift the vector to line up the desired element to BE Word 0
1779 - Convert 32-bit float to a 64-bit single precision float
1780 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001781 dag LE_VFLOAT_PERM_VEC = (v16i8 (LVSL ZERO8,
1782 (RLDICR (XOR8 (LI8 3), $Idx), 2, 61)));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001783 dag LE_VFLOAT_PERMUTE = (VPERM $S, $S, LE_VFLOAT_PERM_VEC);
1784 dag LE_VARIABLE_FLOAT = (XSCVSPDPN LE_VFLOAT_PERMUTE);
1785
1786 /* LE variable double
1787 Same as the LE doubleword except there is no move.
1788 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001789 dag LE_VDOUBLE_PERMUTE = (v16i8 (VPERM (v16i8 (COPY_TO_REGCLASS $S, VRRC)),
1790 (v16i8 (COPY_TO_REGCLASS $S, VRRC)),
1791 LE_VDWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001792 dag LE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS LE_VDOUBLE_PERMUTE, VSRC);
1793
1794 /* BE variable byte
1795 The algorithm here is the same as the LE variable byte except:
1796 - The shift in the VMX register is by 0/8 for opposite element numbers so
1797 we simply AND the element number with 0x8
1798 - The order of elements after the move to GPR is reversed, so we invert
1799 the bits of the index prior to truncating to the range 0-7
1800 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001801 dag BE_VBYTE_PERM_VEC = (v16i8 (LVSL ZERO8, (ANDIo8 $Idx, 8)));
1802 dag BE_VBYTE_PERMUTE = (v16i8 (VPERM $S, $S, BE_VBYTE_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001803 dag BE_MV_VBYTE = (MFVSRD
1804 (EXTRACT_SUBREG
1805 (v2i64 (COPY_TO_REGCLASS BE_VBYTE_PERMUTE, VSRC)),
1806 sub_64));
1807 dag BE_VBYTE_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 7), $Idx), 3, 60),
1808 sub_32);
1809 dag BE_VARIABLE_BYTE = (EXTRACT_SUBREG (SRD BE_MV_VBYTE, BE_VBYTE_SHIFT),
1810 sub_32);
1811
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001812 /* BE variable halfword
1813 The algorithm here is the same as the LE variable halfword except:
1814 - The shift in the VMX register is by 0/8 for opposite element numbers so
1815 we simply AND the element number with 0x4 and multiply by 2
1816 - The order of elements after the move to GPR is reversed, so we invert
1817 the bits of the index prior to truncating to the range 0-3
1818 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001819 dag BE_VHALF_PERM_VEC = (v16i8 (LVSL ZERO8,
1820 (RLDICR (ANDIo8 $Idx, 4), 1, 62)));
1821 dag BE_VHALF_PERMUTE = (v16i8 (VPERM $S, $S, BE_VHALF_PERM_VEC));
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001822 dag BE_MV_VHALF = (MFVSRD
1823 (EXTRACT_SUBREG
1824 (v2i64 (COPY_TO_REGCLASS BE_VHALF_PERMUTE, VSRC)),
1825 sub_64));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001826 dag BE_VHALF_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 3), $Idx), 4, 59),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001827 sub_32);
1828 dag BE_VARIABLE_HALF = (EXTRACT_SUBREG (SRD BE_MV_VHALF, BE_VHALF_SHIFT),
1829 sub_32);
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001830
1831 /* BE variable word
1832 The algorithm is the same as the LE variable word except:
1833 - The shift in the VMX register happens for opposite element numbers
1834 - The order of elements after the move to GPR is reversed, so we invert
1835 the bits of the index prior to truncating to the range 0-1
1836 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001837 dag BE_VWORD_PERM_VEC = (v16i8 (LVSL ZERO8,
1838 (RLDICR (ANDIo8 $Idx, 2), 2, 61)));
1839 dag BE_VWORD_PERMUTE = (v16i8 (VPERM $S, $S, BE_VWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001840 dag BE_MV_VWORD = (MFVSRD
1841 (EXTRACT_SUBREG
1842 (v2i64 (COPY_TO_REGCLASS BE_VWORD_PERMUTE, VSRC)),
1843 sub_64));
1844 dag BE_VWORD_SHIFT = (EXTRACT_SUBREG (RLDICR (ANDC8 (LI8 1), $Idx), 5, 58),
1845 sub_32);
1846 dag BE_VARIABLE_WORD = (EXTRACT_SUBREG (SRD BE_MV_VWORD, BE_VWORD_SHIFT),
1847 sub_32);
1848
1849 /* BE variable doubleword
1850 Same as the LE doubleword except we shift in the VMX register for opposite
1851 element indices.
1852 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001853 dag BE_VDWORD_PERM_VEC = (v16i8 (LVSL ZERO8,
1854 (RLDICR (ANDIo8 $Idx, 1), 3, 60)));
1855 dag BE_VDWORD_PERMUTE = (v16i8 (VPERM $S, $S, BE_VDWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001856 dag BE_VARIABLE_DWORD =
1857 (MFVSRD (EXTRACT_SUBREG
1858 (v2i64 (COPY_TO_REGCLASS BE_VDWORD_PERMUTE, VSRC)),
1859 sub_64));
1860
1861 /* BE variable float
1862 - Shift the vector to line up the desired element to BE Word 0
1863 - Convert 32-bit float to a 64-bit single precision float
1864 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001865 dag BE_VFLOAT_PERM_VEC = (v16i8 (LVSL ZERO8, (RLDICR $Idx, 2, 61)));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001866 dag BE_VFLOAT_PERMUTE = (VPERM $S, $S, BE_VFLOAT_PERM_VEC);
1867 dag BE_VARIABLE_FLOAT = (XSCVSPDPN BE_VFLOAT_PERMUTE);
1868
1869 /* BE variable double
1870 Same as the BE doubleword except there is no move.
1871 */
Lei Huangcd4f3852018-03-12 19:26:18 +00001872 dag BE_VDOUBLE_PERMUTE = (v16i8 (VPERM (v16i8 (COPY_TO_REGCLASS $S, VRRC)),
1873 (v16i8 (COPY_TO_REGCLASS $S, VRRC)),
1874 BE_VDWORD_PERM_VEC));
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001875 dag BE_VARIABLE_DOUBLE = (COPY_TO_REGCLASS BE_VDOUBLE_PERMUTE, VSRC);
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001876}
1877
Zaara Syeda48cb3c12017-11-27 17:11:03 +00001878def NoP9Altivec : Predicate<"!PPCSubTarget->hasP9Altivec()">;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00001879let AddedComplexity = 400 in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001880// v4f32 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001881let Predicates = [IsBigEndian, HasP8Vector] in {
1882 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1883 (v4f32 (XSCVDPSPN $A))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001884 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1885 (f32 (XSCVSPDPN $S))>;
1886 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
1887 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
1888 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001889 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001890 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
1891 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001892 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
1893 (f32 VectorExtractions.BE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001894} // IsBigEndian, HasP8Vector
1895
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001896// Variable index vector_extract for v2f64 does not require P8Vector
1897let Predicates = [IsBigEndian, HasVSX] in
1898 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
1899 (f64 VectorExtractions.BE_VARIABLE_DOUBLE)>;
1900
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001901let Predicates = [IsBigEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001902 // v16i8 scalar <-> vector conversions (BE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001903 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001904 (v16i8 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_BYTE_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001905 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001906 (v8i16 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_HALF_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001907 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001908 (v4i32 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_WORD_0, sub_64))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001909 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001910 (v2i64 (SUBREG_TO_REG (i64 1), MovesToVSR.BE_DWORD_0, sub_64))>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00001911
1912 // v2i64 scalar <-> vector conversions (BE)
1913 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
1914 (i64 VectorExtractions.LE_DWORD_1)>;
1915 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
1916 (i64 VectorExtractions.LE_DWORD_0)>;
1917 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
1918 (i64 VectorExtractions.BE_VARIABLE_DWORD)>;
1919} // IsBigEndian, HasDirectMove
1920
1921let Predicates = [IsBigEndian, HasDirectMove, NoP9Altivec] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001922 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001923 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001924 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001925 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001926 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001927 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001928 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001929 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001930 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001931 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001932 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001933 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001934 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001935 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001936 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001937 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001938 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001939 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001940 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001941 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001942 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001943 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001944 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001945 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001946 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001947 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001948 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001949 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001950 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001951 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001952 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001953 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001954 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001955 (i32 VectorExtractions.BE_VARIABLE_BYTE)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001956
1957 // v8i16 scalar <-> vector conversions (BE)
1958 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001959 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001960 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001961 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001962 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001963 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001964 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001965 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001966 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001967 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001968 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001969 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001970 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001971 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001972 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001973 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001974 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001975 (i32 VectorExtractions.BE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001976
1977 // v4i32 scalar <-> vector conversions (BE)
1978 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001979 (i32 VectorExtractions.LE_WORD_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001980 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001981 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001982 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001983 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001984 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00001985 (i32 VectorExtractions.LE_WORD_0)>;
1986 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
1987 (i32 VectorExtractions.BE_VARIABLE_WORD)>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00001988} // IsBigEndian, HasDirectMove, NoP9Altivec
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001989
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001990// v4f32 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00001991let Predicates = [IsLittleEndian, HasP8Vector] in {
1992 def : Pat<(v4f32 (scalar_to_vector f32:$A)),
1993 (v4f32 (XXSLDWI (XSCVDPSPN $A), (XSCVDPSPN $A), 1))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001994 def : Pat<(f32 (vector_extract v4f32:$S, 0)),
1995 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 3)))>;
1996 def : Pat<(f32 (vector_extract v4f32:$S, 1)),
Nemanja Ivanoviceebbcb62016-07-12 12:16:27 +00001997 (f32 (XSCVSPDPN (XXPERMDI $S, $S, 2)))>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00001998 def : Pat<(f32 (vector_extract v4f32:$S, 2)),
1999 (f32 (XSCVSPDPN (XXSLDWI $S, $S, 1)))>;
2000 def : Pat<(f32 (vector_extract v4f32:$S, 3)),
2001 (f32 (XSCVSPDPN $S))>;
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002002 def : Pat<(f32 (vector_extract v4f32:$S, i64:$Idx)),
2003 (f32 VectorExtractions.LE_VARIABLE_FLOAT)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002004} // IsLittleEndian, HasP8Vector
2005
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002006// Variable index vector_extract for v2f64 does not require P8Vector
2007let Predicates = [IsLittleEndian, HasVSX] in
2008 def : Pat<(f64 (vector_extract v2f64:$S, i64:$Idx)),
2009 (f64 VectorExtractions.LE_VARIABLE_DOUBLE)>;
2010
Zaara Syeda75098802018-11-05 17:31:26 +00002011def : Pat<(int_ppc_vsx_stxvd2x_be v2f64:$rS, xoaddr:$dst),
2012 (STXVD2X $rS, xoaddr:$dst)>;
2013def : Pat<(int_ppc_vsx_stxvw4x_be v4i32:$rS, xoaddr:$dst),
2014 (STXVW4X $rS, xoaddr:$dst)>;
Nemanja Ivanovicb89c27f2017-05-02 01:47:34 +00002015def : Pat<(v4i32 (int_ppc_vsx_lxvw4x_be xoaddr:$src)), (LXVW4X xoaddr:$src)>;
2016def : Pat<(v2f64 (int_ppc_vsx_lxvd2x_be xoaddr:$src)), (LXVD2X xoaddr:$src)>;
Tony Jiang5f850cd2016-11-15 14:25:56 +00002017
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002018// Variable index unsigned vector_extract on Power9
2019let Predicates = [HasP9Altivec, IsLittleEndian] in {
2020 def : Pat<(i64 (anyext (i32 (vector_extract v16i8:$S, i64:$Idx)))),
2021 (VEXTUBRX $Idx, $S)>;
2022
2023 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, i64:$Idx)))),
2024 (VEXTUHRX (RLWINM8 $Idx, 1, 28, 30), $S)>;
2025 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 0)))),
2026 (VEXTUHRX (LI8 0), $S)>;
2027 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 1)))),
2028 (VEXTUHRX (LI8 2), $S)>;
2029 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 2)))),
2030 (VEXTUHRX (LI8 4), $S)>;
2031 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 3)))),
2032 (VEXTUHRX (LI8 6), $S)>;
2033 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 4)))),
2034 (VEXTUHRX (LI8 8), $S)>;
2035 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 5)))),
2036 (VEXTUHRX (LI8 10), $S)>;
2037 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 6)))),
2038 (VEXTUHRX (LI8 12), $S)>;
2039 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 7)))),
2040 (VEXTUHRX (LI8 14), $S)>;
2041
2042 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
2043 (VEXTUWRX (RLWINM8 $Idx, 2, 28, 29), $S)>;
2044 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 0)))),
2045 (VEXTUWRX (LI8 0), $S)>;
2046 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 1)))),
2047 (VEXTUWRX (LI8 4), $S)>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002048 // For extracting LE word 2, MFVSRWZ is better than VEXTUWRX
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002049 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 2)))),
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002050 (INSERT_SUBREG (i64 (IMPLICIT_DEF)),
2051 (i32 VectorExtractions.LE_WORD_2), sub_32)>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002052 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 3)))),
2053 (VEXTUWRX (LI8 12), $S)>;
2054
2055 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
2056 (EXTSW (VEXTUWRX (RLWINM8 $Idx, 2, 28, 29), $S))>;
2057 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 0)))),
2058 (EXTSW (VEXTUWRX (LI8 0), $S))>;
2059 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 1)))),
2060 (EXTSW (VEXTUWRX (LI8 4), $S))>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002061 // For extracting LE word 2, MFVSRWZ is better than VEXTUWRX
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002062 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 2)))),
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002063 (EXTSW (INSERT_SUBREG (i64 (IMPLICIT_DEF)),
2064 (i32 VectorExtractions.LE_WORD_2), sub_32))>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002065 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 3)))),
2066 (EXTSW (VEXTUWRX (LI8 12), $S))>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002067
2068 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
2069 (i32 (EXTRACT_SUBREG (VEXTUBRX $Idx, $S), sub_32))>;
2070 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
2071 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 0), $S), sub_32))>;
2072 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
2073 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 1), $S), sub_32))>;
2074 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
2075 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 2), $S), sub_32))>;
2076 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
2077 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 3), $S), sub_32))>;
2078 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
2079 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 4), $S), sub_32))>;
2080 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
2081 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 5), $S), sub_32))>;
2082 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
2083 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 6), $S), sub_32))>;
2084 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
2085 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 7), $S), sub_32))>;
2086 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
2087 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 8), $S), sub_32))>;
2088 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
2089 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 9), $S), sub_32))>;
2090 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
2091 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 10), $S), sub_32))>;
2092 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
2093 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 11), $S), sub_32))>;
2094 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
2095 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 12), $S), sub_32))>;
2096 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
2097 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 13), $S), sub_32))>;
2098 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
2099 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 14), $S), sub_32))>;
2100 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
2101 (i32 (EXTRACT_SUBREG (VEXTUBRX (LI8 15), $S), sub_32))>;
2102
2103 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
2104 (i32 (EXTRACT_SUBREG (VEXTUHRX
2105 (RLWINM8 $Idx, 1, 28, 30), $S), sub_32))>;
2106 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
2107 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 0), $S), sub_32))>;
2108 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
2109 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 2), $S), sub_32))>;
2110 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
2111 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 4), $S), sub_32))>;
2112 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
2113 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 6), $S), sub_32))>;
2114 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
2115 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 8), $S), sub_32))>;
2116 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
2117 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 10), $S), sub_32))>;
2118 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
2119 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 12), $S), sub_32))>;
2120 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
2121 (i32 (EXTRACT_SUBREG (VEXTUHRX (LI8 14), $S), sub_32))>;
2122
2123 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
2124 (i32 (EXTRACT_SUBREG (VEXTUWRX
2125 (RLWINM8 $Idx, 2, 28, 29), $S), sub_32))>;
2126 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
2127 (i32 (EXTRACT_SUBREG (VEXTUWRX (LI8 0), $S), sub_32))>;
2128 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
2129 (i32 (EXTRACT_SUBREG (VEXTUWRX (LI8 4), $S), sub_32))>;
2130 // For extracting LE word 2, MFVSRWZ is better than VEXTUWRX
2131 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
2132 (i32 VectorExtractions.LE_WORD_2)>;
2133 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
2134 (i32 (EXTRACT_SUBREG (VEXTUWRX (LI8 12), $S), sub_32))>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002135}
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002136
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002137let Predicates = [HasP9Altivec, IsBigEndian] in {
2138 def : Pat<(i64 (anyext (i32 (vector_extract v16i8:$S, i64:$Idx)))),
2139 (VEXTUBLX $Idx, $S)>;
2140
2141 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, i64:$Idx)))),
2142 (VEXTUHLX (RLWINM8 $Idx, 1, 28, 30), $S)>;
2143 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 0)))),
2144 (VEXTUHLX (LI8 0), $S)>;
2145 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 1)))),
2146 (VEXTUHLX (LI8 2), $S)>;
2147 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 2)))),
2148 (VEXTUHLX (LI8 4), $S)>;
2149 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 3)))),
2150 (VEXTUHLX (LI8 6), $S)>;
2151 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 4)))),
2152 (VEXTUHLX (LI8 8), $S)>;
2153 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 5)))),
2154 (VEXTUHLX (LI8 10), $S)>;
2155 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 6)))),
2156 (VEXTUHLX (LI8 12), $S)>;
2157 def : Pat<(i64 (anyext (i32 (vector_extract v8i16:$S, 7)))),
2158 (VEXTUHLX (LI8 14), $S)>;
2159
2160 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
2161 (VEXTUWLX (RLWINM8 $Idx, 2, 28, 29), $S)>;
2162 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 0)))),
2163 (VEXTUWLX (LI8 0), $S)>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002164
2165 // For extracting BE word 1, MFVSRWZ is better than VEXTUWLX
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002166 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 1)))),
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002167 (INSERT_SUBREG (i64 (IMPLICIT_DEF)),
2168 (i32 VectorExtractions.LE_WORD_2), sub_32)>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002169 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 2)))),
2170 (VEXTUWLX (LI8 8), $S)>;
2171 def : Pat<(i64 (zext (i32 (vector_extract v4i32:$S, 3)))),
2172 (VEXTUWLX (LI8 12), $S)>;
2173
2174 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, i64:$Idx)))),
2175 (EXTSW (VEXTUWLX (RLWINM8 $Idx, 2, 28, 29), $S))>;
2176 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 0)))),
2177 (EXTSW (VEXTUWLX (LI8 0), $S))>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002178 // For extracting BE word 1, MFVSRWZ is better than VEXTUWLX
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002179 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 1)))),
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002180 (EXTSW (INSERT_SUBREG (i64 (IMPLICIT_DEF)),
2181 (i32 VectorExtractions.LE_WORD_2), sub_32))>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002182 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 2)))),
2183 (EXTSW (VEXTUWLX (LI8 8), $S))>;
2184 def : Pat<(i64 (sext (i32 (vector_extract v4i32:$S, 3)))),
2185 (EXTSW (VEXTUWLX (LI8 12), $S))>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002186
2187 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
2188 (i32 (EXTRACT_SUBREG (VEXTUBLX $Idx, $S), sub_32))>;
2189 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
2190 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 0), $S), sub_32))>;
2191 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
2192 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 1), $S), sub_32))>;
2193 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
2194 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 2), $S), sub_32))>;
2195 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
2196 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 3), $S), sub_32))>;
2197 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
2198 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 4), $S), sub_32))>;
2199 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
2200 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 5), $S), sub_32))>;
2201 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
2202 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 6), $S), sub_32))>;
2203 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
2204 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 7), $S), sub_32))>;
2205 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
2206 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 8), $S), sub_32))>;
2207 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
2208 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 9), $S), sub_32))>;
2209 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
2210 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 10), $S), sub_32))>;
2211 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
2212 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 11), $S), sub_32))>;
2213 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
2214 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 12), $S), sub_32))>;
2215 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
2216 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 13), $S), sub_32))>;
2217 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
2218 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 14), $S), sub_32))>;
2219 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
2220 (i32 (EXTRACT_SUBREG (VEXTUBLX (LI8 15), $S), sub_32))>;
2221
2222 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
2223 (i32 (EXTRACT_SUBREG (VEXTUHLX
2224 (RLWINM8 $Idx, 1, 28, 30), $S), sub_32))>;
2225 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
2226 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 0), $S), sub_32))>;
2227 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
2228 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 2), $S), sub_32))>;
2229 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
2230 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 4), $S), sub_32))>;
2231 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
2232 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 6), $S), sub_32))>;
2233 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
2234 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 8), $S), sub_32))>;
2235 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
2236 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 10), $S), sub_32))>;
2237 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
2238 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 12), $S), sub_32))>;
2239 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
2240 (i32 (EXTRACT_SUBREG (VEXTUHLX (LI8 14), $S), sub_32))>;
2241
2242 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
2243 (i32 (EXTRACT_SUBREG (VEXTUWLX
2244 (RLWINM8 $Idx, 2, 28, 29), $S), sub_32))>;
2245 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
2246 (i32 (EXTRACT_SUBREG (VEXTUWLX (LI8 0), $S), sub_32))>;
2247 // For extracting BE word 1, MFVSRWZ is better than VEXTUWLX
2248 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
2249 (i32 VectorExtractions.LE_WORD_2)>;
2250 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
2251 (i32 (EXTRACT_SUBREG (VEXTUWLX (LI8 8), $S), sub_32))>;
2252 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
2253 (i32 (EXTRACT_SUBREG (VEXTUWLX (LI8 12), $S), sub_32))>;
Tony Jiangaa5a6a12017-07-05 16:55:00 +00002254}
2255
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002256let Predicates = [IsLittleEndian, HasDirectMove] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002257 // v16i8 scalar <-> vector conversions (LE)
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002258 def : Pat<(v16i8 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002259 (v16i8 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002260 def : Pat<(v8i16 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002261 (v8i16 (COPY_TO_REGCLASS MovesToVSR.LE_WORD_0, VSRC))>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002262 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002263 (v4i32 MovesToVSR.LE_WORD_0)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002264 def : Pat<(v2i64 (scalar_to_vector i64:$A)),
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002265 (v2i64 MovesToVSR.LE_DWORD_0)>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002266 // v2i64 scalar <-> vector conversions (LE)
2267 def : Pat<(i64 (vector_extract v2i64:$S, 0)),
2268 (i64 VectorExtractions.LE_DWORD_0)>;
2269 def : Pat<(i64 (vector_extract v2i64:$S, 1)),
2270 (i64 VectorExtractions.LE_DWORD_1)>;
2271 def : Pat<(i64 (vector_extract v2i64:$S, i64:$Idx)),
2272 (i64 VectorExtractions.LE_VARIABLE_DWORD)>;
2273} // IsLittleEndian, HasDirectMove
2274
2275let Predicates = [IsLittleEndian, HasDirectMove, NoP9Altivec] in {
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002276 def : Pat<(i32 (vector_extract v16i8:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002277 (i32 VectorExtractions.LE_BYTE_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002278 def : Pat<(i32 (vector_extract v16i8:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002279 (i32 VectorExtractions.LE_BYTE_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002280 def : Pat<(i32 (vector_extract v16i8:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002281 (i32 VectorExtractions.LE_BYTE_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002282 def : Pat<(i32 (vector_extract v16i8:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002283 (i32 VectorExtractions.LE_BYTE_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002284 def : Pat<(i32 (vector_extract v16i8:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002285 (i32 VectorExtractions.LE_BYTE_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002286 def : Pat<(i32 (vector_extract v16i8:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002287 (i32 VectorExtractions.LE_BYTE_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002288 def : Pat<(i32 (vector_extract v16i8:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002289 (i32 VectorExtractions.LE_BYTE_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002290 def : Pat<(i32 (vector_extract v16i8:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002291 (i32 VectorExtractions.LE_BYTE_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002292 def : Pat<(i32 (vector_extract v16i8:$S, 8)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002293 (i32 VectorExtractions.LE_BYTE_8)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002294 def : Pat<(i32 (vector_extract v16i8:$S, 9)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002295 (i32 VectorExtractions.LE_BYTE_9)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002296 def : Pat<(i32 (vector_extract v16i8:$S, 10)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002297 (i32 VectorExtractions.LE_BYTE_10)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002298 def : Pat<(i32 (vector_extract v16i8:$S, 11)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002299 (i32 VectorExtractions.LE_BYTE_11)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002300 def : Pat<(i32 (vector_extract v16i8:$S, 12)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002301 (i32 VectorExtractions.LE_BYTE_12)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002302 def : Pat<(i32 (vector_extract v16i8:$S, 13)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002303 (i32 VectorExtractions.LE_BYTE_13)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002304 def : Pat<(i32 (vector_extract v16i8:$S, 14)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002305 (i32 VectorExtractions.LE_BYTE_14)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002306 def : Pat<(i32 (vector_extract v16i8:$S, 15)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002307 (i32 VectorExtractions.LE_BYTE_15)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002308 def : Pat<(i32 (vector_extract v16i8:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002309 (i32 VectorExtractions.LE_VARIABLE_BYTE)>;
Nemanja Ivanovic1c39ca62015-08-13 17:40:44 +00002310
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002311 // v8i16 scalar <-> vector conversions (LE)
2312 def : Pat<(i32 (vector_extract v8i16:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002313 (i32 VectorExtractions.LE_HALF_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002314 def : Pat<(i32 (vector_extract v8i16:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002315 (i32 VectorExtractions.LE_HALF_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002316 def : Pat<(i32 (vector_extract v8i16:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002317 (i32 VectorExtractions.LE_HALF_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002318 def : Pat<(i32 (vector_extract v8i16:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002319 (i32 VectorExtractions.LE_HALF_3)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002320 def : Pat<(i32 (vector_extract v8i16:$S, 4)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002321 (i32 VectorExtractions.LE_HALF_4)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002322 def : Pat<(i32 (vector_extract v8i16:$S, 5)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002323 (i32 VectorExtractions.LE_HALF_5)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002324 def : Pat<(i32 (vector_extract v8i16:$S, 6)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002325 (i32 VectorExtractions.LE_HALF_6)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002326 def : Pat<(i32 (vector_extract v8i16:$S, 7)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002327 (i32 VectorExtractions.LE_HALF_7)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002328 def : Pat<(i32 (vector_extract v8i16:$S, i64:$Idx)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002329 (i32 VectorExtractions.LE_VARIABLE_HALF)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002330
2331 // v4i32 scalar <-> vector conversions (LE)
2332 def : Pat<(i32 (vector_extract v4i32:$S, 0)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002333 (i32 VectorExtractions.LE_WORD_0)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002334 def : Pat<(i32 (vector_extract v4i32:$S, 1)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002335 (i32 VectorExtractions.LE_WORD_1)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002336 def : Pat<(i32 (vector_extract v4i32:$S, 2)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002337 (i32 VectorExtractions.LE_WORD_2)>;
Nemanja Ivanovicd3896572015-10-09 11:12:18 +00002338 def : Pat<(i32 (vector_extract v4i32:$S, 3)),
Nemanja Ivanovicac8d01a2015-12-10 13:35:28 +00002339 (i32 VectorExtractions.LE_WORD_3)>;
2340 def : Pat<(i32 (vector_extract v4i32:$S, i64:$Idx)),
2341 (i32 VectorExtractions.LE_VARIABLE_WORD)>;
Zaara Syeda48cb3c12017-11-27 17:11:03 +00002342} // IsLittleEndian, HasDirectMove, NoP9Altivec
Nemanja Ivanovic89224762015-12-15 14:50:34 +00002343
2344let Predicates = [HasDirectMove, HasVSX] in {
2345// bitconvert f32 -> i32
2346// (convert to 32-bit fp single, shift right 1 word, move to GPR)
2347def : Pat<(i32 (bitconvert f32:$S)),
2348 (i32 (MFVSRWZ (EXTRACT_SUBREG
Lei Huangcd4f3852018-03-12 19:26:18 +00002349 (XXSLDWI (XSCVDPSPN $S), (XSCVDPSPN $S), 3),
Nemanja Ivanovic89224762015-12-15 14:50:34 +00002350 sub_64)))>;
2351// bitconvert i32 -> f32
2352// (move to FPR, shift left 1 word, convert to 64-bit fp single)
2353def : Pat<(f32 (bitconvert i32:$A)),
2354 (f32 (XSCVSPDPN
2355 (XXSLDWI MovesToVSR.LE_WORD_1, MovesToVSR.LE_WORD_1, 1)))>;
2356
2357// bitconvert f64 -> i64
2358// (move to GPR, nothing else needed)
2359def : Pat<(i64 (bitconvert f64:$S)),
2360 (i64 (MFVSRD $S))>;
2361
2362// bitconvert i64 -> f64
2363// (move to FPR, nothing else needed)
2364def : Pat<(f64 (bitconvert i64:$S)),
2365 (f64 (MTVSRD $S))>;
2366}
Kit Barton93612ec2016-02-26 21:11:55 +00002367
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00002368// Materialize a zero-vector of long long
2369def : Pat<(v2i64 immAllZerosV),
2370 (v2i64 (XXLXORz))>;
2371}
2372
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002373def AlignValues {
2374 dag F32_TO_BE_WORD1 = (v4f32 (XXSLDWI (XSCVDPSPN $B), (XSCVDPSPN $B), 3));
2375 dag I32_TO_BE_WORD1 = (COPY_TO_REGCLASS (MTVSRWZ $B), VSRC);
2376}
2377
Kit Barton93612ec2016-02-26 21:11:55 +00002378// The following VSX instructions were introduced in Power ISA 3.0
2379def HasP9Vector : Predicate<"PPCSubTarget->hasP9Vector()">;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002380let AddedComplexity = 400, Predicates = [HasP9Vector] in {
Kit Barton93612ec2016-02-26 21:11:55 +00002381
2382 // [PO VRT XO VRB XO /]
2383 class X_VT5_XO5_VB5<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2384 list<dag> pattern>
2385 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vrrc:$vB),
2386 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2387
2388 // [PO VRT XO VRB XO RO], Round to Odd version of [PO VRT XO VRB XO /]
2389 class X_VT5_XO5_VB5_Ro<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2390 list<dag> pattern>
2391 : X_VT5_XO5_VB5<opcode, xo2, xo, opc, pattern>, isDOT;
2392
2393 // [PO VRT XO VRB XO /], but the VRB is only used the left 64 bits (or less),
2394 // So we use different operand class for VRB
2395 class X_VT5_XO5_VB5_TyVB<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2396 RegisterOperand vbtype, list<dag> pattern>
2397 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vrrc:$vT), (ins vbtype:$vB),
2398 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2399
Lei Huang6270ab62018-07-04 21:59:16 +00002400 // [PO VRT XO VRB XO /]
2401 class X_VT5_XO5_VB5_VSFR<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2402 list<dag> pattern>
2403 : X_RD5_XO5_RS5<opcode, xo2, xo, (outs vfrc:$vT), (ins vrrc:$vB),
2404 !strconcat(opc, " $vT, $vB"), IIC_VecFP, pattern>;
2405
2406 // [PO VRT XO VRB XO RO], Round to Odd version of [PO VRT XO VRB XO /]
2407 class X_VT5_XO5_VB5_VSFR_Ro<bits<6> opcode, bits<5> xo2, bits<10> xo, string opc,
2408 list<dag> pattern>
2409 : X_VT5_XO5_VB5_VSFR<opcode, xo2, xo, opc, pattern>, isDOT;
2410
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002411 // [PO T XO B XO BX /]
2412 class XX2_RT5_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2413 list<dag> pattern>
2414 : XX2_RD5_XO5_RS6<opcode, xo2, xo, (outs g8rc:$rT), (ins vsfrc:$XB),
2415 !strconcat(opc, " $rT, $XB"), IIC_VecFP, pattern>;
2416
Kit Barton93612ec2016-02-26 21:11:55 +00002417 // [PO T XO B XO BX TX]
2418 class XX2_XT6_XO5_XB6<bits<6> opcode, bits<5> xo2, bits<9> xo, string opc,
2419 RegisterOperand vtype, list<dag> pattern>
2420 : XX2_RD6_XO5_RS6<opcode, xo2, xo, (outs vtype:$XT), (ins vtype:$XB),
2421 !strconcat(opc, " $XT, $XB"), IIC_VecFP, pattern>;
2422
2423 // [PO T A B XO AX BX TX], src and dest register use different operand class
2424 class XX3_XT5_XA5_XB5<bits<6> opcode, bits<8> xo, string opc,
2425 RegisterOperand xty, RegisterOperand aty, RegisterOperand bty,
2426 InstrItinClass itin, list<dag> pattern>
2427 : XX3Form<opcode, xo, (outs xty:$XT), (ins aty:$XA, bty:$XB),
2428 !strconcat(opc, " $XT, $XA, $XB"), itin, pattern>;
2429
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002430 // [PO VRT VRA VRB XO /]
2431 class X_VT5_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2432 list<dag> pattern>
2433 : XForm_1<opcode, xo, (outs vrrc:$vT), (ins vrrc:$vA, vrrc:$vB),
2434 !strconcat(opc, " $vT, $vA, $vB"), IIC_VecFP, pattern>;
2435
2436 // [PO VRT VRA VRB XO RO], Round to Odd version of [PO VRT VRA VRB XO /]
2437 class X_VT5_VA5_VB5_Ro<bits<6> opcode, bits<10> xo, string opc,
2438 list<dag> pattern>
2439 : X_VT5_VA5_VB5<opcode, xo, opc, pattern>, isDOT;
2440
Lei Huang09fda632018-04-04 16:43:50 +00002441 // [PO VRT VRA VRB XO /]
2442 class X_VT5_VA5_VB5_FMA<bits<6> opcode, bits<10> xo, string opc,
2443 list<dag> pattern>
2444 : XForm_1<opcode, xo, (outs vrrc:$vT), (ins vrrc:$vTi, vrrc:$vA, vrrc:$vB),
2445 !strconcat(opc, " $vT, $vA, $vB"), IIC_VecFP, pattern>,
2446 RegConstraint<"$vTi = $vT">, NoEncode<"$vTi">;
2447
2448 // [PO VRT VRA VRB XO RO], Round to Odd version of [PO VRT VRA VRB XO /]
2449 class X_VT5_VA5_VB5_FMA_Ro<bits<6> opcode, bits<10> xo, string opc,
2450 list<dag> pattern>
2451 : X_VT5_VA5_VB5_FMA<opcode, xo, opc, pattern>, isDOT;
2452
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002453 //===--------------------------------------------------------------------===//
2454 // Quad-Precision Scalar Move Instructions:
2455
2456 // Copy Sign
Lei Huangecfede92018-03-19 19:22:52 +00002457 def XSCPSGNQP : X_VT5_VA5_VB5<63, 100, "xscpsgnqp",
2458 [(set f128:$vT,
2459 (fcopysign f128:$vB, f128:$vA))]>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002460
2461 // Absolute/Negative-Absolute/Negate
Lei Huangecfede92018-03-19 19:22:52 +00002462 def XSABSQP : X_VT5_XO5_VB5<63, 0, 804, "xsabsqp",
2463 [(set f128:$vT, (fabs f128:$vB))]>;
2464 def XSNABSQP : X_VT5_XO5_VB5<63, 8, 804, "xsnabsqp",
2465 [(set f128:$vT, (fneg (fabs f128:$vB)))]>;
2466 def XSNEGQP : X_VT5_XO5_VB5<63, 16, 804, "xsnegqp",
2467 [(set f128:$vT, (fneg f128:$vB))]>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002468
2469 //===--------------------------------------------------------------------===//
2470 // Quad-Precision Scalar Floating-Point Arithmetic Instructions:
2471
2472 // Add/Divide/Multiply/Subtract
Lei Huang6d1596a2018-03-19 18:52:20 +00002473 let isCommutable = 1 in {
2474 def XSADDQP : X_VT5_VA5_VB5 <63, 4, "xsaddqp",
2475 [(set f128:$vT, (fadd f128:$vA, f128:$vB))]>;
Stefan Pintilie83a5fe12018-07-09 18:50:06 +00002476 def XSADDQPO : X_VT5_VA5_VB5_Ro<63, 4, "xsaddqpo",
2477 [(set f128:$vT,
2478 (int_ppc_addf128_round_to_odd
2479 f128:$vA, f128:$vB))]>;
Lei Huang6d1596a2018-03-19 18:52:20 +00002480 def XSMULQP : X_VT5_VA5_VB5 <63, 36, "xsmulqp",
2481 [(set f128:$vT, (fmul f128:$vA, f128:$vB))]>;
Stefan Pintilie83a5fe12018-07-09 18:50:06 +00002482 def XSMULQPO : X_VT5_VA5_VB5_Ro<63, 36, "xsmulqpo",
2483 [(set f128:$vT,
2484 (int_ppc_mulf128_round_to_odd
2485 f128:$vA, f128:$vB))]>;
Lei Huang6d1596a2018-03-19 18:52:20 +00002486 }
2487
2488 def XSSUBQP : X_VT5_VA5_VB5 <63, 516, "xssubqp" ,
2489 [(set f128:$vT, (fsub f128:$vA, f128:$vB))]>;
Stefan Pintilie83a5fe12018-07-09 18:50:06 +00002490 def XSSUBQPO : X_VT5_VA5_VB5_Ro<63, 516, "xssubqpo",
2491 [(set f128:$vT,
2492 (int_ppc_subf128_round_to_odd
2493 f128:$vA, f128:$vB))]>;
Lei Huang6d1596a2018-03-19 18:52:20 +00002494 def XSDIVQP : X_VT5_VA5_VB5 <63, 548, "xsdivqp",
2495 [(set f128:$vT, (fdiv f128:$vA, f128:$vB))]>;
Stefan Pintilie83a5fe12018-07-09 18:50:06 +00002496 def XSDIVQPO : X_VT5_VA5_VB5_Ro<63, 548, "xsdivqpo",
2497 [(set f128:$vT,
2498 (int_ppc_divf128_round_to_odd
2499 f128:$vA, f128:$vB))]>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002500
2501 // Square-Root
Lei Huangecfede92018-03-19 19:22:52 +00002502 def XSSQRTQP : X_VT5_XO5_VB5 <63, 27, 804, "xssqrtqp",
2503 [(set f128:$vT, (fsqrt f128:$vB))]>;
Stefan Pintilie83a5fe12018-07-09 18:50:06 +00002504 def XSSQRTQPO : X_VT5_XO5_VB5_Ro<63, 27, 804, "xssqrtqpo",
2505 [(set f128:$vT,
2506 (int_ppc_sqrtf128_round_to_odd f128:$vB))]>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002507
2508 // (Negative) Multiply-{Add/Subtract}
Lei Huang09fda632018-04-04 16:43:50 +00002509 def XSMADDQP : X_VT5_VA5_VB5_FMA <63, 388, "xsmaddqp",
2510 [(set f128:$vT,
2511 (fma f128:$vA, f128:$vB,
2512 f128:$vTi))]>;
Stefan Pintilie83a5fe12018-07-09 18:50:06 +00002513
2514 def XSMADDQPO : X_VT5_VA5_VB5_FMA_Ro<63, 388, "xsmaddqpo",
2515 [(set f128:$vT,
2516 (int_ppc_fmaf128_round_to_odd
2517 f128:$vA,f128:$vB,f128:$vTi))]>;
2518
Lei Huang09fda632018-04-04 16:43:50 +00002519 def XSMSUBQP : X_VT5_VA5_VB5_FMA <63, 420, "xsmsubqp" ,
2520 [(set f128:$vT,
2521 (fma f128:$vA, f128:$vB,
2522 (fneg f128:$vTi)))]>;
Stefan Pintilieb9d01aa2018-07-11 01:42:22 +00002523 def XSMSUBQPO : X_VT5_VA5_VB5_FMA_Ro<63, 420, "xsmsubqpo" ,
2524 [(set f128:$vT,
2525 (int_ppc_fmaf128_round_to_odd
2526 f128:$vA, f128:$vB, (fneg f128:$vTi)))]>;
Lei Huang09fda632018-04-04 16:43:50 +00002527 def XSNMADDQP : X_VT5_VA5_VB5_FMA <63, 452, "xsnmaddqp",
2528 [(set f128:$vT,
2529 (fneg (fma f128:$vA, f128:$vB,
2530 f128:$vTi)))]>;
Stefan Pintilieb9d01aa2018-07-11 01:42:22 +00002531 def XSNMADDQPO: X_VT5_VA5_VB5_FMA_Ro<63, 452, "xsnmaddqpo",
2532 [(set f128:$vT,
2533 (fneg (int_ppc_fmaf128_round_to_odd
2534 f128:$vA, f128:$vB, f128:$vTi)))]>;
Lei Huang09fda632018-04-04 16:43:50 +00002535 def XSNMSUBQP : X_VT5_VA5_VB5_FMA <63, 484, "xsnmsubqp",
2536 [(set f128:$vT,
2537 (fneg (fma f128:$vA, f128:$vB,
2538 (fneg f128:$vTi))))]>;
Stefan Pintilieb9d01aa2018-07-11 01:42:22 +00002539 def XSNMSUBQPO: X_VT5_VA5_VB5_FMA_Ro<63, 484, "xsnmsubqpo",
2540 [(set f128:$vT,
2541 (fneg (int_ppc_fmaf128_round_to_odd
2542 f128:$vA, f128:$vB, (fneg f128:$vTi))))]>;
Lei Huang09fda632018-04-04 16:43:50 +00002543
2544 // Additional fnmsub patterns: -a*c + b == -(a*c - b)
2545 def : Pat<(fma (fneg f128:$A), f128:$C, f128:$B), (XSNMSUBQP $B, $C, $A)>;
2546 def : Pat<(fma f128:$A, (fneg f128:$C), f128:$B), (XSNMSUBQP $B, $C, $A)>;
Chuang-Yu Cheng56638482016-03-28 07:38:01 +00002547
Kit Barton93612ec2016-02-26 21:11:55 +00002548 //===--------------------------------------------------------------------===//
2549 // Quad/Double-Precision Compare Instructions:
2550
2551 // [PO BF // VRA VRB XO /]
2552 class X_BF3_VA5_VB5<bits<6> opcode, bits<10> xo, string opc,
2553 list<dag> pattern>
2554 : XForm_17<opcode, xo, (outs crrc:$crD), (ins vrrc:$VA, vrrc:$VB),
2555 !strconcat(opc, " $crD, $VA, $VB"), IIC_FPCompare> {
2556 let Pattern = pattern;
2557 }
2558
2559 // QP Compare Ordered/Unordered
2560 def XSCMPOQP : X_BF3_VA5_VB5<63, 132, "xscmpoqp", []>;
2561 def XSCMPUQP : X_BF3_VA5_VB5<63, 644, "xscmpuqp", []>;
2562
2563 // DP/QP Compare Exponents
2564 def XSCMPEXPDP : XX3Form_1<60, 59,
2565 (outs crrc:$crD), (ins vsfrc:$XA, vsfrc:$XB),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002566 "xscmpexpdp $crD, $XA, $XB", IIC_FPCompare, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002567 def XSCMPEXPQP : X_BF3_VA5_VB5<63, 164, "xscmpexpqp", []>;
2568
2569 // DP Compare ==, >=, >, !=
2570 // Use vsrc for XT, because the entire register of XT is set.
2571 // XT.dword[1] = 0x0000_0000_0000_0000
2572 def XSCMPEQDP : XX3_XT5_XA5_XB5<60, 3, "xscmpeqdp", vsrc, vsfrc, vsfrc,
2573 IIC_FPCompare, []>;
2574 def XSCMPGEDP : XX3_XT5_XA5_XB5<60, 19, "xscmpgedp", vsrc, vsfrc, vsfrc,
2575 IIC_FPCompare, []>;
2576 def XSCMPGTDP : XX3_XT5_XA5_XB5<60, 11, "xscmpgtdp", vsrc, vsfrc, vsfrc,
2577 IIC_FPCompare, []>;
Kit Barton93612ec2016-02-26 21:11:55 +00002578
2579 //===--------------------------------------------------------------------===//
2580 // Quad-Precision Floating-Point Conversion Instructions:
2581
2582 // Convert DP -> QP
Lei Huangd17c39c2018-07-05 04:18:37 +00002583 def XSCVDPQP : X_VT5_XO5_VB5_TyVB<63, 22, 836, "xscvdpqp", vfrc,
2584 [(set f128:$vT, (fpextend f64:$vB))]>;
Kit Barton93612ec2016-02-26 21:11:55 +00002585
2586 // Round & Convert QP -> DP (dword[1] is set to zero)
Lei Huang6270ab62018-07-04 21:59:16 +00002587 def XSCVQPDP : X_VT5_XO5_VB5_VSFR<63, 20, 836, "xscvqpdp" , []>;
Stefan Pintilie58e3e0a2018-07-09 20:09:22 +00002588 def XSCVQPDPO : X_VT5_XO5_VB5_VSFR_Ro<63, 20, 836, "xscvqpdpo",
2589 [(set f64:$vT,
2590 (int_ppc_truncf128_round_to_odd
2591 f128:$vB))]>;
Kit Barton93612ec2016-02-26 21:11:55 +00002592
2593 // Truncate & Convert QP -> (Un)Signed (D)Word (dword[1] is set to zero)
2594 def XSCVQPSDZ : X_VT5_XO5_VB5<63, 25, 836, "xscvqpsdz", []>;
2595 def XSCVQPSWZ : X_VT5_XO5_VB5<63, 9, 836, "xscvqpswz", []>;
2596 def XSCVQPUDZ : X_VT5_XO5_VB5<63, 17, 836, "xscvqpudz", []>;
2597 def XSCVQPUWZ : X_VT5_XO5_VB5<63, 1, 836, "xscvqpuwz", []>;
2598
Lei Huangc517e952018-05-08 18:23:31 +00002599 // Convert (Un)Signed DWord -> QP.
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002600 def XSCVSDQP : X_VT5_XO5_VB5_TyVB<63, 10, 836, "xscvsdqp", vfrc, []>;
Lei Huang10367eb2018-04-12 18:00:14 +00002601 def : Pat<(f128 (sint_to_fp i64:$src)),
2602 (f128 (XSCVSDQP (COPY_TO_REGCLASS $src, VFRC)))>;
Lei Huang66e22c22018-07-05 07:46:01 +00002603 def : Pat<(f128 (sint_to_fp (i64 (PPCmfvsr f64:$src)))),
2604 (f128 (XSCVSDQP $src))>;
2605 def : Pat<(f128 (sint_to_fp (i32 (PPCmfvsr f64:$src)))),
2606 (f128 (XSCVSDQP (VEXTSW2Ds $src)))>;
2607
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002608 def XSCVUDQP : X_VT5_XO5_VB5_TyVB<63, 2, 836, "xscvudqp", vfrc, []>;
Lei Huang10367eb2018-04-12 18:00:14 +00002609 def : Pat<(f128 (uint_to_fp i64:$src)),
2610 (f128 (XSCVUDQP (COPY_TO_REGCLASS $src, VFRC)))>;
Lei Huang66e22c22018-07-05 07:46:01 +00002611 def : Pat<(f128 (uint_to_fp (i64 (PPCmfvsr f64:$src)))),
2612 (f128 (XSCVUDQP $src))>;
Kit Barton93612ec2016-02-26 21:11:55 +00002613
Lei Huangc517e952018-05-08 18:23:31 +00002614 // Convert (Un)Signed Word -> QP.
Lei Huang198e6782018-04-18 16:34:22 +00002615 def : Pat<(f128 (sint_to_fp i32:$src)),
2616 (f128 (XSCVSDQP (MTVSRWA $src)))>;
2617 def : Pat<(f128 (sint_to_fp (i32 (load xoaddr:$src)))),
2618 (f128 (XSCVSDQP (LIWAX xoaddr:$src)))>;
2619 def : Pat<(f128 (uint_to_fp i32:$src)),
2620 (f128 (XSCVUDQP (MTVSRWZ $src)))>;
2621 def : Pat<(f128 (uint_to_fp (i32 (load xoaddr:$src)))),
2622 (f128 (XSCVUDQP (LIWZX xoaddr:$src)))>;
2623
Kit Barton93612ec2016-02-26 21:11:55 +00002624 //===--------------------------------------------------------------------===//
2625 // Round to Floating-Point Integer Instructions
2626
2627 // (Round &) Convert DP <-> HP
2628 // Note! xscvdphp's src and dest register both use the left 64 bits, so we use
2629 // vsfrc for src and dest register. xscvhpdp's src only use the left 16 bits,
2630 // but we still use vsfrc for it.
2631 def XSCVDPHP : XX2_XT6_XO5_XB6<60, 17, 347, "xscvdphp", vsfrc, []>;
2632 def XSCVHPDP : XX2_XT6_XO5_XB6<60, 16, 347, "xscvhpdp", vsfrc, []>;
2633
2634 // Vector HP -> SP
2635 def XVCVHPSP : XX2_XT6_XO5_XB6<60, 24, 475, "xvcvhpsp", vsrc, []>;
Nemanja Ivanovicec4b0c32016-11-11 21:42:01 +00002636 def XVCVSPHP : XX2_XT6_XO5_XB6<60, 25, 475, "xvcvsphp", vsrc,
2637 [(set v4f32:$XT,
2638 (int_ppc_vsx_xvcvsphp v4f32:$XB))]>;
Kit Barton93612ec2016-02-26 21:11:55 +00002639
Sean Fertilea435e072016-11-14 18:43:59 +00002640 // Pattern for matching Vector HP -> Vector SP intrinsic. Defined as a
Simon Pilgrim68168d12017-03-30 12:59:53 +00002641 // separate pattern so that it can convert the input register class from
Sean Fertilea435e072016-11-14 18:43:59 +00002642 // VRRC(v8i16) to VSRC.
2643 def : Pat<(v4f32 (int_ppc_vsx_xvcvhpsp v8i16:$A)),
2644 (v4f32 (XVCVHPSP (COPY_TO_REGCLASS $A, VSRC)))>;
2645
Kit Barton93612ec2016-02-26 21:11:55 +00002646 class Z23_VT5_R1_VB5_RMC2_EX1<bits<6> opcode, bits<8> xo, bit ex, string opc,
2647 list<dag> pattern>
Zaara Syeda421a5962018-05-14 15:45:15 +00002648 : Z23Form_8<opcode, xo,
Kit Barton93612ec2016-02-26 21:11:55 +00002649 (outs vrrc:$vT), (ins u1imm:$r, vrrc:$vB, u2imm:$rmc),
2650 !strconcat(opc, " $r, $vT, $vB, $rmc"), IIC_VecFP, pattern> {
2651 let RC = ex;
2652 }
2653
2654 // Round to Quad-Precision Integer [with Inexact]
2655 def XSRQPI : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 0, "xsrqpi" , []>;
2656 def XSRQPIX : Z23_VT5_R1_VB5_RMC2_EX1<63, 5, 1, "xsrqpix", []>;
2657
Stefan Pintilie133acb22018-07-09 20:38:40 +00002658 // Use current rounding mode
2659 def : Pat<(f128 (fnearbyint f128:$vB)), (f128 (XSRQPI 0, $vB, 3))>;
2660 // Round to nearest, ties away from zero
2661 def : Pat<(f128 (fround f128:$vB)), (f128 (XSRQPI 0, $vB, 0))>;
2662 // Round towards Zero
2663 def : Pat<(f128 (ftrunc f128:$vB)), (f128 (XSRQPI 1, $vB, 1))>;
2664 // Round towards +Inf
2665 def : Pat<(f128 (fceil f128:$vB)), (f128 (XSRQPI 1, $vB, 2))>;
2666 // Round towards -Inf
2667 def : Pat<(f128 (ffloor f128:$vB)), (f128 (XSRQPI 1, $vB, 3))>;
2668
2669 // Use current rounding mode, [with Inexact]
2670 def : Pat<(f128 (frint f128:$vB)), (f128 (XSRQPIX 0, $vB, 3))>;
2671
Kit Barton93612ec2016-02-26 21:11:55 +00002672 // Round Quad-Precision to Double-Extended Precision (fp80)
2673 def XSRQPXP : Z23_VT5_R1_VB5_RMC2_EX1<63, 37, 0, "xsrqpxp", []>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002674
2675 //===--------------------------------------------------------------------===//
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002676 // Insert/Extract Instructions
2677
2678 // Insert Exponent DP/QP
2679 // XT NOTE: XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU
2680 def XSIEXPDP : XX1Form <60, 918, (outs vsrc:$XT), (ins g8rc:$rA, g8rc:$rB),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002681 "xsiexpdp $XT, $rA, $rB", IIC_VecFP, []>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002682 // vB NOTE: only vB.dword[0] is used, that's why we don't use
2683 // X_VT5_VA5_VB5 form
2684 def XSIEXPQP : XForm_18<63, 868, (outs vrrc:$vT), (ins vrrc:$vA, vsfrc:$vB),
2685 "xsiexpqp $vT, $vA, $vB", IIC_VecFP, []>;
2686
Stefan Pintilieb5305772018-09-24 18:14:13 +00002687 def : Pat<(f128 (int_ppc_scalar_insert_exp_qp f128:$vA, i64:$vB)),
2688 (f128 (XSIEXPQP $vA, (MTVSRD $vB)))>;
2689
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002690 // Extract Exponent/Significand DP/QP
2691 def XSXEXPDP : XX2_RT5_XO5_XB6<60, 0, 347, "xsxexpdp", []>;
2692 def XSXSIGDP : XX2_RT5_XO5_XB6<60, 1, 347, "xsxsigdp", []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002693
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002694 def XSXEXPQP : X_VT5_XO5_VB5 <63, 2, 804, "xsxexpqp", []>;
2695 def XSXSIGQP : X_VT5_XO5_VB5 <63, 18, 804, "xsxsigqp", []>;
2696
Stefan Pintilieb5305772018-09-24 18:14:13 +00002697 def : Pat<(i64 (int_ppc_scalar_extract_expq f128:$vA)),
2698 (i64 (MFVSRD (EXTRACT_SUBREG
2699 (v2i64 (XSXEXPQP $vA)), sub_64)))>;
2700
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002701 // Vector Insert Word
2702 // XB NOTE: Only XB.dword[1] is used, but we use vsrc on XB.
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002703 def XXINSERTW :
2704 XX2_RD6_UIM5_RS6<60, 181, (outs vsrc:$XT),
2705 (ins vsrc:$XTi, vsrc:$XB, u4imm:$UIM),
2706 "xxinsertw $XT, $XB, $UIM", IIC_VecFP,
Tony Jiang61ef1c52017-09-05 18:08:02 +00002707 [(set v4i32:$XT, (PPCvecinsert v4i32:$XTi, v4i32:$XB,
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002708 imm32SExt16:$UIM))]>,
2709 RegConstraint<"$XTi = $XT">, NoEncode<"$XTi">;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002710
2711 // Vector Extract Unsigned Word
2712 def XXEXTRACTUW : XX2_RD6_UIM5_RS6<60, 165,
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002713 (outs vsfrc:$XT), (ins vsrc:$XB, u4imm:$UIMM),
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002714 "xxextractuw $XT, $XB, $UIMM", IIC_VecFP, []>;
2715
2716 // Vector Insert Exponent DP/SP
2717 def XVIEXPDP : XX3_XT5_XA5_XB5<60, 248, "xviexpdp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002718 IIC_VecFP, [(set v2f64: $XT,(int_ppc_vsx_xviexpdp v2i64:$XA, v2i64:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002719 def XVIEXPSP : XX3_XT5_XA5_XB5<60, 216, "xviexpsp", vsrc, vsrc, vsrc,
Nemanja Ivanovic0f459982016-10-26 19:03:40 +00002720 IIC_VecFP, [(set v4f32: $XT,(int_ppc_vsx_xviexpsp v4i32:$XA, v4i32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002721
2722 // Vector Extract Exponent/Significand DP/SP
Sean Fertileadda5b22016-11-14 14:42:37 +00002723 def XVXEXPDP : XX2_XT6_XO5_XB6<60, 0, 475, "xvxexpdp", vsrc,
2724 [(set v2i64: $XT,
2725 (int_ppc_vsx_xvxexpdp v2f64:$XB))]>;
2726 def XVXEXPSP : XX2_XT6_XO5_XB6<60, 8, 475, "xvxexpsp", vsrc,
2727 [(set v4i32: $XT,
2728 (int_ppc_vsx_xvxexpsp v4f32:$XB))]>;
2729 def XVXSIGDP : XX2_XT6_XO5_XB6<60, 1, 475, "xvxsigdp", vsrc,
2730 [(set v2i64: $XT,
2731 (int_ppc_vsx_xvxsigdp v2f64:$XB))]>;
2732 def XVXSIGSP : XX2_XT6_XO5_XB6<60, 9, 475, "xvxsigsp", vsrc,
2733 [(set v4i32: $XT,
2734 (int_ppc_vsx_xvxsigsp v4f32:$XB))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002735
Sean Fertile1c4109b2016-12-09 17:21:42 +00002736 let AddedComplexity = 400, Predicates = [HasP9Vector] in {
2737 // Extra patterns expanding to vector Extract Word/Insert Word
2738 def : Pat<(v4i32 (int_ppc_vsx_xxinsertw v4i32:$A, v2i64:$B, imm:$IMM)),
2739 (v4i32 (XXINSERTW $A, $B, imm:$IMM))>;
2740 def : Pat<(v2i64 (int_ppc_vsx_xxextractuw v2i64:$A, imm:$IMM)),
2741 (v2i64 (COPY_TO_REGCLASS (XXEXTRACTUW $A, imm:$IMM), VSRC))>;
2742 } // AddedComplexity = 400, HasP9Vector
2743
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002744 //===--------------------------------------------------------------------===//
2745
2746 // Test Data Class SP/DP/QP
2747 def XSTSTDCSP : XX2_BF3_DCMX7_RS6<60, 298,
2748 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2749 "xststdcsp $BF, $XB, $DCMX", IIC_VecFP, []>;
2750 def XSTSTDCDP : XX2_BF3_DCMX7_RS6<60, 362,
2751 (outs crrc:$BF), (ins u7imm:$DCMX, vsfrc:$XB),
2752 "xststdcdp $BF, $XB, $DCMX", IIC_VecFP, []>;
2753 def XSTSTDCQP : X_BF3_DCMX7_RS5 <63, 708,
2754 (outs crrc:$BF), (ins u7imm:$DCMX, vrrc:$vB),
2755 "xststdcqp $BF, $vB, $DCMX", IIC_VecFP, []>;
2756
2757 // Vector Test Data Class SP/DP
2758 def XVTSTDCSP : XX2_RD6_DCMX7_RS6<60, 13, 5,
2759 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002760 "xvtstdcsp $XT, $XB, $DCMX", IIC_VecFP,
2761 [(set v4i32: $XT,
2762 (int_ppc_vsx_xvtstdcsp v4f32:$XB, imm:$DCMX))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002763 def XVTSTDCDP : XX2_RD6_DCMX7_RS6<60, 15, 5,
2764 (outs vsrc:$XT), (ins u7imm:$DCMX, vsrc:$XB),
Sean Fertileadda5b22016-11-14 14:42:37 +00002765 "xvtstdcdp $XT, $XB, $DCMX", IIC_VecFP,
2766 [(set v2i64: $XT,
2767 (int_ppc_vsx_xvtstdcdp v2f64:$XB, imm:$DCMX))]>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002768
2769 //===--------------------------------------------------------------------===//
2770
2771 // Maximum/Minimum Type-C/Type-J DP
2772 // XT.dword[1] = 0xUUUU_UUUU_UUUU_UUUU, so we use vsrc for XT
2773 def XSMAXCDP : XX3_XT5_XA5_XB5<60, 128, "xsmaxcdp", vsrc, vsfrc, vsfrc,
2774 IIC_VecFP, []>;
2775 def XSMAXJDP : XX3_XT5_XA5_XB5<60, 144, "xsmaxjdp", vsrc, vsfrc, vsfrc,
2776 IIC_VecFP, []>;
2777 def XSMINCDP : XX3_XT5_XA5_XB5<60, 136, "xsmincdp", vsrc, vsfrc, vsfrc,
2778 IIC_VecFP, []>;
2779 def XSMINJDP : XX3_XT5_XA5_XB5<60, 152, "xsminjdp", vsrc, vsfrc, vsfrc,
2780 IIC_VecFP, []>;
2781
2782 //===--------------------------------------------------------------------===//
2783
2784 // Vector Byte-Reverse H/W/D/Q Word
2785 def XXBRH : XX2_XT6_XO5_XB6<60, 7, 475, "xxbrh", vsrc, []>;
2786 def XXBRW : XX2_XT6_XO5_XB6<60, 15, 475, "xxbrw", vsrc, []>;
2787 def XXBRD : XX2_XT6_XO5_XB6<60, 23, 475, "xxbrd", vsrc, []>;
2788 def XXBRQ : XX2_XT6_XO5_XB6<60, 31, 475, "xxbrq", vsrc, []>;
2789
Tony Jiang1a8eec12017-06-12 18:24:36 +00002790 // Vector Reverse
2791 def : Pat<(v8i16 (PPCxxreverse v8i16 :$A)),
2792 (v8i16 (COPY_TO_REGCLASS (XXBRH (COPY_TO_REGCLASS $A, VSRC)), VRRC))>;
2793 def : Pat<(v4i32 (PPCxxreverse v4i32 :$A)),
2794 (v4i32 (XXBRW $A))>;
2795 def : Pat<(v2i64 (PPCxxreverse v2i64 :$A)),
2796 (v2i64 (XXBRD $A))>;
2797 def : Pat<(v1i128 (PPCxxreverse v1i128 :$A)),
2798 (v1i128 (COPY_TO_REGCLASS (XXBRQ (COPY_TO_REGCLASS $A, VSRC)), VRRC))>;
2799
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002800 // Vector Permute
2801 def XXPERM : XX3_XT5_XA5_XB5<60, 26, "xxperm" , vsrc, vsrc, vsrc,
2802 IIC_VecPerm, []>;
2803 def XXPERMR : XX3_XT5_XA5_XB5<60, 58, "xxpermr", vsrc, vsrc, vsrc,
2804 IIC_VecPerm, []>;
2805
2806 // Vector Splat Immediate Byte
2807 def XXSPLTIB : X_RD6_IMM8<60, 360, (outs vsrc:$XT), (ins u8imm:$IMM8),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002808 "xxspltib $XT, $IMM8", IIC_VecPerm, []>;
Chuang-Yu Cheng80722712016-03-28 08:34:28 +00002809
2810 //===--------------------------------------------------------------------===//
Kit Bartonba532dc2016-03-08 03:49:13 +00002811 // Vector/Scalar Load/Store Instructions
2812
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002813 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2814 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Sean Fertile3c8c3852017-01-26 18:59:15 +00002815 let mayLoad = 1, mayStore = 0 in {
Kit Bartonba532dc2016-03-08 03:49:13 +00002816 // Load Vector
2817 def LXV : DQ_RD6_RS5_DQ12<61, 1, (outs vsrc:$XT), (ins memrix16:$src),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002818 "lxv $XT, $src", IIC_LdStLFD, []>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002819 // Load DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002820 def LXSD : DSForm_1<57, 2, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002821 "lxsd $vD, $src", IIC_LdStLFD, []>;
2822 // Load SP from src, convert it to DP, and place in dword[0]
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002823 def LXSSP : DSForm_1<57, 3, (outs vfrc:$vD), (ins memrix:$src),
Kit Bartonba532dc2016-03-08 03:49:13 +00002824 "lxssp $vD, $src", IIC_LdStLFD, []>;
2825
2826 // [PO T RA RB XO TX] almost equal to [PO S RA RB XO SX], but has different
2827 // "out" and "in" dag
2828 class X_XT6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2829 RegisterOperand vtype, list<dag> pattern>
Stefan Pintilie26d4f922018-03-26 17:39:18 +00002830 : XX1Form_memOp<opcode, xo, (outs vtype:$XT), (ins memrr:$src),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002831 !strconcat(opc, " $XT, $src"), IIC_LdStLFD, pattern>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002832
2833 // Load as Integer Byte/Halfword & Zero Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002834 def LXSIBZX : X_XT6_RA5_RB5<31, 781, "lxsibzx", vsfrc,
2835 [(set f64:$XT, (PPClxsizx xoaddr:$src, 1))]>;
2836 def LXSIHZX : X_XT6_RA5_RB5<31, 813, "lxsihzx", vsfrc,
2837 [(set f64:$XT, (PPClxsizx xoaddr:$src, 2))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002838
2839 // Load Vector Halfword*8/Byte*16 Indexed
2840 def LXVH8X : X_XT6_RA5_RB5<31, 812, "lxvh8x" , vsrc, []>;
2841 def LXVB16X : X_XT6_RA5_RB5<31, 876, "lxvb16x", vsrc, []>;
2842
2843 // Load Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002844 def LXVX : X_XT6_RA5_RB5<31, 268, "lxvx" , vsrc,
Zaara Syeda93297832017-05-24 17:50:37 +00002845 [(set v2f64:$XT, (load xaddr:$src))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002846 // Load Vector (Left-justified) with Length
Stefan Pintilie26d4f922018-03-26 17:39:18 +00002847 def LXVL : XX1Form_memOp<31, 269, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002848 "lxvl $XT, $src, $rB", IIC_LdStLoad,
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002849 [(set v4i32:$XT, (int_ppc_vsx_lxvl addr:$src, i64:$rB))]>;
Stefan Pintilie26d4f922018-03-26 17:39:18 +00002850 def LXVLL : XX1Form_memOp<31,301, (outs vsrc:$XT), (ins memr:$src, g8rc:$rB),
Zaara Syedaa19c9e62016-11-15 17:54:19 +00002851 "lxvll $XT, $src, $rB", IIC_LdStLoad,
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002852 [(set v4i32:$XT, (int_ppc_vsx_lxvll addr:$src, i64:$rB))]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002853
2854 // Load Vector Word & Splat Indexed
2855 def LXVWSX : X_XT6_RA5_RB5<31, 364, "lxvwsx" , vsrc, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002856 } // mayLoad
Kit Bartonba532dc2016-03-08 03:49:13 +00002857
Nemanja Ivanovic6354d232016-10-04 11:25:52 +00002858 // When adding new D-Form loads/stores, be sure to update the ImmToIdxMap in
2859 // PPCRegisterInfo::PPCRegisterInfo and maybe save yourself some debugging.
Sean Fertile3c8c3852017-01-26 18:59:15 +00002860 let mayStore = 1, mayLoad = 0 in {
Kit Bartonba532dc2016-03-08 03:49:13 +00002861 // Store Vector
2862 def STXV : DQ_RD6_RS5_DQ12<61, 5, (outs), (ins vsrc:$XT, memrix16:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002863 "stxv $XT, $dst", IIC_LdStSTFD, []>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002864 // Store DWord
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002865 def STXSD : DSForm_1<61, 2, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002866 "stxsd $vS, $dst", IIC_LdStSTFD, []>;
2867 // Convert DP of dword[0] to SP, and Store to dst
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002868 def STXSSP : DSForm_1<61, 3, (outs), (ins vfrc:$vS, memrix:$dst),
Kit Bartonba532dc2016-03-08 03:49:13 +00002869 "stxssp $vS, $dst", IIC_LdStSTFD, []>;
2870
2871 // [PO S RA RB XO SX]
2872 class X_XS6_RA5_RB5<bits<6> opcode, bits<10> xo, string opc,
2873 RegisterOperand vtype, list<dag> pattern>
Stefan Pintilie26d4f922018-03-26 17:39:18 +00002874 : XX1Form_memOp<opcode, xo, (outs), (ins vtype:$XT, memrr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002875 !strconcat(opc, " $XT, $dst"), IIC_LdStSTFD, pattern>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002876
2877 // Store as Integer Byte/Halfword Indexed
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002878 def STXSIBX : X_XS6_RA5_RB5<31, 909, "stxsibx" , vsfrc,
2879 [(PPCstxsix f64:$XT, xoaddr:$dst, 1)]>;
2880 def STXSIHX : X_XS6_RA5_RB5<31, 941, "stxsihx" , vsfrc,
2881 [(PPCstxsix f64:$XT, xoaddr:$dst, 2)]>;
2882 let isCodeGenOnly = 1 in {
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002883 def STXSIBXv : X_XS6_RA5_RB5<31, 909, "stxsibx" , vsrc, []>;
2884 def STXSIHXv : X_XS6_RA5_RB5<31, 941, "stxsihx" , vsrc, []>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002885 }
Kit Bartonba532dc2016-03-08 03:49:13 +00002886
2887 // Store Vector Halfword*8/Byte*16 Indexed
2888 def STXVH8X : X_XS6_RA5_RB5<31, 940, "stxvh8x" , vsrc, []>;
2889 def STXVB16X : X_XS6_RA5_RB5<31, 1004, "stxvb16x", vsrc, []>;
2890
2891 // Store Vector Indexed
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00002892 def STXVX : X_XS6_RA5_RB5<31, 396, "stxvx" , vsrc,
Zaara Syeda93297832017-05-24 17:50:37 +00002893 [(store v2f64:$XT, xaddr:$dst)]>;
Kit Bartonba532dc2016-03-08 03:49:13 +00002894
2895 // Store Vector (Left-justified) with Length
Stefan Pintilie26d4f922018-03-26 17:39:18 +00002896 def STXVL : XX1Form_memOp<31, 397, (outs),
2897 (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2898 "stxvl $XT, $dst, $rB", IIC_LdStLoad,
2899 [(int_ppc_vsx_stxvl v4i32:$XT, addr:$dst,
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002900 i64:$rB)]>;
Stefan Pintilie26d4f922018-03-26 17:39:18 +00002901 def STXVLL : XX1Form_memOp<31, 429, (outs),
2902 (ins vsrc:$XT, memr:$dst, g8rc:$rB),
2903 "stxvll $XT, $dst, $rB", IIC_LdStLoad,
2904 [(int_ppc_vsx_stxvll v4i32:$XT, addr:$dst,
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00002905 i64:$rB)]>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00002906 } // mayStore
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002907
Lei Huang451ef4a2017-08-14 18:09:29 +00002908 let Predicates = [IsLittleEndian] in {
Lei Huangcd4f3852018-03-12 19:26:18 +00002909 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002910 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 3))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002911 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002912 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 2))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002913 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002914 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 1))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002915 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002916 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 0))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002917 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002918 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 3)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002919 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002920 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 2)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002921 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002922 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 1)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002923 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002924 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 0)), VSFRC))>;
2925 }
2926
2927 let Predicates = [IsBigEndian] in {
Lei Huangcd4f3852018-03-12 19:26:18 +00002928 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002929 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 0))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002930 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002931 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 1))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002932 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002933 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 2))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002934 def: Pat<(f32 (PPCfcfids (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002935 (f32 (XSCVSPDPN (XVCVSXWSP (XXSPLTW $A, 3))))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002936 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002937 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 0)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002938 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002939 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 1)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002940 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002941 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 2)), VSFRC))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002942 def: Pat<(f64 (PPCfcfid (f64 (PPCmtvsra (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002943 (f64 (COPY_TO_REGCLASS (XVCVSXWDP (XXSPLTW $A, 3)), VSFRC))>;
2944 }
2945
Graham Yiu5cd044e2017-11-07 20:55:43 +00002946 // Alternate patterns for PPCmtvsrz where the output is v8i16 or v16i8 instead
2947 // of f64
2948 def : Pat<(v8i16 (PPCmtvsrz i32:$A)),
2949 (v8i16 (SUBREG_TO_REG (i64 1), (MTVSRWZ $A), sub_64))>;
2950 def : Pat<(v16i8 (PPCmtvsrz i32:$A)),
2951 (v16i8 (SUBREG_TO_REG (i64 1), (MTVSRWZ $A), sub_64))>;
2952
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002953 // Patterns for which instructions from ISA 3.0 are a better match
2954 let Predicates = [IsLittleEndian, HasP9Vector] in {
Lei Huangcd4f3852018-03-12 19:26:18 +00002955 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 0)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002956 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002957 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 1)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002958 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002959 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 2)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002960 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002961 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 3)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002962 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002963 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002964 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 12)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002965 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002966 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 8)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002967 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002968 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 4)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002969 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002970 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 0)))>;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002971 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
2972 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
2973 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
2974 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
2975 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
2976 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
2977 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
2978 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
2979 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
2980 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
2981 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
2982 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
2983 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
2984 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
2985 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
2986 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
2987 } // IsLittleEndian, HasP9Vector
2988
2989 let Predicates = [IsBigEndian, HasP9Vector] in {
Lei Huangcd4f3852018-03-12 19:26:18 +00002990 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 0)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002991 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 0)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002992 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 1)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002993 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 4)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002994 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 2)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002995 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 8)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002996 def : Pat<(f32 (PPCfcfidus (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 3)))))),
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00002997 (f32 (XSCVUXDSP (XXEXTRACTUW $A, 12)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00002998 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 0)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00002999 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 0)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00003000 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 1)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00003001 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 4)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00003002 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 2)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00003003 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 8)))>;
Lei Huangcd4f3852018-03-12 19:26:18 +00003004 def : Pat<(f64 (PPCfcfidu (f64 (PPCmtvsrz (i32 (extractelt v4i32:$A, 3)))))),
Lei Huang451ef4a2017-08-14 18:09:29 +00003005 (f64 (XSCVUXDDP (XXEXTRACTUW $A, 12)))>;
Nemanja Ivanovicb43bb612016-07-12 21:00:10 +00003006 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 0)),
3007 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 0))>;
3008 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 1)),
3009 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 4))>;
3010 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 2)),
3011 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 8))>;
3012 def : Pat<(v4i32 (insertelt v4i32:$A, i32:$B, 3)),
3013 (v4i32 (XXINSERTW v4i32:$A, AlignValues.I32_TO_BE_WORD1, 12))>;
3014 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 0)),
3015 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 0))>;
3016 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 1)),
3017 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 4))>;
3018 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 2)),
3019 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 8))>;
3020 def : Pat<(v4f32 (insertelt v4f32:$A, f32:$B, 3)),
3021 (v4f32 (XXINSERTW v4f32:$A, AlignValues.F32_TO_BE_WORD1, 12))>;
3022 } // IsLittleEndian, HasP9Vector
Nemanja Ivanovic6e7879c2016-09-22 09:52:19 +00003023
Zaara Syeda93297832017-05-24 17:50:37 +00003024 // D-Form Load/Store
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003025 def : Pat<(v4i32 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
3026 def : Pat<(v4f32 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
3027 def : Pat<(v2i64 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
3028 def : Pat<(v2f64 (quadwOffsetLoad iqaddr:$src)), (LXV memrix16:$src)>;
Lei Huang6d1596a2018-03-19 18:52:20 +00003029 def : Pat<(f128 (quadwOffsetLoad iqaddr:$src)),
3030 (COPY_TO_REGCLASS (LXV memrix16:$src), VRRC)>;
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003031 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x iqaddr:$src)), (LXV memrix16:$src)>;
3032 def : Pat<(v2f64 (int_ppc_vsx_lxvd2x iqaddr:$src)), (LXV memrix16:$src)>;
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00003033
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003034 def : Pat<(quadwOffsetStore v4f32:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
3035 def : Pat<(quadwOffsetStore v4i32:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
3036 def : Pat<(quadwOffsetStore v2f64:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
Lei Huang6d1596a2018-03-19 18:52:20 +00003037 def : Pat<(quadwOffsetStore f128:$rS, iqaddr:$dst),
3038 (STXV (COPY_TO_REGCLASS $rS, VSRC), memrix16:$dst)>;
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003039 def : Pat<(quadwOffsetStore v2i64:$rS, iqaddr:$dst), (STXV $rS, memrix16:$dst)>;
3040 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, iqaddr:$dst),
Zaara Syeda93297832017-05-24 17:50:37 +00003041 (STXV $rS, memrix16:$dst)>;
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003042 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, iqaddr:$dst),
Zaara Syeda93297832017-05-24 17:50:37 +00003043 (STXV $rS, memrix16:$dst)>;
3044
3045
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003046 def : Pat<(v2f64 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
3047 def : Pat<(v2i64 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
3048 def : Pat<(v4f32 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
3049 def : Pat<(v4i32 (nonQuadwOffsetLoad xoaddr:$src)), (LXVX xoaddr:$src)>;
3050 def : Pat<(v4i32 (int_ppc_vsx_lxvw4x xoaddr:$src)), (LXVX xoaddr:$src)>;
3051 def : Pat<(v2f64 (int_ppc_vsx_lxvd2x xoaddr:$src)), (LXVX xoaddr:$src)>;
Lei Huang6d1596a2018-03-19 18:52:20 +00003052 def : Pat<(f128 (nonQuadwOffsetLoad xoaddr:$src)),
3053 (COPY_TO_REGCLASS (LXVX xoaddr:$src), VRRC)>;
3054 def : Pat<(nonQuadwOffsetStore f128:$rS, xoaddr:$dst),
3055 (STXVX (COPY_TO_REGCLASS $rS, VSRC), xoaddr:$dst)>;
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003056 def : Pat<(nonQuadwOffsetStore v2f64:$rS, xoaddr:$dst),
3057 (STXVX $rS, xoaddr:$dst)>;
3058 def : Pat<(nonQuadwOffsetStore v2i64:$rS, xoaddr:$dst),
3059 (STXVX $rS, xoaddr:$dst)>;
3060 def : Pat<(nonQuadwOffsetStore v4f32:$rS, xoaddr:$dst),
3061 (STXVX $rS, xoaddr:$dst)>;
3062 def : Pat<(nonQuadwOffsetStore v4i32:$rS, xoaddr:$dst),
3063 (STXVX $rS, xoaddr:$dst)>;
3064 def : Pat<(int_ppc_vsx_stxvw4x v4i32:$rS, xoaddr:$dst),
3065 (STXVX $rS, xoaddr:$dst)>;
3066 def : Pat<(int_ppc_vsx_stxvd2x v2f64:$rS, xoaddr:$dst),
3067 (STXVX $rS, xoaddr:$dst)>;
Zaara Syedab2595b92018-08-08 15:20:43 +00003068
3069 let AddedComplexity = 400 in {
3070 // LIWAX - This instruction is used for sign extending i32 -> i64.
3071 // LIWZX - This instruction will be emitted for i32, f32, and when
3072 // zero-extending i32 to i64 (zext i32 -> i64).
3073 let Predicates = [IsLittleEndian] in {
3074
3075 def : Pat<(v2i64 (scalar_to_vector (i64 (sextloadi32 xoaddr:$src)))),
3076 (v2i64 (XXPERMDIs
3077 (COPY_TO_REGCLASS (LIWAX xoaddr:$src), VSRC), 2))>;
3078
3079 def : Pat<(v2i64 (scalar_to_vector (i64 (zextloadi32 xoaddr:$src)))),
3080 (v2i64 (XXPERMDIs
3081 (COPY_TO_REGCLASS (LIWZX xoaddr:$src), VSRC), 2))>;
3082
3083 def : Pat<(v4i32 (scalar_to_vector (i32 (load xoaddr:$src)))),
3084 (v4i32 (XXPERMDIs
3085 (COPY_TO_REGCLASS (LIWZX xoaddr:$src), VSRC), 2))>;
3086
3087 def : Pat<(v4f32 (scalar_to_vector (f32 (load xoaddr:$src)))),
3088 (v4f32 (XXPERMDIs
3089 (COPY_TO_REGCLASS (LIWZX xoaddr:$src), VSRC), 2))>;
3090 }
3091
3092 let Predicates = [IsBigEndian] in {
3093 def : Pat<(v2i64 (scalar_to_vector (i64 (sextloadi32 xoaddr:$src)))),
3094 (v2i64 (COPY_TO_REGCLASS (LIWAX xoaddr:$src), VSRC))>;
3095
3096 def : Pat<(v2i64 (scalar_to_vector (i64 (zextloadi32 xoaddr:$src)))),
3097 (v2i64 (COPY_TO_REGCLASS (LIWZX xoaddr:$src), VSRC))>;
3098
3099 def : Pat<(v4i32 (scalar_to_vector (i32 (load xoaddr:$src)))),
3100 (v4i32 (XXSLDWIs
3101 (COPY_TO_REGCLASS (LIWZX xoaddr:$src), VSRC), 1))>;
3102
3103 def : Pat<(v4f32 (scalar_to_vector (f32 (load xoaddr:$src)))),
3104 (v4f32 (XXSLDWIs
3105 (COPY_TO_REGCLASS (LIWZX xoaddr:$src), VSRC), 1))>;
3106 }
3107
3108 }
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003109
3110 // Build vectors from i8 loads
3111 def : Pat<(v16i8 (scalar_to_vector ScalarLoads.Li8)),
3112 (v16i8 (VSPLTBs 7, (LXSIBZX xoaddr:$src)))>;
3113 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.ZELi8)),
3114 (v8i16 (VSPLTHs 3, (LXSIBZX xoaddr:$src)))>;
3115 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi8)),
3116 (v4i32 (XXSPLTWs (LXSIBZX xoaddr:$src), 1))>;
3117 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi8i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00003118 (v2i64 (XXPERMDIs (LXSIBZX xoaddr:$src), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003119 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi8)),
3120 (v4i32 (XXSPLTWs (VEXTSB2Ws (LXSIBZX xoaddr:$src)), 1))>;
3121 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi8i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00003122 (v2i64 (XXPERMDIs (VEXTSB2Ds (LXSIBZX xoaddr:$src)), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003123
3124 // Build vectors from i16 loads
3125 def : Pat<(v8i16 (scalar_to_vector ScalarLoads.Li16)),
3126 (v8i16 (VSPLTHs 3, (LXSIHZX xoaddr:$src)))>;
3127 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.ZELi16)),
3128 (v4i32 (XXSPLTWs (LXSIHZX xoaddr:$src), 1))>;
3129 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.ZELi16i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00003130 (v2i64 (XXPERMDIs (LXSIHZX xoaddr:$src), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003131 def : Pat<(v4i32 (scalar_to_vector ScalarLoads.SELi16)),
3132 (v4i32 (XXSPLTWs (VEXTSH2Ws (LXSIHZX xoaddr:$src)), 1))>;
3133 def : Pat<(v2i64 (scalar_to_vector ScalarLoads.SELi16i64)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00003134 (v2i64 (XXPERMDIs (VEXTSH2Ds (LXSIHZX xoaddr:$src)), 0))>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003135
3136 let Predicates = [IsBigEndian, HasP9Vector] in {
3137 // Scalar stores of i8
3138 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003139 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 9)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003140 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003141 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 10)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003142 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003143 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 11)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003144 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003145 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 12)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003146 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003147 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 13)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003148 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003149 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 14)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003150 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003151 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 15)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003152 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003153 (STXSIBXv (COPY_TO_REGCLASS $S, VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003154 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003155 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 1)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003156 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003157 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 2)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003158 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003159 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 3)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003160 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003161 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 4)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003162 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003163 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 5)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003164 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003165 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 6)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003166 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003167 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 7)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003168 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003169 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 8)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003170
3171 // Scalar stores of i16
3172 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003173 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 10)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003174 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003175 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 12)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003176 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003177 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 14)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003178 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003179 (STXSIHXv (COPY_TO_REGCLASS $S, VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003180 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003181 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 2)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003182 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003183 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 4)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003184 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003185 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 6)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003186 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003187 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 8)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003188 } // IsBigEndian, HasP9Vector
3189
3190 let Predicates = [IsLittleEndian, HasP9Vector] in {
3191 // Scalar stores of i8
3192 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 0)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003193 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 8)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003194 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 1)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003195 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 7)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003196 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 2)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003197 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 6)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003198 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 3)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003199 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 5)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003200 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 4)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003201 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 4)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003202 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 5)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003203 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 3)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003204 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 6)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003205 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 2)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003206 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 7)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003207 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 1)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003208 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 8)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003209 (STXSIBXv (COPY_TO_REGCLASS $S, VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003210 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 9)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003211 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 15)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003212 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 10)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003213 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 14)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003214 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 11)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003215 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 13)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003216 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 12)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003217 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 12)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003218 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 13)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003219 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 11)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003220 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 14)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003221 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 10)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003222 def : Pat<(truncstorei8 (i32 (vector_extract v16i8:$S, 15)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003223 (STXSIBXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 9)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003224
3225 // Scalar stores of i16
3226 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 0)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003227 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 8)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003228 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 1)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003229 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 6)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003230 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 2)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003231 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 4)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003232 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 3)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003233 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 2)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003234 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 4)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003235 (STXSIHXv (COPY_TO_REGCLASS $S, VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003236 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 5)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003237 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 14)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003238 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 6)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003239 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 12)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003240 def : Pat<(truncstorei16 (i32 (vector_extract v8i16:$S, 7)), xoaddr:$dst),
Stefan Pintiliee1d79a82019-03-26 20:28:21 +00003241 (STXSIHXv (COPY_TO_REGCLASS (v16i8 (VSLDOI $S, $S, 10)), VSRC), xoaddr:$dst)>;
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003242 } // IsLittleEndian, HasP9Vector
3243
Sean Fertile1c4109b2016-12-09 17:21:42 +00003244
Nemanja Ivanovic11049f82016-10-04 06:59:23 +00003245 // Vector sign extensions
3246 def : Pat<(f64 (PPCVexts f64:$A, 1)),
3247 (f64 (COPY_TO_REGCLASS (VEXTSB2Ds $A), VSFRC))>;
3248 def : Pat<(f64 (PPCVexts f64:$A, 2)),
3249 (f64 (COPY_TO_REGCLASS (VEXTSH2Ds $A), VSFRC))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003250
Jinsong Jic7b43b92018-12-13 15:12:57 +00003251 def DFLOADf32 : PPCPostRAExpPseudo<(outs vssrc:$XT), (ins memrix:$src),
3252 "#DFLOADf32",
3253 [(set f32:$XT, (load ixaddr:$src))]>;
3254 def DFLOADf64 : PPCPostRAExpPseudo<(outs vsfrc:$XT), (ins memrix:$src),
3255 "#DFLOADf64",
3256 [(set f64:$XT, (load ixaddr:$src))]>;
3257 def DFSTOREf32 : PPCPostRAExpPseudo<(outs), (ins vssrc:$XT, memrix:$dst),
3258 "#DFSTOREf32",
3259 [(store f32:$XT, ixaddr:$dst)]>;
3260 def DFSTOREf64 : PPCPostRAExpPseudo<(outs), (ins vsfrc:$XT, memrix:$dst),
3261 "#DFSTOREf64",
3262 [(store f64:$XT, ixaddr:$dst)]>;
3263
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003264 def : Pat<(f64 (extloadf32 ixaddr:$src)),
3265 (COPY_TO_REGCLASS (DFLOADf32 ixaddr:$src), VSFRC)>;
Lei Huangcd4f3852018-03-12 19:26:18 +00003266 def : Pat<(f32 (fpround (f64 (extloadf32 ixaddr:$src)))),
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003267 (f32 (DFLOADf32 ixaddr:$src))>;
Lei Huang10367eb2018-04-12 18:00:14 +00003268
Zaara Syedab2595b92018-08-08 15:20:43 +00003269
3270 let AddedComplexity = 400 in {
3271 // The following pseudoinstructions are used to ensure the utilization
3272 // of all 64 VSX registers.
3273 let Predicates = [IsLittleEndian, HasP9Vector] in {
3274 def : Pat<(v2i64 (scalar_to_vector (i64 (load ixaddr:$src)))),
3275 (v2i64 (XXPERMDIs
3276 (COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC), 2))>;
3277 def : Pat<(v2i64 (scalar_to_vector (i64 (load xaddr:$src)))),
3278 (v2i64 (XXPERMDIs
3279 (COPY_TO_REGCLASS (XFLOADf64 xaddr:$src), VSRC), 2))>;
3280
3281 def : Pat<(v2f64 (scalar_to_vector (f64 (load ixaddr:$src)))),
3282 (v2f64 (XXPERMDIs
3283 (COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC), 2))>;
3284 def : Pat<(v2f64 (scalar_to_vector (f64 (load xaddr:$src)))),
3285 (v2f64 (XXPERMDIs
3286 (COPY_TO_REGCLASS (XFLOADf64 xaddr:$src), VSRC), 2))>;
Nemanja Ivanovicb9b75de2019-01-24 23:44:28 +00003287 def : Pat<(store (i64 (extractelt v2i64:$A, 0)), xaddr:$src),
3288 (XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
3289 sub_64), xaddr:$src)>;
3290 def : Pat<(store (f64 (extractelt v2f64:$A, 0)), xaddr:$src),
3291 (XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
3292 sub_64), xaddr:$src)>;
3293 def : Pat<(store (i64 (extractelt v2i64:$A, 1)), xaddr:$src),
3294 (XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddr:$src)>;
3295 def : Pat<(store (f64 (extractelt v2f64:$A, 1)), xaddr:$src),
3296 (XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddr:$src)>;
3297 def : Pat<(store (i64 (extractelt v2i64:$A, 0)), ixaddr:$src),
3298 (DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
3299 sub_64), ixaddr:$src)>;
3300 def : Pat<(store (f64 (extractelt v2f64:$A, 0)), ixaddr:$src),
3301 (DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2), sub_64),
3302 ixaddr:$src)>;
3303 def : Pat<(store (i64 (extractelt v2i64:$A, 1)), ixaddr:$src),
3304 (DFSTOREf64 (EXTRACT_SUBREG $A, sub_64), ixaddr:$src)>;
3305 def : Pat<(store (f64 (extractelt v2f64:$A, 1)), ixaddr:$src),
3306 (DFSTOREf64 (EXTRACT_SUBREG $A, sub_64), ixaddr:$src)>;
3307 } // IsLittleEndian, HasP9Vector
Zaara Syedab2595b92018-08-08 15:20:43 +00003308
3309 let Predicates = [IsBigEndian, HasP9Vector] in {
3310 def : Pat<(v2i64 (scalar_to_vector (i64 (load ixaddr:$src)))),
3311 (v2i64 (COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC))>;
3312 def : Pat<(v2i64 (scalar_to_vector (i64 (load xaddr:$src)))),
3313 (v2i64 (COPY_TO_REGCLASS (XFLOADf64 xaddr:$src), VSRC))>;
3314
3315 def : Pat<(v2f64 (scalar_to_vector (f64 (load ixaddr:$src)))),
3316 (v2f64 (COPY_TO_REGCLASS (DFLOADf64 ixaddr:$src), VSRC))>;
3317 def : Pat<(v2f64 (scalar_to_vector (f64 (load xaddr:$src)))),
3318 (v2f64 (COPY_TO_REGCLASS (XFLOADf64 xaddr:$src), VSRC))>;
Nemanja Ivanovicb9b75de2019-01-24 23:44:28 +00003319 def : Pat<(store (i64 (extractelt v2i64:$A, 1)), xaddr:$src),
3320 (XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
3321 sub_64), xaddr:$src)>;
3322 def : Pat<(store (f64 (extractelt v2f64:$A, 1)), xaddr:$src),
3323 (XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
3324 sub_64), xaddr:$src)>;
3325 def : Pat<(store (i64 (extractelt v2i64:$A, 0)), xaddr:$src),
3326 (XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddr:$src)>;
3327 def : Pat<(store (f64 (extractelt v2f64:$A, 0)), xaddr:$src),
3328 (XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xaddr:$src)>;
3329 def : Pat<(store (i64 (extractelt v2i64:$A, 1)), ixaddr:$src),
3330 (DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
3331 sub_64), ixaddr:$src)>;
3332 def : Pat<(store (f64 (extractelt v2f64:$A, 1)), ixaddr:$src),
3333 (DFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2),
3334 sub_64), ixaddr:$src)>;
3335 def : Pat<(store (i64 (extractelt v2i64:$A, 0)), ixaddr:$src),
3336 (DFSTOREf64 (EXTRACT_SUBREG $A, sub_64), ixaddr:$src)>;
3337 def : Pat<(store (f64 (extractelt v2f64:$A, 0)), ixaddr:$src),
3338 (DFSTOREf64 (EXTRACT_SUBREG $A, sub_64), ixaddr:$src)>;
3339 } // IsBigEndian, HasP9Vector
Zaara Syedab2595b92018-08-08 15:20:43 +00003340 }
3341
Lei Huang8b0da652018-05-23 19:31:54 +00003342 let Predicates = [IsBigEndian, HasP9Vector] in {
Lei Huang89901682018-05-23 18:36:51 +00003343
Lei Huang8b0da652018-05-23 19:31:54 +00003344 // (Un)Signed DWord vector extract -> QP
3345 def : Pat<(f128 (sint_to_fp (i64 (extractelt v2i64:$src, 0)))),
3346 (f128 (XSCVSDQP (COPY_TO_REGCLASS $src, VFRC)))>;
3347 def : Pat<(f128 (sint_to_fp (i64 (extractelt v2i64:$src, 1)))),
3348 (f128 (XSCVSDQP
3349 (EXTRACT_SUBREG (XXPERMDI $src, $src, 3), sub_64)))>;
3350 def : Pat<(f128 (uint_to_fp (i64 (extractelt v2i64:$src, 0)))),
3351 (f128 (XSCVUDQP (COPY_TO_REGCLASS $src, VFRC)))>;
3352 def : Pat<(f128 (uint_to_fp (i64 (extractelt v2i64:$src, 1)))),
3353 (f128 (XSCVUDQP
3354 (EXTRACT_SUBREG (XXPERMDI $src, $src, 3), sub_64)))>;
3355
3356 // (Un)Signed Word vector extract -> QP
3357 def : Pat<(f128 (sint_to_fp (i32 (extractelt v4i32:$src, 1)))),
3358 (f128 (XSCVSDQP (EXTRACT_SUBREG (VEXTSW2D $src), sub_64)))>;
3359 foreach Idx = [0,2,3] in {
3360 def : Pat<(f128 (sint_to_fp (i32 (extractelt v4i32:$src, Idx)))),
3361 (f128 (XSCVSDQP (EXTRACT_SUBREG
3362 (VEXTSW2D (VSPLTW Idx, $src)), sub_64)))>;
3363 }
3364 foreach Idx = 0-3 in {
3365 def : Pat<(f128 (uint_to_fp (i32 (extractelt v4i32:$src, Idx)))),
3366 (f128 (XSCVUDQP (XXEXTRACTUW $src, !shl(Idx, 2))))>;
3367 }
3368
Lei Huang651be442018-05-28 16:43:29 +00003369 // (Un)Signed HWord vector extract -> QP
3370 foreach Idx = 0-7 in {
3371 def : Pat<(f128 (sint_to_fp
3372 (i32 (sext_inreg
3373 (vector_extract v8i16:$src, Idx), i16)))),
3374 (f128 (XSCVSDQP (EXTRACT_SUBREG
3375 (VEXTSH2D (VEXTRACTUH !add(Idx, Idx), $src)),
3376 sub_64)))>;
3377 // The SDAG adds the `and` since an `i16` is being extracted as an `i32`.
3378 def : Pat<(f128 (uint_to_fp
3379 (and (i32 (vector_extract v8i16:$src, Idx)), 65535))),
3380 (f128 (XSCVUDQP (EXTRACT_SUBREG
3381 (VEXTRACTUH !add(Idx, Idx), $src), sub_64)))>;
3382 }
3383
3384 // (Un)Signed Byte vector extract -> QP
3385 foreach Idx = 0-15 in {
3386 def : Pat<(f128 (sint_to_fp
3387 (i32 (sext_inreg (vector_extract v16i8:$src, Idx),
3388 i8)))),
3389 (f128 (XSCVSDQP (EXTRACT_SUBREG
3390 (VEXTSB2D (VEXTRACTUB Idx, $src)), sub_64)))>;
3391 def : Pat<(f128 (uint_to_fp
3392 (and (i32 (vector_extract v16i8:$src, Idx)), 255))),
3393 (f128 (XSCVUDQP
3394 (EXTRACT_SUBREG (VEXTRACTUB Idx, $src), sub_64)))>;
3395 }
Lei Huang66e22c22018-07-05 07:46:01 +00003396
3397 // Unsiged int in vsx register -> QP
3398 def : Pat<(f128 (uint_to_fp (i32 (PPCmfvsr f64:$src)))),
3399 (f128 (XSCVUDQP
3400 (XXEXTRACTUW (SUBREG_TO_REG (i64 1), $src, sub_64), 4)))>;
Lei Huang8b0da652018-05-23 19:31:54 +00003401 } // IsBigEndian, HasP9Vector
3402
3403 let Predicates = [IsLittleEndian, HasP9Vector] in {
3404
3405 // (Un)Signed DWord vector extract -> QP
Lei Huang89901682018-05-23 18:36:51 +00003406 def : Pat<(f128 (sint_to_fp (i64 (extractelt v2i64:$src, 0)))),
3407 (f128 (XSCVSDQP
3408 (EXTRACT_SUBREG (XXPERMDI $src, $src, 3), sub_64)))>;
3409 def : Pat<(f128 (sint_to_fp (i64 (extractelt v2i64:$src, 1)))),
3410 (f128 (XSCVSDQP (COPY_TO_REGCLASS $src, VFRC)))>;
3411 def : Pat<(f128 (uint_to_fp (i64 (extractelt v2i64:$src, 0)))),
3412 (f128 (XSCVUDQP
3413 (EXTRACT_SUBREG (XXPERMDI $src, $src, 3), sub_64)))>;
3414 def : Pat<(f128 (uint_to_fp (i64 (extractelt v2i64:$src, 1)))),
3415 (f128 (XSCVUDQP (COPY_TO_REGCLASS $src, VFRC)))>;
Lei Huang8b0da652018-05-23 19:31:54 +00003416
3417 // (Un)Signed Word vector extract -> QP
3418 foreach Idx = [[0,3],[1,2],[3,0]] in {
3419 def : Pat<(f128 (sint_to_fp (i32 (extractelt v4i32:$src, !head(Idx))))),
3420 (f128 (XSCVSDQP (EXTRACT_SUBREG
3421 (VEXTSW2D (VSPLTW !head(!tail(Idx)), $src)),
3422 sub_64)))>;
3423 }
3424 def : Pat<(f128 (sint_to_fp (i32 (extractelt v4i32:$src, 2)))),
3425 (f128 (XSCVSDQP (EXTRACT_SUBREG (VEXTSW2D $src), sub_64)))>;
3426
3427 foreach Idx = [[0,12],[1,8],[2,4],[3,0]] in {
3428 def : Pat<(f128 (uint_to_fp (i32 (extractelt v4i32:$src, !head(Idx))))),
3429 (f128 (XSCVUDQP (XXEXTRACTUW $src, !head(!tail(Idx)))))>;
3430 }
Lei Huang651be442018-05-28 16:43:29 +00003431
3432 // (Un)Signed HWord vector extract -> QP
3433 // The Nested foreach lists identifies the vector element and corresponding
3434 // register byte location.
3435 foreach Idx = [[0,14],[1,12],[2,10],[3,8],[4,6],[5,4],[6,2],[7,0]] in {
3436 def : Pat<(f128 (sint_to_fp
3437 (i32 (sext_inreg
3438 (vector_extract v8i16:$src, !head(Idx)), i16)))),
3439 (f128 (XSCVSDQP
3440 (EXTRACT_SUBREG (VEXTSH2D
3441 (VEXTRACTUH !head(!tail(Idx)), $src)),
3442 sub_64)))>;
3443 def : Pat<(f128 (uint_to_fp
3444 (and (i32 (vector_extract v8i16:$src, !head(Idx))),
3445 65535))),
3446 (f128 (XSCVUDQP (EXTRACT_SUBREG
3447 (VEXTRACTUH !head(!tail(Idx)), $src), sub_64)))>;
3448 }
3449
3450 // (Un)Signed Byte vector extract -> QP
3451 foreach Idx = [[0,15],[1,14],[2,13],[3,12],[4,11],[5,10],[6,9],[7,8],[8,7],
3452 [9,6],[10,5],[11,4],[12,3],[13,2],[14,1],[15,0]] in {
3453 def : Pat<(f128 (sint_to_fp
3454 (i32 (sext_inreg
3455 (vector_extract v16i8:$src, !head(Idx)), i8)))),
3456 (f128 (XSCVSDQP
3457 (EXTRACT_SUBREG
3458 (VEXTSB2D (VEXTRACTUB !head(!tail(Idx)), $src)),
3459 sub_64)))>;
3460 def : Pat<(f128 (uint_to_fp
3461 (and (i32 (vector_extract v16i8:$src, !head(Idx))),
3462 255))),
3463 (f128 (XSCVUDQP
3464 (EXTRACT_SUBREG
3465 (VEXTRACTUB !head(!tail(Idx)), $src), sub_64)))>;
3466 }
Lei Huang66e22c22018-07-05 07:46:01 +00003467
3468 // Unsiged int in vsx register -> QP
3469 def : Pat<(f128 (uint_to_fp (i32 (PPCmfvsr f64:$src)))),
3470 (f128 (XSCVUDQP
3471 (XXEXTRACTUW (SUBREG_TO_REG (i64 1), $src, sub_64), 8)))>;
Lei Huang8b0da652018-05-23 19:31:54 +00003472 } // IsLittleEndian, HasP9Vector
Lei Huang89901682018-05-23 18:36:51 +00003473
Lei Huang10367eb2018-04-12 18:00:14 +00003474 // Convert (Un)Signed DWord in memory -> QP
3475 def : Pat<(f128 (sint_to_fp (i64 (load xaddr:$src)))),
3476 (f128 (XSCVSDQP (LXSDX xaddr:$src)))>;
3477 def : Pat<(f128 (sint_to_fp (i64 (load ixaddr:$src)))),
3478 (f128 (XSCVSDQP (LXSD ixaddr:$src)))>;
3479 def : Pat<(f128 (uint_to_fp (i64 (load xaddr:$src)))),
3480 (f128 (XSCVUDQP (LXSDX xaddr:$src)))>;
3481 def : Pat<(f128 (uint_to_fp (i64 (load ixaddr:$src)))),
3482 (f128 (XSCVUDQP (LXSD ixaddr:$src)))>;
3483
Lei Huang192c6cc2018-04-18 17:41:46 +00003484 // Convert Unsigned HWord in memory -> QP
3485 def : Pat<(f128 (uint_to_fp ScalarLoads.ZELi16)),
3486 (f128 (XSCVUDQP (LXSIHZX xaddr:$src)))>;
3487
3488 // Convert Unsigned Byte in memory -> QP
3489 def : Pat<(f128 (uint_to_fp ScalarLoads.ZELi8)),
3490 (f128 (XSCVUDQP (LXSIBZX xoaddr:$src)))>;
3491
Lei Huangc517e952018-05-08 18:23:31 +00003492 // Truncate & Convert QP -> (Un)Signed (D)Word.
3493 def : Pat<(i64 (fp_to_sint f128:$src)), (i64 (MFVRD (XSCVQPSDZ $src)))>;
3494 def : Pat<(i64 (fp_to_uint f128:$src)), (i64 (MFVRD (XSCVQPUDZ $src)))>;
Lei Huang63642882018-05-08 18:34:00 +00003495 def : Pat<(i32 (fp_to_sint f128:$src)),
3496 (i32 (MFVSRWZ (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC)))>;
3497 def : Pat<(i32 (fp_to_uint f128:$src)),
3498 (i32 (MFVSRWZ (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC)))>;
Lei Huangc517e952018-05-08 18:23:31 +00003499
Lei Huange41e3d32018-05-08 18:52:06 +00003500 // Instructions for store(fptosi).
Lei Huangc29229a2018-05-08 17:36:40 +00003501 // The 8-byte version is repeated here due to availability of D-Form STXSD.
3502 def : Pat<(PPCstore_scal_int_from_vsr
Lei Huangc517e952018-05-08 18:23:31 +00003503 (f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xaddr:$dst, 8),
3504 (STXSDX (COPY_TO_REGCLASS (XSCVQPSDZ f128:$src), VFRC),
3505 xaddr:$dst)>;
3506 def : Pat<(PPCstore_scal_int_from_vsr
3507 (f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), ixaddr:$dst, 8),
3508 (STXSD (COPY_TO_REGCLASS (XSCVQPSDZ f128:$src), VFRC),
3509 ixaddr:$dst)>;
3510 def : Pat<(PPCstore_scal_int_from_vsr
Lei Huang63642882018-05-08 18:34:00 +00003511 (f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xoaddr:$dst, 4),
3512 (STXSIWX (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC), xoaddr:$dst)>;
3513 def : Pat<(PPCstore_scal_int_from_vsr
Lei Huange41e3d32018-05-08 18:52:06 +00003514 (f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xoaddr:$dst, 2),
3515 (STXSIHX (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC), xoaddr:$dst)>;
3516 def : Pat<(PPCstore_scal_int_from_vsr
3517 (f64 (PPCcv_fp_to_sint_in_vsr f128:$src)), xoaddr:$dst, 1),
3518 (STXSIBX (COPY_TO_REGCLASS (XSCVQPSWZ $src), VFRC), xoaddr:$dst)>;
3519 def : Pat<(PPCstore_scal_int_from_vsr
Lei Huangc29229a2018-05-08 17:36:40 +00003520 (f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), xaddr:$dst, 8),
3521 (STXSDX (XSCVDPSXDS f64:$src), xaddr:$dst)>;
3522 def : Pat<(PPCstore_scal_int_from_vsr
3523 (f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), ixaddr:$dst, 8),
3524 (STXSD (XSCVDPSXDS f64:$src), ixaddr:$dst)>;
3525 def : Pat<(PPCstore_scal_int_from_vsr
3526 (f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), xoaddr:$dst, 2),
3527 (STXSIHX (XSCVDPSXWS f64:$src), xoaddr:$dst)>;
3528 def : Pat<(PPCstore_scal_int_from_vsr
3529 (f64 (PPCcv_fp_to_sint_in_vsr f64:$src)), xoaddr:$dst, 1),
3530 (STXSIBX (XSCVDPSXWS f64:$src), xoaddr:$dst)>;
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00003531
Lei Huange41e3d32018-05-08 18:52:06 +00003532 // Instructions for store(fptoui).
Lei Huangc29229a2018-05-08 17:36:40 +00003533 def : Pat<(PPCstore_scal_int_from_vsr
Lei Huangc517e952018-05-08 18:23:31 +00003534 (f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xaddr:$dst, 8),
3535 (STXSDX (COPY_TO_REGCLASS (XSCVQPUDZ f128:$src), VFRC),
3536 xaddr:$dst)>;
3537 def : Pat<(PPCstore_scal_int_from_vsr
3538 (f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), ixaddr:$dst, 8),
3539 (STXSD (COPY_TO_REGCLASS (XSCVQPUDZ f128:$src), VFRC),
3540 ixaddr:$dst)>;
3541 def : Pat<(PPCstore_scal_int_from_vsr
Lei Huang63642882018-05-08 18:34:00 +00003542 (f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xoaddr:$dst, 4),
3543 (STXSIWX (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC), xoaddr:$dst)>;
3544 def : Pat<(PPCstore_scal_int_from_vsr
Lei Huange41e3d32018-05-08 18:52:06 +00003545 (f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xoaddr:$dst, 2),
3546 (STXSIHX (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC), xoaddr:$dst)>;
3547 def : Pat<(PPCstore_scal_int_from_vsr
3548 (f64 (PPCcv_fp_to_uint_in_vsr f128:$src)), xoaddr:$dst, 1),
3549 (STXSIBX (COPY_TO_REGCLASS (XSCVQPUWZ $src), VFRC), xoaddr:$dst)>;
3550 def : Pat<(PPCstore_scal_int_from_vsr
Lei Huangc29229a2018-05-08 17:36:40 +00003551 (f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), xaddr:$dst, 8),
3552 (STXSDX (XSCVDPUXDS f64:$src), xaddr:$dst)>;
3553 def : Pat<(PPCstore_scal_int_from_vsr
3554 (f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), ixaddr:$dst, 8),
3555 (STXSD (XSCVDPUXDS f64:$src), ixaddr:$dst)>;
3556 def : Pat<(PPCstore_scal_int_from_vsr
3557 (f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), xoaddr:$dst, 2),
3558 (STXSIHX (XSCVDPUXWS f64:$src), xoaddr:$dst)>;
3559 def : Pat<(PPCstore_scal_int_from_vsr
3560 (f64 (PPCcv_fp_to_uint_in_vsr f64:$src)), xoaddr:$dst, 1),
3561 (STXSIBX (XSCVDPUXWS f64:$src), xoaddr:$dst)>;
3562
Lei Huang6270ab62018-07-04 21:59:16 +00003563 // Round & Convert QP -> DP/SP
3564 def : Pat<(f64 (fpround f128:$src)), (f64 (XSCVQPDP $src))>;
3565 def : Pat<(f32 (fpround f128:$src)), (f32 (XSRSP (XSCVQPDPO $src)))>;
Lei Huangd17c39c2018-07-05 04:18:37 +00003566
3567 // Convert SP -> QP
3568 def : Pat<(f128 (fpextend f32:$src)),
3569 (f128 (XSCVDPQP (COPY_TO_REGCLASS $src, VFRC)))>;
3570
Lei Huangc29229a2018-05-08 17:36:40 +00003571} // end HasP9Vector, AddedComplexity
Lei Huang6270ab62018-07-04 21:59:16 +00003572
Lei Huanga855e172018-07-05 06:21:37 +00003573let AddedComplexity = 400 in {
3574 let Predicates = [IsISA3_0, HasP9Vector, HasDirectMove, IsBigEndian] in {
3575 def : Pat<(f128 (PPCbuild_fp128 i64:$rB, i64:$rA)),
3576 (f128 (COPY_TO_REGCLASS (MTVSRDD $rB, $rA), VRRC))>;
3577 }
3578 let Predicates = [IsISA3_0, HasP9Vector, HasDirectMove, IsLittleEndian] in {
3579 def : Pat<(f128 (PPCbuild_fp128 i64:$rA, i64:$rB)),
3580 (f128 (COPY_TO_REGCLASS (MTVSRDD $rB, $rA), VRRC))>;
3581 }
3582}
3583
Zaara Syedafcd96972017-09-21 16:12:33 +00003584let Predicates = [HasP9Vector] in {
Jinsong Jic7b43b92018-12-13 15:12:57 +00003585 let mayStore = 1 in {
3586 def SPILLTOVSR_STX : PseudoXFormMemOp<(outs),
3587 (ins spilltovsrrc:$XT, memrr:$dst),
3588 "#SPILLTOVSR_STX", []>;
3589 def SPILLTOVSR_ST : PPCPostRAExpPseudo<(outs), (ins spilltovsrrc:$XT, memrix:$dst),
3590 "#SPILLTOVSR_ST", []>;
3591 }
3592 let mayLoad = 1 in {
3593 def SPILLTOVSR_LDX : PseudoXFormMemOp<(outs spilltovsrrc:$XT),
3594 (ins memrr:$src),
3595 "#SPILLTOVSR_LDX", []>;
3596 def SPILLTOVSR_LD : PPCPostRAExpPseudo<(outs spilltovsrrc:$XT), (ins memrix:$src),
3597 "#SPILLTOVSR_LD", []>;
Zaara Syedafcd96972017-09-21 16:12:33 +00003598
Zaara Syedafcd96972017-09-21 16:12:33 +00003599 }
3600}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003601// Integer extend helper dags 32 -> 64
3602def AnyExts {
3603 dag A = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $A, sub_32);
3604 dag B = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $B, sub_32);
3605 dag C = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $C, sub_32);
3606 dag D = (INSERT_SUBREG (i64 (IMPLICIT_DEF)), $D, sub_32);
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00003607}
3608
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003609def DblToFlt {
3610 dag A0 = (f32 (fpround (f64 (extractelt v2f64:$A, 0))));
3611 dag A1 = (f32 (fpround (f64 (extractelt v2f64:$A, 1))));
3612 dag B0 = (f32 (fpround (f64 (extractelt v2f64:$B, 0))));
3613 dag B1 = (f32 (fpround (f64 (extractelt v2f64:$B, 1))));
3614}
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003615
Nemanja Ivanovice1a525e2018-08-02 00:03:22 +00003616def ExtDbl {
3617 dag A0S = (i32 (PPCmfvsr (f64 (PPCfctiwz (f64 (extractelt v2f64:$A, 0))))));
3618 dag A1S = (i32 (PPCmfvsr (f64 (PPCfctiwz (f64 (extractelt v2f64:$A, 1))))));
3619 dag B0S = (i32 (PPCmfvsr (f64 (PPCfctiwz (f64 (extractelt v2f64:$B, 0))))));
3620 dag B1S = (i32 (PPCmfvsr (f64 (PPCfctiwz (f64 (extractelt v2f64:$B, 1))))));
3621 dag A0U = (i32 (PPCmfvsr (f64 (PPCfctiwuz (f64 (extractelt v2f64:$A, 0))))));
3622 dag A1U = (i32 (PPCmfvsr (f64 (PPCfctiwuz (f64 (extractelt v2f64:$A, 1))))));
3623 dag B0U = (i32 (PPCmfvsr (f64 (PPCfctiwuz (f64 (extractelt v2f64:$B, 0))))));
3624 dag B1U = (i32 (PPCmfvsr (f64 (PPCfctiwuz (f64 (extractelt v2f64:$B, 1))))));
3625}
3626
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003627def ByteToWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00003628 dag LE_A0 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 0)), i8));
3629 dag LE_A1 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 4)), i8));
3630 dag LE_A2 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 8)), i8));
3631 dag LE_A3 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 12)), i8));
3632 dag BE_A0 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 3)), i8));
3633 dag BE_A1 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 7)), i8));
3634 dag BE_A2 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 11)), i8));
3635 dag BE_A3 = (i32 (sext_inreg (i32 (vector_extract v16i8:$A, 15)), i8));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003636}
3637
3638def ByteToDWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00003639 dag LE_A0 = (i64 (sext_inreg
3640 (i64 (anyext (i32 (vector_extract v16i8:$A, 0)))), i8));
3641 dag LE_A1 = (i64 (sext_inreg
3642 (i64 (anyext (i32 (vector_extract v16i8:$A, 8)))), i8));
3643 dag BE_A0 = (i64 (sext_inreg
3644 (i64 (anyext (i32 (vector_extract v16i8:$A, 7)))), i8));
3645 dag BE_A1 = (i64 (sext_inreg
3646 (i64 (anyext (i32 (vector_extract v16i8:$A, 15)))), i8));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003647}
3648
3649def HWordToWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00003650 dag LE_A0 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 0)), i16));
3651 dag LE_A1 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 2)), i16));
3652 dag LE_A2 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 4)), i16));
3653 dag LE_A3 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 6)), i16));
3654 dag BE_A0 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 1)), i16));
3655 dag BE_A1 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 3)), i16));
3656 dag BE_A2 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 5)), i16));
3657 dag BE_A3 = (i32 (sext_inreg (i32 (vector_extract v8i16:$A, 7)), i16));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003658}
3659
3660def HWordToDWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00003661 dag LE_A0 = (i64 (sext_inreg
3662 (i64 (anyext (i32 (vector_extract v8i16:$A, 0)))), i16));
3663 dag LE_A1 = (i64 (sext_inreg
3664 (i64 (anyext (i32 (vector_extract v8i16:$A, 4)))), i16));
3665 dag BE_A0 = (i64 (sext_inreg
3666 (i64 (anyext (i32 (vector_extract v8i16:$A, 3)))), i16));
3667 dag BE_A1 = (i64 (sext_inreg
3668 (i64 (anyext (i32 (vector_extract v8i16:$A, 7)))), i16));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003669}
3670
3671def WordToDWord {
Tony Jiang9a91a182017-07-05 16:00:38 +00003672 dag LE_A0 = (i64 (sext (i32 (vector_extract v4i32:$A, 0))));
3673 dag LE_A1 = (i64 (sext (i32 (vector_extract v4i32:$A, 2))));
3674 dag BE_A0 = (i64 (sext (i32 (vector_extract v4i32:$A, 1))));
3675 dag BE_A1 = (i64 (sext (i32 (vector_extract v4i32:$A, 3))));
Zaara Syeda79acbbe2017-06-08 17:14:36 +00003676}
3677
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003678def FltToIntLoad {
3679 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (extloadf32 xoaddr:$A)))));
3680}
3681def FltToUIntLoad {
3682 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (extloadf32 xoaddr:$A)))));
3683}
3684def FltToLongLoad {
3685 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (extloadf32 xoaddr:$A)))));
3686}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003687def FltToLongLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003688 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (extloadf32 ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003689}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003690def FltToULongLoad {
3691 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (extloadf32 xoaddr:$A)))));
3692}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003693def FltToULongLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003694 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (extloadf32 ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003695}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003696def FltToLong {
Lei Huangcd4f3852018-03-12 19:26:18 +00003697 dag A = (i64 (PPCmfvsr (f64 (PPCfctidz (fpextend f32:$A)))));
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003698}
3699def FltToULong {
Lei Huangcd4f3852018-03-12 19:26:18 +00003700 dag A = (i64 (PPCmfvsr (f64 (PPCfctiduz (fpextend f32:$A)))));
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003701}
3702def DblToInt {
3703 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwz f64:$A))));
Nemanja Ivanovice1a525e2018-08-02 00:03:22 +00003704 dag B = (i32 (PPCmfvsr (f64 (PPCfctiwz f64:$B))));
3705 dag C = (i32 (PPCmfvsr (f64 (PPCfctiwz f64:$C))));
3706 dag D = (i32 (PPCmfvsr (f64 (PPCfctiwz f64:$D))));
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003707}
3708def DblToUInt {
3709 dag A = (i32 (PPCmfvsr (f64 (PPCfctiwuz f64:$A))));
Nemanja Ivanovice1a525e2018-08-02 00:03:22 +00003710 dag B = (i32 (PPCmfvsr (f64 (PPCfctiwuz f64:$B))));
3711 dag C = (i32 (PPCmfvsr (f64 (PPCfctiwuz f64:$C))));
3712 dag D = (i32 (PPCmfvsr (f64 (PPCfctiwuz f64:$D))));
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003713}
3714def DblToLong {
3715 dag A = (i64 (PPCmfvsr (f64 (PPCfctidz f64:$A))));
3716}
3717def DblToULong {
3718 dag A = (i64 (PPCmfvsr (f64 (PPCfctiduz f64:$A))));
3719}
3720def DblToIntLoad {
3721 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (load xoaddr:$A)))));
3722}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003723def DblToIntLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003724 dag A = (i32 (PPCmfvsr (PPCfctiwz (f64 (load ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003725}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003726def DblToUIntLoad {
3727 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (load xoaddr:$A)))));
3728}
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003729def DblToUIntLoadP9 {
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00003730 dag A = (i32 (PPCmfvsr (PPCfctiwuz (f64 (load ixaddr:$A)))));
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00003731}
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003732def DblToLongLoad {
3733 dag A = (i64 (PPCmfvsr (PPCfctidz (f64 (load xoaddr:$A)))));
3734}
3735def DblToULongLoad {
3736 dag A = (i64 (PPCmfvsr (PPCfctiduz (f64 (load xoaddr:$A)))));
3737}
3738
3739// FP merge dags (for f32 -> v4f32)
3740def MrgFP {
3741 dag AC = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $A, VSRC),
3742 (COPY_TO_REGCLASS $C, VSRC), 0));
3743 dag BD = (XVCVDPSP (XXPERMDI (COPY_TO_REGCLASS $B, VSRC),
3744 (COPY_TO_REGCLASS $D, VSRC), 0));
3745 dag ABhToFlt = (XVCVDPSP (XXPERMDI $A, $B, 0));
3746 dag ABlToFlt = (XVCVDPSP (XXPERMDI $A, $B, 3));
3747 dag BAhToFlt = (XVCVDPSP (XXPERMDI $B, $A, 0));
3748 dag BAlToFlt = (XVCVDPSP (XXPERMDI $B, $A, 3));
3749}
3750
Nemanja Ivanovice1a525e2018-08-02 00:03:22 +00003751// Word-element merge dags - conversions from f64 to i32 merged into vectors.
3752def MrgWords {
3753 // For big endian, we merge low and hi doublewords (A, B).
3754 dag A0B0 = (v2f64 (XXPERMDI v2f64:$A, v2f64:$B, 0));
3755 dag A1B1 = (v2f64 (XXPERMDI v2f64:$A, v2f64:$B, 3));
3756 dag CVA1B1S = (v4i32 (XVCVDPSXWS A1B1));
3757 dag CVA0B0S = (v4i32 (XVCVDPSXWS A0B0));
3758 dag CVA1B1U = (v4i32 (XVCVDPUXWS A1B1));
3759 dag CVA0B0U = (v4i32 (XVCVDPUXWS A0B0));
3760
3761 // For little endian, we merge low and hi doublewords (B, A).
3762 dag B1A1 = (v2f64 (XXPERMDI v2f64:$B, v2f64:$A, 0));
3763 dag B0A0 = (v2f64 (XXPERMDI v2f64:$B, v2f64:$A, 3));
3764 dag CVB1A1S = (v4i32 (XVCVDPSXWS B1A1));
3765 dag CVB0A0S = (v4i32 (XVCVDPSXWS B0A0));
3766 dag CVB1A1U = (v4i32 (XVCVDPUXWS B1A1));
3767 dag CVB0A0U = (v4i32 (XVCVDPUXWS B0A0));
3768
3769 // For big endian, we merge hi doublewords of (A, C) and (B, D), convert
3770 // then merge.
3771 dag AC = (v2f64 (XXPERMDI (COPY_TO_REGCLASS f64:$A, VSRC),
3772 (COPY_TO_REGCLASS f64:$C, VSRC), 0));
3773 dag BD = (v2f64 (XXPERMDI (COPY_TO_REGCLASS f64:$B, VSRC),
3774 (COPY_TO_REGCLASS f64:$D, VSRC), 0));
3775 dag CVACS = (v4i32 (XVCVDPSXWS AC));
3776 dag CVBDS = (v4i32 (XVCVDPSXWS BD));
3777 dag CVACU = (v4i32 (XVCVDPUXWS AC));
3778 dag CVBDU = (v4i32 (XVCVDPUXWS BD));
3779
3780 // For little endian, we merge hi doublewords of (D, B) and (C, A), convert
3781 // then merge.
3782 dag DB = (v2f64 (XXPERMDI (COPY_TO_REGCLASS f64:$D, VSRC),
3783 (COPY_TO_REGCLASS f64:$B, VSRC), 0));
3784 dag CA = (v2f64 (XXPERMDI (COPY_TO_REGCLASS f64:$C, VSRC),
3785 (COPY_TO_REGCLASS f64:$A, VSRC), 0));
3786 dag CVDBS = (v4i32 (XVCVDPSXWS DB));
3787 dag CVCAS = (v4i32 (XVCVDPSXWS CA));
3788 dag CVDBU = (v4i32 (XVCVDPUXWS DB));
3789 dag CVCAU = (v4i32 (XVCVDPUXWS CA));
3790}
3791
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003792// Patterns for BUILD_VECTOR nodes.
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003793let AddedComplexity = 400 in {
3794
3795 let Predicates = [HasVSX] in {
3796 // Build vectors of floating point converted to i32.
3797 def : Pat<(v4i32 (build_vector DblToInt.A, DblToInt.A,
3798 DblToInt.A, DblToInt.A)),
3799 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPSXWS $A), VSRC), 1))>;
3800 def : Pat<(v4i32 (build_vector DblToUInt.A, DblToUInt.A,
3801 DblToUInt.A, DblToUInt.A)),
3802 (v4i32 (XXSPLTW (COPY_TO_REGCLASS (XSCVDPUXWS $A), VSRC), 1))>;
3803 def : Pat<(v2i64 (build_vector DblToLong.A, DblToLong.A)),
3804 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC),
3805 (COPY_TO_REGCLASS (XSCVDPSXDS $A), VSRC), 0))>;
3806 def : Pat<(v2i64 (build_vector DblToULong.A, DblToULong.A)),
3807 (v2i64 (XXPERMDI (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC),
3808 (COPY_TO_REGCLASS (XSCVDPUXDS $A), VSRC), 0))>;
3809 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
3810 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003811 (XSCVDPSXWSs (XFLOADf32 xoaddr:$A)), VSRC), 1))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003812 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
3813 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003814 (XSCVDPUXWSs (XFLOADf32 xoaddr:$A)), VSRC), 1))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003815 def : Pat<(v4f32 (build_vector f32:$A, f32:$A, f32:$A, f32:$A)),
3816 (v4f32 (XXSPLTW (v4f32 (XSCVDPSPN $A)), 0))>;
3817
3818 // Build vectors of floating point converted to i64.
3819 def : Pat<(v2i64 (build_vector FltToLong.A, FltToLong.A)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00003820 (v2i64 (XXPERMDIs
3821 (COPY_TO_REGCLASS (XSCVDPSXDSs $A), VSFRC), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003822 def : Pat<(v2i64 (build_vector FltToULong.A, FltToULong.A)),
Nemanja Ivanovic15748f42016-12-06 11:47:14 +00003823 (v2i64 (XXPERMDIs
3824 (COPY_TO_REGCLASS (XSCVDPUXDSs $A), VSFRC), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003825 def : Pat<(v2i64 (scalar_to_vector DblToLongLoad.A)),
3826 (v2i64 (XVCVDPSXDS (LXVDSX xoaddr:$A)))>;
3827 def : Pat<(v2i64 (scalar_to_vector DblToULongLoad.A)),
3828 (v2i64 (XVCVDPUXDS (LXVDSX xoaddr:$A)))>;
3829 }
3830
3831 let Predicates = [HasVSX, NoP9Vector] in {
Tony Jiang438bf4a2017-11-20 14:38:30 +00003832 // Load-and-splat with fp-to-int conversion (using X-Form VSX/FP loads).
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003833 def : Pat<(v4i32 (scalar_to_vector DblToIntLoad.A)),
3834 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003835 (XSCVDPSXWS (XFLOADf64 xoaddr:$A)), VSRC), 1))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003836 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoad.A)),
3837 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003838 (XSCVDPUXWS (XFLOADf64 xoaddr:$A)), VSRC), 1))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003839 def : Pat<(v2i64 (scalar_to_vector FltToLongLoad.A)),
3840 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003841 (XFLOADf32 xoaddr:$A), VSFRC)), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003842 def : Pat<(v2i64 (scalar_to_vector FltToULongLoad.A)),
3843 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
Tony Jiang438bf4a2017-11-20 14:38:30 +00003844 (XFLOADf32 xoaddr:$A), VSFRC)), 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003845 }
3846
Nemanja Ivanovic0f7715a2018-12-29 13:40:48 +00003847 let Predicates = [IsBigEndian, HasP8Vector] in {
3848 def : Pat<DWToSPExtractConv.BVU,
3849 (v4f32 (VPKUDUM (XXSLDWI (XVCVUXDSP $S1), (XVCVUXDSP $S1), 3),
3850 (XXSLDWI (XVCVUXDSP $S2), (XVCVUXDSP $S2), 3)))>;
3851 def : Pat<DWToSPExtractConv.BVS,
3852 (v4f32 (VPKUDUM (XXSLDWI (XVCVSXDSP $S1), (XVCVSXDSP $S1), 3),
3853 (XXSLDWI (XVCVSXDSP $S2), (XVCVSXDSP $S2), 3)))>;
Nemanja Ivanovicb9b75de2019-01-24 23:44:28 +00003854 def : Pat<(store (i32 (extractelt v4i32:$A, 1)), xoaddr:$src),
3855 (STIWX (EXTRACT_SUBREG $A, sub_64), xoaddr:$src)>;
3856 def : Pat<(store (f32 (extractelt v4f32:$A, 1)), xoaddr:$src),
3857 (STIWX (EXTRACT_SUBREG $A, sub_64), xoaddr:$src)>;
3858
3859 // Elements in a register on a BE system are in order <0, 1, 2, 3>.
3860 // The store instructions store the second word from the left.
3861 // So to align element zero, we need to modulo-left-shift by 3 words.
3862 // Similar logic applies for elements 2 and 3.
3863 foreach Idx = [ [0,3], [2,1], [3,2] ] in {
3864 def : Pat<(store (i32 (extractelt v4i32:$A, !head(Idx))), xoaddr:$src),
3865 (STIWX (EXTRACT_SUBREG (XXSLDWI $A, $A, !head(!tail(Idx))),
3866 sub_64), xoaddr:$src)>;
3867 def : Pat<(store (f32 (extractelt v4f32:$A, !head(Idx))), xoaddr:$src),
3868 (STIWX (EXTRACT_SUBREG (XXSLDWI $A, $A, !head(!tail(Idx))),
3869 sub_64), xoaddr:$src)>;
3870 }
Nemanja Ivanovic0f7715a2018-12-29 13:40:48 +00003871 }
3872
Nemanja Ivanovicb9b75de2019-01-24 23:44:28 +00003873 let Predicates = [HasP8Vector, IsBigEndian, NoP9Vector] in {
3874 def : Pat<(store (i64 (extractelt v2i64:$A, 0)), xoaddr:$src),
3875 (XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xoaddr:$src)>;
3876 def : Pat<(store (f64 (extractelt v2f64:$A, 0)), xoaddr:$src),
3877 (XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xoaddr:$src)>;
3878 def : Pat<(store (i64 (extractelt v2i64:$A, 1)), xoaddr:$src),
3879 (XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2), sub_64),
3880 xoaddr:$src)>;
3881 def : Pat<(store (f64 (extractelt v2f64:$A, 1)), xoaddr:$src),
3882 (XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2), sub_64),
3883 xoaddr:$src)>;
3884 }
3885
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003886 // Big endian, available on all targets with VSX
3887 let Predicates = [IsBigEndian, HasVSX] in {
3888 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
3889 (v2f64 (XXPERMDI
3890 (COPY_TO_REGCLASS $A, VSRC),
3891 (COPY_TO_REGCLASS $B, VSRC), 0))>;
3892
3893 def : Pat<(v4f32 (build_vector f32:$A, f32:$B, f32:$C, f32:$D)),
3894 (VMRGEW MrgFP.AC, MrgFP.BD)>;
3895 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
3896 DblToFlt.B0, DblToFlt.B1)),
3897 (v4f32 (VMRGEW MrgFP.ABhToFlt, MrgFP.ABlToFlt))>;
Nemanja Ivanovice1a525e2018-08-02 00:03:22 +00003898
3899 // Convert 4 doubles to a vector of ints.
3900 def : Pat<(v4i32 (build_vector DblToInt.A, DblToInt.B,
3901 DblToInt.C, DblToInt.D)),
3902 (v4i32 (VMRGEW MrgWords.CVACS, MrgWords.CVBDS))>;
3903 def : Pat<(v4i32 (build_vector DblToUInt.A, DblToUInt.B,
3904 DblToUInt.C, DblToUInt.D)),
3905 (v4i32 (VMRGEW MrgWords.CVACU, MrgWords.CVBDU))>;
3906 def : Pat<(v4i32 (build_vector ExtDbl.A0S, ExtDbl.A1S,
3907 ExtDbl.B0S, ExtDbl.B1S)),
3908 (v4i32 (VMRGEW MrgWords.CVA0B0S, MrgWords.CVA1B1S))>;
3909 def : Pat<(v4i32 (build_vector ExtDbl.A0U, ExtDbl.A1U,
3910 ExtDbl.B0U, ExtDbl.B1U)),
3911 (v4i32 (VMRGEW MrgWords.CVA0B0U, MrgWords.CVA1B1U))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003912 }
3913
Nemanja Ivanovic0f7715a2018-12-29 13:40:48 +00003914 let Predicates = [IsLittleEndian, HasP8Vector] in {
3915 def : Pat<DWToSPExtractConv.BVU,
3916 (v4f32 (VPKUDUM (XXSLDWI (XVCVUXDSP $S2), (XVCVUXDSP $S2), 3),
3917 (XXSLDWI (XVCVUXDSP $S1), (XVCVUXDSP $S1), 3)))>;
3918 def : Pat<DWToSPExtractConv.BVS,
3919 (v4f32 (VPKUDUM (XXSLDWI (XVCVSXDSP $S2), (XVCVSXDSP $S2), 3),
3920 (XXSLDWI (XVCVSXDSP $S1), (XVCVSXDSP $S1), 3)))>;
Nemanja Ivanovicb9b75de2019-01-24 23:44:28 +00003921 def : Pat<(store (i32 (extractelt v4i32:$A, 2)), xoaddr:$src),
3922 (STIWX (EXTRACT_SUBREG $A, sub_64), xoaddr:$src)>;
3923 def : Pat<(store (f32 (extractelt v4f32:$A, 2)), xoaddr:$src),
3924 (STIWX (EXTRACT_SUBREG $A, sub_64), xoaddr:$src)>;
3925
3926 // Elements in a register on a LE system are in order <3, 2, 1, 0>.
3927 // The store instructions store the second word from the left.
3928 // So to align element 3, we need to modulo-left-shift by 3 words.
3929 // Similar logic applies for elements 0 and 1.
3930 foreach Idx = [ [0,2], [1,1], [3,3] ] in {
3931 def : Pat<(store (i32 (extractelt v4i32:$A, !head(Idx))), xoaddr:$src),
3932 (STIWX (EXTRACT_SUBREG (XXSLDWI $A, $A, !head(!tail(Idx))),
3933 sub_64), xoaddr:$src)>;
3934 def : Pat<(store (f32 (extractelt v4f32:$A, !head(Idx))), xoaddr:$src),
3935 (STIWX (EXTRACT_SUBREG (XXSLDWI $A, $A, !head(!tail(Idx))),
3936 sub_64), xoaddr:$src)>;
3937 }
Nemanja Ivanovic0f7715a2018-12-29 13:40:48 +00003938 }
3939
Nemanja Ivanovicb9b75de2019-01-24 23:44:28 +00003940 let Predicates = [HasP8Vector, IsLittleEndian, NoP9Vector] in {
3941 def : Pat<(store (i64 (extractelt v2i64:$A, 0)), xoaddr:$src),
3942 (XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2), sub_64),
3943 xoaddr:$src)>;
3944 def : Pat<(store (f64 (extractelt v2f64:$A, 0)), xoaddr:$src),
3945 (XFSTOREf64 (EXTRACT_SUBREG (XXPERMDI $A, $A, 2), sub_64),
3946 xoaddr:$src)>;
3947 def : Pat<(store (i64 (extractelt v2i64:$A, 1)), xoaddr:$src),
3948 (XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xoaddr:$src)>;
3949 def : Pat<(store (f64 (extractelt v2f64:$A, 1)), xoaddr:$src),
3950 (XFSTOREf64 (EXTRACT_SUBREG $A, sub_64), xoaddr:$src)>;
3951 }
3952
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003953 let Predicates = [IsLittleEndian, HasVSX] in {
3954 // Little endian, available on all targets with VSX
3955 def : Pat<(v2f64 (build_vector f64:$A, f64:$B)),
3956 (v2f64 (XXPERMDI
3957 (COPY_TO_REGCLASS $B, VSRC),
3958 (COPY_TO_REGCLASS $A, VSRC), 0))>;
3959
3960 def : Pat<(v4f32 (build_vector f32:$D, f32:$C, f32:$B, f32:$A)),
3961 (VMRGEW MrgFP.AC, MrgFP.BD)>;
3962 def : Pat<(v4f32 (build_vector DblToFlt.A0, DblToFlt.A1,
3963 DblToFlt.B0, DblToFlt.B1)),
3964 (v4f32 (VMRGEW MrgFP.BAhToFlt, MrgFP.BAlToFlt))>;
Nemanja Ivanovice1a525e2018-08-02 00:03:22 +00003965
3966 // Convert 4 doubles to a vector of ints.
3967 def : Pat<(v4i32 (build_vector DblToInt.A, DblToInt.B,
3968 DblToInt.C, DblToInt.D)),
3969 (v4i32 (VMRGEW MrgWords.CVDBS, MrgWords.CVCAS))>;
3970 def : Pat<(v4i32 (build_vector DblToUInt.A, DblToUInt.B,
3971 DblToUInt.C, DblToUInt.D)),
3972 (v4i32 (VMRGEW MrgWords.CVDBU, MrgWords.CVCAU))>;
3973 def : Pat<(v4i32 (build_vector ExtDbl.A0S, ExtDbl.A1S,
3974 ExtDbl.B0S, ExtDbl.B1S)),
3975 (v4i32 (VMRGEW MrgWords.CVB1A1S, MrgWords.CVB0A0S))>;
3976 def : Pat<(v4i32 (build_vector ExtDbl.A0U, ExtDbl.A1U,
3977 ExtDbl.B0U, ExtDbl.B1U)),
3978 (v4i32 (VMRGEW MrgWords.CVB1A1U, MrgWords.CVB0A0U))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00003979 }
3980
3981 let Predicates = [HasDirectMove] in {
3982 // Endianness-neutral constant splat on P8 and newer targets. The reason
3983 // for this pattern is that on targets with direct moves, we don't expand
3984 // BUILD_VECTOR nodes for v4i32.
3985 def : Pat<(v4i32 (build_vector immSExt5NonZero:$A, immSExt5NonZero:$A,
3986 immSExt5NonZero:$A, immSExt5NonZero:$A)),
3987 (v4i32 (VSPLTISW imm:$A))>;
3988 }
3989
3990 let Predicates = [IsBigEndian, HasDirectMove, NoP9Vector] in {
3991 // Big endian integer vectors using direct moves.
3992 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
3993 (v2i64 (XXPERMDI
3994 (COPY_TO_REGCLASS (MTVSRD $A), VSRC),
3995 (COPY_TO_REGCLASS (MTVSRD $B), VSRC), 0))>;
3996 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
Lei Huangde208432018-10-26 18:09:36 +00003997 (XXPERMDI
3998 (COPY_TO_REGCLASS
3999 (MTVSRD (RLDIMI AnyExts.B, AnyExts.A, 32, 0)), VSRC),
4000 (COPY_TO_REGCLASS
4001 (MTVSRD (RLDIMI AnyExts.D, AnyExts.C, 32, 0)), VSRC), 0)>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00004002 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
4003 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
4004 }
4005
4006 let Predicates = [IsLittleEndian, HasDirectMove, NoP9Vector] in {
4007 // Little endian integer vectors using direct moves.
4008 def : Pat<(v2i64 (build_vector i64:$A, i64:$B)),
4009 (v2i64 (XXPERMDI
4010 (COPY_TO_REGCLASS (MTVSRD $B), VSRC),
4011 (COPY_TO_REGCLASS (MTVSRD $A), VSRC), 0))>;
4012 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
Lei Huangde208432018-10-26 18:09:36 +00004013 (XXPERMDI
4014 (COPY_TO_REGCLASS
4015 (MTVSRD (RLDIMI AnyExts.C, AnyExts.D, 32, 0)), VSRC),
4016 (COPY_TO_REGCLASS
4017 (MTVSRD (RLDIMI AnyExts.A, AnyExts.B, 32, 0)), VSRC), 0)>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00004018 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
4019 (XXSPLTW (COPY_TO_REGCLASS (MTVSRWZ $A), VSRC), 1)>;
4020 }
4021
4022 let Predicates = [HasP9Vector] in {
4023 // Endianness-neutral patterns for const splats with ISA 3.0 instructions.
4024 def : Pat<(v4i32 (scalar_to_vector i32:$A)),
4025 (v4i32 (MTVSRWS $A))>;
4026 def : Pat<(v4i32 (build_vector i32:$A, i32:$A, i32:$A, i32:$A)),
4027 (v4i32 (MTVSRWS $A))>;
Nemanja Ivanovic552c8e92016-12-15 11:16:20 +00004028 def : Pat<(v16i8 (build_vector immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
4029 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
4030 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
4031 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
4032 immAnyExt8:$A, immAnyExt8:$A, immAnyExt8:$A,
4033 immAnyExt8:$A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00004034 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB imm:$A), VSRC))>;
4035 def : Pat<(v16i8 immAllOnesV),
4036 (v16i8 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
4037 def : Pat<(v8i16 immAllOnesV),
4038 (v8i16 (COPY_TO_REGCLASS (XXSPLTIB 255), VSRC))>;
4039 def : Pat<(v4i32 immAllOnesV),
4040 (v4i32 (XXSPLTIB 255))>;
4041 def : Pat<(v2i64 immAllOnesV),
4042 (v2i64 (XXSPLTIB 255))>;
4043 def : Pat<(v4i32 (scalar_to_vector FltToIntLoad.A)),
4044 (v4i32 (XVCVSPSXWS (LXVWSX xoaddr:$A)))>;
4045 def : Pat<(v4i32 (scalar_to_vector FltToUIntLoad.A)),
4046 (v4i32 (XVCVSPUXWS (LXVWSX xoaddr:$A)))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00004047 def : Pat<(v4i32 (scalar_to_vector DblToIntLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00004048 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00004049 (XSCVDPSXWS (DFLOADf64 ixaddr:$A)), VSRC), 1))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00004050 def : Pat<(v4i32 (scalar_to_vector DblToUIntLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00004051 (v4i32 (XXSPLTW (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00004052 (XSCVDPUXWS (DFLOADf64 ixaddr:$A)), VSRC), 1))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00004053 def : Pat<(v2i64 (scalar_to_vector FltToLongLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00004054 (v2i64 (XXPERMDIs (XSCVDPSXDS (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00004055 (DFLOADf32 ixaddr:$A),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00004056 VSFRC)), 0))>;
Hiroshi Inouee3c14eb2017-05-29 07:12:39 +00004057 def : Pat<(v2i64 (scalar_to_vector FltToULongLoadP9.A)),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00004058 (v2i64 (XXPERMDIs (XSCVDPUXDS (COPY_TO_REGCLASS
Nemanja Ivanovic3c7e276d2017-07-13 18:17:10 +00004059 (DFLOADf32 ixaddr:$A),
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00004060 VSFRC)), 0))>;
4061 }
4062
4063 let Predicates = [IsISA3_0, HasDirectMove, IsBigEndian] in {
4064 def : Pat<(i64 (extractelt v2i64:$A, 1)),
4065 (i64 (MFVSRLD $A))>;
4066 // Better way to build integer vectors if we have MTVSRDD. Big endian.
4067 def : Pat<(v2i64 (build_vector i64:$rB, i64:$rA)),
4068 (v2i64 (MTVSRDD $rB, $rA))>;
4069 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
Lei Huangde208432018-10-26 18:09:36 +00004070 (MTVSRDD
4071 (RLDIMI AnyExts.B, AnyExts.A, 32, 0),
4072 (RLDIMI AnyExts.D, AnyExts.C, 32, 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00004073 }
4074
4075 let Predicates = [IsISA3_0, HasDirectMove, IsLittleEndian] in {
4076 def : Pat<(i64 (extractelt v2i64:$A, 0)),
4077 (i64 (MFVSRLD $A))>;
4078 // Better way to build integer vectors if we have MTVSRDD. Little endian.
4079 def : Pat<(v2i64 (build_vector i64:$rA, i64:$rB)),
4080 (v2i64 (MTVSRDD $rB, $rA))>;
4081 def : Pat<(v4i32 (build_vector i32:$A, i32:$B, i32:$C, i32:$D)),
Lei Huangde208432018-10-26 18:09:36 +00004082 (MTVSRDD
4083 (RLDIMI AnyExts.C, AnyExts.D, 32, 0),
4084 (RLDIMI AnyExts.A, AnyExts.B, 32, 0))>;
Nemanja Ivanovicdf1cb522016-11-29 16:11:34 +00004085 }
Zaara Syeda79acbbe2017-06-08 17:14:36 +00004086 // P9 Altivec instructions that can be used to build vectors.
4087 // Adding them to PPCInstrVSX.td rather than PPCAltivecVSX.td to compete
4088 // with complexities of existing build vector patterns in this file.
Tony Jiang9a91a182017-07-05 16:00:38 +00004089 let Predicates = [HasP9Altivec, IsLittleEndian] in {
4090 def : Pat<(v2i64 (build_vector WordToDWord.LE_A0, WordToDWord.LE_A1)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00004091 (v2i64 (VEXTSW2D $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00004092 def : Pat<(v2i64 (build_vector HWordToDWord.LE_A0, HWordToDWord.LE_A1)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00004093 (v2i64 (VEXTSH2D $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00004094 def : Pat<(v4i32 (build_vector HWordToWord.LE_A0, HWordToWord.LE_A1,
4095 HWordToWord.LE_A2, HWordToWord.LE_A3)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00004096 (v4i32 (VEXTSH2W $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00004097 def : Pat<(v4i32 (build_vector ByteToWord.LE_A0, ByteToWord.LE_A1,
4098 ByteToWord.LE_A2, ByteToWord.LE_A3)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00004099 (v4i32 (VEXTSB2W $A))>;
Tony Jiang9a91a182017-07-05 16:00:38 +00004100 def : Pat<(v2i64 (build_vector ByteToDWord.LE_A0, ByteToDWord.LE_A1)),
Zaara Syeda79acbbe2017-06-08 17:14:36 +00004101 (v2i64 (VEXTSB2D $A))>;
4102 }
Tony Jiang9a91a182017-07-05 16:00:38 +00004103
4104 let Predicates = [HasP9Altivec, IsBigEndian] in {
4105 def : Pat<(v2i64 (build_vector WordToDWord.BE_A0, WordToDWord.BE_A1)),
4106 (v2i64 (VEXTSW2D $A))>;
4107 def : Pat<(v2i64 (build_vector HWordToDWord.BE_A0, HWordToDWord.BE_A1)),
4108 (v2i64 (VEXTSH2D $A))>;
4109 def : Pat<(v4i32 (build_vector HWordToWord.BE_A0, HWordToWord.BE_A1,
4110 HWordToWord.BE_A2, HWordToWord.BE_A3)),
4111 (v4i32 (VEXTSH2W $A))>;
4112 def : Pat<(v4i32 (build_vector ByteToWord.BE_A0, ByteToWord.BE_A1,
4113 ByteToWord.BE_A2, ByteToWord.BE_A3)),
4114 (v4i32 (VEXTSB2W $A))>;
4115 def : Pat<(v2i64 (build_vector ByteToDWord.BE_A0, ByteToDWord.BE_A1)),
4116 (v2i64 (VEXTSB2D $A))>;
4117 }
4118
4119 let Predicates = [HasP9Altivec] in {
4120 def: Pat<(v2i64 (PPCSExtVElems v16i8:$A)),
4121 (v2i64 (VEXTSB2D $A))>;
4122 def: Pat<(v2i64 (PPCSExtVElems v8i16:$A)),
4123 (v2i64 (VEXTSH2D $A))>;
4124 def: Pat<(v2i64 (PPCSExtVElems v4i32:$A)),
4125 (v2i64 (VEXTSW2D $A))>;
4126 def: Pat<(v4i32 (PPCSExtVElems v16i8:$A)),
4127 (v4i32 (VEXTSB2W $A))>;
4128 def: Pat<(v4i32 (PPCSExtVElems v8i16:$A)),
4129 (v4i32 (VEXTSH2W $A))>;
4130 }
Nemanja Ivanovicd2c3c512016-09-23 13:25:31 +00004131}
Zaara Syedab2595b92018-08-08 15:20:43 +00004132
Kewen Lin3dac12522018-12-18 03:16:43 +00004133// Put this P9Altivec related definition here since it's possible to be
4134// selected to VSX instruction xvnegsp, avoid possible undef.
4135let Predicates = [HasP9Altivec] in {
4136
4137 def : Pat<(v4i32 (PPCvabsd v4i32:$A, v4i32:$B, (i32 0))),
4138 (v4i32 (VABSDUW $A, $B))>;
4139
4140 def : Pat<(v8i16 (PPCvabsd v8i16:$A, v8i16:$B, (i32 0))),
4141 (v8i16 (VABSDUH $A, $B))>;
4142
4143 def : Pat<(v16i8 (PPCvabsd v16i8:$A, v16i8:$B, (i32 0))),
4144 (v16i8 (VABSDUB $A, $B))>;
4145
4146 // As PPCVABSD description, the last operand indicates whether do the
4147 // sign bit flip.
4148 def : Pat<(v4i32 (PPCvabsd v4i32:$A, v4i32:$B, (i32 1))),
4149 (v4i32 (VABSDUW (XVNEGSP $A), (XVNEGSP $B)))>;
4150}