blob: 85a9fdfa7b9da6b62506275332ae25148a759c3b [file] [log] [blame]
Chris Lattnerb22a04d2006-03-25 07:51:43 +00001//===- PPCInstrAltivec.td - The PowerPC Altivec Extension --*- tablegen -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file was developed by Chris Lattner and is distributed under
6// the University of Illinois Open Source License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file describes the Altivec extension to the PowerPC instruction set.
11//
12//===----------------------------------------------------------------------===//
13
14//===----------------------------------------------------------------------===//
15// Altivec transformation functions and pattern fragments.
16//
17
Chris Lattner7ff7e672006-04-04 17:25:31 +000018// VSPLT*_get_imm xform function: convert vector_shuffle mask to VSPLT* imm.
19def VSPLTB_get_imm : SDNodeXForm<build_vector, [{
20 return getI32Imm(PPC::getVSPLTImmediate(N, 1));
Chris Lattnerb22a04d2006-03-25 07:51:43 +000021}]>;
Chris Lattner7ff7e672006-04-04 17:25:31 +000022def VSPLTB_shuffle_mask : PatLeaf<(build_vector), [{
23 return PPC::isSplatShuffleMask(N, 1);
24}], VSPLTB_get_imm>;
25def VSPLTH_get_imm : SDNodeXForm<build_vector, [{
26 return getI32Imm(PPC::getVSPLTImmediate(N, 2));
27}]>;
28def VSPLTH_shuffle_mask : PatLeaf<(build_vector), [{
29 return PPC::isSplatShuffleMask(N, 2);
30}], VSPLTH_get_imm>;
31def VSPLTW_get_imm : SDNodeXForm<build_vector, [{
32 return getI32Imm(PPC::getVSPLTImmediate(N, 4));
33}]>;
34def VSPLTW_shuffle_mask : PatLeaf<(build_vector), [{
35 return PPC::isSplatShuffleMask(N, 4);
36}], VSPLTW_get_imm>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +000037
Chris Lattnerb22a04d2006-03-25 07:51:43 +000038
39// VSPLTISB_get_imm xform function: convert build_vector to VSPLTISB imm.
40def VSPLTISB_get_imm : SDNodeXForm<build_vector, [{
41 char Val;
42 PPC::isVecSplatImm(N, 1, &Val);
43 return getI32Imm(Val);
44}]>;
45def vecspltisb : PatLeaf<(build_vector), [{
46 return PPC::isVecSplatImm(N, 1);
47}], VSPLTISB_get_imm>;
48
49// VSPLTISH_get_imm xform function: convert build_vector to VSPLTISH imm.
50def VSPLTISH_get_imm : SDNodeXForm<build_vector, [{
51 char Val;
52 PPC::isVecSplatImm(N, 2, &Val);
53 return getI32Imm(Val);
54}]>;
55def vecspltish : PatLeaf<(build_vector), [{
56 return PPC::isVecSplatImm(N, 2);
57}], VSPLTISH_get_imm>;
58
59// VSPLTISW_get_imm xform function: convert build_vector to VSPLTISW imm.
60def VSPLTISW_get_imm : SDNodeXForm<build_vector, [{
61 char Val;
62 PPC::isVecSplatImm(N, 4, &Val);
63 return getI32Imm(Val);
64}]>;
65def vecspltisw : PatLeaf<(build_vector), [{
66 return PPC::isVecSplatImm(N, 4);
67}], VSPLTISW_get_imm>;
68
Chris Lattnerb22a04d2006-03-25 07:51:43 +000069//===----------------------------------------------------------------------===//
Chris Lattner3c4f4e9f2006-03-30 23:21:27 +000070// Helpers for defining instructions that directly correspond to intrinsics.
71
Chris Lattner8768bf62006-03-30 23:39:06 +000072// VA1a_Int - A VAForm_1a intrinsic definition.
Chris Lattnerb5c4d172006-03-31 21:57:36 +000073class VA1a_Int<bits<6> xo, string opc, Intrinsic IntID>
74 : VAForm_1a<xo, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB, VRRC:$vC),
75 !strconcat(opc, " $vD, $vA, $vB, $vC"), VecFP,
Chris Lattner8768bf62006-03-30 23:39:06 +000076 [(set VRRC:$vD, (IntID VRRC:$vA, VRRC:$vB, VRRC:$vC))]>;
77
Chris Lattner3c4f4e9f2006-03-30 23:21:27 +000078// VX1_Int - A VXForm_1 intrinsic definition.
Chris Lattner6cea8142006-03-31 22:34:05 +000079class VX1_Int<bits<11> xo, string opc, Intrinsic IntID>
80 : VXForm_1<xo, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
81 !strconcat(opc, " $vD, $vA, $vB"), VecFP,
Chris Lattner3c4f4e9f2006-03-30 23:21:27 +000082 [(set VRRC:$vD, (IntID VRRC:$vA, VRRC:$vB))]>;
83
84// VX2_Int - A VXForm_2 intrinsic definition.
Chris Lattner6cea8142006-03-31 22:34:05 +000085class VX2_Int<bits<11> xo, string opc, Intrinsic IntID>
86 : VXForm_2<xo, (ops VRRC:$vD, VRRC:$vB),
87 !strconcat(opc, " $vD, $vB"), VecFP,
Chris Lattner3c4f4e9f2006-03-30 23:21:27 +000088 [(set VRRC:$vD, (IntID VRRC:$vB))]>;
89
90//===----------------------------------------------------------------------===//
Chris Lattnerb22a04d2006-03-25 07:51:43 +000091// Instruction Definitions.
92
93def IMPLICIT_DEF_VRRC : Pseudo<(ops VRRC:$rD), "; $rD = IMPLICIT_DEF_VRRC",
94 [(set VRRC:$rD, (v4f32 (undef)))]>;
95
96let isLoad = 1, PPC970_Unit = 2 in { // Loads.
97def LVEBX: XForm_1<31, 7, (ops VRRC:$vD, memrr:$src),
98 "lvebx $vD, $src", LdStGeneral,
Chris Lattnerecc219b2006-03-28 02:29:37 +000099 [(set VRRC:$vD, (int_ppc_altivec_lvebx xoaddr:$src))]>;
Chris Lattnere7d959c2006-03-26 00:41:48 +0000100def LVEHX: XForm_1<31, 39, (ops VRRC:$vD, memrr:$src),
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000101 "lvehx $vD, $src", LdStGeneral,
Chris Lattnerecc219b2006-03-28 02:29:37 +0000102 [(set VRRC:$vD, (int_ppc_altivec_lvehx xoaddr:$src))]>;
Chris Lattnere7d959c2006-03-26 00:41:48 +0000103def LVEWX: XForm_1<31, 71, (ops VRRC:$vD, memrr:$src),
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000104 "lvewx $vD, $src", LdStGeneral,
Chris Lattnerecc219b2006-03-28 02:29:37 +0000105 [(set VRRC:$vD, (int_ppc_altivec_lvewx xoaddr:$src))]>;
Chris Lattnere7d959c2006-03-26 00:41:48 +0000106def LVX : XForm_1<31, 103, (ops VRRC:$vD, memrr:$src),
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000107 "lvx $vD, $src", LdStGeneral,
Chris Lattnerecc219b2006-03-28 02:29:37 +0000108 [(set VRRC:$vD, (int_ppc_altivec_lvx xoaddr:$src))]>;
109def LVXL : XForm_1<31, 359, (ops VRRC:$vD, memrr:$src),
110 "lvxl $vD, $src", LdStGeneral,
111 [(set VRRC:$vD, (int_ppc_altivec_lvxl xoaddr:$src))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000112}
113
Chris Lattner30a6aba2006-03-30 23:07:36 +0000114def LVSL : XForm_1<31, 6, (ops VRRC:$vD, memrr:$src),
115 "lvsl $vD, $src", LdStGeneral,
116 [(set VRRC:$vD, (int_ppc_altivec_lvsl xoaddr:$src))]>,
117 PPC970_Unit_LSU;
118def LVSR : XForm_1<31, 38, (ops VRRC:$vD, memrr:$src),
119 "lvsl $vD, $src", LdStGeneral,
120 [(set VRRC:$vD, (int_ppc_altivec_lvsr xoaddr:$src))]>,
121 PPC970_Unit_LSU;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000122
123let isStore = 1, noResults = 1, PPC970_Unit = 2 in { // Stores.
Chris Lattner48b61a72006-03-28 00:40:33 +0000124def STVEBX: XForm_8<31, 135, (ops VRRC:$rS, memrr:$dst),
125 "stvebx $rS, $dst", LdStGeneral,
126 [(int_ppc_altivec_stvebx VRRC:$rS, xoaddr:$dst)]>;
127def STVEHX: XForm_8<31, 167, (ops VRRC:$rS, memrr:$dst),
128 "stvehx $rS, $dst", LdStGeneral,
129 [(int_ppc_altivec_stvehx VRRC:$rS, xoaddr:$dst)]>;
130def STVEWX: XForm_8<31, 199, (ops VRRC:$rS, memrr:$dst),
131 "stvewx $rS, $dst", LdStGeneral,
132 [(int_ppc_altivec_stvewx VRRC:$rS, xoaddr:$dst)]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000133def STVX : XForm_8<31, 231, (ops VRRC:$rS, memrr:$dst),
134 "stvx $rS, $dst", LdStGeneral,
Chris Lattnerecc219b2006-03-28 02:29:37 +0000135 [(int_ppc_altivec_stvx VRRC:$rS, xoaddr:$dst)]>;
136def STVXL : XForm_8<31, 487, (ops VRRC:$rS, memrr:$dst),
137 "stvxl $rS, $dst", LdStGeneral,
138 [(int_ppc_altivec_stvxl VRRC:$rS, xoaddr:$dst)]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000139}
140
141let PPC970_Unit = 5 in { // VALU Operations.
142// VA-Form instructions. 3-input AltiVec ops.
143def VMADDFP : VAForm_1<46, (ops VRRC:$vD, VRRC:$vA, VRRC:$vC, VRRC:$vB),
144 "vmaddfp $vD, $vA, $vC, $vB", VecFP,
145 [(set VRRC:$vD, (fadd (fmul VRRC:$vA, VRRC:$vC),
146 VRRC:$vB))]>,
147 Requires<[FPContractions]>;
148def VNMSUBFP: VAForm_1<47, (ops VRRC:$vD, VRRC:$vA, VRRC:$vC, VRRC:$vB),
149 "vnmsubfp $vD, $vA, $vC, $vB", VecFP,
150 [(set VRRC:$vD, (fneg (fsub (fmul VRRC:$vA, VRRC:$vC),
151 VRRC:$vB)))]>,
152 Requires<[FPContractions]>;
Chris Lattnerb5c4d172006-03-31 21:57:36 +0000153def VMHADDSHS : VA1a_Int<32, "vmhaddshs", int_ppc_altivec_vmhaddshs>;
154def VMHRADDSHS : VA1a_Int<33, "vmhraddshs", int_ppc_altivec_vmhraddshs>;
155def VPERM : VA1a_Int<43, "vperm", int_ppc_altivec_vperm>;
156def VSEL : VA1a_Int<42, "vsel", int_ppc_altivec_vsel>;
Chris Lattnera9cb4412006-03-31 20:00:35 +0000157
Chris Lattnere7d959c2006-03-26 00:41:48 +0000158def VSLDOI : VAForm_2<44, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB, u5imm:$SH),
159 "vsldoi $vD, $vA, $vB, $SH", VecFP,
160 [(set VRRC:$vD,
161 (int_ppc_altivec_vsldoi VRRC:$vA, VRRC:$vB,
162 imm:$SH))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000163
164// VX-Form instructions. AltiVec arithmetic ops.
165def VADDFP : VXForm_1<10, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
166 "vaddfp $vD, $vA, $vB", VecFP,
167 [(set VRRC:$vD, (fadd VRRC:$vA, VRRC:$vB))]>;
Chris Lattner5d729072006-03-26 02:39:02 +0000168
169def VADDUBM : VXForm_1<0, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
170 "vaddubm $vD, $vA, $vB", VecGeneral,
171 [(set VRRC:$vD, (add (v16i8 VRRC:$vA), VRRC:$vB))]>;
172def VADDUHM : VXForm_1<64, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
173 "vadduhm $vD, $vA, $vB", VecGeneral,
174 [(set VRRC:$vD, (add (v8i16 VRRC:$vA), VRRC:$vB))]>;
175def VADDUWM : VXForm_1<128, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
176 "vadduwm $vD, $vA, $vB", VecGeneral,
177 [(set VRRC:$vD, (add (v4i32 VRRC:$vA), VRRC:$vB))]>;
178
Chris Lattner348ba3f2006-03-31 22:41:56 +0000179def VADDCUW : VX1_Int<384, "vaddcuw", int_ppc_altivec_vaddcuw>;
180def VADDSBS : VX1_Int<768, "vaddsbs", int_ppc_altivec_vaddsbs>;
181def VADDSHS : VX1_Int<832, "vaddshs", int_ppc_altivec_vaddshs>;
182def VADDSWS : VX1_Int<896, "vaddsws", int_ppc_altivec_vaddsws>;
183def VADDUBS : VX1_Int<512, "vaddubs", int_ppc_altivec_vaddubs>;
184def VADDUHS : VX1_Int<576, "vadduhs", int_ppc_altivec_vadduhs>;
185def VADDUWS : VX1_Int<640, "vadduws", int_ppc_altivec_vadduws>;
Chris Lattner5d729072006-03-26 02:39:02 +0000186
Chris Lattner348ba3f2006-03-31 22:41:56 +0000187
Chris Lattner2430a5f2006-03-25 22:16:05 +0000188def VAND : VXForm_1<1028, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
189 "vand $vD, $vA, $vB", VecFP,
190 [(set VRRC:$vD, (and (v4i32 VRRC:$vA), VRRC:$vB))]>;
191def VANDC : VXForm_1<1092, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
192 "vandc $vD, $vA, $vB", VecFP,
Chris Lattneraf9136b2006-03-25 23:10:40 +0000193 [(set VRRC:$vD, (and (v4i32 VRRC:$vA), (vnot VRRC:$vB)))]>;
Chris Lattner2430a5f2006-03-25 22:16:05 +0000194
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000195def VCFSX : VXForm_1<842, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB),
196 "vcfsx $vD, $vB, $UIMM", VecFP,
Chris Lattner984f38b2006-03-25 08:01:02 +0000197 [(set VRRC:$vD,
198 (int_ppc_altivec_vcfsx VRRC:$vB, imm:$UIMM))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000199def VCFUX : VXForm_1<778, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB),
200 "vcfux $vD, $vB, $UIMM", VecFP,
Chris Lattner984f38b2006-03-25 08:01:02 +0000201 [(set VRRC:$vD,
202 (int_ppc_altivec_vcfux VRRC:$vB, imm:$UIMM))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000203def VCTSXS : VXForm_1<970, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB),
204 "vctsxs $vD, $vB, $UIMM", VecFP,
205 []>;
206def VCTUXS : VXForm_1<906, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB),
207 "vctuxs $vD, $vB, $UIMM", VecFP,
208 []>;
Chris Lattner348ba3f2006-03-31 22:41:56 +0000209def VEXPTEFP : VX2_Int<394, "vexptefp", int_ppc_altivec_vexptefp>;
210def VLOGEFP : VX2_Int<458, "vlogefp", int_ppc_altivec_vlogefp>;
211
Chris Lattnerc461a512006-04-03 15:58:28 +0000212def VMAXFP : VX1_Int<1034, "vmaxfp", int_ppc_altivec_vmaxfp>;
213def VMAXSB : VX1_Int< 258, "vmaxsb", int_ppc_altivec_vmaxsb>;
214def VMAXSH : VX1_Int< 322, "vmaxsh", int_ppc_altivec_vmaxsh>;
215def VMAXSW : VX1_Int< 386, "vmaxsw", int_ppc_altivec_vmaxsw>;
216def VMAXUB : VX1_Int< 2, "vmaxub", int_ppc_altivec_vmaxub>;
217def VMAXUH : VX1_Int< 66, "vmaxuh", int_ppc_altivec_vmaxuh>;
218def VMAXUW : VX1_Int< 130, "vmaxuw", int_ppc_altivec_vmaxuw>;
219def VMINFP : VX1_Int<1098, "vminfp", int_ppc_altivec_vminfp>;
220def VMINSB : VX1_Int< 770, "vminsb", int_ppc_altivec_vminsb>;
221def VMINSH : VX1_Int< 834, "vminsh", int_ppc_altivec_vminsh>;
222def VMINSW : VX1_Int< 896, "vminsw", int_ppc_altivec_vminsw>;
223def VMINUB : VX1_Int< 514, "vminub", int_ppc_altivec_vminub>;
224def VMINUH : VX1_Int< 578, "vminuh", int_ppc_altivec_vminuh>;
225def VMINUW : VX1_Int< 642, "vminuw", int_ppc_altivec_vminuw>;
Chris Lattner30a6aba2006-03-30 23:07:36 +0000226
Chris Lattner6cea8142006-03-31 22:34:05 +0000227def VMRGHH : VX1_Int<76 , "vmrghh", int_ppc_altivec_vmrghh>;
228def VMRGHW : VX1_Int<140, "vmrghw", int_ppc_altivec_vmrghw>;
229def VMRGLH : VX1_Int<332, "vmrglh", int_ppc_altivec_vmrglh>;
230def VMRGLW : VX1_Int<396, "vmrglw", int_ppc_altivec_vmrglw>;
Chris Lattner3c4f4e9f2006-03-30 23:21:27 +0000231
Chris Lattnerb5c4d172006-03-31 21:57:36 +0000232def VMSUMMBM : VA1a_Int<37, "vmsummbm", int_ppc_altivec_vmsummbm>;
233def VMSUMSHM : VA1a_Int<40, "vmsumshm", int_ppc_altivec_vmsumshm>;
234def VMSUMSHS : VA1a_Int<41, "vmsumshs", int_ppc_altivec_vmsumshs>;
235def VMSUMUBM : VA1a_Int<36, "vmsumubm", int_ppc_altivec_vmsumubm>;
236def VMSUMUHM : VA1a_Int<38, "vmsumuhm", int_ppc_altivec_vmsumuhm>;
237def VMSUMUHS : VA1a_Int<39, "vmsumuhs", int_ppc_altivec_vmsumuhs>;
Chris Lattner8768bf62006-03-30 23:39:06 +0000238
Chris Lattner6cea8142006-03-31 22:34:05 +0000239def VMULESB : VX1_Int<776, "vmulesb", int_ppc_altivec_vmulesb>;
240def VMULESH : VX1_Int<840, "vmulesh", int_ppc_altivec_vmulesh>;
241def VMULEUB : VX1_Int<520, "vmuleub", int_ppc_altivec_vmuleub>;
242def VMULEUH : VX1_Int<584, "vmuleuh", int_ppc_altivec_vmuleuh>;
243def VMULOSB : VX1_Int<264, "vmulosb", int_ppc_altivec_vmulosb>;
244def VMULOSH : VX1_Int<328, "vmulosh", int_ppc_altivec_vmulosh>;
245def VMULOUB : VX1_Int< 8, "vmuloub", int_ppc_altivec_vmuloub>;
246def VMULOUH : VX1_Int< 72, "vmulouh", int_ppc_altivec_vmulouh>;
Chris Lattner30a6aba2006-03-30 23:07:36 +0000247
Chris Lattner6cea8142006-03-31 22:34:05 +0000248def VREFP : VX2_Int<266, "vrefp", int_ppc_altivec_vrefp>;
249def VRFIM : VX2_Int<714, "vrfim", int_ppc_altivec_vrfim>;
250def VRFIN : VX2_Int<522, "vrfin", int_ppc_altivec_vrfin>;
251def VRFIP : VX2_Int<650, "vrfip", int_ppc_altivec_vrfip>;
252def VRFIZ : VX2_Int<586, "vrfiz", int_ppc_altivec_vrfiz>;
253def VRSQRTEFP : VX2_Int<330, "vrsqrtefp", int_ppc_altivec_vrsqrtefp>;
Chris Lattner3c4f4e9f2006-03-30 23:21:27 +0000254
Chris Lattner6cea8142006-03-31 22:34:05 +0000255def VSUBCUW : VX1_Int<74, "vsubcuw", int_ppc_altivec_vsubcuw>;
Chris Lattner3c4f4e9f2006-03-30 23:21:27 +0000256
257def VSUBFP : VXForm_1<74, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
258 "vsubfp $vD, $vA, $vB", VecGeneral,
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000259 [(set VRRC:$vD, (fsub VRRC:$vA, VRRC:$vB))]>;
Chris Lattner5d729072006-03-26 02:39:02 +0000260def VSUBUBM : VXForm_1<1024, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
261 "vsububm $vD, $vA, $vB", VecGeneral,
262 [(set VRRC:$vD, (sub (v16i8 VRRC:$vA), VRRC:$vB))]>;
263def VSUBUHM : VXForm_1<1088, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
264 "vsubuhm $vD, $vA, $vB", VecGeneral,
265 [(set VRRC:$vD, (sub (v8i16 VRRC:$vA), VRRC:$vB))]>;
266def VSUBUWM : VXForm_1<1152, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
267 "vsubuwm $vD, $vA, $vB", VecGeneral,
268 [(set VRRC:$vD, (sub (v4i32 VRRC:$vA), VRRC:$vB))]>;
269
Chris Lattner6cea8142006-03-31 22:34:05 +0000270def VSUBSBS : VX1_Int<1792, "vsubsbs" , int_ppc_altivec_vsubsbs>;
271def VSUBSHS : VX1_Int<1856, "vsubshs" , int_ppc_altivec_vsubshs>;
272def VSUBSWS : VX1_Int<1920, "vsubsws" , int_ppc_altivec_vsubsws>;
273def VSUBUBS : VX1_Int<1536, "vsububs" , int_ppc_altivec_vsububs>;
274def VSUBUHS : VX1_Int<1600, "vsubuhs" , int_ppc_altivec_vsubuhs>;
275def VSUBUWS : VX1_Int<1664, "vsubuws" , int_ppc_altivec_vsubuws>;
276def VSUMSWS : VX1_Int<1928, "vsumsws" , int_ppc_altivec_vsumsws>;
277def VSUM2SWS: VX1_Int<1672, "vsum2sws", int_ppc_altivec_vsum2sws>;
278def VSUM4SBS: VX1_Int<1672, "vsum4sbs", int_ppc_altivec_vsum4sbs>;
279def VSUM4SHS: VX1_Int<1608, "vsum4shs", int_ppc_altivec_vsum4shs>;
280def VSUM4UBS: VX1_Int<1544, "vsum4ubs", int_ppc_altivec_vsum4ubs>;
Chris Lattnerecc219b2006-03-28 02:29:37 +0000281
Chris Lattner2430a5f2006-03-25 22:16:05 +0000282def VNOR : VXForm_1<1284, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
283 "vnor $vD, $vA, $vB", VecFP,
Chris Lattner6509ae82006-03-25 23:05:29 +0000284 [(set VRRC:$vD, (vnot (or (v4i32 VRRC:$vA), VRRC:$vB)))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000285def VOR : VXForm_1<1156, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
286 "vor $vD, $vA, $vB", VecFP,
Chris Lattner2430a5f2006-03-25 22:16:05 +0000287 [(set VRRC:$vD, (or (v4i32 VRRC:$vA), VRRC:$vB))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000288def VXOR : VXForm_1<1220, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
289 "vxor $vD, $vA, $vB", VecFP,
Chris Lattner2430a5f2006-03-25 22:16:05 +0000290 [(set VRRC:$vD, (xor (v4i32 VRRC:$vA), VRRC:$vB))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000291
Chris Lattner6cea8142006-03-31 22:34:05 +0000292def VRLB : VX1_Int< 4, "vrlb", int_ppc_altivec_vrlb>;
293def VRLH : VX1_Int< 68, "vrlh", int_ppc_altivec_vrlh>;
294def VRLW : VX1_Int< 132, "vrlw", int_ppc_altivec_vrlw>;
295def VSLO : VX1_Int<1036, "vslo", int_ppc_altivec_vslo>;
296def VSLB : VX1_Int< 260, "vslb", int_ppc_altivec_vslb>;
297def VSLH : VX1_Int< 324, "vslh", int_ppc_altivec_vslh>;
298def VSLW : VX1_Int< 388, "vslw", int_ppc_altivec_vslw>;
Chris Lattnerecc219b2006-03-28 02:29:37 +0000299
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000300def VSPLTB : VXForm_1<524, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB),
301 "vspltb $vD, $vB, $UIMM", VecPerm,
Chris Lattner684ad772006-04-04 00:05:13 +0000302 [(set VRRC:$vD, (vector_shuffle (v16i8 VRRC:$vB), (undef),
Chris Lattner7ff7e672006-04-04 17:25:31 +0000303 VSPLTB_shuffle_mask:$UIMM))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000304def VSPLTH : VXForm_1<588, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB),
305 "vsplth $vD, $vB, $UIMM", VecPerm,
Chris Lattner7ff7e672006-04-04 17:25:31 +0000306 [(set VRRC:$vD, (vector_shuffle (v16i8 VRRC:$vB), (undef),
307 VSPLTH_shuffle_mask:$UIMM))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000308def VSPLTW : VXForm_1<652, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB),
309 "vspltw $vD, $vB, $UIMM", VecPerm,
Chris Lattner7ff7e672006-04-04 17:25:31 +0000310 [(set VRRC:$vD, (vector_shuffle (v16i8 VRRC:$vB), (undef),
311 VSPLTW_shuffle_mask:$UIMM))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000312
Chris Lattner6cea8142006-03-31 22:34:05 +0000313def VSR : VX1_Int< 708, "vsr" , int_ppc_altivec_vsr>;
314def VSRO : VX1_Int<1100, "vsro" , int_ppc_altivec_vsro>;
315def VSRAB : VX1_Int< 772, "vsrab", int_ppc_altivec_vsrab>;
316def VSRAH : VX1_Int< 836, "vsrah", int_ppc_altivec_vsrah>;
317def VSRAW : VX1_Int< 900, "vsraw", int_ppc_altivec_vsraw>;
318def VSRB : VX1_Int< 516, "vsrb" , int_ppc_altivec_vsrb>;
319def VSRH : VX1_Int< 580, "vsrh" , int_ppc_altivec_vsrh>;
320def VSRW : VX1_Int< 644, "vsrw" , int_ppc_altivec_vsrw>;
Chris Lattnerecc219b2006-03-28 02:29:37 +0000321
322
Chris Lattnereeaf72a2006-03-27 03:28:57 +0000323def VSPLTISB : VXForm_3<780, (ops VRRC:$vD, s5imm:$SIMM),
324 "vspltisb $vD, $SIMM", VecPerm,
325 [(set VRRC:$vD, (v4f32 vecspltisb:$SIMM))]>;
326def VSPLTISH : VXForm_3<844, (ops VRRC:$vD, s5imm:$SIMM),
327 "vspltish $vD, $SIMM", VecPerm,
328 [(set VRRC:$vD, (v4f32 vecspltish:$SIMM))]>;
329def VSPLTISW : VXForm_3<908, (ops VRRC:$vD, s5imm:$SIMM),
330 "vspltisw $vD, $SIMM", VecPerm,
331 [(set VRRC:$vD, (v4f32 vecspltisw:$SIMM))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000332
Chris Lattner30a6aba2006-03-30 23:07:36 +0000333// Vector Pack.
Chris Lattner6cea8142006-03-31 22:34:05 +0000334def VPKPX : VX1_Int<782, "vpkpx", int_ppc_altivec_vpkpx>;
335def VPKSHSS : VX1_Int<398, "vpkshss", int_ppc_altivec_vpkshss>;
336def VPKSHUS : VX1_Int<270, "vpkshus", int_ppc_altivec_vpkshus>;
337def VPKSWSS : VX1_Int<462, "vpkswss", int_ppc_altivec_vpkswss>;
338def VPKSWUS : VX1_Int<334, "vpkswus", int_ppc_altivec_vpkswus>;
Chris Lattner30a6aba2006-03-30 23:07:36 +0000339def VPKUHUM : VXForm_1<14, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
340 "vpkuhum $vD, $vA, $vB", VecFP,
341 [/*TODO*/]>;
Chris Lattner6cea8142006-03-31 22:34:05 +0000342def VPKUHUS : VX1_Int<142, "vpkuhus", int_ppc_altivec_vpkuhus>;
Chris Lattner30a6aba2006-03-30 23:07:36 +0000343def VPKUWUM : VXForm_1<78, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB),
344 "vpkuwum $vD, $vA, $vB", VecFP,
345 [/*TODO*/]>;
Chris Lattner6cea8142006-03-31 22:34:05 +0000346def VPKUWUS : VX1_Int<206, "vpkuwus", int_ppc_altivec_vpkuwus>;
Chris Lattner30a6aba2006-03-30 23:07:36 +0000347
348// Vector Unpack.
Chris Lattner348ba3f2006-03-31 22:41:56 +0000349def VUPKHPX : VX2_Int<846, "vupkhpx", int_ppc_altivec_vupkhpx>;
350def VUPKHSB : VX2_Int<526, "vupkhsb", int_ppc_altivec_vupkhsb>;
351def VUPKHSH : VX2_Int<590, "vupkhsh", int_ppc_altivec_vupkhsh>;
352def VUPKLPX : VX2_Int<974, "vupklpx", int_ppc_altivec_vupklpx>;
353def VUPKLSB : VX2_Int<654, "vupklsb", int_ppc_altivec_vupklsb>;
354def VUPKLSH : VX2_Int<718, "vupklsh", int_ppc_altivec_vupklsh>;
Chris Lattner30a6aba2006-03-30 23:07:36 +0000355
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000356
Chris Lattnerb8a45c22006-03-26 04:57:17 +0000357// Altivec Comparisons.
358
Chris Lattner5f7b0192006-03-31 05:32:57 +0000359class VCMP<bits<10> xo, string asmstr, ValueType Ty>
360 : VXRForm_1<xo, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), asmstr, VecFPCompare,
361 [(set VRRC:$vD, (Ty (PPCvcmp VRRC:$vA, VRRC:$vB, xo)))]>;
362class VCMPo<bits<10> xo, string asmstr, ValueType Ty>
363 : VXRForm_1<xo, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), asmstr, VecFPCompare,
Chris Lattner7ff7e672006-04-04 17:25:31 +0000364 [(set VRRC:$vD, (Ty (PPCvcmp_o VRRC:$vA, VRRC:$vB, xo)))]> {
365 let Defs = [CR6];
366 let RC = 1;
367}
Chris Lattner5f7b0192006-03-31 05:32:57 +0000368
369// f32 element comparisons.0
370def VCMPBFP : VCMP <966, "vcmpbfp $vD, $vA, $vB" , v4f32>;
371def VCMPBFPo : VCMPo<966, "vcmpbfp. $vD, $vA, $vB" , v4f32>;
372def VCMPEQFP : VCMP <198, "vcmpeqfp $vD, $vA, $vB" , v4f32>;
373def VCMPEQFPo : VCMPo<198, "vcmpeqfp. $vD, $vA, $vB", v4f32>;
374def VCMPGEFP : VCMP <454, "vcmpgefp $vD, $vA, $vB" , v4f32>;
375def VCMPGEFPo : VCMPo<454, "vcmpgefp. $vD, $vA, $vB", v4f32>;
376def VCMPGTFP : VCMP <710, "vcmpgtfp $vD, $vA, $vB" , v4f32>;
377def VCMPGTFPo : VCMPo<710, "vcmpgtfp. $vD, $vA, $vB", v4f32>;
Chris Lattnerb8a45c22006-03-26 04:57:17 +0000378
379// i8 element comparisons.
Chris Lattner5f7b0192006-03-31 05:32:57 +0000380def VCMPEQUB : VCMP < 6, "vcmpequb $vD, $vA, $vB" , v16i8>;
381def VCMPEQUBo : VCMPo< 6, "vcmpequb. $vD, $vA, $vB", v16i8>;
382def VCMPGTSB : VCMP <774, "vcmpgtsb $vD, $vA, $vB" , v16i8>;
383def VCMPGTSBo : VCMPo<774, "vcmpgtsb. $vD, $vA, $vB", v16i8>;
384def VCMPGTUB : VCMP <518, "vcmpgtub $vD, $vA, $vB" , v16i8>;
385def VCMPGTUBo : VCMPo<518, "vcmpgtub. $vD, $vA, $vB", v16i8>;
Chris Lattnerb8a45c22006-03-26 04:57:17 +0000386
387// i16 element comparisons.
Chris Lattner5f7b0192006-03-31 05:32:57 +0000388def VCMPEQUH : VCMP < 70, "vcmpequh $vD, $vA, $vB" , v8i16>;
389def VCMPEQUHo : VCMPo< 70, "vcmpequh. $vD, $vA, $vB", v8i16>;
390def VCMPGTSH : VCMP <838, "vcmpgtsh $vD, $vA, $vB" , v8i16>;
391def VCMPGTSHo : VCMPo<838, "vcmpgtsh. $vD, $vA, $vB", v8i16>;
392def VCMPGTUH : VCMP <582, "vcmpgtuh $vD, $vA, $vB" , v8i16>;
393def VCMPGTUHo : VCMPo<582, "vcmpgtuh. $vD, $vA, $vB", v8i16>;
Chris Lattnerb8a45c22006-03-26 04:57:17 +0000394
395// i32 element comparisons.
Chris Lattner5f7b0192006-03-31 05:32:57 +0000396def VCMPEQUW : VCMP <134, "vcmpequw $vD, $vA, $vB" , v4i32>;
397def VCMPEQUWo : VCMPo<134, "vcmpequw. $vD, $vA, $vB", v4i32>;
398def VCMPGTSW : VCMP <902, "vcmpgtsw $vD, $vA, $vB" , v4i32>;
399def VCMPGTSWo : VCMPo<902, "vcmpgtsw. $vD, $vA, $vB", v4i32>;
400def VCMPGTUW : VCMP <646, "vcmpgtuw $vD, $vA, $vB" , v4i32>;
401def VCMPGTUWo : VCMPo<646, "vcmpgtuw. $vD, $vA, $vB", v4i32>;
Chris Lattnerb8a45c22006-03-26 04:57:17 +0000402
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000403def V_SET0 : VXForm_setzero<1220, (ops VRRC:$vD),
404 "vxor $vD, $vD, $vD", VecFP,
Evan Cheng5b6a01b2006-03-26 09:52:32 +0000405 [(set VRRC:$vD, (v4f32 immAllZerosV))]>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000406}
407
408//===----------------------------------------------------------------------===//
409// Additional Altivec Patterns
410//
411
412// Undef/Zero.
413def : Pat<(v16i8 (undef)), (v16i8 (IMPLICIT_DEF_VRRC))>;
414def : Pat<(v8i16 (undef)), (v8i16 (IMPLICIT_DEF_VRRC))>;
415def : Pat<(v4i32 (undef)), (v4i32 (IMPLICIT_DEF_VRRC))>;
Evan Cheng5b6a01b2006-03-26 09:52:32 +0000416def : Pat<(v16i8 immAllZerosV), (v16i8 (V_SET0))>;
417def : Pat<(v8i16 immAllZerosV), (v8i16 (V_SET0))>;
418def : Pat<(v4i32 immAllZerosV), (v4i32 (V_SET0))>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000419
420// Loads.
421def : Pat<(v16i8 (load xoaddr:$src)), (v16i8 (LVX xoaddr:$src))>;
422def : Pat<(v8i16 (load xoaddr:$src)), (v8i16 (LVX xoaddr:$src))>;
423def : Pat<(v4i32 (load xoaddr:$src)), (v4i32 (LVX xoaddr:$src))>;
Chris Lattnerecc219b2006-03-28 02:29:37 +0000424def : Pat<(v4f32 (load xoaddr:$src)), (v4f32 (LVX xoaddr:$src))>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000425
426// Stores.
427def : Pat<(store (v16i8 VRRC:$rS), xoaddr:$dst),
428 (STVX (v16i8 VRRC:$rS), xoaddr:$dst)>;
429def : Pat<(store (v8i16 VRRC:$rS), xoaddr:$dst),
430 (STVX (v8i16 VRRC:$rS), xoaddr:$dst)>;
431def : Pat<(store (v4i32 VRRC:$rS), xoaddr:$dst),
432 (STVX (v4i32 VRRC:$rS), xoaddr:$dst)>;
Chris Lattnerecc219b2006-03-28 02:29:37 +0000433def : Pat<(store (v4f32 VRRC:$rS), xoaddr:$dst),
434 (STVX (v4f32 VRRC:$rS), xoaddr:$dst)>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000435
436// Bit conversions.
437def : Pat<(v16i8 (bitconvert (v8i16 VRRC:$src))), (v16i8 VRRC:$src)>;
438def : Pat<(v16i8 (bitconvert (v4i32 VRRC:$src))), (v16i8 VRRC:$src)>;
439def : Pat<(v16i8 (bitconvert (v4f32 VRRC:$src))), (v16i8 VRRC:$src)>;
440
441def : Pat<(v8i16 (bitconvert (v16i8 VRRC:$src))), (v8i16 VRRC:$src)>;
442def : Pat<(v8i16 (bitconvert (v4i32 VRRC:$src))), (v8i16 VRRC:$src)>;
443def : Pat<(v8i16 (bitconvert (v4f32 VRRC:$src))), (v8i16 VRRC:$src)>;
444
445def : Pat<(v4i32 (bitconvert (v16i8 VRRC:$src))), (v4i32 VRRC:$src)>;
446def : Pat<(v4i32 (bitconvert (v8i16 VRRC:$src))), (v4i32 VRRC:$src)>;
447def : Pat<(v4i32 (bitconvert (v4f32 VRRC:$src))), (v4i32 VRRC:$src)>;
448
449def : Pat<(v4f32 (bitconvert (v16i8 VRRC:$src))), (v4f32 VRRC:$src)>;
450def : Pat<(v4f32 (bitconvert (v8i16 VRRC:$src))), (v4f32 VRRC:$src)>;
451def : Pat<(v4f32 (bitconvert (v4i32 VRRC:$src))), (v4f32 VRRC:$src)>;
452
453// Immediate vector formation with vsplti*.
454def : Pat<(v16i8 vecspltisb:$invec), (v16i8 (VSPLTISB vecspltisb:$invec))>;
455def : Pat<(v16i8 vecspltish:$invec), (v16i8 (VSPLTISH vecspltish:$invec))>;
456def : Pat<(v16i8 vecspltisw:$invec), (v16i8 (VSPLTISW vecspltisw:$invec))>;
457
458def : Pat<(v8i16 vecspltisb:$invec), (v8i16 (VSPLTISB vecspltisb:$invec))>;
459def : Pat<(v8i16 vecspltish:$invec), (v8i16 (VSPLTISH vecspltish:$invec))>;
460def : Pat<(v8i16 vecspltisw:$invec), (v8i16 (VSPLTISW vecspltisw:$invec))>;
461
462def : Pat<(v4i32 vecspltisb:$invec), (v4i32 (VSPLTISB vecspltisb:$invec))>;
463def : Pat<(v4i32 vecspltish:$invec), (v4i32 (VSPLTISH vecspltish:$invec))>;
464def : Pat<(v4i32 vecspltisw:$invec), (v4i32 (VSPLTISW vecspltisw:$invec))>;
465
Chris Lattner2430a5f2006-03-25 22:16:05 +0000466// Logical Operations
Chris Lattnerc3837d42006-04-01 22:41:47 +0000467def : Pat<(v16i8 (vnot VRRC:$vA)), (v16i8 (VNOR VRRC:$vA, VRRC:$vA))>;
468def : Pat<(v8i16 (vnot VRRC:$vA)), (v8i16 (VNOR VRRC:$vA, VRRC:$vA))>;
469def : Pat<(v4i32 (vnot VRRC:$vA)), (v4i32 (VNOR VRRC:$vA, VRRC:$vA))>;
470
Chris Lattner2430a5f2006-03-25 22:16:05 +0000471def : Pat<(v16i8 (and VRRC:$A, VRRC:$B)), (v16i8 (VAND VRRC:$A, VRRC:$B))>;
472def : Pat<(v8i16 (and VRRC:$A, VRRC:$B)), (v8i16 (VAND VRRC:$A, VRRC:$B))>;
473def : Pat<(v16i8 (or VRRC:$A, VRRC:$B)), (v16i8 (VOR VRRC:$A, VRRC:$B))>;
474def : Pat<(v8i16 (or VRRC:$A, VRRC:$B)), (v8i16 (VOR VRRC:$A, VRRC:$B))>;
475def : Pat<(v16i8 (xor VRRC:$A, VRRC:$B)), (v16i8 (VXOR VRRC:$A, VRRC:$B))>;
476def : Pat<(v8i16 (xor VRRC:$A, VRRC:$B)), (v8i16 (VXOR VRRC:$A, VRRC:$B))>;
Chris Lattner6509ae82006-03-25 23:05:29 +0000477def : Pat<(v16i8 (vnot (or VRRC:$A, VRRC:$B))),(v16i8 (VNOR VRRC:$A, VRRC:$B))>;
478def : Pat<(v8i16 (vnot (or VRRC:$A, VRRC:$B))),(v8i16 (VNOR VRRC:$A, VRRC:$B))>;
Chris Lattneraf9136b2006-03-25 23:10:40 +0000479def : Pat<(v16i8 (and VRRC:$A, (vnot VRRC:$B))),
Chris Lattner6509ae82006-03-25 23:05:29 +0000480 (v16i8 (VANDC VRRC:$A, VRRC:$B))>;
Chris Lattneraf9136b2006-03-25 23:10:40 +0000481def : Pat<(v8i16 (and VRRC:$A, (vnot VRRC:$B))),
Chris Lattner6509ae82006-03-25 23:05:29 +0000482 (v8i16 (VANDC VRRC:$A, VRRC:$B))>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000483
484def : Pat<(fmul VRRC:$vA, VRRC:$vB),
485 (VMADDFP VRRC:$vA, VRRC:$vB, (V_SET0))>;
486
487// Fused multiply add and multiply sub for packed float. These are represented
488// separately from the real instructions above, for operations that must have
489// the additional precision, such as Newton-Rhapson (used by divide, sqrt)
490def : Pat<(PPCvmaddfp VRRC:$A, VRRC:$B, VRRC:$C),
491 (VMADDFP VRRC:$A, VRRC:$B, VRRC:$C)>;
492def : Pat<(PPCvnmsubfp VRRC:$A, VRRC:$B, VRRC:$C),
493 (VNMSUBFP VRRC:$A, VRRC:$B, VRRC:$C)>;
494
495def : Pat<(int_ppc_altivec_vmaddfp VRRC:$A, VRRC:$B, VRRC:$C),
496 (VMADDFP VRRC:$A, VRRC:$B, VRRC:$C)>;
497def : Pat<(int_ppc_altivec_vnmsubfp VRRC:$A, VRRC:$B, VRRC:$C),
498 (VNMSUBFP VRRC:$A, VRRC:$B, VRRC:$C)>;
Chris Lattnerb22a04d2006-03-25 07:51:43 +0000499
Chris Lattnera9cb4412006-03-31 20:00:35 +0000500def : Pat<(PPCvperm (v16i8 VRRC:$vA), VRRC:$vB, VRRC:$vC),
501 (v16i8 (VPERM VRRC:$vA, VRRC:$vB, VRRC:$vC))>;