Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 1 | //===- PPCInstrAltivec.td - The PowerPC Altivec Extension --*- tablegen -*-===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file was developed by Chris Lattner and is distributed under |
| 6 | // the University of Illinois Open Source License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file describes the Altivec extension to the PowerPC instruction set. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | //===----------------------------------------------------------------------===// |
| 15 | // Altivec transformation functions and pattern fragments. |
| 16 | // |
| 17 | |
| 18 | // VSPLT_get_imm xform function: convert vector_shuffle mask to VSPLT* imm. |
| 19 | def VSPLT_get_imm : SDNodeXForm<build_vector, [{ |
| 20 | return getI32Imm(PPC::getVSPLTImmediate(N)); |
| 21 | }]>; |
| 22 | |
| 23 | def VSPLT_shuffle_mask : PatLeaf<(build_vector), [{ |
| 24 | return PPC::isSplatShuffleMask(N); |
| 25 | }], VSPLT_get_imm>; |
| 26 | |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 27 | |
| 28 | // VSPLTISB_get_imm xform function: convert build_vector to VSPLTISB imm. |
| 29 | def VSPLTISB_get_imm : SDNodeXForm<build_vector, [{ |
| 30 | char Val; |
| 31 | PPC::isVecSplatImm(N, 1, &Val); |
| 32 | return getI32Imm(Val); |
| 33 | }]>; |
| 34 | def vecspltisb : PatLeaf<(build_vector), [{ |
| 35 | return PPC::isVecSplatImm(N, 1); |
| 36 | }], VSPLTISB_get_imm>; |
| 37 | |
| 38 | // VSPLTISH_get_imm xform function: convert build_vector to VSPLTISH imm. |
| 39 | def VSPLTISH_get_imm : SDNodeXForm<build_vector, [{ |
| 40 | char Val; |
| 41 | PPC::isVecSplatImm(N, 2, &Val); |
| 42 | return getI32Imm(Val); |
| 43 | }]>; |
| 44 | def vecspltish : PatLeaf<(build_vector), [{ |
| 45 | return PPC::isVecSplatImm(N, 2); |
| 46 | }], VSPLTISH_get_imm>; |
| 47 | |
| 48 | // VSPLTISW_get_imm xform function: convert build_vector to VSPLTISW imm. |
| 49 | def VSPLTISW_get_imm : SDNodeXForm<build_vector, [{ |
| 50 | char Val; |
| 51 | PPC::isVecSplatImm(N, 4, &Val); |
| 52 | return getI32Imm(Val); |
| 53 | }]>; |
| 54 | def vecspltisw : PatLeaf<(build_vector), [{ |
| 55 | return PPC::isVecSplatImm(N, 4); |
| 56 | }], VSPLTISW_get_imm>; |
| 57 | |
Chris Lattner | b8a45c2 | 2006-03-26 04:57:17 +0000 | [diff] [blame] | 58 | class isVDOT { // vector dot instruction. |
| 59 | list<Register> Defs = [CR6]; |
| 60 | bit RC = 1; |
| 61 | } |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 62 | |
| 63 | //===----------------------------------------------------------------------===// |
Chris Lattner | 3c4f4e9f | 2006-03-30 23:21:27 +0000 | [diff] [blame] | 64 | // Helpers for defining instructions that directly correspond to intrinsics. |
| 65 | |
Chris Lattner | 8768bf6 | 2006-03-30 23:39:06 +0000 | [diff] [blame] | 66 | // VA1a_Int - A VAForm_1a intrinsic definition. |
| 67 | class VA1a_Int<bits<6> xo, string asmstr, Intrinsic IntID> |
| 68 | : VAForm_1a<xo, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB, VRRC:$vC), asmstr, VecFP, |
| 69 | [(set VRRC:$vD, (IntID VRRC:$vA, VRRC:$vB, VRRC:$vC))]>; |
| 70 | |
Chris Lattner | 3c4f4e9f | 2006-03-30 23:21:27 +0000 | [diff] [blame] | 71 | // VX1_Int - A VXForm_1 intrinsic definition. |
| 72 | class VX1_Int<bits<11> xo, string asmstr, Intrinsic IntID> |
| 73 | : VXForm_1<xo, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), asmstr, VecFP, |
| 74 | [(set VRRC:$vD, (IntID VRRC:$vA, VRRC:$vB))]>; |
| 75 | |
| 76 | // VX2_Int - A VXForm_2 intrinsic definition. |
| 77 | class VX2_Int<bits<11> xo, string asmstr, Intrinsic IntID> |
| 78 | : VXForm_2<xo, (ops VRRC:$vD, VRRC:$vB), asmstr, VecFP, |
| 79 | [(set VRRC:$vD, (IntID VRRC:$vB))]>; |
| 80 | |
| 81 | //===----------------------------------------------------------------------===// |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 82 | // Instruction Definitions. |
| 83 | |
| 84 | def IMPLICIT_DEF_VRRC : Pseudo<(ops VRRC:$rD), "; $rD = IMPLICIT_DEF_VRRC", |
| 85 | [(set VRRC:$rD, (v4f32 (undef)))]>; |
| 86 | |
| 87 | let isLoad = 1, PPC970_Unit = 2 in { // Loads. |
| 88 | def LVEBX: XForm_1<31, 7, (ops VRRC:$vD, memrr:$src), |
| 89 | "lvebx $vD, $src", LdStGeneral, |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 90 | [(set VRRC:$vD, (int_ppc_altivec_lvebx xoaddr:$src))]>; |
Chris Lattner | e7d959c | 2006-03-26 00:41:48 +0000 | [diff] [blame] | 91 | def LVEHX: XForm_1<31, 39, (ops VRRC:$vD, memrr:$src), |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 92 | "lvehx $vD, $src", LdStGeneral, |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 93 | [(set VRRC:$vD, (int_ppc_altivec_lvehx xoaddr:$src))]>; |
Chris Lattner | e7d959c | 2006-03-26 00:41:48 +0000 | [diff] [blame] | 94 | def LVEWX: XForm_1<31, 71, (ops VRRC:$vD, memrr:$src), |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 95 | "lvewx $vD, $src", LdStGeneral, |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 96 | [(set VRRC:$vD, (int_ppc_altivec_lvewx xoaddr:$src))]>; |
Chris Lattner | e7d959c | 2006-03-26 00:41:48 +0000 | [diff] [blame] | 97 | def LVX : XForm_1<31, 103, (ops VRRC:$vD, memrr:$src), |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 98 | "lvx $vD, $src", LdStGeneral, |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 99 | [(set VRRC:$vD, (int_ppc_altivec_lvx xoaddr:$src))]>; |
| 100 | def LVXL : XForm_1<31, 359, (ops VRRC:$vD, memrr:$src), |
| 101 | "lvxl $vD, $src", LdStGeneral, |
| 102 | [(set VRRC:$vD, (int_ppc_altivec_lvxl xoaddr:$src))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 103 | } |
| 104 | |
Chris Lattner | 30a6aba | 2006-03-30 23:07:36 +0000 | [diff] [blame] | 105 | def LVSL : XForm_1<31, 6, (ops VRRC:$vD, memrr:$src), |
| 106 | "lvsl $vD, $src", LdStGeneral, |
| 107 | [(set VRRC:$vD, (int_ppc_altivec_lvsl xoaddr:$src))]>, |
| 108 | PPC970_Unit_LSU; |
| 109 | def LVSR : XForm_1<31, 38, (ops VRRC:$vD, memrr:$src), |
| 110 | "lvsl $vD, $src", LdStGeneral, |
| 111 | [(set VRRC:$vD, (int_ppc_altivec_lvsr xoaddr:$src))]>, |
| 112 | PPC970_Unit_LSU; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 113 | |
| 114 | let isStore = 1, noResults = 1, PPC970_Unit = 2 in { // Stores. |
Chris Lattner | 48b61a7 | 2006-03-28 00:40:33 +0000 | [diff] [blame] | 115 | def STVEBX: XForm_8<31, 135, (ops VRRC:$rS, memrr:$dst), |
| 116 | "stvebx $rS, $dst", LdStGeneral, |
| 117 | [(int_ppc_altivec_stvebx VRRC:$rS, xoaddr:$dst)]>; |
| 118 | def STVEHX: XForm_8<31, 167, (ops VRRC:$rS, memrr:$dst), |
| 119 | "stvehx $rS, $dst", LdStGeneral, |
| 120 | [(int_ppc_altivec_stvehx VRRC:$rS, xoaddr:$dst)]>; |
| 121 | def STVEWX: XForm_8<31, 199, (ops VRRC:$rS, memrr:$dst), |
| 122 | "stvewx $rS, $dst", LdStGeneral, |
| 123 | [(int_ppc_altivec_stvewx VRRC:$rS, xoaddr:$dst)]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 124 | def STVX : XForm_8<31, 231, (ops VRRC:$rS, memrr:$dst), |
| 125 | "stvx $rS, $dst", LdStGeneral, |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 126 | [(int_ppc_altivec_stvx VRRC:$rS, xoaddr:$dst)]>; |
| 127 | def STVXL : XForm_8<31, 487, (ops VRRC:$rS, memrr:$dst), |
| 128 | "stvxl $rS, $dst", LdStGeneral, |
| 129 | [(int_ppc_altivec_stvxl VRRC:$rS, xoaddr:$dst)]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 130 | } |
| 131 | |
| 132 | let PPC970_Unit = 5 in { // VALU Operations. |
| 133 | // VA-Form instructions. 3-input AltiVec ops. |
| 134 | def VMADDFP : VAForm_1<46, (ops VRRC:$vD, VRRC:$vA, VRRC:$vC, VRRC:$vB), |
| 135 | "vmaddfp $vD, $vA, $vC, $vB", VecFP, |
| 136 | [(set VRRC:$vD, (fadd (fmul VRRC:$vA, VRRC:$vC), |
| 137 | VRRC:$vB))]>, |
| 138 | Requires<[FPContractions]>; |
| 139 | def VNMSUBFP: VAForm_1<47, (ops VRRC:$vD, VRRC:$vA, VRRC:$vC, VRRC:$vB), |
| 140 | "vnmsubfp $vD, $vA, $vC, $vB", VecFP, |
| 141 | [(set VRRC:$vD, (fneg (fsub (fmul VRRC:$vA, VRRC:$vC), |
| 142 | VRRC:$vB)))]>, |
| 143 | Requires<[FPContractions]>; |
Nate Begeman | 98e70cc | 2006-03-28 04:15:58 +0000 | [diff] [blame] | 144 | def VMHADDSHS : VAForm_1a<32, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB, VRRC:$vC), |
| 145 | "vmhaddshs $vD, $vA, $vB, $vC", VecFP, |
| 146 | [(set VRRC:$vD, |
| 147 | (int_ppc_altivec_vmhaddshs VRRC:$vA, VRRC:$vB, VRRC:$vC))]>; |
| 148 | def VMHRADDSHS : VAForm_1a<33, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB, VRRC:$vC), |
| 149 | "vmhraddshs $vD, $vA, $vB, $vC", VecFP, |
| 150 | [(set VRRC:$vD, |
| 151 | (int_ppc_altivec_vmhraddshs VRRC:$vA, VRRC:$vB, VRRC:$vC))]>; |
Chris Lattner | fb143ce | 2006-03-27 03:34:17 +0000 | [diff] [blame] | 152 | def VPERM : VAForm_1a<43, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB, VRRC:$vC), |
| 153 | "vperm $vD, $vA, $vB, $vC", VecPerm, |
| 154 | [(set VRRC:$vD, |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 155 | (PPCvperm (v4f32 VRRC:$vA), VRRC:$vB, VRRC:$vC))]>; |
Chris Lattner | e7d959c | 2006-03-26 00:41:48 +0000 | [diff] [blame] | 156 | def VSLDOI : VAForm_2<44, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB, u5imm:$SH), |
| 157 | "vsldoi $vD, $vA, $vB, $SH", VecFP, |
| 158 | [(set VRRC:$vD, |
| 159 | (int_ppc_altivec_vsldoi VRRC:$vA, VRRC:$vB, |
| 160 | imm:$SH))]>; |
Chris Lattner | fb143ce | 2006-03-27 03:34:17 +0000 | [diff] [blame] | 161 | def VSEL : VAForm_1a<42, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB, VRRC:$vC), |
Chris Lattner | bd6be6f | 2006-03-26 22:38:43 +0000 | [diff] [blame] | 162 | "vsel $vD, $vA, $vB, $vC", VecFP, |
| 163 | [(set VRRC:$vD, |
| 164 | (int_ppc_altivec_vsel VRRC:$vA, VRRC:$vB, VRRC:$vC))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 165 | |
| 166 | // VX-Form instructions. AltiVec arithmetic ops. |
Chris Lattner | 984f38b | 2006-03-25 08:01:02 +0000 | [diff] [blame] | 167 | def VADDCUW : VXForm_1<384, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 168 | "vaddcuw $vD, $vA, $vB", VecFP, |
| 169 | [(set VRRC:$vD, |
| 170 | (int_ppc_altivec_vaddcuw VRRC:$vA, VRRC:$vB))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 171 | def VADDFP : VXForm_1<10, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 172 | "vaddfp $vD, $vA, $vB", VecFP, |
| 173 | [(set VRRC:$vD, (fadd VRRC:$vA, VRRC:$vB))]>; |
Chris Lattner | 5d72907 | 2006-03-26 02:39:02 +0000 | [diff] [blame] | 174 | |
| 175 | def VADDUBM : VXForm_1<0, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 176 | "vaddubm $vD, $vA, $vB", VecGeneral, |
| 177 | [(set VRRC:$vD, (add (v16i8 VRRC:$vA), VRRC:$vB))]>; |
| 178 | def VADDUHM : VXForm_1<64, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 179 | "vadduhm $vD, $vA, $vB", VecGeneral, |
| 180 | [(set VRRC:$vD, (add (v8i16 VRRC:$vA), VRRC:$vB))]>; |
| 181 | def VADDUWM : VXForm_1<128, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 182 | "vadduwm $vD, $vA, $vB", VecGeneral, |
| 183 | [(set VRRC:$vD, (add (v4i32 VRRC:$vA), VRRC:$vB))]>; |
| 184 | |
Chris Lattner | 984f38b | 2006-03-25 08:01:02 +0000 | [diff] [blame] | 185 | def VADDSBS : VXForm_1<768, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 186 | "vaddsbs $vD, $vA, $vB", VecFP, |
| 187 | [(set VRRC:$vD, |
| 188 | (int_ppc_altivec_vaddsbs VRRC:$vA, VRRC:$vB))]>; |
| 189 | def VADDSHS : VXForm_1<832, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 190 | "vaddshs $vD, $vA, $vB", VecFP, |
| 191 | [(set VRRC:$vD, |
| 192 | (int_ppc_altivec_vaddshs VRRC:$vA, VRRC:$vB))]>; |
| 193 | def VADDSWS : VXForm_1<896, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 194 | "vaddsws $vD, $vA, $vB", VecFP, |
| 195 | [(set VRRC:$vD, |
| 196 | (int_ppc_altivec_vaddsws VRRC:$vA, VRRC:$vB))]>; |
Chris Lattner | 5d72907 | 2006-03-26 02:39:02 +0000 | [diff] [blame] | 197 | |
Chris Lattner | 984f38b | 2006-03-25 08:01:02 +0000 | [diff] [blame] | 198 | def VADDUBS : VXForm_1<512, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 199 | "vaddubs $vD, $vA, $vB", VecFP, |
| 200 | [(set VRRC:$vD, |
| 201 | (int_ppc_altivec_vaddubs VRRC:$vA, VRRC:$vB))]>; |
| 202 | def VADDUHS : VXForm_1<576, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 203 | "vadduhs $vD, $vA, $vB", VecFP, |
| 204 | [(set VRRC:$vD, |
| 205 | (int_ppc_altivec_vadduhs VRRC:$vA, VRRC:$vB))]>; |
Chris Lattner | 984f38b | 2006-03-25 08:01:02 +0000 | [diff] [blame] | 206 | def VADDUWS : VXForm_1<640, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 207 | "vadduws $vD, $vA, $vB", VecFP, |
| 208 | [(set VRRC:$vD, |
| 209 | (int_ppc_altivec_vadduws VRRC:$vA, VRRC:$vB))]>; |
Chris Lattner | 2430a5f | 2006-03-25 22:16:05 +0000 | [diff] [blame] | 210 | def VAND : VXForm_1<1028, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 211 | "vand $vD, $vA, $vB", VecFP, |
| 212 | [(set VRRC:$vD, (and (v4i32 VRRC:$vA), VRRC:$vB))]>; |
| 213 | def VANDC : VXForm_1<1092, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 214 | "vandc $vD, $vA, $vB", VecFP, |
Chris Lattner | af9136b | 2006-03-25 23:10:40 +0000 | [diff] [blame] | 215 | [(set VRRC:$vD, (and (v4i32 VRRC:$vA), (vnot VRRC:$vB)))]>; |
Chris Lattner | 2430a5f | 2006-03-25 22:16:05 +0000 | [diff] [blame] | 216 | |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 217 | def VCFSX : VXForm_1<842, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB), |
| 218 | "vcfsx $vD, $vB, $UIMM", VecFP, |
Chris Lattner | 984f38b | 2006-03-25 08:01:02 +0000 | [diff] [blame] | 219 | [(set VRRC:$vD, |
| 220 | (int_ppc_altivec_vcfsx VRRC:$vB, imm:$UIMM))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 221 | def VCFUX : VXForm_1<778, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB), |
| 222 | "vcfux $vD, $vB, $UIMM", VecFP, |
Chris Lattner | 984f38b | 2006-03-25 08:01:02 +0000 | [diff] [blame] | 223 | [(set VRRC:$vD, |
| 224 | (int_ppc_altivec_vcfux VRRC:$vB, imm:$UIMM))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 225 | def VCTSXS : VXForm_1<970, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB), |
| 226 | "vctsxs $vD, $vB, $UIMM", VecFP, |
| 227 | []>; |
| 228 | def VCTUXS : VXForm_1<906, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB), |
| 229 | "vctuxs $vD, $vB, $UIMM", VecFP, |
| 230 | []>; |
| 231 | def VEXPTEFP : VXForm_2<394, (ops VRRC:$vD, VRRC:$vB), |
| 232 | "vexptefp $vD, $vB", VecFP, |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 233 | [(set VRRC:$vD, (int_ppc_altivec_vexptefp VRRC:$vB))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 234 | def VLOGEFP : VXForm_2<458, (ops VRRC:$vD, VRRC:$vB), |
| 235 | "vlogefp $vD, $vB", VecFP, |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 236 | [(set VRRC:$vD, (int_ppc_altivec_vlogefp VRRC:$vB))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 237 | def VMAXFP : VXForm_1<1034, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 238 | "vmaxfp $vD, $vA, $vB", VecFP, |
| 239 | []>; |
| 240 | def VMINFP : VXForm_1<1098, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 241 | "vminfp $vD, $vA, $vB", VecFP, |
| 242 | []>; |
Chris Lattner | 30a6aba | 2006-03-30 23:07:36 +0000 | [diff] [blame] | 243 | |
Chris Lattner | 3c4f4e9f | 2006-03-30 23:21:27 +0000 | [diff] [blame] | 244 | def VMRGHH : VX1_Int<76 , "vmrghh $vD, $vA, $vB", int_ppc_altivec_vmrghh>; |
| 245 | def VMRGHW : VX1_Int<140, "vmrghw $vD, $vA, $vB", int_ppc_altivec_vmrghw>; |
| 246 | def VMRGLH : VX1_Int<332, "vmrglh $vD, $vA, $vB", int_ppc_altivec_vmrglh>; |
| 247 | def VMRGLW : VX1_Int<396, "vmrglw $vD, $vA, $vB", int_ppc_altivec_vmrglw>; |
| 248 | |
Chris Lattner | 8768bf6 | 2006-03-30 23:39:06 +0000 | [diff] [blame] | 249 | def VMSUMMBM : VA1a_Int<37, "vmsummbm $vD, $vA, $vB, $vC", int_ppc_altivec_vmsummbm>; |
| 250 | def VMSUMSHM : VA1a_Int<40, "vmsumshm $vD, $vA, $vB, $vC", int_ppc_altivec_vmsumshm>; |
| 251 | def VMSUMSHS : VA1a_Int<41, "vmsumshs $vD, $vA, $vB, $vC", int_ppc_altivec_vmsumshs>; |
| 252 | def VMSUMUBM : VA1a_Int<36, "vmsumubm $vD, $vA, $vB, $vC", int_ppc_altivec_vmsumubm>; |
| 253 | def VMSUMUHM : VA1a_Int<38, "vmsumuhm $vD, $vA, $vB, $vC", int_ppc_altivec_vmsumuhm>; |
| 254 | def VMSUMUHS : VA1a_Int<39, "vmsumuhs $vD, $vA, $vB, $vC", int_ppc_altivec_vmsumuhs>; |
| 255 | |
Chris Lattner | 3c4f4e9f | 2006-03-30 23:21:27 +0000 | [diff] [blame] | 256 | def VMULESB : VX1_Int<776, "vmulesb $vD, $vA, $vB", int_ppc_altivec_vmulesb>; |
| 257 | def VMULESH : VX1_Int<840, "vmulesh $vD, $vA, $vB", int_ppc_altivec_vmulesh>; |
| 258 | def VMULEUB : VX1_Int<520, "vmuleub $vD, $vA, $vB", int_ppc_altivec_vmuleub>; |
| 259 | def VMULEUH : VX1_Int<584, "vmuleuh $vD, $vA, $vB", int_ppc_altivec_vmuleuh>; |
| 260 | def VMULOSB : VX1_Int<264, "vmulosb $vD, $vA, $vB", int_ppc_altivec_vmulosb>; |
Chris Lattner | 8768bf6 | 2006-03-30 23:39:06 +0000 | [diff] [blame] | 261 | def VMULOSH : VX1_Int<328, "vmulosh $vD, $vA, $vB", int_ppc_altivec_vmulosh>; |
| 262 | def VMULOUB : VX1_Int< 8, "vmuloub $vD, $vA, $vB", int_ppc_altivec_vmuloub>; |
| 263 | def VMULOUH : VX1_Int< 72, "vmulouh $vD, $vA, $vB", int_ppc_altivec_vmulouh>; |
Chris Lattner | 30a6aba | 2006-03-30 23:07:36 +0000 | [diff] [blame] | 264 | |
Chris Lattner | 3c4f4e9f | 2006-03-30 23:21:27 +0000 | [diff] [blame] | 265 | def VREFP : VX2_Int<266, "vrefp $vD, $vB", int_ppc_altivec_vrefp>; |
| 266 | def VRFIM : VX2_Int<714, "vrfim $vD, $vB", int_ppc_altivec_vrfim>; |
| 267 | def VRFIN : VX2_Int<522, "vrfin $vD, $vB", int_ppc_altivec_vrfin>; |
| 268 | def VRFIP : VX2_Int<650, "vrfip $vD, $vB", int_ppc_altivec_vrfip>; |
| 269 | def VRFIZ : VX2_Int<586, "vrfiz $vD, $vB", int_ppc_altivec_vrfiz>; |
| 270 | def VRSQRTEFP : VX2_Int<330, "vrsqrtefp $vD, $vB", int_ppc_altivec_vrsqrtefp>; |
| 271 | |
| 272 | def VSUBCUW : VX1_Int<74, "vsubcuw $vD, $vA, $vB", int_ppc_altivec_vsubcuw>; |
| 273 | |
| 274 | def VSUBFP : VXForm_1<74, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 275 | "vsubfp $vD, $vA, $vB", VecGeneral, |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 276 | [(set VRRC:$vD, (fsub VRRC:$vA, VRRC:$vB))]>; |
Chris Lattner | 5d72907 | 2006-03-26 02:39:02 +0000 | [diff] [blame] | 277 | def VSUBUBM : VXForm_1<1024, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 278 | "vsububm $vD, $vA, $vB", VecGeneral, |
| 279 | [(set VRRC:$vD, (sub (v16i8 VRRC:$vA), VRRC:$vB))]>; |
| 280 | def VSUBUHM : VXForm_1<1088, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 281 | "vsubuhm $vD, $vA, $vB", VecGeneral, |
| 282 | [(set VRRC:$vD, (sub (v8i16 VRRC:$vA), VRRC:$vB))]>; |
| 283 | def VSUBUWM : VXForm_1<1152, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 284 | "vsubuwm $vD, $vA, $vB", VecGeneral, |
| 285 | [(set VRRC:$vD, (sub (v4i32 VRRC:$vA), VRRC:$vB))]>; |
| 286 | |
Chris Lattner | 3c4f4e9f | 2006-03-30 23:21:27 +0000 | [diff] [blame] | 287 | def VSUBSBS : VX1_Int<1792, "vsubsbs $vD, $vA, $vB", int_ppc_altivec_vsubsbs>; |
| 288 | def VSUBSHS : VX1_Int<1856, "vsubshs $vD, $vA, $vB", int_ppc_altivec_vsubshs>; |
| 289 | def VSUBSWS : VX1_Int<1920, "vsubsws $vD, $vA, $vB", int_ppc_altivec_vsubsws>; |
| 290 | def VSUBUBS : VX1_Int<1536, "vsububs $vD, $vA, $vB", int_ppc_altivec_vsububs>; |
| 291 | def VSUBUHS : VX1_Int<1600, "vsubuhs $vD, $vA, $vB", int_ppc_altivec_vsubuhs>; |
| 292 | def VSUBUWS : VX1_Int<1664, "vsubuws $vD, $vA, $vB", int_ppc_altivec_vsubuws>; |
| 293 | def VSUMSWS : VX1_Int<1928, "vsumsws $vD, $vA, $vB", int_ppc_altivec_vsumsws>; |
| 294 | def VSUM2SWS: VX1_Int<1672, "vsum2sws $vD, $vA, $vB", int_ppc_altivec_vsum2sws>; |
| 295 | def VSUM4SBS: VX1_Int<1672, "vsum4sbs $vD, $vA, $vB", int_ppc_altivec_vsum4sbs>; |
| 296 | def VSUM4SHS: VX1_Int<1608, "vsum4shs $vD, $vA, $vB", int_ppc_altivec_vsum4shs>; |
| 297 | def VSUM4UBS: VX1_Int<1544, "vsum4ubs $vD, $vA, $vB", int_ppc_altivec_vsum4ubs>; |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 298 | |
Chris Lattner | 2430a5f | 2006-03-25 22:16:05 +0000 | [diff] [blame] | 299 | def VNOR : VXForm_1<1284, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 300 | "vnor $vD, $vA, $vB", VecFP, |
Chris Lattner | 6509ae8 | 2006-03-25 23:05:29 +0000 | [diff] [blame] | 301 | [(set VRRC:$vD, (vnot (or (v4i32 VRRC:$vA), VRRC:$vB)))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 302 | def VOR : VXForm_1<1156, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 303 | "vor $vD, $vA, $vB", VecFP, |
Chris Lattner | 2430a5f | 2006-03-25 22:16:05 +0000 | [diff] [blame] | 304 | [(set VRRC:$vD, (or (v4i32 VRRC:$vA), VRRC:$vB))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 305 | def VXOR : VXForm_1<1220, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 306 | "vxor $vD, $vA, $vB", VecFP, |
Chris Lattner | 2430a5f | 2006-03-25 22:16:05 +0000 | [diff] [blame] | 307 | [(set VRRC:$vD, (xor (v4i32 VRRC:$vA), VRRC:$vB))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 308 | |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 309 | def VRLB : VXForm_1<4, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 310 | "vrlb $vD, $vA, $vB", VecFP, |
| 311 | [(set VRRC:$vD, |
| 312 | (int_ppc_altivec_vrlb VRRC:$vA, VRRC:$vB))]>; |
| 313 | def VRLH : VXForm_1<68, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 314 | "vrlh $vD, $vA, $vB", VecFP, |
| 315 | [(set VRRC:$vD, |
| 316 | (int_ppc_altivec_vrlh VRRC:$vA, VRRC:$vB))]>; |
| 317 | def VRLW : VXForm_1<132, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 318 | "vrlw $vD, $vA, $vB", VecFP, |
| 319 | [(set VRRC:$vD, |
| 320 | (int_ppc_altivec_vrlw VRRC:$vA, VRRC:$vB))]>; |
| 321 | |
| 322 | def VSLO : VXForm_1<1036, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 323 | "vslo $vD, $vA, $vB", VecFP, |
| 324 | [(set VRRC:$vD, |
| 325 | (int_ppc_altivec_vslo VRRC:$vA, VRRC:$vB))]>; |
| 326 | def VSLB : VXForm_1<260, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 327 | "vslb $vD, $vA, $vB", VecFP, |
| 328 | [(set VRRC:$vD, |
| 329 | (int_ppc_altivec_vslb VRRC:$vA, VRRC:$vB))]>; |
| 330 | def VSLH : VXForm_1<324, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 331 | "vslh $vD, $vA, $vB", VecFP, |
| 332 | [(set VRRC:$vD, |
| 333 | (int_ppc_altivec_vslh VRRC:$vA, VRRC:$vB))]>; |
| 334 | def VSLW : VXForm_1<388, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 335 | "vslw $vD, $vA, $vB", VecFP, |
| 336 | [(set VRRC:$vD, |
| 337 | (int_ppc_altivec_vslw VRRC:$vA, VRRC:$vB))]>; |
| 338 | |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 339 | def VSPLTB : VXForm_1<524, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB), |
| 340 | "vspltb $vD, $vB, $UIMM", VecPerm, |
| 341 | []>; |
| 342 | def VSPLTH : VXForm_1<588, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB), |
| 343 | "vsplth $vD, $vB, $UIMM", VecPerm, |
| 344 | []>; |
| 345 | def VSPLTW : VXForm_1<652, (ops VRRC:$vD, u5imm:$UIMM, VRRC:$vB), |
| 346 | "vspltw $vD, $vB, $UIMM", VecPerm, |
| 347 | [(set VRRC:$vD, (vector_shuffle (v4f32 VRRC:$vB), (undef), |
| 348 | VSPLT_shuffle_mask:$UIMM))]>; |
| 349 | |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 350 | def VSR : VXForm_1<708, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 351 | "vsr $vD, $vA, $vB", VecFP, |
| 352 | [(set VRRC:$vD, |
| 353 | (int_ppc_altivec_vsr VRRC:$vA, VRRC:$vB))]>; |
| 354 | def VSRO : VXForm_1<1100, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 355 | "vsro $vD, $vA, $vB", VecFP, |
| 356 | [(set VRRC:$vD, |
| 357 | (int_ppc_altivec_vsro VRRC:$vA, VRRC:$vB))]>; |
| 358 | def VSRAB : VXForm_1<772, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 359 | "vsrab $vD, $vA, $vB", VecFP, |
| 360 | [(set VRRC:$vD, |
| 361 | (int_ppc_altivec_vsrab VRRC:$vA, VRRC:$vB))]>; |
| 362 | def VSRAH : VXForm_1<836, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 363 | "vsrah $vD, $vA, $vB", VecFP, |
| 364 | [(set VRRC:$vD, |
| 365 | (int_ppc_altivec_vsrah VRRC:$vA, VRRC:$vB))]>; |
| 366 | def VSRAW : VXForm_1<900, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 367 | "vsraw $vD, $vA, $vB", VecFP, |
| 368 | [(set VRRC:$vD, |
| 369 | (int_ppc_altivec_vsraw VRRC:$vA, VRRC:$vB))]>; |
| 370 | def VSRB : VXForm_1<516, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 371 | "vsrb $vD, $vA, $vB", VecFP, |
| 372 | [(set VRRC:$vD, |
| 373 | (int_ppc_altivec_vsrb VRRC:$vA, VRRC:$vB))]>; |
| 374 | def VSRH : VXForm_1<580, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 375 | "vsrh $vD, $vA, $vB", VecFP, |
| 376 | [(set VRRC:$vD, |
| 377 | (int_ppc_altivec_vsrh VRRC:$vA, VRRC:$vB))]>; |
| 378 | def VSRW : VXForm_1<644, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 379 | "vsrw $vD, $vA, $vB", VecFP, |
| 380 | [(set VRRC:$vD, |
| 381 | (int_ppc_altivec_vsrw VRRC:$vA, VRRC:$vB))]>; |
| 382 | |
| 383 | |
Chris Lattner | eeaf72a | 2006-03-27 03:28:57 +0000 | [diff] [blame] | 384 | def VSPLTISB : VXForm_3<780, (ops VRRC:$vD, s5imm:$SIMM), |
| 385 | "vspltisb $vD, $SIMM", VecPerm, |
| 386 | [(set VRRC:$vD, (v4f32 vecspltisb:$SIMM))]>; |
| 387 | def VSPLTISH : VXForm_3<844, (ops VRRC:$vD, s5imm:$SIMM), |
| 388 | "vspltish $vD, $SIMM", VecPerm, |
| 389 | [(set VRRC:$vD, (v4f32 vecspltish:$SIMM))]>; |
| 390 | def VSPLTISW : VXForm_3<908, (ops VRRC:$vD, s5imm:$SIMM), |
| 391 | "vspltisw $vD, $SIMM", VecPerm, |
| 392 | [(set VRRC:$vD, (v4f32 vecspltisw:$SIMM))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 393 | |
Chris Lattner | 30a6aba | 2006-03-30 23:07:36 +0000 | [diff] [blame] | 394 | // Vector Pack. |
| 395 | def VPKPX : VXForm_1<782, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 396 | "vpkpx $vD, $vA, $vB", VecFP, |
| 397 | [(set VRRC:$vD, |
| 398 | (int_ppc_altivec_vpkpx VRRC:$vA, VRRC:$vB))]>; |
| 399 | def VPKSHSS : VXForm_1<398, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 400 | "vpkshss $vD, $vA, $vB", VecFP, |
| 401 | [(set VRRC:$vD, |
| 402 | (int_ppc_altivec_vpkshss VRRC:$vA, VRRC:$vB))]>; |
| 403 | def VPKSHUS : VXForm_1<270, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 404 | "vpkshus $vD, $vA, $vB", VecFP, |
| 405 | [(set VRRC:$vD, |
| 406 | (int_ppc_altivec_vpkshus VRRC:$vA, VRRC:$vB))]>; |
| 407 | def VPKSWSS : VXForm_1<462, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 408 | "vpkswss $vD, $vA, $vB", VecFP, |
| 409 | [(set VRRC:$vD, |
| 410 | (int_ppc_altivec_vpkswss VRRC:$vA, VRRC:$vB))]>; |
| 411 | def VPKSWUS : VXForm_1<334, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 412 | "vpkswus $vD, $vA, $vB", VecFP, |
| 413 | [(set VRRC:$vD, |
| 414 | (int_ppc_altivec_vpkswus VRRC:$vA, VRRC:$vB))]>; |
| 415 | def VPKUHUM : VXForm_1<14, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 416 | "vpkuhum $vD, $vA, $vB", VecFP, |
| 417 | [/*TODO*/]>; |
| 418 | def VPKUHUS : VXForm_1<142, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 419 | "vpkuhus $vD, $vA, $vB", VecFP, |
| 420 | [(set VRRC:$vD, |
| 421 | (int_ppc_altivec_vpkuhus VRRC:$vA, VRRC:$vB))]>; |
| 422 | def VPKUWUM : VXForm_1<78, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 423 | "vpkuwum $vD, $vA, $vB", VecFP, |
| 424 | [/*TODO*/]>; |
| 425 | def VPKUWUS : VXForm_1<206, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), |
| 426 | "vpkuwus $vD, $vA, $vB", VecFP, |
| 427 | [(set VRRC:$vD, |
| 428 | (int_ppc_altivec_vpkuwus VRRC:$vA, VRRC:$vB))]>; |
| 429 | |
| 430 | // Vector Unpack. |
| 431 | def VUPKHPX : VXForm_2<846, (ops VRRC:$vD, VRRC:$vB), |
| 432 | "vupkhpx $vD, $vB", VecFP, |
| 433 | [(set VRRC:$vD, (int_ppc_altivec_vupkhpx VRRC:$vB))]>; |
| 434 | def VUPKHSB : VXForm_2<526, (ops VRRC:$vD, VRRC:$vB), |
| 435 | "vupkhsb $vD, $vB", VecFP, |
| 436 | [(set VRRC:$vD, (int_ppc_altivec_vupkhsb VRRC:$vB))]>; |
| 437 | def VUPKHSH : VXForm_2<590, (ops VRRC:$vD, VRRC:$vB), |
| 438 | "vupkhsh $vD, $vB", VecFP, |
| 439 | [(set VRRC:$vD, (int_ppc_altivec_vupkhsh VRRC:$vB))]>; |
| 440 | def VUPKLPX : VXForm_2<974, (ops VRRC:$vD, VRRC:$vB), |
| 441 | "vupklpx $vD, $vB", VecFP, |
| 442 | [(set VRRC:$vD, (int_ppc_altivec_vupklpx VRRC:$vB))]>; |
| 443 | def VUPKLSB : VXForm_2<654, (ops VRRC:$vD, VRRC:$vB), |
| 444 | "vupklsb $vD, $vB", VecFP, |
| 445 | [(set VRRC:$vD, (int_ppc_altivec_vupklsb VRRC:$vB))]>; |
| 446 | def VUPKLSH : VXForm_2<718, (ops VRRC:$vD, VRRC:$vB), |
| 447 | "vupklsh $vD, $vB", VecFP, |
| 448 | [(set VRRC:$vD, (int_ppc_altivec_vupklsh VRRC:$vB))]>; |
| 449 | |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 450 | |
Chris Lattner | b8a45c2 | 2006-03-26 04:57:17 +0000 | [diff] [blame] | 451 | // Altivec Comparisons. |
| 452 | |
Chris Lattner | 5f7b019 | 2006-03-31 05:32:57 +0000 | [diff] [blame^] | 453 | class VCMP<bits<10> xo, string asmstr, ValueType Ty> |
| 454 | : VXRForm_1<xo, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), asmstr, VecFPCompare, |
| 455 | [(set VRRC:$vD, (Ty (PPCvcmp VRRC:$vA, VRRC:$vB, xo)))]>; |
| 456 | class VCMPo<bits<10> xo, string asmstr, ValueType Ty> |
| 457 | : VXRForm_1<xo, (ops VRRC:$vD, VRRC:$vA, VRRC:$vB), asmstr, VecFPCompare, |
| 458 | [(set VRRC:$vD, (Ty (PPCvcmp_o VRRC:$vA, VRRC:$vB, xo)))]>,isVDOT; |
| 459 | |
| 460 | // f32 element comparisons.0 |
| 461 | def VCMPBFP : VCMP <966, "vcmpbfp $vD, $vA, $vB" , v4f32>; |
| 462 | def VCMPBFPo : VCMPo<966, "vcmpbfp. $vD, $vA, $vB" , v4f32>; |
| 463 | def VCMPEQFP : VCMP <198, "vcmpeqfp $vD, $vA, $vB" , v4f32>; |
| 464 | def VCMPEQFPo : VCMPo<198, "vcmpeqfp. $vD, $vA, $vB", v4f32>; |
| 465 | def VCMPGEFP : VCMP <454, "vcmpgefp $vD, $vA, $vB" , v4f32>; |
| 466 | def VCMPGEFPo : VCMPo<454, "vcmpgefp. $vD, $vA, $vB", v4f32>; |
| 467 | def VCMPGTFP : VCMP <710, "vcmpgtfp $vD, $vA, $vB" , v4f32>; |
| 468 | def VCMPGTFPo : VCMPo<710, "vcmpgtfp. $vD, $vA, $vB", v4f32>; |
Chris Lattner | b8a45c2 | 2006-03-26 04:57:17 +0000 | [diff] [blame] | 469 | |
| 470 | // i8 element comparisons. |
Chris Lattner | 5f7b019 | 2006-03-31 05:32:57 +0000 | [diff] [blame^] | 471 | def VCMPEQUB : VCMP < 6, "vcmpequb $vD, $vA, $vB" , v16i8>; |
| 472 | def VCMPEQUBo : VCMPo< 6, "vcmpequb. $vD, $vA, $vB", v16i8>; |
| 473 | def VCMPGTSB : VCMP <774, "vcmpgtsb $vD, $vA, $vB" , v16i8>; |
| 474 | def VCMPGTSBo : VCMPo<774, "vcmpgtsb. $vD, $vA, $vB", v16i8>; |
| 475 | def VCMPGTUB : VCMP <518, "vcmpgtub $vD, $vA, $vB" , v16i8>; |
| 476 | def VCMPGTUBo : VCMPo<518, "vcmpgtub. $vD, $vA, $vB", v16i8>; |
Chris Lattner | b8a45c2 | 2006-03-26 04:57:17 +0000 | [diff] [blame] | 477 | |
| 478 | // i16 element comparisons. |
Chris Lattner | 5f7b019 | 2006-03-31 05:32:57 +0000 | [diff] [blame^] | 479 | def VCMPEQUH : VCMP < 70, "vcmpequh $vD, $vA, $vB" , v8i16>; |
| 480 | def VCMPEQUHo : VCMPo< 70, "vcmpequh. $vD, $vA, $vB", v8i16>; |
| 481 | def VCMPGTSH : VCMP <838, "vcmpgtsh $vD, $vA, $vB" , v8i16>; |
| 482 | def VCMPGTSHo : VCMPo<838, "vcmpgtsh. $vD, $vA, $vB", v8i16>; |
| 483 | def VCMPGTUH : VCMP <582, "vcmpgtuh $vD, $vA, $vB" , v8i16>; |
| 484 | def VCMPGTUHo : VCMPo<582, "vcmpgtuh. $vD, $vA, $vB", v8i16>; |
Chris Lattner | b8a45c2 | 2006-03-26 04:57:17 +0000 | [diff] [blame] | 485 | |
| 486 | // i32 element comparisons. |
Chris Lattner | 5f7b019 | 2006-03-31 05:32:57 +0000 | [diff] [blame^] | 487 | def VCMPEQUW : VCMP <134, "vcmpequw $vD, $vA, $vB" , v4i32>; |
| 488 | def VCMPEQUWo : VCMPo<134, "vcmpequw. $vD, $vA, $vB", v4i32>; |
| 489 | def VCMPGTSW : VCMP <902, "vcmpgtsw $vD, $vA, $vB" , v4i32>; |
| 490 | def VCMPGTSWo : VCMPo<902, "vcmpgtsw. $vD, $vA, $vB", v4i32>; |
| 491 | def VCMPGTUW : VCMP <646, "vcmpgtuw $vD, $vA, $vB" , v4i32>; |
| 492 | def VCMPGTUWo : VCMPo<646, "vcmpgtuw. $vD, $vA, $vB", v4i32>; |
Chris Lattner | b8a45c2 | 2006-03-26 04:57:17 +0000 | [diff] [blame] | 493 | |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 494 | def V_SET0 : VXForm_setzero<1220, (ops VRRC:$vD), |
| 495 | "vxor $vD, $vD, $vD", VecFP, |
Evan Cheng | 5b6a01b | 2006-03-26 09:52:32 +0000 | [diff] [blame] | 496 | [(set VRRC:$vD, (v4f32 immAllZerosV))]>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 497 | } |
| 498 | |
| 499 | //===----------------------------------------------------------------------===// |
| 500 | // Additional Altivec Patterns |
| 501 | // |
| 502 | |
| 503 | // Undef/Zero. |
| 504 | def : Pat<(v16i8 (undef)), (v16i8 (IMPLICIT_DEF_VRRC))>; |
| 505 | def : Pat<(v8i16 (undef)), (v8i16 (IMPLICIT_DEF_VRRC))>; |
| 506 | def : Pat<(v4i32 (undef)), (v4i32 (IMPLICIT_DEF_VRRC))>; |
Evan Cheng | 5b6a01b | 2006-03-26 09:52:32 +0000 | [diff] [blame] | 507 | def : Pat<(v16i8 immAllZerosV), (v16i8 (V_SET0))>; |
| 508 | def : Pat<(v8i16 immAllZerosV), (v8i16 (V_SET0))>; |
| 509 | def : Pat<(v4i32 immAllZerosV), (v4i32 (V_SET0))>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 510 | |
| 511 | // Loads. |
| 512 | def : Pat<(v16i8 (load xoaddr:$src)), (v16i8 (LVX xoaddr:$src))>; |
| 513 | def : Pat<(v8i16 (load xoaddr:$src)), (v8i16 (LVX xoaddr:$src))>; |
| 514 | def : Pat<(v4i32 (load xoaddr:$src)), (v4i32 (LVX xoaddr:$src))>; |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 515 | def : Pat<(v4f32 (load xoaddr:$src)), (v4f32 (LVX xoaddr:$src))>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 516 | |
| 517 | // Stores. |
| 518 | def : Pat<(store (v16i8 VRRC:$rS), xoaddr:$dst), |
| 519 | (STVX (v16i8 VRRC:$rS), xoaddr:$dst)>; |
| 520 | def : Pat<(store (v8i16 VRRC:$rS), xoaddr:$dst), |
| 521 | (STVX (v8i16 VRRC:$rS), xoaddr:$dst)>; |
| 522 | def : Pat<(store (v4i32 VRRC:$rS), xoaddr:$dst), |
| 523 | (STVX (v4i32 VRRC:$rS), xoaddr:$dst)>; |
Chris Lattner | ecc219b | 2006-03-28 02:29:37 +0000 | [diff] [blame] | 524 | def : Pat<(store (v4f32 VRRC:$rS), xoaddr:$dst), |
| 525 | (STVX (v4f32 VRRC:$rS), xoaddr:$dst)>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 526 | |
| 527 | // Bit conversions. |
| 528 | def : Pat<(v16i8 (bitconvert (v8i16 VRRC:$src))), (v16i8 VRRC:$src)>; |
| 529 | def : Pat<(v16i8 (bitconvert (v4i32 VRRC:$src))), (v16i8 VRRC:$src)>; |
| 530 | def : Pat<(v16i8 (bitconvert (v4f32 VRRC:$src))), (v16i8 VRRC:$src)>; |
| 531 | |
| 532 | def : Pat<(v8i16 (bitconvert (v16i8 VRRC:$src))), (v8i16 VRRC:$src)>; |
| 533 | def : Pat<(v8i16 (bitconvert (v4i32 VRRC:$src))), (v8i16 VRRC:$src)>; |
| 534 | def : Pat<(v8i16 (bitconvert (v4f32 VRRC:$src))), (v8i16 VRRC:$src)>; |
| 535 | |
| 536 | def : Pat<(v4i32 (bitconvert (v16i8 VRRC:$src))), (v4i32 VRRC:$src)>; |
| 537 | def : Pat<(v4i32 (bitconvert (v8i16 VRRC:$src))), (v4i32 VRRC:$src)>; |
| 538 | def : Pat<(v4i32 (bitconvert (v4f32 VRRC:$src))), (v4i32 VRRC:$src)>; |
| 539 | |
| 540 | def : Pat<(v4f32 (bitconvert (v16i8 VRRC:$src))), (v4f32 VRRC:$src)>; |
| 541 | def : Pat<(v4f32 (bitconvert (v8i16 VRRC:$src))), (v4f32 VRRC:$src)>; |
| 542 | def : Pat<(v4f32 (bitconvert (v4i32 VRRC:$src))), (v4f32 VRRC:$src)>; |
| 543 | |
| 544 | // Immediate vector formation with vsplti*. |
| 545 | def : Pat<(v16i8 vecspltisb:$invec), (v16i8 (VSPLTISB vecspltisb:$invec))>; |
| 546 | def : Pat<(v16i8 vecspltish:$invec), (v16i8 (VSPLTISH vecspltish:$invec))>; |
| 547 | def : Pat<(v16i8 vecspltisw:$invec), (v16i8 (VSPLTISW vecspltisw:$invec))>; |
| 548 | |
| 549 | def : Pat<(v8i16 vecspltisb:$invec), (v8i16 (VSPLTISB vecspltisb:$invec))>; |
| 550 | def : Pat<(v8i16 vecspltish:$invec), (v8i16 (VSPLTISH vecspltish:$invec))>; |
| 551 | def : Pat<(v8i16 vecspltisw:$invec), (v8i16 (VSPLTISW vecspltisw:$invec))>; |
| 552 | |
| 553 | def : Pat<(v4i32 vecspltisb:$invec), (v4i32 (VSPLTISB vecspltisb:$invec))>; |
| 554 | def : Pat<(v4i32 vecspltish:$invec), (v4i32 (VSPLTISH vecspltish:$invec))>; |
| 555 | def : Pat<(v4i32 vecspltisw:$invec), (v4i32 (VSPLTISW vecspltisw:$invec))>; |
| 556 | |
Chris Lattner | 2430a5f | 2006-03-25 22:16:05 +0000 | [diff] [blame] | 557 | // Logical Operations |
| 558 | def : Pat<(v16i8 (and VRRC:$A, VRRC:$B)), (v16i8 (VAND VRRC:$A, VRRC:$B))>; |
| 559 | def : Pat<(v8i16 (and VRRC:$A, VRRC:$B)), (v8i16 (VAND VRRC:$A, VRRC:$B))>; |
| 560 | def : Pat<(v16i8 (or VRRC:$A, VRRC:$B)), (v16i8 (VOR VRRC:$A, VRRC:$B))>; |
| 561 | def : Pat<(v8i16 (or VRRC:$A, VRRC:$B)), (v8i16 (VOR VRRC:$A, VRRC:$B))>; |
| 562 | def : Pat<(v16i8 (xor VRRC:$A, VRRC:$B)), (v16i8 (VXOR VRRC:$A, VRRC:$B))>; |
| 563 | def : Pat<(v8i16 (xor VRRC:$A, VRRC:$B)), (v8i16 (VXOR VRRC:$A, VRRC:$B))>; |
Chris Lattner | 6509ae8 | 2006-03-25 23:05:29 +0000 | [diff] [blame] | 564 | def : Pat<(v16i8 (vnot (or VRRC:$A, VRRC:$B))),(v16i8 (VNOR VRRC:$A, VRRC:$B))>; |
| 565 | def : Pat<(v8i16 (vnot (or VRRC:$A, VRRC:$B))),(v8i16 (VNOR VRRC:$A, VRRC:$B))>; |
Chris Lattner | af9136b | 2006-03-25 23:10:40 +0000 | [diff] [blame] | 566 | def : Pat<(v16i8 (and VRRC:$A, (vnot VRRC:$B))), |
Chris Lattner | 6509ae8 | 2006-03-25 23:05:29 +0000 | [diff] [blame] | 567 | (v16i8 (VANDC VRRC:$A, VRRC:$B))>; |
Chris Lattner | af9136b | 2006-03-25 23:10:40 +0000 | [diff] [blame] | 568 | def : Pat<(v8i16 (and VRRC:$A, (vnot VRRC:$B))), |
Chris Lattner | 6509ae8 | 2006-03-25 23:05:29 +0000 | [diff] [blame] | 569 | (v8i16 (VANDC VRRC:$A, VRRC:$B))>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 570 | |
| 571 | def : Pat<(fmul VRRC:$vA, VRRC:$vB), |
| 572 | (VMADDFP VRRC:$vA, VRRC:$vB, (V_SET0))>; |
| 573 | |
| 574 | // Fused multiply add and multiply sub for packed float. These are represented |
| 575 | // separately from the real instructions above, for operations that must have |
| 576 | // the additional precision, such as Newton-Rhapson (used by divide, sqrt) |
| 577 | def : Pat<(PPCvmaddfp VRRC:$A, VRRC:$B, VRRC:$C), |
| 578 | (VMADDFP VRRC:$A, VRRC:$B, VRRC:$C)>; |
| 579 | def : Pat<(PPCvnmsubfp VRRC:$A, VRRC:$B, VRRC:$C), |
| 580 | (VNMSUBFP VRRC:$A, VRRC:$B, VRRC:$C)>; |
| 581 | |
| 582 | def : Pat<(int_ppc_altivec_vmaddfp VRRC:$A, VRRC:$B, VRRC:$C), |
| 583 | (VMADDFP VRRC:$A, VRRC:$B, VRRC:$C)>; |
| 584 | def : Pat<(int_ppc_altivec_vnmsubfp VRRC:$A, VRRC:$B, VRRC:$C), |
| 585 | (VNMSUBFP VRRC:$A, VRRC:$B, VRRC:$C)>; |
Nate Begeman | 98e70cc | 2006-03-28 04:15:58 +0000 | [diff] [blame] | 586 | def : Pat<(int_ppc_altivec_vperm VRRC:$A, VRRC:$B, VRRC:$C), |
| 587 | (VPERM VRRC:$A, VRRC:$B, VRRC:$C)>; |
Chris Lattner | b22a04d | 2006-03-25 07:51:43 +0000 | [diff] [blame] | 588 | def : Pat<(vector_shuffle (v4i32 VRRC:$vB), (undef), VSPLT_shuffle_mask:$UIMM), |
| 589 | (v4i32 (VSPLTW VSPLT_shuffle_mask:$UIMM, VRRC:$vB))>; |
| 590 | |
| 591 | def : Pat<(PPCvperm (v4i32 VRRC:$vA), VRRC:$vB, VRRC:$vC), |
| 592 | (v4i32 (VPERM VRRC:$vA, VRRC:$vB, VRRC:$vC))>; |
| 593 | |