Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 1 | //===-- SPUISelLowering.cpp - Cell SPU DAG Lowering Implementation --------===// |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2 | // The LLVM Compiler Infrastructure |
| 3 | // |
Chris Lattner | 4ee451d | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 4 | // This file is distributed under the University of Illinois Open Source |
| 5 | // License. See LICENSE.TXT for details. |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // This file implements the SPUTargetLowering class. |
| 10 | // |
| 11 | //===----------------------------------------------------------------------===// |
| 12 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 13 | #include "SPUISelLowering.h" |
| 14 | #include "SPUTargetMachine.h" |
Anton Korobeynikov | 16c29b5 | 2011-01-10 12:39:04 +0000 | [diff] [blame] | 15 | #include "SPUFrameLowering.h" |
Dan Gohman | 1e93df6 | 2010-04-17 14:41:14 +0000 | [diff] [blame] | 16 | #include "SPUMachineFunction.h" |
Chris Lattner | f014412 | 2009-07-28 03:13:23 +0000 | [diff] [blame] | 17 | #include "llvm/Constants.h" |
| 18 | #include "llvm/Function.h" |
| 19 | #include "llvm/Intrinsics.h" |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 20 | #include "llvm/CallingConv.h" |
John Thompson | 44ab89e | 2010-10-29 17:29:13 +0000 | [diff] [blame] | 21 | #include "llvm/Type.h" |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 22 | #include "llvm/CodeGen/CallingConvLower.h" |
| 23 | #include "llvm/CodeGen/MachineFrameInfo.h" |
| 24 | #include "llvm/CodeGen/MachineFunction.h" |
| 25 | #include "llvm/CodeGen/MachineInstrBuilder.h" |
Chris Lattner | 84bc542 | 2007-12-31 04:13:23 +0000 | [diff] [blame] | 26 | #include "llvm/CodeGen/MachineRegisterInfo.h" |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 27 | #include "llvm/CodeGen/SelectionDAG.h" |
Anton Korobeynikov | 362dd0b | 2010-02-15 22:37:53 +0000 | [diff] [blame] | 28 | #include "llvm/CodeGen/TargetLoweringObjectFileImpl.h" |
Chris Lattner | f014412 | 2009-07-28 03:13:23 +0000 | [diff] [blame] | 29 | #include "llvm/Target/TargetOptions.h" |
| 30 | #include "llvm/ADT/VectorExtras.h" |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 31 | #include "llvm/Support/Debug.h" |
Torok Edwin | dac237e | 2009-07-08 20:53:28 +0000 | [diff] [blame] | 32 | #include "llvm/Support/ErrorHandling.h" |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 33 | #include "llvm/Support/MathExtras.h" |
Torok Edwin | dac237e | 2009-07-08 20:53:28 +0000 | [diff] [blame] | 34 | #include "llvm/Support/raw_ostream.h" |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 35 | #include <map> |
| 36 | |
| 37 | using namespace llvm; |
| 38 | |
| 39 | // Used in getTargetNodeName() below |
| 40 | namespace { |
| 41 | std::map<unsigned, const char *> node_names; |
| 42 | |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 43 | // Byte offset of the preferred slot (counted from the MSB) |
| 44 | int prefslotOffset(EVT VT) { |
| 45 | int retval=0; |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 46 | if (VT==MVT::i1) retval=3; |
| 47 | if (VT==MVT::i8) retval=3; |
| 48 | if (VT==MVT::i16) retval=2; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 49 | |
| 50 | return retval; |
| 51 | } |
Scott Michel | 94bd57e | 2009-01-15 04:41:47 +0000 | [diff] [blame] | 52 | |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 53 | //! Expand a library call into an actual call DAG node |
| 54 | /*! |
| 55 | \note |
| 56 | This code is taken from SelectionDAGLegalize, since it is not exposed as |
| 57 | part of the LLVM SelectionDAG API. |
| 58 | */ |
| 59 | |
| 60 | SDValue |
| 61 | ExpandLibCall(RTLIB::Libcall LC, SDValue Op, SelectionDAG &DAG, |
Dan Gohman | d858e90 | 2010-04-17 15:26:15 +0000 | [diff] [blame] | 62 | bool isSigned, SDValue &Hi, const SPUTargetLowering &TLI) { |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 63 | // The input chain to this libcall is the entry node of the function. |
| 64 | // Legalizing the call will automatically add the previous call to the |
| 65 | // dependence. |
| 66 | SDValue InChain = DAG.getEntryNode(); |
| 67 | |
| 68 | TargetLowering::ArgListTy Args; |
| 69 | TargetLowering::ArgListEntry Entry; |
| 70 | for (unsigned i = 0, e = Op.getNumOperands(); i != e; ++i) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 71 | EVT ArgVT = Op.getOperand(i).getValueType(); |
Chris Lattner | db125cf | 2011-07-18 04:54:35 +0000 | [diff] [blame] | 72 | Type *ArgTy = ArgVT.getTypeForEVT(*DAG.getContext()); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 73 | Entry.Node = Op.getOperand(i); |
| 74 | Entry.Ty = ArgTy; |
| 75 | Entry.isSExt = isSigned; |
| 76 | Entry.isZExt = !isSigned; |
| 77 | Args.push_back(Entry); |
| 78 | } |
| 79 | SDValue Callee = DAG.getExternalSymbol(TLI.getLibcallName(LC), |
| 80 | TLI.getPointerTy()); |
| 81 | |
| 82 | // Splice the libcall in wherever FindInputOutputChains tells us to. |
Chris Lattner | db125cf | 2011-07-18 04:54:35 +0000 | [diff] [blame] | 83 | Type *RetTy = |
Owen Anderson | 23b9b19 | 2009-08-12 00:36:31 +0000 | [diff] [blame] | 84 | Op.getNode()->getValueType(0).getTypeForEVT(*DAG.getContext()); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 85 | std::pair<SDValue, SDValue> CallInfo = |
| 86 | TLI.LowerCallTo(InChain, RetTy, isSigned, !isSigned, false, false, |
Anton Korobeynikov | 72977a4 | 2009-08-14 20:10:52 +0000 | [diff] [blame] | 87 | 0, TLI.getLibcallCallingConv(LC), false, |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 88 | /*isReturnValueUsed=*/true, |
Bill Wendling | 46ada19 | 2010-03-02 01:55:18 +0000 | [diff] [blame] | 89 | Callee, Args, DAG, Op.getDebugLoc()); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 90 | |
| 91 | return CallInfo.first; |
| 92 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 93 | } |
| 94 | |
| 95 | SPUTargetLowering::SPUTargetLowering(SPUTargetMachine &TM) |
Chris Lattner | f014412 | 2009-07-28 03:13:23 +0000 | [diff] [blame] | 96 | : TargetLowering(TM, new TargetLoweringObjectFileELF()), |
| 97 | SPUTM(TM) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 98 | |
| 99 | // Use _setjmp/_longjmp instead of setjmp/longjmp. |
| 100 | setUseUnderscoreSetJmp(true); |
| 101 | setUseUnderscoreLongJmp(true); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 102 | |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 103 | // Set RTLIB libcall names as used by SPU: |
| 104 | setLibcallName(RTLIB::DIV_F64, "__fast_divdf3"); |
| 105 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 106 | // Set up the SPU's register classes: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 107 | addRegisterClass(MVT::i8, SPU::R8CRegisterClass); |
| 108 | addRegisterClass(MVT::i16, SPU::R16CRegisterClass); |
| 109 | addRegisterClass(MVT::i32, SPU::R32CRegisterClass); |
| 110 | addRegisterClass(MVT::i64, SPU::R64CRegisterClass); |
| 111 | addRegisterClass(MVT::f32, SPU::R32FPRegisterClass); |
| 112 | addRegisterClass(MVT::f64, SPU::R64FPRegisterClass); |
| 113 | addRegisterClass(MVT::i128, SPU::GPRCRegisterClass); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 114 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 115 | // SPU has no sign or zero extended loads for i1, i8, i16: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 116 | setLoadExtAction(ISD::EXTLOAD, MVT::i1, Promote); |
| 117 | setLoadExtAction(ISD::SEXTLOAD, MVT::i1, Promote); |
| 118 | setLoadExtAction(ISD::ZEXTLOAD, MVT::i1, Promote); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 119 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 120 | setLoadExtAction(ISD::EXTLOAD, MVT::f32, Expand); |
| 121 | setLoadExtAction(ISD::EXTLOAD, MVT::f64, Expand); |
Scott Michel | b30e8f6 | 2008-12-02 19:53:53 +0000 | [diff] [blame] | 122 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 123 | setTruncStoreAction(MVT::i128, MVT::i64, Expand); |
| 124 | setTruncStoreAction(MVT::i128, MVT::i32, Expand); |
| 125 | setTruncStoreAction(MVT::i128, MVT::i16, Expand); |
| 126 | setTruncStoreAction(MVT::i128, MVT::i8, Expand); |
Eli Friedman | 5427d71 | 2009-07-17 06:36:24 +0000 | [diff] [blame] | 127 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 128 | setTruncStoreAction(MVT::f64, MVT::f32, Expand); |
Eli Friedman | 5427d71 | 2009-07-17 06:36:24 +0000 | [diff] [blame] | 129 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 130 | // SPU constant load actions are custom lowered: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 131 | setOperationAction(ISD::ConstantFP, MVT::f32, Legal); |
| 132 | setOperationAction(ISD::ConstantFP, MVT::f64, Custom); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 133 | |
| 134 | // SPU's loads and stores have to be custom lowered: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 135 | for (unsigned sctype = (unsigned) MVT::i8; sctype < (unsigned) MVT::i128; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 136 | ++sctype) { |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 137 | MVT::SimpleValueType VT = (MVT::SimpleValueType)sctype; |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 138 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 139 | setOperationAction(ISD::LOAD, VT, Custom); |
| 140 | setOperationAction(ISD::STORE, VT, Custom); |
| 141 | setLoadExtAction(ISD::EXTLOAD, VT, Custom); |
| 142 | setLoadExtAction(ISD::ZEXTLOAD, VT, Custom); |
| 143 | setLoadExtAction(ISD::SEXTLOAD, VT, Custom); |
| 144 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 145 | for (unsigned stype = sctype - 1; stype >= (unsigned) MVT::i8; --stype) { |
| 146 | MVT::SimpleValueType StoreVT = (MVT::SimpleValueType) stype; |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 147 | setTruncStoreAction(VT, StoreVT, Expand); |
| 148 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 149 | } |
| 150 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 151 | for (unsigned sctype = (unsigned) MVT::f32; sctype < (unsigned) MVT::f64; |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 152 | ++sctype) { |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 153 | MVT::SimpleValueType VT = (MVT::SimpleValueType) sctype; |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 154 | |
| 155 | setOperationAction(ISD::LOAD, VT, Custom); |
| 156 | setOperationAction(ISD::STORE, VT, Custom); |
| 157 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 158 | for (unsigned stype = sctype - 1; stype >= (unsigned) MVT::f32; --stype) { |
| 159 | MVT::SimpleValueType StoreVT = (MVT::SimpleValueType) stype; |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 160 | setTruncStoreAction(VT, StoreVT, Expand); |
| 161 | } |
| 162 | } |
| 163 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 164 | // Expand the jumptable branches |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 165 | setOperationAction(ISD::BR_JT, MVT::Other, Expand); |
| 166 | setOperationAction(ISD::BR_CC, MVT::Other, Expand); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 167 | |
| 168 | // Custom lower SELECT_CC for most cases, but expand by default |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 169 | setOperationAction(ISD::SELECT_CC, MVT::Other, Expand); |
| 170 | setOperationAction(ISD::SELECT_CC, MVT::i8, Custom); |
| 171 | setOperationAction(ISD::SELECT_CC, MVT::i16, Custom); |
| 172 | setOperationAction(ISD::SELECT_CC, MVT::i32, Custom); |
| 173 | setOperationAction(ISD::SELECT_CC, MVT::i64, Custom); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 174 | |
| 175 | // SPU has no intrinsics for these particular operations: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 176 | setOperationAction(ISD::MEMBARRIER, MVT::Other, Expand); |
Eli Friedman | 1464846 | 2011-07-27 22:21:52 +0000 | [diff] [blame] | 177 | setOperationAction(ISD::ATOMIC_FENCE, MVT::Other, Expand); |
Andrew Lenharth | d497d9f | 2008-02-16 14:46:26 +0000 | [diff] [blame] | 178 | |
Eli Friedman | 5427d71 | 2009-07-17 06:36:24 +0000 | [diff] [blame] | 179 | // SPU has no division/remainder instructions |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 180 | setOperationAction(ISD::SREM, MVT::i8, Expand); |
| 181 | setOperationAction(ISD::UREM, MVT::i8, Expand); |
| 182 | setOperationAction(ISD::SDIV, MVT::i8, Expand); |
| 183 | setOperationAction(ISD::UDIV, MVT::i8, Expand); |
| 184 | setOperationAction(ISD::SDIVREM, MVT::i8, Expand); |
| 185 | setOperationAction(ISD::UDIVREM, MVT::i8, Expand); |
| 186 | setOperationAction(ISD::SREM, MVT::i16, Expand); |
| 187 | setOperationAction(ISD::UREM, MVT::i16, Expand); |
| 188 | setOperationAction(ISD::SDIV, MVT::i16, Expand); |
| 189 | setOperationAction(ISD::UDIV, MVT::i16, Expand); |
| 190 | setOperationAction(ISD::SDIVREM, MVT::i16, Expand); |
| 191 | setOperationAction(ISD::UDIVREM, MVT::i16, Expand); |
| 192 | setOperationAction(ISD::SREM, MVT::i32, Expand); |
| 193 | setOperationAction(ISD::UREM, MVT::i32, Expand); |
| 194 | setOperationAction(ISD::SDIV, MVT::i32, Expand); |
| 195 | setOperationAction(ISD::UDIV, MVT::i32, Expand); |
| 196 | setOperationAction(ISD::SDIVREM, MVT::i32, Expand); |
| 197 | setOperationAction(ISD::UDIVREM, MVT::i32, Expand); |
| 198 | setOperationAction(ISD::SREM, MVT::i64, Expand); |
| 199 | setOperationAction(ISD::UREM, MVT::i64, Expand); |
| 200 | setOperationAction(ISD::SDIV, MVT::i64, Expand); |
| 201 | setOperationAction(ISD::UDIV, MVT::i64, Expand); |
| 202 | setOperationAction(ISD::SDIVREM, MVT::i64, Expand); |
| 203 | setOperationAction(ISD::UDIVREM, MVT::i64, Expand); |
| 204 | setOperationAction(ISD::SREM, MVT::i128, Expand); |
| 205 | setOperationAction(ISD::UREM, MVT::i128, Expand); |
| 206 | setOperationAction(ISD::SDIV, MVT::i128, Expand); |
| 207 | setOperationAction(ISD::UDIV, MVT::i128, Expand); |
| 208 | setOperationAction(ISD::SDIVREM, MVT::i128, Expand); |
| 209 | setOperationAction(ISD::UDIVREM, MVT::i128, Expand); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 210 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 211 | // We don't support sin/cos/sqrt/fmod |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 212 | setOperationAction(ISD::FSIN , MVT::f64, Expand); |
| 213 | setOperationAction(ISD::FCOS , MVT::f64, Expand); |
| 214 | setOperationAction(ISD::FREM , MVT::f64, Expand); |
| 215 | setOperationAction(ISD::FSIN , MVT::f32, Expand); |
| 216 | setOperationAction(ISD::FCOS , MVT::f32, Expand); |
| 217 | setOperationAction(ISD::FREM , MVT::f32, Expand); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 218 | |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 219 | // Expand fsqrt to the appropriate libcall (NOTE: should use h/w fsqrt |
| 220 | // for f32!) |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 221 | setOperationAction(ISD::FSQRT, MVT::f64, Expand); |
| 222 | setOperationAction(ISD::FSQRT, MVT::f32, Expand); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 223 | |
Cameron Zwarich | 3339084 | 2011-07-08 21:39:21 +0000 | [diff] [blame] | 224 | setOperationAction(ISD::FMA, MVT::f64, Expand); |
| 225 | setOperationAction(ISD::FMA, MVT::f32, Expand); |
| 226 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 227 | setOperationAction(ISD::FCOPYSIGN, MVT::f64, Expand); |
| 228 | setOperationAction(ISD::FCOPYSIGN, MVT::f32, Expand); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 229 | |
| 230 | // SPU can do rotate right and left, so legalize it... but customize for i8 |
| 231 | // because instructions don't exist. |
Bill Wendling | 9440e35 | 2008-08-31 02:59:23 +0000 | [diff] [blame] | 232 | |
| 233 | // FIXME: Change from "expand" to appropriate type once ROTR is supported in |
| 234 | // .td files. |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 235 | setOperationAction(ISD::ROTR, MVT::i32, Expand /*Legal*/); |
| 236 | setOperationAction(ISD::ROTR, MVT::i16, Expand /*Legal*/); |
| 237 | setOperationAction(ISD::ROTR, MVT::i8, Expand /*Custom*/); |
Bill Wendling | 9440e35 | 2008-08-31 02:59:23 +0000 | [diff] [blame] | 238 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 239 | setOperationAction(ISD::ROTL, MVT::i32, Legal); |
| 240 | setOperationAction(ISD::ROTL, MVT::i16, Legal); |
| 241 | setOperationAction(ISD::ROTL, MVT::i8, Custom); |
Scott Michel | dc91bea | 2008-11-20 16:36:33 +0000 | [diff] [blame] | 242 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 243 | // SPU has no native version of shift left/right for i8 |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 244 | setOperationAction(ISD::SHL, MVT::i8, Custom); |
| 245 | setOperationAction(ISD::SRL, MVT::i8, Custom); |
| 246 | setOperationAction(ISD::SRA, MVT::i8, Custom); |
Scott Michel | 9c0c6b2 | 2008-11-21 02:56:16 +0000 | [diff] [blame] | 247 | |
Scott Michel | 02d711b | 2008-12-30 23:28:25 +0000 | [diff] [blame] | 248 | // Make these operations legal and handle them during instruction selection: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 249 | setOperationAction(ISD::SHL, MVT::i64, Legal); |
| 250 | setOperationAction(ISD::SRL, MVT::i64, Legal); |
| 251 | setOperationAction(ISD::SRA, MVT::i64, Legal); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 252 | |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 253 | // Custom lower i8, i32 and i64 multiplications |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 254 | setOperationAction(ISD::MUL, MVT::i8, Custom); |
| 255 | setOperationAction(ISD::MUL, MVT::i32, Legal); |
| 256 | setOperationAction(ISD::MUL, MVT::i64, Legal); |
Scott Michel | 9c0c6b2 | 2008-11-21 02:56:16 +0000 | [diff] [blame] | 257 | |
Eli Friedman | 6314ac2 | 2009-06-16 06:40:59 +0000 | [diff] [blame] | 258 | // Expand double-width multiplication |
| 259 | // FIXME: It would probably be reasonable to support some of these operations |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 260 | setOperationAction(ISD::UMUL_LOHI, MVT::i8, Expand); |
| 261 | setOperationAction(ISD::SMUL_LOHI, MVT::i8, Expand); |
| 262 | setOperationAction(ISD::MULHU, MVT::i8, Expand); |
| 263 | setOperationAction(ISD::MULHS, MVT::i8, Expand); |
| 264 | setOperationAction(ISD::UMUL_LOHI, MVT::i16, Expand); |
| 265 | setOperationAction(ISD::SMUL_LOHI, MVT::i16, Expand); |
| 266 | setOperationAction(ISD::MULHU, MVT::i16, Expand); |
| 267 | setOperationAction(ISD::MULHS, MVT::i16, Expand); |
| 268 | setOperationAction(ISD::UMUL_LOHI, MVT::i32, Expand); |
| 269 | setOperationAction(ISD::SMUL_LOHI, MVT::i32, Expand); |
| 270 | setOperationAction(ISD::MULHU, MVT::i32, Expand); |
| 271 | setOperationAction(ISD::MULHS, MVT::i32, Expand); |
| 272 | setOperationAction(ISD::UMUL_LOHI, MVT::i64, Expand); |
| 273 | setOperationAction(ISD::SMUL_LOHI, MVT::i64, Expand); |
| 274 | setOperationAction(ISD::MULHU, MVT::i64, Expand); |
| 275 | setOperationAction(ISD::MULHS, MVT::i64, Expand); |
Eli Friedman | 6314ac2 | 2009-06-16 06:40:59 +0000 | [diff] [blame] | 276 | |
Scott Michel | 8bf61e8 | 2008-06-02 22:18:03 +0000 | [diff] [blame] | 277 | // Need to custom handle (some) common i8, i64 math ops |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 278 | setOperationAction(ISD::ADD, MVT::i8, Custom); |
| 279 | setOperationAction(ISD::ADD, MVT::i64, Legal); |
| 280 | setOperationAction(ISD::SUB, MVT::i8, Custom); |
| 281 | setOperationAction(ISD::SUB, MVT::i64, Legal); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 282 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 283 | // SPU does not have BSWAP. It does have i32 support CTLZ. |
| 284 | // CTPOP has to be custom lowered. |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 285 | setOperationAction(ISD::BSWAP, MVT::i32, Expand); |
| 286 | setOperationAction(ISD::BSWAP, MVT::i64, Expand); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 287 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 288 | setOperationAction(ISD::CTPOP, MVT::i8, Custom); |
| 289 | setOperationAction(ISD::CTPOP, MVT::i16, Custom); |
| 290 | setOperationAction(ISD::CTPOP, MVT::i32, Custom); |
| 291 | setOperationAction(ISD::CTPOP, MVT::i64, Custom); |
| 292 | setOperationAction(ISD::CTPOP, MVT::i128, Expand); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 293 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 294 | setOperationAction(ISD::CTTZ , MVT::i8, Expand); |
| 295 | setOperationAction(ISD::CTTZ , MVT::i16, Expand); |
| 296 | setOperationAction(ISD::CTTZ , MVT::i32, Expand); |
| 297 | setOperationAction(ISD::CTTZ , MVT::i64, Expand); |
| 298 | setOperationAction(ISD::CTTZ , MVT::i128, Expand); |
Chandler Carruth | 63974b2 | 2011-12-13 01:56:10 +0000 | [diff] [blame^] | 299 | setOperationAction(ISD::CTTZ_ZERO_UNDEF, MVT::i8, Expand); |
| 300 | setOperationAction(ISD::CTTZ_ZERO_UNDEF, MVT::i16, Expand); |
| 301 | setOperationAction(ISD::CTTZ_ZERO_UNDEF, MVT::i32, Expand); |
| 302 | setOperationAction(ISD::CTTZ_ZERO_UNDEF, MVT::i64, Expand); |
| 303 | setOperationAction(ISD::CTTZ_ZERO_UNDEF, MVT::i128, Expand); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 304 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 305 | setOperationAction(ISD::CTLZ , MVT::i8, Promote); |
| 306 | setOperationAction(ISD::CTLZ , MVT::i16, Promote); |
| 307 | setOperationAction(ISD::CTLZ , MVT::i32, Legal); |
| 308 | setOperationAction(ISD::CTLZ , MVT::i64, Expand); |
| 309 | setOperationAction(ISD::CTLZ , MVT::i128, Expand); |
Chandler Carruth | 63974b2 | 2011-12-13 01:56:10 +0000 | [diff] [blame^] | 310 | setOperationAction(ISD::CTLZ_ZERO_UNDEF, MVT::i8, Expand); |
| 311 | setOperationAction(ISD::CTLZ_ZERO_UNDEF, MVT::i16, Expand); |
| 312 | setOperationAction(ISD::CTLZ_ZERO_UNDEF, MVT::i32, Expand); |
| 313 | setOperationAction(ISD::CTLZ_ZERO_UNDEF, MVT::i64, Expand); |
| 314 | setOperationAction(ISD::CTLZ_ZERO_UNDEF, MVT::i128, Expand); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 315 | |
Scott Michel | 8bf61e8 | 2008-06-02 22:18:03 +0000 | [diff] [blame] | 316 | // SPU has a version of select that implements (a&~c)|(b&c), just like |
Scott Michel | 405fba1 | 2008-03-10 23:49:09 +0000 | [diff] [blame] | 317 | // select ought to work: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 318 | setOperationAction(ISD::SELECT, MVT::i8, Legal); |
| 319 | setOperationAction(ISD::SELECT, MVT::i16, Legal); |
| 320 | setOperationAction(ISD::SELECT, MVT::i32, Legal); |
| 321 | setOperationAction(ISD::SELECT, MVT::i64, Legal); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 322 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 323 | setOperationAction(ISD::SETCC, MVT::i8, Legal); |
| 324 | setOperationAction(ISD::SETCC, MVT::i16, Legal); |
| 325 | setOperationAction(ISD::SETCC, MVT::i32, Legal); |
| 326 | setOperationAction(ISD::SETCC, MVT::i64, Legal); |
| 327 | setOperationAction(ISD::SETCC, MVT::f64, Custom); |
Scott Michel | ad2715e | 2008-03-05 23:02:02 +0000 | [diff] [blame] | 328 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 329 | // Custom lower i128 -> i64 truncates |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 330 | setOperationAction(ISD::TRUNCATE, MVT::i64, Custom); |
Scott Michel | b30e8f6 | 2008-12-02 19:53:53 +0000 | [diff] [blame] | 331 | |
Scott Michel | 77f452d | 2009-08-25 22:37:34 +0000 | [diff] [blame] | 332 | // Custom lower i32/i64 -> i128 sign extend |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 333 | setOperationAction(ISD::SIGN_EXTEND, MVT::i128, Custom); |
| 334 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 335 | setOperationAction(ISD::FP_TO_SINT, MVT::i8, Promote); |
| 336 | setOperationAction(ISD::FP_TO_UINT, MVT::i8, Promote); |
| 337 | setOperationAction(ISD::FP_TO_SINT, MVT::i16, Promote); |
| 338 | setOperationAction(ISD::FP_TO_UINT, MVT::i16, Promote); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 339 | // SPU has a legal FP -> signed INT instruction for f32, but for f64, need |
| 340 | // to expand to a libcall, hence the custom lowering: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 341 | setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom); |
| 342 | setOperationAction(ISD::FP_TO_UINT, MVT::i32, Custom); |
| 343 | setOperationAction(ISD::FP_TO_SINT, MVT::i64, Expand); |
| 344 | setOperationAction(ISD::FP_TO_UINT, MVT::i64, Expand); |
| 345 | setOperationAction(ISD::FP_TO_SINT, MVT::i128, Expand); |
| 346 | setOperationAction(ISD::FP_TO_UINT, MVT::i128, Expand); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 347 | |
| 348 | // FDIV on SPU requires custom lowering |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 349 | setOperationAction(ISD::FDIV, MVT::f64, Expand); // to libcall |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 350 | |
Scott Michel | 9de57a9 | 2009-01-26 22:33:37 +0000 | [diff] [blame] | 351 | // SPU has [U|S]INT_TO_FP for f32->i32, but not for f64->i32, f64->i64: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 352 | setOperationAction(ISD::SINT_TO_FP, MVT::i32, Custom); |
| 353 | setOperationAction(ISD::SINT_TO_FP, MVT::i16, Promote); |
| 354 | setOperationAction(ISD::SINT_TO_FP, MVT::i8, Promote); |
| 355 | setOperationAction(ISD::UINT_TO_FP, MVT::i32, Custom); |
| 356 | setOperationAction(ISD::UINT_TO_FP, MVT::i16, Promote); |
| 357 | setOperationAction(ISD::UINT_TO_FP, MVT::i8, Promote); |
| 358 | setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom); |
| 359 | setOperationAction(ISD::UINT_TO_FP, MVT::i64, Custom); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 360 | |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 361 | setOperationAction(ISD::BITCAST, MVT::i32, Legal); |
| 362 | setOperationAction(ISD::BITCAST, MVT::f32, Legal); |
| 363 | setOperationAction(ISD::BITCAST, MVT::i64, Legal); |
| 364 | setOperationAction(ISD::BITCAST, MVT::f64, Legal); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 365 | |
| 366 | // We cannot sextinreg(i1). Expand to shifts. |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 367 | setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 368 | |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 369 | // We want to legalize GlobalAddress and ConstantPool nodes into the |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 370 | // appropriate instructions to materialize the address. |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 371 | for (unsigned sctype = (unsigned) MVT::i8; sctype < (unsigned) MVT::f128; |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 372 | ++sctype) { |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 373 | MVT::SimpleValueType VT = (MVT::SimpleValueType)sctype; |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 374 | |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 375 | setOperationAction(ISD::GlobalAddress, VT, Custom); |
| 376 | setOperationAction(ISD::ConstantPool, VT, Custom); |
| 377 | setOperationAction(ISD::JumpTable, VT, Custom); |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 378 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 379 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 380 | // VASTART needs to be custom lowered to use the VarArgsFrameIndex |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 381 | setOperationAction(ISD::VASTART , MVT::Other, Custom); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 382 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 383 | // Use the default implementation. |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 384 | setOperationAction(ISD::VAARG , MVT::Other, Expand); |
| 385 | setOperationAction(ISD::VACOPY , MVT::Other, Expand); |
| 386 | setOperationAction(ISD::VAEND , MVT::Other, Expand); |
| 387 | setOperationAction(ISD::STACKSAVE , MVT::Other, Expand); |
| 388 | setOperationAction(ISD::STACKRESTORE , MVT::Other, Expand); |
| 389 | setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i32 , Expand); |
| 390 | setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i64 , Expand); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 391 | |
| 392 | // Cell SPU has instructions for converting between i64 and fp. |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 393 | setOperationAction(ISD::FP_TO_SINT, MVT::i64, Custom); |
| 394 | setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 395 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 396 | // To take advantage of the above i64 FP_TO_SINT, promote i32 FP_TO_UINT |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 397 | setOperationAction(ISD::FP_TO_UINT, MVT::i32, Promote); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 398 | |
| 399 | // BUILD_PAIR can't be handled natively, and should be expanded to shl/or |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 400 | setOperationAction(ISD::BUILD_PAIR, MVT::i64, Expand); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 401 | |
| 402 | // First set operation action for all vector types to expand. Then we |
| 403 | // will selectively turn on ones that can be effectively codegen'd. |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 404 | addRegisterClass(MVT::v16i8, SPU::VECREGRegisterClass); |
| 405 | addRegisterClass(MVT::v8i16, SPU::VECREGRegisterClass); |
| 406 | addRegisterClass(MVT::v4i32, SPU::VECREGRegisterClass); |
| 407 | addRegisterClass(MVT::v2i64, SPU::VECREGRegisterClass); |
| 408 | addRegisterClass(MVT::v4f32, SPU::VECREGRegisterClass); |
| 409 | addRegisterClass(MVT::v2f64, SPU::VECREGRegisterClass); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 410 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 411 | for (unsigned i = (unsigned)MVT::FIRST_VECTOR_VALUETYPE; |
| 412 | i <= (unsigned)MVT::LAST_VECTOR_VALUETYPE; ++i) { |
| 413 | MVT::SimpleValueType VT = (MVT::SimpleValueType)i; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 414 | |
Nadav Rotem | 34804c4 | 2011-10-04 12:05:35 +0000 | [diff] [blame] | 415 | // Set operation actions to legal types only. |
| 416 | if (!isTypeLegal(VT)) continue; |
| 417 | |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 418 | // add/sub are legal for all supported vector VT's. |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 419 | setOperationAction(ISD::ADD, VT, Legal); |
| 420 | setOperationAction(ISD::SUB, VT, Legal); |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 421 | // mul has to be custom lowered. |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 422 | setOperationAction(ISD::MUL, VT, Legal); |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 423 | |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 424 | setOperationAction(ISD::AND, VT, Legal); |
| 425 | setOperationAction(ISD::OR, VT, Legal); |
| 426 | setOperationAction(ISD::XOR, VT, Legal); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 427 | setOperationAction(ISD::LOAD, VT, Custom); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 428 | setOperationAction(ISD::SELECT, VT, Legal); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 429 | setOperationAction(ISD::STORE, VT, Custom); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 430 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 431 | // These operations need to be expanded: |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 432 | setOperationAction(ISD::SDIV, VT, Expand); |
| 433 | setOperationAction(ISD::SREM, VT, Expand); |
| 434 | setOperationAction(ISD::UDIV, VT, Expand); |
| 435 | setOperationAction(ISD::UREM, VT, Expand); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 436 | |
Nadav Rotem | 4d83b79 | 2011-10-15 20:05:17 +0000 | [diff] [blame] | 437 | // Expand all trunc stores |
| 438 | for (unsigned j = (unsigned)MVT::FIRST_VECTOR_VALUETYPE; |
| 439 | j <= (unsigned)MVT::LAST_VECTOR_VALUETYPE; ++j) { |
| 440 | MVT::SimpleValueType TargetVT = (MVT::SimpleValueType)j; |
| 441 | setTruncStoreAction(VT, TargetVT, Expand); |
| 442 | } |
| 443 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 444 | // Custom lower build_vector, constant pool spills, insert and |
| 445 | // extract vector elements: |
Nadav Rotem | 34804c4 | 2011-10-04 12:05:35 +0000 | [diff] [blame] | 446 | setOperationAction(ISD::BUILD_VECTOR, VT, Custom); |
| 447 | setOperationAction(ISD::ConstantPool, VT, Custom); |
| 448 | setOperationAction(ISD::SCALAR_TO_VECTOR, VT, Custom); |
| 449 | setOperationAction(ISD::EXTRACT_VECTOR_ELT, VT, Custom); |
| 450 | setOperationAction(ISD::INSERT_VECTOR_ELT, VT, Custom); |
| 451 | setOperationAction(ISD::VECTOR_SHUFFLE, VT, Custom); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 452 | } |
| 453 | |
Nadav Rotem | 4d83b79 | 2011-10-15 20:05:17 +0000 | [diff] [blame] | 454 | setOperationAction(ISD::SHL, MVT::v2i64, Expand); |
| 455 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 456 | setOperationAction(ISD::AND, MVT::v16i8, Custom); |
| 457 | setOperationAction(ISD::OR, MVT::v16i8, Custom); |
| 458 | setOperationAction(ISD::XOR, MVT::v16i8, Custom); |
| 459 | setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4f32, Custom); |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 460 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 461 | setOperationAction(ISD::FDIV, MVT::v4f32, Legal); |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 462 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 463 | setBooleanContents(ZeroOrNegativeOneBooleanContent); |
Duncan Sands | 28b77e9 | 2011-09-06 19:07:46 +0000 | [diff] [blame] | 464 | setBooleanVectorContents(ZeroOrNegativeOneBooleanContent); // FIXME: Is this correct? |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 465 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 466 | setStackPointerRegisterToSaveRestore(SPU::R1); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 467 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 468 | // We have target-specific dag combine patterns for the following nodes: |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 469 | setTargetDAGCombine(ISD::ADD); |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 470 | setTargetDAGCombine(ISD::ZERO_EXTEND); |
| 471 | setTargetDAGCombine(ISD::SIGN_EXTEND); |
| 472 | setTargetDAGCombine(ISD::ANY_EXTEND); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 473 | |
Eli Friedman | fc5d305 | 2011-05-06 20:34:06 +0000 | [diff] [blame] | 474 | setMinFunctionAlignment(3); |
| 475 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 476 | computeRegisterProperties(); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 477 | |
Scott Michel | e07d3de | 2008-12-09 03:37:19 +0000 | [diff] [blame] | 478 | // Set pre-RA register scheduler default to BURR, which produces slightly |
| 479 | // better code than the default (could also be TDRR, but TargetLowering.h |
| 480 | // needs a mod to support that model): |
Evan Cheng | 211ffa1 | 2010-05-19 20:19:50 +0000 | [diff] [blame] | 481 | setSchedulingPreference(Sched::RegPressure); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 482 | } |
| 483 | |
| 484 | const char * |
| 485 | SPUTargetLowering::getTargetNodeName(unsigned Opcode) const |
| 486 | { |
| 487 | if (node_names.empty()) { |
| 488 | node_names[(unsigned) SPUISD::RET_FLAG] = "SPUISD::RET_FLAG"; |
| 489 | node_names[(unsigned) SPUISD::Hi] = "SPUISD::Hi"; |
| 490 | node_names[(unsigned) SPUISD::Lo] = "SPUISD::Lo"; |
| 491 | node_names[(unsigned) SPUISD::PCRelAddr] = "SPUISD::PCRelAddr"; |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 492 | node_names[(unsigned) SPUISD::AFormAddr] = "SPUISD::AFormAddr"; |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 493 | node_names[(unsigned) SPUISD::IndirectAddr] = "SPUISD::IndirectAddr"; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 494 | node_names[(unsigned) SPUISD::LDRESULT] = "SPUISD::LDRESULT"; |
| 495 | node_names[(unsigned) SPUISD::CALL] = "SPUISD::CALL"; |
| 496 | node_names[(unsigned) SPUISD::SHUFB] = "SPUISD::SHUFB"; |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 497 | node_names[(unsigned) SPUISD::SHUFFLE_MASK] = "SPUISD::SHUFFLE_MASK"; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 498 | node_names[(unsigned) SPUISD::CNTB] = "SPUISD::CNTB"; |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 499 | node_names[(unsigned) SPUISD::PREFSLOT2VEC] = "SPUISD::PREFSLOT2VEC"; |
Scott Michel | 104de43 | 2008-11-24 17:11:17 +0000 | [diff] [blame] | 500 | node_names[(unsigned) SPUISD::VEC2PREFSLOT] = "SPUISD::VEC2PREFSLOT"; |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 501 | node_names[(unsigned) SPUISD::SHL_BITS] = "SPUISD::SHL_BITS"; |
| 502 | node_names[(unsigned) SPUISD::SHL_BYTES] = "SPUISD::SHL_BYTES"; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 503 | node_names[(unsigned) SPUISD::VEC_ROTL] = "SPUISD::VEC_ROTL"; |
| 504 | node_names[(unsigned) SPUISD::VEC_ROTR] = "SPUISD::VEC_ROTR"; |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 505 | node_names[(unsigned) SPUISD::ROTBYTES_LEFT] = "SPUISD::ROTBYTES_LEFT"; |
| 506 | node_names[(unsigned) SPUISD::ROTBYTES_LEFT_BITS] = |
| 507 | "SPUISD::ROTBYTES_LEFT_BITS"; |
Scott Michel | 8bf61e8 | 2008-06-02 22:18:03 +0000 | [diff] [blame] | 508 | node_names[(unsigned) SPUISD::SELECT_MASK] = "SPUISD::SELECT_MASK"; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 509 | node_names[(unsigned) SPUISD::SELB] = "SPUISD::SELB"; |
Scott Michel | 94bd57e | 2009-01-15 04:41:47 +0000 | [diff] [blame] | 510 | node_names[(unsigned) SPUISD::ADD64_MARKER] = "SPUISD::ADD64_MARKER"; |
| 511 | node_names[(unsigned) SPUISD::SUB64_MARKER] = "SPUISD::SUB64_MARKER"; |
| 512 | node_names[(unsigned) SPUISD::MUL64_MARKER] = "SPUISD::MUL64_MARKER"; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 513 | } |
| 514 | |
| 515 | std::map<unsigned, const char *>::iterator i = node_names.find(Opcode); |
| 516 | |
| 517 | return ((i != node_names.end()) ? i->second : 0); |
| 518 | } |
| 519 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 520 | //===----------------------------------------------------------------------===// |
| 521 | // Return the Cell SPU's SETCC result type |
| 522 | //===----------------------------------------------------------------------===// |
| 523 | |
Duncan Sands | 28b77e9 | 2011-09-06 19:07:46 +0000 | [diff] [blame] | 524 | EVT SPUTargetLowering::getSetCCResultType(EVT VT) const { |
Kalle Raiskila | 7de8101 | 2010-11-24 12:59:16 +0000 | [diff] [blame] | 525 | // i8, i16 and i32 are valid SETCC result types |
| 526 | MVT::SimpleValueType retval; |
| 527 | |
| 528 | switch(VT.getSimpleVT().SimpleTy){ |
| 529 | case MVT::i1: |
| 530 | case MVT::i8: |
| 531 | retval = MVT::i8; break; |
| 532 | case MVT::i16: |
| 533 | retval = MVT::i16; break; |
| 534 | case MVT::i32: |
| 535 | default: |
| 536 | retval = MVT::i32; |
| 537 | } |
| 538 | return retval; |
Scott Michel | 78c47fa | 2008-03-10 16:58:52 +0000 | [diff] [blame] | 539 | } |
| 540 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 541 | //===----------------------------------------------------------------------===// |
| 542 | // Calling convention code: |
| 543 | //===----------------------------------------------------------------------===// |
| 544 | |
| 545 | #include "SPUGenCallingConv.inc" |
| 546 | |
| 547 | //===----------------------------------------------------------------------===// |
| 548 | // LowerOperation implementation |
| 549 | //===----------------------------------------------------------------------===// |
| 550 | |
| 551 | /// Custom lower loads for CellSPU |
| 552 | /*! |
| 553 | All CellSPU loads and stores are aligned to 16-byte boundaries, so for elements |
| 554 | within a 16-byte block, we have to rotate to extract the requested element. |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 555 | |
| 556 | For extending loads, we also want to ensure that the following sequence is |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 557 | emitted, e.g. for MVT::f32 extending load to MVT::f64: |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 558 | |
| 559 | \verbatim |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 560 | %1 v16i8,ch = load |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 561 | %2 v16i8,ch = rotate %1 |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 562 | %3 v4f8, ch = bitconvert %2 |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 563 | %4 f32 = vec2perfslot %3 |
| 564 | %5 f64 = fp_extend %4 |
| 565 | \endverbatim |
| 566 | */ |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 567 | static SDValue |
| 568 | LowerLOAD(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 569 | LoadSDNode *LN = cast<LoadSDNode>(Op); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 570 | SDValue the_chain = LN->getChain(); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 571 | EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(); |
| 572 | EVT InVT = LN->getMemoryVT(); |
| 573 | EVT OutVT = Op.getValueType(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 574 | ISD::LoadExtType ExtType = LN->getExtensionType(); |
| 575 | unsigned alignment = LN->getAlignment(); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 576 | int pso = prefslotOffset(InVT); |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 577 | DebugLoc dl = Op.getDebugLoc(); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 578 | EVT vecVT = InVT.isVector()? InVT: EVT::getVectorVT(*DAG.getContext(), InVT, |
| 579 | (128 / InVT.getSizeInBits())); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 580 | |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 581 | // two sanity checks |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 582 | assert( LN->getAddressingMode() == ISD::UNINDEXED |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 583 | && "we should get only UNINDEXED adresses"); |
| 584 | // clean aligned loads can be selected as-is |
Kalle Raiskila | 8702e8b | 2011-01-17 11:59:20 +0000 | [diff] [blame] | 585 | if (InVT.getSizeInBits() == 128 && (alignment%16) == 0) |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 586 | return SDValue(); |
| 587 | |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 588 | // Get pointerinfos to the memory chunk(s) that contain the data to load |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 589 | uint64_t mpi_offset = LN->getPointerInfo().Offset; |
| 590 | mpi_offset -= mpi_offset%16; |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 591 | MachinePointerInfo lowMemPtr(LN->getPointerInfo().V, mpi_offset); |
| 592 | MachinePointerInfo highMemPtr(LN->getPointerInfo().V, mpi_offset+16); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 593 | |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 594 | SDValue result; |
| 595 | SDValue basePtr = LN->getBasePtr(); |
| 596 | SDValue rotate; |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 597 | |
Kalle Raiskila | 8702e8b | 2011-01-17 11:59:20 +0000 | [diff] [blame] | 598 | if ((alignment%16) == 0) { |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 599 | ConstantSDNode *CN; |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 600 | |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 601 | // Special cases for a known aligned load to simplify the base pointer |
| 602 | // and the rotation amount: |
| 603 | if (basePtr.getOpcode() == ISD::ADD |
| 604 | && (CN = dyn_cast<ConstantSDNode > (basePtr.getOperand(1))) != 0) { |
| 605 | // Known offset into basePtr |
| 606 | int64_t offset = CN->getSExtValue(); |
| 607 | int64_t rotamt = int64_t((offset & 0xf) - pso); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 608 | |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 609 | if (rotamt < 0) |
| 610 | rotamt += 16; |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 611 | |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 612 | rotate = DAG.getConstant(rotamt, MVT::i16); |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 613 | |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 614 | // Simplify the base pointer for this case: |
| 615 | basePtr = basePtr.getOperand(0); |
| 616 | if ((offset & ~0xf) > 0) { |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 617 | basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 618 | basePtr, |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 619 | DAG.getConstant((offset & ~0xf), PtrVT)); |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 620 | } |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 621 | } else if ((basePtr.getOpcode() == SPUISD::AFormAddr) |
| 622 | || (basePtr.getOpcode() == SPUISD::IndirectAddr |
| 623 | && basePtr.getOperand(0).getOpcode() == SPUISD::Hi |
| 624 | && basePtr.getOperand(1).getOpcode() == SPUISD::Lo)) { |
| 625 | // Plain aligned a-form address: rotate into preferred slot |
| 626 | // Same for (SPUindirect (SPUhi ...), (SPUlo ...)) |
| 627 | int64_t rotamt = -pso; |
| 628 | if (rotamt < 0) |
| 629 | rotamt += 16; |
| 630 | rotate = DAG.getConstant(rotamt, MVT::i16); |
| 631 | } else { |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 632 | // Offset the rotate amount by the basePtr and the preferred slot |
| 633 | // byte offset |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 634 | int64_t rotamt = -pso; |
| 635 | if (rotamt < 0) |
| 636 | rotamt += 16; |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 637 | rotate = DAG.getNode(ISD::ADD, dl, PtrVT, |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 638 | basePtr, |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 639 | DAG.getConstant(rotamt, PtrVT)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 640 | } |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 641 | } else { |
| 642 | // Unaligned load: must be more pessimistic about addressing modes: |
| 643 | if (basePtr.getOpcode() == ISD::ADD) { |
| 644 | MachineFunction &MF = DAG.getMachineFunction(); |
| 645 | MachineRegisterInfo &RegInfo = MF.getRegInfo(); |
| 646 | unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass); |
| 647 | SDValue Flag; |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 648 | |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 649 | SDValue Op0 = basePtr.getOperand(0); |
| 650 | SDValue Op1 = basePtr.getOperand(1); |
| 651 | |
| 652 | if (isa<ConstantSDNode>(Op1)) { |
| 653 | // Convert the (add <ptr>, <const>) to an indirect address contained |
| 654 | // in a register. Note that this is done because we need to avoid |
| 655 | // creating a 0(reg) d-form address due to the SPU's block loads. |
| 656 | basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1); |
| 657 | the_chain = DAG.getCopyToReg(the_chain, dl, VReg, basePtr, Flag); |
| 658 | basePtr = DAG.getCopyFromReg(the_chain, dl, VReg, PtrVT); |
| 659 | } else { |
| 660 | // Convert the (add <arg1>, <arg2>) to an indirect address, which |
| 661 | // will likely be lowered as a reg(reg) x-form address. |
| 662 | basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1); |
| 663 | } |
| 664 | } else { |
| 665 | basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, |
| 666 | basePtr, |
| 667 | DAG.getConstant(0, PtrVT)); |
| 668 | } |
| 669 | |
| 670 | // Offset the rotate amount by the basePtr and the preferred slot |
| 671 | // byte offset |
| 672 | rotate = DAG.getNode(ISD::ADD, dl, PtrVT, |
| 673 | basePtr, |
| 674 | DAG.getConstant(-pso, PtrVT)); |
| 675 | } |
| 676 | |
| 677 | // Do the load as a i128 to allow possible shifting |
| 678 | SDValue low = DAG.getLoad(MVT::i128, dl, the_chain, basePtr, |
| 679 | lowMemPtr, |
Pete Cooper | d752e0f | 2011-11-08 18:42:53 +0000 | [diff] [blame] | 680 | LN->isVolatile(), LN->isNonTemporal(), false, 16); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 681 | |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 682 | // When the size is not greater than alignment we get all data with just |
| 683 | // one load |
| 684 | if (alignment >= InVT.getSizeInBits()/8) { |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 685 | // Update the chain |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 686 | the_chain = low.getValue(1); |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 687 | |
| 688 | // Rotate into the preferred slot: |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 689 | result = DAG.getNode(SPUISD::ROTBYTES_LEFT, dl, MVT::i128, |
| 690 | low.getValue(0), rotate); |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 691 | |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 692 | // Convert the loaded v16i8 vector to the appropriate vector type |
| 693 | // specified by the operand: |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 694 | EVT vecVT = EVT::getVectorVT(*DAG.getContext(), |
Owen Anderson | 23b9b19 | 2009-08-12 00:36:31 +0000 | [diff] [blame] | 695 | InVT, (128 / InVT.getSizeInBits())); |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 696 | result = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, InVT, |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 697 | DAG.getNode(ISD::BITCAST, dl, vecVT, result)); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 698 | } |
| 699 | // When alignment is less than the size, we might need (known only at |
| 700 | // run-time) two loads |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 701 | // TODO: if the memory address is composed only from constants, we have |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 702 | // extra kowledge, and might avoid the second load |
| 703 | else { |
| 704 | // storage position offset from lower 16 byte aligned memory chunk |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 705 | SDValue offset = DAG.getNode(ISD::AND, dl, MVT::i32, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 706 | basePtr, DAG.getConstant( 0xf, MVT::i32 ) ); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 707 | // get a registerfull of ones. (this implementation is a workaround: LLVM |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 708 | // cannot handle 128 bit signed int constants) |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 709 | SDValue ones = DAG.getConstant(-1, MVT::v4i32 ); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 710 | ones = DAG.getNode(ISD::BITCAST, dl, MVT::i128, ones); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 711 | |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 712 | SDValue high = DAG.getLoad(MVT::i128, dl, the_chain, |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 713 | DAG.getNode(ISD::ADD, dl, PtrVT, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 714 | basePtr, |
| 715 | DAG.getConstant(16, PtrVT)), |
| 716 | highMemPtr, |
Pete Cooper | d752e0f | 2011-11-08 18:42:53 +0000 | [diff] [blame] | 717 | LN->isVolatile(), LN->isNonTemporal(), false, |
| 718 | 16); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 719 | |
| 720 | the_chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, low.getValue(1), |
| 721 | high.getValue(1)); |
| 722 | |
| 723 | // Shift the (possible) high part right to compensate the misalignemnt. |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 724 | // if there is no highpart (i.e. value is i64 and offset is 4), this |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 725 | // will zero out the high value. |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 726 | high = DAG.getNode(SPUISD::SRL_BYTES, dl, MVT::i128, high, |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 727 | DAG.getNode(ISD::SUB, dl, MVT::i32, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 728 | DAG.getConstant( 16, MVT::i32), |
| 729 | offset |
| 730 | )); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 731 | |
Chris Lattner | 7a2bdde | 2011-04-15 05:18:47 +0000 | [diff] [blame] | 732 | // Shift the low similarly |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 733 | // TODO: add SPUISD::SHL_BYTES |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 734 | low = DAG.getNode(SPUISD::SHL_BYTES, dl, MVT::i128, low, offset ); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 735 | |
| 736 | // Merge the two parts |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 737 | result = DAG.getNode(ISD::BITCAST, dl, vecVT, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 738 | DAG.getNode(ISD::OR, dl, MVT::i128, low, high)); |
| 739 | |
| 740 | if (!InVT.isVector()) { |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 741 | result = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, InVT, result ); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 742 | } |
| 743 | |
| 744 | } |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 745 | // Handle extending loads by extending the scalar result: |
| 746 | if (ExtType == ISD::SEXTLOAD) { |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 747 | result = DAG.getNode(ISD::SIGN_EXTEND, dl, OutVT, result); |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 748 | } else if (ExtType == ISD::ZEXTLOAD) { |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 749 | result = DAG.getNode(ISD::ZERO_EXTEND, dl, OutVT, result); |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 750 | } else if (ExtType == ISD::EXTLOAD) { |
| 751 | unsigned NewOpc = ISD::ANY_EXTEND; |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 752 | |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 753 | if (OutVT.isFloatingPoint()) |
Scott Michel | 19c10e6 | 2009-01-26 03:37:41 +0000 | [diff] [blame] | 754 | NewOpc = ISD::FP_EXTEND; |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 755 | |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 756 | result = DAG.getNode(NewOpc, dl, OutVT, result); |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 757 | } |
| 758 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 759 | SDVTList retvts = DAG.getVTList(OutVT, MVT::Other); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 760 | SDValue retops[2] = { |
Scott Michel | 58c5818 | 2008-01-17 20:38:41 +0000 | [diff] [blame] | 761 | result, |
Scott Michel | 7f9ba9b | 2008-01-30 02:55:46 +0000 | [diff] [blame] | 762 | the_chain |
Scott Michel | 58c5818 | 2008-01-17 20:38:41 +0000 | [diff] [blame] | 763 | }; |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 764 | |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 765 | result = DAG.getNode(SPUISD::LDRESULT, dl, retvts, |
Scott Michel | 58c5818 | 2008-01-17 20:38:41 +0000 | [diff] [blame] | 766 | retops, sizeof(retops) / sizeof(retops[0])); |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 767 | return result; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 768 | } |
| 769 | |
| 770 | /// Custom lower stores for CellSPU |
| 771 | /*! |
| 772 | All CellSPU stores are aligned to 16-byte boundaries, so for elements |
| 773 | within a 16-byte block, we have to generate a shuffle to insert the |
| 774 | requested element into its place, then store the resulting block. |
| 775 | */ |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 776 | static SDValue |
| 777 | LowerSTORE(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 778 | StoreSDNode *SN = cast<StoreSDNode>(Op); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 779 | SDValue Value = SN->getValue(); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 780 | EVT VT = Value.getValueType(); |
| 781 | EVT StVT = (!SN->isTruncatingStore() ? VT : SN->getMemoryVT()); |
| 782 | EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(); |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 783 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 784 | unsigned alignment = SN->getAlignment(); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 785 | SDValue result; |
| 786 | EVT vecVT = StVT.isVector()? StVT: EVT::getVectorVT(*DAG.getContext(), StVT, |
| 787 | (128 / StVT.getSizeInBits())); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 788 | // Get pointerinfos to the memory chunk(s) that contain the data to load |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 789 | uint64_t mpi_offset = SN->getPointerInfo().Offset; |
| 790 | mpi_offset -= mpi_offset%16; |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 791 | MachinePointerInfo lowMemPtr(SN->getPointerInfo().V, mpi_offset); |
| 792 | MachinePointerInfo highMemPtr(SN->getPointerInfo().V, mpi_offset+16); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 793 | |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 794 | |
| 795 | // two sanity checks |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 796 | assert( SN->getAddressingMode() == ISD::UNINDEXED |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 797 | && "we should get only UNINDEXED adresses"); |
| 798 | // clean aligned loads can be selected as-is |
Kalle Raiskila | 8702e8b | 2011-01-17 11:59:20 +0000 | [diff] [blame] | 799 | if (StVT.getSizeInBits() == 128 && (alignment%16) == 0) |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 800 | return SDValue(); |
| 801 | |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 802 | SDValue alignLoadVec; |
| 803 | SDValue basePtr = SN->getBasePtr(); |
| 804 | SDValue the_chain = SN->getChain(); |
| 805 | SDValue insertEltOffs; |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 806 | |
Kalle Raiskila | 8702e8b | 2011-01-17 11:59:20 +0000 | [diff] [blame] | 807 | if ((alignment%16) == 0) { |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 808 | ConstantSDNode *CN; |
| 809 | // Special cases for a known aligned load to simplify the base pointer |
| 810 | // and insertion byte: |
| 811 | if (basePtr.getOpcode() == ISD::ADD |
| 812 | && (CN = dyn_cast<ConstantSDNode>(basePtr.getOperand(1))) != 0) { |
| 813 | // Known offset into basePtr |
| 814 | int64_t offset = CN->getSExtValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 815 | |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 816 | // Simplify the base pointer for this case: |
| 817 | basePtr = basePtr.getOperand(0); |
| 818 | insertEltOffs = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, |
| 819 | basePtr, |
| 820 | DAG.getConstant((offset & 0xf), PtrVT)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 821 | |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 822 | if ((offset & ~0xf) > 0) { |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 823 | basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 824 | basePtr, |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 825 | DAG.getConstant((offset & ~0xf), PtrVT)); |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 826 | } |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 827 | } else { |
| 828 | // Otherwise, assume it's at byte 0 of basePtr |
| 829 | insertEltOffs = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, |
| 830 | basePtr, |
| 831 | DAG.getConstant(0, PtrVT)); |
| 832 | basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 833 | basePtr, |
| 834 | DAG.getConstant(0, PtrVT)); |
| 835 | } |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 836 | } else { |
| 837 | // Unaligned load: must be more pessimistic about addressing modes: |
| 838 | if (basePtr.getOpcode() == ISD::ADD) { |
| 839 | MachineFunction &MF = DAG.getMachineFunction(); |
| 840 | MachineRegisterInfo &RegInfo = MF.getRegInfo(); |
| 841 | unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass); |
| 842 | SDValue Flag; |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 843 | |
Kalle Raiskila | 38e0c9b | 2010-11-15 10:12:32 +0000 | [diff] [blame] | 844 | SDValue Op0 = basePtr.getOperand(0); |
| 845 | SDValue Op1 = basePtr.getOperand(1); |
| 846 | |
| 847 | if (isa<ConstantSDNode>(Op1)) { |
| 848 | // Convert the (add <ptr>, <const>) to an indirect address contained |
| 849 | // in a register. Note that this is done because we need to avoid |
| 850 | // creating a 0(reg) d-form address due to the SPU's block loads. |
| 851 | basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1); |
| 852 | the_chain = DAG.getCopyToReg(the_chain, dl, VReg, basePtr, Flag); |
| 853 | basePtr = DAG.getCopyFromReg(the_chain, dl, VReg, PtrVT); |
| 854 | } else { |
| 855 | // Convert the (add <arg1>, <arg2>) to an indirect address, which |
| 856 | // will likely be lowered as a reg(reg) x-form address. |
| 857 | basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1); |
| 858 | } |
| 859 | } else { |
| 860 | basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, |
| 861 | basePtr, |
| 862 | DAG.getConstant(0, PtrVT)); |
| 863 | } |
| 864 | |
| 865 | // Insertion point is solely determined by basePtr's contents |
| 866 | insertEltOffs = DAG.getNode(ISD::ADD, dl, PtrVT, |
| 867 | basePtr, |
| 868 | DAG.getConstant(0, PtrVT)); |
| 869 | } |
| 870 | |
| 871 | // Load the lower part of the memory to which to store. |
| 872 | SDValue low = DAG.getLoad(vecVT, dl, the_chain, basePtr, |
Pete Cooper | d752e0f | 2011-11-08 18:42:53 +0000 | [diff] [blame] | 873 | lowMemPtr, SN->isVolatile(), SN->isNonTemporal(), |
| 874 | false, 16); |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 875 | |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 876 | // if we don't need to store over the 16 byte boundary, one store suffices |
| 877 | if (alignment >= StVT.getSizeInBits()/8) { |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 878 | // Update the chain |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 879 | the_chain = low.getValue(1); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 880 | |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 881 | LoadSDNode *LN = cast<LoadSDNode>(low); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 882 | SDValue theValue = SN->getValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 883 | |
| 884 | if (StVT != VT |
Scott Michel | 7f9ba9b | 2008-01-30 02:55:46 +0000 | [diff] [blame] | 885 | && (theValue.getOpcode() == ISD::AssertZext |
| 886 | || theValue.getOpcode() == ISD::AssertSext)) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 887 | // Drill down and get the value for zero- and sign-extended |
| 888 | // quantities |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 889 | theValue = theValue.getOperand(0); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 890 | } |
| 891 | |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 892 | // If the base pointer is already a D-form address, then just create |
| 893 | // a new D-form address with a slot offset and the orignal base pointer. |
| 894 | // Otherwise generate a D-form address with the slot offset relative |
| 895 | // to the stack pointer, which is always aligned. |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 896 | #if !defined(NDEBUG) |
| 897 | if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) { |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 898 | errs() << "CellSPU LowerSTORE: basePtr = "; |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 899 | basePtr.getNode()->dump(&DAG); |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 900 | errs() << "\n"; |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 901 | } |
| 902 | #endif |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 903 | |
Kalle Raiskila | f53fdc2 | 2010-08-24 11:05:51 +0000 | [diff] [blame] | 904 | SDValue insertEltOp = DAG.getNode(SPUISD::SHUFFLE_MASK, dl, vecVT, |
| 905 | insertEltOffs); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 906 | SDValue vectorizeOp = DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, vecVT, |
Kalle Raiskila | f53fdc2 | 2010-08-24 11:05:51 +0000 | [diff] [blame] | 907 | theValue); |
| 908 | |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 909 | result = DAG.getNode(SPUISD::SHUFB, dl, vecVT, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 910 | vectorizeOp, low, |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 911 | DAG.getNode(ISD::BITCAST, dl, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 912 | MVT::v4i32, insertEltOp)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 913 | |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 914 | result = DAG.getStore(the_chain, dl, result, basePtr, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 915 | lowMemPtr, |
David Greene | 73657df | 2010-02-15 16:55:58 +0000 | [diff] [blame] | 916 | LN->isVolatile(), LN->isNonTemporal(), |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 917 | 16); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 918 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 919 | } |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 920 | // do the store when it might cross the 16 byte memory access boundary. |
| 921 | else { |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 922 | // TODO issue a warning if SN->isVolatile()== true? This is likely not |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 923 | // what the user wanted. |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 924 | |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 925 | // address offset from nearest lower 16byte alinged address |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 926 | SDValue offset = DAG.getNode(ISD::AND, dl, MVT::i32, |
| 927 | SN->getBasePtr(), |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 928 | DAG.getConstant(0xf, MVT::i32)); |
| 929 | // 16 - offset |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 930 | SDValue offset_compl = DAG.getNode(ISD::SUB, dl, MVT::i32, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 931 | DAG.getConstant( 16, MVT::i32), |
| 932 | offset); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 933 | // 16 - sizeof(Value) |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 934 | SDValue surplus = DAG.getNode(ISD::SUB, dl, MVT::i32, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 935 | DAG.getConstant( 16, MVT::i32), |
| 936 | DAG.getConstant( VT.getSizeInBits()/8, |
| 937 | MVT::i32)); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 938 | // get a registerfull of ones |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 939 | SDValue ones = DAG.getConstant(-1, MVT::v4i32); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 940 | ones = DAG.getNode(ISD::BITCAST, dl, MVT::i128, ones); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 941 | |
| 942 | // Create the 128 bit masks that have ones where the data to store is |
| 943 | // located. |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 944 | SDValue lowmask, himask; |
| 945 | // if the value to store don't fill up the an entire 128 bits, zero |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 946 | // out the last bits of the mask so that only the value we want to store |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 947 | // is masked. |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 948 | // this is e.g. in the case of store i32, align 2 |
| 949 | if (!VT.isVector()){ |
| 950 | Value = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, Value); |
| 951 | lowmask = DAG.getNode(SPUISD::SRL_BYTES, dl, MVT::i128, ones, surplus); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 952 | lowmask = DAG.getNode(SPUISD::SHL_BYTES, dl, MVT::i128, lowmask, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 953 | surplus); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 954 | Value = DAG.getNode(ISD::BITCAST, dl, MVT::i128, Value); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 955 | Value = DAG.getNode(ISD::AND, dl, MVT::i128, Value, lowmask); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 956 | |
Torok Edwin | dac237e | 2009-07-08 20:53:28 +0000 | [diff] [blame] | 957 | } |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 958 | else { |
| 959 | lowmask = ones; |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 960 | Value = DAG.getNode(ISD::BITCAST, dl, MVT::i128, Value); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 961 | } |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 962 | // this will zero, if there are no data that goes to the high quad |
| 963 | himask = DAG.getNode(SPUISD::SHL_BYTES, dl, MVT::i128, lowmask, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 964 | offset_compl); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 965 | lowmask = DAG.getNode(SPUISD::SRL_BYTES, dl, MVT::i128, lowmask, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 966 | offset); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 967 | |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 968 | // Load in the old data and zero out the parts that will be overwritten with |
| 969 | // the new data to store. |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 970 | SDValue hi = DAG.getLoad(MVT::i128, dl, the_chain, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 971 | DAG.getNode(ISD::ADD, dl, PtrVT, basePtr, |
| 972 | DAG.getConstant( 16, PtrVT)), |
| 973 | highMemPtr, |
Pete Cooper | d752e0f | 2011-11-08 18:42:53 +0000 | [diff] [blame] | 974 | SN->isVolatile(), SN->isNonTemporal(), |
| 975 | false, 16); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 976 | the_chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, low.getValue(1), |
| 977 | hi.getValue(1)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 978 | |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 979 | low = DAG.getNode(ISD::AND, dl, MVT::i128, |
| 980 | DAG.getNode( ISD::BITCAST, dl, MVT::i128, low), |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 981 | DAG.getNode( ISD::XOR, dl, MVT::i128, lowmask, ones)); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 982 | hi = DAG.getNode(ISD::AND, dl, MVT::i128, |
| 983 | DAG.getNode( ISD::BITCAST, dl, MVT::i128, hi), |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 984 | DAG.getNode( ISD::XOR, dl, MVT::i128, himask, ones)); |
| 985 | |
| 986 | // Shift the Value to store into place. rlow contains the parts that go to |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 987 | // the lower memory chunk, rhi has the parts that go to the upper one. |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 988 | SDValue rlow = DAG.getNode(SPUISD::SRL_BYTES, dl, MVT::i128, Value, offset); |
| 989 | rlow = DAG.getNode(ISD::AND, dl, MVT::i128, rlow, lowmask); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 990 | SDValue rhi = DAG.getNode(SPUISD::SHL_BYTES, dl, MVT::i128, Value, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 991 | offset_compl); |
| 992 | |
| 993 | // Merge the old data and the new data and store the results |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 994 | // Need to convert vectors here to integer as 'OR'ing floats assert |
| 995 | rlow = DAG.getNode(ISD::OR, dl, MVT::i128, |
| 996 | DAG.getNode(ISD::BITCAST, dl, MVT::i128, low), |
| 997 | DAG.getNode(ISD::BITCAST, dl, MVT::i128, rlow)); |
| 998 | rhi = DAG.getNode(ISD::OR, dl, MVT::i128, |
| 999 | DAG.getNode(ISD::BITCAST, dl, MVT::i128, hi), |
| 1000 | DAG.getNode(ISD::BITCAST, dl, MVT::i128, rhi)); |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 1001 | |
| 1002 | low = DAG.getStore(the_chain, dl, rlow, basePtr, |
| 1003 | lowMemPtr, |
| 1004 | SN->isVolatile(), SN->isNonTemporal(), 16); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1005 | hi = DAG.getStore(the_chain, dl, rhi, |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 1006 | DAG.getNode(ISD::ADD, dl, PtrVT, basePtr, |
| 1007 | DAG.getConstant( 16, PtrVT)), |
| 1008 | highMemPtr, |
| 1009 | SN->isVolatile(), SN->isNonTemporal(), 16); |
| 1010 | result = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, low.getValue(0), |
| 1011 | hi.getValue(0)); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1012 | } |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 1013 | |
| 1014 | return result; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1015 | } |
| 1016 | |
Scott Michel | 94bd57e | 2009-01-15 04:41:47 +0000 | [diff] [blame] | 1017 | //! Generate the address of a constant pool entry. |
Dan Gohman | 7db949d | 2009-08-07 01:32:21 +0000 | [diff] [blame] | 1018 | static SDValue |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1019 | LowerConstantPool(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1020 | EVT PtrVT = Op.getValueType(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1021 | ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(Op); |
Dan Gohman | 46510a7 | 2010-04-15 01:51:59 +0000 | [diff] [blame] | 1022 | const Constant *C = CP->getConstVal(); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1023 | SDValue CPI = DAG.getTargetConstantPool(C, PtrVT, CP->getAlignment()); |
| 1024 | SDValue Zero = DAG.getConstant(0, PtrVT); |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 1025 | const TargetMachine &TM = DAG.getTarget(); |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1026 | // FIXME there is no actual debug info here |
| 1027 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1028 | |
| 1029 | if (TM.getRelocationModel() == Reloc::Static) { |
| 1030 | if (!ST->usingLargeMem()) { |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1031 | // Just return the SDValue with the constant pool address in it. |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1032 | return DAG.getNode(SPUISD::AFormAddr, dl, PtrVT, CPI, Zero); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1033 | } else { |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1034 | SDValue Hi = DAG.getNode(SPUISD::Hi, dl, PtrVT, CPI, Zero); |
| 1035 | SDValue Lo = DAG.getNode(SPUISD::Lo, dl, PtrVT, CPI, Zero); |
| 1036 | return DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Hi, Lo); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1037 | } |
| 1038 | } |
| 1039 | |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 1040 | llvm_unreachable("LowerConstantPool: Relocation model other than static" |
Torok Edwin | 481d15a | 2009-07-14 12:22:58 +0000 | [diff] [blame] | 1041 | " not supported."); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1042 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1043 | } |
| 1044 | |
Scott Michel | 94bd57e | 2009-01-15 04:41:47 +0000 | [diff] [blame] | 1045 | //! Alternate entry point for generating the address of a constant pool entry |
| 1046 | SDValue |
| 1047 | SPU::LowerConstantPool(SDValue Op, SelectionDAG &DAG, const SPUTargetMachine &TM) { |
| 1048 | return ::LowerConstantPool(Op, DAG, TM.getSubtargetImpl()); |
| 1049 | } |
| 1050 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1051 | static SDValue |
| 1052 | LowerJumpTable(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1053 | EVT PtrVT = Op.getValueType(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1054 | JumpTableSDNode *JT = cast<JumpTableSDNode>(Op); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1055 | SDValue JTI = DAG.getTargetJumpTable(JT->getIndex(), PtrVT); |
| 1056 | SDValue Zero = DAG.getConstant(0, PtrVT); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1057 | const TargetMachine &TM = DAG.getTarget(); |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1058 | // FIXME there is no actual debug info here |
| 1059 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1060 | |
| 1061 | if (TM.getRelocationModel() == Reloc::Static) { |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 1062 | if (!ST->usingLargeMem()) { |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1063 | return DAG.getNode(SPUISD::AFormAddr, dl, PtrVT, JTI, Zero); |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 1064 | } else { |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1065 | SDValue Hi = DAG.getNode(SPUISD::Hi, dl, PtrVT, JTI, Zero); |
| 1066 | SDValue Lo = DAG.getNode(SPUISD::Lo, dl, PtrVT, JTI, Zero); |
| 1067 | return DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Hi, Lo); |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 1068 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1069 | } |
| 1070 | |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 1071 | llvm_unreachable("LowerJumpTable: Relocation model other than static" |
Torok Edwin | 481d15a | 2009-07-14 12:22:58 +0000 | [diff] [blame] | 1072 | " not supported."); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1073 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1074 | } |
| 1075 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1076 | static SDValue |
| 1077 | LowerGlobalAddress(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1078 | EVT PtrVT = Op.getValueType(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1079 | GlobalAddressSDNode *GSDN = cast<GlobalAddressSDNode>(Op); |
Dan Gohman | 46510a7 | 2010-04-15 01:51:59 +0000 | [diff] [blame] | 1080 | const GlobalValue *GV = GSDN->getGlobal(); |
Devang Patel | 0d881da | 2010-07-06 22:08:15 +0000 | [diff] [blame] | 1081 | SDValue GA = DAG.getTargetGlobalAddress(GV, Op.getDebugLoc(), |
| 1082 | PtrVT, GSDN->getOffset()); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1083 | const TargetMachine &TM = DAG.getTarget(); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1084 | SDValue Zero = DAG.getConstant(0, PtrVT); |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1085 | // FIXME there is no actual debug info here |
| 1086 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1087 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1088 | if (TM.getRelocationModel() == Reloc::Static) { |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 1089 | if (!ST->usingLargeMem()) { |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1090 | return DAG.getNode(SPUISD::AFormAddr, dl, PtrVT, GA, Zero); |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 1091 | } else { |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1092 | SDValue Hi = DAG.getNode(SPUISD::Hi, dl, PtrVT, GA, Zero); |
| 1093 | SDValue Lo = DAG.getNode(SPUISD::Lo, dl, PtrVT, GA, Zero); |
| 1094 | return DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Hi, Lo); |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 1095 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1096 | } else { |
Chris Lattner | 75361b6 | 2010-04-07 22:58:41 +0000 | [diff] [blame] | 1097 | report_fatal_error("LowerGlobalAddress: Relocation model other than static" |
Torok Edwin | dac237e | 2009-07-08 20:53:28 +0000 | [diff] [blame] | 1098 | "not supported."); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1099 | /*NOTREACHED*/ |
| 1100 | } |
| 1101 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1102 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1103 | } |
| 1104 | |
Nate Begeman | ccef580 | 2008-02-14 18:43:04 +0000 | [diff] [blame] | 1105 | //! Custom lower double precision floating point constants |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1106 | static SDValue |
| 1107 | LowerConstantFP(SDValue Op, SelectionDAG &DAG) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1108 | EVT VT = Op.getValueType(); |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1109 | // FIXME there is no actual debug info here |
| 1110 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1111 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1112 | if (VT == MVT::f64) { |
Scott Michel | 1a6cdb6 | 2008-12-01 17:56:02 +0000 | [diff] [blame] | 1113 | ConstantFPSDNode *FP = cast<ConstantFPSDNode>(Op.getNode()); |
| 1114 | |
| 1115 | assert((FP != 0) && |
| 1116 | "LowerConstantFP: Node is not ConstantFPSDNode"); |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 1117 | |
Scott Michel | 170783a | 2007-12-19 20:15:47 +0000 | [diff] [blame] | 1118 | uint64_t dbits = DoubleToBits(FP->getValueAPF().convertToDouble()); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1119 | SDValue T = DAG.getConstant(dbits, MVT::i64); |
| 1120 | SDValue Tvec = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v2i64, T, T); |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1121 | return DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT, |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1122 | DAG.getNode(ISD::BITCAST, dl, MVT::v2f64, Tvec)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1123 | } |
| 1124 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1125 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1126 | } |
| 1127 | |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1128 | SDValue |
| 1129 | SPUTargetLowering::LowerFormalArguments(SDValue Chain, |
Sandeep Patel | 65c3c8f | 2009-09-02 08:44:58 +0000 | [diff] [blame] | 1130 | CallingConv::ID CallConv, bool isVarArg, |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1131 | const SmallVectorImpl<ISD::InputArg> |
| 1132 | &Ins, |
| 1133 | DebugLoc dl, SelectionDAG &DAG, |
Dan Gohman | d858e90 | 2010-04-17 15:26:15 +0000 | [diff] [blame] | 1134 | SmallVectorImpl<SDValue> &InVals) |
| 1135 | const { |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1136 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1137 | MachineFunction &MF = DAG.getMachineFunction(); |
| 1138 | MachineFrameInfo *MFI = MF.getFrameInfo(); |
Chris Lattner | 84bc542 | 2007-12-31 04:13:23 +0000 | [diff] [blame] | 1139 | MachineRegisterInfo &RegInfo = MF.getRegInfo(); |
Dan Gohman | 1e93df6 | 2010-04-17 14:41:14 +0000 | [diff] [blame] | 1140 | SPUFunctionInfo *FuncInfo = MF.getInfo<SPUFunctionInfo>(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1141 | |
Anton Korobeynikov | 16c29b5 | 2011-01-10 12:39:04 +0000 | [diff] [blame] | 1142 | unsigned ArgOffset = SPUFrameLowering::minStackSize(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1143 | unsigned ArgRegIdx = 0; |
Anton Korobeynikov | 16c29b5 | 2011-01-10 12:39:04 +0000 | [diff] [blame] | 1144 | unsigned StackSlotSize = SPUFrameLowering::stackSlotSize(); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1145 | |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1146 | EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1147 | |
Kalle Raiskila | d258c49 | 2010-07-08 21:15:22 +0000 | [diff] [blame] | 1148 | SmallVector<CCValAssign, 16> ArgLocs; |
Eric Christopher | 471e422 | 2011-06-08 23:55:35 +0000 | [diff] [blame] | 1149 | CCState CCInfo(CallConv, isVarArg, DAG.getMachineFunction(), |
| 1150 | getTargetMachine(), ArgLocs, *DAG.getContext()); |
Kalle Raiskila | d258c49 | 2010-07-08 21:15:22 +0000 | [diff] [blame] | 1151 | // FIXME: allow for other calling conventions |
| 1152 | CCInfo.AnalyzeFormalArguments(Ins, CCC_SPU); |
| 1153 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1154 | // Add DAG nodes to load the arguments or copy them out of registers. |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1155 | for (unsigned ArgNo = 0, e = Ins.size(); ArgNo != e; ++ArgNo) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1156 | EVT ObjectVT = Ins[ArgNo].VT; |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 1157 | unsigned ObjSize = ObjectVT.getSizeInBits()/8; |
Scott Michel | d976c21 | 2008-10-30 01:51:48 +0000 | [diff] [blame] | 1158 | SDValue ArgVal; |
Kalle Raiskila | d258c49 | 2010-07-08 21:15:22 +0000 | [diff] [blame] | 1159 | CCValAssign &VA = ArgLocs[ArgNo]; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1160 | |
Kalle Raiskila | d258c49 | 2010-07-08 21:15:22 +0000 | [diff] [blame] | 1161 | if (VA.isRegLoc()) { |
Scott Michel | d976c21 | 2008-10-30 01:51:48 +0000 | [diff] [blame] | 1162 | const TargetRegisterClass *ArgRegClass; |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1163 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1164 | switch (ObjectVT.getSimpleVT().SimpleTy) { |
Benjamin Kramer | 1bd7335 | 2010-04-08 10:44:28 +0000 | [diff] [blame] | 1165 | default: |
| 1166 | report_fatal_error("LowerFormalArguments Unhandled argument type: " + |
| 1167 | Twine(ObjectVT.getEVTString())); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1168 | case MVT::i8: |
Scott Michel | 9c0c6b2 | 2008-11-21 02:56:16 +0000 | [diff] [blame] | 1169 | ArgRegClass = &SPU::R8CRegClass; |
| 1170 | break; |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1171 | case MVT::i16: |
Scott Michel | 9c0c6b2 | 2008-11-21 02:56:16 +0000 | [diff] [blame] | 1172 | ArgRegClass = &SPU::R16CRegClass; |
| 1173 | break; |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1174 | case MVT::i32: |
Scott Michel | 9c0c6b2 | 2008-11-21 02:56:16 +0000 | [diff] [blame] | 1175 | ArgRegClass = &SPU::R32CRegClass; |
| 1176 | break; |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1177 | case MVT::i64: |
Scott Michel | 9c0c6b2 | 2008-11-21 02:56:16 +0000 | [diff] [blame] | 1178 | ArgRegClass = &SPU::R64CRegClass; |
| 1179 | break; |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1180 | case MVT::i128: |
Scott Michel | dd95009 | 2009-01-06 03:36:14 +0000 | [diff] [blame] | 1181 | ArgRegClass = &SPU::GPRCRegClass; |
| 1182 | break; |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1183 | case MVT::f32: |
Scott Michel | 9c0c6b2 | 2008-11-21 02:56:16 +0000 | [diff] [blame] | 1184 | ArgRegClass = &SPU::R32FPRegClass; |
| 1185 | break; |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1186 | case MVT::f64: |
Scott Michel | 9c0c6b2 | 2008-11-21 02:56:16 +0000 | [diff] [blame] | 1187 | ArgRegClass = &SPU::R64FPRegClass; |
| 1188 | break; |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1189 | case MVT::v2f64: |
| 1190 | case MVT::v4f32: |
| 1191 | case MVT::v2i64: |
| 1192 | case MVT::v4i32: |
| 1193 | case MVT::v8i16: |
| 1194 | case MVT::v16i8: |
Scott Michel | 9c0c6b2 | 2008-11-21 02:56:16 +0000 | [diff] [blame] | 1195 | ArgRegClass = &SPU::VECREGRegClass; |
| 1196 | break; |
Scott Michel | d976c21 | 2008-10-30 01:51:48 +0000 | [diff] [blame] | 1197 | } |
| 1198 | |
| 1199 | unsigned VReg = RegInfo.createVirtualRegister(ArgRegClass); |
Kalle Raiskila | d258c49 | 2010-07-08 21:15:22 +0000 | [diff] [blame] | 1200 | RegInfo.addLiveIn(VA.getLocReg(), VReg); |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1201 | ArgVal = DAG.getCopyFromReg(Chain, dl, VReg, ObjectVT); |
Scott Michel | d976c21 | 2008-10-30 01:51:48 +0000 | [diff] [blame] | 1202 | ++ArgRegIdx; |
| 1203 | } else { |
| 1204 | // We need to load the argument to a virtual register if we determined |
| 1205 | // above that we ran out of physical registers of the appropriate type |
| 1206 | // or we're forced to do vararg |
Evan Cheng | ed2ae13 | 2010-07-03 00:40:23 +0000 | [diff] [blame] | 1207 | int FI = MFI->CreateFixedObject(ObjSize, ArgOffset, true); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1208 | SDValue FIN = DAG.getFrameIndex(FI, PtrVT); |
Chris Lattner | e863903 | 2010-09-21 06:22:23 +0000 | [diff] [blame] | 1209 | ArgVal = DAG.getLoad(ObjectVT, dl, Chain, FIN, MachinePointerInfo(), |
Pete Cooper | d752e0f | 2011-11-08 18:42:53 +0000 | [diff] [blame] | 1210 | false, false, false, 0); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1211 | ArgOffset += StackSlotSize; |
| 1212 | } |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1213 | |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1214 | InVals.push_back(ArgVal); |
Scott Michel | d976c21 | 2008-10-30 01:51:48 +0000 | [diff] [blame] | 1215 | // Update the chain |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1216 | Chain = ArgVal.getOperand(0); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1217 | } |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1218 | |
Scott Michel | d976c21 | 2008-10-30 01:51:48 +0000 | [diff] [blame] | 1219 | // vararg handling: |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1220 | if (isVarArg) { |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1221 | // FIXME: we should be able to query the argument registers from |
| 1222 | // tablegen generated code. |
Kalle Raiskila | d258c49 | 2010-07-08 21:15:22 +0000 | [diff] [blame] | 1223 | static const unsigned ArgRegs[] = { |
| 1224 | SPU::R3, SPU::R4, SPU::R5, SPU::R6, SPU::R7, SPU::R8, SPU::R9, |
| 1225 | SPU::R10, SPU::R11, SPU::R12, SPU::R13, SPU::R14, SPU::R15, SPU::R16, |
| 1226 | SPU::R17, SPU::R18, SPU::R19, SPU::R20, SPU::R21, SPU::R22, SPU::R23, |
| 1227 | SPU::R24, SPU::R25, SPU::R26, SPU::R27, SPU::R28, SPU::R29, SPU::R30, |
| 1228 | SPU::R31, SPU::R32, SPU::R33, SPU::R34, SPU::R35, SPU::R36, SPU::R37, |
| 1229 | SPU::R38, SPU::R39, SPU::R40, SPU::R41, SPU::R42, SPU::R43, SPU::R44, |
| 1230 | SPU::R45, SPU::R46, SPU::R47, SPU::R48, SPU::R49, SPU::R50, SPU::R51, |
| 1231 | SPU::R52, SPU::R53, SPU::R54, SPU::R55, SPU::R56, SPU::R57, SPU::R58, |
| 1232 | SPU::R59, SPU::R60, SPU::R61, SPU::R62, SPU::R63, SPU::R64, SPU::R65, |
| 1233 | SPU::R66, SPU::R67, SPU::R68, SPU::R69, SPU::R70, SPU::R71, SPU::R72, |
| 1234 | SPU::R73, SPU::R74, SPU::R75, SPU::R76, SPU::R77, SPU::R78, SPU::R79 |
| 1235 | }; |
| 1236 | // size of ArgRegs array |
| 1237 | unsigned NumArgRegs = 77; |
| 1238 | |
Scott Michel | d976c21 | 2008-10-30 01:51:48 +0000 | [diff] [blame] | 1239 | // We will spill (79-3)+1 registers to the stack |
| 1240 | SmallVector<SDValue, 79-3+1> MemOps; |
| 1241 | |
| 1242 | // Create the frame slot |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1243 | for (; ArgRegIdx != NumArgRegs; ++ArgRegIdx) { |
Dan Gohman | 1e93df6 | 2010-04-17 14:41:14 +0000 | [diff] [blame] | 1244 | FuncInfo->setVarArgsFrameIndex( |
Evan Cheng | ed2ae13 | 2010-07-03 00:40:23 +0000 | [diff] [blame] | 1245 | MFI->CreateFixedObject(StackSlotSize, ArgOffset, true)); |
Dan Gohman | 1e93df6 | 2010-04-17 14:41:14 +0000 | [diff] [blame] | 1246 | SDValue FIN = DAG.getFrameIndex(FuncInfo->getVarArgsFrameIndex(), PtrVT); |
Cameron Zwarich | 055cdfc | 2011-05-19 04:44:19 +0000 | [diff] [blame] | 1247 | unsigned VReg = MF.addLiveIn(ArgRegs[ArgRegIdx], &SPU::VECREGRegClass); |
Chris Lattner | e27e02b | 2010-03-29 17:38:47 +0000 | [diff] [blame] | 1248 | SDValue ArgVal = DAG.getRegister(VReg, MVT::v16i8); |
Chris Lattner | 6229d0a | 2010-09-21 18:41:36 +0000 | [diff] [blame] | 1249 | SDValue Store = DAG.getStore(Chain, dl, ArgVal, FIN, MachinePointerInfo(), |
David Greene | 73657df | 2010-02-15 16:55:58 +0000 | [diff] [blame] | 1250 | false, false, 0); |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1251 | Chain = Store.getOperand(0); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1252 | MemOps.push_back(Store); |
Scott Michel | d976c21 | 2008-10-30 01:51:48 +0000 | [diff] [blame] | 1253 | |
| 1254 | // Increment address by stack slot size for the next stored argument |
| 1255 | ArgOffset += StackSlotSize; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1256 | } |
| 1257 | if (!MemOps.empty()) |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1258 | Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1259 | &MemOps[0], MemOps.size()); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1260 | } |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1261 | |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1262 | return Chain; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1263 | } |
| 1264 | |
| 1265 | /// isLSAAddress - Return the immediate to use if the specified |
| 1266 | /// value is representable as a LSA address. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1267 | static SDNode *isLSAAddress(SDValue Op, SelectionDAG &DAG) { |
Scott Michel | 19fd42a | 2008-11-11 03:06:06 +0000 | [diff] [blame] | 1268 | ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1269 | if (!C) return 0; |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1270 | |
Dan Gohman | f5aeb1a | 2008-09-12 16:56:44 +0000 | [diff] [blame] | 1271 | int Addr = C->getZExtValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1272 | if ((Addr & 3) != 0 || // Low 2 bits are implicitly zero. |
| 1273 | (Addr << 14 >> 14) != Addr) |
| 1274 | return 0; // Top 14 bits have to be sext of immediate. |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1275 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1276 | return DAG.getConstant((int)C->getZExtValue() >> 2, MVT::i32).getNode(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1277 | } |
| 1278 | |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1279 | SDValue |
Evan Cheng | 022d9e1 | 2010-02-02 23:55:14 +0000 | [diff] [blame] | 1280 | SPUTargetLowering::LowerCall(SDValue Chain, SDValue Callee, |
Sandeep Patel | 65c3c8f | 2009-09-02 08:44:58 +0000 | [diff] [blame] | 1281 | CallingConv::ID CallConv, bool isVarArg, |
Evan Cheng | 0c439eb | 2010-01-27 00:07:07 +0000 | [diff] [blame] | 1282 | bool &isTailCall, |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1283 | const SmallVectorImpl<ISD::OutputArg> &Outs, |
Dan Gohman | c940365 | 2010-07-07 15:54:55 +0000 | [diff] [blame] | 1284 | const SmallVectorImpl<SDValue> &OutVals, |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1285 | const SmallVectorImpl<ISD::InputArg> &Ins, |
| 1286 | DebugLoc dl, SelectionDAG &DAG, |
Dan Gohman | d858e90 | 2010-04-17 15:26:15 +0000 | [diff] [blame] | 1287 | SmallVectorImpl<SDValue> &InVals) const { |
Evan Cheng | 0c439eb | 2010-01-27 00:07:07 +0000 | [diff] [blame] | 1288 | // CellSPU target does not yet support tail call optimization. |
| 1289 | isTailCall = false; |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1290 | |
| 1291 | const SPUSubtarget *ST = SPUTM.getSubtargetImpl(); |
| 1292 | unsigned NumOps = Outs.size(); |
Anton Korobeynikov | 16c29b5 | 2011-01-10 12:39:04 +0000 | [diff] [blame] | 1293 | unsigned StackSlotSize = SPUFrameLowering::stackSlotSize(); |
Kalle Raiskila | d258c49 | 2010-07-08 21:15:22 +0000 | [diff] [blame] | 1294 | |
| 1295 | SmallVector<CCValAssign, 16> ArgLocs; |
Eric Christopher | 471e422 | 2011-06-08 23:55:35 +0000 | [diff] [blame] | 1296 | CCState CCInfo(CallConv, isVarArg, DAG.getMachineFunction(), |
| 1297 | getTargetMachine(), ArgLocs, *DAG.getContext()); |
Kalle Raiskila | d258c49 | 2010-07-08 21:15:22 +0000 | [diff] [blame] | 1298 | // FIXME: allow for other calling conventions |
| 1299 | CCInfo.AnalyzeCallOperands(Outs, CCC_SPU); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1300 | |
Kalle Raiskila | d258c49 | 2010-07-08 21:15:22 +0000 | [diff] [blame] | 1301 | const unsigned NumArgRegs = ArgLocs.size(); |
| 1302 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1303 | |
| 1304 | // Handy pointer type |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1305 | EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1306 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1307 | // Set up a copy of the stack pointer for use loading and storing any |
| 1308 | // arguments that may not fit in the registers available for argument |
| 1309 | // passing. |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1310 | SDValue StackPtr = DAG.getRegister(SPU::R1, MVT::i32); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1311 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1312 | // Figure out which arguments are going to go in registers, and which in |
| 1313 | // memory. |
Anton Korobeynikov | 16c29b5 | 2011-01-10 12:39:04 +0000 | [diff] [blame] | 1314 | unsigned ArgOffset = SPUFrameLowering::minStackSize(); // Just below [LR] |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1315 | unsigned ArgRegIdx = 0; |
| 1316 | |
| 1317 | // Keep track of registers passing arguments |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1318 | std::vector<std::pair<unsigned, SDValue> > RegsToPass; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1319 | // And the arguments passed on the stack |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1320 | SmallVector<SDValue, 8> MemOpChains; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1321 | |
Kalle Raiskila | d258c49 | 2010-07-08 21:15:22 +0000 | [diff] [blame] | 1322 | for (; ArgRegIdx != NumOps; ++ArgRegIdx) { |
| 1323 | SDValue Arg = OutVals[ArgRegIdx]; |
| 1324 | CCValAssign &VA = ArgLocs[ArgRegIdx]; |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1325 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1326 | // PtrOff will be used to store the current argument to the stack if a |
| 1327 | // register cannot be found for it. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1328 | SDValue PtrOff = DAG.getConstant(ArgOffset, StackPtr.getValueType()); |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 1329 | PtrOff = DAG.getNode(ISD::ADD, dl, PtrVT, StackPtr, PtrOff); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1330 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1331 | switch (Arg.getValueType().getSimpleVT().SimpleTy) { |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 1332 | default: llvm_unreachable("Unexpected ValueType for argument!"); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1333 | case MVT::i8: |
| 1334 | case MVT::i16: |
| 1335 | case MVT::i32: |
| 1336 | case MVT::i64: |
| 1337 | case MVT::i128: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1338 | case MVT::f32: |
| 1339 | case MVT::f64: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1340 | case MVT::v2i64: |
| 1341 | case MVT::v2f64: |
| 1342 | case MVT::v4f32: |
| 1343 | case MVT::v4i32: |
| 1344 | case MVT::v8i16: |
| 1345 | case MVT::v16i8: |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1346 | if (ArgRegIdx != NumArgRegs) { |
Kalle Raiskila | d258c49 | 2010-07-08 21:15:22 +0000 | [diff] [blame] | 1347 | RegsToPass.push_back(std::make_pair(VA.getLocReg(), Arg)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1348 | } else { |
Chris Lattner | 6229d0a | 2010-09-21 18:41:36 +0000 | [diff] [blame] | 1349 | MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, |
| 1350 | MachinePointerInfo(), |
David Greene | 73657df | 2010-02-15 16:55:58 +0000 | [diff] [blame] | 1351 | false, false, 0)); |
Scott Michel | 7f9ba9b | 2008-01-30 02:55:46 +0000 | [diff] [blame] | 1352 | ArgOffset += StackSlotSize; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1353 | } |
| 1354 | break; |
| 1355 | } |
| 1356 | } |
| 1357 | |
Bill Wendling | ce90c24 | 2009-12-28 01:31:11 +0000 | [diff] [blame] | 1358 | // Accumulate how many bytes are to be pushed on the stack, including the |
| 1359 | // linkage area, and parameter passing area. According to the SPU ABI, |
| 1360 | // we minimally need space for [LR] and [SP]. |
Anton Korobeynikov | 16c29b5 | 2011-01-10 12:39:04 +0000 | [diff] [blame] | 1361 | unsigned NumStackBytes = ArgOffset - SPUFrameLowering::minStackSize(); |
Bill Wendling | ce90c24 | 2009-12-28 01:31:11 +0000 | [diff] [blame] | 1362 | |
| 1363 | // Insert a call sequence start |
Chris Lattner | e563bbc | 2008-10-11 22:08:30 +0000 | [diff] [blame] | 1364 | Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumStackBytes, |
| 1365 | true)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1366 | |
| 1367 | if (!MemOpChains.empty()) { |
| 1368 | // Adjust the stack pointer for the stack arguments. |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1369 | Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1370 | &MemOpChains[0], MemOpChains.size()); |
| 1371 | } |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1372 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1373 | // Build a sequence of copy-to-reg nodes chained together with token chain |
| 1374 | // and flag operands which copy the outgoing args into the appropriate regs. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1375 | SDValue InFlag; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1376 | for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i) { |
Scott Michel | 6e1d147 | 2009-03-16 18:47:25 +0000 | [diff] [blame] | 1377 | Chain = DAG.getCopyToReg(Chain, dl, RegsToPass[i].first, |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 1378 | RegsToPass[i].second, InFlag); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1379 | InFlag = Chain.getValue(1); |
| 1380 | } |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1381 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1382 | SmallVector<SDValue, 8> Ops; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1383 | unsigned CallOpc = SPUISD::CALL; |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1384 | |
Bill Wendling | 056292f | 2008-09-16 21:48:12 +0000 | [diff] [blame] | 1385 | // If the callee is a GlobalAddress/ExternalSymbol node (quite common, every |
| 1386 | // direct call is) turn it into a TargetGlobalAddress/TargetExternalSymbol |
| 1387 | // node so that legalize doesn't hack it. |
Scott Michel | 19fd42a | 2008-11-11 03:06:06 +0000 | [diff] [blame] | 1388 | if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee)) { |
Dan Gohman | 46510a7 | 2010-04-15 01:51:59 +0000 | [diff] [blame] | 1389 | const GlobalValue *GV = G->getGlobal(); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1390 | EVT CalleeVT = Callee.getValueType(); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1391 | SDValue Zero = DAG.getConstant(0, PtrVT); |
Devang Patel | 0d881da | 2010-07-06 22:08:15 +0000 | [diff] [blame] | 1392 | SDValue GA = DAG.getTargetGlobalAddress(GV, dl, CalleeVT); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1393 | |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 1394 | if (!ST->usingLargeMem()) { |
| 1395 | // Turn calls to targets that are defined (i.e., have bodies) into BRSL |
| 1396 | // style calls, otherwise, external symbols are BRASL calls. This assumes |
| 1397 | // that declared/defined symbols are in the same compilation unit and can |
| 1398 | // be reached through PC-relative jumps. |
| 1399 | // |
| 1400 | // NOTE: |
| 1401 | // This may be an unsafe assumption for JIT and really large compilation |
| 1402 | // units. |
| 1403 | if (GV->isDeclaration()) { |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1404 | Callee = DAG.getNode(SPUISD::AFormAddr, dl, CalleeVT, GA, Zero); |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 1405 | } else { |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1406 | Callee = DAG.getNode(SPUISD::PCRelAddr, dl, CalleeVT, GA, Zero); |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 1407 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1408 | } else { |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 1409 | // "Large memory" mode: Turn all calls into indirect calls with a X-form |
| 1410 | // address pairs: |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1411 | Callee = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, GA, Zero); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1412 | } |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 1413 | } else if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(Callee)) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1414 | EVT CalleeVT = Callee.getValueType(); |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 1415 | SDValue Zero = DAG.getConstant(0, PtrVT); |
| 1416 | SDValue ExtSym = DAG.getTargetExternalSymbol(S->getSymbol(), |
| 1417 | Callee.getValueType()); |
| 1418 | |
| 1419 | if (!ST->usingLargeMem()) { |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1420 | Callee = DAG.getNode(SPUISD::AFormAddr, dl, CalleeVT, ExtSym, Zero); |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 1421 | } else { |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 1422 | Callee = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, ExtSym, Zero); |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 1423 | } |
| 1424 | } else if (SDNode *Dest = isLSAAddress(Callee, DAG)) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1425 | // If this is an absolute destination address that appears to be a legal |
| 1426 | // local store address, use the munged value. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1427 | Callee = SDValue(Dest, 0); |
Scott Michel | 9de5d0d | 2008-01-11 02:53:15 +0000 | [diff] [blame] | 1428 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1429 | |
| 1430 | Ops.push_back(Chain); |
| 1431 | Ops.push_back(Callee); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1432 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1433 | // Add argument registers to the end of the list so that they are known live |
| 1434 | // into the call. |
| 1435 | for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i) |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1436 | Ops.push_back(DAG.getRegister(RegsToPass[i].first, |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1437 | RegsToPass[i].second.getValueType())); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1438 | |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 1439 | if (InFlag.getNode()) |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1440 | Ops.push_back(InFlag); |
Duncan Sands | 4bdcb61 | 2008-07-02 17:40:58 +0000 | [diff] [blame] | 1441 | // Returns a chain and a flag for retval copy to use. |
Chris Lattner | f1b4eaf | 2010-12-21 02:38:05 +0000 | [diff] [blame] | 1442 | Chain = DAG.getNode(CallOpc, dl, DAG.getVTList(MVT::Other, MVT::Glue), |
Duncan Sands | 4bdcb61 | 2008-07-02 17:40:58 +0000 | [diff] [blame] | 1443 | &Ops[0], Ops.size()); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1444 | InFlag = Chain.getValue(1); |
| 1445 | |
Chris Lattner | e563bbc | 2008-10-11 22:08:30 +0000 | [diff] [blame] | 1446 | Chain = DAG.getCALLSEQ_END(Chain, DAG.getIntPtrConstant(NumStackBytes, true), |
| 1447 | DAG.getIntPtrConstant(0, true), InFlag); |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1448 | if (!Ins.empty()) |
Evan Cheng | ebaaa91 | 2008-02-05 22:44:06 +0000 | [diff] [blame] | 1449 | InFlag = Chain.getValue(1); |
| 1450 | |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1451 | // If the function returns void, just return the chain. |
| 1452 | if (Ins.empty()) |
| 1453 | return Chain; |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1454 | |
Kalle Raiskila | 55aebef | 2010-08-24 11:50:48 +0000 | [diff] [blame] | 1455 | // Now handle the return value(s) |
| 1456 | SmallVector<CCValAssign, 16> RVLocs; |
Eric Christopher | 471e422 | 2011-06-08 23:55:35 +0000 | [diff] [blame] | 1457 | CCState CCRetInfo(CallConv, isVarArg, DAG.getMachineFunction(), |
| 1458 | getTargetMachine(), RVLocs, *DAG.getContext()); |
Kalle Raiskila | 55aebef | 2010-08-24 11:50:48 +0000 | [diff] [blame] | 1459 | CCRetInfo.AnalyzeCallResult(Ins, CCC_SPU); |
| 1460 | |
| 1461 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1462 | // If the call has results, copy the values out of the ret val registers. |
Kalle Raiskila | 55aebef | 2010-08-24 11:50:48 +0000 | [diff] [blame] | 1463 | for (unsigned i = 0; i != RVLocs.size(); ++i) { |
| 1464 | CCValAssign VA = RVLocs[i]; |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1465 | |
Kalle Raiskila | 55aebef | 2010-08-24 11:50:48 +0000 | [diff] [blame] | 1466 | SDValue Val = DAG.getCopyFromReg(Chain, dl, VA.getLocReg(), VA.getLocVT(), |
| 1467 | InFlag); |
| 1468 | Chain = Val.getValue(1); |
| 1469 | InFlag = Val.getValue(2); |
| 1470 | InVals.push_back(Val); |
| 1471 | } |
Duncan Sands | 4bdcb61 | 2008-07-02 17:40:58 +0000 | [diff] [blame] | 1472 | |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1473 | return Chain; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1474 | } |
| 1475 | |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1476 | SDValue |
| 1477 | SPUTargetLowering::LowerReturn(SDValue Chain, |
Sandeep Patel | 65c3c8f | 2009-09-02 08:44:58 +0000 | [diff] [blame] | 1478 | CallingConv::ID CallConv, bool isVarArg, |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1479 | const SmallVectorImpl<ISD::OutputArg> &Outs, |
Dan Gohman | c940365 | 2010-07-07 15:54:55 +0000 | [diff] [blame] | 1480 | const SmallVectorImpl<SDValue> &OutVals, |
Dan Gohman | d858e90 | 2010-04-17 15:26:15 +0000 | [diff] [blame] | 1481 | DebugLoc dl, SelectionDAG &DAG) const { |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1482 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1483 | SmallVector<CCValAssign, 16> RVLocs; |
Eric Christopher | 471e422 | 2011-06-08 23:55:35 +0000 | [diff] [blame] | 1484 | CCState CCInfo(CallConv, isVarArg, DAG.getMachineFunction(), |
| 1485 | getTargetMachine(), RVLocs, *DAG.getContext()); |
Dan Gohman | 98ca4f2 | 2009-08-05 01:29:28 +0000 | [diff] [blame] | 1486 | CCInfo.AnalyzeReturn(Outs, RetCC_SPU); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1487 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1488 | // If this is the first return lowered for this function, add the regs to the |
| 1489 | // liveout set for the function. |
Chris Lattner | 84bc542 | 2007-12-31 04:13:23 +0000 | [diff] [blame] | 1490 | if (DAG.getMachineFunction().getRegInfo().liveout_empty()) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1491 | for (unsigned i = 0; i != RVLocs.size(); ++i) |
Chris Lattner | 84bc542 | 2007-12-31 04:13:23 +0000 | [diff] [blame] | 1492 | DAG.getMachineFunction().getRegInfo().addLiveOut(RVLocs[i].getLocReg()); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1493 | } |
| 1494 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1495 | SDValue Flag; |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1496 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1497 | // Copy the result values into the output registers. |
| 1498 | for (unsigned i = 0; i != RVLocs.size(); ++i) { |
| 1499 | CCValAssign &VA = RVLocs[i]; |
| 1500 | assert(VA.isRegLoc() && "Can only return in registers!"); |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 1501 | Chain = DAG.getCopyToReg(Chain, dl, VA.getLocReg(), |
Dan Gohman | c940365 | 2010-07-07 15:54:55 +0000 | [diff] [blame] | 1502 | OutVals[i], Flag); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1503 | Flag = Chain.getValue(1); |
| 1504 | } |
| 1505 | |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 1506 | if (Flag.getNode()) |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1507 | return DAG.getNode(SPUISD::RET_FLAG, dl, MVT::Other, Chain, Flag); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1508 | else |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1509 | return DAG.getNode(SPUISD::RET_FLAG, dl, MVT::Other, Chain); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1510 | } |
| 1511 | |
| 1512 | |
| 1513 | //===----------------------------------------------------------------------===// |
| 1514 | // Vector related lowering: |
| 1515 | //===----------------------------------------------------------------------===// |
| 1516 | |
| 1517 | static ConstantSDNode * |
| 1518 | getVecImm(SDNode *N) { |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1519 | SDValue OpVal(0, 0); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1520 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1521 | // Check to see if this buildvec has a single non-undef value in its elements. |
| 1522 | for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) { |
| 1523 | if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue; |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 1524 | if (OpVal.getNode() == 0) |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1525 | OpVal = N->getOperand(i); |
| 1526 | else if (OpVal != N->getOperand(i)) |
| 1527 | return 0; |
| 1528 | } |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1529 | |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 1530 | if (OpVal.getNode() != 0) { |
Scott Michel | 19fd42a | 2008-11-11 03:06:06 +0000 | [diff] [blame] | 1531 | if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1532 | return CN; |
| 1533 | } |
| 1534 | } |
| 1535 | |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 1536 | return 0; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1537 | } |
| 1538 | |
| 1539 | /// get_vec_i18imm - Test if this vector is a vector filled with the same value |
| 1540 | /// and the value fits into an unsigned 18-bit constant, and if so, return the |
| 1541 | /// constant |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1542 | SDValue SPU::get_vec_u18imm(SDNode *N, SelectionDAG &DAG, |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1543 | EVT ValueType) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1544 | if (ConstantSDNode *CN = getVecImm(N)) { |
Dan Gohman | f5aeb1a | 2008-09-12 16:56:44 +0000 | [diff] [blame] | 1545 | uint64_t Value = CN->getZExtValue(); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1546 | if (ValueType == MVT::i64) { |
Dan Gohman | f5aeb1a | 2008-09-12 16:56:44 +0000 | [diff] [blame] | 1547 | uint64_t UValue = CN->getZExtValue(); |
Scott Michel | 4cb8bd8 | 2008-03-06 04:02:54 +0000 | [diff] [blame] | 1548 | uint32_t upper = uint32_t(UValue >> 32); |
| 1549 | uint32_t lower = uint32_t(UValue); |
| 1550 | if (upper != lower) |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1551 | return SDValue(); |
Scott Michel | 4cb8bd8 | 2008-03-06 04:02:54 +0000 | [diff] [blame] | 1552 | Value = Value >> 32; |
| 1553 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1554 | if (Value <= 0x3ffff) |
Dan Gohman | fa210d8 | 2008-11-05 02:06:09 +0000 | [diff] [blame] | 1555 | return DAG.getTargetConstant(Value, ValueType); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1556 | } |
| 1557 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1558 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1559 | } |
| 1560 | |
| 1561 | /// get_vec_i16imm - Test if this vector is a vector filled with the same value |
| 1562 | /// and the value fits into a signed 16-bit constant, and if so, return the |
| 1563 | /// constant |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1564 | SDValue SPU::get_vec_i16imm(SDNode *N, SelectionDAG &DAG, |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1565 | EVT ValueType) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1566 | if (ConstantSDNode *CN = getVecImm(N)) { |
Dan Gohman | 7810bfe | 2008-09-26 21:54:37 +0000 | [diff] [blame] | 1567 | int64_t Value = CN->getSExtValue(); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1568 | if (ValueType == MVT::i64) { |
Dan Gohman | f5aeb1a | 2008-09-12 16:56:44 +0000 | [diff] [blame] | 1569 | uint64_t UValue = CN->getZExtValue(); |
Scott Michel | 4cb8bd8 | 2008-03-06 04:02:54 +0000 | [diff] [blame] | 1570 | uint32_t upper = uint32_t(UValue >> 32); |
| 1571 | uint32_t lower = uint32_t(UValue); |
| 1572 | if (upper != lower) |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1573 | return SDValue(); |
Scott Michel | 4cb8bd8 | 2008-03-06 04:02:54 +0000 | [diff] [blame] | 1574 | Value = Value >> 32; |
| 1575 | } |
Scott Michel | ad2715e | 2008-03-05 23:02:02 +0000 | [diff] [blame] | 1576 | if (Value >= -(1 << 15) && Value <= ((1 << 15) - 1)) { |
Dan Gohman | fa210d8 | 2008-11-05 02:06:09 +0000 | [diff] [blame] | 1577 | return DAG.getTargetConstant(Value, ValueType); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1578 | } |
| 1579 | } |
| 1580 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1581 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1582 | } |
| 1583 | |
| 1584 | /// get_vec_i10imm - Test if this vector is a vector filled with the same value |
| 1585 | /// and the value fits into a signed 10-bit constant, and if so, return the |
| 1586 | /// constant |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1587 | SDValue SPU::get_vec_i10imm(SDNode *N, SelectionDAG &DAG, |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1588 | EVT ValueType) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1589 | if (ConstantSDNode *CN = getVecImm(N)) { |
Dan Gohman | 7810bfe | 2008-09-26 21:54:37 +0000 | [diff] [blame] | 1590 | int64_t Value = CN->getSExtValue(); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1591 | if (ValueType == MVT::i64) { |
Dan Gohman | f5aeb1a | 2008-09-12 16:56:44 +0000 | [diff] [blame] | 1592 | uint64_t UValue = CN->getZExtValue(); |
Scott Michel | 4cb8bd8 | 2008-03-06 04:02:54 +0000 | [diff] [blame] | 1593 | uint32_t upper = uint32_t(UValue >> 32); |
| 1594 | uint32_t lower = uint32_t(UValue); |
| 1595 | if (upper != lower) |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1596 | return SDValue(); |
Scott Michel | 4cb8bd8 | 2008-03-06 04:02:54 +0000 | [diff] [blame] | 1597 | Value = Value >> 32; |
| 1598 | } |
Benjamin Kramer | 7e09deb | 2010-03-29 19:07:58 +0000 | [diff] [blame] | 1599 | if (isInt<10>(Value)) |
Dan Gohman | fa210d8 | 2008-11-05 02:06:09 +0000 | [diff] [blame] | 1600 | return DAG.getTargetConstant(Value, ValueType); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1601 | } |
| 1602 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1603 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1604 | } |
| 1605 | |
| 1606 | /// get_vec_i8imm - Test if this vector is a vector filled with the same value |
| 1607 | /// and the value fits into a signed 8-bit constant, and if so, return the |
| 1608 | /// constant. |
| 1609 | /// |
| 1610 | /// @note: The incoming vector is v16i8 because that's the only way we can load |
| 1611 | /// constant vectors. Thus, we test to see if the upper and lower bytes are the |
| 1612 | /// same value. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1613 | SDValue SPU::get_vec_i8imm(SDNode *N, SelectionDAG &DAG, |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1614 | EVT ValueType) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1615 | if (ConstantSDNode *CN = getVecImm(N)) { |
Dan Gohman | f5aeb1a | 2008-09-12 16:56:44 +0000 | [diff] [blame] | 1616 | int Value = (int) CN->getZExtValue(); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1617 | if (ValueType == MVT::i16 |
Scott Michel | 7f9ba9b | 2008-01-30 02:55:46 +0000 | [diff] [blame] | 1618 | && Value <= 0xffff /* truncated from uint64_t */ |
| 1619 | && ((short) Value >> 8) == ((short) Value & 0xff)) |
Dan Gohman | fa210d8 | 2008-11-05 02:06:09 +0000 | [diff] [blame] | 1620 | return DAG.getTargetConstant(Value & 0xff, ValueType); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1621 | else if (ValueType == MVT::i8 |
Scott Michel | 7f9ba9b | 2008-01-30 02:55:46 +0000 | [diff] [blame] | 1622 | && (Value & 0xff) == Value) |
Dan Gohman | fa210d8 | 2008-11-05 02:06:09 +0000 | [diff] [blame] | 1623 | return DAG.getTargetConstant(Value, ValueType); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1624 | } |
| 1625 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1626 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1627 | } |
| 1628 | |
| 1629 | /// get_ILHUvec_imm - Test if this vector is a vector filled with the same value |
| 1630 | /// and the value fits into a signed 16-bit constant, and if so, return the |
| 1631 | /// constant |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1632 | SDValue SPU::get_ILHUvec_imm(SDNode *N, SelectionDAG &DAG, |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1633 | EVT ValueType) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1634 | if (ConstantSDNode *CN = getVecImm(N)) { |
Dan Gohman | f5aeb1a | 2008-09-12 16:56:44 +0000 | [diff] [blame] | 1635 | uint64_t Value = CN->getZExtValue(); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1636 | if ((ValueType == MVT::i32 |
Scott Michel | 7f9ba9b | 2008-01-30 02:55:46 +0000 | [diff] [blame] | 1637 | && ((unsigned) Value & 0xffff0000) == (unsigned) Value) |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1638 | || (ValueType == MVT::i64 && (Value & 0xffff0000) == Value)) |
Dan Gohman | fa210d8 | 2008-11-05 02:06:09 +0000 | [diff] [blame] | 1639 | return DAG.getTargetConstant(Value >> 16, ValueType); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1640 | } |
| 1641 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1642 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1643 | } |
| 1644 | |
| 1645 | /// get_v4i32_imm - Catch-all for general 32-bit constant vectors |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1646 | SDValue SPU::get_v4i32_imm(SDNode *N, SelectionDAG &DAG) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1647 | if (ConstantSDNode *CN = getVecImm(N)) { |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1648 | return DAG.getTargetConstant((unsigned) CN->getZExtValue(), MVT::i32); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1649 | } |
| 1650 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1651 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1652 | } |
| 1653 | |
| 1654 | /// get_v4i32_imm - Catch-all for general 64-bit constant vectors |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1655 | SDValue SPU::get_v2i64_imm(SDNode *N, SelectionDAG &DAG) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1656 | if (ConstantSDNode *CN = getVecImm(N)) { |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1657 | return DAG.getTargetConstant((unsigned) CN->getZExtValue(), MVT::i64); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1658 | } |
| 1659 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1660 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1661 | } |
| 1662 | |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 1663 | //! Lower a BUILD_VECTOR instruction creatively: |
Dan Gohman | 7db949d | 2009-08-07 01:32:21 +0000 | [diff] [blame] | 1664 | static SDValue |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1665 | LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1666 | EVT VT = Op.getValueType(); |
| 1667 | EVT EltVT = VT.getVectorElementType(); |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 1668 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 1669 | BuildVectorSDNode *BCN = dyn_cast<BuildVectorSDNode>(Op.getNode()); |
| 1670 | assert(BCN != 0 && "Expected BuildVectorSDNode in SPU LowerBUILD_VECTOR"); |
| 1671 | unsigned minSplatBits = EltVT.getSizeInBits(); |
| 1672 | |
| 1673 | if (minSplatBits < 16) |
| 1674 | minSplatBits = 16; |
| 1675 | |
| 1676 | APInt APSplatBits, APSplatUndef; |
| 1677 | unsigned SplatBitSize; |
| 1678 | bool HasAnyUndefs; |
| 1679 | |
| 1680 | if (!BCN->isConstantSplat(APSplatBits, APSplatUndef, SplatBitSize, |
| 1681 | HasAnyUndefs, minSplatBits) |
| 1682 | || minSplatBits < SplatBitSize) |
| 1683 | return SDValue(); // Wasn't a constant vector or splat exceeded min |
| 1684 | |
| 1685 | uint64_t SplatBits = APSplatBits.getZExtValue(); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1686 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1687 | switch (VT.getSimpleVT().SimpleTy) { |
Benjamin Kramer | 1bd7335 | 2010-04-08 10:44:28 +0000 | [diff] [blame] | 1688 | default: |
| 1689 | report_fatal_error("CellSPU: Unhandled VT in LowerBUILD_VECTOR, VT = " + |
| 1690 | Twine(VT.getEVTString())); |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 1691 | /*NOTREACHED*/ |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1692 | case MVT::v4f32: { |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1693 | uint32_t Value32 = uint32_t(SplatBits); |
Chris Lattner | e7fa1f2 | 2009-03-26 05:29:34 +0000 | [diff] [blame] | 1694 | assert(SplatBitSize == 32 |
Scott Michel | 7f9ba9b | 2008-01-30 02:55:46 +0000 | [diff] [blame] | 1695 | && "LowerBUILD_VECTOR: Unexpected floating point vector element."); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1696 | // NOTE: pretend the constant is an integer. LLVM won't load FP constants |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1697 | SDValue T = DAG.getConstant(Value32, MVT::i32); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1698 | return DAG.getNode(ISD::BITCAST, dl, MVT::v4f32, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1699 | DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, T,T,T,T)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1700 | break; |
| 1701 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1702 | case MVT::v2f64: { |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1703 | uint64_t f64val = uint64_t(SplatBits); |
Chris Lattner | e7fa1f2 | 2009-03-26 05:29:34 +0000 | [diff] [blame] | 1704 | assert(SplatBitSize == 64 |
Scott Michel | 104de43 | 2008-11-24 17:11:17 +0000 | [diff] [blame] | 1705 | && "LowerBUILD_VECTOR: 64-bit float vector size > 8 bytes."); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1706 | // NOTE: pretend the constant is an integer. LLVM won't load FP constants |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1707 | SDValue T = DAG.getConstant(f64val, MVT::i64); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1708 | return DAG.getNode(ISD::BITCAST, dl, MVT::v2f64, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1709 | DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v2i64, T, T)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1710 | break; |
| 1711 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1712 | case MVT::v16i8: { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1713 | // 8-bit constants have to be expanded to 16-bits |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 1714 | unsigned short Value16 = SplatBits /* | (SplatBits << 8) */; |
| 1715 | SmallVector<SDValue, 8> Ops; |
| 1716 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1717 | Ops.assign(8, DAG.getConstant(Value16, MVT::i16)); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1718 | return DAG.getNode(ISD::BITCAST, dl, VT, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1719 | DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v8i16, &Ops[0], Ops.size())); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1720 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1721 | case MVT::v8i16: { |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 1722 | unsigned short Value16 = SplatBits; |
| 1723 | SDValue T = DAG.getConstant(Value16, EltVT); |
| 1724 | SmallVector<SDValue, 8> Ops; |
| 1725 | |
| 1726 | Ops.assign(8, T); |
| 1727 | return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, &Ops[0], Ops.size()); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1728 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1729 | case MVT::v4i32: { |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 1730 | SDValue T = DAG.getConstant(unsigned(SplatBits), VT.getVectorElementType()); |
Evan Cheng | a87008d | 2009-02-25 22:49:59 +0000 | [diff] [blame] | 1731 | return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, T, T, T, T); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1732 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1733 | case MVT::v2i64: { |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 1734 | return SPU::LowerV2I64Splat(VT, DAG, SplatBits, dl); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1735 | } |
| 1736 | } |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1737 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1738 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1739 | } |
| 1740 | |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 1741 | /*! |
| 1742 | */ |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1743 | SDValue |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1744 | SPU::LowerV2I64Splat(EVT OpVT, SelectionDAG& DAG, uint64_t SplatVal, |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 1745 | DebugLoc dl) { |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1746 | uint32_t upper = uint32_t(SplatVal >> 32); |
| 1747 | uint32_t lower = uint32_t(SplatVal); |
| 1748 | |
| 1749 | if (upper == lower) { |
| 1750 | // Magic constant that can be matched by IL, ILA, et. al. |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1751 | SDValue Val = DAG.getTargetConstant(upper, MVT::i32); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1752 | return DAG.getNode(ISD::BITCAST, dl, OpVT, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1753 | DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
Evan Cheng | a87008d | 2009-02-25 22:49:59 +0000 | [diff] [blame] | 1754 | Val, Val, Val, Val)); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1755 | } else { |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1756 | bool upper_special, lower_special; |
| 1757 | |
| 1758 | // NOTE: This code creates common-case shuffle masks that can be easily |
| 1759 | // detected as common expressions. It is not attempting to create highly |
| 1760 | // specialized masks to replace any and all 0's, 0xff's and 0x80's. |
| 1761 | |
| 1762 | // Detect if the upper or lower half is a special shuffle mask pattern: |
| 1763 | upper_special = (upper == 0 || upper == 0xffffffff || upper == 0x80000000); |
| 1764 | lower_special = (lower == 0 || lower == 0xffffffff || lower == 0x80000000); |
| 1765 | |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 1766 | // Both upper and lower are special, lower to a constant pool load: |
| 1767 | if (lower_special && upper_special) { |
Nadav Rotem | c32a8c9 | 2011-10-16 10:02:06 +0000 | [diff] [blame] | 1768 | SDValue UpperVal = DAG.getConstant(upper, MVT::i32); |
| 1769 | SDValue LowerVal = DAG.getConstant(lower, MVT::i32); |
| 1770 | SDValue BV = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
| 1771 | UpperVal, LowerVal, UpperVal, LowerVal); |
| 1772 | return DAG.getNode(ISD::BITCAST, dl, OpVT, BV); |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 1773 | } |
| 1774 | |
| 1775 | SDValue LO32; |
| 1776 | SDValue HI32; |
| 1777 | SmallVector<SDValue, 16> ShufBytes; |
| 1778 | SDValue Result; |
| 1779 | |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1780 | // Create lower vector if not a special pattern |
| 1781 | if (!lower_special) { |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1782 | SDValue LO32C = DAG.getConstant(lower, MVT::i32); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1783 | LO32 = DAG.getNode(ISD::BITCAST, dl, OpVT, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1784 | DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
Evan Cheng | a87008d | 2009-02-25 22:49:59 +0000 | [diff] [blame] | 1785 | LO32C, LO32C, LO32C, LO32C)); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1786 | } |
| 1787 | |
| 1788 | // Create upper vector if not a special pattern |
| 1789 | if (!upper_special) { |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1790 | SDValue HI32C = DAG.getConstant(upper, MVT::i32); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1791 | HI32 = DAG.getNode(ISD::BITCAST, dl, OpVT, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1792 | DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
Evan Cheng | a87008d | 2009-02-25 22:49:59 +0000 | [diff] [blame] | 1793 | HI32C, HI32C, HI32C, HI32C)); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1794 | } |
| 1795 | |
| 1796 | // If either upper or lower are special, then the two input operands are |
| 1797 | // the same (basically, one of them is a "don't care") |
| 1798 | if (lower_special) |
| 1799 | LO32 = HI32; |
| 1800 | if (upper_special) |
| 1801 | HI32 = LO32; |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1802 | |
| 1803 | for (int i = 0; i < 4; ++i) { |
| 1804 | uint64_t val = 0; |
| 1805 | for (int j = 0; j < 4; ++j) { |
| 1806 | SDValue V; |
| 1807 | bool process_upper, process_lower; |
| 1808 | val <<= 8; |
| 1809 | process_upper = (upper_special && (i & 1) == 0); |
| 1810 | process_lower = (lower_special && (i & 1) == 1); |
| 1811 | |
| 1812 | if (process_upper || process_lower) { |
| 1813 | if ((process_upper && upper == 0) |
| 1814 | || (process_lower && lower == 0)) |
| 1815 | val |= 0x80; |
| 1816 | else if ((process_upper && upper == 0xffffffff) |
| 1817 | || (process_lower && lower == 0xffffffff)) |
| 1818 | val |= 0xc0; |
| 1819 | else if ((process_upper && upper == 0x80000000) |
| 1820 | || (process_lower && lower == 0x80000000)) |
| 1821 | val |= (j == 0 ? 0xe0 : 0x80); |
| 1822 | } else |
| 1823 | val |= i * 4 + j + ((i & 1) * 16); |
| 1824 | } |
| 1825 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1826 | ShufBytes.push_back(DAG.getConstant(val, MVT::i32)); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1827 | } |
| 1828 | |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 1829 | return DAG.getNode(SPUISD::SHUFB, dl, OpVT, HI32, LO32, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1830 | DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
Evan Cheng | a87008d | 2009-02-25 22:49:59 +0000 | [diff] [blame] | 1831 | &ShufBytes[0], ShufBytes.size())); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 1832 | } |
| 1833 | } |
| 1834 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1835 | /// LowerVECTOR_SHUFFLE - Lower a vector shuffle (V1, V2, V3) to something on |
| 1836 | /// which the Cell can operate. The code inspects V3 to ascertain whether the |
| 1837 | /// permutation vector, V3, is monotonically increasing with one "exception" |
| 1838 | /// element, e.g., (0, 1, _, 3). If this is the case, then generate a |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 1839 | /// SHUFFLE_MASK synthetic instruction. Otherwise, spill V3 to the constant pool. |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1840 | /// In either case, the net result is going to eventually invoke SHUFB to |
| 1841 | /// permute/shuffle the bytes from V1 and V2. |
| 1842 | /// \note |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 1843 | /// SHUFFLE_MASK is eventually selected as one of the C*D instructions, generate |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1844 | /// control word for byte/halfword/word insertion. This takes care of a single |
| 1845 | /// element move from V2 into V1. |
| 1846 | /// \note |
| 1847 | /// SPUISD::SHUFB is eventually selected as Cell's <i>shufb</i> instructions. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1848 | static SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) { |
Nate Begeman | 9008ca6 | 2009-04-27 18:41:29 +0000 | [diff] [blame] | 1849 | const ShuffleVectorSDNode *SVN = cast<ShuffleVectorSDNode>(Op); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1850 | SDValue V1 = Op.getOperand(0); |
| 1851 | SDValue V2 = Op.getOperand(1); |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 1852 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1853 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1854 | if (V2.getOpcode() == ISD::UNDEF) V2 = V1; |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1855 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1856 | // If we have a single element being moved from V1 to V2, this can be handled |
| 1857 | // using the C*[DX] compute mask instructions, but the vector elements have |
Kalle Raiskila | ca9460f | 2010-08-18 10:20:29 +0000 | [diff] [blame] | 1858 | // to be monotonically increasing with one exception element, and the source |
| 1859 | // slot of the element to move must be the same as the destination. |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1860 | EVT VecVT = V1.getValueType(); |
| 1861 | EVT EltVT = VecVT.getVectorElementType(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1862 | unsigned EltsFromV2 = 0; |
Kalle Raiskila | ca9460f | 2010-08-18 10:20:29 +0000 | [diff] [blame] | 1863 | unsigned V2EltOffset = 0; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1864 | unsigned V2EltIdx0 = 0; |
| 1865 | unsigned CurrElt = 0; |
Scott Michel | cc18827 | 2008-12-04 21:01:44 +0000 | [diff] [blame] | 1866 | unsigned MaxElts = VecVT.getVectorNumElements(); |
| 1867 | unsigned PrevElt = 0; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1868 | bool monotonic = true; |
Scott Michel | cc18827 | 2008-12-04 21:01:44 +0000 | [diff] [blame] | 1869 | bool rotate = true; |
Kalle Raiskila | bb7d33a | 2010-09-09 07:30:15 +0000 | [diff] [blame] | 1870 | int rotamt=0; |
Kalle Raiskila | 4794807 | 2010-06-21 10:17:36 +0000 | [diff] [blame] | 1871 | EVT maskVT; // which of the c?d instructions to use |
Scott Michel | cc18827 | 2008-12-04 21:01:44 +0000 | [diff] [blame] | 1872 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1873 | if (EltVT == MVT::i8) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1874 | V2EltIdx0 = 16; |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1875 | maskVT = MVT::v16i8; |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1876 | } else if (EltVT == MVT::i16) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1877 | V2EltIdx0 = 8; |
Kalle Raiskila | 4794807 | 2010-06-21 10:17:36 +0000 | [diff] [blame] | 1878 | maskVT = MVT::v8i16; |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1879 | } else if (EltVT == MVT::i32 || EltVT == MVT::f32) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1880 | V2EltIdx0 = 4; |
Kalle Raiskila | 4794807 | 2010-06-21 10:17:36 +0000 | [diff] [blame] | 1881 | maskVT = MVT::v4i32; |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1882 | } else if (EltVT == MVT::i64 || EltVT == MVT::f64) { |
Scott Michel | cc18827 | 2008-12-04 21:01:44 +0000 | [diff] [blame] | 1883 | V2EltIdx0 = 2; |
Kalle Raiskila | 4794807 | 2010-06-21 10:17:36 +0000 | [diff] [blame] | 1884 | maskVT = MVT::v2i64; |
Scott Michel | cc18827 | 2008-12-04 21:01:44 +0000 | [diff] [blame] | 1885 | } else |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 1886 | llvm_unreachable("Unhandled vector type in LowerVECTOR_SHUFFLE"); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1887 | |
Nate Begeman | 9008ca6 | 2009-04-27 18:41:29 +0000 | [diff] [blame] | 1888 | for (unsigned i = 0; i != MaxElts; ++i) { |
| 1889 | if (SVN->getMaskElt(i) < 0) |
| 1890 | continue; |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1891 | |
Nate Begeman | 9008ca6 | 2009-04-27 18:41:29 +0000 | [diff] [blame] | 1892 | unsigned SrcElt = SVN->getMaskElt(i); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1893 | |
Nate Begeman | 9008ca6 | 2009-04-27 18:41:29 +0000 | [diff] [blame] | 1894 | if (monotonic) { |
| 1895 | if (SrcElt >= V2EltIdx0) { |
Kalle Raiskila | ca9460f | 2010-08-18 10:20:29 +0000 | [diff] [blame] | 1896 | // TODO: optimize for the monotonic case when several consecutive |
| 1897 | // elements are taken form V2. Do we ever get such a case? |
| 1898 | if (EltsFromV2 == 0 && CurrElt == (SrcElt - V2EltIdx0)) |
| 1899 | V2EltOffset = (SrcElt - V2EltIdx0) * (EltVT.getSizeInBits()/8); |
| 1900 | else |
| 1901 | monotonic = false; |
| 1902 | ++EltsFromV2; |
Nate Begeman | 9008ca6 | 2009-04-27 18:41:29 +0000 | [diff] [blame] | 1903 | } else if (CurrElt != SrcElt) { |
| 1904 | monotonic = false; |
Scott Michel | cc18827 | 2008-12-04 21:01:44 +0000 | [diff] [blame] | 1905 | } |
| 1906 | |
Nate Begeman | 9008ca6 | 2009-04-27 18:41:29 +0000 | [diff] [blame] | 1907 | ++CurrElt; |
| 1908 | } |
| 1909 | |
| 1910 | if (rotate) { |
| 1911 | if (PrevElt > 0 && SrcElt < MaxElts) { |
| 1912 | if ((PrevElt == SrcElt - 1) |
| 1913 | || (PrevElt == MaxElts - 1 && SrcElt == 0)) { |
Scott Michel | cc18827 | 2008-12-04 21:01:44 +0000 | [diff] [blame] | 1914 | PrevElt = SrcElt; |
| 1915 | } else { |
Scott Michel | cc18827 | 2008-12-04 21:01:44 +0000 | [diff] [blame] | 1916 | rotate = false; |
| 1917 | } |
Kalle Raiskila | 0b4ab0c | 2010-09-08 11:53:38 +0000 | [diff] [blame] | 1918 | } else if (i == 0 || (PrevElt==0 && SrcElt==1)) { |
| 1919 | // First time or after a "wrap around" |
Kalle Raiskila | d87e571 | 2010-11-22 16:28:26 +0000 | [diff] [blame] | 1920 | rotamt = SrcElt-i; |
Nate Begeman | 9008ca6 | 2009-04-27 18:41:29 +0000 | [diff] [blame] | 1921 | PrevElt = SrcElt; |
| 1922 | } else { |
| 1923 | // This isn't a rotation, takes elements from vector 2 |
| 1924 | rotate = false; |
Scott Michel | cc18827 | 2008-12-04 21:01:44 +0000 | [diff] [blame] | 1925 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1926 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1927 | } |
| 1928 | |
| 1929 | if (EltsFromV2 == 1 && monotonic) { |
| 1930 | // Compute mask and shuffle |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1931 | EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(); |
Kalle Raiskila | 4794807 | 2010-06-21 10:17:36 +0000 | [diff] [blame] | 1932 | |
| 1933 | // As SHUFFLE_MASK becomes a c?d instruction, feed it an address |
| 1934 | // R1 ($sp) is used here only as it is guaranteed to have last bits zero |
| 1935 | SDValue Pointer = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, |
| 1936 | DAG.getRegister(SPU::R1, PtrVT), |
Kalle Raiskila | ca9460f | 2010-08-18 10:20:29 +0000 | [diff] [blame] | 1937 | DAG.getConstant(V2EltOffset, MVT::i32)); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 1938 | SDValue ShufMaskOp = DAG.getNode(SPUISD::SHUFFLE_MASK, dl, |
Kalle Raiskila | 4794807 | 2010-06-21 10:17:36 +0000 | [diff] [blame] | 1939 | maskVT, Pointer); |
| 1940 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1941 | // Use shuffle mask in SHUFB synthetic instruction: |
Scott Michel | 6e1d147 | 2009-03-16 18:47:25 +0000 | [diff] [blame] | 1942 | return DAG.getNode(SPUISD::SHUFB, dl, V1.getValueType(), V2, V1, |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 1943 | ShufMaskOp); |
Scott Michel | cc18827 | 2008-12-04 21:01:44 +0000 | [diff] [blame] | 1944 | } else if (rotate) { |
Kalle Raiskila | 0b4ab0c | 2010-09-08 11:53:38 +0000 | [diff] [blame] | 1945 | if (rotamt < 0) |
| 1946 | rotamt +=MaxElts; |
| 1947 | rotamt *= EltVT.getSizeInBits()/8; |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 1948 | return DAG.getNode(SPUISD::ROTBYTES_LEFT, dl, V1.getValueType(), |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1949 | V1, DAG.getConstant(rotamt, MVT::i16)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1950 | } else { |
Gabor Greif | 93c53e5 | 2008-08-31 15:37:04 +0000 | [diff] [blame] | 1951 | // Convert the SHUFFLE_VECTOR mask's input element units to the |
| 1952 | // actual bytes. |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 1953 | unsigned BytesPerElement = EltVT.getSizeInBits()/8; |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1954 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1955 | SmallVector<SDValue, 16> ResultMask; |
Nate Begeman | 9008ca6 | 2009-04-27 18:41:29 +0000 | [diff] [blame] | 1956 | for (unsigned i = 0, e = MaxElts; i != e; ++i) { |
| 1957 | unsigned SrcElt = SVN->getMaskElt(i) < 0 ? 0 : SVN->getMaskElt(i); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 1958 | |
Nate Begeman | 9008ca6 | 2009-04-27 18:41:29 +0000 | [diff] [blame] | 1959 | for (unsigned j = 0; j < BytesPerElement; ++j) |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1960 | ResultMask.push_back(DAG.getConstant(SrcElt*BytesPerElement+j,MVT::i8)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1961 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1962 | SDValue VPermMask = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v16i8, |
Evan Cheng | a87008d | 2009-02-25 22:49:59 +0000 | [diff] [blame] | 1963 | &ResultMask[0], ResultMask.size()); |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 1964 | return DAG.getNode(SPUISD::SHUFB, dl, V1.getValueType(), V1, V2, VPermMask); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1965 | } |
| 1966 | } |
| 1967 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1968 | static SDValue LowerSCALAR_TO_VECTOR(SDValue Op, SelectionDAG &DAG) { |
| 1969 | SDValue Op0 = Op.getOperand(0); // Op0 = the scalar |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 1970 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1971 | |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 1972 | if (Op0.getNode()->getOpcode() == ISD::Constant) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1973 | // For a constant, build the appropriate constant vector, which will |
| 1974 | // eventually simplify to a vector register load. |
| 1975 | |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 1976 | ConstantSDNode *CN = cast<ConstantSDNode>(Op0.getNode()); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 1977 | SmallVector<SDValue, 16> ConstVecValues; |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 1978 | EVT VT; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1979 | size_t n_copies; |
| 1980 | |
| 1981 | // Create a constant vector: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1982 | switch (Op.getValueType().getSimpleVT().SimpleTy) { |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 1983 | default: llvm_unreachable("Unexpected constant value type in " |
Torok Edwin | 481d15a | 2009-07-14 12:22:58 +0000 | [diff] [blame] | 1984 | "LowerSCALAR_TO_VECTOR"); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 1985 | case MVT::v16i8: n_copies = 16; VT = MVT::i8; break; |
| 1986 | case MVT::v8i16: n_copies = 8; VT = MVT::i16; break; |
| 1987 | case MVT::v4i32: n_copies = 4; VT = MVT::i32; break; |
| 1988 | case MVT::v4f32: n_copies = 4; VT = MVT::f32; break; |
| 1989 | case MVT::v2i64: n_copies = 2; VT = MVT::i64; break; |
| 1990 | case MVT::v2f64: n_copies = 2; VT = MVT::f64; break; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1991 | } |
| 1992 | |
Dan Gohman | f5aeb1a | 2008-09-12 16:56:44 +0000 | [diff] [blame] | 1993 | SDValue CValue = DAG.getConstant(CN->getZExtValue(), VT); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1994 | for (size_t j = 0; j < n_copies; ++j) |
| 1995 | ConstVecValues.push_back(CValue); |
| 1996 | |
Evan Cheng | a87008d | 2009-02-25 22:49:59 +0000 | [diff] [blame] | 1997 | return DAG.getNode(ISD::BUILD_VECTOR, dl, Op.getValueType(), |
| 1998 | &ConstVecValues[0], ConstVecValues.size()); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 1999 | } else { |
| 2000 | // Otherwise, copy the value from one register to another: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2001 | switch (Op0.getValueType().getSimpleVT().SimpleTy) { |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 2002 | default: llvm_unreachable("Unexpected value type in LowerSCALAR_TO_VECTOR"); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2003 | case MVT::i8: |
| 2004 | case MVT::i16: |
| 2005 | case MVT::i32: |
| 2006 | case MVT::i64: |
| 2007 | case MVT::f32: |
| 2008 | case MVT::f64: |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 2009 | return DAG.getNode(SPUISD::PREFSLOT2VEC, dl, Op.getValueType(), Op0, Op0); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2010 | } |
| 2011 | } |
| 2012 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2013 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2014 | } |
| 2015 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2016 | static SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2017 | EVT VT = Op.getValueType(); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2018 | SDValue N = Op.getOperand(0); |
| 2019 | SDValue Elt = Op.getOperand(1); |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 2020 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2021 | SDValue retval; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2022 | |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2023 | if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Elt)) { |
| 2024 | // Constant argument: |
| 2025 | int EltNo = (int) C->getZExtValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2026 | |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2027 | // sanity checks: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2028 | if (VT == MVT::i8 && EltNo >= 16) |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 2029 | llvm_unreachable("SPU LowerEXTRACT_VECTOR_ELT: i8 extraction slot > 15"); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2030 | else if (VT == MVT::i16 && EltNo >= 8) |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 2031 | llvm_unreachable("SPU LowerEXTRACT_VECTOR_ELT: i16 extraction slot > 7"); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2032 | else if (VT == MVT::i32 && EltNo >= 4) |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 2033 | llvm_unreachable("SPU LowerEXTRACT_VECTOR_ELT: i32 extraction slot > 4"); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2034 | else if (VT == MVT::i64 && EltNo >= 2) |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 2035 | llvm_unreachable("SPU LowerEXTRACT_VECTOR_ELT: i64 extraction slot > 2"); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2036 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2037 | if (EltNo == 0 && (VT == MVT::i32 || VT == MVT::i64)) { |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2038 | // i32 and i64: Element 0 is the preferred slot |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 2039 | return DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT, N); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2040 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2041 | |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2042 | // Need to generate shuffle mask and extract: |
| 2043 | int prefslot_begin = -1, prefslot_end = -1; |
| 2044 | int elt_byte = EltNo * VT.getSizeInBits() / 8; |
| 2045 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2046 | switch (VT.getSimpleVT().SimpleTy) { |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2047 | default: |
| 2048 | assert(false && "Invalid value type!"); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2049 | case MVT::i8: { |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2050 | prefslot_begin = prefslot_end = 3; |
| 2051 | break; |
| 2052 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2053 | case MVT::i16: { |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2054 | prefslot_begin = 2; prefslot_end = 3; |
| 2055 | break; |
| 2056 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2057 | case MVT::i32: |
| 2058 | case MVT::f32: { |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2059 | prefslot_begin = 0; prefslot_end = 3; |
| 2060 | break; |
| 2061 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2062 | case MVT::i64: |
| 2063 | case MVT::f64: { |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2064 | prefslot_begin = 0; prefslot_end = 7; |
| 2065 | break; |
| 2066 | } |
| 2067 | } |
| 2068 | |
| 2069 | assert(prefslot_begin != -1 && prefslot_end != -1 && |
| 2070 | "LowerEXTRACT_VECTOR_ELT: preferred slots uninitialized"); |
| 2071 | |
Scott Michel | 9b2420d | 2009-08-24 21:53:27 +0000 | [diff] [blame] | 2072 | unsigned int ShufBytes[16] = { |
| 2073 | 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 |
| 2074 | }; |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2075 | for (int i = 0; i < 16; ++i) { |
| 2076 | // zero fill uppper part of preferred slot, don't care about the |
| 2077 | // other slots: |
| 2078 | unsigned int mask_val; |
| 2079 | if (i <= prefslot_end) { |
| 2080 | mask_val = |
| 2081 | ((i < prefslot_begin) |
| 2082 | ? 0x80 |
| 2083 | : elt_byte + (i - prefslot_begin)); |
| 2084 | |
| 2085 | ShufBytes[i] = mask_val; |
| 2086 | } else |
| 2087 | ShufBytes[i] = ShufBytes[i % (prefslot_end + 1)]; |
| 2088 | } |
| 2089 | |
| 2090 | SDValue ShufMask[4]; |
| 2091 | for (unsigned i = 0; i < sizeof(ShufMask)/sizeof(ShufMask[0]); ++i) { |
Scott Michel | cc18827 | 2008-12-04 21:01:44 +0000 | [diff] [blame] | 2092 | unsigned bidx = i * 4; |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2093 | unsigned int bits = ((ShufBytes[bidx] << 24) | |
| 2094 | (ShufBytes[bidx+1] << 16) | |
| 2095 | (ShufBytes[bidx+2] << 8) | |
| 2096 | ShufBytes[bidx+3]); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2097 | ShufMask[i] = DAG.getConstant(bits, MVT::i32); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2098 | } |
| 2099 | |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2100 | SDValue ShufMaskVec = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2101 | DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2102 | &ShufMask[0], sizeof(ShufMask)/sizeof(ShufMask[0])); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2103 | |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 2104 | retval = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT, |
| 2105 | DAG.getNode(SPUISD::SHUFB, dl, N.getValueType(), |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2106 | N, N, ShufMaskVec)); |
| 2107 | } else { |
| 2108 | // Variable index: Rotate the requested element into slot 0, then replicate |
| 2109 | // slot 0 across the vector |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2110 | EVT VecVT = N.getValueType(); |
Kalle Raiskila | 82fe467 | 2010-08-02 08:54:39 +0000 | [diff] [blame] | 2111 | if (!VecVT.isSimple() || !VecVT.isVector()) { |
Chris Lattner | 75361b6 | 2010-04-07 22:58:41 +0000 | [diff] [blame] | 2112 | report_fatal_error("LowerEXTRACT_VECTOR_ELT: Must have a simple, 128-bit" |
Torok Edwin | dac237e | 2009-07-08 20:53:28 +0000 | [diff] [blame] | 2113 | "vector type!"); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2114 | } |
| 2115 | |
| 2116 | // Make life easier by making sure the index is zero-extended to i32 |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2117 | if (Elt.getValueType() != MVT::i32) |
| 2118 | Elt = DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i32, Elt); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2119 | |
| 2120 | // Scale the index to a bit/byte shift quantity |
| 2121 | APInt scaleFactor = |
Scott Michel | 104de43 | 2008-11-24 17:11:17 +0000 | [diff] [blame] | 2122 | APInt(32, uint64_t(16 / N.getValueType().getVectorNumElements()), false); |
| 2123 | unsigned scaleShift = scaleFactor.logBase2(); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2124 | SDValue vecShift; |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2125 | |
Scott Michel | 104de43 | 2008-11-24 17:11:17 +0000 | [diff] [blame] | 2126 | if (scaleShift > 0) { |
| 2127 | // Scale the shift factor: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2128 | Elt = DAG.getNode(ISD::SHL, dl, MVT::i32, Elt, |
| 2129 | DAG.getConstant(scaleShift, MVT::i32)); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2130 | } |
| 2131 | |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 2132 | vecShift = DAG.getNode(SPUISD::SHL_BYTES, dl, VecVT, N, Elt); |
Scott Michel | 104de43 | 2008-11-24 17:11:17 +0000 | [diff] [blame] | 2133 | |
| 2134 | // Replicate the bytes starting at byte 0 across the entire vector (for |
| 2135 | // consistency with the notion of a unified register set) |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2136 | SDValue replicate; |
| 2137 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2138 | switch (VT.getSimpleVT().SimpleTy) { |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2139 | default: |
Chris Lattner | 75361b6 | 2010-04-07 22:58:41 +0000 | [diff] [blame] | 2140 | report_fatal_error("LowerEXTRACT_VECTOR_ELT(varable): Unhandled vector" |
Torok Edwin | dac237e | 2009-07-08 20:53:28 +0000 | [diff] [blame] | 2141 | "type"); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2142 | /*NOTREACHED*/ |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2143 | case MVT::i8: { |
| 2144 | SDValue factor = DAG.getConstant(0x00000000, MVT::i32); |
| 2145 | replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2146 | factor, factor, factor, factor); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2147 | break; |
| 2148 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2149 | case MVT::i16: { |
| 2150 | SDValue factor = DAG.getConstant(0x00010001, MVT::i32); |
| 2151 | replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2152 | factor, factor, factor, factor); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2153 | break; |
| 2154 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2155 | case MVT::i32: |
| 2156 | case MVT::f32: { |
| 2157 | SDValue factor = DAG.getConstant(0x00010203, MVT::i32); |
| 2158 | replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2159 | factor, factor, factor, factor); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2160 | break; |
| 2161 | } |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2162 | case MVT::i64: |
| 2163 | case MVT::f64: { |
| 2164 | SDValue loFactor = DAG.getConstant(0x00010203, MVT::i32); |
| 2165 | SDValue hiFactor = DAG.getConstant(0x04050607, MVT::i32); |
| 2166 | replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
Evan Cheng | a87008d | 2009-02-25 22:49:59 +0000 | [diff] [blame] | 2167 | loFactor, hiFactor, loFactor, hiFactor); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2168 | break; |
| 2169 | } |
| 2170 | } |
| 2171 | |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 2172 | retval = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT, |
| 2173 | DAG.getNode(SPUISD::SHUFB, dl, VecVT, |
Scott Michel | 1a6cdb6 | 2008-12-01 17:56:02 +0000 | [diff] [blame] | 2174 | vecShift, vecShift, replicate)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2175 | } |
| 2176 | |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2177 | return retval; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2178 | } |
| 2179 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2180 | static SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) { |
| 2181 | SDValue VecOp = Op.getOperand(0); |
| 2182 | SDValue ValOp = Op.getOperand(1); |
| 2183 | SDValue IdxOp = Op.getOperand(2); |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 2184 | DebugLoc dl = Op.getDebugLoc(); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2185 | EVT VT = Op.getValueType(); |
Kalle Raiskila | bd887df | 2010-08-29 12:41:50 +0000 | [diff] [blame] | 2186 | EVT eltVT = ValOp.getValueType(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2187 | |
Kalle Raiskila | 43d225d | 2010-06-09 09:58:17 +0000 | [diff] [blame] | 2188 | // use 0 when the lane to insert to is 'undef' |
Kalle Raiskila | bd887df | 2010-08-29 12:41:50 +0000 | [diff] [blame] | 2189 | int64_t Offset=0; |
Kalle Raiskila | 43d225d | 2010-06-09 09:58:17 +0000 | [diff] [blame] | 2190 | if (IdxOp.getOpcode() != ISD::UNDEF) { |
| 2191 | ConstantSDNode *CN = cast<ConstantSDNode>(IdxOp); |
| 2192 | assert(CN != 0 && "LowerINSERT_VECTOR_ELT: Index is not constant!"); |
Kalle Raiskila | bd887df | 2010-08-29 12:41:50 +0000 | [diff] [blame] | 2193 | Offset = (CN->getSExtValue()) * eltVT.getSizeInBits()/8; |
Kalle Raiskila | 43d225d | 2010-06-09 09:58:17 +0000 | [diff] [blame] | 2194 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2195 | |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2196 | EVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy(); |
Scott Michel | 1a6cdb6 | 2008-12-01 17:56:02 +0000 | [diff] [blame] | 2197 | // Use $sp ($1) because it's always 16-byte aligned and it's available: |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 2198 | SDValue Pointer = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, |
Scott Michel | 1a6cdb6 | 2008-12-01 17:56:02 +0000 | [diff] [blame] | 2199 | DAG.getRegister(SPU::R1, PtrVT), |
Kalle Raiskila | bd887df | 2010-08-29 12:41:50 +0000 | [diff] [blame] | 2200 | DAG.getConstant(Offset, PtrVT)); |
Kalle Raiskila | bc2697c | 2010-08-04 13:59:48 +0000 | [diff] [blame] | 2201 | // widen the mask when dealing with half vectors |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 2202 | EVT maskVT = EVT::getVectorVT(*(DAG.getContext()), VT.getVectorElementType(), |
Kalle Raiskila | bc2697c | 2010-08-04 13:59:48 +0000 | [diff] [blame] | 2203 | 128/ VT.getVectorElementType().getSizeInBits()); |
| 2204 | SDValue ShufMask = DAG.getNode(SPUISD::SHUFFLE_MASK, dl, maskVT, Pointer); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2205 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2206 | SDValue result = |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 2207 | DAG.getNode(SPUISD::SHUFB, dl, VT, |
| 2208 | DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, VT, ValOp), |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 2209 | VecOp, |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 2210 | DAG.getNode(ISD::BITCAST, dl, MVT::v4i32, ShufMask)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2211 | |
| 2212 | return result; |
| 2213 | } |
| 2214 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2215 | static SDValue LowerI8Math(SDValue Op, SelectionDAG &DAG, unsigned Opc, |
| 2216 | const TargetLowering &TLI) |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 2217 | { |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2218 | SDValue N0 = Op.getOperand(0); // Everything has at least one operand |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 2219 | DebugLoc dl = Op.getDebugLoc(); |
Owen Anderson | 95771af | 2011-02-25 21:41:48 +0000 | [diff] [blame] | 2220 | EVT ShiftVT = TLI.getShiftAmountTy(N0.getValueType()); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2221 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2222 | assert(Op.getValueType() == MVT::i8); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2223 | switch (Opc) { |
| 2224 | default: |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 2225 | llvm_unreachable("Unhandled i8 math operator"); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2226 | /*NOTREACHED*/ |
| 2227 | break; |
Scott Michel | 02d711b | 2008-12-30 23:28:25 +0000 | [diff] [blame] | 2228 | case ISD::ADD: { |
| 2229 | // 8-bit addition: Promote the arguments up to 16-bits and truncate |
| 2230 | // the result: |
| 2231 | SDValue N1 = Op.getOperand(1); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2232 | N0 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0); |
| 2233 | N1 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N1); |
| 2234 | return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8, |
| 2235 | DAG.getNode(Opc, dl, MVT::i16, N0, N1)); |
Scott Michel | 02d711b | 2008-12-30 23:28:25 +0000 | [diff] [blame] | 2236 | |
| 2237 | } |
| 2238 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2239 | case ISD::SUB: { |
| 2240 | // 8-bit subtraction: Promote the arguments up to 16-bits and truncate |
| 2241 | // the result: |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2242 | SDValue N1 = Op.getOperand(1); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2243 | N0 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0); |
| 2244 | N1 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N1); |
| 2245 | return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8, |
| 2246 | DAG.getNode(Opc, dl, MVT::i16, N0, N1)); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 2247 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2248 | case ISD::ROTR: |
| 2249 | case ISD::ROTL: { |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2250 | SDValue N1 = Op.getOperand(1); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2251 | EVT N1VT = N1.getValueType(); |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2252 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2253 | N0 = DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i16, N0); |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2254 | if (!N1VT.bitsEq(ShiftVT)) { |
| 2255 | unsigned N1Opc = N1.getValueType().bitsLT(ShiftVT) |
| 2256 | ? ISD::ZERO_EXTEND |
| 2257 | : ISD::TRUNCATE; |
| 2258 | N1 = DAG.getNode(N1Opc, dl, ShiftVT, N1); |
| 2259 | } |
| 2260 | |
| 2261 | // Replicate lower 8-bits into upper 8: |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2262 | SDValue ExpandArg = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2263 | DAG.getNode(ISD::OR, dl, MVT::i16, N0, |
| 2264 | DAG.getNode(ISD::SHL, dl, MVT::i16, |
| 2265 | N0, DAG.getConstant(8, MVT::i32))); |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2266 | |
| 2267 | // Truncate back down to i8 |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2268 | return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8, |
| 2269 | DAG.getNode(Opc, dl, MVT::i16, ExpandArg, N1)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2270 | } |
| 2271 | case ISD::SRL: |
| 2272 | case ISD::SHL: { |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2273 | SDValue N1 = Op.getOperand(1); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2274 | EVT N1VT = N1.getValueType(); |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2275 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2276 | N0 = DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i16, N0); |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2277 | if (!N1VT.bitsEq(ShiftVT)) { |
| 2278 | unsigned N1Opc = ISD::ZERO_EXTEND; |
| 2279 | |
| 2280 | if (N1.getValueType().bitsGT(ShiftVT)) |
| 2281 | N1Opc = ISD::TRUNCATE; |
| 2282 | |
| 2283 | N1 = DAG.getNode(N1Opc, dl, ShiftVT, N1); |
| 2284 | } |
| 2285 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2286 | return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8, |
| 2287 | DAG.getNode(Opc, dl, MVT::i16, N0, N1)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2288 | } |
| 2289 | case ISD::SRA: { |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2290 | SDValue N1 = Op.getOperand(1); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2291 | EVT N1VT = N1.getValueType(); |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2292 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2293 | N0 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0); |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2294 | if (!N1VT.bitsEq(ShiftVT)) { |
| 2295 | unsigned N1Opc = ISD::SIGN_EXTEND; |
| 2296 | |
| 2297 | if (N1VT.bitsGT(ShiftVT)) |
| 2298 | N1Opc = ISD::TRUNCATE; |
| 2299 | N1 = DAG.getNode(N1Opc, dl, ShiftVT, N1); |
| 2300 | } |
| 2301 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2302 | return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8, |
| 2303 | DAG.getNode(Opc, dl, MVT::i16, N0, N1)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2304 | } |
| 2305 | case ISD::MUL: { |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2306 | SDValue N1 = Op.getOperand(1); |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2307 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2308 | N0 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0); |
| 2309 | N1 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N1); |
| 2310 | return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8, |
| 2311 | DAG.getNode(Opc, dl, MVT::i16, N0, N1)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2312 | break; |
| 2313 | } |
| 2314 | } |
| 2315 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2316 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2317 | } |
| 2318 | |
| 2319 | //! Lower byte immediate operations for v16i8 vectors: |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2320 | static SDValue |
| 2321 | LowerByteImmed(SDValue Op, SelectionDAG &DAG) { |
| 2322 | SDValue ConstVec; |
| 2323 | SDValue Arg; |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2324 | EVT VT = Op.getValueType(); |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 2325 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2326 | |
| 2327 | ConstVec = Op.getOperand(0); |
| 2328 | Arg = Op.getOperand(1); |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 2329 | if (ConstVec.getNode()->getOpcode() != ISD::BUILD_VECTOR) { |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 2330 | if (ConstVec.getNode()->getOpcode() == ISD::BITCAST) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2331 | ConstVec = ConstVec.getOperand(0); |
| 2332 | } else { |
| 2333 | ConstVec = Op.getOperand(1); |
| 2334 | Arg = Op.getOperand(0); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 2335 | if (ConstVec.getNode()->getOpcode() == ISD::BITCAST) { |
Scott Michel | 7f9ba9b | 2008-01-30 02:55:46 +0000 | [diff] [blame] | 2336 | ConstVec = ConstVec.getOperand(0); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2337 | } |
| 2338 | } |
| 2339 | } |
| 2340 | |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 2341 | if (ConstVec.getNode()->getOpcode() == ISD::BUILD_VECTOR) { |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2342 | BuildVectorSDNode *BCN = dyn_cast<BuildVectorSDNode>(ConstVec.getNode()); |
| 2343 | assert(BCN != 0 && "Expected BuildVectorSDNode in SPU LowerByteImmed"); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2344 | |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2345 | APInt APSplatBits, APSplatUndef; |
| 2346 | unsigned SplatBitSize; |
| 2347 | bool HasAnyUndefs; |
| 2348 | unsigned minSplatBits = VT.getVectorElementType().getSizeInBits(); |
| 2349 | |
| 2350 | if (BCN->isConstantSplat(APSplatBits, APSplatUndef, SplatBitSize, |
| 2351 | HasAnyUndefs, minSplatBits) |
| 2352 | && minSplatBits <= SplatBitSize) { |
| 2353 | uint64_t SplatBits = APSplatBits.getZExtValue(); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2354 | SDValue tc = DAG.getTargetConstant(SplatBits & 0xff, MVT::i8); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2355 | |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2356 | SmallVector<SDValue, 16> tcVec; |
| 2357 | tcVec.assign(16, tc); |
Dale Johannesen | ed2eee6 | 2009-02-06 01:31:28 +0000 | [diff] [blame] | 2358 | return DAG.getNode(Op.getNode()->getOpcode(), dl, VT, Arg, |
Scott Michel | 7ea02ff | 2009-03-17 01:15:45 +0000 | [diff] [blame] | 2359 | DAG.getNode(ISD::BUILD_VECTOR, dl, VT, &tcVec[0], tcVec.size())); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2360 | } |
| 2361 | } |
Scott Michel | 9de57a9 | 2009-01-26 22:33:37 +0000 | [diff] [blame] | 2362 | |
Nate Begeman | 24dc346 | 2008-07-29 19:07:27 +0000 | [diff] [blame] | 2363 | // These operations (AND, OR, XOR) are legal, they just couldn't be custom |
| 2364 | // lowered. Return the operation, rather than a null SDValue. |
| 2365 | return Op; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2366 | } |
| 2367 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2368 | //! Custom lowering for CTPOP (count population) |
| 2369 | /*! |
| 2370 | Custom lowering code that counts the number ones in the input |
| 2371 | operand. SPU has such an instruction, but it counts the number of |
| 2372 | ones per byte, which then have to be accumulated. |
| 2373 | */ |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2374 | static SDValue LowerCTPOP(SDValue Op, SelectionDAG &DAG) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2375 | EVT VT = Op.getValueType(); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 2376 | EVT vecVT = EVT::getVectorVT(*DAG.getContext(), |
Owen Anderson | 23b9b19 | 2009-08-12 00:36:31 +0000 | [diff] [blame] | 2377 | VT, (128 / VT.getSizeInBits())); |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 2378 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2379 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2380 | switch (VT.getSimpleVT().SimpleTy) { |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 2381 | default: |
| 2382 | assert(false && "Invalid value type!"); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2383 | case MVT::i8: { |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2384 | SDValue N = Op.getOperand(0); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2385 | SDValue Elt0 = DAG.getConstant(0, MVT::i32); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2386 | |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 2387 | SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N); |
| 2388 | SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2389 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2390 | return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i8, CNTB, Elt0); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2391 | } |
| 2392 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2393 | case MVT::i16: { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2394 | MachineFunction &MF = DAG.getMachineFunction(); |
Chris Lattner | 84bc542 | 2007-12-31 04:13:23 +0000 | [diff] [blame] | 2395 | MachineRegisterInfo &RegInfo = MF.getRegInfo(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2396 | |
Chris Lattner | 84bc542 | 2007-12-31 04:13:23 +0000 | [diff] [blame] | 2397 | unsigned CNTB_reg = RegInfo.createVirtualRegister(&SPU::R16CRegClass); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2398 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2399 | SDValue N = Op.getOperand(0); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2400 | SDValue Elt0 = DAG.getConstant(0, MVT::i16); |
| 2401 | SDValue Mask0 = DAG.getConstant(0x0f, MVT::i16); |
| 2402 | SDValue Shift1 = DAG.getConstant(8, MVT::i32); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2403 | |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 2404 | SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N); |
| 2405 | SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2406 | |
| 2407 | // CNTB_result becomes the chain to which all of the virtual registers |
| 2408 | // CNTB_reg, SUM1_reg become associated: |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2409 | SDValue CNTB_result = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2410 | DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i16, CNTB, Elt0); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 2411 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2412 | SDValue CNTB_rescopy = |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 2413 | DAG.getCopyToReg(CNTB_result, dl, CNTB_reg, CNTB_result); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2414 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2415 | SDValue Tmp1 = DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i16); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2416 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2417 | return DAG.getNode(ISD::AND, dl, MVT::i16, |
| 2418 | DAG.getNode(ISD::ADD, dl, MVT::i16, |
| 2419 | DAG.getNode(ISD::SRL, dl, MVT::i16, |
Scott Michel | 7f9ba9b | 2008-01-30 02:55:46 +0000 | [diff] [blame] | 2420 | Tmp1, Shift1), |
| 2421 | Tmp1), |
| 2422 | Mask0); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2423 | } |
| 2424 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2425 | case MVT::i32: { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2426 | MachineFunction &MF = DAG.getMachineFunction(); |
Chris Lattner | 84bc542 | 2007-12-31 04:13:23 +0000 | [diff] [blame] | 2427 | MachineRegisterInfo &RegInfo = MF.getRegInfo(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2428 | |
Chris Lattner | 84bc542 | 2007-12-31 04:13:23 +0000 | [diff] [blame] | 2429 | unsigned CNTB_reg = RegInfo.createVirtualRegister(&SPU::R32CRegClass); |
| 2430 | unsigned SUM1_reg = RegInfo.createVirtualRegister(&SPU::R32CRegClass); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2431 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2432 | SDValue N = Op.getOperand(0); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2433 | SDValue Elt0 = DAG.getConstant(0, MVT::i32); |
| 2434 | SDValue Mask0 = DAG.getConstant(0xff, MVT::i32); |
| 2435 | SDValue Shift1 = DAG.getConstant(16, MVT::i32); |
| 2436 | SDValue Shift2 = DAG.getConstant(8, MVT::i32); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2437 | |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 2438 | SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N); |
| 2439 | SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2440 | |
| 2441 | // CNTB_result becomes the chain to which all of the virtual registers |
| 2442 | // CNTB_reg, SUM1_reg become associated: |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2443 | SDValue CNTB_result = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2444 | DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i32, CNTB, Elt0); |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 2445 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2446 | SDValue CNTB_rescopy = |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 2447 | DAG.getCopyToReg(CNTB_result, dl, CNTB_reg, CNTB_result); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2448 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2449 | SDValue Comp1 = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2450 | DAG.getNode(ISD::SRL, dl, MVT::i32, |
| 2451 | DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i32), |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 2452 | Shift1); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2453 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2454 | SDValue Sum1 = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2455 | DAG.getNode(ISD::ADD, dl, MVT::i32, Comp1, |
| 2456 | DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i32)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2457 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2458 | SDValue Sum1_rescopy = |
Dale Johannesen | a05dca4 | 2009-02-04 23:02:30 +0000 | [diff] [blame] | 2459 | DAG.getCopyToReg(CNTB_result, dl, SUM1_reg, Sum1); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2460 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2461 | SDValue Comp2 = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2462 | DAG.getNode(ISD::SRL, dl, MVT::i32, |
| 2463 | DAG.getCopyFromReg(Sum1_rescopy, dl, SUM1_reg, MVT::i32), |
Scott Michel | 7f9ba9b | 2008-01-30 02:55:46 +0000 | [diff] [blame] | 2464 | Shift2); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2465 | SDValue Sum2 = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2466 | DAG.getNode(ISD::ADD, dl, MVT::i32, Comp2, |
| 2467 | DAG.getCopyFromReg(Sum1_rescopy, dl, SUM1_reg, MVT::i32)); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2468 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2469 | return DAG.getNode(ISD::AND, dl, MVT::i32, Sum2, Mask0); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2470 | } |
| 2471 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2472 | case MVT::i64: |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2473 | break; |
| 2474 | } |
| 2475 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2476 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2477 | } |
| 2478 | |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2479 | //! Lower ISD::FP_TO_SINT, ISD::FP_TO_UINT for i32 |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2480 | /*! |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2481 | f32->i32 passes through unchanged, whereas f64->i32 expands to a libcall. |
| 2482 | All conversions to i64 are expanded to a libcall. |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2483 | */ |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2484 | static SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG, |
Dan Gohman | d858e90 | 2010-04-17 15:26:15 +0000 | [diff] [blame] | 2485 | const SPUTargetLowering &TLI) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2486 | EVT OpVT = Op.getValueType(); |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2487 | SDValue Op0 = Op.getOperand(0); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2488 | EVT Op0VT = Op0.getValueType(); |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2489 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2490 | if ((OpVT == MVT::i32 && Op0VT == MVT::f64) |
| 2491 | || OpVT == MVT::i64) { |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2492 | // Convert f32 / f64 to i32 / i64 via libcall. |
| 2493 | RTLIB::Libcall LC = |
| 2494 | (Op.getOpcode() == ISD::FP_TO_SINT) |
| 2495 | ? RTLIB::getFPTOSINT(Op0VT, OpVT) |
| 2496 | : RTLIB::getFPTOUINT(Op0VT, OpVT); |
| 2497 | assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unexpectd fp-to-int conversion!"); |
| 2498 | SDValue Dummy; |
| 2499 | return ExpandLibCall(LC, Op, DAG, false, Dummy, TLI); |
| 2500 | } |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2501 | |
Eli Friedman | 36df499 | 2009-05-27 00:47:34 +0000 | [diff] [blame] | 2502 | return Op; |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2503 | } |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2504 | |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2505 | //! Lower ISD::SINT_TO_FP, ISD::UINT_TO_FP for i32 |
| 2506 | /*! |
| 2507 | i32->f32 passes through unchanged, whereas i32->f64 is expanded to a libcall. |
| 2508 | All conversions from i64 are expanded to a libcall. |
| 2509 | */ |
| 2510 | static SDValue LowerINT_TO_FP(SDValue Op, SelectionDAG &DAG, |
Dan Gohman | d858e90 | 2010-04-17 15:26:15 +0000 | [diff] [blame] | 2511 | const SPUTargetLowering &TLI) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2512 | EVT OpVT = Op.getValueType(); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2513 | SDValue Op0 = Op.getOperand(0); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2514 | EVT Op0VT = Op0.getValueType(); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2515 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2516 | if ((OpVT == MVT::f64 && Op0VT == MVT::i32) |
| 2517 | || Op0VT == MVT::i64) { |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2518 | // Convert i32, i64 to f64 via libcall: |
| 2519 | RTLIB::Libcall LC = |
| 2520 | (Op.getOpcode() == ISD::SINT_TO_FP) |
| 2521 | ? RTLIB::getSINTTOFP(Op0VT, OpVT) |
| 2522 | : RTLIB::getUINTTOFP(Op0VT, OpVT); |
| 2523 | assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unexpectd int-to-fp conversion!"); |
| 2524 | SDValue Dummy; |
| 2525 | return ExpandLibCall(LC, Op, DAG, false, Dummy, TLI); |
| 2526 | } |
| 2527 | |
Eli Friedman | 36df499 | 2009-05-27 00:47:34 +0000 | [diff] [blame] | 2528 | return Op; |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2529 | } |
| 2530 | |
| 2531 | //! Lower ISD::SETCC |
| 2532 | /*! |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2533 | This handles MVT::f64 (double floating point) condition lowering |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2534 | */ |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2535 | static SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG, |
| 2536 | const TargetLowering &TLI) { |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2537 | CondCodeSDNode *CC = dyn_cast<CondCodeSDNode>(Op.getOperand(2)); |
Dale Johannesen | 6f38cb6 | 2009-02-07 19:59:05 +0000 | [diff] [blame] | 2538 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2539 | assert(CC != 0 && "LowerSETCC: CondCodeSDNode should not be null here!\n"); |
| 2540 | |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2541 | SDValue lhs = Op.getOperand(0); |
| 2542 | SDValue rhs = Op.getOperand(1); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2543 | EVT lhsVT = lhs.getValueType(); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2544 | assert(lhsVT == MVT::f64 && "LowerSETCC: type other than MVT::64\n"); |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2545 | |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2546 | EVT ccResultVT = TLI.getSetCCResultType(lhs.getValueType()); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2547 | APInt ccResultOnes = APInt::getAllOnesValue(ccResultVT.getSizeInBits()); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2548 | EVT IntVT(MVT::i64); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2549 | |
| 2550 | // Take advantage of the fact that (truncate (sra arg, 32)) is efficiently |
| 2551 | // selected to a NOP: |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 2552 | SDValue i64lhs = DAG.getNode(ISD::BITCAST, dl, IntVT, lhs); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2553 | SDValue lhsHi32 = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2554 | DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2555 | DAG.getNode(ISD::SRL, dl, IntVT, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2556 | i64lhs, DAG.getConstant(32, MVT::i32))); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2557 | SDValue lhsHi32abs = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2558 | DAG.getNode(ISD::AND, dl, MVT::i32, |
| 2559 | lhsHi32, DAG.getConstant(0x7fffffff, MVT::i32)); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2560 | SDValue lhsLo32 = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2561 | DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, i64lhs); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2562 | |
| 2563 | // SETO and SETUO only use the lhs operand: |
| 2564 | if (CC->get() == ISD::SETO) { |
| 2565 | // Evaluates to true if Op0 is not [SQ]NaN - lowers to the inverse of |
| 2566 | // SETUO |
| 2567 | APInt ccResultAllOnes = APInt::getAllOnesValue(ccResultVT.getSizeInBits()); |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2568 | return DAG.getNode(ISD::XOR, dl, ccResultVT, |
| 2569 | DAG.getSetCC(dl, ccResultVT, |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2570 | lhs, DAG.getConstantFP(0.0, lhsVT), |
| 2571 | ISD::SETUO), |
| 2572 | DAG.getConstant(ccResultAllOnes, ccResultVT)); |
| 2573 | } else if (CC->get() == ISD::SETUO) { |
| 2574 | // Evaluates to true if Op0 is [SQ]NaN |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2575 | return DAG.getNode(ISD::AND, dl, ccResultVT, |
| 2576 | DAG.getSetCC(dl, ccResultVT, |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2577 | lhsHi32abs, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2578 | DAG.getConstant(0x7ff00000, MVT::i32), |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2579 | ISD::SETGE), |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2580 | DAG.getSetCC(dl, ccResultVT, |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2581 | lhsLo32, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2582 | DAG.getConstant(0, MVT::i32), |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2583 | ISD::SETGT)); |
| 2584 | } |
| 2585 | |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 2586 | SDValue i64rhs = DAG.getNode(ISD::BITCAST, dl, IntVT, rhs); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2587 | SDValue rhsHi32 = |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2588 | DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2589 | DAG.getNode(ISD::SRL, dl, IntVT, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2590 | i64rhs, DAG.getConstant(32, MVT::i32))); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2591 | |
| 2592 | // If a value is negative, subtract from the sign magnitude constant: |
| 2593 | SDValue signMag2TC = DAG.getConstant(0x8000000000000000ULL, IntVT); |
| 2594 | |
| 2595 | // Convert the sign-magnitude representation into 2's complement: |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2596 | SDValue lhsSelectMask = DAG.getNode(ISD::SRA, dl, ccResultVT, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2597 | lhsHi32, DAG.getConstant(31, MVT::i32)); |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2598 | SDValue lhsSignMag2TC = DAG.getNode(ISD::SUB, dl, IntVT, signMag2TC, i64lhs); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2599 | SDValue lhsSelect = |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2600 | DAG.getNode(ISD::SELECT, dl, IntVT, |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2601 | lhsSelectMask, lhsSignMag2TC, i64lhs); |
| 2602 | |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2603 | SDValue rhsSelectMask = DAG.getNode(ISD::SRA, dl, ccResultVT, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2604 | rhsHi32, DAG.getConstant(31, MVT::i32)); |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2605 | SDValue rhsSignMag2TC = DAG.getNode(ISD::SUB, dl, IntVT, signMag2TC, i64rhs); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2606 | SDValue rhsSelect = |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2607 | DAG.getNode(ISD::SELECT, dl, IntVT, |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2608 | rhsSelectMask, rhsSignMag2TC, i64rhs); |
| 2609 | |
| 2610 | unsigned compareOp; |
| 2611 | |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2612 | switch (CC->get()) { |
| 2613 | case ISD::SETOEQ: |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2614 | case ISD::SETUEQ: |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2615 | compareOp = ISD::SETEQ; break; |
| 2616 | case ISD::SETOGT: |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2617 | case ISD::SETUGT: |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2618 | compareOp = ISD::SETGT; break; |
| 2619 | case ISD::SETOGE: |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2620 | case ISD::SETUGE: |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2621 | compareOp = ISD::SETGE; break; |
| 2622 | case ISD::SETOLT: |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2623 | case ISD::SETULT: |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2624 | compareOp = ISD::SETLT; break; |
| 2625 | case ISD::SETOLE: |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2626 | case ISD::SETULE: |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2627 | compareOp = ISD::SETLE; break; |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2628 | case ISD::SETUNE: |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2629 | case ISD::SETONE: |
| 2630 | compareOp = ISD::SETNE; break; |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2631 | default: |
Chris Lattner | 75361b6 | 2010-04-07 22:58:41 +0000 | [diff] [blame] | 2632 | report_fatal_error("CellSPU ISel Select: unimplemented f64 condition"); |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2633 | } |
| 2634 | |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2635 | SDValue result = |
Scott Michel | 6e1d147 | 2009-03-16 18:47:25 +0000 | [diff] [blame] | 2636 | DAG.getSetCC(dl, ccResultVT, lhsSelect, rhsSelect, |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2637 | (ISD::CondCode) compareOp); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2638 | |
| 2639 | if ((CC->get() & 0x8) == 0) { |
| 2640 | // Ordered comparison: |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2641 | SDValue lhsNaN = DAG.getSetCC(dl, ccResultVT, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2642 | lhs, DAG.getConstantFP(0.0, MVT::f64), |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2643 | ISD::SETO); |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2644 | SDValue rhsNaN = DAG.getSetCC(dl, ccResultVT, |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2645 | rhs, DAG.getConstantFP(0.0, MVT::f64), |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2646 | ISD::SETO); |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2647 | SDValue ordered = DAG.getNode(ISD::AND, dl, ccResultVT, lhsNaN, rhsNaN); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2648 | |
Dale Johannesen | f5d9789 | 2009-02-04 01:48:28 +0000 | [diff] [blame] | 2649 | result = DAG.getNode(ISD::AND, dl, ccResultVT, ordered, result); |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2650 | } |
| 2651 | |
| 2652 | return result; |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2653 | } |
| 2654 | |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2655 | //! Lower ISD::SELECT_CC |
| 2656 | /*! |
| 2657 | ISD::SELECT_CC can (generally) be implemented directly on the SPU using the |
| 2658 | SELB instruction. |
| 2659 | |
| 2660 | \note Need to revisit this in the future: if the code path through the true |
| 2661 | and false value computations is longer than the latency of a branch (6 |
| 2662 | cycles), then it would be more advantageous to branch and insert a new basic |
| 2663 | block and branch on the condition. However, this code does not make that |
| 2664 | assumption, given the simplisitc uses so far. |
| 2665 | */ |
| 2666 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2667 | static SDValue LowerSELECT_CC(SDValue Op, SelectionDAG &DAG, |
| 2668 | const TargetLowering &TLI) { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2669 | EVT VT = Op.getValueType(); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2670 | SDValue lhs = Op.getOperand(0); |
| 2671 | SDValue rhs = Op.getOperand(1); |
| 2672 | SDValue trueval = Op.getOperand(2); |
| 2673 | SDValue falseval = Op.getOperand(3); |
| 2674 | SDValue condition = Op.getOperand(4); |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 2675 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2676 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2677 | // NOTE: SELB's arguments: $rA, $rB, $mask |
| 2678 | // |
| 2679 | // SELB selects bits from $rA where bits in $mask are 0, bits from $rB |
| 2680 | // where bits in $mask are 1. CCond will be inverted, having 1s where the |
| 2681 | // condition was true and 0s where the condition was false. Hence, the |
| 2682 | // arguments to SELB get reversed. |
| 2683 | |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2684 | // Note: Really should be ISD::SELECT instead of SPUISD::SELB, but LLVM's |
| 2685 | // legalizer insists on combining SETCC/SELECT into SELECT_CC, so we end up |
| 2686 | // with another "cannot select select_cc" assert: |
| 2687 | |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 2688 | SDValue compare = DAG.getNode(ISD::SETCC, dl, |
Duncan Sands | 5480c04 | 2009-01-01 15:52:00 +0000 | [diff] [blame] | 2689 | TLI.getSetCCResultType(Op.getValueType()), |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2690 | lhs, rhs, condition); |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 2691 | return DAG.getNode(SPUISD::SELB, dl, VT, falseval, trueval, compare); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2692 | } |
| 2693 | |
Scott Michel | b30e8f6 | 2008-12-02 19:53:53 +0000 | [diff] [blame] | 2694 | //! Custom lower ISD::TRUNCATE |
| 2695 | static SDValue LowerTRUNCATE(SDValue Op, SelectionDAG &DAG) |
| 2696 | { |
Scott Michel | 6e1d147 | 2009-03-16 18:47:25 +0000 | [diff] [blame] | 2697 | // Type to truncate to |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2698 | EVT VT = Op.getValueType(); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2699 | MVT simpleVT = VT.getSimpleVT(); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 2700 | EVT VecVT = EVT::getVectorVT(*DAG.getContext(), |
Owen Anderson | 23b9b19 | 2009-08-12 00:36:31 +0000 | [diff] [blame] | 2701 | VT, (128 / VT.getSizeInBits())); |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 2702 | DebugLoc dl = Op.getDebugLoc(); |
Scott Michel | b30e8f6 | 2008-12-02 19:53:53 +0000 | [diff] [blame] | 2703 | |
Scott Michel | 6e1d147 | 2009-03-16 18:47:25 +0000 | [diff] [blame] | 2704 | // Type to truncate from |
Scott Michel | b30e8f6 | 2008-12-02 19:53:53 +0000 | [diff] [blame] | 2705 | SDValue Op0 = Op.getOperand(0); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2706 | EVT Op0VT = Op0.getValueType(); |
Scott Michel | b30e8f6 | 2008-12-02 19:53:53 +0000 | [diff] [blame] | 2707 | |
Duncan Sands | cdfad36 | 2010-11-03 12:17:33 +0000 | [diff] [blame] | 2708 | if (Op0VT == MVT::i128 && simpleVT == MVT::i64) { |
Scott Michel | 52d0001 | 2009-01-03 00:27:53 +0000 | [diff] [blame] | 2709 | // Create shuffle mask, least significant doubleword of quadword |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2710 | unsigned maskHigh = 0x08090a0b; |
| 2711 | unsigned maskLow = 0x0c0d0e0f; |
| 2712 | // Use a shuffle to perform the truncation |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2713 | SDValue shufMask = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
| 2714 | DAG.getConstant(maskHigh, MVT::i32), |
| 2715 | DAG.getConstant(maskLow, MVT::i32), |
| 2716 | DAG.getConstant(maskHigh, MVT::i32), |
| 2717 | DAG.getConstant(maskLow, MVT::i32)); |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2718 | |
Scott Michel | 6e1d147 | 2009-03-16 18:47:25 +0000 | [diff] [blame] | 2719 | SDValue truncShuffle = DAG.getNode(SPUISD::SHUFB, dl, VecVT, |
| 2720 | Op0, Op0, shufMask); |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2721 | |
Scott Michel | 6e1d147 | 2009-03-16 18:47:25 +0000 | [diff] [blame] | 2722 | return DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT, truncShuffle); |
Scott Michel | b30e8f6 | 2008-12-02 19:53:53 +0000 | [diff] [blame] | 2723 | } |
| 2724 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2725 | return SDValue(); // Leave the truncate unmolested |
Scott Michel | b30e8f6 | 2008-12-02 19:53:53 +0000 | [diff] [blame] | 2726 | } |
| 2727 | |
Scott Michel | 77f452d | 2009-08-25 22:37:34 +0000 | [diff] [blame] | 2728 | /*! |
| 2729 | * Emit the instruction sequence for i64/i32 -> i128 sign extend. The basic |
| 2730 | * algorithm is to duplicate the sign bit using rotmai to generate at |
| 2731 | * least one byte full of sign bits. Then propagate the "sign-byte" into |
| 2732 | * the leftmost words and the i64/i32 into the rightmost words using shufb. |
| 2733 | * |
| 2734 | * @param Op The sext operand |
| 2735 | * @param DAG The current DAG |
| 2736 | * @return The SDValue with the entire instruction sequence |
| 2737 | */ |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 2738 | static SDValue LowerSIGN_EXTEND(SDValue Op, SelectionDAG &DAG) |
| 2739 | { |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 2740 | DebugLoc dl = Op.getDebugLoc(); |
| 2741 | |
Scott Michel | 77f452d | 2009-08-25 22:37:34 +0000 | [diff] [blame] | 2742 | // Type to extend to |
| 2743 | MVT OpVT = Op.getValueType().getSimpleVT(); |
Scott Michel | 77f452d | 2009-08-25 22:37:34 +0000 | [diff] [blame] | 2744 | |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 2745 | // Type to extend from |
| 2746 | SDValue Op0 = Op.getOperand(0); |
Scott Michel | 77f452d | 2009-08-25 22:37:34 +0000 | [diff] [blame] | 2747 | MVT Op0VT = Op0.getValueType().getSimpleVT(); |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 2748 | |
Kalle Raiskila | 5106b84 | 2011-01-20 15:49:06 +0000 | [diff] [blame] | 2749 | // extend i8 & i16 via i32 |
| 2750 | if (Op0VT == MVT::i8 || Op0VT == MVT::i16) { |
| 2751 | Op0 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i32, Op0); |
| 2752 | Op0VT = MVT::i32; |
| 2753 | } |
| 2754 | |
Scott Michel | 77f452d | 2009-08-25 22:37:34 +0000 | [diff] [blame] | 2755 | // The type to extend to needs to be a i128 and |
| 2756 | // the type to extend from needs to be i64 or i32. |
| 2757 | assert((OpVT == MVT::i128 && (Op0VT == MVT::i64 || Op0VT == MVT::i32)) && |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 2758 | "LowerSIGN_EXTEND: input and/or output operand have wrong size"); |
Duncan Sands | 1f6a329 | 2011-08-12 14:54:45 +0000 | [diff] [blame] | 2759 | (void)OpVT; |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 2760 | |
| 2761 | // Create shuffle mask |
Scott Michel | 77f452d | 2009-08-25 22:37:34 +0000 | [diff] [blame] | 2762 | unsigned mask1 = 0x10101010; // byte 0 - 3 and 4 - 7 |
| 2763 | unsigned mask2 = Op0VT == MVT::i64 ? 0x00010203 : 0x10101010; // byte 8 - 11 |
| 2764 | unsigned mask3 = Op0VT == MVT::i64 ? 0x04050607 : 0x00010203; // byte 12 - 15 |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 2765 | SDValue shufMask = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, |
| 2766 | DAG.getConstant(mask1, MVT::i32), |
| 2767 | DAG.getConstant(mask1, MVT::i32), |
| 2768 | DAG.getConstant(mask2, MVT::i32), |
| 2769 | DAG.getConstant(mask3, MVT::i32)); |
| 2770 | |
Scott Michel | 77f452d | 2009-08-25 22:37:34 +0000 | [diff] [blame] | 2771 | // Word wise arithmetic right shift to generate at least one byte |
| 2772 | // that contains sign bits. |
| 2773 | MVT mvt = Op0VT == MVT::i64 ? MVT::v2i64 : MVT::v4i32; |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 2774 | SDValue sraVal = DAG.getNode(ISD::SRA, |
| 2775 | dl, |
Scott Michel | 77f452d | 2009-08-25 22:37:34 +0000 | [diff] [blame] | 2776 | mvt, |
| 2777 | DAG.getNode(SPUISD::PREFSLOT2VEC, dl, mvt, Op0, Op0), |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 2778 | DAG.getConstant(31, MVT::i32)); |
| 2779 | |
Kalle Raiskila | 940e796 | 2010-10-18 09:34:19 +0000 | [diff] [blame] | 2780 | // reinterpret as a i128 (SHUFB requires it). This gets lowered away. |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 2781 | SDValue extended = SDValue(DAG.getMachineNode(TargetOpcode::COPY_TO_REGCLASS, |
Kalle Raiskila | 940e796 | 2010-10-18 09:34:19 +0000 | [diff] [blame] | 2782 | dl, Op0VT, Op0, |
| 2783 | DAG.getTargetConstant( |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 2784 | SPU::GPRCRegClass.getID(), |
Kalle Raiskila | 940e796 | 2010-10-18 09:34:19 +0000 | [diff] [blame] | 2785 | MVT::i32)), 0); |
Scott Michel | 77f452d | 2009-08-25 22:37:34 +0000 | [diff] [blame] | 2786 | // Shuffle bytes - Copy the sign bits into the upper 64 bits |
| 2787 | // and the input value into the lower 64 bits. |
| 2788 | SDValue extShuffle = DAG.getNode(SPUISD::SHUFB, dl, mvt, |
Kalle Raiskila | 940e796 | 2010-10-18 09:34:19 +0000 | [diff] [blame] | 2789 | extended, sraVal, shufMask); |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 2790 | return DAG.getNode(ISD::BITCAST, dl, MVT::i128, extShuffle); |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 2791 | } |
| 2792 | |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2793 | //! Custom (target-specific) lowering entry point |
| 2794 | /*! |
| 2795 | This is where LLVM's DAG selection process calls to do target-specific |
| 2796 | lowering of nodes. |
| 2797 | */ |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2798 | SDValue |
Dan Gohman | d858e90 | 2010-04-17 15:26:15 +0000 | [diff] [blame] | 2799 | SPUTargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG) const |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2800 | { |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 2801 | unsigned Opc = (unsigned) Op.getOpcode(); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2802 | EVT VT = Op.getValueType(); |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 2803 | |
| 2804 | switch (Opc) { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2805 | default: { |
Torok Edwin | dac237e | 2009-07-08 20:53:28 +0000 | [diff] [blame] | 2806 | #ifndef NDEBUG |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 2807 | errs() << "SPUTargetLowering::LowerOperation(): need to lower this!\n"; |
| 2808 | errs() << "Op.getOpcode() = " << Opc << "\n"; |
| 2809 | errs() << "*Op.getNode():\n"; |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 2810 | Op.getNode()->dump(); |
Torok Edwin | dac237e | 2009-07-08 20:53:28 +0000 | [diff] [blame] | 2811 | #endif |
Torok Edwin | c23197a | 2009-07-14 16:55:14 +0000 | [diff] [blame] | 2812 | llvm_unreachable(0); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2813 | } |
| 2814 | case ISD::LOAD: |
Scott Michel | b30e8f6 | 2008-12-02 19:53:53 +0000 | [diff] [blame] | 2815 | case ISD::EXTLOAD: |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2816 | case ISD::SEXTLOAD: |
| 2817 | case ISD::ZEXTLOAD: |
| 2818 | return LowerLOAD(Op, DAG, SPUTM.getSubtargetImpl()); |
| 2819 | case ISD::STORE: |
| 2820 | return LowerSTORE(Op, DAG, SPUTM.getSubtargetImpl()); |
| 2821 | case ISD::ConstantPool: |
| 2822 | return LowerConstantPool(Op, DAG, SPUTM.getSubtargetImpl()); |
| 2823 | case ISD::GlobalAddress: |
| 2824 | return LowerGlobalAddress(Op, DAG, SPUTM.getSubtargetImpl()); |
| 2825 | case ISD::JumpTable: |
| 2826 | return LowerJumpTable(Op, DAG, SPUTM.getSubtargetImpl()); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2827 | case ISD::ConstantFP: |
| 2828 | return LowerConstantFP(Op, DAG); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2829 | |
Scott Michel | 02d711b | 2008-12-30 23:28:25 +0000 | [diff] [blame] | 2830 | // i8, i64 math ops: |
Scott Michel | 8bf61e8 | 2008-06-02 22:18:03 +0000 | [diff] [blame] | 2831 | case ISD::ADD: |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2832 | case ISD::SUB: |
| 2833 | case ISD::ROTR: |
| 2834 | case ISD::ROTL: |
| 2835 | case ISD::SRL: |
| 2836 | case ISD::SHL: |
Scott Michel | 8bf61e8 | 2008-06-02 22:18:03 +0000 | [diff] [blame] | 2837 | case ISD::SRA: { |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2838 | if (VT == MVT::i8) |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2839 | return LowerI8Math(Op, DAG, Opc, *this); |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 2840 | break; |
Scott Michel | 8bf61e8 | 2008-06-02 22:18:03 +0000 | [diff] [blame] | 2841 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2842 | |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2843 | case ISD::FP_TO_SINT: |
| 2844 | case ISD::FP_TO_UINT: |
| 2845 | return LowerFP_TO_INT(Op, DAG, *this); |
| 2846 | |
| 2847 | case ISD::SINT_TO_FP: |
| 2848 | case ISD::UINT_TO_FP: |
| 2849 | return LowerINT_TO_FP(Op, DAG, *this); |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2850 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2851 | // Vector-related lowering. |
| 2852 | case ISD::BUILD_VECTOR: |
Scott Michel | c9c8b2a | 2009-01-26 03:31:40 +0000 | [diff] [blame] | 2853 | return LowerBUILD_VECTOR(Op, DAG); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2854 | case ISD::SCALAR_TO_VECTOR: |
| 2855 | return LowerSCALAR_TO_VECTOR(Op, DAG); |
| 2856 | case ISD::VECTOR_SHUFFLE: |
| 2857 | return LowerVECTOR_SHUFFLE(Op, DAG); |
| 2858 | case ISD::EXTRACT_VECTOR_ELT: |
| 2859 | return LowerEXTRACT_VECTOR_ELT(Op, DAG); |
| 2860 | case ISD::INSERT_VECTOR_ELT: |
| 2861 | return LowerINSERT_VECTOR_ELT(Op, DAG); |
| 2862 | |
| 2863 | // Look for ANDBI, ORBI and XORBI opportunities and lower appropriately: |
| 2864 | case ISD::AND: |
| 2865 | case ISD::OR: |
| 2866 | case ISD::XOR: |
| 2867 | return LowerByteImmed(Op, DAG); |
| 2868 | |
| 2869 | // Vector and i8 multiply: |
| 2870 | case ISD::MUL: |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 2871 | if (VT == MVT::i8) |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2872 | return LowerI8Math(Op, DAG, Opc, *this); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2873 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2874 | case ISD::CTPOP: |
| 2875 | return LowerCTPOP(Op, DAG); |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 2876 | |
| 2877 | case ISD::SELECT_CC: |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2878 | return LowerSELECT_CC(Op, DAG, *this); |
Scott Michel | b30e8f6 | 2008-12-02 19:53:53 +0000 | [diff] [blame] | 2879 | |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 2880 | case ISD::SETCC: |
| 2881 | return LowerSETCC(Op, DAG, *this); |
| 2882 | |
Scott Michel | b30e8f6 | 2008-12-02 19:53:53 +0000 | [diff] [blame] | 2883 | case ISD::TRUNCATE: |
| 2884 | return LowerTRUNCATE(Op, DAG); |
Scott Michel | f1fa4fd | 2009-08-24 22:28:53 +0000 | [diff] [blame] | 2885 | |
| 2886 | case ISD::SIGN_EXTEND: |
| 2887 | return LowerSIGN_EXTEND(Op, DAG); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2888 | } |
| 2889 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2890 | return SDValue(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2891 | } |
| 2892 | |
Duncan Sands | 1607f05 | 2008-12-01 11:39:25 +0000 | [diff] [blame] | 2893 | void SPUTargetLowering::ReplaceNodeResults(SDNode *N, |
| 2894 | SmallVectorImpl<SDValue>&Results, |
Dan Gohman | d858e90 | 2010-04-17 15:26:15 +0000 | [diff] [blame] | 2895 | SelectionDAG &DAG) const |
Scott Michel | 73ce1c5 | 2008-11-10 23:43:06 +0000 | [diff] [blame] | 2896 | { |
| 2897 | #if 0 |
| 2898 | unsigned Opc = (unsigned) N->getOpcode(); |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2899 | EVT OpVT = N->getValueType(0); |
Scott Michel | 73ce1c5 | 2008-11-10 23:43:06 +0000 | [diff] [blame] | 2900 | |
| 2901 | switch (Opc) { |
| 2902 | default: { |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 2903 | errs() << "SPUTargetLowering::ReplaceNodeResults(): need to fix this!\n"; |
| 2904 | errs() << "Op.getOpcode() = " << Opc << "\n"; |
| 2905 | errs() << "*Op.getNode():\n"; |
Scott Michel | 73ce1c5 | 2008-11-10 23:43:06 +0000 | [diff] [blame] | 2906 | N->dump(); |
| 2907 | abort(); |
| 2908 | /*NOTREACHED*/ |
| 2909 | } |
| 2910 | } |
| 2911 | #endif |
| 2912 | |
| 2913 | /* Otherwise, return unchanged */ |
Scott Michel | 73ce1c5 | 2008-11-10 23:43:06 +0000 | [diff] [blame] | 2914 | } |
| 2915 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2916 | //===----------------------------------------------------------------------===// |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2917 | // Target Optimization Hooks |
| 2918 | //===----------------------------------------------------------------------===// |
| 2919 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2920 | SDValue |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2921 | SPUTargetLowering::PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const |
| 2922 | { |
| 2923 | #if 0 |
| 2924 | TargetMachine &TM = getTargetMachine(); |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 2925 | #endif |
| 2926 | const SPUSubtarget *ST = SPUTM.getSubtargetImpl(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2927 | SelectionDAG &DAG = DCI.DAG; |
Scott Michel | 1a6cdb6 | 2008-12-01 17:56:02 +0000 | [diff] [blame] | 2928 | SDValue Op0 = N->getOperand(0); // everything has at least one operand |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 2929 | EVT NodeVT = N->getValueType(0); // The node's value type |
| 2930 | EVT Op0VT = Op0.getValueType(); // The first operand's result |
Scott Michel | 1a6cdb6 | 2008-12-01 17:56:02 +0000 | [diff] [blame] | 2931 | SDValue Result; // Initially, empty result |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 2932 | DebugLoc dl = N->getDebugLoc(); |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 2933 | |
| 2934 | switch (N->getOpcode()) { |
| 2935 | default: break; |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 2936 | case ISD::ADD: { |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 2937 | SDValue Op1 = N->getOperand(1); |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 2938 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2939 | if (Op0.getOpcode() == SPUISD::IndirectAddr |
| 2940 | || Op1.getOpcode() == SPUISD::IndirectAddr) { |
| 2941 | // Normalize the operands to reduce repeated code |
| 2942 | SDValue IndirectArg = Op0, AddArg = Op1; |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 2943 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2944 | if (Op1.getOpcode() == SPUISD::IndirectAddr) { |
| 2945 | IndirectArg = Op1; |
| 2946 | AddArg = Op0; |
| 2947 | } |
| 2948 | |
| 2949 | if (isa<ConstantSDNode>(AddArg)) { |
| 2950 | ConstantSDNode *CN0 = cast<ConstantSDNode > (AddArg); |
| 2951 | SDValue IndOp1 = IndirectArg.getOperand(1); |
| 2952 | |
| 2953 | if (CN0->isNullValue()) { |
| 2954 | // (add (SPUindirect <arg>, <arg>), 0) -> |
| 2955 | // (SPUindirect <arg>, <arg>) |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 2956 | |
Scott Michel | 23f2ff7 | 2008-12-04 17:16:59 +0000 | [diff] [blame] | 2957 | #if !defined(NDEBUG) |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2958 | if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) { |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 2959 | errs() << "\n" |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2960 | << "Replace: (add (SPUindirect <arg>, <arg>), 0)\n" |
| 2961 | << "With: (SPUindirect <arg>, <arg>)\n"; |
| 2962 | } |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 2963 | #endif |
| 2964 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2965 | return IndirectArg; |
| 2966 | } else if (isa<ConstantSDNode>(IndOp1)) { |
| 2967 | // (add (SPUindirect <arg>, <const>), <const>) -> |
| 2968 | // (SPUindirect <arg>, <const + const>) |
| 2969 | ConstantSDNode *CN1 = cast<ConstantSDNode > (IndOp1); |
| 2970 | int64_t combinedConst = CN0->getSExtValue() + CN1->getSExtValue(); |
| 2971 | SDValue combinedValue = DAG.getConstant(combinedConst, Op0VT); |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 2972 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2973 | #if !defined(NDEBUG) |
| 2974 | if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) { |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 2975 | errs() << "\n" |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2976 | << "Replace: (add (SPUindirect <arg>, " << CN1->getSExtValue() |
| 2977 | << "), " << CN0->getSExtValue() << ")\n" |
| 2978 | << "With: (SPUindirect <arg>, " |
| 2979 | << combinedConst << ")\n"; |
| 2980 | } |
| 2981 | #endif |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 2982 | |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 2983 | return DAG.getNode(SPUISD::IndirectAddr, dl, Op0VT, |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 2984 | IndirectArg, combinedValue); |
| 2985 | } |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 2986 | } |
| 2987 | } |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 2988 | break; |
| 2989 | } |
| 2990 | case ISD::SIGN_EXTEND: |
| 2991 | case ISD::ZERO_EXTEND: |
| 2992 | case ISD::ANY_EXTEND: { |
Scott Michel | 1a6cdb6 | 2008-12-01 17:56:02 +0000 | [diff] [blame] | 2993 | if (Op0.getOpcode() == SPUISD::VEC2PREFSLOT && NodeVT == Op0VT) { |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 2994 | // (any_extend (SPUextract_elt0 <arg>)) -> |
| 2995 | // (SPUextract_elt0 <arg>) |
| 2996 | // Types must match, however... |
Scott Michel | 23f2ff7 | 2008-12-04 17:16:59 +0000 | [diff] [blame] | 2997 | #if !defined(NDEBUG) |
| 2998 | if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) { |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 2999 | errs() << "\nReplace: "; |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 3000 | N->dump(&DAG); |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 3001 | errs() << "\nWith: "; |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 3002 | Op0.getNode()->dump(&DAG); |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 3003 | errs() << "\n"; |
Scott Michel | 23f2ff7 | 2008-12-04 17:16:59 +0000 | [diff] [blame] | 3004 | } |
Scott Michel | 30ee7df | 2008-12-04 03:02:42 +0000 | [diff] [blame] | 3005 | #endif |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3006 | |
| 3007 | return Op0; |
| 3008 | } |
| 3009 | break; |
| 3010 | } |
| 3011 | case SPUISD::IndirectAddr: { |
| 3012 | if (!ST->usingLargeMem() && Op0.getOpcode() == SPUISD::AFormAddr) { |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 3013 | ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N->getOperand(1)); |
Dan Gohman | e368b46 | 2010-06-18 14:22:04 +0000 | [diff] [blame] | 3014 | if (CN != 0 && CN->isNullValue()) { |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3015 | // (SPUindirect (SPUaform <addr>, 0), 0) -> |
| 3016 | // (SPUaform <addr>, 0) |
| 3017 | |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 3018 | DEBUG(errs() << "Replace: "); |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3019 | DEBUG(N->dump(&DAG)); |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 3020 | DEBUG(errs() << "\nWith: "); |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 3021 | DEBUG(Op0.getNode()->dump(&DAG)); |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 3022 | DEBUG(errs() << "\n"); |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3023 | |
| 3024 | return Op0; |
| 3025 | } |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 3026 | } else if (Op0.getOpcode() == ISD::ADD) { |
| 3027 | SDValue Op1 = N->getOperand(1); |
| 3028 | if (ConstantSDNode *CN1 = dyn_cast<ConstantSDNode>(Op1)) { |
| 3029 | // (SPUindirect (add <arg>, <arg>), 0) -> |
| 3030 | // (SPUindirect <arg>, <arg>) |
| 3031 | if (CN1->isNullValue()) { |
| 3032 | |
| 3033 | #if !defined(NDEBUG) |
| 3034 | if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) { |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 3035 | errs() << "\n" |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 3036 | << "Replace: (SPUindirect (add <arg>, <arg>), 0)\n" |
| 3037 | << "With: (SPUindirect <arg>, <arg>)\n"; |
| 3038 | } |
| 3039 | #endif |
| 3040 | |
Dale Johannesen | de06470 | 2009-02-06 21:50:26 +0000 | [diff] [blame] | 3041 | return DAG.getNode(SPUISD::IndirectAddr, dl, Op0VT, |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 3042 | Op0.getOperand(0), Op0.getOperand(1)); |
| 3043 | } |
| 3044 | } |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3045 | } |
| 3046 | break; |
| 3047 | } |
Kalle Raiskila | 7ea1ab5 | 2010-11-12 10:14:03 +0000 | [diff] [blame] | 3048 | case SPUISD::SHL_BITS: |
| 3049 | case SPUISD::SHL_BYTES: |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 3050 | case SPUISD::ROTBYTES_LEFT: { |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 3051 | SDValue Op1 = N->getOperand(1); |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3052 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 3053 | // Kill degenerate vector shifts: |
| 3054 | if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(Op1)) { |
| 3055 | if (CN->isNullValue()) { |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3056 | Result = Op0; |
| 3057 | } |
| 3058 | } |
| 3059 | break; |
| 3060 | } |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 3061 | case SPUISD::PREFSLOT2VEC: { |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3062 | switch (Op0.getOpcode()) { |
| 3063 | default: |
| 3064 | break; |
| 3065 | case ISD::ANY_EXTEND: |
| 3066 | case ISD::ZERO_EXTEND: |
| 3067 | case ISD::SIGN_EXTEND: { |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 3068 | // (SPUprefslot2vec (any|zero|sign_extend (SPUvec2prefslot <arg>))) -> |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3069 | // <arg> |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 3070 | // but only if the SPUprefslot2vec and <arg> types match. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 3071 | SDValue Op00 = Op0.getOperand(0); |
Scott Michel | 104de43 | 2008-11-24 17:11:17 +0000 | [diff] [blame] | 3072 | if (Op00.getOpcode() == SPUISD::VEC2PREFSLOT) { |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 3073 | SDValue Op000 = Op00.getOperand(0); |
Scott Michel | 1a6cdb6 | 2008-12-01 17:56:02 +0000 | [diff] [blame] | 3074 | if (Op000.getValueType() == NodeVT) { |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3075 | Result = Op000; |
| 3076 | } |
| 3077 | } |
| 3078 | break; |
| 3079 | } |
Scott Michel | 104de43 | 2008-11-24 17:11:17 +0000 | [diff] [blame] | 3080 | case SPUISD::VEC2PREFSLOT: { |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 3081 | // (SPUprefslot2vec (SPUvec2prefslot <arg>)) -> |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3082 | // <arg> |
| 3083 | Result = Op0.getOperand(0); |
| 3084 | break; |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 3085 | } |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3086 | } |
| 3087 | break; |
Scott Michel | 053c1da | 2008-01-29 02:16:57 +0000 | [diff] [blame] | 3088 | } |
| 3089 | } |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 3090 | |
Scott Michel | 58c5818 | 2008-01-17 20:38:41 +0000 | [diff] [blame] | 3091 | // Otherwise, return unchanged. |
Scott Michel | 1a6cdb6 | 2008-12-01 17:56:02 +0000 | [diff] [blame] | 3092 | #ifndef NDEBUG |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 3093 | if (Result.getNode()) { |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 3094 | DEBUG(errs() << "\nReplace.SPU: "); |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3095 | DEBUG(N->dump(&DAG)); |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 3096 | DEBUG(errs() << "\nWith: "); |
Gabor Greif | ba36cb5 | 2008-08-28 21:40:38 +0000 | [diff] [blame] | 3097 | DEBUG(Result.getNode()->dump(&DAG)); |
Chris Lattner | 4437ae2 | 2009-08-23 07:05:07 +0000 | [diff] [blame] | 3098 | DEBUG(errs() << "\n"); |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3099 | } |
| 3100 | #endif |
| 3101 | |
| 3102 | return Result; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3103 | } |
| 3104 | |
| 3105 | //===----------------------------------------------------------------------===// |
| 3106 | // Inline Assembly Support |
| 3107 | //===----------------------------------------------------------------------===// |
| 3108 | |
| 3109 | /// getConstraintType - Given a constraint letter, return the type of |
| 3110 | /// constraint it is for this target. |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 3111 | SPUTargetLowering::ConstraintType |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3112 | SPUTargetLowering::getConstraintType(const std::string &ConstraintLetter) const { |
| 3113 | if (ConstraintLetter.size() == 1) { |
| 3114 | switch (ConstraintLetter[0]) { |
| 3115 | default: break; |
| 3116 | case 'b': |
| 3117 | case 'r': |
| 3118 | case 'f': |
| 3119 | case 'v': |
| 3120 | case 'y': |
| 3121 | return C_RegisterClass; |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 3122 | } |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3123 | } |
| 3124 | return TargetLowering::getConstraintType(ConstraintLetter); |
| 3125 | } |
| 3126 | |
John Thompson | 44ab89e | 2010-10-29 17:29:13 +0000 | [diff] [blame] | 3127 | /// Examine constraint type and operand type and determine a weight value. |
| 3128 | /// This object must already have been set up with the operand type |
| 3129 | /// and the current alternative constraint selected. |
| 3130 | TargetLowering::ConstraintWeight |
| 3131 | SPUTargetLowering::getSingleConstraintMatchWeight( |
| 3132 | AsmOperandInfo &info, const char *constraint) const { |
| 3133 | ConstraintWeight weight = CW_Invalid; |
| 3134 | Value *CallOperandVal = info.CallOperandVal; |
| 3135 | // If we don't have a value, we can't do a match, |
| 3136 | // but allow it at the lowest weight. |
| 3137 | if (CallOperandVal == NULL) |
| 3138 | return CW_Default; |
| 3139 | // Look at the constraint type. |
| 3140 | switch (*constraint) { |
| 3141 | default: |
| 3142 | weight = TargetLowering::getSingleConstraintMatchWeight(info, constraint); |
Owen Anderson | 95771af | 2011-02-25 21:41:48 +0000 | [diff] [blame] | 3143 | break; |
John Thompson | 44ab89e | 2010-10-29 17:29:13 +0000 | [diff] [blame] | 3144 | //FIXME: Seems like the supported constraint letters were just copied |
| 3145 | // from PPC, as the following doesn't correspond to the GCC docs. |
| 3146 | // I'm leaving it so until someone adds the corresponding lowering support. |
| 3147 | case 'b': |
| 3148 | case 'r': |
| 3149 | case 'f': |
| 3150 | case 'd': |
| 3151 | case 'v': |
| 3152 | case 'y': |
| 3153 | weight = CW_Register; |
| 3154 | break; |
| 3155 | } |
| 3156 | return weight; |
| 3157 | } |
| 3158 | |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 3159 | std::pair<unsigned, const TargetRegisterClass*> |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3160 | SPUTargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint, |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 3161 | EVT VT) const |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3162 | { |
| 3163 | if (Constraint.size() == 1) { |
| 3164 | // GCC RS6000 Constraint Letters |
| 3165 | switch (Constraint[0]) { |
| 3166 | case 'b': // R1-R31 |
| 3167 | case 'r': // R0-R31 |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 3168 | if (VT == MVT::i64) |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3169 | return std::make_pair(0U, SPU::R64CRegisterClass); |
| 3170 | return std::make_pair(0U, SPU::R32CRegisterClass); |
| 3171 | case 'f': |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 3172 | if (VT == MVT::f32) |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3173 | return std::make_pair(0U, SPU::R32FPRegisterClass); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 3174 | else if (VT == MVT::f64) |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3175 | return std::make_pair(0U, SPU::R64FPRegisterClass); |
| 3176 | break; |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 3177 | case 'v': |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3178 | return std::make_pair(0U, SPU::GPRCRegisterClass); |
| 3179 | } |
| 3180 | } |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 3181 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3182 | return TargetLowering::getRegForInlineAsmConstraint(Constraint, VT); |
| 3183 | } |
| 3184 | |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3185 | //! Compute used/known bits for a SPU operand |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3186 | void |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 3187 | SPUTargetLowering::computeMaskedBitsForTargetNode(const SDValue Op, |
Dan Gohman | 977a76f | 2008-02-13 22:28:48 +0000 | [diff] [blame] | 3188 | const APInt &Mask, |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 3189 | APInt &KnownZero, |
Dan Gohman | fd29e0e | 2008-02-13 00:35:47 +0000 | [diff] [blame] | 3190 | APInt &KnownOne, |
Scott Michel | 7f9ba9b | 2008-01-30 02:55:46 +0000 | [diff] [blame] | 3191 | const SelectionDAG &DAG, |
| 3192 | unsigned Depth ) const { |
Scott Michel | 203b2d6 | 2008-04-30 00:30:08 +0000 | [diff] [blame] | 3193 | #if 0 |
Dan Gohman | de551f9 | 2009-04-01 18:45:54 +0000 | [diff] [blame] | 3194 | const uint64_t uint64_sizebits = sizeof(uint64_t) * CHAR_BIT; |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3195 | |
| 3196 | switch (Op.getOpcode()) { |
| 3197 | default: |
| 3198 | // KnownZero = KnownOne = APInt(Mask.getBitWidth(), 0); |
| 3199 | break; |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3200 | case CALL: |
| 3201 | case SHUFB: |
Scott Michel | 7a1c9e9 | 2008-11-22 23:50:42 +0000 | [diff] [blame] | 3202 | case SHUFFLE_MASK: |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3203 | case CNTB: |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 3204 | case SPUISD::PREFSLOT2VEC: |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3205 | case SPUISD::LDRESULT: |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 3206 | case SPUISD::VEC2PREFSLOT: |
Scott Michel | 203b2d6 | 2008-04-30 00:30:08 +0000 | [diff] [blame] | 3207 | case SPUISD::SHLQUAD_L_BITS: |
| 3208 | case SPUISD::SHLQUAD_L_BYTES: |
Scott Michel | 203b2d6 | 2008-04-30 00:30:08 +0000 | [diff] [blame] | 3209 | case SPUISD::VEC_ROTL: |
| 3210 | case SPUISD::VEC_ROTR: |
Scott Michel | 203b2d6 | 2008-04-30 00:30:08 +0000 | [diff] [blame] | 3211 | case SPUISD::ROTBYTES_LEFT: |
Scott Michel | 8bf61e8 | 2008-06-02 22:18:03 +0000 | [diff] [blame] | 3212 | case SPUISD::SELECT_MASK: |
| 3213 | case SPUISD::SELB: |
Scott Michel | a59d469 | 2008-02-23 18:41:37 +0000 | [diff] [blame] | 3214 | } |
Scott Michel | d1e8d9c | 2009-01-21 04:58:48 +0000 | [diff] [blame] | 3215 | #endif |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3216 | } |
Scott Michel | 02d711b | 2008-12-30 23:28:25 +0000 | [diff] [blame] | 3217 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 3218 | unsigned |
| 3219 | SPUTargetLowering::ComputeNumSignBitsForTargetNode(SDValue Op, |
| 3220 | unsigned Depth) const { |
| 3221 | switch (Op.getOpcode()) { |
| 3222 | default: |
| 3223 | return 1; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3224 | |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 3225 | case ISD::SETCC: { |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 3226 | EVT VT = Op.getValueType(); |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 3227 | |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 3228 | if (VT != MVT::i8 && VT != MVT::i16 && VT != MVT::i32) { |
| 3229 | VT = MVT::i32; |
Scott Michel | f0569be | 2008-12-27 04:51:36 +0000 | [diff] [blame] | 3230 | } |
| 3231 | return VT.getSizeInBits(); |
| 3232 | } |
| 3233 | } |
| 3234 | } |
Scott Michel | 1df30c4 | 2008-12-29 03:23:36 +0000 | [diff] [blame] | 3235 | |
Scott Michel | 203b2d6 | 2008-04-30 00:30:08 +0000 | [diff] [blame] | 3236 | // LowerAsmOperandForConstraint |
| 3237 | void |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 3238 | SPUTargetLowering::LowerAsmOperandForConstraint(SDValue Op, |
Eric Christopher | 100c833 | 2011-06-02 23:16:42 +0000 | [diff] [blame] | 3239 | std::string &Constraint, |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 3240 | std::vector<SDValue> &Ops, |
Scott Michel | 203b2d6 | 2008-04-30 00:30:08 +0000 | [diff] [blame] | 3241 | SelectionDAG &DAG) const { |
| 3242 | // Default, for the time being, to the base class handler |
Eric Christopher | 100c833 | 2011-06-02 23:16:42 +0000 | [diff] [blame] | 3243 | TargetLowering::LowerAsmOperandForConstraint(Op, Constraint, Ops, DAG); |
Scott Michel | 203b2d6 | 2008-04-30 00:30:08 +0000 | [diff] [blame] | 3244 | } |
| 3245 | |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3246 | /// isLegalAddressImmediate - Return true if the integer value can be used |
| 3247 | /// as the offset of the target addressing mode. |
Gabor Greif | 93c53e5 | 2008-08-31 15:37:04 +0000 | [diff] [blame] | 3248 | bool SPUTargetLowering::isLegalAddressImmediate(int64_t V, |
Chris Lattner | db125cf | 2011-07-18 04:54:35 +0000 | [diff] [blame] | 3249 | Type *Ty) const { |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3250 | // SPU's addresses are 256K: |
| 3251 | return (V > -(1 << 18) && V < (1 << 18) - 1); |
| 3252 | } |
| 3253 | |
| 3254 | bool SPUTargetLowering::isLegalAddressImmediate(llvm::GlobalValue* GV) const { |
Scott Michel | 5af8f0e | 2008-07-16 17:17:29 +0000 | [diff] [blame] | 3255 | return false; |
Scott Michel | 266bc8f | 2007-12-04 22:23:35 +0000 | [diff] [blame] | 3256 | } |
Dan Gohman | 6520e20 | 2008-10-18 02:06:02 +0000 | [diff] [blame] | 3257 | |
| 3258 | bool |
| 3259 | SPUTargetLowering::isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const { |
| 3260 | // The SPU target isn't yet aware of offsets. |
| 3261 | return false; |
| 3262 | } |
Kalle Raiskila | 8a52fa6 | 2010-10-07 16:24:35 +0000 | [diff] [blame] | 3263 | |
| 3264 | // can we compare to Imm without writing it into a register? |
| 3265 | bool SPUTargetLowering::isLegalICmpImmediate(int64_t Imm) const { |
| 3266 | //ceqi, cgti, etc. all take s10 operand |
| 3267 | return isInt<10>(Imm); |
| 3268 | } |
| 3269 | |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 3270 | bool |
| 3271 | SPUTargetLowering::isLegalAddressingMode(const AddrMode &AM, |
Chris Lattner | db125cf | 2011-07-18 04:54:35 +0000 | [diff] [blame] | 3272 | Type * ) const{ |
Kalle Raiskila | 8a52fa6 | 2010-10-07 16:24:35 +0000 | [diff] [blame] | 3273 | |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 3274 | // A-form: 18bit absolute address. |
Kalle Raiskila | 8a52fa6 | 2010-10-07 16:24:35 +0000 | [diff] [blame] | 3275 | if (AM.BaseGV && !AM.HasBaseReg && AM.Scale == 0 && AM.BaseOffs == 0) |
| 3276 | return true; |
Wesley Peck | bf17cfa | 2010-11-23 03:31:01 +0000 | [diff] [blame] | 3277 | |
Kalle Raiskila | 8a52fa6 | 2010-10-07 16:24:35 +0000 | [diff] [blame] | 3278 | // D-form: reg + 14bit offset |
| 3279 | if (AM.BaseGV ==0 && AM.HasBaseReg && AM.Scale == 0 && isInt<14>(AM.BaseOffs)) |
| 3280 | return true; |
| 3281 | |
| 3282 | // X-form: reg+reg |
| 3283 | if (AM.BaseGV == 0 && AM.HasBaseReg && AM.Scale == 1 && AM.BaseOffs ==0) |
| 3284 | return true; |
| 3285 | |
| 3286 | return false; |
| 3287 | } |