blob: 14bb8d00c81c99e30c2c96264dd47e65ad782307 [file] [log] [blame]
Scott Michel8efdca42007-12-04 22:23:35 +00001//===-- SPUISelLowering.cpp - Cell SPU DAG Lowering Implementation --------===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner081ce942007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Scott Michel8efdca42007-12-04 22:23:35 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This file implements the SPUTargetLowering class.
11//
12//===----------------------------------------------------------------------===//
13
14#include "SPURegisterNames.h"
15#include "SPUISelLowering.h"
16#include "SPUTargetMachine.h"
Scott Michelbc5fbc12008-04-30 00:30:08 +000017#include "SPUFrameInfo.h"
Scott Michel06eabde2008-12-27 04:51:36 +000018#include "llvm/ADT/APInt.h"
Scott Michel8efdca42007-12-04 22:23:35 +000019#include "llvm/ADT/VectorExtras.h"
pingbak2f387e82009-01-26 03:31:40 +000020#include "llvm/CallingConv.h"
Scott Michel8efdca42007-12-04 22:23:35 +000021#include "llvm/CodeGen/CallingConvLower.h"
22#include "llvm/CodeGen/MachineFrameInfo.h"
23#include "llvm/CodeGen/MachineFunction.h"
24#include "llvm/CodeGen/MachineInstrBuilder.h"
Chris Lattner1b989192007-12-31 04:13:23 +000025#include "llvm/CodeGen/MachineRegisterInfo.h"
Scott Michel8efdca42007-12-04 22:23:35 +000026#include "llvm/CodeGen/SelectionDAG.h"
Scott Michel8efdca42007-12-04 22:23:35 +000027#include "llvm/Constants.h"
28#include "llvm/Function.h"
29#include "llvm/Intrinsics.h"
30#include "llvm/Support/Debug.h"
31#include "llvm/Support/MathExtras.h"
32#include "llvm/Target/TargetOptions.h"
33
34#include <map>
35
36using namespace llvm;
37
38// Used in getTargetNodeName() below
39namespace {
40 std::map<unsigned, const char *> node_names;
41
Duncan Sands92c43912008-06-06 12:08:01 +000042 //! MVT mapping to useful data for Cell SPU
Scott Michel8efdca42007-12-04 22:23:35 +000043 struct valtype_map_s {
Scott Michel56a125e2008-11-22 23:50:42 +000044 const MVT valtype;
45 const int prefslot_byte;
Scott Michel8efdca42007-12-04 22:23:35 +000046 };
Scott Michel4ec722e2008-07-16 17:17:29 +000047
Scott Michel8efdca42007-12-04 22:23:35 +000048 const valtype_map_s valtype_map[] = {
49 { MVT::i1, 3 },
50 { MVT::i8, 3 },
51 { MVT::i16, 2 },
52 { MVT::i32, 0 },
53 { MVT::f32, 0 },
54 { MVT::i64, 0 },
55 { MVT::f64, 0 },
56 { MVT::i128, 0 }
57 };
58
59 const size_t n_valtype_map = sizeof(valtype_map) / sizeof(valtype_map[0]);
60
Duncan Sands92c43912008-06-06 12:08:01 +000061 const valtype_map_s *getValueTypeMapEntry(MVT VT) {
Scott Michel8efdca42007-12-04 22:23:35 +000062 const valtype_map_s *retval = 0;
63
64 for (size_t i = 0; i < n_valtype_map; ++i) {
65 if (valtype_map[i].valtype == VT) {
Scott Michel5a6f17b2008-01-30 02:55:46 +000066 retval = valtype_map + i;
67 break;
Scott Michel8efdca42007-12-04 22:23:35 +000068 }
69 }
70
71#ifndef NDEBUG
72 if (retval == 0) {
73 cerr << "getValueTypeMapEntry returns NULL for "
Duncan Sands92c43912008-06-06 12:08:01 +000074 << VT.getMVTString()
Scott Michel5a6f17b2008-01-30 02:55:46 +000075 << "\n";
Scott Michel8efdca42007-12-04 22:23:35 +000076 abort();
77 }
78#endif
79
80 return retval;
81 }
Scott Michel750b93f2009-01-15 04:41:47 +000082
pingbak2f387e82009-01-26 03:31:40 +000083 //! Expand a library call into an actual call DAG node
84 /*!
85 \note
86 This code is taken from SelectionDAGLegalize, since it is not exposed as
87 part of the LLVM SelectionDAG API.
88 */
89
90 SDValue
91 ExpandLibCall(RTLIB::Libcall LC, SDValue Op, SelectionDAG &DAG,
92 bool isSigned, SDValue &Hi, SPUTargetLowering &TLI) {
93 // The input chain to this libcall is the entry node of the function.
94 // Legalizing the call will automatically add the previous call to the
95 // dependence.
96 SDValue InChain = DAG.getEntryNode();
97
98 TargetLowering::ArgListTy Args;
99 TargetLowering::ArgListEntry Entry;
100 for (unsigned i = 0, e = Op.getNumOperands(); i != e; ++i) {
101 MVT ArgVT = Op.getOperand(i).getValueType();
102 const Type *ArgTy = ArgVT.getTypeForMVT();
103 Entry.Node = Op.getOperand(i);
104 Entry.Ty = ArgTy;
105 Entry.isSExt = isSigned;
106 Entry.isZExt = !isSigned;
107 Args.push_back(Entry);
108 }
109 SDValue Callee = DAG.getExternalSymbol(TLI.getLibcallName(LC),
110 TLI.getPointerTy());
111
112 // Splice the libcall in wherever FindInputOutputChains tells us to.
113 const Type *RetTy = Op.getNode()->getValueType(0).getTypeForMVT();
114 std::pair<SDValue, SDValue> CallInfo =
115 TLI.LowerCallTo(InChain, RetTy, isSigned, !isSigned, false, false,
Dale Johannesenca6237b2009-01-30 23:10:59 +0000116 CallingConv::C, false, Callee, Args, DAG,
117 Op.getNode()->getDebugLoc());
pingbak2f387e82009-01-26 03:31:40 +0000118
119 return CallInfo.first;
120 }
Scott Michel8efdca42007-12-04 22:23:35 +0000121}
122
123SPUTargetLowering::SPUTargetLowering(SPUTargetMachine &TM)
124 : TargetLowering(TM),
125 SPUTM(TM)
126{
127 // Fold away setcc operations if possible.
128 setPow2DivIsCheap();
129
130 // Use _setjmp/_longjmp instead of setjmp/longjmp.
131 setUseUnderscoreSetJmp(true);
132 setUseUnderscoreLongJmp(true);
Scott Michel4ec722e2008-07-16 17:17:29 +0000133
Scott Michel8c67fa42009-01-21 04:58:48 +0000134 // Set RTLIB libcall names as used by SPU:
135 setLibcallName(RTLIB::DIV_F64, "__fast_divdf3");
136
Scott Michel8efdca42007-12-04 22:23:35 +0000137 // Set up the SPU's register classes:
Scott Michel438be252007-12-17 22:32:34 +0000138 addRegisterClass(MVT::i8, SPU::R8CRegisterClass);
139 addRegisterClass(MVT::i16, SPU::R16CRegisterClass);
140 addRegisterClass(MVT::i32, SPU::R32CRegisterClass);
141 addRegisterClass(MVT::i64, SPU::R64CRegisterClass);
142 addRegisterClass(MVT::f32, SPU::R32FPRegisterClass);
143 addRegisterClass(MVT::f64, SPU::R64FPRegisterClass);
Scott Michel8efdca42007-12-04 22:23:35 +0000144 addRegisterClass(MVT::i128, SPU::GPRCRegisterClass);
Scott Michel4ec722e2008-07-16 17:17:29 +0000145
Scott Michel8efdca42007-12-04 22:23:35 +0000146 // SPU has no sign or zero extended loads for i1, i8, i16:
Evan Cheng08c171a2008-10-14 21:26:46 +0000147 setLoadExtAction(ISD::EXTLOAD, MVT::i1, Promote);
148 setLoadExtAction(ISD::SEXTLOAD, MVT::i1, Promote);
149 setLoadExtAction(ISD::ZEXTLOAD, MVT::i1, Promote);
Scott Michel8efdca42007-12-04 22:23:35 +0000150
Scott Michel06eabde2008-12-27 04:51:36 +0000151 setLoadExtAction(ISD::EXTLOAD, MVT::f32, Expand);
152 setLoadExtAction(ISD::EXTLOAD, MVT::f64, Expand);
Scott Michelec8c82e2008-12-02 19:53:53 +0000153
Scott Michel8efdca42007-12-04 22:23:35 +0000154 // SPU constant load actions are custom lowered:
Nate Begeman78125042008-02-14 18:43:04 +0000155 setOperationAction(ISD::ConstantFP, MVT::f32, Legal);
Scott Michel8efdca42007-12-04 22:23:35 +0000156 setOperationAction(ISD::ConstantFP, MVT::f64, Custom);
157
158 // SPU's loads and stores have to be custom lowered:
Scott Michel2ef773a2009-01-06 03:36:14 +0000159 for (unsigned sctype = (unsigned) MVT::i8; sctype < (unsigned) MVT::i128;
Scott Michel8efdca42007-12-04 22:23:35 +0000160 ++sctype) {
Duncan Sands92c43912008-06-06 12:08:01 +0000161 MVT VT = (MVT::SimpleValueType)sctype;
162
Scott Michel06eabde2008-12-27 04:51:36 +0000163 setOperationAction(ISD::LOAD, VT, Custom);
164 setOperationAction(ISD::STORE, VT, Custom);
165 setLoadExtAction(ISD::EXTLOAD, VT, Custom);
166 setLoadExtAction(ISD::ZEXTLOAD, VT, Custom);
167 setLoadExtAction(ISD::SEXTLOAD, VT, Custom);
168
169 for (unsigned stype = sctype - 1; stype >= (unsigned) MVT::i8; --stype) {
170 MVT StoreVT = (MVT::SimpleValueType) stype;
171 setTruncStoreAction(VT, StoreVT, Expand);
172 }
Scott Michel8efdca42007-12-04 22:23:35 +0000173 }
174
Scott Michel06eabde2008-12-27 04:51:36 +0000175 for (unsigned sctype = (unsigned) MVT::f32; sctype < (unsigned) MVT::f64;
176 ++sctype) {
177 MVT VT = (MVT::SimpleValueType) sctype;
178
179 setOperationAction(ISD::LOAD, VT, Custom);
180 setOperationAction(ISD::STORE, VT, Custom);
181
182 for (unsigned stype = sctype - 1; stype >= (unsigned) MVT::f32; --stype) {
183 MVT StoreVT = (MVT::SimpleValueType) stype;
184 setTruncStoreAction(VT, StoreVT, Expand);
185 }
186 }
187
Scott Michel8efdca42007-12-04 22:23:35 +0000188 // Expand the jumptable branches
189 setOperationAction(ISD::BR_JT, MVT::Other, Expand);
190 setOperationAction(ISD::BR_CC, MVT::Other, Expand);
Scott Michel56a125e2008-11-22 23:50:42 +0000191
192 // Custom lower SELECT_CC for most cases, but expand by default
Scott Michel4ec722e2008-07-16 17:17:29 +0000193 setOperationAction(ISD::SELECT_CC, MVT::Other, Expand);
Scott Michel56a125e2008-11-22 23:50:42 +0000194 setOperationAction(ISD::SELECT_CC, MVT::i8, Custom);
195 setOperationAction(ISD::SELECT_CC, MVT::i16, Custom);
196 setOperationAction(ISD::SELECT_CC, MVT::i32, Custom);
197 setOperationAction(ISD::SELECT_CC, MVT::i64, Custom);
Scott Michel8efdca42007-12-04 22:23:35 +0000198
199 // SPU has no intrinsics for these particular operations:
Andrew Lenharth0531ec52008-02-16 14:46:26 +0000200 setOperationAction(ISD::MEMBARRIER, MVT::Other, Expand);
201
Scott Michel06eabde2008-12-27 04:51:36 +0000202 // SPU has no SREM/UREM instructions
Scott Michel8efdca42007-12-04 22:23:35 +0000203 setOperationAction(ISD::SREM, MVT::i32, Expand);
204 setOperationAction(ISD::UREM, MVT::i32, Expand);
205 setOperationAction(ISD::SREM, MVT::i64, Expand);
206 setOperationAction(ISD::UREM, MVT::i64, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000207
Scott Michel8efdca42007-12-04 22:23:35 +0000208 // We don't support sin/cos/sqrt/fmod
209 setOperationAction(ISD::FSIN , MVT::f64, Expand);
210 setOperationAction(ISD::FCOS , MVT::f64, Expand);
211 setOperationAction(ISD::FREM , MVT::f64, Expand);
212 setOperationAction(ISD::FSIN , MVT::f32, Expand);
213 setOperationAction(ISD::FCOS , MVT::f32, Expand);
214 setOperationAction(ISD::FREM , MVT::f32, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000215
pingbak2f387e82009-01-26 03:31:40 +0000216 // Expand fsqrt to the appropriate libcall (NOTE: should use h/w fsqrt
217 // for f32!)
Scott Michel8efdca42007-12-04 22:23:35 +0000218 setOperationAction(ISD::FSQRT, MVT::f64, Expand);
219 setOperationAction(ISD::FSQRT, MVT::f32, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000220
Scott Michel8efdca42007-12-04 22:23:35 +0000221 setOperationAction(ISD::FCOPYSIGN, MVT::f64, Expand);
222 setOperationAction(ISD::FCOPYSIGN, MVT::f32, Expand);
223
224 // SPU can do rotate right and left, so legalize it... but customize for i8
225 // because instructions don't exist.
Bill Wendling965299c2008-08-31 02:59:23 +0000226
227 // FIXME: Change from "expand" to appropriate type once ROTR is supported in
228 // .td files.
229 setOperationAction(ISD::ROTR, MVT::i32, Expand /*Legal*/);
230 setOperationAction(ISD::ROTR, MVT::i16, Expand /*Legal*/);
231 setOperationAction(ISD::ROTR, MVT::i8, Expand /*Custom*/);
232
Scott Michel8efdca42007-12-04 22:23:35 +0000233 setOperationAction(ISD::ROTL, MVT::i32, Legal);
234 setOperationAction(ISD::ROTL, MVT::i16, Legal);
235 setOperationAction(ISD::ROTL, MVT::i8, Custom);
Scott Michelabb8ca12008-11-20 16:36:33 +0000236
Scott Michel8efdca42007-12-04 22:23:35 +0000237 // SPU has no native version of shift left/right for i8
238 setOperationAction(ISD::SHL, MVT::i8, Custom);
239 setOperationAction(ISD::SRL, MVT::i8, Custom);
240 setOperationAction(ISD::SRA, MVT::i8, Custom);
Scott Michel33d73eb2008-11-21 02:56:16 +0000241
Scott Michel4d07fb72008-12-30 23:28:25 +0000242 // Make these operations legal and handle them during instruction selection:
243 setOperationAction(ISD::SHL, MVT::i64, Legal);
244 setOperationAction(ISD::SRL, MVT::i64, Legal);
245 setOperationAction(ISD::SRA, MVT::i64, Legal);
Scott Michel8efdca42007-12-04 22:23:35 +0000246
Scott Michel4ec722e2008-07-16 17:17:29 +0000247 // Custom lower i8, i32 and i64 multiplications
248 setOperationAction(ISD::MUL, MVT::i8, Custom);
Scott Michelae5cbf52008-12-29 03:23:36 +0000249 setOperationAction(ISD::MUL, MVT::i32, Legal);
Scott Michel750b93f2009-01-15 04:41:47 +0000250 setOperationAction(ISD::MUL, MVT::i64, Legal);
Scott Michel33d73eb2008-11-21 02:56:16 +0000251
Scott Michel67224b22008-06-02 22:18:03 +0000252 // Need to custom handle (some) common i8, i64 math ops
Scott Michel4d07fb72008-12-30 23:28:25 +0000253 setOperationAction(ISD::ADD, MVT::i8, Custom);
Scott Michel750b93f2009-01-15 04:41:47 +0000254 setOperationAction(ISD::ADD, MVT::i64, Legal);
Scott Michel8efdca42007-12-04 22:23:35 +0000255 setOperationAction(ISD::SUB, MVT::i8, Custom);
Scott Michel750b93f2009-01-15 04:41:47 +0000256 setOperationAction(ISD::SUB, MVT::i64, Legal);
Scott Michel4ec722e2008-07-16 17:17:29 +0000257
Scott Michel8efdca42007-12-04 22:23:35 +0000258 // SPU does not have BSWAP. It does have i32 support CTLZ.
259 // CTPOP has to be custom lowered.
260 setOperationAction(ISD::BSWAP, MVT::i32, Expand);
261 setOperationAction(ISD::BSWAP, MVT::i64, Expand);
262
263 setOperationAction(ISD::CTPOP, MVT::i8, Custom);
264 setOperationAction(ISD::CTPOP, MVT::i16, Custom);
265 setOperationAction(ISD::CTPOP, MVT::i32, Custom);
266 setOperationAction(ISD::CTPOP, MVT::i64, Custom);
267
268 setOperationAction(ISD::CTTZ , MVT::i32, Expand);
269 setOperationAction(ISD::CTTZ , MVT::i64, Expand);
270
271 setOperationAction(ISD::CTLZ , MVT::i32, Legal);
Scott Michel4ec722e2008-07-16 17:17:29 +0000272
Scott Michel67224b22008-06-02 22:18:03 +0000273 // SPU has a version of select that implements (a&~c)|(b&c), just like
Scott Michel978b96f2008-03-10 23:49:09 +0000274 // select ought to work:
Scott Michel53ab7792008-03-10 16:58:52 +0000275 setOperationAction(ISD::SELECT, MVT::i8, Legal);
Scott Michel6baba072008-03-05 23:02:02 +0000276 setOperationAction(ISD::SELECT, MVT::i16, Legal);
277 setOperationAction(ISD::SELECT, MVT::i32, Legal);
Scott Michel06eabde2008-12-27 04:51:36 +0000278 setOperationAction(ISD::SELECT, MVT::i64, Legal);
Scott Michel8efdca42007-12-04 22:23:35 +0000279
Scott Michel53ab7792008-03-10 16:58:52 +0000280 setOperationAction(ISD::SETCC, MVT::i8, Legal);
281 setOperationAction(ISD::SETCC, MVT::i16, Legal);
Scott Michelae5cbf52008-12-29 03:23:36 +0000282 setOperationAction(ISD::SETCC, MVT::i32, Legal);
283 setOperationAction(ISD::SETCC, MVT::i64, Legal);
Scott Michel8c67fa42009-01-21 04:58:48 +0000284 setOperationAction(ISD::SETCC, MVT::f64, Custom);
Scott Michel6baba072008-03-05 23:02:02 +0000285
Scott Michel06eabde2008-12-27 04:51:36 +0000286 // Custom lower i128 -> i64 truncates
Scott Michelec8c82e2008-12-02 19:53:53 +0000287 setOperationAction(ISD::TRUNCATE, MVT::i64, Custom);
288
pingbak2f387e82009-01-26 03:31:40 +0000289 // SPU has a legal FP -> signed INT instruction for f32, but for f64, need
290 // to expand to a libcall, hence the custom lowering:
291 setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom);
292 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Custom);
Scott Michel8efdca42007-12-04 22:23:35 +0000293
294 // FDIV on SPU requires custom lowering
pingbak2f387e82009-01-26 03:31:40 +0000295 setOperationAction(ISD::FDIV, MVT::f64, Expand); // to libcall
Scott Michel8efdca42007-12-04 22:23:35 +0000296
Scott Michelc899a122009-01-26 22:33:37 +0000297 // SPU has [U|S]INT_TO_FP for f32->i32, but not for f64->i32, f64->i64:
pingbak2f387e82009-01-26 03:31:40 +0000298 setOperationAction(ISD::SINT_TO_FP, MVT::i32, Custom);
Scott Michel8efdca42007-12-04 22:23:35 +0000299 setOperationAction(ISD::SINT_TO_FP, MVT::i16, Promote);
pingbak2f387e82009-01-26 03:31:40 +0000300 setOperationAction(ISD::SINT_TO_FP, MVT::i8, Promote);
301 setOperationAction(ISD::UINT_TO_FP, MVT::i32, Custom);
Scott Michel8efdca42007-12-04 22:23:35 +0000302 setOperationAction(ISD::UINT_TO_FP, MVT::i16, Promote);
pingbak2f387e82009-01-26 03:31:40 +0000303 setOperationAction(ISD::UINT_TO_FP, MVT::i8, Promote);
Scott Michel8efdca42007-12-04 22:23:35 +0000304 setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
305 setOperationAction(ISD::UINT_TO_FP, MVT::i64, Custom);
306
Scott Michel754d8662007-12-20 00:44:13 +0000307 setOperationAction(ISD::BIT_CONVERT, MVT::i32, Legal);
308 setOperationAction(ISD::BIT_CONVERT, MVT::f32, Legal);
309 setOperationAction(ISD::BIT_CONVERT, MVT::i64, Legal);
310 setOperationAction(ISD::BIT_CONVERT, MVT::f64, Legal);
Scott Michel8efdca42007-12-04 22:23:35 +0000311
312 // We cannot sextinreg(i1). Expand to shifts.
313 setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000314
Scott Michel8efdca42007-12-04 22:23:35 +0000315 // Support label based line numbers.
Dan Gohman472d12c2008-06-30 20:59:49 +0000316 setOperationAction(ISD::DBG_STOPPOINT, MVT::Other, Expand);
Scott Michel8efdca42007-12-04 22:23:35 +0000317 setOperationAction(ISD::DEBUG_LOC, MVT::Other, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000318
319 // We want to legalize GlobalAddress and ConstantPool nodes into the
Scott Michel8efdca42007-12-04 22:23:35 +0000320 // appropriate instructions to materialize the address.
Scott Michel33d73eb2008-11-21 02:56:16 +0000321 for (unsigned sctype = (unsigned) MVT::i8; sctype < (unsigned) MVT::f128;
Scott Michelf9f42e62008-01-29 02:16:57 +0000322 ++sctype) {
Duncan Sands92c43912008-06-06 12:08:01 +0000323 MVT VT = (MVT::SimpleValueType)sctype;
324
Scott Michelae5cbf52008-12-29 03:23:36 +0000325 setOperationAction(ISD::GlobalAddress, VT, Custom);
326 setOperationAction(ISD::ConstantPool, VT, Custom);
327 setOperationAction(ISD::JumpTable, VT, Custom);
Scott Michelf9f42e62008-01-29 02:16:57 +0000328 }
Scott Michel8efdca42007-12-04 22:23:35 +0000329
330 // RET must be custom lowered, to meet ABI requirements
331 setOperationAction(ISD::RET, MVT::Other, Custom);
Scott Michel4ec722e2008-07-16 17:17:29 +0000332
Scott Michel8efdca42007-12-04 22:23:35 +0000333 // VASTART needs to be custom lowered to use the VarArgsFrameIndex
334 setOperationAction(ISD::VASTART , MVT::Other, Custom);
Scott Michel4ec722e2008-07-16 17:17:29 +0000335
Scott Michel8efdca42007-12-04 22:23:35 +0000336 // Use the default implementation.
337 setOperationAction(ISD::VAARG , MVT::Other, Expand);
338 setOperationAction(ISD::VACOPY , MVT::Other, Expand);
339 setOperationAction(ISD::VAEND , MVT::Other, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000340 setOperationAction(ISD::STACKSAVE , MVT::Other, Expand);
Scott Michel8efdca42007-12-04 22:23:35 +0000341 setOperationAction(ISD::STACKRESTORE , MVT::Other, Expand);
342 setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i32 , Expand);
343 setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i64 , Expand);
344
345 // Cell SPU has instructions for converting between i64 and fp.
346 setOperationAction(ISD::FP_TO_SINT, MVT::i64, Custom);
347 setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
Scott Michel4ec722e2008-07-16 17:17:29 +0000348
Scott Michel8efdca42007-12-04 22:23:35 +0000349 // To take advantage of the above i64 FP_TO_SINT, promote i32 FP_TO_UINT
350 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Promote);
351
352 // BUILD_PAIR can't be handled natively, and should be expanded to shl/or
353 setOperationAction(ISD::BUILD_PAIR, MVT::i64, Expand);
354
355 // First set operation action for all vector types to expand. Then we
356 // will selectively turn on ones that can be effectively codegen'd.
357 addRegisterClass(MVT::v16i8, SPU::VECREGRegisterClass);
358 addRegisterClass(MVT::v8i16, SPU::VECREGRegisterClass);
359 addRegisterClass(MVT::v4i32, SPU::VECREGRegisterClass);
360 addRegisterClass(MVT::v2i64, SPU::VECREGRegisterClass);
361 addRegisterClass(MVT::v4f32, SPU::VECREGRegisterClass);
362 addRegisterClass(MVT::v2f64, SPU::VECREGRegisterClass);
363
Scott Michel70741542009-01-06 23:10:38 +0000364 // "Odd size" vector classes that we're willing to support:
365 addRegisterClass(MVT::v2i32, SPU::VECREGRegisterClass);
366
Duncan Sands92c43912008-06-06 12:08:01 +0000367 for (unsigned i = (unsigned)MVT::FIRST_VECTOR_VALUETYPE;
368 i <= (unsigned)MVT::LAST_VECTOR_VALUETYPE; ++i) {
369 MVT VT = (MVT::SimpleValueType)i;
Scott Michel8efdca42007-12-04 22:23:35 +0000370
Duncan Sands92c43912008-06-06 12:08:01 +0000371 // add/sub are legal for all supported vector VT's.
pingbak2f387e82009-01-26 03:31:40 +0000372 setOperationAction(ISD::ADD, VT, Legal);
373 setOperationAction(ISD::SUB, VT, Legal);
Duncan Sands92c43912008-06-06 12:08:01 +0000374 // mul has to be custom lowered.
pingbak2f387e82009-01-26 03:31:40 +0000375 setOperationAction(ISD::MUL, VT, Legal);
Duncan Sands92c43912008-06-06 12:08:01 +0000376
pingbak2f387e82009-01-26 03:31:40 +0000377 setOperationAction(ISD::AND, VT, Legal);
378 setOperationAction(ISD::OR, VT, Legal);
379 setOperationAction(ISD::XOR, VT, Legal);
380 setOperationAction(ISD::LOAD, VT, Legal);
381 setOperationAction(ISD::SELECT, VT, Legal);
382 setOperationAction(ISD::STORE, VT, Legal);
Scott Michel4ec722e2008-07-16 17:17:29 +0000383
Scott Michel8efdca42007-12-04 22:23:35 +0000384 // These operations need to be expanded:
pingbak2f387e82009-01-26 03:31:40 +0000385 setOperationAction(ISD::SDIV, VT, Expand);
386 setOperationAction(ISD::SREM, VT, Expand);
387 setOperationAction(ISD::UDIV, VT, Expand);
388 setOperationAction(ISD::UREM, VT, Expand);
Scott Michel8efdca42007-12-04 22:23:35 +0000389
390 // Custom lower build_vector, constant pool spills, insert and
391 // extract vector elements:
Duncan Sands92c43912008-06-06 12:08:01 +0000392 setOperationAction(ISD::BUILD_VECTOR, VT, Custom);
393 setOperationAction(ISD::ConstantPool, VT, Custom);
394 setOperationAction(ISD::SCALAR_TO_VECTOR, VT, Custom);
395 setOperationAction(ISD::EXTRACT_VECTOR_ELT, VT, Custom);
396 setOperationAction(ISD::INSERT_VECTOR_ELT, VT, Custom);
397 setOperationAction(ISD::VECTOR_SHUFFLE, VT, Custom);
Scott Michel8efdca42007-12-04 22:23:35 +0000398 }
399
Scott Michel8efdca42007-12-04 22:23:35 +0000400 setOperationAction(ISD::AND, MVT::v16i8, Custom);
401 setOperationAction(ISD::OR, MVT::v16i8, Custom);
402 setOperationAction(ISD::XOR, MVT::v16i8, Custom);
403 setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4f32, Custom);
Scott Micheldbac4cf2008-01-11 02:53:15 +0000404
Scott Michel4d07fb72008-12-30 23:28:25 +0000405 setOperationAction(ISD::FDIV, MVT::v4f32, Legal);
Scott Michelae5cbf52008-12-29 03:23:36 +0000406
Scott Michel8efdca42007-12-04 22:23:35 +0000407 setShiftAmountType(MVT::i32);
Scott Michel06eabde2008-12-27 04:51:36 +0000408 setBooleanContents(ZeroOrNegativeOneBooleanContent);
Scott Michel4ec722e2008-07-16 17:17:29 +0000409
Scott Michel8efdca42007-12-04 22:23:35 +0000410 setStackPointerRegisterToSaveRestore(SPU::R1);
Scott Michel4ec722e2008-07-16 17:17:29 +0000411
Scott Michel8efdca42007-12-04 22:23:35 +0000412 // We have target-specific dag combine patterns for the following nodes:
Scott Michelf9f42e62008-01-29 02:16:57 +0000413 setTargetDAGCombine(ISD::ADD);
Scott Michel97872d32008-02-23 18:41:37 +0000414 setTargetDAGCombine(ISD::ZERO_EXTEND);
415 setTargetDAGCombine(ISD::SIGN_EXTEND);
416 setTargetDAGCombine(ISD::ANY_EXTEND);
Scott Michel4ec722e2008-07-16 17:17:29 +0000417
Scott Michel8efdca42007-12-04 22:23:35 +0000418 computeRegisterProperties();
Scott Michel56a125e2008-11-22 23:50:42 +0000419
Scott Michel2c261072008-12-09 03:37:19 +0000420 // Set pre-RA register scheduler default to BURR, which produces slightly
421 // better code than the default (could also be TDRR, but TargetLowering.h
422 // needs a mod to support that model):
423 setSchedulingPreference(SchedulingForRegPressure);
Scott Michel8efdca42007-12-04 22:23:35 +0000424}
425
426const char *
427SPUTargetLowering::getTargetNodeName(unsigned Opcode) const
428{
429 if (node_names.empty()) {
430 node_names[(unsigned) SPUISD::RET_FLAG] = "SPUISD::RET_FLAG";
431 node_names[(unsigned) SPUISD::Hi] = "SPUISD::Hi";
432 node_names[(unsigned) SPUISD::Lo] = "SPUISD::Lo";
433 node_names[(unsigned) SPUISD::PCRelAddr] = "SPUISD::PCRelAddr";
Scott Micheldbac4cf2008-01-11 02:53:15 +0000434 node_names[(unsigned) SPUISD::AFormAddr] = "SPUISD::AFormAddr";
Scott Michelf9f42e62008-01-29 02:16:57 +0000435 node_names[(unsigned) SPUISD::IndirectAddr] = "SPUISD::IndirectAddr";
Scott Michel8efdca42007-12-04 22:23:35 +0000436 node_names[(unsigned) SPUISD::LDRESULT] = "SPUISD::LDRESULT";
437 node_names[(unsigned) SPUISD::CALL] = "SPUISD::CALL";
438 node_names[(unsigned) SPUISD::SHUFB] = "SPUISD::SHUFB";
Scott Michel56a125e2008-11-22 23:50:42 +0000439 node_names[(unsigned) SPUISD::SHUFFLE_MASK] = "SPUISD::SHUFFLE_MASK";
Scott Michel8efdca42007-12-04 22:23:35 +0000440 node_names[(unsigned) SPUISD::CNTB] = "SPUISD::CNTB";
Scott Michelae5cbf52008-12-29 03:23:36 +0000441 node_names[(unsigned) SPUISD::PREFSLOT2VEC] = "SPUISD::PREFSLOT2VEC";
Scott Michelc630c412008-11-24 17:11:17 +0000442 node_names[(unsigned) SPUISD::VEC2PREFSLOT] = "SPUISD::VEC2PREFSLOT";
Scott Michel97872d32008-02-23 18:41:37 +0000443 node_names[(unsigned) SPUISD::SHLQUAD_L_BITS] = "SPUISD::SHLQUAD_L_BITS";
444 node_names[(unsigned) SPUISD::SHLQUAD_L_BYTES] = "SPUISD::SHLQUAD_L_BYTES";
Scott Michel8efdca42007-12-04 22:23:35 +0000445 node_names[(unsigned) SPUISD::VEC_SHL] = "SPUISD::VEC_SHL";
446 node_names[(unsigned) SPUISD::VEC_SRL] = "SPUISD::VEC_SRL";
447 node_names[(unsigned) SPUISD::VEC_SRA] = "SPUISD::VEC_SRA";
448 node_names[(unsigned) SPUISD::VEC_ROTL] = "SPUISD::VEC_ROTL";
449 node_names[(unsigned) SPUISD::VEC_ROTR] = "SPUISD::VEC_ROTR";
Scott Michel8c67fa42009-01-21 04:58:48 +0000450 node_names[(unsigned) SPUISD::ROTBYTES_LEFT] = "SPUISD::ROTBYTES_LEFT";
451 node_names[(unsigned) SPUISD::ROTBYTES_LEFT_BITS] =
452 "SPUISD::ROTBYTES_LEFT_BITS";
Scott Michel67224b22008-06-02 22:18:03 +0000453 node_names[(unsigned) SPUISD::SELECT_MASK] = "SPUISD::SELECT_MASK";
Scott Michel8efdca42007-12-04 22:23:35 +0000454 node_names[(unsigned) SPUISD::SELB] = "SPUISD::SELB";
Scott Michel750b93f2009-01-15 04:41:47 +0000455 node_names[(unsigned) SPUISD::ADD64_MARKER] = "SPUISD::ADD64_MARKER";
456 node_names[(unsigned) SPUISD::SUB64_MARKER] = "SPUISD::SUB64_MARKER";
457 node_names[(unsigned) SPUISD::MUL64_MARKER] = "SPUISD::MUL64_MARKER";
Scott Michel8efdca42007-12-04 22:23:35 +0000458 }
459
460 std::map<unsigned, const char *>::iterator i = node_names.find(Opcode);
461
462 return ((i != node_names.end()) ? i->second : 0);
463}
464
Scott Michel06eabde2008-12-27 04:51:36 +0000465//===----------------------------------------------------------------------===//
466// Return the Cell SPU's SETCC result type
467//===----------------------------------------------------------------------===//
468
Duncan Sands4a361272009-01-01 15:52:00 +0000469MVT SPUTargetLowering::getSetCCResultType(MVT VT) const {
Scott Michel06eabde2008-12-27 04:51:36 +0000470 // i16 and i32 are valid SETCC result types
471 return ((VT == MVT::i8 || VT == MVT::i16 || VT == MVT::i32) ? VT : MVT::i32);
Scott Michel53ab7792008-03-10 16:58:52 +0000472}
473
Scott Michel8efdca42007-12-04 22:23:35 +0000474//===----------------------------------------------------------------------===//
475// Calling convention code:
476//===----------------------------------------------------------------------===//
477
478#include "SPUGenCallingConv.inc"
479
480//===----------------------------------------------------------------------===//
481// LowerOperation implementation
482//===----------------------------------------------------------------------===//
483
484/// Custom lower loads for CellSPU
485/*!
486 All CellSPU loads and stores are aligned to 16-byte boundaries, so for elements
487 within a 16-byte block, we have to rotate to extract the requested element.
Scott Michel6ccefab2008-12-04 03:02:42 +0000488
489 For extending loads, we also want to ensure that the following sequence is
490 emitted, e.g. for MVT::f32 extending load to MVT::f64:
491
492\verbatim
Scott Michelae5cbf52008-12-29 03:23:36 +0000493%1 v16i8,ch = load
Scott Michel6ccefab2008-12-04 03:02:42 +0000494%2 v16i8,ch = rotate %1
Scott Michelae5cbf52008-12-29 03:23:36 +0000495%3 v4f8, ch = bitconvert %2
Scott Michel6ccefab2008-12-04 03:02:42 +0000496%4 f32 = vec2perfslot %3
497%5 f64 = fp_extend %4
498\endverbatim
499*/
Dan Gohman8181bd12008-07-27 21:46:04 +0000500static SDValue
501LowerLOAD(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Scott Michel8efdca42007-12-04 22:23:35 +0000502 LoadSDNode *LN = cast<LoadSDNode>(Op);
Dan Gohman8181bd12008-07-27 21:46:04 +0000503 SDValue the_chain = LN->getChain();
Scott Michel06eabde2008-12-27 04:51:36 +0000504 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel6ccefab2008-12-04 03:02:42 +0000505 MVT InVT = LN->getMemoryVT();
506 MVT OutVT = Op.getValueType();
Scott Michel8efdca42007-12-04 22:23:35 +0000507 ISD::LoadExtType ExtType = LN->getExtensionType();
508 unsigned alignment = LN->getAlignment();
Scott Michel06eabde2008-12-27 04:51:36 +0000509 const valtype_map_s *vtm = getValueTypeMapEntry(InVT);
Dale Johannesenea996922009-02-04 20:06:27 +0000510 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +0000511
Scott Michel8efdca42007-12-04 22:23:35 +0000512 switch (LN->getAddressingMode()) {
513 case ISD::UNINDEXED: {
Scott Michel06eabde2008-12-27 04:51:36 +0000514 SDValue result;
515 SDValue basePtr = LN->getBasePtr();
516 SDValue rotate;
Scott Michel8efdca42007-12-04 22:23:35 +0000517
Scott Michel06eabde2008-12-27 04:51:36 +0000518 if (alignment == 16) {
519 ConstantSDNode *CN;
Scott Micheldbac4cf2008-01-11 02:53:15 +0000520
Scott Michel06eabde2008-12-27 04:51:36 +0000521 // Special cases for a known aligned load to simplify the base pointer
522 // and the rotation amount:
523 if (basePtr.getOpcode() == ISD::ADD
524 && (CN = dyn_cast<ConstantSDNode > (basePtr.getOperand(1))) != 0) {
525 // Known offset into basePtr
526 int64_t offset = CN->getSExtValue();
527 int64_t rotamt = int64_t((offset & 0xf) - vtm->prefslot_byte);
Scott Micheldbac4cf2008-01-11 02:53:15 +0000528
Scott Michel06eabde2008-12-27 04:51:36 +0000529 if (rotamt < 0)
530 rotamt += 16;
531
532 rotate = DAG.getConstant(rotamt, MVT::i16);
533
534 // Simplify the base pointer for this case:
535 basePtr = basePtr.getOperand(0);
536 if ((offset & ~0xf) > 0) {
537 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
538 basePtr,
539 DAG.getConstant((offset & ~0xf), PtrVT));
540 }
541 } else if ((basePtr.getOpcode() == SPUISD::AFormAddr)
542 || (basePtr.getOpcode() == SPUISD::IndirectAddr
543 && basePtr.getOperand(0).getOpcode() == SPUISD::Hi
544 && basePtr.getOperand(1).getOpcode() == SPUISD::Lo)) {
545 // Plain aligned a-form address: rotate into preferred slot
546 // Same for (SPUindirect (SPUhi ...), (SPUlo ...))
547 int64_t rotamt = -vtm->prefslot_byte;
548 if (rotamt < 0)
549 rotamt += 16;
550 rotate = DAG.getConstant(rotamt, MVT::i16);
Scott Micheldbac4cf2008-01-11 02:53:15 +0000551 } else {
Scott Michel06eabde2008-12-27 04:51:36 +0000552 // Offset the rotate amount by the basePtr and the preferred slot
553 // byte offset
554 int64_t rotamt = -vtm->prefslot_byte;
555 if (rotamt < 0)
556 rotamt += 16;
Dale Johannesenea996922009-02-04 20:06:27 +0000557 rotate = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000558 basePtr,
Scott Michel5a6f17b2008-01-30 02:55:46 +0000559 DAG.getConstant(rotamt, PtrVT));
Scott Micheldbac4cf2008-01-11 02:53:15 +0000560 }
Scott Michel06eabde2008-12-27 04:51:36 +0000561 } else {
562 // Unaligned load: must be more pessimistic about addressing modes:
563 if (basePtr.getOpcode() == ISD::ADD) {
564 MachineFunction &MF = DAG.getMachineFunction();
565 MachineRegisterInfo &RegInfo = MF.getRegInfo();
566 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
567 SDValue Flag;
Scott Micheldbac4cf2008-01-11 02:53:15 +0000568
Scott Michel06eabde2008-12-27 04:51:36 +0000569 SDValue Op0 = basePtr.getOperand(0);
570 SDValue Op1 = basePtr.getOperand(1);
571
572 if (isa<ConstantSDNode>(Op1)) {
573 // Convert the (add <ptr>, <const>) to an indirect address contained
574 // in a register. Note that this is done because we need to avoid
575 // creating a 0(reg) d-form address due to the SPU's block loads.
576 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT, Op0, Op1);
Dale Johannesenea996922009-02-04 20:06:27 +0000577 the_chain = DAG.getCopyToReg(the_chain, dl, VReg, basePtr, Flag);
578 basePtr = DAG.getCopyFromReg(the_chain, dl, VReg, PtrVT);
Scott Michel06eabde2008-12-27 04:51:36 +0000579 } else {
580 // Convert the (add <arg1>, <arg2>) to an indirect address, which
581 // will likely be lowered as a reg(reg) x-form address.
582 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT, Op0, Op1);
583 }
584 } else {
585 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
586 basePtr,
587 DAG.getConstant(0, PtrVT));
588 }
589
590 // Offset the rotate amount by the basePtr and the preferred slot
591 // byte offset
Dale Johannesenea996922009-02-04 20:06:27 +0000592 rotate = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000593 basePtr,
594 DAG.getConstant(-vtm->prefslot_byte, PtrVT));
Scott Michel8efdca42007-12-04 22:23:35 +0000595 }
Scott Micheldbac4cf2008-01-11 02:53:15 +0000596
Scott Michel06eabde2008-12-27 04:51:36 +0000597 // Re-emit as a v16i8 vector load
Dale Johannesenea996922009-02-04 20:06:27 +0000598 result = DAG.getLoad(MVT::v16i8, dl, the_chain, basePtr,
Scott Michel06eabde2008-12-27 04:51:36 +0000599 LN->getSrcValue(), LN->getSrcValueOffset(),
600 LN->isVolatile(), 16);
601
602 // Update the chain
603 the_chain = result.getValue(1);
604
605 // Rotate into the preferred slot:
Dale Johannesenea996922009-02-04 20:06:27 +0000606 result = DAG.getNode(SPUISD::ROTBYTES_LEFT, dl, MVT::v16i8,
Scott Michel06eabde2008-12-27 04:51:36 +0000607 result.getValue(0), rotate);
608
Scott Michel6ccefab2008-12-04 03:02:42 +0000609 // Convert the loaded v16i8 vector to the appropriate vector type
610 // specified by the operand:
611 MVT vecVT = MVT::getVectorVT(InVT, (128 / InVT.getSizeInBits()));
Dale Johannesenea996922009-02-04 20:06:27 +0000612 result = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, InVT,
613 DAG.getNode(ISD::BIT_CONVERT, dl, vecVT, result));
Scott Michel4ec722e2008-07-16 17:17:29 +0000614
Scott Michel6ccefab2008-12-04 03:02:42 +0000615 // Handle extending loads by extending the scalar result:
616 if (ExtType == ISD::SEXTLOAD) {
Dale Johannesenea996922009-02-04 20:06:27 +0000617 result = DAG.getNode(ISD::SIGN_EXTEND, dl, OutVT, result);
Scott Michel6ccefab2008-12-04 03:02:42 +0000618 } else if (ExtType == ISD::ZEXTLOAD) {
Dale Johannesenea996922009-02-04 20:06:27 +0000619 result = DAG.getNode(ISD::ZERO_EXTEND, dl, OutVT, result);
Scott Michel6ccefab2008-12-04 03:02:42 +0000620 } else if (ExtType == ISD::EXTLOAD) {
621 unsigned NewOpc = ISD::ANY_EXTEND;
Scott Micheldbac4cf2008-01-11 02:53:15 +0000622
Scott Michel6ccefab2008-12-04 03:02:42 +0000623 if (OutVT.isFloatingPoint())
pingbakb8913342009-01-26 03:37:41 +0000624 NewOpc = ISD::FP_EXTEND;
Scott Micheldbac4cf2008-01-11 02:53:15 +0000625
Dale Johannesenea996922009-02-04 20:06:27 +0000626 result = DAG.getNode(NewOpc, dl, OutVT, result);
Scott Micheldbac4cf2008-01-11 02:53:15 +0000627 }
628
Scott Michel6ccefab2008-12-04 03:02:42 +0000629 SDVTList retvts = DAG.getVTList(OutVT, MVT::Other);
Dan Gohman8181bd12008-07-27 21:46:04 +0000630 SDValue retops[2] = {
Scott Michel394e26d2008-01-17 20:38:41 +0000631 result,
Scott Michel5a6f17b2008-01-30 02:55:46 +0000632 the_chain
Scott Michel394e26d2008-01-17 20:38:41 +0000633 };
Scott Micheldbac4cf2008-01-11 02:53:15 +0000634
Dale Johannesenea996922009-02-04 20:06:27 +0000635 result = DAG.getNode(SPUISD::LDRESULT, dl, retvts,
Scott Michel394e26d2008-01-17 20:38:41 +0000636 retops, sizeof(retops) / sizeof(retops[0]));
Scott Micheldbac4cf2008-01-11 02:53:15 +0000637 return result;
Scott Michel8efdca42007-12-04 22:23:35 +0000638 }
639 case ISD::PRE_INC:
640 case ISD::PRE_DEC:
641 case ISD::POST_INC:
642 case ISD::POST_DEC:
643 case ISD::LAST_INDEXED_MODE:
644 cerr << "LowerLOAD: Got a LoadSDNode with an addr mode other than "
645 "UNINDEXED\n";
646 cerr << (unsigned) LN->getAddressingMode() << "\n";
647 abort();
648 /*NOTREACHED*/
649 }
650
Dan Gohman8181bd12008-07-27 21:46:04 +0000651 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000652}
653
654/// Custom lower stores for CellSPU
655/*!
656 All CellSPU stores are aligned to 16-byte boundaries, so for elements
657 within a 16-byte block, we have to generate a shuffle to insert the
658 requested element into its place, then store the resulting block.
659 */
Dan Gohman8181bd12008-07-27 21:46:04 +0000660static SDValue
661LowerSTORE(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Scott Michel8efdca42007-12-04 22:23:35 +0000662 StoreSDNode *SN = cast<StoreSDNode>(Op);
Dan Gohman8181bd12008-07-27 21:46:04 +0000663 SDValue Value = SN->getValue();
Duncan Sands92c43912008-06-06 12:08:01 +0000664 MVT VT = Value.getValueType();
665 MVT StVT = (!SN->isTruncatingStore() ? VT : SN->getMemoryVT());
666 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Dale Johannesenea996922009-02-04 20:06:27 +0000667 DebugLoc dl = Op.getDebugLoc();
Scott Micheldbac4cf2008-01-11 02:53:15 +0000668 unsigned alignment = SN->getAlignment();
Scott Michel8efdca42007-12-04 22:23:35 +0000669
670 switch (SN->getAddressingMode()) {
671 case ISD::UNINDEXED: {
Scott Michel33d73eb2008-11-21 02:56:16 +0000672 // The vector type we really want to load from the 16-byte chunk.
Scott Michele1006032008-11-19 17:45:08 +0000673 MVT vecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits())),
674 stVecVT = MVT::getVectorVT(StVT, (128 / StVT.getSizeInBits()));
Scott Michel8efdca42007-12-04 22:23:35 +0000675
Scott Michel06eabde2008-12-27 04:51:36 +0000676 SDValue alignLoadVec;
677 SDValue basePtr = SN->getBasePtr();
678 SDValue the_chain = SN->getChain();
679 SDValue insertEltOffs;
Scott Michel8efdca42007-12-04 22:23:35 +0000680
Scott Michel06eabde2008-12-27 04:51:36 +0000681 if (alignment == 16) {
682 ConstantSDNode *CN;
683
684 // Special cases for a known aligned load to simplify the base pointer
685 // and insertion byte:
686 if (basePtr.getOpcode() == ISD::ADD
687 && (CN = dyn_cast<ConstantSDNode>(basePtr.getOperand(1))) != 0) {
688 // Known offset into basePtr
689 int64_t offset = CN->getSExtValue();
690
691 // Simplify the base pointer for this case:
692 basePtr = basePtr.getOperand(0);
693 insertEltOffs = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
694 basePtr,
695 DAG.getConstant((offset & 0xf), PtrVT));
696
697 if ((offset & ~0xf) > 0) {
698 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
699 basePtr,
700 DAG.getConstant((offset & ~0xf), PtrVT));
701 }
702 } else {
703 // Otherwise, assume it's at byte 0 of basePtr
704 insertEltOffs = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
705 basePtr,
706 DAG.getConstant(0, PtrVT));
707 }
708 } else {
709 // Unaligned load: must be more pessimistic about addressing modes:
710 if (basePtr.getOpcode() == ISD::ADD) {
711 MachineFunction &MF = DAG.getMachineFunction();
712 MachineRegisterInfo &RegInfo = MF.getRegInfo();
713 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
714 SDValue Flag;
715
716 SDValue Op0 = basePtr.getOperand(0);
717 SDValue Op1 = basePtr.getOperand(1);
718
719 if (isa<ConstantSDNode>(Op1)) {
720 // Convert the (add <ptr>, <const>) to an indirect address contained
721 // in a register. Note that this is done because we need to avoid
722 // creating a 0(reg) d-form address due to the SPU's block loads.
723 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT, Op0, Op1);
Dale Johannesenea996922009-02-04 20:06:27 +0000724 the_chain = DAG.getCopyToReg(the_chain, dl, VReg, basePtr, Flag);
725 basePtr = DAG.getCopyFromReg(the_chain, dl, VReg, PtrVT);
Scott Michel06eabde2008-12-27 04:51:36 +0000726 } else {
727 // Convert the (add <arg1>, <arg2>) to an indirect address, which
728 // will likely be lowered as a reg(reg) x-form address.
729 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT, Op0, Op1);
730 }
731 } else {
732 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
733 basePtr,
734 DAG.getConstant(0, PtrVT));
735 }
736
737 // Insertion point is solely determined by basePtr's contents
Dale Johannesenea996922009-02-04 20:06:27 +0000738 insertEltOffs = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000739 basePtr,
740 DAG.getConstant(0, PtrVT));
741 }
742
743 // Re-emit as a v16i8 vector load
Dale Johannesenea996922009-02-04 20:06:27 +0000744 alignLoadVec = DAG.getLoad(MVT::v16i8, dl, the_chain, basePtr,
Scott Michel06eabde2008-12-27 04:51:36 +0000745 SN->getSrcValue(), SN->getSrcValueOffset(),
746 SN->isVolatile(), 16);
747
748 // Update the chain
749 the_chain = alignLoadVec.getValue(1);
Scott Michel8efdca42007-12-04 22:23:35 +0000750
Scott Micheldbac4cf2008-01-11 02:53:15 +0000751 LoadSDNode *LN = cast<LoadSDNode>(alignLoadVec);
Dan Gohman8181bd12008-07-27 21:46:04 +0000752 SDValue theValue = SN->getValue();
753 SDValue result;
Scott Michel8efdca42007-12-04 22:23:35 +0000754
755 if (StVT != VT
Scott Michel5a6f17b2008-01-30 02:55:46 +0000756 && (theValue.getOpcode() == ISD::AssertZext
757 || theValue.getOpcode() == ISD::AssertSext)) {
Scott Michel8efdca42007-12-04 22:23:35 +0000758 // Drill down and get the value for zero- and sign-extended
759 // quantities
Scott Michel4ec722e2008-07-16 17:17:29 +0000760 theValue = theValue.getOperand(0);
Scott Michel8efdca42007-12-04 22:23:35 +0000761 }
762
Scott Micheldbac4cf2008-01-11 02:53:15 +0000763 // If the base pointer is already a D-form address, then just create
764 // a new D-form address with a slot offset and the orignal base pointer.
765 // Otherwise generate a D-form address with the slot offset relative
766 // to the stack pointer, which is always aligned.
Scott Michel06eabde2008-12-27 04:51:36 +0000767#if !defined(NDEBUG)
768 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
769 cerr << "CellSPU LowerSTORE: basePtr = ";
770 basePtr.getNode()->dump(&DAG);
771 cerr << "\n";
772 }
773#endif
Scott Micheldbac4cf2008-01-11 02:53:15 +0000774
Scott Michelf65c8f02008-11-19 15:24:16 +0000775 SDValue insertEltOp =
Dale Johannesenea996922009-02-04 20:06:27 +0000776 DAG.getNode(SPUISD::SHUFFLE_MASK, dl, vecVT, insertEltOffs);
Scott Michele1006032008-11-19 17:45:08 +0000777 SDValue vectorizeOp =
Dale Johannesenea996922009-02-04 20:06:27 +0000778 DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, vecVT, theValue);
Scott Michelf65c8f02008-11-19 15:24:16 +0000779
Dale Johannesenea996922009-02-04 20:06:27 +0000780 result = DAG.getNode(SPUISD::SHUFB, dl, vecVT,
pingbakb8913342009-01-26 03:37:41 +0000781 vectorizeOp, alignLoadVec,
Dale Johannesenea996922009-02-04 20:06:27 +0000782 DAG.getNode(ISD::BIT_CONVERT, dl,
783 MVT::v4i32, insertEltOp));
Scott Michel8efdca42007-12-04 22:23:35 +0000784
Dale Johannesenea996922009-02-04 20:06:27 +0000785 result = DAG.getStore(the_chain, dl, result, basePtr,
Scott Michel8efdca42007-12-04 22:23:35 +0000786 LN->getSrcValue(), LN->getSrcValueOffset(),
787 LN->isVolatile(), LN->getAlignment());
788
Scott Michel8c2746e2008-12-04 17:16:59 +0000789#if 0 && !defined(NDEBUG)
Scott Michelf65c8f02008-11-19 15:24:16 +0000790 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
791 const SDValue &currentRoot = DAG.getRoot();
792
793 DAG.setRoot(result);
794 cerr << "------- CellSPU:LowerStore result:\n";
795 DAG.dump();
796 cerr << "-------\n";
797 DAG.setRoot(currentRoot);
798 }
799#endif
Scott Michelec8c82e2008-12-02 19:53:53 +0000800
Scott Michel8efdca42007-12-04 22:23:35 +0000801 return result;
802 /*UNREACHED*/
803 }
804 case ISD::PRE_INC:
805 case ISD::PRE_DEC:
806 case ISD::POST_INC:
807 case ISD::POST_DEC:
808 case ISD::LAST_INDEXED_MODE:
809 cerr << "LowerLOAD: Got a LoadSDNode with an addr mode other than "
810 "UNINDEXED\n";
811 cerr << (unsigned) SN->getAddressingMode() << "\n";
812 abort();
813 /*NOTREACHED*/
814 }
815
Dan Gohman8181bd12008-07-27 21:46:04 +0000816 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000817}
818
Scott Michel750b93f2009-01-15 04:41:47 +0000819//! Generate the address of a constant pool entry.
820SDValue
Dan Gohman8181bd12008-07-27 21:46:04 +0000821LowerConstantPool(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands92c43912008-06-06 12:08:01 +0000822 MVT PtrVT = Op.getValueType();
Scott Michel8efdca42007-12-04 22:23:35 +0000823 ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(Op);
824 Constant *C = CP->getConstVal();
Dan Gohman8181bd12008-07-27 21:46:04 +0000825 SDValue CPI = DAG.getTargetConstantPool(C, PtrVT, CP->getAlignment());
826 SDValue Zero = DAG.getConstant(0, PtrVT);
Scott Micheldbac4cf2008-01-11 02:53:15 +0000827 const TargetMachine &TM = DAG.getTarget();
Scott Michel8efdca42007-12-04 22:23:35 +0000828
829 if (TM.getRelocationModel() == Reloc::Static) {
830 if (!ST->usingLargeMem()) {
Dan Gohman8181bd12008-07-27 21:46:04 +0000831 // Just return the SDValue with the constant pool address in it.
Scott Michel394e26d2008-01-17 20:38:41 +0000832 return DAG.getNode(SPUISD::AFormAddr, PtrVT, CPI, Zero);
Scott Michel8efdca42007-12-04 22:23:35 +0000833 } else {
Dan Gohman8181bd12008-07-27 21:46:04 +0000834 SDValue Hi = DAG.getNode(SPUISD::Hi, PtrVT, CPI, Zero);
835 SDValue Lo = DAG.getNode(SPUISD::Lo, PtrVT, CPI, Zero);
Scott Michel97872d32008-02-23 18:41:37 +0000836 return DAG.getNode(SPUISD::IndirectAddr, PtrVT, Hi, Lo);
Scott Michel8efdca42007-12-04 22:23:35 +0000837 }
838 }
839
840 assert(0 &&
Gabor Greife9f7f582008-08-31 15:37:04 +0000841 "LowerConstantPool: Relocation model other than static"
842 " not supported.");
Dan Gohman8181bd12008-07-27 21:46:04 +0000843 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000844}
845
Scott Michel750b93f2009-01-15 04:41:47 +0000846//! Alternate entry point for generating the address of a constant pool entry
847SDValue
848SPU::LowerConstantPool(SDValue Op, SelectionDAG &DAG, const SPUTargetMachine &TM) {
849 return ::LowerConstantPool(Op, DAG, TM.getSubtargetImpl());
850}
851
Dan Gohman8181bd12008-07-27 21:46:04 +0000852static SDValue
853LowerJumpTable(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands92c43912008-06-06 12:08:01 +0000854 MVT PtrVT = Op.getValueType();
Scott Michel8efdca42007-12-04 22:23:35 +0000855 JumpTableSDNode *JT = cast<JumpTableSDNode>(Op);
Dan Gohman8181bd12008-07-27 21:46:04 +0000856 SDValue JTI = DAG.getTargetJumpTable(JT->getIndex(), PtrVT);
857 SDValue Zero = DAG.getConstant(0, PtrVT);
Scott Michel8efdca42007-12-04 22:23:35 +0000858 const TargetMachine &TM = DAG.getTarget();
859
860 if (TM.getRelocationModel() == Reloc::Static) {
Scott Michel97872d32008-02-23 18:41:37 +0000861 if (!ST->usingLargeMem()) {
862 return DAG.getNode(SPUISD::AFormAddr, PtrVT, JTI, Zero);
863 } else {
Dan Gohman8181bd12008-07-27 21:46:04 +0000864 SDValue Hi = DAG.getNode(SPUISD::Hi, PtrVT, JTI, Zero);
865 SDValue Lo = DAG.getNode(SPUISD::Lo, PtrVT, JTI, Zero);
Scott Michel97872d32008-02-23 18:41:37 +0000866 return DAG.getNode(SPUISD::IndirectAddr, PtrVT, Hi, Lo);
867 }
Scott Michel8efdca42007-12-04 22:23:35 +0000868 }
869
870 assert(0 &&
871 "LowerJumpTable: Relocation model other than static not supported.");
Dan Gohman8181bd12008-07-27 21:46:04 +0000872 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000873}
874
Dan Gohman8181bd12008-07-27 21:46:04 +0000875static SDValue
876LowerGlobalAddress(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands92c43912008-06-06 12:08:01 +0000877 MVT PtrVT = Op.getValueType();
Scott Michel8efdca42007-12-04 22:23:35 +0000878 GlobalAddressSDNode *GSDN = cast<GlobalAddressSDNode>(Op);
879 GlobalValue *GV = GSDN->getGlobal();
Dan Gohman8181bd12008-07-27 21:46:04 +0000880 SDValue GA = DAG.getTargetGlobalAddress(GV, PtrVT, GSDN->getOffset());
Scott Michel8efdca42007-12-04 22:23:35 +0000881 const TargetMachine &TM = DAG.getTarget();
Dan Gohman8181bd12008-07-27 21:46:04 +0000882 SDValue Zero = DAG.getConstant(0, PtrVT);
Scott Michel4ec722e2008-07-16 17:17:29 +0000883
Scott Michel8efdca42007-12-04 22:23:35 +0000884 if (TM.getRelocationModel() == Reloc::Static) {
Scott Michelf9f42e62008-01-29 02:16:57 +0000885 if (!ST->usingLargeMem()) {
886 return DAG.getNode(SPUISD::AFormAddr, PtrVT, GA, Zero);
887 } else {
Dan Gohman8181bd12008-07-27 21:46:04 +0000888 SDValue Hi = DAG.getNode(SPUISD::Hi, PtrVT, GA, Zero);
889 SDValue Lo = DAG.getNode(SPUISD::Lo, PtrVT, GA, Zero);
Scott Michelf9f42e62008-01-29 02:16:57 +0000890 return DAG.getNode(SPUISD::IndirectAddr, PtrVT, Hi, Lo);
891 }
Scott Michel8efdca42007-12-04 22:23:35 +0000892 } else {
893 cerr << "LowerGlobalAddress: Relocation model other than static not "
Scott Michel5a6f17b2008-01-30 02:55:46 +0000894 << "supported.\n";
Scott Michel8efdca42007-12-04 22:23:35 +0000895 abort();
896 /*NOTREACHED*/
897 }
898
Dan Gohman8181bd12008-07-27 21:46:04 +0000899 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000900}
901
Nate Begeman78125042008-02-14 18:43:04 +0000902//! Custom lower double precision floating point constants
Dan Gohman8181bd12008-07-27 21:46:04 +0000903static SDValue
904LowerConstantFP(SDValue Op, SelectionDAG &DAG) {
Duncan Sands92c43912008-06-06 12:08:01 +0000905 MVT VT = Op.getValueType();
Scott Michel8efdca42007-12-04 22:23:35 +0000906
Nate Begeman78125042008-02-14 18:43:04 +0000907 if (VT == MVT::f64) {
Scott Michel0718cd82008-12-01 17:56:02 +0000908 ConstantFPSDNode *FP = cast<ConstantFPSDNode>(Op.getNode());
909
910 assert((FP != 0) &&
911 "LowerConstantFP: Node is not ConstantFPSDNode");
Scott Michelae5cbf52008-12-29 03:23:36 +0000912
Scott Michel11e88bb2007-12-19 20:15:47 +0000913 uint64_t dbits = DoubleToBits(FP->getValueAPF().convertToDouble());
Scott Michel0718cd82008-12-01 17:56:02 +0000914 SDValue T = DAG.getConstant(dbits, MVT::i64);
915 SDValue Tvec = DAG.getNode(ISD::BUILD_VECTOR, MVT::v2i64, T, T);
916 return DAG.getNode(SPUISD::VEC2PREFSLOT, VT,
917 DAG.getNode(ISD::BIT_CONVERT, MVT::v2f64, Tvec));
Scott Michel8efdca42007-12-04 22:23:35 +0000918 }
919
Dan Gohman8181bd12008-07-27 21:46:04 +0000920 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000921}
922
Dan Gohman8181bd12008-07-27 21:46:04 +0000923static SDValue
Dan Gohman8181bd12008-07-27 21:46:04 +0000924LowerFORMAL_ARGUMENTS(SDValue Op, SelectionDAG &DAG, int &VarArgsFrameIndex)
Scott Michel8efdca42007-12-04 22:23:35 +0000925{
926 MachineFunction &MF = DAG.getMachineFunction();
927 MachineFrameInfo *MFI = MF.getFrameInfo();
Chris Lattner1b989192007-12-31 04:13:23 +0000928 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Michela313fb02008-10-30 01:51:48 +0000929 SmallVector<SDValue, 48> ArgValues;
Dan Gohman8181bd12008-07-27 21:46:04 +0000930 SDValue Root = Op.getOperand(0);
Dan Gohmanfaeb4a32008-09-12 16:56:44 +0000931 bool isVarArg = cast<ConstantSDNode>(Op.getOperand(2))->getZExtValue() != 0;
Dale Johannesenea996922009-02-04 20:06:27 +0000932 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +0000933
934 const unsigned *ArgRegs = SPURegisterInfo::getArgRegs();
935 const unsigned NumArgRegs = SPURegisterInfo::getNumArgRegs();
Scott Michel4ec722e2008-07-16 17:17:29 +0000936
Scott Michel8efdca42007-12-04 22:23:35 +0000937 unsigned ArgOffset = SPUFrameInfo::minStackSize();
938 unsigned ArgRegIdx = 0;
939 unsigned StackSlotSize = SPUFrameInfo::stackSlotSize();
Scott Michel4ec722e2008-07-16 17:17:29 +0000940
Duncan Sands92c43912008-06-06 12:08:01 +0000941 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel4ec722e2008-07-16 17:17:29 +0000942
Scott Michel8efdca42007-12-04 22:23:35 +0000943 // Add DAG nodes to load the arguments or copy them out of registers.
Gabor Greife9f7f582008-08-31 15:37:04 +0000944 for (unsigned ArgNo = 0, e = Op.getNode()->getNumValues() - 1;
945 ArgNo != e; ++ArgNo) {
Duncan Sands92c43912008-06-06 12:08:01 +0000946 MVT ObjectVT = Op.getValue(ArgNo).getValueType();
947 unsigned ObjSize = ObjectVT.getSizeInBits()/8;
Scott Michela313fb02008-10-30 01:51:48 +0000948 SDValue ArgVal;
Scott Michel8efdca42007-12-04 22:23:35 +0000949
Scott Michela313fb02008-10-30 01:51:48 +0000950 if (ArgRegIdx < NumArgRegs) {
951 const TargetRegisterClass *ArgRegClass;
Scott Michel4ec722e2008-07-16 17:17:29 +0000952
Scott Michela313fb02008-10-30 01:51:48 +0000953 switch (ObjectVT.getSimpleVT()) {
954 default: {
Scott Michel33d73eb2008-11-21 02:56:16 +0000955 cerr << "LowerFORMAL_ARGUMENTS Unhandled argument type: "
956 << ObjectVT.getMVTString()
957 << "\n";
958 abort();
Scott Michela313fb02008-10-30 01:51:48 +0000959 }
960 case MVT::i8:
Scott Michel33d73eb2008-11-21 02:56:16 +0000961 ArgRegClass = &SPU::R8CRegClass;
962 break;
Scott Michela313fb02008-10-30 01:51:48 +0000963 case MVT::i16:
Scott Michel33d73eb2008-11-21 02:56:16 +0000964 ArgRegClass = &SPU::R16CRegClass;
965 break;
Scott Michela313fb02008-10-30 01:51:48 +0000966 case MVT::i32:
Scott Michel33d73eb2008-11-21 02:56:16 +0000967 ArgRegClass = &SPU::R32CRegClass;
968 break;
Scott Michela313fb02008-10-30 01:51:48 +0000969 case MVT::i64:
Scott Michel33d73eb2008-11-21 02:56:16 +0000970 ArgRegClass = &SPU::R64CRegClass;
971 break;
Scott Michel2ef773a2009-01-06 03:36:14 +0000972 case MVT::i128:
973 ArgRegClass = &SPU::GPRCRegClass;
974 break;
Scott Michela313fb02008-10-30 01:51:48 +0000975 case MVT::f32:
Scott Michel33d73eb2008-11-21 02:56:16 +0000976 ArgRegClass = &SPU::R32FPRegClass;
977 break;
Scott Michela313fb02008-10-30 01:51:48 +0000978 case MVT::f64:
Scott Michel33d73eb2008-11-21 02:56:16 +0000979 ArgRegClass = &SPU::R64FPRegClass;
980 break;
Scott Michela313fb02008-10-30 01:51:48 +0000981 case MVT::v2f64:
982 case MVT::v4f32:
983 case MVT::v2i64:
984 case MVT::v4i32:
985 case MVT::v8i16:
986 case MVT::v16i8:
Scott Michel33d73eb2008-11-21 02:56:16 +0000987 ArgRegClass = &SPU::VECREGRegClass;
988 break;
Scott Michela313fb02008-10-30 01:51:48 +0000989 }
990
991 unsigned VReg = RegInfo.createVirtualRegister(ArgRegClass);
992 RegInfo.addLiveIn(ArgRegs[ArgRegIdx], VReg);
Dale Johannesenea996922009-02-04 20:06:27 +0000993 ArgVal = DAG.getCopyFromReg(Root, dl, VReg, ObjectVT);
Scott Michela313fb02008-10-30 01:51:48 +0000994 ++ArgRegIdx;
995 } else {
996 // We need to load the argument to a virtual register if we determined
997 // above that we ran out of physical registers of the appropriate type
998 // or we're forced to do vararg
Chris Lattner60069452008-02-13 07:35:30 +0000999 int FI = MFI->CreateFixedObject(ObjSize, ArgOffset);
Dan Gohman8181bd12008-07-27 21:46:04 +00001000 SDValue FIN = DAG.getFrameIndex(FI, PtrVT);
Dale Johannesenea996922009-02-04 20:06:27 +00001001 ArgVal = DAG.getLoad(ObjectVT, dl, Root, FIN, NULL, 0);
Scott Michel8efdca42007-12-04 22:23:35 +00001002 ArgOffset += StackSlotSize;
1003 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001004
Scott Michel8efdca42007-12-04 22:23:35 +00001005 ArgValues.push_back(ArgVal);
Scott Michela313fb02008-10-30 01:51:48 +00001006 // Update the chain
1007 Root = ArgVal.getOperand(0);
Scott Michel8efdca42007-12-04 22:23:35 +00001008 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001009
Scott Michela313fb02008-10-30 01:51:48 +00001010 // vararg handling:
Scott Michel8efdca42007-12-04 22:23:35 +00001011 if (isVarArg) {
Scott Michela313fb02008-10-30 01:51:48 +00001012 // unsigned int ptr_size = PtrVT.getSizeInBits() / 8;
1013 // We will spill (79-3)+1 registers to the stack
1014 SmallVector<SDValue, 79-3+1> MemOps;
1015
1016 // Create the frame slot
1017
Scott Michel8efdca42007-12-04 22:23:35 +00001018 for (; ArgRegIdx != NumArgRegs; ++ArgRegIdx) {
Scott Michela313fb02008-10-30 01:51:48 +00001019 VarArgsFrameIndex = MFI->CreateFixedObject(StackSlotSize, ArgOffset);
1020 SDValue FIN = DAG.getFrameIndex(VarArgsFrameIndex, PtrVT);
1021 SDValue ArgVal = DAG.getRegister(ArgRegs[ArgRegIdx], MVT::v16i8);
Dale Johannesenea996922009-02-04 20:06:27 +00001022 SDValue Store = DAG.getStore(Root, dl, ArgVal, FIN, NULL, 0);
Scott Michela313fb02008-10-30 01:51:48 +00001023 Root = Store.getOperand(0);
Scott Michel8efdca42007-12-04 22:23:35 +00001024 MemOps.push_back(Store);
Scott Michela313fb02008-10-30 01:51:48 +00001025
1026 // Increment address by stack slot size for the next stored argument
1027 ArgOffset += StackSlotSize;
Scott Michel8efdca42007-12-04 22:23:35 +00001028 }
1029 if (!MemOps.empty())
Dale Johannesenea996922009-02-04 20:06:27 +00001030 Root = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
1031 &MemOps[0], MemOps.size());
Scott Michel8efdca42007-12-04 22:23:35 +00001032 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001033
Scott Michel8efdca42007-12-04 22:23:35 +00001034 ArgValues.push_back(Root);
Scott Michel4ec722e2008-07-16 17:17:29 +00001035
Scott Michel8efdca42007-12-04 22:23:35 +00001036 // Return the new list of results.
Dale Johannesenea996922009-02-04 20:06:27 +00001037 return DAG.getNode(ISD::MERGE_VALUES, dl, Op.getNode()->getVTList(),
Duncan Sands42d7bb82008-12-01 11:41:29 +00001038 &ArgValues[0], ArgValues.size());
Scott Michel8efdca42007-12-04 22:23:35 +00001039}
1040
1041/// isLSAAddress - Return the immediate to use if the specified
1042/// value is representable as a LSA address.
Dan Gohman8181bd12008-07-27 21:46:04 +00001043static SDNode *isLSAAddress(SDValue Op, SelectionDAG &DAG) {
Scott Michel5974f432008-11-11 03:06:06 +00001044 ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op);
Scott Michel8efdca42007-12-04 22:23:35 +00001045 if (!C) return 0;
Scott Michel4ec722e2008-07-16 17:17:29 +00001046
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001047 int Addr = C->getZExtValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001048 if ((Addr & 3) != 0 || // Low 2 bits are implicitly zero.
1049 (Addr << 14 >> 14) != Addr)
1050 return 0; // Top 14 bits have to be sext of immediate.
Scott Michel4ec722e2008-07-16 17:17:29 +00001051
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001052 return DAG.getConstant((int)C->getZExtValue() >> 2, MVT::i32).getNode();
Scott Michel8efdca42007-12-04 22:23:35 +00001053}
1054
Scott Michel70741542009-01-06 23:10:38 +00001055static SDValue
Dan Gohman8181bd12008-07-27 21:46:04 +00001056LowerCALL(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Dan Gohman705e3f72008-09-13 01:54:27 +00001057 CallSDNode *TheCall = cast<CallSDNode>(Op.getNode());
1058 SDValue Chain = TheCall->getChain();
Dan Gohman705e3f72008-09-13 01:54:27 +00001059 SDValue Callee = TheCall->getCallee();
1060 unsigned NumOps = TheCall->getNumArgs();
Scott Michel8efdca42007-12-04 22:23:35 +00001061 unsigned StackSlotSize = SPUFrameInfo::stackSlotSize();
1062 const unsigned *ArgRegs = SPURegisterInfo::getArgRegs();
1063 const unsigned NumArgRegs = SPURegisterInfo::getNumArgRegs();
Dale Johannesenea996922009-02-04 20:06:27 +00001064 DebugLoc dl = TheCall->getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00001065
1066 // Handy pointer type
Duncan Sands92c43912008-06-06 12:08:01 +00001067 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel4ec722e2008-07-16 17:17:29 +00001068
Scott Michel8efdca42007-12-04 22:23:35 +00001069 // Accumulate how many bytes are to be pushed on the stack, including the
1070 // linkage area, and parameter passing area. According to the SPU ABI,
1071 // we minimally need space for [LR] and [SP]
1072 unsigned NumStackBytes = SPUFrameInfo::minStackSize();
Scott Michel4ec722e2008-07-16 17:17:29 +00001073
Scott Michel8efdca42007-12-04 22:23:35 +00001074 // Set up a copy of the stack pointer for use loading and storing any
1075 // arguments that may not fit in the registers available for argument
1076 // passing.
Dan Gohman8181bd12008-07-27 21:46:04 +00001077 SDValue StackPtr = DAG.getRegister(SPU::R1, MVT::i32);
Scott Michel4ec722e2008-07-16 17:17:29 +00001078
Scott Michel8efdca42007-12-04 22:23:35 +00001079 // Figure out which arguments are going to go in registers, and which in
1080 // memory.
1081 unsigned ArgOffset = SPUFrameInfo::minStackSize(); // Just below [LR]
1082 unsigned ArgRegIdx = 0;
1083
1084 // Keep track of registers passing arguments
Dan Gohman8181bd12008-07-27 21:46:04 +00001085 std::vector<std::pair<unsigned, SDValue> > RegsToPass;
Scott Michel8efdca42007-12-04 22:23:35 +00001086 // And the arguments passed on the stack
Dan Gohman8181bd12008-07-27 21:46:04 +00001087 SmallVector<SDValue, 8> MemOpChains;
Scott Michel8efdca42007-12-04 22:23:35 +00001088
1089 for (unsigned i = 0; i != NumOps; ++i) {
Dan Gohman705e3f72008-09-13 01:54:27 +00001090 SDValue Arg = TheCall->getArg(i);
Scott Michel4ec722e2008-07-16 17:17:29 +00001091
Scott Michel8efdca42007-12-04 22:23:35 +00001092 // PtrOff will be used to store the current argument to the stack if a
1093 // register cannot be found for it.
Dan Gohman8181bd12008-07-27 21:46:04 +00001094 SDValue PtrOff = DAG.getConstant(ArgOffset, StackPtr.getValueType());
Dale Johannesenea996922009-02-04 20:06:27 +00001095 PtrOff = DAG.getNode(ISD::ADD, dl, PtrVT, StackPtr, PtrOff);
Scott Michel8efdca42007-12-04 22:23:35 +00001096
Duncan Sands92c43912008-06-06 12:08:01 +00001097 switch (Arg.getValueType().getSimpleVT()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001098 default: assert(0 && "Unexpected ValueType for argument!");
Scott Michel2ef773a2009-01-06 03:36:14 +00001099 case MVT::i8:
1100 case MVT::i16:
Scott Michel8efdca42007-12-04 22:23:35 +00001101 case MVT::i32:
1102 case MVT::i64:
1103 case MVT::i128:
1104 if (ArgRegIdx != NumArgRegs) {
1105 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1106 } else {
Dale Johannesenea996922009-02-04 20:06:27 +00001107 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel5a6f17b2008-01-30 02:55:46 +00001108 ArgOffset += StackSlotSize;
Scott Michel8efdca42007-12-04 22:23:35 +00001109 }
1110 break;
1111 case MVT::f32:
1112 case MVT::f64:
1113 if (ArgRegIdx != NumArgRegs) {
1114 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1115 } else {
Dale Johannesenea996922009-02-04 20:06:27 +00001116 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel5a6f17b2008-01-30 02:55:46 +00001117 ArgOffset += StackSlotSize;
Scott Michel8efdca42007-12-04 22:23:35 +00001118 }
1119 break;
Scott Michele2641a12008-12-04 21:01:44 +00001120 case MVT::v2i64:
1121 case MVT::v2f64:
Scott Michel8efdca42007-12-04 22:23:35 +00001122 case MVT::v4f32:
1123 case MVT::v4i32:
1124 case MVT::v8i16:
1125 case MVT::v16i8:
1126 if (ArgRegIdx != NumArgRegs) {
1127 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1128 } else {
Dale Johannesenea996922009-02-04 20:06:27 +00001129 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel5a6f17b2008-01-30 02:55:46 +00001130 ArgOffset += StackSlotSize;
Scott Michel8efdca42007-12-04 22:23:35 +00001131 }
1132 break;
1133 }
1134 }
1135
1136 // Update number of stack bytes actually used, insert a call sequence start
1137 NumStackBytes = (ArgOffset - SPUFrameInfo::minStackSize());
Chris Lattnerfe5d4022008-10-11 22:08:30 +00001138 Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumStackBytes,
1139 true));
Scott Michel8efdca42007-12-04 22:23:35 +00001140
1141 if (!MemOpChains.empty()) {
1142 // Adjust the stack pointer for the stack arguments.
Dale Johannesenea996922009-02-04 20:06:27 +00001143 Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
Scott Michel8efdca42007-12-04 22:23:35 +00001144 &MemOpChains[0], MemOpChains.size());
1145 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001146
Scott Michel8efdca42007-12-04 22:23:35 +00001147 // Build a sequence of copy-to-reg nodes chained together with token chain
1148 // and flag operands which copy the outgoing args into the appropriate regs.
Dan Gohman8181bd12008-07-27 21:46:04 +00001149 SDValue InFlag;
Scott Michel8efdca42007-12-04 22:23:35 +00001150 for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i) {
Dale Johannesenea996922009-02-04 20:06:27 +00001151 Chain = DAG.getCopyToReg(Chain, dl, RegsToPass[i].first,
1152 RegsToPass[i].second, InFlag);
Scott Michel8efdca42007-12-04 22:23:35 +00001153 InFlag = Chain.getValue(1);
1154 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001155
Dan Gohman8181bd12008-07-27 21:46:04 +00001156 SmallVector<SDValue, 8> Ops;
Scott Michel8efdca42007-12-04 22:23:35 +00001157 unsigned CallOpc = SPUISD::CALL;
Scott Michel4ec722e2008-07-16 17:17:29 +00001158
Bill Wendlingfef06052008-09-16 21:48:12 +00001159 // If the callee is a GlobalAddress/ExternalSymbol node (quite common, every
1160 // direct call is) turn it into a TargetGlobalAddress/TargetExternalSymbol
1161 // node so that legalize doesn't hack it.
Scott Michel5974f432008-11-11 03:06:06 +00001162 if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee)) {
Scott Michel8efdca42007-12-04 22:23:35 +00001163 GlobalValue *GV = G->getGlobal();
Duncan Sands92c43912008-06-06 12:08:01 +00001164 MVT CalleeVT = Callee.getValueType();
Dan Gohman8181bd12008-07-27 21:46:04 +00001165 SDValue Zero = DAG.getConstant(0, PtrVT);
1166 SDValue GA = DAG.getTargetGlobalAddress(GV, CalleeVT);
Scott Michel8efdca42007-12-04 22:23:35 +00001167
Scott Micheldbac4cf2008-01-11 02:53:15 +00001168 if (!ST->usingLargeMem()) {
1169 // Turn calls to targets that are defined (i.e., have bodies) into BRSL
1170 // style calls, otherwise, external symbols are BRASL calls. This assumes
1171 // that declared/defined symbols are in the same compilation unit and can
1172 // be reached through PC-relative jumps.
1173 //
1174 // NOTE:
1175 // This may be an unsafe assumption for JIT and really large compilation
1176 // units.
1177 if (GV->isDeclaration()) {
1178 Callee = DAG.getNode(SPUISD::AFormAddr, CalleeVT, GA, Zero);
1179 } else {
1180 Callee = DAG.getNode(SPUISD::PCRelAddr, CalleeVT, GA, Zero);
1181 }
Scott Michel8efdca42007-12-04 22:23:35 +00001182 } else {
Scott Micheldbac4cf2008-01-11 02:53:15 +00001183 // "Large memory" mode: Turn all calls into indirect calls with a X-form
1184 // address pairs:
Scott Michelf9f42e62008-01-29 02:16:57 +00001185 Callee = DAG.getNode(SPUISD::IndirectAddr, PtrVT, GA, Zero);
Scott Michel8efdca42007-12-04 22:23:35 +00001186 }
Scott Michelae5cbf52008-12-29 03:23:36 +00001187 } else if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(Callee)) {
1188 MVT CalleeVT = Callee.getValueType();
1189 SDValue Zero = DAG.getConstant(0, PtrVT);
1190 SDValue ExtSym = DAG.getTargetExternalSymbol(S->getSymbol(),
1191 Callee.getValueType());
1192
1193 if (!ST->usingLargeMem()) {
1194 Callee = DAG.getNode(SPUISD::AFormAddr, CalleeVT, ExtSym, Zero);
1195 } else {
1196 Callee = DAG.getNode(SPUISD::IndirectAddr, PtrVT, ExtSym, Zero);
1197 }
1198 } else if (SDNode *Dest = isLSAAddress(Callee, DAG)) {
Scott Michel8efdca42007-12-04 22:23:35 +00001199 // If this is an absolute destination address that appears to be a legal
1200 // local store address, use the munged value.
Dan Gohman8181bd12008-07-27 21:46:04 +00001201 Callee = SDValue(Dest, 0);
Scott Micheldbac4cf2008-01-11 02:53:15 +00001202 }
Scott Michel8efdca42007-12-04 22:23:35 +00001203
1204 Ops.push_back(Chain);
1205 Ops.push_back(Callee);
Scott Michel4ec722e2008-07-16 17:17:29 +00001206
Scott Michel8efdca42007-12-04 22:23:35 +00001207 // Add argument registers to the end of the list so that they are known live
1208 // into the call.
1209 for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i)
Scott Michel4ec722e2008-07-16 17:17:29 +00001210 Ops.push_back(DAG.getRegister(RegsToPass[i].first,
Scott Michel8efdca42007-12-04 22:23:35 +00001211 RegsToPass[i].second.getValueType()));
Scott Michel4ec722e2008-07-16 17:17:29 +00001212
Gabor Greif1c80d112008-08-28 21:40:38 +00001213 if (InFlag.getNode())
Scott Michel8efdca42007-12-04 22:23:35 +00001214 Ops.push_back(InFlag);
Duncan Sands698842f2008-07-02 17:40:58 +00001215 // Returns a chain and a flag for retval copy to use.
Dale Johannesenea996922009-02-04 20:06:27 +00001216 Chain = DAG.getNode(CallOpc, dl, DAG.getVTList(MVT::Other, MVT::Flag),
Duncan Sands698842f2008-07-02 17:40:58 +00001217 &Ops[0], Ops.size());
Scott Michel8efdca42007-12-04 22:23:35 +00001218 InFlag = Chain.getValue(1);
1219
Chris Lattnerfe5d4022008-10-11 22:08:30 +00001220 Chain = DAG.getCALLSEQ_END(Chain, DAG.getIntPtrConstant(NumStackBytes, true),
1221 DAG.getIntPtrConstant(0, true), InFlag);
Dan Gohman705e3f72008-09-13 01:54:27 +00001222 if (TheCall->getValueType(0) != MVT::Other)
Evan Cheng07322bb2008-02-05 22:44:06 +00001223 InFlag = Chain.getValue(1);
1224
Dan Gohman8181bd12008-07-27 21:46:04 +00001225 SDValue ResultVals[3];
Scott Michel8efdca42007-12-04 22:23:35 +00001226 unsigned NumResults = 0;
Scott Michel4ec722e2008-07-16 17:17:29 +00001227
Scott Michel8efdca42007-12-04 22:23:35 +00001228 // If the call has results, copy the values out of the ret val registers.
Dan Gohman705e3f72008-09-13 01:54:27 +00001229 switch (TheCall->getValueType(0).getSimpleVT()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001230 default: assert(0 && "Unexpected ret value!");
1231 case MVT::Other: break;
1232 case MVT::i32:
Dan Gohman705e3f72008-09-13 01:54:27 +00001233 if (TheCall->getValueType(1) == MVT::i32) {
Dale Johannesenea996922009-02-04 20:06:27 +00001234 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R4,
1235 MVT::i32, InFlag).getValue(1);
Scott Michel8efdca42007-12-04 22:23:35 +00001236 ResultVals[0] = Chain.getValue(0);
Dale Johannesenea996922009-02-04 20:06:27 +00001237 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i32,
Scott Michel8efdca42007-12-04 22:23:35 +00001238 Chain.getValue(2)).getValue(1);
1239 ResultVals[1] = Chain.getValue(0);
1240 NumResults = 2;
Scott Michel8efdca42007-12-04 22:23:35 +00001241 } else {
Dale Johannesenea996922009-02-04 20:06:27 +00001242 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i32,
1243 InFlag).getValue(1);
Scott Michel8efdca42007-12-04 22:23:35 +00001244 ResultVals[0] = Chain.getValue(0);
1245 NumResults = 1;
1246 }
Scott Michel8efdca42007-12-04 22:23:35 +00001247 break;
1248 case MVT::i64:
Dale Johannesenea996922009-02-04 20:06:27 +00001249 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i64,
1250 InFlag).getValue(1);
Scott Michel8efdca42007-12-04 22:23:35 +00001251 ResultVals[0] = Chain.getValue(0);
1252 NumResults = 1;
Scott Michel8efdca42007-12-04 22:23:35 +00001253 break;
Scott Michel2ef773a2009-01-06 03:36:14 +00001254 case MVT::i128:
Dale Johannesenea996922009-02-04 20:06:27 +00001255 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i128,
1256 InFlag).getValue(1);
Scott Michel2ef773a2009-01-06 03:36:14 +00001257 ResultVals[0] = Chain.getValue(0);
1258 NumResults = 1;
1259 break;
Scott Michel8efdca42007-12-04 22:23:35 +00001260 case MVT::f32:
1261 case MVT::f64:
Dale Johannesenea996922009-02-04 20:06:27 +00001262 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, TheCall->getValueType(0),
Scott Michel8efdca42007-12-04 22:23:35 +00001263 InFlag).getValue(1);
1264 ResultVals[0] = Chain.getValue(0);
1265 NumResults = 1;
Scott Michel8efdca42007-12-04 22:23:35 +00001266 break;
1267 case MVT::v2f64:
Scott Michele2641a12008-12-04 21:01:44 +00001268 case MVT::v2i64:
Scott Michel8efdca42007-12-04 22:23:35 +00001269 case MVT::v4f32:
1270 case MVT::v4i32:
1271 case MVT::v8i16:
1272 case MVT::v16i8:
Dale Johannesenea996922009-02-04 20:06:27 +00001273 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, TheCall->getValueType(0),
Scott Michel8efdca42007-12-04 22:23:35 +00001274 InFlag).getValue(1);
1275 ResultVals[0] = Chain.getValue(0);
1276 NumResults = 1;
Scott Michel8efdca42007-12-04 22:23:35 +00001277 break;
1278 }
Duncan Sands698842f2008-07-02 17:40:58 +00001279
Scott Michel8efdca42007-12-04 22:23:35 +00001280 // If the function returns void, just return the chain.
1281 if (NumResults == 0)
1282 return Chain;
Scott Michel4ec722e2008-07-16 17:17:29 +00001283
Scott Michel8efdca42007-12-04 22:23:35 +00001284 // Otherwise, merge everything together with a MERGE_VALUES node.
1285 ResultVals[NumResults++] = Chain;
Dale Johannesenea996922009-02-04 20:06:27 +00001286 SDValue Res = DAG.getMergeValues(ResultVals, NumResults, dl);
Gabor Greif46bf5472008-08-26 22:36:50 +00001287 return Res.getValue(Op.getResNo());
Scott Michel8efdca42007-12-04 22:23:35 +00001288}
1289
Dan Gohman8181bd12008-07-27 21:46:04 +00001290static SDValue
1291LowerRET(SDValue Op, SelectionDAG &DAG, TargetMachine &TM) {
Scott Michel8efdca42007-12-04 22:23:35 +00001292 SmallVector<CCValAssign, 16> RVLocs;
1293 unsigned CC = DAG.getMachineFunction().getFunction()->getCallingConv();
1294 bool isVarArg = DAG.getMachineFunction().getFunction()->isVarArg();
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001295 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00001296 CCState CCInfo(CC, isVarArg, TM, RVLocs);
Gabor Greif1c80d112008-08-28 21:40:38 +00001297 CCInfo.AnalyzeReturn(Op.getNode(), RetCC_SPU);
Scott Michel4ec722e2008-07-16 17:17:29 +00001298
Scott Michel8efdca42007-12-04 22:23:35 +00001299 // If this is the first return lowered for this function, add the regs to the
1300 // liveout set for the function.
Chris Lattner1b989192007-12-31 04:13:23 +00001301 if (DAG.getMachineFunction().getRegInfo().liveout_empty()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001302 for (unsigned i = 0; i != RVLocs.size(); ++i)
Chris Lattner1b989192007-12-31 04:13:23 +00001303 DAG.getMachineFunction().getRegInfo().addLiveOut(RVLocs[i].getLocReg());
Scott Michel8efdca42007-12-04 22:23:35 +00001304 }
1305
Dan Gohman8181bd12008-07-27 21:46:04 +00001306 SDValue Chain = Op.getOperand(0);
1307 SDValue Flag;
Scott Michel4ec722e2008-07-16 17:17:29 +00001308
Scott Michel8efdca42007-12-04 22:23:35 +00001309 // Copy the result values into the output registers.
1310 for (unsigned i = 0; i != RVLocs.size(); ++i) {
1311 CCValAssign &VA = RVLocs[i];
1312 assert(VA.isRegLoc() && "Can only return in registers!");
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001313 Chain = DAG.getCopyToReg(Chain, dl, VA.getLocReg(),
1314 Op.getOperand(i*2+1), Flag);
Scott Michel8efdca42007-12-04 22:23:35 +00001315 Flag = Chain.getValue(1);
1316 }
1317
Gabor Greif1c80d112008-08-28 21:40:38 +00001318 if (Flag.getNode())
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001319 return DAG.getNode(SPUISD::RET_FLAG, dl, MVT::Other, Chain, Flag);
Scott Michel8efdca42007-12-04 22:23:35 +00001320 else
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001321 return DAG.getNode(SPUISD::RET_FLAG, dl, MVT::Other, Chain);
Scott Michel8efdca42007-12-04 22:23:35 +00001322}
1323
1324
1325//===----------------------------------------------------------------------===//
1326// Vector related lowering:
1327//===----------------------------------------------------------------------===//
1328
1329static ConstantSDNode *
1330getVecImm(SDNode *N) {
Dan Gohman8181bd12008-07-27 21:46:04 +00001331 SDValue OpVal(0, 0);
Scott Michel4ec722e2008-07-16 17:17:29 +00001332
Scott Michel8efdca42007-12-04 22:23:35 +00001333 // Check to see if this buildvec has a single non-undef value in its elements.
1334 for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
1335 if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue;
Gabor Greif1c80d112008-08-28 21:40:38 +00001336 if (OpVal.getNode() == 0)
Scott Michel8efdca42007-12-04 22:23:35 +00001337 OpVal = N->getOperand(i);
1338 else if (OpVal != N->getOperand(i))
1339 return 0;
1340 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001341
Gabor Greif1c80d112008-08-28 21:40:38 +00001342 if (OpVal.getNode() != 0) {
Scott Michel5974f432008-11-11 03:06:06 +00001343 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
Scott Michel8efdca42007-12-04 22:23:35 +00001344 return CN;
1345 }
1346 }
1347
1348 return 0; // All UNDEF: use implicit def.; not Constant node
1349}
1350
1351/// get_vec_i18imm - Test if this vector is a vector filled with the same value
1352/// and the value fits into an unsigned 18-bit constant, and if so, return the
1353/// constant
Dan Gohman8181bd12008-07-27 21:46:04 +00001354SDValue SPU::get_vec_u18imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands92c43912008-06-06 12:08:01 +00001355 MVT ValueType) {
Scott Michel8efdca42007-12-04 22:23:35 +00001356 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001357 uint64_t Value = CN->getZExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001358 if (ValueType == MVT::i64) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001359 uint64_t UValue = CN->getZExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001360 uint32_t upper = uint32_t(UValue >> 32);
1361 uint32_t lower = uint32_t(UValue);
1362 if (upper != lower)
Dan Gohman8181bd12008-07-27 21:46:04 +00001363 return SDValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001364 Value = Value >> 32;
1365 }
Scott Michel8efdca42007-12-04 22:23:35 +00001366 if (Value <= 0x3ffff)
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001367 return DAG.getTargetConstant(Value, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001368 }
1369
Dan Gohman8181bd12008-07-27 21:46:04 +00001370 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001371}
1372
1373/// get_vec_i16imm - Test if this vector is a vector filled with the same value
1374/// and the value fits into a signed 16-bit constant, and if so, return the
1375/// constant
Dan Gohman8181bd12008-07-27 21:46:04 +00001376SDValue SPU::get_vec_i16imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands92c43912008-06-06 12:08:01 +00001377 MVT ValueType) {
Scott Michel8efdca42007-12-04 22:23:35 +00001378 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman40686732008-09-26 21:54:37 +00001379 int64_t Value = CN->getSExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001380 if (ValueType == MVT::i64) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001381 uint64_t UValue = CN->getZExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001382 uint32_t upper = uint32_t(UValue >> 32);
1383 uint32_t lower = uint32_t(UValue);
1384 if (upper != lower)
Dan Gohman8181bd12008-07-27 21:46:04 +00001385 return SDValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001386 Value = Value >> 32;
1387 }
Scott Michel6baba072008-03-05 23:02:02 +00001388 if (Value >= -(1 << 15) && Value <= ((1 << 15) - 1)) {
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001389 return DAG.getTargetConstant(Value, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001390 }
1391 }
1392
Dan Gohman8181bd12008-07-27 21:46:04 +00001393 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001394}
1395
1396/// get_vec_i10imm - Test if this vector is a vector filled with the same value
1397/// and the value fits into a signed 10-bit constant, and if so, return the
1398/// constant
Dan Gohman8181bd12008-07-27 21:46:04 +00001399SDValue SPU::get_vec_i10imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands92c43912008-06-06 12:08:01 +00001400 MVT ValueType) {
Scott Michel8efdca42007-12-04 22:23:35 +00001401 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman40686732008-09-26 21:54:37 +00001402 int64_t Value = CN->getSExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001403 if (ValueType == MVT::i64) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001404 uint64_t UValue = CN->getZExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001405 uint32_t upper = uint32_t(UValue >> 32);
1406 uint32_t lower = uint32_t(UValue);
1407 if (upper != lower)
Dan Gohman8181bd12008-07-27 21:46:04 +00001408 return SDValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001409 Value = Value >> 32;
1410 }
Scott Michel6baba072008-03-05 23:02:02 +00001411 if (isS10Constant(Value))
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001412 return DAG.getTargetConstant(Value, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001413 }
1414
Dan Gohman8181bd12008-07-27 21:46:04 +00001415 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001416}
1417
1418/// get_vec_i8imm - Test if this vector is a vector filled with the same value
1419/// and the value fits into a signed 8-bit constant, and if so, return the
1420/// constant.
1421///
1422/// @note: The incoming vector is v16i8 because that's the only way we can load
1423/// constant vectors. Thus, we test to see if the upper and lower bytes are the
1424/// same value.
Dan Gohman8181bd12008-07-27 21:46:04 +00001425SDValue SPU::get_vec_i8imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands92c43912008-06-06 12:08:01 +00001426 MVT ValueType) {
Scott Michel8efdca42007-12-04 22:23:35 +00001427 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001428 int Value = (int) CN->getZExtValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001429 if (ValueType == MVT::i16
Scott Michel5a6f17b2008-01-30 02:55:46 +00001430 && Value <= 0xffff /* truncated from uint64_t */
1431 && ((short) Value >> 8) == ((short) Value & 0xff))
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001432 return DAG.getTargetConstant(Value & 0xff, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001433 else if (ValueType == MVT::i8
Scott Michel5a6f17b2008-01-30 02:55:46 +00001434 && (Value & 0xff) == Value)
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001435 return DAG.getTargetConstant(Value, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001436 }
1437
Dan Gohman8181bd12008-07-27 21:46:04 +00001438 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001439}
1440
1441/// get_ILHUvec_imm - Test if this vector is a vector filled with the same value
1442/// and the value fits into a signed 16-bit constant, and if so, return the
1443/// constant
Dan Gohman8181bd12008-07-27 21:46:04 +00001444SDValue SPU::get_ILHUvec_imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands92c43912008-06-06 12:08:01 +00001445 MVT ValueType) {
Scott Michel8efdca42007-12-04 22:23:35 +00001446 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001447 uint64_t Value = CN->getZExtValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001448 if ((ValueType == MVT::i32
Scott Michel5a6f17b2008-01-30 02:55:46 +00001449 && ((unsigned) Value & 0xffff0000) == (unsigned) Value)
1450 || (ValueType == MVT::i64 && (Value & 0xffff0000) == Value))
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001451 return DAG.getTargetConstant(Value >> 16, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001452 }
1453
Dan Gohman8181bd12008-07-27 21:46:04 +00001454 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001455}
1456
1457/// get_v4i32_imm - Catch-all for general 32-bit constant vectors
Dan Gohman8181bd12008-07-27 21:46:04 +00001458SDValue SPU::get_v4i32_imm(SDNode *N, SelectionDAG &DAG) {
Scott Michel8efdca42007-12-04 22:23:35 +00001459 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001460 return DAG.getTargetConstant((unsigned) CN->getZExtValue(), MVT::i32);
Scott Michel8efdca42007-12-04 22:23:35 +00001461 }
1462
Dan Gohman8181bd12008-07-27 21:46:04 +00001463 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001464}
1465
1466/// get_v4i32_imm - Catch-all for general 64-bit constant vectors
Dan Gohman8181bd12008-07-27 21:46:04 +00001467SDValue SPU::get_v2i64_imm(SDNode *N, SelectionDAG &DAG) {
Scott Michel8efdca42007-12-04 22:23:35 +00001468 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001469 return DAG.getTargetConstant((unsigned) CN->getZExtValue(), MVT::i64);
Scott Michel8efdca42007-12-04 22:23:35 +00001470 }
1471
Dan Gohman8181bd12008-07-27 21:46:04 +00001472 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001473}
1474
1475// If this is a vector of constants or undefs, get the bits. A bit in
Scott Michel4ec722e2008-07-16 17:17:29 +00001476// UndefBits is set if the corresponding element of the vector is an
Scott Michel8efdca42007-12-04 22:23:35 +00001477// ISD::UNDEF value. For undefs, the corresponding VectorBits values are
1478// zero. Return true if this is not an array of constants, false if it is.
1479//
1480static bool GetConstantBuildVectorBits(SDNode *BV, uint64_t VectorBits[2],
1481 uint64_t UndefBits[2]) {
1482 // Start with zero'd results.
1483 VectorBits[0] = VectorBits[1] = UndefBits[0] = UndefBits[1] = 0;
Scott Michel4ec722e2008-07-16 17:17:29 +00001484
Duncan Sands92c43912008-06-06 12:08:01 +00001485 unsigned EltBitSize = BV->getOperand(0).getValueType().getSizeInBits();
Scott Michel8efdca42007-12-04 22:23:35 +00001486 for (unsigned i = 0, e = BV->getNumOperands(); i != e; ++i) {
Dan Gohman8181bd12008-07-27 21:46:04 +00001487 SDValue OpVal = BV->getOperand(i);
Scott Michel4ec722e2008-07-16 17:17:29 +00001488
Scott Michel8efdca42007-12-04 22:23:35 +00001489 unsigned PartNo = i >= e/2; // In the upper 128 bits?
1490 unsigned SlotNo = e/2 - (i & (e/2-1))-1; // Which subpiece of the uint64_t.
1491
1492 uint64_t EltBits = 0;
1493 if (OpVal.getOpcode() == ISD::UNDEF) {
1494 uint64_t EltUndefBits = ~0ULL >> (64-EltBitSize);
1495 UndefBits[PartNo] |= EltUndefBits << (SlotNo*EltBitSize);
1496 continue;
Scott Michel5974f432008-11-11 03:06:06 +00001497 } else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001498 EltBits = CN->getZExtValue() & (~0ULL >> (64-EltBitSize));
Scott Michel5974f432008-11-11 03:06:06 +00001499 } else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal)) {
Scott Michel8efdca42007-12-04 22:23:35 +00001500 const APFloat &apf = CN->getValueAPF();
1501 EltBits = (CN->getValueType(0) == MVT::f32
Scott Michel5a6f17b2008-01-30 02:55:46 +00001502 ? FloatToBits(apf.convertToFloat())
1503 : DoubleToBits(apf.convertToDouble()));
Scott Michel8efdca42007-12-04 22:23:35 +00001504 } else {
1505 // Nonconstant element.
1506 return true;
1507 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001508
Scott Michel8efdca42007-12-04 22:23:35 +00001509 VectorBits[PartNo] |= EltBits << (SlotNo*EltBitSize);
1510 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001511
1512 //printf("%llx %llx %llx %llx\n",
Scott Michel8efdca42007-12-04 22:23:35 +00001513 // VectorBits[0], VectorBits[1], UndefBits[0], UndefBits[1]);
1514 return false;
1515}
1516
1517/// If this is a splat (repetition) of a value across the whole vector, return
1518/// the smallest size that splats it. For example, "0x01010101010101..." is a
Scott Michel4ec722e2008-07-16 17:17:29 +00001519/// splat of 0x01, 0x0101, and 0x01010101. We return SplatBits = 0x01 and
Scott Michel8efdca42007-12-04 22:23:35 +00001520/// SplatSize = 1 byte.
Scott Michel4ec722e2008-07-16 17:17:29 +00001521static bool isConstantSplat(const uint64_t Bits128[2],
Scott Michel8efdca42007-12-04 22:23:35 +00001522 const uint64_t Undef128[2],
Scott Michel5a6f17b2008-01-30 02:55:46 +00001523 int MinSplatBits,
Scott Michel8efdca42007-12-04 22:23:35 +00001524 uint64_t &SplatBits, uint64_t &SplatUndef,
1525 int &SplatSize) {
1526 // Don't let undefs prevent splats from matching. See if the top 64-bits are
1527 // the same as the lower 64-bits, ignoring undefs.
1528 uint64_t Bits64 = Bits128[0] | Bits128[1];
1529 uint64_t Undef64 = Undef128[0] & Undef128[1];
1530 uint32_t Bits32 = uint32_t(Bits64) | uint32_t(Bits64 >> 32);
1531 uint32_t Undef32 = uint32_t(Undef64) & uint32_t(Undef64 >> 32);
1532 uint16_t Bits16 = uint16_t(Bits32) | uint16_t(Bits32 >> 16);
1533 uint16_t Undef16 = uint16_t(Undef32) & uint16_t(Undef32 >> 16);
1534
1535 if ((Bits128[0] & ~Undef128[1]) == (Bits128[1] & ~Undef128[0])) {
1536 if (MinSplatBits < 64) {
Scott Michel4ec722e2008-07-16 17:17:29 +00001537
Scott Michel8efdca42007-12-04 22:23:35 +00001538 // Check that the top 32-bits are the same as the lower 32-bits, ignoring
1539 // undefs.
1540 if ((Bits64 & (~Undef64 >> 32)) == ((Bits64 >> 32) & ~Undef64)) {
Scott Michel5a6f17b2008-01-30 02:55:46 +00001541 if (MinSplatBits < 32) {
Scott Michel8efdca42007-12-04 22:23:35 +00001542
Scott Michel5a6f17b2008-01-30 02:55:46 +00001543 // If the top 16-bits are different than the lower 16-bits, ignoring
1544 // undefs, we have an i32 splat.
1545 if ((Bits32 & (~Undef32 >> 16)) == ((Bits32 >> 16) & ~Undef32)) {
1546 if (MinSplatBits < 16) {
1547 // If the top 8-bits are different than the lower 8-bits, ignoring
1548 // undefs, we have an i16 splat.
Gabor Greife9f7f582008-08-31 15:37:04 +00001549 if ((Bits16 & (uint16_t(~Undef16) >> 8))
1550 == ((Bits16 >> 8) & ~Undef16)) {
Scott Michel5a6f17b2008-01-30 02:55:46 +00001551 // Otherwise, we have an 8-bit splat.
1552 SplatBits = uint8_t(Bits16) | uint8_t(Bits16 >> 8);
1553 SplatUndef = uint8_t(Undef16) & uint8_t(Undef16 >> 8);
1554 SplatSize = 1;
1555 return true;
1556 }
1557 } else {
1558 SplatBits = Bits16;
1559 SplatUndef = Undef16;
1560 SplatSize = 2;
1561 return true;
1562 }
1563 }
1564 } else {
1565 SplatBits = Bits32;
1566 SplatUndef = Undef32;
1567 SplatSize = 4;
1568 return true;
1569 }
Scott Michel8efdca42007-12-04 22:23:35 +00001570 }
1571 } else {
1572 SplatBits = Bits128[0];
1573 SplatUndef = Undef128[0];
1574 SplatSize = 8;
1575 return true;
1576 }
1577 }
1578
1579 return false; // Can't be a splat if two pieces don't match.
1580}
1581
Scott Michel8c67fa42009-01-21 04:58:48 +00001582//! Lower a BUILD_VECTOR instruction creatively:
1583SDValue
pingbak2f387e82009-01-26 03:31:40 +00001584LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) {
Duncan Sands92c43912008-06-06 12:08:01 +00001585 MVT VT = Op.getValueType();
Dale Johannesen913ba762009-02-06 01:31:28 +00001586 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00001587 // If this is a vector of constants or undefs, get the bits. A bit in
Scott Michel4ec722e2008-07-16 17:17:29 +00001588 // UndefBits is set if the corresponding element of the vector is an
Scott Michel8efdca42007-12-04 22:23:35 +00001589 // ISD::UNDEF value. For undefs, the corresponding VectorBits values are
Scott Michel4ec722e2008-07-16 17:17:29 +00001590 // zero.
Scott Michel8efdca42007-12-04 22:23:35 +00001591 uint64_t VectorBits[2];
1592 uint64_t UndefBits[2];
1593 uint64_t SplatBits, SplatUndef;
1594 int SplatSize;
Gabor Greif1c80d112008-08-28 21:40:38 +00001595 if (GetConstantBuildVectorBits(Op.getNode(), VectorBits, UndefBits)
Scott Michel8efdca42007-12-04 22:23:35 +00001596 || !isConstantSplat(VectorBits, UndefBits,
Duncan Sands92c43912008-06-06 12:08:01 +00001597 VT.getVectorElementType().getSizeInBits(),
Scott Michel8efdca42007-12-04 22:23:35 +00001598 SplatBits, SplatUndef, SplatSize))
Dan Gohman8181bd12008-07-27 21:46:04 +00001599 return SDValue(); // Not a constant vector, not a splat.
Scott Michel4ec722e2008-07-16 17:17:29 +00001600
Duncan Sands92c43912008-06-06 12:08:01 +00001601 switch (VT.getSimpleVT()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001602 default:
Scott Michel8c67fa42009-01-21 04:58:48 +00001603 cerr << "CellSPU: Unhandled VT in LowerBUILD_VECTOR, VT = "
1604 << VT.getMVTString()
1605 << "\n";
1606 abort();
1607 /*NOTREACHED*/
Scott Michel8efdca42007-12-04 22:23:35 +00001608 case MVT::v4f32: {
pingbak2f387e82009-01-26 03:31:40 +00001609 uint32_t Value32 = uint32_t(SplatBits);
Scott Michel8efdca42007-12-04 22:23:35 +00001610 assert(SplatSize == 4
Scott Michel5a6f17b2008-01-30 02:55:46 +00001611 && "LowerBUILD_VECTOR: Unexpected floating point vector element.");
Scott Michel8efdca42007-12-04 22:23:35 +00001612 // NOTE: pretend the constant is an integer. LLVM won't load FP constants
Dan Gohman8181bd12008-07-27 21:46:04 +00001613 SDValue T = DAG.getConstant(Value32, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00001614 return DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v4f32,
1615 DAG.getNode(ISD::BUILD_VECTOR, dl,
1616 MVT::v4i32, T, T, T, T));
Scott Michel8efdca42007-12-04 22:23:35 +00001617 break;
1618 }
1619 case MVT::v2f64: {
pingbak2f387e82009-01-26 03:31:40 +00001620 uint64_t f64val = uint64_t(SplatBits);
Scott Michel8efdca42007-12-04 22:23:35 +00001621 assert(SplatSize == 8
Scott Michelc630c412008-11-24 17:11:17 +00001622 && "LowerBUILD_VECTOR: 64-bit float vector size > 8 bytes.");
Scott Michel8efdca42007-12-04 22:23:35 +00001623 // NOTE: pretend the constant is an integer. LLVM won't load FP constants
Dan Gohman8181bd12008-07-27 21:46:04 +00001624 SDValue T = DAG.getConstant(f64val, MVT::i64);
Dale Johannesen913ba762009-02-06 01:31:28 +00001625 return DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v2f64,
1626 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v2i64, T, T));
Scott Michel8efdca42007-12-04 22:23:35 +00001627 break;
1628 }
1629 case MVT::v16i8: {
1630 // 8-bit constants have to be expanded to 16-bits
1631 unsigned short Value16 = SplatBits | (SplatBits << 8);
Dan Gohman8181bd12008-07-27 21:46:04 +00001632 SDValue Ops[8];
Scott Michel8efdca42007-12-04 22:23:35 +00001633 for (int i = 0; i < 8; ++i)
1634 Ops[i] = DAG.getConstant(Value16, MVT::i16);
Dale Johannesen913ba762009-02-06 01:31:28 +00001635 return DAG.getNode(ISD::BIT_CONVERT, dl, VT,
1636 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v8i16, Ops, 8));
Scott Michel8efdca42007-12-04 22:23:35 +00001637 }
1638 case MVT::v8i16: {
1639 unsigned short Value16;
Scott Michel4ec722e2008-07-16 17:17:29 +00001640 if (SplatSize == 2)
Scott Michel8efdca42007-12-04 22:23:35 +00001641 Value16 = (unsigned short) (SplatBits & 0xffff);
1642 else
1643 Value16 = (unsigned short) (SplatBits | (SplatBits << 8));
Dan Gohman8181bd12008-07-27 21:46:04 +00001644 SDValue T = DAG.getConstant(Value16, VT.getVectorElementType());
1645 SDValue Ops[8];
Scott Michel8efdca42007-12-04 22:23:35 +00001646 for (int i = 0; i < 8; ++i) Ops[i] = T;
Dale Johannesen913ba762009-02-06 01:31:28 +00001647 return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, Ops, 8);
Scott Michel8efdca42007-12-04 22:23:35 +00001648 }
1649 case MVT::v4i32: {
1650 unsigned int Value = SplatBits;
Dan Gohman8181bd12008-07-27 21:46:04 +00001651 SDValue T = DAG.getConstant(Value, VT.getVectorElementType());
Dale Johannesen913ba762009-02-06 01:31:28 +00001652 return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, T, T, T, T);
Scott Michel8efdca42007-12-04 22:23:35 +00001653 }
Scott Michel70741542009-01-06 23:10:38 +00001654 case MVT::v2i32: {
1655 unsigned int Value = SplatBits;
1656 SDValue T = DAG.getConstant(Value, VT.getVectorElementType());
Dale Johannesen913ba762009-02-06 01:31:28 +00001657 return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, T, T);
Scott Michel70741542009-01-06 23:10:38 +00001658 }
Scott Michel8efdca42007-12-04 22:23:35 +00001659 case MVT::v2i64: {
Dale Johannesen913ba762009-02-06 01:31:28 +00001660 return SPU::LowerSplat_v2i64(VT, DAG, SplatBits, dl);
Scott Michel8efdca42007-12-04 22:23:35 +00001661 }
1662 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001663
Dan Gohman8181bd12008-07-27 21:46:04 +00001664 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001665}
1666
pingbak2f387e82009-01-26 03:31:40 +00001667SDValue
Dale Johannesen913ba762009-02-06 01:31:28 +00001668SPU::LowerSplat_v2i64(MVT OpVT, SelectionDAG& DAG, uint64_t SplatVal,
1669 DebugLoc dl) {
pingbak2f387e82009-01-26 03:31:40 +00001670 uint32_t upper = uint32_t(SplatVal >> 32);
1671 uint32_t lower = uint32_t(SplatVal);
1672
1673 if (upper == lower) {
1674 // Magic constant that can be matched by IL, ILA, et. al.
1675 SDValue Val = DAG.getTargetConstant(upper, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00001676 return DAG.getNode(ISD::BIT_CONVERT, dl, OpVT,
1677 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
pingbak2f387e82009-01-26 03:31:40 +00001678 Val, Val, Val, Val));
1679 } else {
1680 SDValue LO32;
1681 SDValue HI32;
1682 SmallVector<SDValue, 16> ShufBytes;
1683 SDValue Result;
1684 bool upper_special, lower_special;
1685
1686 // NOTE: This code creates common-case shuffle masks that can be easily
1687 // detected as common expressions. It is not attempting to create highly
1688 // specialized masks to replace any and all 0's, 0xff's and 0x80's.
1689
1690 // Detect if the upper or lower half is a special shuffle mask pattern:
1691 upper_special = (upper == 0 || upper == 0xffffffff || upper == 0x80000000);
1692 lower_special = (lower == 0 || lower == 0xffffffff || lower == 0x80000000);
1693
1694 // Create lower vector if not a special pattern
1695 if (!lower_special) {
1696 SDValue LO32C = DAG.getConstant(lower, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00001697 LO32 = DAG.getNode(ISD::BIT_CONVERT, dl, OpVT,
1698 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
pingbak2f387e82009-01-26 03:31:40 +00001699 LO32C, LO32C, LO32C, LO32C));
1700 }
1701
1702 // Create upper vector if not a special pattern
1703 if (!upper_special) {
1704 SDValue HI32C = DAG.getConstant(upper, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00001705 HI32 = DAG.getNode(ISD::BIT_CONVERT, dl, OpVT,
1706 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
pingbak2f387e82009-01-26 03:31:40 +00001707 HI32C, HI32C, HI32C, HI32C));
1708 }
1709
1710 // If either upper or lower are special, then the two input operands are
1711 // the same (basically, one of them is a "don't care")
1712 if (lower_special)
1713 LO32 = HI32;
1714 if (upper_special)
1715 HI32 = LO32;
1716 if (lower_special && upper_special) {
1717 // Unhappy situation... both upper and lower are special, so punt with
1718 // a target constant:
1719 SDValue Zero = DAG.getConstant(0, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00001720 HI32 = LO32 = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, Zero, Zero,
pingbak2f387e82009-01-26 03:31:40 +00001721 Zero, Zero);
1722 }
1723
1724 for (int i = 0; i < 4; ++i) {
1725 uint64_t val = 0;
1726 for (int j = 0; j < 4; ++j) {
1727 SDValue V;
1728 bool process_upper, process_lower;
1729 val <<= 8;
1730 process_upper = (upper_special && (i & 1) == 0);
1731 process_lower = (lower_special && (i & 1) == 1);
1732
1733 if (process_upper || process_lower) {
1734 if ((process_upper && upper == 0)
1735 || (process_lower && lower == 0))
1736 val |= 0x80;
1737 else if ((process_upper && upper == 0xffffffff)
1738 || (process_lower && lower == 0xffffffff))
1739 val |= 0xc0;
1740 else if ((process_upper && upper == 0x80000000)
1741 || (process_lower && lower == 0x80000000))
1742 val |= (j == 0 ? 0xe0 : 0x80);
1743 } else
1744 val |= i * 4 + j + ((i & 1) * 16);
1745 }
1746
1747 ShufBytes.push_back(DAG.getConstant(val, MVT::i32));
1748 }
1749
Dale Johannesen913ba762009-02-06 01:31:28 +00001750 return DAG.getNode(SPUISD::SHUFB, dl, OpVT, HI32, LO32,
1751 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
pingbak2f387e82009-01-26 03:31:40 +00001752 &ShufBytes[0], ShufBytes.size()));
1753 }
1754}
1755
Scott Michel8efdca42007-12-04 22:23:35 +00001756/// LowerVECTOR_SHUFFLE - Lower a vector shuffle (V1, V2, V3) to something on
1757/// which the Cell can operate. The code inspects V3 to ascertain whether the
1758/// permutation vector, V3, is monotonically increasing with one "exception"
1759/// element, e.g., (0, 1, _, 3). If this is the case, then generate a
Scott Michel56a125e2008-11-22 23:50:42 +00001760/// SHUFFLE_MASK synthetic instruction. Otherwise, spill V3 to the constant pool.
Scott Michel8efdca42007-12-04 22:23:35 +00001761/// In either case, the net result is going to eventually invoke SHUFB to
1762/// permute/shuffle the bytes from V1 and V2.
1763/// \note
Scott Michel56a125e2008-11-22 23:50:42 +00001764/// SHUFFLE_MASK is eventually selected as one of the C*D instructions, generate
Scott Michel8efdca42007-12-04 22:23:35 +00001765/// control word for byte/halfword/word insertion. This takes care of a single
1766/// element move from V2 into V1.
1767/// \note
1768/// SPUISD::SHUFB is eventually selected as Cell's <i>shufb</i> instructions.
Dan Gohman8181bd12008-07-27 21:46:04 +00001769static SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) {
1770 SDValue V1 = Op.getOperand(0);
1771 SDValue V2 = Op.getOperand(1);
1772 SDValue PermMask = Op.getOperand(2);
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001773 DebugLoc dl = Op.getDebugLoc();
Scott Michel4ec722e2008-07-16 17:17:29 +00001774
Scott Michel8efdca42007-12-04 22:23:35 +00001775 if (V2.getOpcode() == ISD::UNDEF) V2 = V1;
Scott Michel4ec722e2008-07-16 17:17:29 +00001776
Scott Michel8efdca42007-12-04 22:23:35 +00001777 // If we have a single element being moved from V1 to V2, this can be handled
1778 // using the C*[DX] compute mask instructions, but the vector elements have
1779 // to be monotonically increasing with one exception element.
Scott Michele2641a12008-12-04 21:01:44 +00001780 MVT VecVT = V1.getValueType();
1781 MVT EltVT = VecVT.getVectorElementType();
Scott Michel8efdca42007-12-04 22:23:35 +00001782 unsigned EltsFromV2 = 0;
1783 unsigned V2Elt = 0;
1784 unsigned V2EltIdx0 = 0;
1785 unsigned CurrElt = 0;
Scott Michele2641a12008-12-04 21:01:44 +00001786 unsigned MaxElts = VecVT.getVectorNumElements();
1787 unsigned PrevElt = 0;
1788 unsigned V0Elt = 0;
Scott Michel8efdca42007-12-04 22:23:35 +00001789 bool monotonic = true;
Scott Michele2641a12008-12-04 21:01:44 +00001790 bool rotate = true;
1791
1792 if (EltVT == MVT::i8) {
Scott Michel8efdca42007-12-04 22:23:35 +00001793 V2EltIdx0 = 16;
Scott Michele2641a12008-12-04 21:01:44 +00001794 } else if (EltVT == MVT::i16) {
Scott Michel8efdca42007-12-04 22:23:35 +00001795 V2EltIdx0 = 8;
Scott Michele2641a12008-12-04 21:01:44 +00001796 } else if (EltVT == MVT::i32 || EltVT == MVT::f32) {
Scott Michel8efdca42007-12-04 22:23:35 +00001797 V2EltIdx0 = 4;
Scott Michele2641a12008-12-04 21:01:44 +00001798 } else if (EltVT == MVT::i64 || EltVT == MVT::f64) {
1799 V2EltIdx0 = 2;
1800 } else
Scott Michel8efdca42007-12-04 22:23:35 +00001801 assert(0 && "Unhandled vector type in LowerVECTOR_SHUFFLE");
1802
Scott Michele2641a12008-12-04 21:01:44 +00001803 for (unsigned i = 0; i != PermMask.getNumOperands(); ++i) {
1804 if (PermMask.getOperand(i).getOpcode() != ISD::UNDEF) {
1805 unsigned SrcElt = cast<ConstantSDNode > (PermMask.getOperand(i))->getZExtValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001806
Scott Michele2641a12008-12-04 21:01:44 +00001807 if (monotonic) {
1808 if (SrcElt >= V2EltIdx0) {
1809 if (1 >= (++EltsFromV2)) {
1810 V2Elt = (V2EltIdx0 - SrcElt) << 2;
1811 }
1812 } else if (CurrElt != SrcElt) {
1813 monotonic = false;
1814 }
1815
1816 ++CurrElt;
1817 }
1818
1819 if (rotate) {
1820 if (PrevElt > 0 && SrcElt < MaxElts) {
1821 if ((PrevElt == SrcElt - 1)
1822 || (PrevElt == MaxElts - 1 && SrcElt == 0)) {
1823 PrevElt = SrcElt;
1824 if (SrcElt == 0)
1825 V0Elt = i;
1826 } else {
1827 rotate = false;
1828 }
1829 } else if (PrevElt == 0) {
1830 // First time through, need to keep track of previous element
1831 PrevElt = SrcElt;
1832 } else {
1833 // This isn't a rotation, takes elements from vector 2
1834 rotate = false;
1835 }
1836 }
Scott Michel8efdca42007-12-04 22:23:35 +00001837 }
Scott Michel8efdca42007-12-04 22:23:35 +00001838 }
1839
1840 if (EltsFromV2 == 1 && monotonic) {
1841 // Compute mask and shuffle
1842 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner1b989192007-12-31 04:13:23 +00001843 MachineRegisterInfo &RegInfo = MF.getRegInfo();
1844 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
Duncan Sands92c43912008-06-06 12:08:01 +00001845 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel8efdca42007-12-04 22:23:35 +00001846 // Initialize temporary register to 0
Dan Gohman8181bd12008-07-27 21:46:04 +00001847 SDValue InitTempReg =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001848 DAG.getCopyToReg(DAG.getEntryNode(), dl, VReg, DAG.getConstant(0, PtrVT));
Scott Michel56a125e2008-11-22 23:50:42 +00001849 // Copy register's contents as index in SHUFFLE_MASK:
Dan Gohman8181bd12008-07-27 21:46:04 +00001850 SDValue ShufMaskOp =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001851 DAG.getNode(SPUISD::SHUFFLE_MASK, dl, MVT::v4i32,
Scott Michel5a6f17b2008-01-30 02:55:46 +00001852 DAG.getTargetConstant(V2Elt, MVT::i32),
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001853 DAG.getCopyFromReg(InitTempReg, dl, VReg, PtrVT));
Scott Michel8efdca42007-12-04 22:23:35 +00001854 // Use shuffle mask in SHUFB synthetic instruction:
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001855 return DAG.getNode(SPUISD::SHUFB, dl, V1.getValueType(), V2, V1,
1856 ShufMaskOp);
Scott Michele2641a12008-12-04 21:01:44 +00001857 } else if (rotate) {
1858 int rotamt = (MaxElts - V0Elt) * EltVT.getSizeInBits()/8;
Scott Michelae5cbf52008-12-29 03:23:36 +00001859
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001860 return DAG.getNode(SPUISD::ROTBYTES_LEFT, dl, V1.getValueType(),
Scott Michele2641a12008-12-04 21:01:44 +00001861 V1, DAG.getConstant(rotamt, MVT::i16));
Scott Michel8efdca42007-12-04 22:23:35 +00001862 } else {
Gabor Greife9f7f582008-08-31 15:37:04 +00001863 // Convert the SHUFFLE_VECTOR mask's input element units to the
1864 // actual bytes.
Duncan Sands92c43912008-06-06 12:08:01 +00001865 unsigned BytesPerElement = EltVT.getSizeInBits()/8;
Scott Michel4ec722e2008-07-16 17:17:29 +00001866
Dan Gohman8181bd12008-07-27 21:46:04 +00001867 SmallVector<SDValue, 16> ResultMask;
Scott Michel8efdca42007-12-04 22:23:35 +00001868 for (unsigned i = 0, e = PermMask.getNumOperands(); i != e; ++i) {
1869 unsigned SrcElt;
1870 if (PermMask.getOperand(i).getOpcode() == ISD::UNDEF)
Scott Michel5a6f17b2008-01-30 02:55:46 +00001871 SrcElt = 0;
Scott Michel4ec722e2008-07-16 17:17:29 +00001872 else
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001873 SrcElt = cast<ConstantSDNode>(PermMask.getOperand(i))->getZExtValue();
Scott Michel4ec722e2008-07-16 17:17:29 +00001874
Scott Michel97872d32008-02-23 18:41:37 +00001875 for (unsigned j = 0; j < BytesPerElement; ++j) {
Scott Michel5a6f17b2008-01-30 02:55:46 +00001876 ResultMask.push_back(DAG.getConstant(SrcElt*BytesPerElement+j,
1877 MVT::i8));
Scott Michel8efdca42007-12-04 22:23:35 +00001878 }
1879 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001880
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001881 SDValue VPermMask = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v16i8,
Scott Michel0718cd82008-12-01 17:56:02 +00001882 &ResultMask[0], ResultMask.size());
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001883 return DAG.getNode(SPUISD::SHUFB, dl, V1.getValueType(), V1, V2, VPermMask);
Scott Michel8efdca42007-12-04 22:23:35 +00001884 }
1885}
1886
Dan Gohman8181bd12008-07-27 21:46:04 +00001887static SDValue LowerSCALAR_TO_VECTOR(SDValue Op, SelectionDAG &DAG) {
1888 SDValue Op0 = Op.getOperand(0); // Op0 = the scalar
Dale Johannesen913ba762009-02-06 01:31:28 +00001889 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00001890
Gabor Greif1c80d112008-08-28 21:40:38 +00001891 if (Op0.getNode()->getOpcode() == ISD::Constant) {
Scott Michel8efdca42007-12-04 22:23:35 +00001892 // For a constant, build the appropriate constant vector, which will
1893 // eventually simplify to a vector register load.
1894
Gabor Greif1c80d112008-08-28 21:40:38 +00001895 ConstantSDNode *CN = cast<ConstantSDNode>(Op0.getNode());
Dan Gohman8181bd12008-07-27 21:46:04 +00001896 SmallVector<SDValue, 16> ConstVecValues;
Duncan Sands92c43912008-06-06 12:08:01 +00001897 MVT VT;
Scott Michel8efdca42007-12-04 22:23:35 +00001898 size_t n_copies;
1899
1900 // Create a constant vector:
Duncan Sands92c43912008-06-06 12:08:01 +00001901 switch (Op.getValueType().getSimpleVT()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001902 default: assert(0 && "Unexpected constant value type in "
Scott Michel5a6f17b2008-01-30 02:55:46 +00001903 "LowerSCALAR_TO_VECTOR");
Scott Michel8efdca42007-12-04 22:23:35 +00001904 case MVT::v16i8: n_copies = 16; VT = MVT::i8; break;
1905 case MVT::v8i16: n_copies = 8; VT = MVT::i16; break;
1906 case MVT::v4i32: n_copies = 4; VT = MVT::i32; break;
1907 case MVT::v4f32: n_copies = 4; VT = MVT::f32; break;
1908 case MVT::v2i64: n_copies = 2; VT = MVT::i64; break;
1909 case MVT::v2f64: n_copies = 2; VT = MVT::f64; break;
1910 }
1911
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001912 SDValue CValue = DAG.getConstant(CN->getZExtValue(), VT);
Scott Michel8efdca42007-12-04 22:23:35 +00001913 for (size_t j = 0; j < n_copies; ++j)
1914 ConstVecValues.push_back(CValue);
1915
Dale Johannesen913ba762009-02-06 01:31:28 +00001916 return DAG.getNode(ISD::BUILD_VECTOR, dl, Op.getValueType(),
Scott Michel5a6f17b2008-01-30 02:55:46 +00001917 &ConstVecValues[0], ConstVecValues.size());
Scott Michel8efdca42007-12-04 22:23:35 +00001918 } else {
1919 // Otherwise, copy the value from one register to another:
Duncan Sands92c43912008-06-06 12:08:01 +00001920 switch (Op0.getValueType().getSimpleVT()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001921 default: assert(0 && "Unexpected value type in LowerSCALAR_TO_VECTOR");
1922 case MVT::i8:
1923 case MVT::i16:
1924 case MVT::i32:
1925 case MVT::i64:
1926 case MVT::f32:
1927 case MVT::f64:
Dale Johannesen913ba762009-02-06 01:31:28 +00001928 return DAG.getNode(SPUISD::PREFSLOT2VEC, dl, Op.getValueType(), Op0, Op0);
Scott Michel8efdca42007-12-04 22:23:35 +00001929 }
1930 }
1931
Dan Gohman8181bd12008-07-27 21:46:04 +00001932 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001933}
1934
Dan Gohman8181bd12008-07-27 21:46:04 +00001935static SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) {
Duncan Sands92c43912008-06-06 12:08:01 +00001936 MVT VT = Op.getValueType();
Dan Gohman8181bd12008-07-27 21:46:04 +00001937 SDValue N = Op.getOperand(0);
1938 SDValue Elt = Op.getOperand(1);
Dale Johannesen913ba762009-02-06 01:31:28 +00001939 DebugLoc dl = Op.getDebugLoc();
Scott Michel56a125e2008-11-22 23:50:42 +00001940 SDValue retval;
Scott Michel8efdca42007-12-04 22:23:35 +00001941
Scott Michel56a125e2008-11-22 23:50:42 +00001942 if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Elt)) {
1943 // Constant argument:
1944 int EltNo = (int) C->getZExtValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001945
Scott Michel56a125e2008-11-22 23:50:42 +00001946 // sanity checks:
1947 if (VT == MVT::i8 && EltNo >= 16)
1948 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i8 extraction slot > 15");
1949 else if (VT == MVT::i16 && EltNo >= 8)
1950 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i16 extraction slot > 7");
1951 else if (VT == MVT::i32 && EltNo >= 4)
1952 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i32 extraction slot > 4");
1953 else if (VT == MVT::i64 && EltNo >= 2)
1954 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i64 extraction slot > 2");
Scott Michel8efdca42007-12-04 22:23:35 +00001955
Scott Michel56a125e2008-11-22 23:50:42 +00001956 if (EltNo == 0 && (VT == MVT::i32 || VT == MVT::i64)) {
1957 // i32 and i64: Element 0 is the preferred slot
Dale Johannesen913ba762009-02-06 01:31:28 +00001958 return DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT, N);
Scott Michel56a125e2008-11-22 23:50:42 +00001959 }
Scott Michel8efdca42007-12-04 22:23:35 +00001960
Scott Michel56a125e2008-11-22 23:50:42 +00001961 // Need to generate shuffle mask and extract:
1962 int prefslot_begin = -1, prefslot_end = -1;
1963 int elt_byte = EltNo * VT.getSizeInBits() / 8;
1964
1965 switch (VT.getSimpleVT()) {
1966 default:
1967 assert(false && "Invalid value type!");
1968 case MVT::i8: {
1969 prefslot_begin = prefslot_end = 3;
1970 break;
1971 }
1972 case MVT::i16: {
1973 prefslot_begin = 2; prefslot_end = 3;
1974 break;
1975 }
1976 case MVT::i32:
1977 case MVT::f32: {
1978 prefslot_begin = 0; prefslot_end = 3;
1979 break;
1980 }
1981 case MVT::i64:
1982 case MVT::f64: {
1983 prefslot_begin = 0; prefslot_end = 7;
1984 break;
1985 }
1986 }
1987
1988 assert(prefslot_begin != -1 && prefslot_end != -1 &&
1989 "LowerEXTRACT_VECTOR_ELT: preferred slots uninitialized");
1990
1991 unsigned int ShufBytes[16];
1992 for (int i = 0; i < 16; ++i) {
1993 // zero fill uppper part of preferred slot, don't care about the
1994 // other slots:
1995 unsigned int mask_val;
1996 if (i <= prefslot_end) {
1997 mask_val =
1998 ((i < prefslot_begin)
1999 ? 0x80
2000 : elt_byte + (i - prefslot_begin));
2001
2002 ShufBytes[i] = mask_val;
2003 } else
2004 ShufBytes[i] = ShufBytes[i % (prefslot_end + 1)];
2005 }
2006
2007 SDValue ShufMask[4];
2008 for (unsigned i = 0; i < sizeof(ShufMask)/sizeof(ShufMask[0]); ++i) {
Scott Michele2641a12008-12-04 21:01:44 +00002009 unsigned bidx = i * 4;
Scott Michel56a125e2008-11-22 23:50:42 +00002010 unsigned int bits = ((ShufBytes[bidx] << 24) |
2011 (ShufBytes[bidx+1] << 16) |
2012 (ShufBytes[bidx+2] << 8) |
2013 ShufBytes[bidx+3]);
2014 ShufMask[i] = DAG.getConstant(bits, MVT::i32);
2015 }
2016
Dale Johannesen913ba762009-02-06 01:31:28 +00002017 SDValue ShufMaskVec = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
Scott Michel56a125e2008-11-22 23:50:42 +00002018 &ShufMask[0],
2019 sizeof(ShufMask) / sizeof(ShufMask[0]));
2020
Dale Johannesen913ba762009-02-06 01:31:28 +00002021 retval = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT,
2022 DAG.getNode(SPUISD::SHUFB, dl, N.getValueType(),
Scott Michel56a125e2008-11-22 23:50:42 +00002023 N, N, ShufMaskVec));
2024 } else {
2025 // Variable index: Rotate the requested element into slot 0, then replicate
2026 // slot 0 across the vector
2027 MVT VecVT = N.getValueType();
2028 if (!VecVT.isSimple() || !VecVT.isVector() || !VecVT.is128BitVector()) {
2029 cerr << "LowerEXTRACT_VECTOR_ELT: Must have a simple, 128-bit vector type!\n";
2030 abort();
2031 }
2032
2033 // Make life easier by making sure the index is zero-extended to i32
2034 if (Elt.getValueType() != MVT::i32)
Dale Johannesen913ba762009-02-06 01:31:28 +00002035 Elt = DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i32, Elt);
Scott Michel56a125e2008-11-22 23:50:42 +00002036
2037 // Scale the index to a bit/byte shift quantity
2038 APInt scaleFactor =
Scott Michelc630c412008-11-24 17:11:17 +00002039 APInt(32, uint64_t(16 / N.getValueType().getVectorNumElements()), false);
2040 unsigned scaleShift = scaleFactor.logBase2();
Scott Michel56a125e2008-11-22 23:50:42 +00002041 SDValue vecShift;
Scott Michel56a125e2008-11-22 23:50:42 +00002042
Scott Michelc630c412008-11-24 17:11:17 +00002043 if (scaleShift > 0) {
2044 // Scale the shift factor:
Dale Johannesen913ba762009-02-06 01:31:28 +00002045 Elt = DAG.getNode(ISD::SHL, dl, MVT::i32, Elt,
Scott Michel0718cd82008-12-01 17:56:02 +00002046 DAG.getConstant(scaleShift, MVT::i32));
Scott Michel56a125e2008-11-22 23:50:42 +00002047 }
2048
Dale Johannesen913ba762009-02-06 01:31:28 +00002049 vecShift = DAG.getNode(SPUISD::SHLQUAD_L_BYTES, dl, VecVT, N, Elt);
Scott Michelc630c412008-11-24 17:11:17 +00002050
2051 // Replicate the bytes starting at byte 0 across the entire vector (for
2052 // consistency with the notion of a unified register set)
Scott Michel56a125e2008-11-22 23:50:42 +00002053 SDValue replicate;
2054
2055 switch (VT.getSimpleVT()) {
2056 default:
2057 cerr << "LowerEXTRACT_VECTOR_ELT(varable): Unhandled vector type\n";
2058 abort();
2059 /*NOTREACHED*/
2060 case MVT::i8: {
Scott Michelc630c412008-11-24 17:11:17 +00002061 SDValue factor = DAG.getConstant(0x00000000, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00002062 replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, factor, factor,
Scott Michel56a125e2008-11-22 23:50:42 +00002063 factor, factor);
2064 break;
2065 }
2066 case MVT::i16: {
Scott Michelc630c412008-11-24 17:11:17 +00002067 SDValue factor = DAG.getConstant(0x00010001, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00002068 replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, factor, factor,
Scott Michel56a125e2008-11-22 23:50:42 +00002069 factor, factor);
2070 break;
2071 }
2072 case MVT::i32:
2073 case MVT::f32: {
2074 SDValue factor = DAG.getConstant(0x00010203, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00002075 replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, factor, factor,
Scott Michel56a125e2008-11-22 23:50:42 +00002076 factor, factor);
2077 break;
2078 }
2079 case MVT::i64:
2080 case MVT::f64: {
2081 SDValue loFactor = DAG.getConstant(0x00010203, MVT::i32);
2082 SDValue hiFactor = DAG.getConstant(0x04050607, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00002083 replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
2084 loFactor, hiFactor, loFactor, hiFactor);
Scott Michel56a125e2008-11-22 23:50:42 +00002085 break;
2086 }
2087 }
2088
Dale Johannesen913ba762009-02-06 01:31:28 +00002089 retval = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT,
2090 DAG.getNode(SPUISD::SHUFB, dl, VecVT,
Scott Michel0718cd82008-12-01 17:56:02 +00002091 vecShift, vecShift, replicate));
Scott Michel8efdca42007-12-04 22:23:35 +00002092 }
2093
Scott Michel56a125e2008-11-22 23:50:42 +00002094 return retval;
Scott Michel8efdca42007-12-04 22:23:35 +00002095}
2096
Dan Gohman8181bd12008-07-27 21:46:04 +00002097static SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) {
2098 SDValue VecOp = Op.getOperand(0);
2099 SDValue ValOp = Op.getOperand(1);
2100 SDValue IdxOp = Op.getOperand(2);
Dale Johannesen913ba762009-02-06 01:31:28 +00002101 DebugLoc dl = Op.getDebugLoc();
Duncan Sands92c43912008-06-06 12:08:01 +00002102 MVT VT = Op.getValueType();
Scott Michel8efdca42007-12-04 22:23:35 +00002103
2104 ConstantSDNode *CN = cast<ConstantSDNode>(IdxOp);
2105 assert(CN != 0 && "LowerINSERT_VECTOR_ELT: Index is not constant!");
2106
Duncan Sands92c43912008-06-06 12:08:01 +00002107 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel0718cd82008-12-01 17:56:02 +00002108 // Use $sp ($1) because it's always 16-byte aligned and it's available:
Dale Johannesen913ba762009-02-06 01:31:28 +00002109 SDValue Pointer = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michel0718cd82008-12-01 17:56:02 +00002110 DAG.getRegister(SPU::R1, PtrVT),
2111 DAG.getConstant(CN->getSExtValue(), PtrVT));
Dale Johannesen913ba762009-02-06 01:31:28 +00002112 SDValue ShufMask = DAG.getNode(SPUISD::SHUFFLE_MASK, dl, VT, Pointer);
Scott Michel8efdca42007-12-04 22:23:35 +00002113
Dan Gohman8181bd12008-07-27 21:46:04 +00002114 SDValue result =
Dale Johannesen913ba762009-02-06 01:31:28 +00002115 DAG.getNode(SPUISD::SHUFB, dl, VT,
2116 DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, VT, ValOp),
Scott Michelae5cbf52008-12-29 03:23:36 +00002117 VecOp,
Dale Johannesen913ba762009-02-06 01:31:28 +00002118 DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v4i32, ShufMask));
Scott Michel8efdca42007-12-04 22:23:35 +00002119
2120 return result;
2121}
2122
Scott Michel06eabde2008-12-27 04:51:36 +00002123static SDValue LowerI8Math(SDValue Op, SelectionDAG &DAG, unsigned Opc,
2124 const TargetLowering &TLI)
Scott Michel97872d32008-02-23 18:41:37 +00002125{
Dan Gohman8181bd12008-07-27 21:46:04 +00002126 SDValue N0 = Op.getOperand(0); // Everything has at least one operand
Dale Johannesen913ba762009-02-06 01:31:28 +00002127 DebugLoc dl = Op.getDebugLoc();
Scott Michel06eabde2008-12-27 04:51:36 +00002128 MVT ShiftVT = TLI.getShiftAmountTy();
Scott Michel8efdca42007-12-04 22:23:35 +00002129
2130 assert(Op.getValueType() == MVT::i8);
2131 switch (Opc) {
2132 default:
2133 assert(0 && "Unhandled i8 math operator");
2134 /*NOTREACHED*/
2135 break;
Scott Michel4d07fb72008-12-30 23:28:25 +00002136 case ISD::ADD: {
2137 // 8-bit addition: Promote the arguments up to 16-bits and truncate
2138 // the result:
2139 SDValue N1 = Op.getOperand(1);
Dale Johannesen913ba762009-02-06 01:31:28 +00002140 N0 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0);
2141 N1 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N1);
2142 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2143 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel4d07fb72008-12-30 23:28:25 +00002144
2145 }
2146
Scott Michel8efdca42007-12-04 22:23:35 +00002147 case ISD::SUB: {
2148 // 8-bit subtraction: Promote the arguments up to 16-bits and truncate
2149 // the result:
Dan Gohman8181bd12008-07-27 21:46:04 +00002150 SDValue N1 = Op.getOperand(1);
Dale Johannesen913ba762009-02-06 01:31:28 +00002151 N0 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0);
2152 N1 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N1);
2153 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2154 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel4ec722e2008-07-16 17:17:29 +00002155 }
Scott Michel8efdca42007-12-04 22:23:35 +00002156 case ISD::ROTR:
2157 case ISD::ROTL: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002158 SDValue N1 = Op.getOperand(1);
Scott Michel8efdca42007-12-04 22:23:35 +00002159 unsigned N1Opc;
2160 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002161 ? DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i16, N0)
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002162 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
2163 MVT::i16));
Scott Michel06eabde2008-12-27 04:51:36 +00002164 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greife9f7f582008-08-31 15:37:04 +00002165 ? ISD::ZERO_EXTEND
2166 : ISD::TRUNCATE;
Scott Michel8efdca42007-12-04 22:23:35 +00002167 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002168 ? DAG.getNode(N1Opc, dl, ShiftVT, N1)
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002169 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(),
Scott Michel06eabde2008-12-27 04:51:36 +00002170 TLI.getShiftAmountTy()));
Dan Gohman8181bd12008-07-27 21:46:04 +00002171 SDValue ExpandArg =
Dale Johannesen913ba762009-02-06 01:31:28 +00002172 DAG.getNode(ISD::OR, dl, MVT::i16, N0,
2173 DAG.getNode(ISD::SHL, dl, MVT::i16,
Duncan Sands7aef60d2008-10-30 19:24:28 +00002174 N0, DAG.getConstant(8, MVT::i32)));
Dale Johannesen913ba762009-02-06 01:31:28 +00002175 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2176 DAG.getNode(Opc, dl, MVT::i16, ExpandArg, N1));
Scott Michel8efdca42007-12-04 22:23:35 +00002177 }
2178 case ISD::SRL:
2179 case ISD::SHL: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002180 SDValue N1 = Op.getOperand(1);
Scott Michel8efdca42007-12-04 22:23:35 +00002181 unsigned N1Opc;
2182 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002183 ? DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i16, N0)
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002184 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
Scott Michel06eabde2008-12-27 04:51:36 +00002185 MVT::i32));
2186 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greife9f7f582008-08-31 15:37:04 +00002187 ? ISD::ZERO_EXTEND
2188 : ISD::TRUNCATE;
Scott Michel8efdca42007-12-04 22:23:35 +00002189 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002190 ? DAG.getNode(N1Opc, dl, ShiftVT, N1)
Scott Michel06eabde2008-12-27 04:51:36 +00002191 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(), ShiftVT));
Dale Johannesen913ba762009-02-06 01:31:28 +00002192 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2193 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel8efdca42007-12-04 22:23:35 +00002194 }
2195 case ISD::SRA: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002196 SDValue N1 = Op.getOperand(1);
Scott Michel8efdca42007-12-04 22:23:35 +00002197 unsigned N1Opc;
2198 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002199 ? DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0)
Scott Michel06eabde2008-12-27 04:51:36 +00002200 : DAG.getConstant(cast<ConstantSDNode>(N0)->getSExtValue(),
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002201 MVT::i16));
Scott Michel06eabde2008-12-27 04:51:36 +00002202 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greife9f7f582008-08-31 15:37:04 +00002203 ? ISD::SIGN_EXTEND
2204 : ISD::TRUNCATE;
Scott Michel8efdca42007-12-04 22:23:35 +00002205 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002206 ? DAG.getNode(N1Opc, dl, ShiftVT, N1)
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002207 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(),
Scott Michel06eabde2008-12-27 04:51:36 +00002208 ShiftVT));
Dale Johannesen913ba762009-02-06 01:31:28 +00002209 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2210 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel8efdca42007-12-04 22:23:35 +00002211 }
2212 case ISD::MUL: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002213 SDValue N1 = Op.getOperand(1);
Scott Michel8efdca42007-12-04 22:23:35 +00002214 unsigned N1Opc;
2215 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002216 ? DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0)
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002217 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
2218 MVT::i16));
Duncan Sandsec142ee2008-06-08 20:54:56 +00002219 N1Opc = N1.getValueType().bitsLT(MVT::i16) ? ISD::SIGN_EXTEND : ISD::TRUNCATE;
Scott Michel8efdca42007-12-04 22:23:35 +00002220 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002221 ? DAG.getNode(N1Opc, dl, MVT::i16, N1)
Scott Michel06eabde2008-12-27 04:51:36 +00002222 : DAG.getConstant(cast<ConstantSDNode>(N1)->getSExtValue(),
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002223 MVT::i16));
Dale Johannesen913ba762009-02-06 01:31:28 +00002224 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2225 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel8efdca42007-12-04 22:23:35 +00002226 break;
2227 }
2228 }
2229
Dan Gohman8181bd12008-07-27 21:46:04 +00002230 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00002231}
2232
Scott Michel750b93f2009-01-15 04:41:47 +00002233//! Generate the carry-generate shuffle mask.
Dale Johannesen913ba762009-02-06 01:31:28 +00002234SDValue SPU::getCarryGenerateShufMask(SelectionDAG &DAG, DebugLoc dl) {
Scott Michel8c67fa42009-01-21 04:58:48 +00002235 SmallVector<SDValue, 16 > ShufBytes;
Scott Michel97872d32008-02-23 18:41:37 +00002236
Scott Michel8c67fa42009-01-21 04:58:48 +00002237 // Create the shuffle mask for "rotating" the borrow up one register slot
2238 // once the borrow is generated.
2239 ShufBytes.push_back(DAG.getConstant(0x04050607, MVT::i32));
2240 ShufBytes.push_back(DAG.getConstant(0x80808080, MVT::i32));
2241 ShufBytes.push_back(DAG.getConstant(0x0c0d0e0f, MVT::i32));
2242 ShufBytes.push_back(DAG.getConstant(0x80808080, MVT::i32));
Scott Michel97872d32008-02-23 18:41:37 +00002243
Dale Johannesen913ba762009-02-06 01:31:28 +00002244 return DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
Scott Michel8c67fa42009-01-21 04:58:48 +00002245 &ShufBytes[0], ShufBytes.size());
Scott Michel750b93f2009-01-15 04:41:47 +00002246}
Scott Michel97872d32008-02-23 18:41:37 +00002247
Scott Michel750b93f2009-01-15 04:41:47 +00002248//! Generate the borrow-generate shuffle mask
Dale Johannesen913ba762009-02-06 01:31:28 +00002249SDValue SPU::getBorrowGenerateShufMask(SelectionDAG &DAG, DebugLoc dl) {
Scott Michel8c67fa42009-01-21 04:58:48 +00002250 SmallVector<SDValue, 16 > ShufBytes;
Scott Michel97872d32008-02-23 18:41:37 +00002251
Scott Michel8c67fa42009-01-21 04:58:48 +00002252 // Create the shuffle mask for "rotating" the borrow up one register slot
2253 // once the borrow is generated.
2254 ShufBytes.push_back(DAG.getConstant(0x04050607, MVT::i32));
2255 ShufBytes.push_back(DAG.getConstant(0xc0c0c0c0, MVT::i32));
2256 ShufBytes.push_back(DAG.getConstant(0x0c0d0e0f, MVT::i32));
2257 ShufBytes.push_back(DAG.getConstant(0xc0c0c0c0, MVT::i32));
Scott Michelf2df6cb2008-11-24 18:20:46 +00002258
Dale Johannesen913ba762009-02-06 01:31:28 +00002259 return DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
Scott Michel8c67fa42009-01-21 04:58:48 +00002260 &ShufBytes[0], ShufBytes.size());
Scott Michel97872d32008-02-23 18:41:37 +00002261}
2262
Scott Michel8efdca42007-12-04 22:23:35 +00002263//! Lower byte immediate operations for v16i8 vectors:
Dan Gohman8181bd12008-07-27 21:46:04 +00002264static SDValue
2265LowerByteImmed(SDValue Op, SelectionDAG &DAG) {
2266 SDValue ConstVec;
2267 SDValue Arg;
Duncan Sands92c43912008-06-06 12:08:01 +00002268 MVT VT = Op.getValueType();
Dale Johannesen913ba762009-02-06 01:31:28 +00002269 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00002270
2271 ConstVec = Op.getOperand(0);
2272 Arg = Op.getOperand(1);
Gabor Greif1c80d112008-08-28 21:40:38 +00002273 if (ConstVec.getNode()->getOpcode() != ISD::BUILD_VECTOR) {
2274 if (ConstVec.getNode()->getOpcode() == ISD::BIT_CONVERT) {
Scott Michel8efdca42007-12-04 22:23:35 +00002275 ConstVec = ConstVec.getOperand(0);
2276 } else {
2277 ConstVec = Op.getOperand(1);
2278 Arg = Op.getOperand(0);
Gabor Greif1c80d112008-08-28 21:40:38 +00002279 if (ConstVec.getNode()->getOpcode() == ISD::BIT_CONVERT) {
Scott Michel5a6f17b2008-01-30 02:55:46 +00002280 ConstVec = ConstVec.getOperand(0);
Scott Michel8efdca42007-12-04 22:23:35 +00002281 }
2282 }
2283 }
2284
Gabor Greif1c80d112008-08-28 21:40:38 +00002285 if (ConstVec.getNode()->getOpcode() == ISD::BUILD_VECTOR) {
Scott Michel8efdca42007-12-04 22:23:35 +00002286 uint64_t VectorBits[2];
2287 uint64_t UndefBits[2];
2288 uint64_t SplatBits, SplatUndef;
2289 int SplatSize;
2290
Gabor Greif1c80d112008-08-28 21:40:38 +00002291 if (!GetConstantBuildVectorBits(ConstVec.getNode(), VectorBits, UndefBits)
Scott Michel5a6f17b2008-01-30 02:55:46 +00002292 && isConstantSplat(VectorBits, UndefBits,
Duncan Sands92c43912008-06-06 12:08:01 +00002293 VT.getVectorElementType().getSizeInBits(),
Scott Michel5a6f17b2008-01-30 02:55:46 +00002294 SplatBits, SplatUndef, SplatSize)) {
Dan Gohman8181bd12008-07-27 21:46:04 +00002295 SDValue tcVec[16];
2296 SDValue tc = DAG.getTargetConstant(SplatBits & 0xff, MVT::i8);
Scott Michel8efdca42007-12-04 22:23:35 +00002297 const size_t tcVecSize = sizeof(tcVec) / sizeof(tcVec[0]);
2298
2299 // Turn the BUILD_VECTOR into a set of target constants:
2300 for (size_t i = 0; i < tcVecSize; ++i)
Scott Michel5a6f17b2008-01-30 02:55:46 +00002301 tcVec[i] = tc;
Scott Michel8efdca42007-12-04 22:23:35 +00002302
Dale Johannesen913ba762009-02-06 01:31:28 +00002303 return DAG.getNode(Op.getNode()->getOpcode(), dl, VT, Arg,
2304 DAG.getNode(ISD::BUILD_VECTOR, dl, VT,
2305 tcVec, tcVecSize));
Scott Michel8efdca42007-12-04 22:23:35 +00002306 }
2307 }
Scott Michelc899a122009-01-26 22:33:37 +00002308
Nate Begeman7569e762008-07-29 19:07:27 +00002309 // These operations (AND, OR, XOR) are legal, they just couldn't be custom
2310 // lowered. Return the operation, rather than a null SDValue.
2311 return Op;
Scott Michel8efdca42007-12-04 22:23:35 +00002312}
2313
Scott Michel8efdca42007-12-04 22:23:35 +00002314//! Custom lowering for CTPOP (count population)
2315/*!
2316 Custom lowering code that counts the number ones in the input
2317 operand. SPU has such an instruction, but it counts the number of
2318 ones per byte, which then have to be accumulated.
2319*/
Dan Gohman8181bd12008-07-27 21:46:04 +00002320static SDValue LowerCTPOP(SDValue Op, SelectionDAG &DAG) {
Duncan Sands92c43912008-06-06 12:08:01 +00002321 MVT VT = Op.getValueType();
2322 MVT vecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits()));
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002323 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00002324
Duncan Sands92c43912008-06-06 12:08:01 +00002325 switch (VT.getSimpleVT()) {
2326 default:
2327 assert(false && "Invalid value type!");
Scott Michel8efdca42007-12-04 22:23:35 +00002328 case MVT::i8: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002329 SDValue N = Op.getOperand(0);
2330 SDValue Elt0 = DAG.getConstant(0, MVT::i32);
Scott Michel8efdca42007-12-04 22:23:35 +00002331
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002332 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N);
2333 SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote);
Scott Michel8efdca42007-12-04 22:23:35 +00002334
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002335 return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i8, CNTB, Elt0);
Scott Michel8efdca42007-12-04 22:23:35 +00002336 }
2337
2338 case MVT::i16: {
2339 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner1b989192007-12-31 04:13:23 +00002340 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Michel8efdca42007-12-04 22:23:35 +00002341
Chris Lattner1b989192007-12-31 04:13:23 +00002342 unsigned CNTB_reg = RegInfo.createVirtualRegister(&SPU::R16CRegClass);
Scott Michel8efdca42007-12-04 22:23:35 +00002343
Dan Gohman8181bd12008-07-27 21:46:04 +00002344 SDValue N = Op.getOperand(0);
2345 SDValue Elt0 = DAG.getConstant(0, MVT::i16);
2346 SDValue Mask0 = DAG.getConstant(0x0f, MVT::i16);
Duncan Sands7aef60d2008-10-30 19:24:28 +00002347 SDValue Shift1 = DAG.getConstant(8, MVT::i32);
Scott Michel8efdca42007-12-04 22:23:35 +00002348
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002349 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N);
2350 SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote);
Scott Michel8efdca42007-12-04 22:23:35 +00002351
2352 // CNTB_result becomes the chain to which all of the virtual registers
2353 // CNTB_reg, SUM1_reg become associated:
Dan Gohman8181bd12008-07-27 21:46:04 +00002354 SDValue CNTB_result =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002355 DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i16, CNTB, Elt0);
Scott Michel4ec722e2008-07-16 17:17:29 +00002356
Dan Gohman8181bd12008-07-27 21:46:04 +00002357 SDValue CNTB_rescopy =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002358 DAG.getCopyToReg(CNTB_result, dl, CNTB_reg, CNTB_result);
Scott Michel8efdca42007-12-04 22:23:35 +00002359
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002360 SDValue Tmp1 = DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i16);
Scott Michel8efdca42007-12-04 22:23:35 +00002361
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002362 return DAG.getNode(ISD::AND, dl, MVT::i16,
2363 DAG.getNode(ISD::ADD, dl, MVT::i16,
2364 DAG.getNode(ISD::SRL, dl, MVT::i16,
Scott Michel5a6f17b2008-01-30 02:55:46 +00002365 Tmp1, Shift1),
2366 Tmp1),
2367 Mask0);
Scott Michel8efdca42007-12-04 22:23:35 +00002368 }
2369
2370 case MVT::i32: {
2371 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner1b989192007-12-31 04:13:23 +00002372 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Michel8efdca42007-12-04 22:23:35 +00002373
Chris Lattner1b989192007-12-31 04:13:23 +00002374 unsigned CNTB_reg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
2375 unsigned SUM1_reg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
Scott Michel8efdca42007-12-04 22:23:35 +00002376
Dan Gohman8181bd12008-07-27 21:46:04 +00002377 SDValue N = Op.getOperand(0);
2378 SDValue Elt0 = DAG.getConstant(0, MVT::i32);
2379 SDValue Mask0 = DAG.getConstant(0xff, MVT::i32);
2380 SDValue Shift1 = DAG.getConstant(16, MVT::i32);
2381 SDValue Shift2 = DAG.getConstant(8, MVT::i32);
Scott Michel8efdca42007-12-04 22:23:35 +00002382
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002383 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N);
2384 SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote);
Scott Michel8efdca42007-12-04 22:23:35 +00002385
2386 // CNTB_result becomes the chain to which all of the virtual registers
2387 // CNTB_reg, SUM1_reg become associated:
Dan Gohman8181bd12008-07-27 21:46:04 +00002388 SDValue CNTB_result =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002389 DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i32, CNTB, Elt0);
Scott Michel4ec722e2008-07-16 17:17:29 +00002390
Dan Gohman8181bd12008-07-27 21:46:04 +00002391 SDValue CNTB_rescopy =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002392 DAG.getCopyToReg(CNTB_result, dl, CNTB_reg, CNTB_result);
Scott Michel8efdca42007-12-04 22:23:35 +00002393
Dan Gohman8181bd12008-07-27 21:46:04 +00002394 SDValue Comp1 =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002395 DAG.getNode(ISD::SRL, dl, MVT::i32,
2396 DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i32),
2397 Shift1);
Scott Michel8efdca42007-12-04 22:23:35 +00002398
Dan Gohman8181bd12008-07-27 21:46:04 +00002399 SDValue Sum1 =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002400 DAG.getNode(ISD::ADD, dl, MVT::i32, Comp1,
2401 DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i32));
Scott Michel8efdca42007-12-04 22:23:35 +00002402
Dan Gohman8181bd12008-07-27 21:46:04 +00002403 SDValue Sum1_rescopy =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002404 DAG.getCopyToReg(CNTB_result, dl, SUM1_reg, Sum1);
Scott Michel8efdca42007-12-04 22:23:35 +00002405
Dan Gohman8181bd12008-07-27 21:46:04 +00002406 SDValue Comp2 =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002407 DAG.getNode(ISD::SRL, dl, MVT::i32,
2408 DAG.getCopyFromReg(Sum1_rescopy, dl, SUM1_reg, MVT::i32),
Scott Michel5a6f17b2008-01-30 02:55:46 +00002409 Shift2);
Dan Gohman8181bd12008-07-27 21:46:04 +00002410 SDValue Sum2 =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002411 DAG.getNode(ISD::ADD, dl, MVT::i32, Comp2,
2412 DAG.getCopyFromReg(Sum1_rescopy, dl, SUM1_reg, MVT::i32));
Scott Michel8efdca42007-12-04 22:23:35 +00002413
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002414 return DAG.getNode(ISD::AND, dl, MVT::i32, Sum2, Mask0);
Scott Michel8efdca42007-12-04 22:23:35 +00002415 }
2416
2417 case MVT::i64:
2418 break;
2419 }
2420
Dan Gohman8181bd12008-07-27 21:46:04 +00002421 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00002422}
2423
pingbak2f387e82009-01-26 03:31:40 +00002424//! Lower ISD::FP_TO_SINT, ISD::FP_TO_UINT for i32
Scott Michel8c67fa42009-01-21 04:58:48 +00002425/*!
pingbak2f387e82009-01-26 03:31:40 +00002426 f32->i32 passes through unchanged, whereas f64->i32 expands to a libcall.
2427 All conversions to i64 are expanded to a libcall.
Scott Michel8c67fa42009-01-21 04:58:48 +00002428 */
pingbak2f387e82009-01-26 03:31:40 +00002429static SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG,
2430 SPUTargetLowering &TLI) {
Scott Michel8c67fa42009-01-21 04:58:48 +00002431 MVT OpVT = Op.getValueType();
Scott Michel8c67fa42009-01-21 04:58:48 +00002432 SDValue Op0 = Op.getOperand(0);
pingbak2f387e82009-01-26 03:31:40 +00002433 MVT Op0VT = Op0.getValueType();
Scott Michel8c67fa42009-01-21 04:58:48 +00002434
pingbak2f387e82009-01-26 03:31:40 +00002435 if ((OpVT == MVT::i32 && Op0VT == MVT::f64)
2436 || OpVT == MVT::i64) {
2437 // Convert f32 / f64 to i32 / i64 via libcall.
2438 RTLIB::Libcall LC =
2439 (Op.getOpcode() == ISD::FP_TO_SINT)
2440 ? RTLIB::getFPTOSINT(Op0VT, OpVT)
2441 : RTLIB::getFPTOUINT(Op0VT, OpVT);
2442 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unexpectd fp-to-int conversion!");
2443 SDValue Dummy;
2444 return ExpandLibCall(LC, Op, DAG, false, Dummy, TLI);
2445 }
Scott Michel8c67fa42009-01-21 04:58:48 +00002446
Scott Michelc899a122009-01-26 22:33:37 +00002447 return Op; // return unmolested, legalized op
pingbak2f387e82009-01-26 03:31:40 +00002448}
Scott Michel8c67fa42009-01-21 04:58:48 +00002449
pingbak2f387e82009-01-26 03:31:40 +00002450//! Lower ISD::SINT_TO_FP, ISD::UINT_TO_FP for i32
2451/*!
2452 i32->f32 passes through unchanged, whereas i32->f64 is expanded to a libcall.
2453 All conversions from i64 are expanded to a libcall.
2454 */
2455static SDValue LowerINT_TO_FP(SDValue Op, SelectionDAG &DAG,
2456 SPUTargetLowering &TLI) {
2457 MVT OpVT = Op.getValueType();
2458 SDValue Op0 = Op.getOperand(0);
2459 MVT Op0VT = Op0.getValueType();
2460
2461 if ((OpVT == MVT::f64 && Op0VT == MVT::i32)
2462 || Op0VT == MVT::i64) {
2463 // Convert i32, i64 to f64 via libcall:
2464 RTLIB::Libcall LC =
2465 (Op.getOpcode() == ISD::SINT_TO_FP)
2466 ? RTLIB::getSINTTOFP(Op0VT, OpVT)
2467 : RTLIB::getUINTTOFP(Op0VT, OpVT);
2468 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unexpectd int-to-fp conversion!");
2469 SDValue Dummy;
2470 return ExpandLibCall(LC, Op, DAG, false, Dummy, TLI);
2471 }
2472
Scott Michelc899a122009-01-26 22:33:37 +00002473 return Op; // return unmolested, legalized
Scott Michel8c67fa42009-01-21 04:58:48 +00002474}
2475
2476//! Lower ISD::SETCC
2477/*!
2478 This handles MVT::f64 (double floating point) condition lowering
2479 */
Scott Michel8c67fa42009-01-21 04:58:48 +00002480static SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG,
2481 const TargetLowering &TLI) {
pingbak2f387e82009-01-26 03:31:40 +00002482 CondCodeSDNode *CC = dyn_cast<CondCodeSDNode>(Op.getOperand(2));
Dale Johannesen85fc0932009-02-04 01:48:28 +00002483 DebugLoc dl = Op.getNode()->getDebugLoc();
pingbak2f387e82009-01-26 03:31:40 +00002484 assert(CC != 0 && "LowerSETCC: CondCodeSDNode should not be null here!\n");
2485
Scott Michel8c67fa42009-01-21 04:58:48 +00002486 SDValue lhs = Op.getOperand(0);
2487 SDValue rhs = Op.getOperand(1);
Scott Michel8c67fa42009-01-21 04:58:48 +00002488 MVT lhsVT = lhs.getValueType();
Scott Michel8c67fa42009-01-21 04:58:48 +00002489 assert(lhsVT == MVT::f64 && "LowerSETCC: type other than MVT::64\n");
2490
pingbak2f387e82009-01-26 03:31:40 +00002491 MVT ccResultVT = TLI.getSetCCResultType(lhs.getValueType());
2492 APInt ccResultOnes = APInt::getAllOnesValue(ccResultVT.getSizeInBits());
2493 MVT IntVT(MVT::i64);
2494
2495 // Take advantage of the fact that (truncate (sra arg, 32)) is efficiently
2496 // selected to a NOP:
Dale Johannesen85fc0932009-02-04 01:48:28 +00002497 SDValue i64lhs = DAG.getNode(ISD::BIT_CONVERT, dl, IntVT, lhs);
pingbak2f387e82009-01-26 03:31:40 +00002498 SDValue lhsHi32 =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002499 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32,
2500 DAG.getNode(ISD::SRL, dl, IntVT,
pingbak2f387e82009-01-26 03:31:40 +00002501 i64lhs, DAG.getConstant(32, MVT::i32)));
2502 SDValue lhsHi32abs =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002503 DAG.getNode(ISD::AND, dl, MVT::i32,
pingbak2f387e82009-01-26 03:31:40 +00002504 lhsHi32, DAG.getConstant(0x7fffffff, MVT::i32));
2505 SDValue lhsLo32 =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002506 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, i64lhs);
pingbak2f387e82009-01-26 03:31:40 +00002507
2508 // SETO and SETUO only use the lhs operand:
2509 if (CC->get() == ISD::SETO) {
2510 // Evaluates to true if Op0 is not [SQ]NaN - lowers to the inverse of
2511 // SETUO
2512 APInt ccResultAllOnes = APInt::getAllOnesValue(ccResultVT.getSizeInBits());
Dale Johannesen85fc0932009-02-04 01:48:28 +00002513 return DAG.getNode(ISD::XOR, dl, ccResultVT,
2514 DAG.getSetCC(dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002515 lhs, DAG.getConstantFP(0.0, lhsVT),
2516 ISD::SETUO),
2517 DAG.getConstant(ccResultAllOnes, ccResultVT));
2518 } else if (CC->get() == ISD::SETUO) {
2519 // Evaluates to true if Op0 is [SQ]NaN
Dale Johannesen85fc0932009-02-04 01:48:28 +00002520 return DAG.getNode(ISD::AND, dl, ccResultVT,
2521 DAG.getSetCC(dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002522 lhsHi32abs,
2523 DAG.getConstant(0x7ff00000, MVT::i32),
2524 ISD::SETGE),
Dale Johannesen85fc0932009-02-04 01:48:28 +00002525 DAG.getSetCC(dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002526 lhsLo32,
2527 DAG.getConstant(0, MVT::i32),
2528 ISD::SETGT));
2529 }
2530
2531 SDValue i64rhs = DAG.getNode(ISD::BIT_CONVERT, IntVT, rhs);
2532 SDValue rhsHi32 =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002533 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32,
2534 DAG.getNode(ISD::SRL, dl, IntVT,
pingbak2f387e82009-01-26 03:31:40 +00002535 i64rhs, DAG.getConstant(32, MVT::i32)));
2536
2537 // If a value is negative, subtract from the sign magnitude constant:
2538 SDValue signMag2TC = DAG.getConstant(0x8000000000000000ULL, IntVT);
2539
2540 // Convert the sign-magnitude representation into 2's complement:
Dale Johannesen85fc0932009-02-04 01:48:28 +00002541 SDValue lhsSelectMask = DAG.getNode(ISD::SRA, dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002542 lhsHi32, DAG.getConstant(31, MVT::i32));
Dale Johannesen85fc0932009-02-04 01:48:28 +00002543 SDValue lhsSignMag2TC = DAG.getNode(ISD::SUB, dl, IntVT, signMag2TC, i64lhs);
pingbak2f387e82009-01-26 03:31:40 +00002544 SDValue lhsSelect =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002545 DAG.getNode(ISD::SELECT, dl, IntVT,
pingbak2f387e82009-01-26 03:31:40 +00002546 lhsSelectMask, lhsSignMag2TC, i64lhs);
2547
Dale Johannesen85fc0932009-02-04 01:48:28 +00002548 SDValue rhsSelectMask = DAG.getNode(ISD::SRA, dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002549 rhsHi32, DAG.getConstant(31, MVT::i32));
Dale Johannesen85fc0932009-02-04 01:48:28 +00002550 SDValue rhsSignMag2TC = DAG.getNode(ISD::SUB, dl, IntVT, signMag2TC, i64rhs);
pingbak2f387e82009-01-26 03:31:40 +00002551 SDValue rhsSelect =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002552 DAG.getNode(ISD::SELECT, dl, IntVT,
pingbak2f387e82009-01-26 03:31:40 +00002553 rhsSelectMask, rhsSignMag2TC, i64rhs);
2554
2555 unsigned compareOp;
2556
Scott Michel8c67fa42009-01-21 04:58:48 +00002557 switch (CC->get()) {
2558 case ISD::SETOEQ:
Scott Michel8c67fa42009-01-21 04:58:48 +00002559 case ISD::SETUEQ:
pingbak2f387e82009-01-26 03:31:40 +00002560 compareOp = ISD::SETEQ; break;
2561 case ISD::SETOGT:
Scott Michel8c67fa42009-01-21 04:58:48 +00002562 case ISD::SETUGT:
pingbak2f387e82009-01-26 03:31:40 +00002563 compareOp = ISD::SETGT; break;
2564 case ISD::SETOGE:
Scott Michel8c67fa42009-01-21 04:58:48 +00002565 case ISD::SETUGE:
pingbak2f387e82009-01-26 03:31:40 +00002566 compareOp = ISD::SETGE; break;
2567 case ISD::SETOLT:
Scott Michel8c67fa42009-01-21 04:58:48 +00002568 case ISD::SETULT:
pingbak2f387e82009-01-26 03:31:40 +00002569 compareOp = ISD::SETLT; break;
2570 case ISD::SETOLE:
Scott Michel8c67fa42009-01-21 04:58:48 +00002571 case ISD::SETULE:
pingbak2f387e82009-01-26 03:31:40 +00002572 compareOp = ISD::SETLE; break;
Scott Michel8c67fa42009-01-21 04:58:48 +00002573 case ISD::SETUNE:
pingbak2f387e82009-01-26 03:31:40 +00002574 case ISD::SETONE:
2575 compareOp = ISD::SETNE; break;
Scott Michel8c67fa42009-01-21 04:58:48 +00002576 default:
2577 cerr << "CellSPU ISel Select: unimplemented f64 condition\n";
2578 abort();
2579 break;
2580 }
2581
pingbak2f387e82009-01-26 03:31:40 +00002582 SDValue result =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002583 DAG.getSetCC(dl, ccResultVT, lhsSelect, rhsSelect,
2584 (ISD::CondCode) compareOp);
pingbak2f387e82009-01-26 03:31:40 +00002585
2586 if ((CC->get() & 0x8) == 0) {
2587 // Ordered comparison:
Dale Johannesen85fc0932009-02-04 01:48:28 +00002588 SDValue lhsNaN = DAG.getSetCC(dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002589 lhs, DAG.getConstantFP(0.0, MVT::f64),
2590 ISD::SETO);
Dale Johannesen85fc0932009-02-04 01:48:28 +00002591 SDValue rhsNaN = DAG.getSetCC(dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002592 rhs, DAG.getConstantFP(0.0, MVT::f64),
2593 ISD::SETO);
Dale Johannesen85fc0932009-02-04 01:48:28 +00002594 SDValue ordered = DAG.getNode(ISD::AND, dl, ccResultVT, lhsNaN, rhsNaN);
pingbak2f387e82009-01-26 03:31:40 +00002595
Dale Johannesen85fc0932009-02-04 01:48:28 +00002596 result = DAG.getNode(ISD::AND, dl, ccResultVT, ordered, result);
pingbak2f387e82009-01-26 03:31:40 +00002597 }
2598
2599 return result;
Scott Michel8c67fa42009-01-21 04:58:48 +00002600}
2601
Scott Michel56a125e2008-11-22 23:50:42 +00002602//! Lower ISD::SELECT_CC
2603/*!
2604 ISD::SELECT_CC can (generally) be implemented directly on the SPU using the
2605 SELB instruction.
2606
2607 \note Need to revisit this in the future: if the code path through the true
2608 and false value computations is longer than the latency of a branch (6
2609 cycles), then it would be more advantageous to branch and insert a new basic
2610 block and branch on the condition. However, this code does not make that
2611 assumption, given the simplisitc uses so far.
2612 */
2613
Scott Michel06eabde2008-12-27 04:51:36 +00002614static SDValue LowerSELECT_CC(SDValue Op, SelectionDAG &DAG,
2615 const TargetLowering &TLI) {
Scott Michel56a125e2008-11-22 23:50:42 +00002616 MVT VT = Op.getValueType();
2617 SDValue lhs = Op.getOperand(0);
2618 SDValue rhs = Op.getOperand(1);
2619 SDValue trueval = Op.getOperand(2);
2620 SDValue falseval = Op.getOperand(3);
2621 SDValue condition = Op.getOperand(4);
2622
Scott Michel06eabde2008-12-27 04:51:36 +00002623 // NOTE: SELB's arguments: $rA, $rB, $mask
2624 //
2625 // SELB selects bits from $rA where bits in $mask are 0, bits from $rB
2626 // where bits in $mask are 1. CCond will be inverted, having 1s where the
2627 // condition was true and 0s where the condition was false. Hence, the
2628 // arguments to SELB get reversed.
2629
Scott Michel56a125e2008-11-22 23:50:42 +00002630 // Note: Really should be ISD::SELECT instead of SPUISD::SELB, but LLVM's
2631 // legalizer insists on combining SETCC/SELECT into SELECT_CC, so we end up
2632 // with another "cannot select select_cc" assert:
2633
Duncan Sands4a361272009-01-01 15:52:00 +00002634 SDValue compare = DAG.getNode(ISD::SETCC,
2635 TLI.getSetCCResultType(Op.getValueType()),
Scott Michel06eabde2008-12-27 04:51:36 +00002636 lhs, rhs, condition);
2637 return DAG.getNode(SPUISD::SELB, VT, falseval, trueval, compare);
Scott Michel56a125e2008-11-22 23:50:42 +00002638}
2639
Scott Michelec8c82e2008-12-02 19:53:53 +00002640//! Custom lower ISD::TRUNCATE
2641static SDValue LowerTRUNCATE(SDValue Op, SelectionDAG &DAG)
2642{
2643 MVT VT = Op.getValueType();
2644 MVT::SimpleValueType simpleVT = VT.getSimpleVT();
2645 MVT VecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits()));
2646
2647 SDValue Op0 = Op.getOperand(0);
2648 MVT Op0VT = Op0.getValueType();
2649 MVT Op0VecVT = MVT::getVectorVT(Op0VT, (128 / Op0VT.getSizeInBits()));
2650
Scott Michel06eabde2008-12-27 04:51:36 +00002651 if (Op0VT.getSimpleVT() == MVT::i128 && simpleVT == MVT::i64) {
Scott Michelc5a29fe2009-01-03 00:27:53 +00002652 // Create shuffle mask, least significant doubleword of quadword
Scott Michel06eabde2008-12-27 04:51:36 +00002653 unsigned maskHigh = 0x08090a0b;
2654 unsigned maskLow = 0x0c0d0e0f;
2655 // Use a shuffle to perform the truncation
2656 SDValue shufMask = DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32,
2657 DAG.getConstant(maskHigh, MVT::i32),
2658 DAG.getConstant(maskLow, MVT::i32),
2659 DAG.getConstant(maskHigh, MVT::i32),
2660 DAG.getConstant(maskLow, MVT::i32));
2661
2662
2663 SDValue PromoteScalar = DAG.getNode(SPUISD::PREFSLOT2VEC, Op0VecVT, Op0);
2664
2665 SDValue truncShuffle = DAG.getNode(SPUISD::SHUFB, Op0VecVT,
2666 PromoteScalar, PromoteScalar, shufMask);
2667
2668 return DAG.getNode(SPUISD::VEC2PREFSLOT, VT,
2669 DAG.getNode(ISD::BIT_CONVERT, VecVT, truncShuffle));
Scott Michelec8c82e2008-12-02 19:53:53 +00002670 }
2671
Scott Michel06eabde2008-12-27 04:51:36 +00002672 return SDValue(); // Leave the truncate unmolested
Scott Michelec8c82e2008-12-02 19:53:53 +00002673}
2674
Scott Michel56a125e2008-11-22 23:50:42 +00002675//! Custom (target-specific) lowering entry point
2676/*!
2677 This is where LLVM's DAG selection process calls to do target-specific
2678 lowering of nodes.
2679 */
Dan Gohman8181bd12008-07-27 21:46:04 +00002680SDValue
2681SPUTargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG)
Scott Michel8efdca42007-12-04 22:23:35 +00002682{
Scott Michel97872d32008-02-23 18:41:37 +00002683 unsigned Opc = (unsigned) Op.getOpcode();
Duncan Sands92c43912008-06-06 12:08:01 +00002684 MVT VT = Op.getValueType();
Scott Michel97872d32008-02-23 18:41:37 +00002685
2686 switch (Opc) {
Scott Michel8efdca42007-12-04 22:23:35 +00002687 default: {
2688 cerr << "SPUTargetLowering::LowerOperation(): need to lower this!\n";
Scott Michel97872d32008-02-23 18:41:37 +00002689 cerr << "Op.getOpcode() = " << Opc << "\n";
Gabor Greif1c80d112008-08-28 21:40:38 +00002690 cerr << "*Op.getNode():\n";
2691 Op.getNode()->dump();
Scott Michel8efdca42007-12-04 22:23:35 +00002692 abort();
2693 }
2694 case ISD::LOAD:
Scott Michelec8c82e2008-12-02 19:53:53 +00002695 case ISD::EXTLOAD:
Scott Michel8efdca42007-12-04 22:23:35 +00002696 case ISD::SEXTLOAD:
2697 case ISD::ZEXTLOAD:
2698 return LowerLOAD(Op, DAG, SPUTM.getSubtargetImpl());
2699 case ISD::STORE:
2700 return LowerSTORE(Op, DAG, SPUTM.getSubtargetImpl());
2701 case ISD::ConstantPool:
2702 return LowerConstantPool(Op, DAG, SPUTM.getSubtargetImpl());
2703 case ISD::GlobalAddress:
2704 return LowerGlobalAddress(Op, DAG, SPUTM.getSubtargetImpl());
2705 case ISD::JumpTable:
2706 return LowerJumpTable(Op, DAG, SPUTM.getSubtargetImpl());
Scott Michel8efdca42007-12-04 22:23:35 +00002707 case ISD::ConstantFP:
2708 return LowerConstantFP(Op, DAG);
2709 case ISD::FORMAL_ARGUMENTS:
Scott Michel394e26d2008-01-17 20:38:41 +00002710 return LowerFORMAL_ARGUMENTS(Op, DAG, VarArgsFrameIndex);
Scott Michel8efdca42007-12-04 22:23:35 +00002711 case ISD::CALL:
Scott Micheldbac4cf2008-01-11 02:53:15 +00002712 return LowerCALL(Op, DAG, SPUTM.getSubtargetImpl());
Scott Michel8efdca42007-12-04 22:23:35 +00002713 case ISD::RET:
2714 return LowerRET(Op, DAG, getTargetMachine());
2715
Scott Michel4d07fb72008-12-30 23:28:25 +00002716 // i8, i64 math ops:
Scott Michel67224b22008-06-02 22:18:03 +00002717 case ISD::ADD:
Scott Michel8efdca42007-12-04 22:23:35 +00002718 case ISD::SUB:
2719 case ISD::ROTR:
2720 case ISD::ROTL:
2721 case ISD::SRL:
2722 case ISD::SHL:
Scott Michel67224b22008-06-02 22:18:03 +00002723 case ISD::SRA: {
Scott Michel97872d32008-02-23 18:41:37 +00002724 if (VT == MVT::i8)
Scott Michel06eabde2008-12-27 04:51:36 +00002725 return LowerI8Math(Op, DAG, Opc, *this);
Scott Michel97872d32008-02-23 18:41:37 +00002726 break;
Scott Michel67224b22008-06-02 22:18:03 +00002727 }
Scott Michel8efdca42007-12-04 22:23:35 +00002728
pingbak2f387e82009-01-26 03:31:40 +00002729 case ISD::FP_TO_SINT:
2730 case ISD::FP_TO_UINT:
2731 return LowerFP_TO_INT(Op, DAG, *this);
2732
2733 case ISD::SINT_TO_FP:
2734 case ISD::UINT_TO_FP:
2735 return LowerINT_TO_FP(Op, DAG, *this);
Scott Michel8c67fa42009-01-21 04:58:48 +00002736
Scott Michel8efdca42007-12-04 22:23:35 +00002737 // Vector-related lowering.
2738 case ISD::BUILD_VECTOR:
pingbak2f387e82009-01-26 03:31:40 +00002739 return LowerBUILD_VECTOR(Op, DAG);
Scott Michel8efdca42007-12-04 22:23:35 +00002740 case ISD::SCALAR_TO_VECTOR:
2741 return LowerSCALAR_TO_VECTOR(Op, DAG);
2742 case ISD::VECTOR_SHUFFLE:
2743 return LowerVECTOR_SHUFFLE(Op, DAG);
2744 case ISD::EXTRACT_VECTOR_ELT:
2745 return LowerEXTRACT_VECTOR_ELT(Op, DAG);
2746 case ISD::INSERT_VECTOR_ELT:
2747 return LowerINSERT_VECTOR_ELT(Op, DAG);
2748
2749 // Look for ANDBI, ORBI and XORBI opportunities and lower appropriately:
2750 case ISD::AND:
2751 case ISD::OR:
2752 case ISD::XOR:
2753 return LowerByteImmed(Op, DAG);
2754
2755 // Vector and i8 multiply:
2756 case ISD::MUL:
Scott Michel4d07fb72008-12-30 23:28:25 +00002757 if (VT == MVT::i8)
Scott Michel06eabde2008-12-27 04:51:36 +00002758 return LowerI8Math(Op, DAG, Opc, *this);
Scott Michel8efdca42007-12-04 22:23:35 +00002759
Scott Michel8efdca42007-12-04 22:23:35 +00002760 case ISD::CTPOP:
2761 return LowerCTPOP(Op, DAG);
Scott Michel56a125e2008-11-22 23:50:42 +00002762
2763 case ISD::SELECT_CC:
Scott Michel06eabde2008-12-27 04:51:36 +00002764 return LowerSELECT_CC(Op, DAG, *this);
Scott Michelec8c82e2008-12-02 19:53:53 +00002765
Scott Michel8c67fa42009-01-21 04:58:48 +00002766 case ISD::SETCC:
2767 return LowerSETCC(Op, DAG, *this);
2768
Scott Michelec8c82e2008-12-02 19:53:53 +00002769 case ISD::TRUNCATE:
2770 return LowerTRUNCATE(Op, DAG);
Scott Michel8efdca42007-12-04 22:23:35 +00002771 }
2772
Dan Gohman8181bd12008-07-27 21:46:04 +00002773 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00002774}
2775
Duncan Sands7d9834b2008-12-01 11:39:25 +00002776void SPUTargetLowering::ReplaceNodeResults(SDNode *N,
2777 SmallVectorImpl<SDValue>&Results,
2778 SelectionDAG &DAG)
Scott Michel6e2d68b2008-11-10 23:43:06 +00002779{
2780#if 0
2781 unsigned Opc = (unsigned) N->getOpcode();
2782 MVT OpVT = N->getValueType(0);
2783
2784 switch (Opc) {
2785 default: {
2786 cerr << "SPUTargetLowering::ReplaceNodeResults(): need to fix this!\n";
2787 cerr << "Op.getOpcode() = " << Opc << "\n";
2788 cerr << "*Op.getNode():\n";
2789 N->dump();
2790 abort();
2791 /*NOTREACHED*/
2792 }
2793 }
2794#endif
2795
2796 /* Otherwise, return unchanged */
Scott Michel6e2d68b2008-11-10 23:43:06 +00002797}
2798
Scott Michel8efdca42007-12-04 22:23:35 +00002799//===----------------------------------------------------------------------===//
Scott Michel8efdca42007-12-04 22:23:35 +00002800// Target Optimization Hooks
2801//===----------------------------------------------------------------------===//
2802
Dan Gohman8181bd12008-07-27 21:46:04 +00002803SDValue
Scott Michel8efdca42007-12-04 22:23:35 +00002804SPUTargetLowering::PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const
2805{
2806#if 0
2807 TargetMachine &TM = getTargetMachine();
Scott Michelf9f42e62008-01-29 02:16:57 +00002808#endif
2809 const SPUSubtarget *ST = SPUTM.getSubtargetImpl();
Scott Michel8efdca42007-12-04 22:23:35 +00002810 SelectionDAG &DAG = DCI.DAG;
Scott Michel0718cd82008-12-01 17:56:02 +00002811 SDValue Op0 = N->getOperand(0); // everything has at least one operand
2812 MVT NodeVT = N->getValueType(0); // The node's value type
Scott Michel06eabde2008-12-27 04:51:36 +00002813 MVT Op0VT = Op0.getValueType(); // The first operand's result
Scott Michel0718cd82008-12-01 17:56:02 +00002814 SDValue Result; // Initially, empty result
Scott Michel8efdca42007-12-04 22:23:35 +00002815
2816 switch (N->getOpcode()) {
2817 default: break;
Scott Michelf9f42e62008-01-29 02:16:57 +00002818 case ISD::ADD: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002819 SDValue Op1 = N->getOperand(1);
Scott Michelf9f42e62008-01-29 02:16:57 +00002820
Scott Michel06eabde2008-12-27 04:51:36 +00002821 if (Op0.getOpcode() == SPUISD::IndirectAddr
2822 || Op1.getOpcode() == SPUISD::IndirectAddr) {
2823 // Normalize the operands to reduce repeated code
2824 SDValue IndirectArg = Op0, AddArg = Op1;
Scott Michelae5cbf52008-12-29 03:23:36 +00002825
Scott Michel06eabde2008-12-27 04:51:36 +00002826 if (Op1.getOpcode() == SPUISD::IndirectAddr) {
2827 IndirectArg = Op1;
2828 AddArg = Op0;
2829 }
2830
2831 if (isa<ConstantSDNode>(AddArg)) {
2832 ConstantSDNode *CN0 = cast<ConstantSDNode > (AddArg);
2833 SDValue IndOp1 = IndirectArg.getOperand(1);
2834
2835 if (CN0->isNullValue()) {
2836 // (add (SPUindirect <arg>, <arg>), 0) ->
2837 // (SPUindirect <arg>, <arg>)
Scott Michelf9f42e62008-01-29 02:16:57 +00002838
Scott Michel8c2746e2008-12-04 17:16:59 +00002839#if !defined(NDEBUG)
Scott Michel06eabde2008-12-27 04:51:36 +00002840 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
Scott Michel6ccefab2008-12-04 03:02:42 +00002841 cerr << "\n"
Scott Michel06eabde2008-12-27 04:51:36 +00002842 << "Replace: (add (SPUindirect <arg>, <arg>), 0)\n"
2843 << "With: (SPUindirect <arg>, <arg>)\n";
2844 }
Scott Michel6ccefab2008-12-04 03:02:42 +00002845#endif
2846
Scott Michel06eabde2008-12-27 04:51:36 +00002847 return IndirectArg;
2848 } else if (isa<ConstantSDNode>(IndOp1)) {
2849 // (add (SPUindirect <arg>, <const>), <const>) ->
2850 // (SPUindirect <arg>, <const + const>)
2851 ConstantSDNode *CN1 = cast<ConstantSDNode > (IndOp1);
2852 int64_t combinedConst = CN0->getSExtValue() + CN1->getSExtValue();
2853 SDValue combinedValue = DAG.getConstant(combinedConst, Op0VT);
Scott Michelf9f42e62008-01-29 02:16:57 +00002854
Scott Michel06eabde2008-12-27 04:51:36 +00002855#if !defined(NDEBUG)
2856 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
2857 cerr << "\n"
2858 << "Replace: (add (SPUindirect <arg>, " << CN1->getSExtValue()
2859 << "), " << CN0->getSExtValue() << ")\n"
2860 << "With: (SPUindirect <arg>, "
2861 << combinedConst << ")\n";
2862 }
2863#endif
Scott Michelf9f42e62008-01-29 02:16:57 +00002864
Scott Michel06eabde2008-12-27 04:51:36 +00002865 return DAG.getNode(SPUISD::IndirectAddr, Op0VT,
2866 IndirectArg, combinedValue);
2867 }
Scott Michelf9f42e62008-01-29 02:16:57 +00002868 }
2869 }
Scott Michel97872d32008-02-23 18:41:37 +00002870 break;
2871 }
2872 case ISD::SIGN_EXTEND:
2873 case ISD::ZERO_EXTEND:
2874 case ISD::ANY_EXTEND: {
Scott Michel0718cd82008-12-01 17:56:02 +00002875 if (Op0.getOpcode() == SPUISD::VEC2PREFSLOT && NodeVT == Op0VT) {
Scott Michel97872d32008-02-23 18:41:37 +00002876 // (any_extend (SPUextract_elt0 <arg>)) ->
2877 // (SPUextract_elt0 <arg>)
2878 // Types must match, however...
Scott Michel8c2746e2008-12-04 17:16:59 +00002879#if !defined(NDEBUG)
2880 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
Scott Michel6ccefab2008-12-04 03:02:42 +00002881 cerr << "\nReplace: ";
2882 N->dump(&DAG);
2883 cerr << "\nWith: ";
2884 Op0.getNode()->dump(&DAG);
2885 cerr << "\n";
Scott Michel8c2746e2008-12-04 17:16:59 +00002886 }
Scott Michel6ccefab2008-12-04 03:02:42 +00002887#endif
Scott Michel97872d32008-02-23 18:41:37 +00002888
2889 return Op0;
2890 }
2891 break;
2892 }
2893 case SPUISD::IndirectAddr: {
2894 if (!ST->usingLargeMem() && Op0.getOpcode() == SPUISD::AFormAddr) {
Scott Michel8c67fa42009-01-21 04:58:48 +00002895 ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N->getOperand(1));
2896 if (CN != 0 && CN->getZExtValue() == 0) {
Scott Michel97872d32008-02-23 18:41:37 +00002897 // (SPUindirect (SPUaform <addr>, 0), 0) ->
2898 // (SPUaform <addr>, 0)
2899
2900 DEBUG(cerr << "Replace: ");
2901 DEBUG(N->dump(&DAG));
2902 DEBUG(cerr << "\nWith: ");
Gabor Greif1c80d112008-08-28 21:40:38 +00002903 DEBUG(Op0.getNode()->dump(&DAG));
Scott Michel97872d32008-02-23 18:41:37 +00002904 DEBUG(cerr << "\n");
2905
2906 return Op0;
2907 }
Scott Michel06eabde2008-12-27 04:51:36 +00002908 } else if (Op0.getOpcode() == ISD::ADD) {
2909 SDValue Op1 = N->getOperand(1);
2910 if (ConstantSDNode *CN1 = dyn_cast<ConstantSDNode>(Op1)) {
2911 // (SPUindirect (add <arg>, <arg>), 0) ->
2912 // (SPUindirect <arg>, <arg>)
2913 if (CN1->isNullValue()) {
2914
2915#if !defined(NDEBUG)
2916 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
2917 cerr << "\n"
2918 << "Replace: (SPUindirect (add <arg>, <arg>), 0)\n"
2919 << "With: (SPUindirect <arg>, <arg>)\n";
2920 }
2921#endif
2922
2923 return DAG.getNode(SPUISD::IndirectAddr, Op0VT,
2924 Op0.getOperand(0), Op0.getOperand(1));
2925 }
2926 }
Scott Michel97872d32008-02-23 18:41:37 +00002927 }
2928 break;
2929 }
2930 case SPUISD::SHLQUAD_L_BITS:
2931 case SPUISD::SHLQUAD_L_BYTES:
2932 case SPUISD::VEC_SHL:
2933 case SPUISD::VEC_SRL:
2934 case SPUISD::VEC_SRA:
Scott Michel06eabde2008-12-27 04:51:36 +00002935 case SPUISD::ROTBYTES_LEFT: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002936 SDValue Op1 = N->getOperand(1);
Scott Michel97872d32008-02-23 18:41:37 +00002937
Scott Michel06eabde2008-12-27 04:51:36 +00002938 // Kill degenerate vector shifts:
2939 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(Op1)) {
2940 if (CN->isNullValue()) {
Scott Michel97872d32008-02-23 18:41:37 +00002941 Result = Op0;
2942 }
2943 }
2944 break;
2945 }
Scott Michel06eabde2008-12-27 04:51:36 +00002946 case SPUISD::PREFSLOT2VEC: {
Scott Michel97872d32008-02-23 18:41:37 +00002947 switch (Op0.getOpcode()) {
2948 default:
2949 break;
2950 case ISD::ANY_EXTEND:
2951 case ISD::ZERO_EXTEND:
2952 case ISD::SIGN_EXTEND: {
Scott Michelae5cbf52008-12-29 03:23:36 +00002953 // (SPUprefslot2vec (any|zero|sign_extend (SPUvec2prefslot <arg>))) ->
Scott Michel97872d32008-02-23 18:41:37 +00002954 // <arg>
Scott Michelae5cbf52008-12-29 03:23:36 +00002955 // but only if the SPUprefslot2vec and <arg> types match.
Dan Gohman8181bd12008-07-27 21:46:04 +00002956 SDValue Op00 = Op0.getOperand(0);
Scott Michelc630c412008-11-24 17:11:17 +00002957 if (Op00.getOpcode() == SPUISD::VEC2PREFSLOT) {
Dan Gohman8181bd12008-07-27 21:46:04 +00002958 SDValue Op000 = Op00.getOperand(0);
Scott Michel0718cd82008-12-01 17:56:02 +00002959 if (Op000.getValueType() == NodeVT) {
Scott Michel97872d32008-02-23 18:41:37 +00002960 Result = Op000;
2961 }
2962 }
2963 break;
2964 }
Scott Michelc630c412008-11-24 17:11:17 +00002965 case SPUISD::VEC2PREFSLOT: {
Scott Michelae5cbf52008-12-29 03:23:36 +00002966 // (SPUprefslot2vec (SPUvec2prefslot <arg>)) ->
Scott Michel97872d32008-02-23 18:41:37 +00002967 // <arg>
2968 Result = Op0.getOperand(0);
2969 break;
Scott Michel4ec722e2008-07-16 17:17:29 +00002970 }
Scott Michel97872d32008-02-23 18:41:37 +00002971 }
2972 break;
Scott Michelf9f42e62008-01-29 02:16:57 +00002973 }
2974 }
Scott Michel8c67fa42009-01-21 04:58:48 +00002975
Scott Michel394e26d2008-01-17 20:38:41 +00002976 // Otherwise, return unchanged.
Scott Michel0718cd82008-12-01 17:56:02 +00002977#ifndef NDEBUG
Gabor Greif1c80d112008-08-28 21:40:38 +00002978 if (Result.getNode()) {
Scott Michel97872d32008-02-23 18:41:37 +00002979 DEBUG(cerr << "\nReplace.SPU: ");
2980 DEBUG(N->dump(&DAG));
2981 DEBUG(cerr << "\nWith: ");
Gabor Greif1c80d112008-08-28 21:40:38 +00002982 DEBUG(Result.getNode()->dump(&DAG));
Scott Michel97872d32008-02-23 18:41:37 +00002983 DEBUG(cerr << "\n");
2984 }
2985#endif
2986
2987 return Result;
Scott Michel8efdca42007-12-04 22:23:35 +00002988}
2989
2990//===----------------------------------------------------------------------===//
2991// Inline Assembly Support
2992//===----------------------------------------------------------------------===//
2993
2994/// getConstraintType - Given a constraint letter, return the type of
2995/// constraint it is for this target.
Scott Michel4ec722e2008-07-16 17:17:29 +00002996SPUTargetLowering::ConstraintType
Scott Michel8efdca42007-12-04 22:23:35 +00002997SPUTargetLowering::getConstraintType(const std::string &ConstraintLetter) const {
2998 if (ConstraintLetter.size() == 1) {
2999 switch (ConstraintLetter[0]) {
3000 default: break;
3001 case 'b':
3002 case 'r':
3003 case 'f':
3004 case 'v':
3005 case 'y':
3006 return C_RegisterClass;
Scott Michel4ec722e2008-07-16 17:17:29 +00003007 }
Scott Michel8efdca42007-12-04 22:23:35 +00003008 }
3009 return TargetLowering::getConstraintType(ConstraintLetter);
3010}
3011
Scott Michel4ec722e2008-07-16 17:17:29 +00003012std::pair<unsigned, const TargetRegisterClass*>
Scott Michel8efdca42007-12-04 22:23:35 +00003013SPUTargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
Duncan Sands92c43912008-06-06 12:08:01 +00003014 MVT VT) const
Scott Michel8efdca42007-12-04 22:23:35 +00003015{
3016 if (Constraint.size() == 1) {
3017 // GCC RS6000 Constraint Letters
3018 switch (Constraint[0]) {
3019 case 'b': // R1-R31
3020 case 'r': // R0-R31
3021 if (VT == MVT::i64)
3022 return std::make_pair(0U, SPU::R64CRegisterClass);
3023 return std::make_pair(0U, SPU::R32CRegisterClass);
3024 case 'f':
3025 if (VT == MVT::f32)
3026 return std::make_pair(0U, SPU::R32FPRegisterClass);
3027 else if (VT == MVT::f64)
3028 return std::make_pair(0U, SPU::R64FPRegisterClass);
3029 break;
Scott Michel4ec722e2008-07-16 17:17:29 +00003030 case 'v':
Scott Michel8efdca42007-12-04 22:23:35 +00003031 return std::make_pair(0U, SPU::GPRCRegisterClass);
3032 }
3033 }
Scott Michel4ec722e2008-07-16 17:17:29 +00003034
Scott Michel8efdca42007-12-04 22:23:35 +00003035 return TargetLowering::getRegForInlineAsmConstraint(Constraint, VT);
3036}
3037
Scott Michel97872d32008-02-23 18:41:37 +00003038//! Compute used/known bits for a SPU operand
Scott Michel8efdca42007-12-04 22:23:35 +00003039void
Dan Gohman8181bd12008-07-27 21:46:04 +00003040SPUTargetLowering::computeMaskedBitsForTargetNode(const SDValue Op,
Dan Gohmand0dfc772008-02-13 22:28:48 +00003041 const APInt &Mask,
Scott Michel4ec722e2008-07-16 17:17:29 +00003042 APInt &KnownZero,
Dan Gohman229fa052008-02-13 00:35:47 +00003043 APInt &KnownOne,
Scott Michel5a6f17b2008-01-30 02:55:46 +00003044 const SelectionDAG &DAG,
3045 unsigned Depth ) const {
Scott Michelbc5fbc12008-04-30 00:30:08 +00003046#if 0
Scott Michel97872d32008-02-23 18:41:37 +00003047 const uint64_t uint64_sizebits = sizeof(uint64_t) * 8;
3048
3049 switch (Op.getOpcode()) {
3050 default:
3051 // KnownZero = KnownOne = APInt(Mask.getBitWidth(), 0);
3052 break;
Scott Michel97872d32008-02-23 18:41:37 +00003053 case CALL:
3054 case SHUFB:
Scott Michel56a125e2008-11-22 23:50:42 +00003055 case SHUFFLE_MASK:
Scott Michel97872d32008-02-23 18:41:37 +00003056 case CNTB:
Scott Michel8c67fa42009-01-21 04:58:48 +00003057 case SPUISD::PREFSLOT2VEC:
Scott Michel97872d32008-02-23 18:41:37 +00003058 case SPUISD::LDRESULT:
Scott Michel8c67fa42009-01-21 04:58:48 +00003059 case SPUISD::VEC2PREFSLOT:
Scott Michelbc5fbc12008-04-30 00:30:08 +00003060 case SPUISD::SHLQUAD_L_BITS:
3061 case SPUISD::SHLQUAD_L_BYTES:
3062 case SPUISD::VEC_SHL:
3063 case SPUISD::VEC_SRL:
3064 case SPUISD::VEC_SRA:
3065 case SPUISD::VEC_ROTL:
3066 case SPUISD::VEC_ROTR:
Scott Michelbc5fbc12008-04-30 00:30:08 +00003067 case SPUISD::ROTBYTES_LEFT:
Scott Michel67224b22008-06-02 22:18:03 +00003068 case SPUISD::SELECT_MASK:
3069 case SPUISD::SELB:
Scott Michel97872d32008-02-23 18:41:37 +00003070 }
Scott Michel8c67fa42009-01-21 04:58:48 +00003071#endif
Scott Michel8efdca42007-12-04 22:23:35 +00003072}
Scott Michel4d07fb72008-12-30 23:28:25 +00003073
Scott Michel06eabde2008-12-27 04:51:36 +00003074unsigned
3075SPUTargetLowering::ComputeNumSignBitsForTargetNode(SDValue Op,
3076 unsigned Depth) const {
3077 switch (Op.getOpcode()) {
3078 default:
3079 return 1;
Scott Michel8efdca42007-12-04 22:23:35 +00003080
Scott Michel06eabde2008-12-27 04:51:36 +00003081 case ISD::SETCC: {
3082 MVT VT = Op.getValueType();
3083
3084 if (VT != MVT::i8 && VT != MVT::i16 && VT != MVT::i32) {
3085 VT = MVT::i32;
3086 }
3087 return VT.getSizeInBits();
3088 }
3089 }
3090}
Scott Michelae5cbf52008-12-29 03:23:36 +00003091
Scott Michelbc5fbc12008-04-30 00:30:08 +00003092// LowerAsmOperandForConstraint
3093void
Dan Gohman8181bd12008-07-27 21:46:04 +00003094SPUTargetLowering::LowerAsmOperandForConstraint(SDValue Op,
Scott Michelbc5fbc12008-04-30 00:30:08 +00003095 char ConstraintLetter,
Evan Cheng7f250d62008-09-24 00:05:32 +00003096 bool hasMemory,
Dan Gohman8181bd12008-07-27 21:46:04 +00003097 std::vector<SDValue> &Ops,
Scott Michelbc5fbc12008-04-30 00:30:08 +00003098 SelectionDAG &DAG) const {
3099 // Default, for the time being, to the base class handler
Evan Cheng7f250d62008-09-24 00:05:32 +00003100 TargetLowering::LowerAsmOperandForConstraint(Op, ConstraintLetter, hasMemory,
3101 Ops, DAG);
Scott Michelbc5fbc12008-04-30 00:30:08 +00003102}
3103
Scott Michel8efdca42007-12-04 22:23:35 +00003104/// isLegalAddressImmediate - Return true if the integer value can be used
3105/// as the offset of the target addressing mode.
Gabor Greife9f7f582008-08-31 15:37:04 +00003106bool SPUTargetLowering::isLegalAddressImmediate(int64_t V,
3107 const Type *Ty) const {
Scott Michel8efdca42007-12-04 22:23:35 +00003108 // SPU's addresses are 256K:
3109 return (V > -(1 << 18) && V < (1 << 18) - 1);
3110}
3111
3112bool SPUTargetLowering::isLegalAddressImmediate(llvm::GlobalValue* GV) const {
Scott Michel4ec722e2008-07-16 17:17:29 +00003113 return false;
Scott Michel8efdca42007-12-04 22:23:35 +00003114}
Dan Gohman36322c72008-10-18 02:06:02 +00003115
3116bool
3117SPUTargetLowering::isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const {
3118 // The SPU target isn't yet aware of offsets.
3119 return false;
3120}