blob: 9b65de16a6295970c181d5694e89f118bb2eb8c0 [file] [log] [blame]
Scott Michel8efdca42007-12-04 22:23:35 +00001//===-- SPUISelLowering.cpp - Cell SPU DAG Lowering Implementation --------===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner081ce942007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Scott Michel8efdca42007-12-04 22:23:35 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This file implements the SPUTargetLowering class.
11//
12//===----------------------------------------------------------------------===//
13
14#include "SPURegisterNames.h"
15#include "SPUISelLowering.h"
16#include "SPUTargetMachine.h"
Scott Michelbc5fbc12008-04-30 00:30:08 +000017#include "SPUFrameInfo.h"
Scott Michel06eabde2008-12-27 04:51:36 +000018#include "llvm/ADT/APInt.h"
Scott Michel8efdca42007-12-04 22:23:35 +000019#include "llvm/ADT/VectorExtras.h"
pingbak2f387e82009-01-26 03:31:40 +000020#include "llvm/CallingConv.h"
Scott Michel8efdca42007-12-04 22:23:35 +000021#include "llvm/CodeGen/CallingConvLower.h"
22#include "llvm/CodeGen/MachineFrameInfo.h"
23#include "llvm/CodeGen/MachineFunction.h"
24#include "llvm/CodeGen/MachineInstrBuilder.h"
Chris Lattner1b989192007-12-31 04:13:23 +000025#include "llvm/CodeGen/MachineRegisterInfo.h"
Scott Michel8efdca42007-12-04 22:23:35 +000026#include "llvm/CodeGen/SelectionDAG.h"
Scott Michel8efdca42007-12-04 22:23:35 +000027#include "llvm/Constants.h"
28#include "llvm/Function.h"
29#include "llvm/Intrinsics.h"
30#include "llvm/Support/Debug.h"
31#include "llvm/Support/MathExtras.h"
32#include "llvm/Target/TargetOptions.h"
33
34#include <map>
35
36using namespace llvm;
37
38// Used in getTargetNodeName() below
39namespace {
40 std::map<unsigned, const char *> node_names;
41
Duncan Sands92c43912008-06-06 12:08:01 +000042 //! MVT mapping to useful data for Cell SPU
Scott Michel8efdca42007-12-04 22:23:35 +000043 struct valtype_map_s {
Scott Michel56a125e2008-11-22 23:50:42 +000044 const MVT valtype;
45 const int prefslot_byte;
Scott Michel8efdca42007-12-04 22:23:35 +000046 };
Scott Michel4ec722e2008-07-16 17:17:29 +000047
Scott Michel8efdca42007-12-04 22:23:35 +000048 const valtype_map_s valtype_map[] = {
49 { MVT::i1, 3 },
50 { MVT::i8, 3 },
51 { MVT::i16, 2 },
52 { MVT::i32, 0 },
53 { MVT::f32, 0 },
54 { MVT::i64, 0 },
55 { MVT::f64, 0 },
56 { MVT::i128, 0 }
57 };
58
59 const size_t n_valtype_map = sizeof(valtype_map) / sizeof(valtype_map[0]);
60
Duncan Sands92c43912008-06-06 12:08:01 +000061 const valtype_map_s *getValueTypeMapEntry(MVT VT) {
Scott Michel8efdca42007-12-04 22:23:35 +000062 const valtype_map_s *retval = 0;
63
64 for (size_t i = 0; i < n_valtype_map; ++i) {
65 if (valtype_map[i].valtype == VT) {
Scott Michel5a6f17b2008-01-30 02:55:46 +000066 retval = valtype_map + i;
67 break;
Scott Michel8efdca42007-12-04 22:23:35 +000068 }
69 }
70
71#ifndef NDEBUG
72 if (retval == 0) {
73 cerr << "getValueTypeMapEntry returns NULL for "
Duncan Sands92c43912008-06-06 12:08:01 +000074 << VT.getMVTString()
Scott Michel5a6f17b2008-01-30 02:55:46 +000075 << "\n";
Scott Michel8efdca42007-12-04 22:23:35 +000076 abort();
77 }
78#endif
79
80 return retval;
81 }
Scott Michel750b93f2009-01-15 04:41:47 +000082
pingbak2f387e82009-01-26 03:31:40 +000083 //! Expand a library call into an actual call DAG node
84 /*!
85 \note
86 This code is taken from SelectionDAGLegalize, since it is not exposed as
87 part of the LLVM SelectionDAG API.
88 */
89
90 SDValue
91 ExpandLibCall(RTLIB::Libcall LC, SDValue Op, SelectionDAG &DAG,
92 bool isSigned, SDValue &Hi, SPUTargetLowering &TLI) {
93 // The input chain to this libcall is the entry node of the function.
94 // Legalizing the call will automatically add the previous call to the
95 // dependence.
96 SDValue InChain = DAG.getEntryNode();
97
98 TargetLowering::ArgListTy Args;
99 TargetLowering::ArgListEntry Entry;
100 for (unsigned i = 0, e = Op.getNumOperands(); i != e; ++i) {
101 MVT ArgVT = Op.getOperand(i).getValueType();
102 const Type *ArgTy = ArgVT.getTypeForMVT();
103 Entry.Node = Op.getOperand(i);
104 Entry.Ty = ArgTy;
105 Entry.isSExt = isSigned;
106 Entry.isZExt = !isSigned;
107 Args.push_back(Entry);
108 }
109 SDValue Callee = DAG.getExternalSymbol(TLI.getLibcallName(LC),
110 TLI.getPointerTy());
111
112 // Splice the libcall in wherever FindInputOutputChains tells us to.
113 const Type *RetTy = Op.getNode()->getValueType(0).getTypeForMVT();
114 std::pair<SDValue, SDValue> CallInfo =
115 TLI.LowerCallTo(InChain, RetTy, isSigned, !isSigned, false, false,
Dale Johannesenca6237b2009-01-30 23:10:59 +0000116 CallingConv::C, false, Callee, Args, DAG,
Dale Johannesen2dbdb0e2009-02-07 19:59:05 +0000117 Op.getDebugLoc());
pingbak2f387e82009-01-26 03:31:40 +0000118
119 return CallInfo.first;
120 }
Scott Michel8efdca42007-12-04 22:23:35 +0000121}
122
123SPUTargetLowering::SPUTargetLowering(SPUTargetMachine &TM)
124 : TargetLowering(TM),
125 SPUTM(TM)
126{
127 // Fold away setcc operations if possible.
128 setPow2DivIsCheap();
129
130 // Use _setjmp/_longjmp instead of setjmp/longjmp.
131 setUseUnderscoreSetJmp(true);
132 setUseUnderscoreLongJmp(true);
Scott Michel4ec722e2008-07-16 17:17:29 +0000133
Scott Michel8c67fa42009-01-21 04:58:48 +0000134 // Set RTLIB libcall names as used by SPU:
135 setLibcallName(RTLIB::DIV_F64, "__fast_divdf3");
136
Scott Michel8efdca42007-12-04 22:23:35 +0000137 // Set up the SPU's register classes:
Scott Michel438be252007-12-17 22:32:34 +0000138 addRegisterClass(MVT::i8, SPU::R8CRegisterClass);
139 addRegisterClass(MVT::i16, SPU::R16CRegisterClass);
140 addRegisterClass(MVT::i32, SPU::R32CRegisterClass);
141 addRegisterClass(MVT::i64, SPU::R64CRegisterClass);
142 addRegisterClass(MVT::f32, SPU::R32FPRegisterClass);
143 addRegisterClass(MVT::f64, SPU::R64FPRegisterClass);
Scott Michel8efdca42007-12-04 22:23:35 +0000144 addRegisterClass(MVT::i128, SPU::GPRCRegisterClass);
Scott Michel4ec722e2008-07-16 17:17:29 +0000145
Scott Michel8efdca42007-12-04 22:23:35 +0000146 // SPU has no sign or zero extended loads for i1, i8, i16:
Evan Cheng08c171a2008-10-14 21:26:46 +0000147 setLoadExtAction(ISD::EXTLOAD, MVT::i1, Promote);
148 setLoadExtAction(ISD::SEXTLOAD, MVT::i1, Promote);
149 setLoadExtAction(ISD::ZEXTLOAD, MVT::i1, Promote);
Scott Michel8efdca42007-12-04 22:23:35 +0000150
Scott Michel06eabde2008-12-27 04:51:36 +0000151 setLoadExtAction(ISD::EXTLOAD, MVT::f32, Expand);
152 setLoadExtAction(ISD::EXTLOAD, MVT::f64, Expand);
Scott Michelec8c82e2008-12-02 19:53:53 +0000153
Scott Michel8efdca42007-12-04 22:23:35 +0000154 // SPU constant load actions are custom lowered:
Nate Begeman78125042008-02-14 18:43:04 +0000155 setOperationAction(ISD::ConstantFP, MVT::f32, Legal);
Scott Michel8efdca42007-12-04 22:23:35 +0000156 setOperationAction(ISD::ConstantFP, MVT::f64, Custom);
157
158 // SPU's loads and stores have to be custom lowered:
Scott Michel2ef773a2009-01-06 03:36:14 +0000159 for (unsigned sctype = (unsigned) MVT::i8; sctype < (unsigned) MVT::i128;
Scott Michel8efdca42007-12-04 22:23:35 +0000160 ++sctype) {
Duncan Sands92c43912008-06-06 12:08:01 +0000161 MVT VT = (MVT::SimpleValueType)sctype;
162
Scott Michel06eabde2008-12-27 04:51:36 +0000163 setOperationAction(ISD::LOAD, VT, Custom);
164 setOperationAction(ISD::STORE, VT, Custom);
165 setLoadExtAction(ISD::EXTLOAD, VT, Custom);
166 setLoadExtAction(ISD::ZEXTLOAD, VT, Custom);
167 setLoadExtAction(ISD::SEXTLOAD, VT, Custom);
168
169 for (unsigned stype = sctype - 1; stype >= (unsigned) MVT::i8; --stype) {
170 MVT StoreVT = (MVT::SimpleValueType) stype;
171 setTruncStoreAction(VT, StoreVT, Expand);
172 }
Scott Michel8efdca42007-12-04 22:23:35 +0000173 }
174
Scott Michel06eabde2008-12-27 04:51:36 +0000175 for (unsigned sctype = (unsigned) MVT::f32; sctype < (unsigned) MVT::f64;
176 ++sctype) {
177 MVT VT = (MVT::SimpleValueType) sctype;
178
179 setOperationAction(ISD::LOAD, VT, Custom);
180 setOperationAction(ISD::STORE, VT, Custom);
181
182 for (unsigned stype = sctype - 1; stype >= (unsigned) MVT::f32; --stype) {
183 MVT StoreVT = (MVT::SimpleValueType) stype;
184 setTruncStoreAction(VT, StoreVT, Expand);
185 }
186 }
187
Scott Michel8efdca42007-12-04 22:23:35 +0000188 // Expand the jumptable branches
189 setOperationAction(ISD::BR_JT, MVT::Other, Expand);
190 setOperationAction(ISD::BR_CC, MVT::Other, Expand);
Scott Michel56a125e2008-11-22 23:50:42 +0000191
192 // Custom lower SELECT_CC for most cases, but expand by default
Scott Michel4ec722e2008-07-16 17:17:29 +0000193 setOperationAction(ISD::SELECT_CC, MVT::Other, Expand);
Scott Michel56a125e2008-11-22 23:50:42 +0000194 setOperationAction(ISD::SELECT_CC, MVT::i8, Custom);
195 setOperationAction(ISD::SELECT_CC, MVT::i16, Custom);
196 setOperationAction(ISD::SELECT_CC, MVT::i32, Custom);
197 setOperationAction(ISD::SELECT_CC, MVT::i64, Custom);
Scott Michel8efdca42007-12-04 22:23:35 +0000198
199 // SPU has no intrinsics for these particular operations:
Andrew Lenharth0531ec52008-02-16 14:46:26 +0000200 setOperationAction(ISD::MEMBARRIER, MVT::Other, Expand);
201
Scott Michel06eabde2008-12-27 04:51:36 +0000202 // SPU has no SREM/UREM instructions
Scott Michel8efdca42007-12-04 22:23:35 +0000203 setOperationAction(ISD::SREM, MVT::i32, Expand);
204 setOperationAction(ISD::UREM, MVT::i32, Expand);
205 setOperationAction(ISD::SREM, MVT::i64, Expand);
206 setOperationAction(ISD::UREM, MVT::i64, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000207
Scott Michel8efdca42007-12-04 22:23:35 +0000208 // We don't support sin/cos/sqrt/fmod
209 setOperationAction(ISD::FSIN , MVT::f64, Expand);
210 setOperationAction(ISD::FCOS , MVT::f64, Expand);
211 setOperationAction(ISD::FREM , MVT::f64, Expand);
212 setOperationAction(ISD::FSIN , MVT::f32, Expand);
213 setOperationAction(ISD::FCOS , MVT::f32, Expand);
214 setOperationAction(ISD::FREM , MVT::f32, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000215
pingbak2f387e82009-01-26 03:31:40 +0000216 // Expand fsqrt to the appropriate libcall (NOTE: should use h/w fsqrt
217 // for f32!)
Scott Michel8efdca42007-12-04 22:23:35 +0000218 setOperationAction(ISD::FSQRT, MVT::f64, Expand);
219 setOperationAction(ISD::FSQRT, MVT::f32, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000220
Scott Michel8efdca42007-12-04 22:23:35 +0000221 setOperationAction(ISD::FCOPYSIGN, MVT::f64, Expand);
222 setOperationAction(ISD::FCOPYSIGN, MVT::f32, Expand);
223
224 // SPU can do rotate right and left, so legalize it... but customize for i8
225 // because instructions don't exist.
Bill Wendling965299c2008-08-31 02:59:23 +0000226
227 // FIXME: Change from "expand" to appropriate type once ROTR is supported in
228 // .td files.
229 setOperationAction(ISD::ROTR, MVT::i32, Expand /*Legal*/);
230 setOperationAction(ISD::ROTR, MVT::i16, Expand /*Legal*/);
231 setOperationAction(ISD::ROTR, MVT::i8, Expand /*Custom*/);
232
Scott Michel8efdca42007-12-04 22:23:35 +0000233 setOperationAction(ISD::ROTL, MVT::i32, Legal);
234 setOperationAction(ISD::ROTL, MVT::i16, Legal);
235 setOperationAction(ISD::ROTL, MVT::i8, Custom);
Scott Michelabb8ca12008-11-20 16:36:33 +0000236
Scott Michel8efdca42007-12-04 22:23:35 +0000237 // SPU has no native version of shift left/right for i8
238 setOperationAction(ISD::SHL, MVT::i8, Custom);
239 setOperationAction(ISD::SRL, MVT::i8, Custom);
240 setOperationAction(ISD::SRA, MVT::i8, Custom);
Scott Michel33d73eb2008-11-21 02:56:16 +0000241
Scott Michel4d07fb72008-12-30 23:28:25 +0000242 // Make these operations legal and handle them during instruction selection:
243 setOperationAction(ISD::SHL, MVT::i64, Legal);
244 setOperationAction(ISD::SRL, MVT::i64, Legal);
245 setOperationAction(ISD::SRA, MVT::i64, Legal);
Scott Michel8efdca42007-12-04 22:23:35 +0000246
Scott Michel4ec722e2008-07-16 17:17:29 +0000247 // Custom lower i8, i32 and i64 multiplications
248 setOperationAction(ISD::MUL, MVT::i8, Custom);
Scott Michelae5cbf52008-12-29 03:23:36 +0000249 setOperationAction(ISD::MUL, MVT::i32, Legal);
Scott Michel750b93f2009-01-15 04:41:47 +0000250 setOperationAction(ISD::MUL, MVT::i64, Legal);
Scott Michel33d73eb2008-11-21 02:56:16 +0000251
Scott Michel67224b22008-06-02 22:18:03 +0000252 // Need to custom handle (some) common i8, i64 math ops
Scott Michel4d07fb72008-12-30 23:28:25 +0000253 setOperationAction(ISD::ADD, MVT::i8, Custom);
Scott Michel750b93f2009-01-15 04:41:47 +0000254 setOperationAction(ISD::ADD, MVT::i64, Legal);
Scott Michel8efdca42007-12-04 22:23:35 +0000255 setOperationAction(ISD::SUB, MVT::i8, Custom);
Scott Michel750b93f2009-01-15 04:41:47 +0000256 setOperationAction(ISD::SUB, MVT::i64, Legal);
Scott Michel4ec722e2008-07-16 17:17:29 +0000257
Scott Michel8efdca42007-12-04 22:23:35 +0000258 // SPU does not have BSWAP. It does have i32 support CTLZ.
259 // CTPOP has to be custom lowered.
260 setOperationAction(ISD::BSWAP, MVT::i32, Expand);
261 setOperationAction(ISD::BSWAP, MVT::i64, Expand);
262
263 setOperationAction(ISD::CTPOP, MVT::i8, Custom);
264 setOperationAction(ISD::CTPOP, MVT::i16, Custom);
265 setOperationAction(ISD::CTPOP, MVT::i32, Custom);
266 setOperationAction(ISD::CTPOP, MVT::i64, Custom);
267
268 setOperationAction(ISD::CTTZ , MVT::i32, Expand);
269 setOperationAction(ISD::CTTZ , MVT::i64, Expand);
270
271 setOperationAction(ISD::CTLZ , MVT::i32, Legal);
Scott Michel4ec722e2008-07-16 17:17:29 +0000272
Scott Michel67224b22008-06-02 22:18:03 +0000273 // SPU has a version of select that implements (a&~c)|(b&c), just like
Scott Michel978b96f2008-03-10 23:49:09 +0000274 // select ought to work:
Scott Michel53ab7792008-03-10 16:58:52 +0000275 setOperationAction(ISD::SELECT, MVT::i8, Legal);
Scott Michel6baba072008-03-05 23:02:02 +0000276 setOperationAction(ISD::SELECT, MVT::i16, Legal);
277 setOperationAction(ISD::SELECT, MVT::i32, Legal);
Scott Michel06eabde2008-12-27 04:51:36 +0000278 setOperationAction(ISD::SELECT, MVT::i64, Legal);
Scott Michel8efdca42007-12-04 22:23:35 +0000279
Scott Michel53ab7792008-03-10 16:58:52 +0000280 setOperationAction(ISD::SETCC, MVT::i8, Legal);
281 setOperationAction(ISD::SETCC, MVT::i16, Legal);
Scott Michelae5cbf52008-12-29 03:23:36 +0000282 setOperationAction(ISD::SETCC, MVT::i32, Legal);
283 setOperationAction(ISD::SETCC, MVT::i64, Legal);
Scott Michel8c67fa42009-01-21 04:58:48 +0000284 setOperationAction(ISD::SETCC, MVT::f64, Custom);
Scott Michel6baba072008-03-05 23:02:02 +0000285
Scott Michel06eabde2008-12-27 04:51:36 +0000286 // Custom lower i128 -> i64 truncates
Scott Michelec8c82e2008-12-02 19:53:53 +0000287 setOperationAction(ISD::TRUNCATE, MVT::i64, Custom);
288
pingbak2f387e82009-01-26 03:31:40 +0000289 // SPU has a legal FP -> signed INT instruction for f32, but for f64, need
290 // to expand to a libcall, hence the custom lowering:
291 setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom);
292 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Custom);
Scott Michel8efdca42007-12-04 22:23:35 +0000293
294 // FDIV on SPU requires custom lowering
pingbak2f387e82009-01-26 03:31:40 +0000295 setOperationAction(ISD::FDIV, MVT::f64, Expand); // to libcall
Scott Michel8efdca42007-12-04 22:23:35 +0000296
Scott Michelc899a122009-01-26 22:33:37 +0000297 // SPU has [U|S]INT_TO_FP for f32->i32, but not for f64->i32, f64->i64:
pingbak2f387e82009-01-26 03:31:40 +0000298 setOperationAction(ISD::SINT_TO_FP, MVT::i32, Custom);
Scott Michel8efdca42007-12-04 22:23:35 +0000299 setOperationAction(ISD::SINT_TO_FP, MVT::i16, Promote);
pingbak2f387e82009-01-26 03:31:40 +0000300 setOperationAction(ISD::SINT_TO_FP, MVT::i8, Promote);
301 setOperationAction(ISD::UINT_TO_FP, MVT::i32, Custom);
Scott Michel8efdca42007-12-04 22:23:35 +0000302 setOperationAction(ISD::UINT_TO_FP, MVT::i16, Promote);
pingbak2f387e82009-01-26 03:31:40 +0000303 setOperationAction(ISD::UINT_TO_FP, MVT::i8, Promote);
Scott Michel8efdca42007-12-04 22:23:35 +0000304 setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
305 setOperationAction(ISD::UINT_TO_FP, MVT::i64, Custom);
306
Scott Michel754d8662007-12-20 00:44:13 +0000307 setOperationAction(ISD::BIT_CONVERT, MVT::i32, Legal);
308 setOperationAction(ISD::BIT_CONVERT, MVT::f32, Legal);
309 setOperationAction(ISD::BIT_CONVERT, MVT::i64, Legal);
310 setOperationAction(ISD::BIT_CONVERT, MVT::f64, Legal);
Scott Michel8efdca42007-12-04 22:23:35 +0000311
312 // We cannot sextinreg(i1). Expand to shifts.
313 setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000314
Scott Michel8efdca42007-12-04 22:23:35 +0000315 // Support label based line numbers.
Dan Gohman472d12c2008-06-30 20:59:49 +0000316 setOperationAction(ISD::DBG_STOPPOINT, MVT::Other, Expand);
Scott Michel8efdca42007-12-04 22:23:35 +0000317 setOperationAction(ISD::DEBUG_LOC, MVT::Other, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000318
319 // We want to legalize GlobalAddress and ConstantPool nodes into the
Scott Michel8efdca42007-12-04 22:23:35 +0000320 // appropriate instructions to materialize the address.
Scott Michel33d73eb2008-11-21 02:56:16 +0000321 for (unsigned sctype = (unsigned) MVT::i8; sctype < (unsigned) MVT::f128;
Scott Michelf9f42e62008-01-29 02:16:57 +0000322 ++sctype) {
Duncan Sands92c43912008-06-06 12:08:01 +0000323 MVT VT = (MVT::SimpleValueType)sctype;
324
Scott Michelae5cbf52008-12-29 03:23:36 +0000325 setOperationAction(ISD::GlobalAddress, VT, Custom);
326 setOperationAction(ISD::ConstantPool, VT, Custom);
327 setOperationAction(ISD::JumpTable, VT, Custom);
Scott Michelf9f42e62008-01-29 02:16:57 +0000328 }
Scott Michel8efdca42007-12-04 22:23:35 +0000329
330 // RET must be custom lowered, to meet ABI requirements
331 setOperationAction(ISD::RET, MVT::Other, Custom);
Scott Michel4ec722e2008-07-16 17:17:29 +0000332
Scott Michel8efdca42007-12-04 22:23:35 +0000333 // VASTART needs to be custom lowered to use the VarArgsFrameIndex
334 setOperationAction(ISD::VASTART , MVT::Other, Custom);
Scott Michel4ec722e2008-07-16 17:17:29 +0000335
Scott Michel8efdca42007-12-04 22:23:35 +0000336 // Use the default implementation.
337 setOperationAction(ISD::VAARG , MVT::Other, Expand);
338 setOperationAction(ISD::VACOPY , MVT::Other, Expand);
339 setOperationAction(ISD::VAEND , MVT::Other, Expand);
Scott Michel4ec722e2008-07-16 17:17:29 +0000340 setOperationAction(ISD::STACKSAVE , MVT::Other, Expand);
Scott Michel8efdca42007-12-04 22:23:35 +0000341 setOperationAction(ISD::STACKRESTORE , MVT::Other, Expand);
342 setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i32 , Expand);
343 setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i64 , Expand);
344
345 // Cell SPU has instructions for converting between i64 and fp.
346 setOperationAction(ISD::FP_TO_SINT, MVT::i64, Custom);
347 setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
Scott Michel4ec722e2008-07-16 17:17:29 +0000348
Scott Michel8efdca42007-12-04 22:23:35 +0000349 // To take advantage of the above i64 FP_TO_SINT, promote i32 FP_TO_UINT
350 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Promote);
351
352 // BUILD_PAIR can't be handled natively, and should be expanded to shl/or
353 setOperationAction(ISD::BUILD_PAIR, MVT::i64, Expand);
354
355 // First set operation action for all vector types to expand. Then we
356 // will selectively turn on ones that can be effectively codegen'd.
357 addRegisterClass(MVT::v16i8, SPU::VECREGRegisterClass);
358 addRegisterClass(MVT::v8i16, SPU::VECREGRegisterClass);
359 addRegisterClass(MVT::v4i32, SPU::VECREGRegisterClass);
360 addRegisterClass(MVT::v2i64, SPU::VECREGRegisterClass);
361 addRegisterClass(MVT::v4f32, SPU::VECREGRegisterClass);
362 addRegisterClass(MVT::v2f64, SPU::VECREGRegisterClass);
363
Scott Michel70741542009-01-06 23:10:38 +0000364 // "Odd size" vector classes that we're willing to support:
365 addRegisterClass(MVT::v2i32, SPU::VECREGRegisterClass);
366
Duncan Sands92c43912008-06-06 12:08:01 +0000367 for (unsigned i = (unsigned)MVT::FIRST_VECTOR_VALUETYPE;
368 i <= (unsigned)MVT::LAST_VECTOR_VALUETYPE; ++i) {
369 MVT VT = (MVT::SimpleValueType)i;
Scott Michel8efdca42007-12-04 22:23:35 +0000370
Duncan Sands92c43912008-06-06 12:08:01 +0000371 // add/sub are legal for all supported vector VT's.
pingbak2f387e82009-01-26 03:31:40 +0000372 setOperationAction(ISD::ADD, VT, Legal);
373 setOperationAction(ISD::SUB, VT, Legal);
Duncan Sands92c43912008-06-06 12:08:01 +0000374 // mul has to be custom lowered.
pingbak2f387e82009-01-26 03:31:40 +0000375 setOperationAction(ISD::MUL, VT, Legal);
Duncan Sands92c43912008-06-06 12:08:01 +0000376
pingbak2f387e82009-01-26 03:31:40 +0000377 setOperationAction(ISD::AND, VT, Legal);
378 setOperationAction(ISD::OR, VT, Legal);
379 setOperationAction(ISD::XOR, VT, Legal);
380 setOperationAction(ISD::LOAD, VT, Legal);
381 setOperationAction(ISD::SELECT, VT, Legal);
382 setOperationAction(ISD::STORE, VT, Legal);
Scott Michel4ec722e2008-07-16 17:17:29 +0000383
Scott Michel8efdca42007-12-04 22:23:35 +0000384 // These operations need to be expanded:
pingbak2f387e82009-01-26 03:31:40 +0000385 setOperationAction(ISD::SDIV, VT, Expand);
386 setOperationAction(ISD::SREM, VT, Expand);
387 setOperationAction(ISD::UDIV, VT, Expand);
388 setOperationAction(ISD::UREM, VT, Expand);
Scott Michel8efdca42007-12-04 22:23:35 +0000389
390 // Custom lower build_vector, constant pool spills, insert and
391 // extract vector elements:
Duncan Sands92c43912008-06-06 12:08:01 +0000392 setOperationAction(ISD::BUILD_VECTOR, VT, Custom);
393 setOperationAction(ISD::ConstantPool, VT, Custom);
394 setOperationAction(ISD::SCALAR_TO_VECTOR, VT, Custom);
395 setOperationAction(ISD::EXTRACT_VECTOR_ELT, VT, Custom);
396 setOperationAction(ISD::INSERT_VECTOR_ELT, VT, Custom);
397 setOperationAction(ISD::VECTOR_SHUFFLE, VT, Custom);
Scott Michel8efdca42007-12-04 22:23:35 +0000398 }
399
Scott Michel8efdca42007-12-04 22:23:35 +0000400 setOperationAction(ISD::AND, MVT::v16i8, Custom);
401 setOperationAction(ISD::OR, MVT::v16i8, Custom);
402 setOperationAction(ISD::XOR, MVT::v16i8, Custom);
403 setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4f32, Custom);
Scott Micheldbac4cf2008-01-11 02:53:15 +0000404
Scott Michel4d07fb72008-12-30 23:28:25 +0000405 setOperationAction(ISD::FDIV, MVT::v4f32, Legal);
Scott Michelae5cbf52008-12-29 03:23:36 +0000406
Scott Michel8efdca42007-12-04 22:23:35 +0000407 setShiftAmountType(MVT::i32);
Scott Michel06eabde2008-12-27 04:51:36 +0000408 setBooleanContents(ZeroOrNegativeOneBooleanContent);
Scott Michel4ec722e2008-07-16 17:17:29 +0000409
Scott Michel8efdca42007-12-04 22:23:35 +0000410 setStackPointerRegisterToSaveRestore(SPU::R1);
Scott Michel4ec722e2008-07-16 17:17:29 +0000411
Scott Michel8efdca42007-12-04 22:23:35 +0000412 // We have target-specific dag combine patterns for the following nodes:
Scott Michelf9f42e62008-01-29 02:16:57 +0000413 setTargetDAGCombine(ISD::ADD);
Scott Michel97872d32008-02-23 18:41:37 +0000414 setTargetDAGCombine(ISD::ZERO_EXTEND);
415 setTargetDAGCombine(ISD::SIGN_EXTEND);
416 setTargetDAGCombine(ISD::ANY_EXTEND);
Scott Michel4ec722e2008-07-16 17:17:29 +0000417
Scott Michel8efdca42007-12-04 22:23:35 +0000418 computeRegisterProperties();
Scott Michel56a125e2008-11-22 23:50:42 +0000419
Scott Michel2c261072008-12-09 03:37:19 +0000420 // Set pre-RA register scheduler default to BURR, which produces slightly
421 // better code than the default (could also be TDRR, but TargetLowering.h
422 // needs a mod to support that model):
423 setSchedulingPreference(SchedulingForRegPressure);
Scott Michel8efdca42007-12-04 22:23:35 +0000424}
425
426const char *
427SPUTargetLowering::getTargetNodeName(unsigned Opcode) const
428{
429 if (node_names.empty()) {
430 node_names[(unsigned) SPUISD::RET_FLAG] = "SPUISD::RET_FLAG";
431 node_names[(unsigned) SPUISD::Hi] = "SPUISD::Hi";
432 node_names[(unsigned) SPUISD::Lo] = "SPUISD::Lo";
433 node_names[(unsigned) SPUISD::PCRelAddr] = "SPUISD::PCRelAddr";
Scott Micheldbac4cf2008-01-11 02:53:15 +0000434 node_names[(unsigned) SPUISD::AFormAddr] = "SPUISD::AFormAddr";
Scott Michelf9f42e62008-01-29 02:16:57 +0000435 node_names[(unsigned) SPUISD::IndirectAddr] = "SPUISD::IndirectAddr";
Scott Michel8efdca42007-12-04 22:23:35 +0000436 node_names[(unsigned) SPUISD::LDRESULT] = "SPUISD::LDRESULT";
437 node_names[(unsigned) SPUISD::CALL] = "SPUISD::CALL";
438 node_names[(unsigned) SPUISD::SHUFB] = "SPUISD::SHUFB";
Scott Michel56a125e2008-11-22 23:50:42 +0000439 node_names[(unsigned) SPUISD::SHUFFLE_MASK] = "SPUISD::SHUFFLE_MASK";
Scott Michel8efdca42007-12-04 22:23:35 +0000440 node_names[(unsigned) SPUISD::CNTB] = "SPUISD::CNTB";
Scott Michelae5cbf52008-12-29 03:23:36 +0000441 node_names[(unsigned) SPUISD::PREFSLOT2VEC] = "SPUISD::PREFSLOT2VEC";
Scott Michelc630c412008-11-24 17:11:17 +0000442 node_names[(unsigned) SPUISD::VEC2PREFSLOT] = "SPUISD::VEC2PREFSLOT";
Scott Michel97872d32008-02-23 18:41:37 +0000443 node_names[(unsigned) SPUISD::SHLQUAD_L_BITS] = "SPUISD::SHLQUAD_L_BITS";
444 node_names[(unsigned) SPUISD::SHLQUAD_L_BYTES] = "SPUISD::SHLQUAD_L_BYTES";
Scott Michel8efdca42007-12-04 22:23:35 +0000445 node_names[(unsigned) SPUISD::VEC_SHL] = "SPUISD::VEC_SHL";
446 node_names[(unsigned) SPUISD::VEC_SRL] = "SPUISD::VEC_SRL";
447 node_names[(unsigned) SPUISD::VEC_SRA] = "SPUISD::VEC_SRA";
448 node_names[(unsigned) SPUISD::VEC_ROTL] = "SPUISD::VEC_ROTL";
449 node_names[(unsigned) SPUISD::VEC_ROTR] = "SPUISD::VEC_ROTR";
Scott Michel8c67fa42009-01-21 04:58:48 +0000450 node_names[(unsigned) SPUISD::ROTBYTES_LEFT] = "SPUISD::ROTBYTES_LEFT";
451 node_names[(unsigned) SPUISD::ROTBYTES_LEFT_BITS] =
452 "SPUISD::ROTBYTES_LEFT_BITS";
Scott Michel67224b22008-06-02 22:18:03 +0000453 node_names[(unsigned) SPUISD::SELECT_MASK] = "SPUISD::SELECT_MASK";
Scott Michel8efdca42007-12-04 22:23:35 +0000454 node_names[(unsigned) SPUISD::SELB] = "SPUISD::SELB";
Scott Michel750b93f2009-01-15 04:41:47 +0000455 node_names[(unsigned) SPUISD::ADD64_MARKER] = "SPUISD::ADD64_MARKER";
456 node_names[(unsigned) SPUISD::SUB64_MARKER] = "SPUISD::SUB64_MARKER";
457 node_names[(unsigned) SPUISD::MUL64_MARKER] = "SPUISD::MUL64_MARKER";
Scott Michel8efdca42007-12-04 22:23:35 +0000458 }
459
460 std::map<unsigned, const char *>::iterator i = node_names.find(Opcode);
461
462 return ((i != node_names.end()) ? i->second : 0);
463}
464
Scott Michel06eabde2008-12-27 04:51:36 +0000465//===----------------------------------------------------------------------===//
466// Return the Cell SPU's SETCC result type
467//===----------------------------------------------------------------------===//
468
Duncan Sands4a361272009-01-01 15:52:00 +0000469MVT SPUTargetLowering::getSetCCResultType(MVT VT) const {
Scott Michel06eabde2008-12-27 04:51:36 +0000470 // i16 and i32 are valid SETCC result types
471 return ((VT == MVT::i8 || VT == MVT::i16 || VT == MVT::i32) ? VT : MVT::i32);
Scott Michel53ab7792008-03-10 16:58:52 +0000472}
473
Scott Michel8efdca42007-12-04 22:23:35 +0000474//===----------------------------------------------------------------------===//
475// Calling convention code:
476//===----------------------------------------------------------------------===//
477
478#include "SPUGenCallingConv.inc"
479
480//===----------------------------------------------------------------------===//
481// LowerOperation implementation
482//===----------------------------------------------------------------------===//
483
484/// Custom lower loads for CellSPU
485/*!
486 All CellSPU loads and stores are aligned to 16-byte boundaries, so for elements
487 within a 16-byte block, we have to rotate to extract the requested element.
Scott Michel6ccefab2008-12-04 03:02:42 +0000488
489 For extending loads, we also want to ensure that the following sequence is
490 emitted, e.g. for MVT::f32 extending load to MVT::f64:
491
492\verbatim
Scott Michelae5cbf52008-12-29 03:23:36 +0000493%1 v16i8,ch = load
Scott Michel6ccefab2008-12-04 03:02:42 +0000494%2 v16i8,ch = rotate %1
Scott Michelae5cbf52008-12-29 03:23:36 +0000495%3 v4f8, ch = bitconvert %2
Scott Michel6ccefab2008-12-04 03:02:42 +0000496%4 f32 = vec2perfslot %3
497%5 f64 = fp_extend %4
498\endverbatim
499*/
Dan Gohman8181bd12008-07-27 21:46:04 +0000500static SDValue
501LowerLOAD(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Scott Michel8efdca42007-12-04 22:23:35 +0000502 LoadSDNode *LN = cast<LoadSDNode>(Op);
Dan Gohman8181bd12008-07-27 21:46:04 +0000503 SDValue the_chain = LN->getChain();
Scott Michel06eabde2008-12-27 04:51:36 +0000504 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel6ccefab2008-12-04 03:02:42 +0000505 MVT InVT = LN->getMemoryVT();
506 MVT OutVT = Op.getValueType();
Scott Michel8efdca42007-12-04 22:23:35 +0000507 ISD::LoadExtType ExtType = LN->getExtensionType();
508 unsigned alignment = LN->getAlignment();
Scott Michel06eabde2008-12-27 04:51:36 +0000509 const valtype_map_s *vtm = getValueTypeMapEntry(InVT);
Dale Johannesenea996922009-02-04 20:06:27 +0000510 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +0000511
Scott Michel8efdca42007-12-04 22:23:35 +0000512 switch (LN->getAddressingMode()) {
513 case ISD::UNINDEXED: {
Scott Michel06eabde2008-12-27 04:51:36 +0000514 SDValue result;
515 SDValue basePtr = LN->getBasePtr();
516 SDValue rotate;
Scott Michel8efdca42007-12-04 22:23:35 +0000517
Scott Michel06eabde2008-12-27 04:51:36 +0000518 if (alignment == 16) {
519 ConstantSDNode *CN;
Scott Micheldbac4cf2008-01-11 02:53:15 +0000520
Scott Michel06eabde2008-12-27 04:51:36 +0000521 // Special cases for a known aligned load to simplify the base pointer
522 // and the rotation amount:
523 if (basePtr.getOpcode() == ISD::ADD
524 && (CN = dyn_cast<ConstantSDNode > (basePtr.getOperand(1))) != 0) {
525 // Known offset into basePtr
526 int64_t offset = CN->getSExtValue();
527 int64_t rotamt = int64_t((offset & 0xf) - vtm->prefslot_byte);
Scott Micheldbac4cf2008-01-11 02:53:15 +0000528
Scott Michel06eabde2008-12-27 04:51:36 +0000529 if (rotamt < 0)
530 rotamt += 16;
531
532 rotate = DAG.getConstant(rotamt, MVT::i16);
533
534 // Simplify the base pointer for this case:
535 basePtr = basePtr.getOperand(0);
536 if ((offset & ~0xf) > 0) {
Dale Johannesen175fdef2009-02-06 21:50:26 +0000537 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000538 basePtr,
539 DAG.getConstant((offset & ~0xf), PtrVT));
540 }
541 } else if ((basePtr.getOpcode() == SPUISD::AFormAddr)
542 || (basePtr.getOpcode() == SPUISD::IndirectAddr
543 && basePtr.getOperand(0).getOpcode() == SPUISD::Hi
544 && basePtr.getOperand(1).getOpcode() == SPUISD::Lo)) {
545 // Plain aligned a-form address: rotate into preferred slot
546 // Same for (SPUindirect (SPUhi ...), (SPUlo ...))
547 int64_t rotamt = -vtm->prefslot_byte;
548 if (rotamt < 0)
549 rotamt += 16;
550 rotate = DAG.getConstant(rotamt, MVT::i16);
Scott Micheldbac4cf2008-01-11 02:53:15 +0000551 } else {
Scott Michel06eabde2008-12-27 04:51:36 +0000552 // Offset the rotate amount by the basePtr and the preferred slot
553 // byte offset
554 int64_t rotamt = -vtm->prefslot_byte;
555 if (rotamt < 0)
556 rotamt += 16;
Dale Johannesenea996922009-02-04 20:06:27 +0000557 rotate = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000558 basePtr,
Scott Michel5a6f17b2008-01-30 02:55:46 +0000559 DAG.getConstant(rotamt, PtrVT));
Scott Micheldbac4cf2008-01-11 02:53:15 +0000560 }
Scott Michel06eabde2008-12-27 04:51:36 +0000561 } else {
562 // Unaligned load: must be more pessimistic about addressing modes:
563 if (basePtr.getOpcode() == ISD::ADD) {
564 MachineFunction &MF = DAG.getMachineFunction();
565 MachineRegisterInfo &RegInfo = MF.getRegInfo();
566 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
567 SDValue Flag;
Scott Micheldbac4cf2008-01-11 02:53:15 +0000568
Scott Michel06eabde2008-12-27 04:51:36 +0000569 SDValue Op0 = basePtr.getOperand(0);
570 SDValue Op1 = basePtr.getOperand(1);
571
572 if (isa<ConstantSDNode>(Op1)) {
573 // Convert the (add <ptr>, <const>) to an indirect address contained
574 // in a register. Note that this is done because we need to avoid
575 // creating a 0(reg) d-form address due to the SPU's block loads.
Dale Johannesen175fdef2009-02-06 21:50:26 +0000576 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1);
Dale Johannesenea996922009-02-04 20:06:27 +0000577 the_chain = DAG.getCopyToReg(the_chain, dl, VReg, basePtr, Flag);
578 basePtr = DAG.getCopyFromReg(the_chain, dl, VReg, PtrVT);
Scott Michel06eabde2008-12-27 04:51:36 +0000579 } else {
580 // Convert the (add <arg1>, <arg2>) to an indirect address, which
581 // will likely be lowered as a reg(reg) x-form address.
Dale Johannesen175fdef2009-02-06 21:50:26 +0000582 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1);
Scott Michel06eabde2008-12-27 04:51:36 +0000583 }
584 } else {
Dale Johannesen175fdef2009-02-06 21:50:26 +0000585 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000586 basePtr,
587 DAG.getConstant(0, PtrVT));
588 }
589
590 // Offset the rotate amount by the basePtr and the preferred slot
591 // byte offset
Dale Johannesenea996922009-02-04 20:06:27 +0000592 rotate = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000593 basePtr,
594 DAG.getConstant(-vtm->prefslot_byte, PtrVT));
Scott Michel8efdca42007-12-04 22:23:35 +0000595 }
Scott Micheldbac4cf2008-01-11 02:53:15 +0000596
Scott Michel06eabde2008-12-27 04:51:36 +0000597 // Re-emit as a v16i8 vector load
Dale Johannesenea996922009-02-04 20:06:27 +0000598 result = DAG.getLoad(MVT::v16i8, dl, the_chain, basePtr,
Scott Michel06eabde2008-12-27 04:51:36 +0000599 LN->getSrcValue(), LN->getSrcValueOffset(),
600 LN->isVolatile(), 16);
601
602 // Update the chain
603 the_chain = result.getValue(1);
604
605 // Rotate into the preferred slot:
Dale Johannesenea996922009-02-04 20:06:27 +0000606 result = DAG.getNode(SPUISD::ROTBYTES_LEFT, dl, MVT::v16i8,
Scott Michel06eabde2008-12-27 04:51:36 +0000607 result.getValue(0), rotate);
608
Scott Michel6ccefab2008-12-04 03:02:42 +0000609 // Convert the loaded v16i8 vector to the appropriate vector type
610 // specified by the operand:
611 MVT vecVT = MVT::getVectorVT(InVT, (128 / InVT.getSizeInBits()));
Dale Johannesenea996922009-02-04 20:06:27 +0000612 result = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, InVT,
613 DAG.getNode(ISD::BIT_CONVERT, dl, vecVT, result));
Scott Michel4ec722e2008-07-16 17:17:29 +0000614
Scott Michel6ccefab2008-12-04 03:02:42 +0000615 // Handle extending loads by extending the scalar result:
616 if (ExtType == ISD::SEXTLOAD) {
Dale Johannesenea996922009-02-04 20:06:27 +0000617 result = DAG.getNode(ISD::SIGN_EXTEND, dl, OutVT, result);
Scott Michel6ccefab2008-12-04 03:02:42 +0000618 } else if (ExtType == ISD::ZEXTLOAD) {
Dale Johannesenea996922009-02-04 20:06:27 +0000619 result = DAG.getNode(ISD::ZERO_EXTEND, dl, OutVT, result);
Scott Michel6ccefab2008-12-04 03:02:42 +0000620 } else if (ExtType == ISD::EXTLOAD) {
621 unsigned NewOpc = ISD::ANY_EXTEND;
Scott Micheldbac4cf2008-01-11 02:53:15 +0000622
Scott Michel6ccefab2008-12-04 03:02:42 +0000623 if (OutVT.isFloatingPoint())
pingbakb8913342009-01-26 03:37:41 +0000624 NewOpc = ISD::FP_EXTEND;
Scott Micheldbac4cf2008-01-11 02:53:15 +0000625
Dale Johannesenea996922009-02-04 20:06:27 +0000626 result = DAG.getNode(NewOpc, dl, OutVT, result);
Scott Micheldbac4cf2008-01-11 02:53:15 +0000627 }
628
Scott Michel6ccefab2008-12-04 03:02:42 +0000629 SDVTList retvts = DAG.getVTList(OutVT, MVT::Other);
Dan Gohman8181bd12008-07-27 21:46:04 +0000630 SDValue retops[2] = {
Scott Michel394e26d2008-01-17 20:38:41 +0000631 result,
Scott Michel5a6f17b2008-01-30 02:55:46 +0000632 the_chain
Scott Michel394e26d2008-01-17 20:38:41 +0000633 };
Scott Micheldbac4cf2008-01-11 02:53:15 +0000634
Dale Johannesenea996922009-02-04 20:06:27 +0000635 result = DAG.getNode(SPUISD::LDRESULT, dl, retvts,
Scott Michel394e26d2008-01-17 20:38:41 +0000636 retops, sizeof(retops) / sizeof(retops[0]));
Scott Micheldbac4cf2008-01-11 02:53:15 +0000637 return result;
Scott Michel8efdca42007-12-04 22:23:35 +0000638 }
639 case ISD::PRE_INC:
640 case ISD::PRE_DEC:
641 case ISD::POST_INC:
642 case ISD::POST_DEC:
643 case ISD::LAST_INDEXED_MODE:
644 cerr << "LowerLOAD: Got a LoadSDNode with an addr mode other than "
645 "UNINDEXED\n";
646 cerr << (unsigned) LN->getAddressingMode() << "\n";
647 abort();
648 /*NOTREACHED*/
649 }
650
Dan Gohman8181bd12008-07-27 21:46:04 +0000651 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000652}
653
654/// Custom lower stores for CellSPU
655/*!
656 All CellSPU stores are aligned to 16-byte boundaries, so for elements
657 within a 16-byte block, we have to generate a shuffle to insert the
658 requested element into its place, then store the resulting block.
659 */
Dan Gohman8181bd12008-07-27 21:46:04 +0000660static SDValue
661LowerSTORE(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Scott Michel8efdca42007-12-04 22:23:35 +0000662 StoreSDNode *SN = cast<StoreSDNode>(Op);
Dan Gohman8181bd12008-07-27 21:46:04 +0000663 SDValue Value = SN->getValue();
Duncan Sands92c43912008-06-06 12:08:01 +0000664 MVT VT = Value.getValueType();
665 MVT StVT = (!SN->isTruncatingStore() ? VT : SN->getMemoryVT());
666 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Dale Johannesenea996922009-02-04 20:06:27 +0000667 DebugLoc dl = Op.getDebugLoc();
Scott Micheldbac4cf2008-01-11 02:53:15 +0000668 unsigned alignment = SN->getAlignment();
Scott Michel8efdca42007-12-04 22:23:35 +0000669
670 switch (SN->getAddressingMode()) {
671 case ISD::UNINDEXED: {
Scott Michel33d73eb2008-11-21 02:56:16 +0000672 // The vector type we really want to load from the 16-byte chunk.
Scott Michele1006032008-11-19 17:45:08 +0000673 MVT vecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits())),
674 stVecVT = MVT::getVectorVT(StVT, (128 / StVT.getSizeInBits()));
Scott Michel8efdca42007-12-04 22:23:35 +0000675
Scott Michel06eabde2008-12-27 04:51:36 +0000676 SDValue alignLoadVec;
677 SDValue basePtr = SN->getBasePtr();
678 SDValue the_chain = SN->getChain();
679 SDValue insertEltOffs;
Scott Michel8efdca42007-12-04 22:23:35 +0000680
Scott Michel06eabde2008-12-27 04:51:36 +0000681 if (alignment == 16) {
682 ConstantSDNode *CN;
683
684 // Special cases for a known aligned load to simplify the base pointer
685 // and insertion byte:
686 if (basePtr.getOpcode() == ISD::ADD
687 && (CN = dyn_cast<ConstantSDNode>(basePtr.getOperand(1))) != 0) {
688 // Known offset into basePtr
689 int64_t offset = CN->getSExtValue();
690
691 // Simplify the base pointer for this case:
692 basePtr = basePtr.getOperand(0);
Dale Johannesen175fdef2009-02-06 21:50:26 +0000693 insertEltOffs = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000694 basePtr,
695 DAG.getConstant((offset & 0xf), PtrVT));
696
697 if ((offset & ~0xf) > 0) {
Dale Johannesen175fdef2009-02-06 21:50:26 +0000698 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000699 basePtr,
700 DAG.getConstant((offset & ~0xf), PtrVT));
701 }
702 } else {
703 // Otherwise, assume it's at byte 0 of basePtr
Dale Johannesen175fdef2009-02-06 21:50:26 +0000704 insertEltOffs = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000705 basePtr,
706 DAG.getConstant(0, PtrVT));
707 }
708 } else {
709 // Unaligned load: must be more pessimistic about addressing modes:
710 if (basePtr.getOpcode() == ISD::ADD) {
711 MachineFunction &MF = DAG.getMachineFunction();
712 MachineRegisterInfo &RegInfo = MF.getRegInfo();
713 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
714 SDValue Flag;
715
716 SDValue Op0 = basePtr.getOperand(0);
717 SDValue Op1 = basePtr.getOperand(1);
718
719 if (isa<ConstantSDNode>(Op1)) {
720 // Convert the (add <ptr>, <const>) to an indirect address contained
721 // in a register. Note that this is done because we need to avoid
722 // creating a 0(reg) d-form address due to the SPU's block loads.
Dale Johannesen175fdef2009-02-06 21:50:26 +0000723 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1);
Dale Johannesenea996922009-02-04 20:06:27 +0000724 the_chain = DAG.getCopyToReg(the_chain, dl, VReg, basePtr, Flag);
725 basePtr = DAG.getCopyFromReg(the_chain, dl, VReg, PtrVT);
Scott Michel06eabde2008-12-27 04:51:36 +0000726 } else {
727 // Convert the (add <arg1>, <arg2>) to an indirect address, which
728 // will likely be lowered as a reg(reg) x-form address.
Dale Johannesen175fdef2009-02-06 21:50:26 +0000729 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1);
Scott Michel06eabde2008-12-27 04:51:36 +0000730 }
731 } else {
Dale Johannesen175fdef2009-02-06 21:50:26 +0000732 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000733 basePtr,
734 DAG.getConstant(0, PtrVT));
735 }
736
737 // Insertion point is solely determined by basePtr's contents
Dale Johannesenea996922009-02-04 20:06:27 +0000738 insertEltOffs = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michel06eabde2008-12-27 04:51:36 +0000739 basePtr,
740 DAG.getConstant(0, PtrVT));
741 }
742
743 // Re-emit as a v16i8 vector load
Dale Johannesenea996922009-02-04 20:06:27 +0000744 alignLoadVec = DAG.getLoad(MVT::v16i8, dl, the_chain, basePtr,
Scott Michel06eabde2008-12-27 04:51:36 +0000745 SN->getSrcValue(), SN->getSrcValueOffset(),
746 SN->isVolatile(), 16);
747
748 // Update the chain
749 the_chain = alignLoadVec.getValue(1);
Scott Michel8efdca42007-12-04 22:23:35 +0000750
Scott Micheldbac4cf2008-01-11 02:53:15 +0000751 LoadSDNode *LN = cast<LoadSDNode>(alignLoadVec);
Dan Gohman8181bd12008-07-27 21:46:04 +0000752 SDValue theValue = SN->getValue();
753 SDValue result;
Scott Michel8efdca42007-12-04 22:23:35 +0000754
755 if (StVT != VT
Scott Michel5a6f17b2008-01-30 02:55:46 +0000756 && (theValue.getOpcode() == ISD::AssertZext
757 || theValue.getOpcode() == ISD::AssertSext)) {
Scott Michel8efdca42007-12-04 22:23:35 +0000758 // Drill down and get the value for zero- and sign-extended
759 // quantities
Scott Michel4ec722e2008-07-16 17:17:29 +0000760 theValue = theValue.getOperand(0);
Scott Michel8efdca42007-12-04 22:23:35 +0000761 }
762
Scott Micheldbac4cf2008-01-11 02:53:15 +0000763 // If the base pointer is already a D-form address, then just create
764 // a new D-form address with a slot offset and the orignal base pointer.
765 // Otherwise generate a D-form address with the slot offset relative
766 // to the stack pointer, which is always aligned.
Scott Michel06eabde2008-12-27 04:51:36 +0000767#if !defined(NDEBUG)
768 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
769 cerr << "CellSPU LowerSTORE: basePtr = ";
770 basePtr.getNode()->dump(&DAG);
771 cerr << "\n";
772 }
773#endif
Scott Micheldbac4cf2008-01-11 02:53:15 +0000774
Scott Michelf65c8f02008-11-19 15:24:16 +0000775 SDValue insertEltOp =
Dale Johannesenea996922009-02-04 20:06:27 +0000776 DAG.getNode(SPUISD::SHUFFLE_MASK, dl, vecVT, insertEltOffs);
Scott Michele1006032008-11-19 17:45:08 +0000777 SDValue vectorizeOp =
Dale Johannesenea996922009-02-04 20:06:27 +0000778 DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, vecVT, theValue);
Scott Michelf65c8f02008-11-19 15:24:16 +0000779
Dale Johannesenea996922009-02-04 20:06:27 +0000780 result = DAG.getNode(SPUISD::SHUFB, dl, vecVT,
pingbakb8913342009-01-26 03:37:41 +0000781 vectorizeOp, alignLoadVec,
Dale Johannesenea996922009-02-04 20:06:27 +0000782 DAG.getNode(ISD::BIT_CONVERT, dl,
783 MVT::v4i32, insertEltOp));
Scott Michel8efdca42007-12-04 22:23:35 +0000784
Dale Johannesenea996922009-02-04 20:06:27 +0000785 result = DAG.getStore(the_chain, dl, result, basePtr,
Scott Michel8efdca42007-12-04 22:23:35 +0000786 LN->getSrcValue(), LN->getSrcValueOffset(),
787 LN->isVolatile(), LN->getAlignment());
788
Scott Michel8c2746e2008-12-04 17:16:59 +0000789#if 0 && !defined(NDEBUG)
Scott Michelf65c8f02008-11-19 15:24:16 +0000790 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
791 const SDValue &currentRoot = DAG.getRoot();
792
793 DAG.setRoot(result);
794 cerr << "------- CellSPU:LowerStore result:\n";
795 DAG.dump();
796 cerr << "-------\n";
797 DAG.setRoot(currentRoot);
798 }
799#endif
Scott Michelec8c82e2008-12-02 19:53:53 +0000800
Scott Michel8efdca42007-12-04 22:23:35 +0000801 return result;
802 /*UNREACHED*/
803 }
804 case ISD::PRE_INC:
805 case ISD::PRE_DEC:
806 case ISD::POST_INC:
807 case ISD::POST_DEC:
808 case ISD::LAST_INDEXED_MODE:
809 cerr << "LowerLOAD: Got a LoadSDNode with an addr mode other than "
810 "UNINDEXED\n";
811 cerr << (unsigned) SN->getAddressingMode() << "\n";
812 abort();
813 /*NOTREACHED*/
814 }
815
Dan Gohman8181bd12008-07-27 21:46:04 +0000816 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000817}
818
Scott Michel750b93f2009-01-15 04:41:47 +0000819//! Generate the address of a constant pool entry.
820SDValue
Dan Gohman8181bd12008-07-27 21:46:04 +0000821LowerConstantPool(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands92c43912008-06-06 12:08:01 +0000822 MVT PtrVT = Op.getValueType();
Scott Michel8efdca42007-12-04 22:23:35 +0000823 ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(Op);
824 Constant *C = CP->getConstVal();
Dan Gohman8181bd12008-07-27 21:46:04 +0000825 SDValue CPI = DAG.getTargetConstantPool(C, PtrVT, CP->getAlignment());
826 SDValue Zero = DAG.getConstant(0, PtrVT);
Scott Micheldbac4cf2008-01-11 02:53:15 +0000827 const TargetMachine &TM = DAG.getTarget();
Dale Johannesen175fdef2009-02-06 21:50:26 +0000828 // FIXME there is no actual debug info here
829 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +0000830
831 if (TM.getRelocationModel() == Reloc::Static) {
832 if (!ST->usingLargeMem()) {
Dan Gohman8181bd12008-07-27 21:46:04 +0000833 // Just return the SDValue with the constant pool address in it.
Dale Johannesen175fdef2009-02-06 21:50:26 +0000834 return DAG.getNode(SPUISD::AFormAddr, dl, PtrVT, CPI, Zero);
Scott Michel8efdca42007-12-04 22:23:35 +0000835 } else {
Dale Johannesen175fdef2009-02-06 21:50:26 +0000836 SDValue Hi = DAG.getNode(SPUISD::Hi, dl, PtrVT, CPI, Zero);
837 SDValue Lo = DAG.getNode(SPUISD::Lo, dl, PtrVT, CPI, Zero);
838 return DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Hi, Lo);
Scott Michel8efdca42007-12-04 22:23:35 +0000839 }
840 }
841
842 assert(0 &&
Gabor Greife9f7f582008-08-31 15:37:04 +0000843 "LowerConstantPool: Relocation model other than static"
844 " not supported.");
Dan Gohman8181bd12008-07-27 21:46:04 +0000845 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000846}
847
Scott Michel750b93f2009-01-15 04:41:47 +0000848//! Alternate entry point for generating the address of a constant pool entry
849SDValue
850SPU::LowerConstantPool(SDValue Op, SelectionDAG &DAG, const SPUTargetMachine &TM) {
851 return ::LowerConstantPool(Op, DAG, TM.getSubtargetImpl());
852}
853
Dan Gohman8181bd12008-07-27 21:46:04 +0000854static SDValue
855LowerJumpTable(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands92c43912008-06-06 12:08:01 +0000856 MVT PtrVT = Op.getValueType();
Scott Michel8efdca42007-12-04 22:23:35 +0000857 JumpTableSDNode *JT = cast<JumpTableSDNode>(Op);
Dan Gohman8181bd12008-07-27 21:46:04 +0000858 SDValue JTI = DAG.getTargetJumpTable(JT->getIndex(), PtrVT);
859 SDValue Zero = DAG.getConstant(0, PtrVT);
Scott Michel8efdca42007-12-04 22:23:35 +0000860 const TargetMachine &TM = DAG.getTarget();
Dale Johannesen175fdef2009-02-06 21:50:26 +0000861 // FIXME there is no actual debug info here
862 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +0000863
864 if (TM.getRelocationModel() == Reloc::Static) {
Scott Michel97872d32008-02-23 18:41:37 +0000865 if (!ST->usingLargeMem()) {
Dale Johannesen175fdef2009-02-06 21:50:26 +0000866 return DAG.getNode(SPUISD::AFormAddr, dl, PtrVT, JTI, Zero);
Scott Michel97872d32008-02-23 18:41:37 +0000867 } else {
Dale Johannesen175fdef2009-02-06 21:50:26 +0000868 SDValue Hi = DAG.getNode(SPUISD::Hi, dl, PtrVT, JTI, Zero);
869 SDValue Lo = DAG.getNode(SPUISD::Lo, dl, PtrVT, JTI, Zero);
870 return DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Hi, Lo);
Scott Michel97872d32008-02-23 18:41:37 +0000871 }
Scott Michel8efdca42007-12-04 22:23:35 +0000872 }
873
874 assert(0 &&
875 "LowerJumpTable: Relocation model other than static not supported.");
Dan Gohman8181bd12008-07-27 21:46:04 +0000876 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000877}
878
Dan Gohman8181bd12008-07-27 21:46:04 +0000879static SDValue
880LowerGlobalAddress(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands92c43912008-06-06 12:08:01 +0000881 MVT PtrVT = Op.getValueType();
Scott Michel8efdca42007-12-04 22:23:35 +0000882 GlobalAddressSDNode *GSDN = cast<GlobalAddressSDNode>(Op);
883 GlobalValue *GV = GSDN->getGlobal();
Dan Gohman8181bd12008-07-27 21:46:04 +0000884 SDValue GA = DAG.getTargetGlobalAddress(GV, PtrVT, GSDN->getOffset());
Scott Michel8efdca42007-12-04 22:23:35 +0000885 const TargetMachine &TM = DAG.getTarget();
Dan Gohman8181bd12008-07-27 21:46:04 +0000886 SDValue Zero = DAG.getConstant(0, PtrVT);
Dale Johannesen175fdef2009-02-06 21:50:26 +0000887 // FIXME there is no actual debug info here
888 DebugLoc dl = Op.getDebugLoc();
Scott Michel4ec722e2008-07-16 17:17:29 +0000889
Scott Michel8efdca42007-12-04 22:23:35 +0000890 if (TM.getRelocationModel() == Reloc::Static) {
Scott Michelf9f42e62008-01-29 02:16:57 +0000891 if (!ST->usingLargeMem()) {
Dale Johannesen175fdef2009-02-06 21:50:26 +0000892 return DAG.getNode(SPUISD::AFormAddr, dl, PtrVT, GA, Zero);
Scott Michelf9f42e62008-01-29 02:16:57 +0000893 } else {
Dale Johannesen175fdef2009-02-06 21:50:26 +0000894 SDValue Hi = DAG.getNode(SPUISD::Hi, dl, PtrVT, GA, Zero);
895 SDValue Lo = DAG.getNode(SPUISD::Lo, dl, PtrVT, GA, Zero);
896 return DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Hi, Lo);
Scott Michelf9f42e62008-01-29 02:16:57 +0000897 }
Scott Michel8efdca42007-12-04 22:23:35 +0000898 } else {
899 cerr << "LowerGlobalAddress: Relocation model other than static not "
Scott Michel5a6f17b2008-01-30 02:55:46 +0000900 << "supported.\n";
Scott Michel8efdca42007-12-04 22:23:35 +0000901 abort();
902 /*NOTREACHED*/
903 }
904
Dan Gohman8181bd12008-07-27 21:46:04 +0000905 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000906}
907
Nate Begeman78125042008-02-14 18:43:04 +0000908//! Custom lower double precision floating point constants
Dan Gohman8181bd12008-07-27 21:46:04 +0000909static SDValue
910LowerConstantFP(SDValue Op, SelectionDAG &DAG) {
Duncan Sands92c43912008-06-06 12:08:01 +0000911 MVT VT = Op.getValueType();
Dale Johannesen175fdef2009-02-06 21:50:26 +0000912 // FIXME there is no actual debug info here
913 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +0000914
Nate Begeman78125042008-02-14 18:43:04 +0000915 if (VT == MVT::f64) {
Scott Michel0718cd82008-12-01 17:56:02 +0000916 ConstantFPSDNode *FP = cast<ConstantFPSDNode>(Op.getNode());
917
918 assert((FP != 0) &&
919 "LowerConstantFP: Node is not ConstantFPSDNode");
Scott Michelae5cbf52008-12-29 03:23:36 +0000920
Scott Michel11e88bb2007-12-19 20:15:47 +0000921 uint64_t dbits = DoubleToBits(FP->getValueAPF().convertToDouble());
Scott Michel0718cd82008-12-01 17:56:02 +0000922 SDValue T = DAG.getConstant(dbits, MVT::i64);
Scott Michel78c70a02009-02-22 23:36:09 +0000923 SDValue Tvec = DAG.getBUILD_VECTOR(MVT::v2i64, dl, T, T);
Dale Johannesen175fdef2009-02-06 21:50:26 +0000924 return DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT,
Dale Johannesen24dd9a52009-02-07 00:55:49 +0000925 DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v2f64, Tvec));
Scott Michel8efdca42007-12-04 22:23:35 +0000926 }
927
Dan Gohman8181bd12008-07-27 21:46:04 +0000928 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +0000929}
930
Dan Gohman8181bd12008-07-27 21:46:04 +0000931static SDValue
Dan Gohman8181bd12008-07-27 21:46:04 +0000932LowerFORMAL_ARGUMENTS(SDValue Op, SelectionDAG &DAG, int &VarArgsFrameIndex)
Scott Michel8efdca42007-12-04 22:23:35 +0000933{
934 MachineFunction &MF = DAG.getMachineFunction();
935 MachineFrameInfo *MFI = MF.getFrameInfo();
Chris Lattner1b989192007-12-31 04:13:23 +0000936 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Michela313fb02008-10-30 01:51:48 +0000937 SmallVector<SDValue, 48> ArgValues;
Dan Gohman8181bd12008-07-27 21:46:04 +0000938 SDValue Root = Op.getOperand(0);
Dan Gohmanfaeb4a32008-09-12 16:56:44 +0000939 bool isVarArg = cast<ConstantSDNode>(Op.getOperand(2))->getZExtValue() != 0;
Dale Johannesenea996922009-02-04 20:06:27 +0000940 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +0000941
942 const unsigned *ArgRegs = SPURegisterInfo::getArgRegs();
943 const unsigned NumArgRegs = SPURegisterInfo::getNumArgRegs();
Scott Michel4ec722e2008-07-16 17:17:29 +0000944
Scott Michel8efdca42007-12-04 22:23:35 +0000945 unsigned ArgOffset = SPUFrameInfo::minStackSize();
946 unsigned ArgRegIdx = 0;
947 unsigned StackSlotSize = SPUFrameInfo::stackSlotSize();
Scott Michel4ec722e2008-07-16 17:17:29 +0000948
Duncan Sands92c43912008-06-06 12:08:01 +0000949 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel4ec722e2008-07-16 17:17:29 +0000950
Scott Michel8efdca42007-12-04 22:23:35 +0000951 // Add DAG nodes to load the arguments or copy them out of registers.
Gabor Greife9f7f582008-08-31 15:37:04 +0000952 for (unsigned ArgNo = 0, e = Op.getNode()->getNumValues() - 1;
953 ArgNo != e; ++ArgNo) {
Duncan Sands92c43912008-06-06 12:08:01 +0000954 MVT ObjectVT = Op.getValue(ArgNo).getValueType();
955 unsigned ObjSize = ObjectVT.getSizeInBits()/8;
Scott Michela313fb02008-10-30 01:51:48 +0000956 SDValue ArgVal;
Scott Michel8efdca42007-12-04 22:23:35 +0000957
Scott Michela313fb02008-10-30 01:51:48 +0000958 if (ArgRegIdx < NumArgRegs) {
959 const TargetRegisterClass *ArgRegClass;
Scott Michel4ec722e2008-07-16 17:17:29 +0000960
Scott Michela313fb02008-10-30 01:51:48 +0000961 switch (ObjectVT.getSimpleVT()) {
962 default: {
Scott Michel33d73eb2008-11-21 02:56:16 +0000963 cerr << "LowerFORMAL_ARGUMENTS Unhandled argument type: "
964 << ObjectVT.getMVTString()
965 << "\n";
966 abort();
Scott Michela313fb02008-10-30 01:51:48 +0000967 }
968 case MVT::i8:
Scott Michel33d73eb2008-11-21 02:56:16 +0000969 ArgRegClass = &SPU::R8CRegClass;
970 break;
Scott Michela313fb02008-10-30 01:51:48 +0000971 case MVT::i16:
Scott Michel33d73eb2008-11-21 02:56:16 +0000972 ArgRegClass = &SPU::R16CRegClass;
973 break;
Scott Michela313fb02008-10-30 01:51:48 +0000974 case MVT::i32:
Scott Michel33d73eb2008-11-21 02:56:16 +0000975 ArgRegClass = &SPU::R32CRegClass;
976 break;
Scott Michela313fb02008-10-30 01:51:48 +0000977 case MVT::i64:
Scott Michel33d73eb2008-11-21 02:56:16 +0000978 ArgRegClass = &SPU::R64CRegClass;
979 break;
Scott Michel2ef773a2009-01-06 03:36:14 +0000980 case MVT::i128:
981 ArgRegClass = &SPU::GPRCRegClass;
982 break;
Scott Michela313fb02008-10-30 01:51:48 +0000983 case MVT::f32:
Scott Michel33d73eb2008-11-21 02:56:16 +0000984 ArgRegClass = &SPU::R32FPRegClass;
985 break;
Scott Michela313fb02008-10-30 01:51:48 +0000986 case MVT::f64:
Scott Michel33d73eb2008-11-21 02:56:16 +0000987 ArgRegClass = &SPU::R64FPRegClass;
988 break;
Scott Michela313fb02008-10-30 01:51:48 +0000989 case MVT::v2f64:
990 case MVT::v4f32:
991 case MVT::v2i64:
992 case MVT::v4i32:
993 case MVT::v8i16:
994 case MVT::v16i8:
Scott Michel33d73eb2008-11-21 02:56:16 +0000995 ArgRegClass = &SPU::VECREGRegClass;
996 break;
Scott Michela313fb02008-10-30 01:51:48 +0000997 }
998
999 unsigned VReg = RegInfo.createVirtualRegister(ArgRegClass);
1000 RegInfo.addLiveIn(ArgRegs[ArgRegIdx], VReg);
Dale Johannesenea996922009-02-04 20:06:27 +00001001 ArgVal = DAG.getCopyFromReg(Root, dl, VReg, ObjectVT);
Scott Michela313fb02008-10-30 01:51:48 +00001002 ++ArgRegIdx;
1003 } else {
1004 // We need to load the argument to a virtual register if we determined
1005 // above that we ran out of physical registers of the appropriate type
1006 // or we're forced to do vararg
Chris Lattner60069452008-02-13 07:35:30 +00001007 int FI = MFI->CreateFixedObject(ObjSize, ArgOffset);
Dan Gohman8181bd12008-07-27 21:46:04 +00001008 SDValue FIN = DAG.getFrameIndex(FI, PtrVT);
Dale Johannesenea996922009-02-04 20:06:27 +00001009 ArgVal = DAG.getLoad(ObjectVT, dl, Root, FIN, NULL, 0);
Scott Michel8efdca42007-12-04 22:23:35 +00001010 ArgOffset += StackSlotSize;
1011 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001012
Scott Michel8efdca42007-12-04 22:23:35 +00001013 ArgValues.push_back(ArgVal);
Scott Michela313fb02008-10-30 01:51:48 +00001014 // Update the chain
1015 Root = ArgVal.getOperand(0);
Scott Michel8efdca42007-12-04 22:23:35 +00001016 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001017
Scott Michela313fb02008-10-30 01:51:48 +00001018 // vararg handling:
Scott Michel8efdca42007-12-04 22:23:35 +00001019 if (isVarArg) {
Scott Michela313fb02008-10-30 01:51:48 +00001020 // unsigned int ptr_size = PtrVT.getSizeInBits() / 8;
1021 // We will spill (79-3)+1 registers to the stack
1022 SmallVector<SDValue, 79-3+1> MemOps;
1023
1024 // Create the frame slot
1025
Scott Michel8efdca42007-12-04 22:23:35 +00001026 for (; ArgRegIdx != NumArgRegs; ++ArgRegIdx) {
Scott Michela313fb02008-10-30 01:51:48 +00001027 VarArgsFrameIndex = MFI->CreateFixedObject(StackSlotSize, ArgOffset);
1028 SDValue FIN = DAG.getFrameIndex(VarArgsFrameIndex, PtrVT);
1029 SDValue ArgVal = DAG.getRegister(ArgRegs[ArgRegIdx], MVT::v16i8);
Dale Johannesenea996922009-02-04 20:06:27 +00001030 SDValue Store = DAG.getStore(Root, dl, ArgVal, FIN, NULL, 0);
Scott Michela313fb02008-10-30 01:51:48 +00001031 Root = Store.getOperand(0);
Scott Michel8efdca42007-12-04 22:23:35 +00001032 MemOps.push_back(Store);
Scott Michela313fb02008-10-30 01:51:48 +00001033
1034 // Increment address by stack slot size for the next stored argument
1035 ArgOffset += StackSlotSize;
Scott Michel8efdca42007-12-04 22:23:35 +00001036 }
1037 if (!MemOps.empty())
Dale Johannesenea996922009-02-04 20:06:27 +00001038 Root = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
1039 &MemOps[0], MemOps.size());
Scott Michel8efdca42007-12-04 22:23:35 +00001040 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001041
Scott Michel8efdca42007-12-04 22:23:35 +00001042 ArgValues.push_back(Root);
Scott Michel4ec722e2008-07-16 17:17:29 +00001043
Scott Michel8efdca42007-12-04 22:23:35 +00001044 // Return the new list of results.
Dale Johannesenea996922009-02-04 20:06:27 +00001045 return DAG.getNode(ISD::MERGE_VALUES, dl, Op.getNode()->getVTList(),
Duncan Sands42d7bb82008-12-01 11:41:29 +00001046 &ArgValues[0], ArgValues.size());
Scott Michel8efdca42007-12-04 22:23:35 +00001047}
1048
1049/// isLSAAddress - Return the immediate to use if the specified
1050/// value is representable as a LSA address.
Dan Gohman8181bd12008-07-27 21:46:04 +00001051static SDNode *isLSAAddress(SDValue Op, SelectionDAG &DAG) {
Scott Michel5974f432008-11-11 03:06:06 +00001052 ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op);
Scott Michel8efdca42007-12-04 22:23:35 +00001053 if (!C) return 0;
Scott Michel4ec722e2008-07-16 17:17:29 +00001054
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001055 int Addr = C->getZExtValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001056 if ((Addr & 3) != 0 || // Low 2 bits are implicitly zero.
1057 (Addr << 14 >> 14) != Addr)
1058 return 0; // Top 14 bits have to be sext of immediate.
Scott Michel4ec722e2008-07-16 17:17:29 +00001059
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001060 return DAG.getConstant((int)C->getZExtValue() >> 2, MVT::i32).getNode();
Scott Michel8efdca42007-12-04 22:23:35 +00001061}
1062
Scott Michel70741542009-01-06 23:10:38 +00001063static SDValue
Dan Gohman8181bd12008-07-27 21:46:04 +00001064LowerCALL(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Dan Gohman705e3f72008-09-13 01:54:27 +00001065 CallSDNode *TheCall = cast<CallSDNode>(Op.getNode());
1066 SDValue Chain = TheCall->getChain();
Dan Gohman705e3f72008-09-13 01:54:27 +00001067 SDValue Callee = TheCall->getCallee();
1068 unsigned NumOps = TheCall->getNumArgs();
Scott Michel8efdca42007-12-04 22:23:35 +00001069 unsigned StackSlotSize = SPUFrameInfo::stackSlotSize();
1070 const unsigned *ArgRegs = SPURegisterInfo::getArgRegs();
1071 const unsigned NumArgRegs = SPURegisterInfo::getNumArgRegs();
Dale Johannesenea996922009-02-04 20:06:27 +00001072 DebugLoc dl = TheCall->getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00001073
1074 // Handy pointer type
Duncan Sands92c43912008-06-06 12:08:01 +00001075 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel4ec722e2008-07-16 17:17:29 +00001076
Scott Michel8efdca42007-12-04 22:23:35 +00001077 // Accumulate how many bytes are to be pushed on the stack, including the
1078 // linkage area, and parameter passing area. According to the SPU ABI,
1079 // we minimally need space for [LR] and [SP]
1080 unsigned NumStackBytes = SPUFrameInfo::minStackSize();
Scott Michel4ec722e2008-07-16 17:17:29 +00001081
Scott Michel8efdca42007-12-04 22:23:35 +00001082 // Set up a copy of the stack pointer for use loading and storing any
1083 // arguments that may not fit in the registers available for argument
1084 // passing.
Dan Gohman8181bd12008-07-27 21:46:04 +00001085 SDValue StackPtr = DAG.getRegister(SPU::R1, MVT::i32);
Scott Michel4ec722e2008-07-16 17:17:29 +00001086
Scott Michel8efdca42007-12-04 22:23:35 +00001087 // Figure out which arguments are going to go in registers, and which in
1088 // memory.
1089 unsigned ArgOffset = SPUFrameInfo::minStackSize(); // Just below [LR]
1090 unsigned ArgRegIdx = 0;
1091
1092 // Keep track of registers passing arguments
Dan Gohman8181bd12008-07-27 21:46:04 +00001093 std::vector<std::pair<unsigned, SDValue> > RegsToPass;
Scott Michel8efdca42007-12-04 22:23:35 +00001094 // And the arguments passed on the stack
Dan Gohman8181bd12008-07-27 21:46:04 +00001095 SmallVector<SDValue, 8> MemOpChains;
Scott Michel8efdca42007-12-04 22:23:35 +00001096
1097 for (unsigned i = 0; i != NumOps; ++i) {
Dan Gohman705e3f72008-09-13 01:54:27 +00001098 SDValue Arg = TheCall->getArg(i);
Scott Michel4ec722e2008-07-16 17:17:29 +00001099
Scott Michel8efdca42007-12-04 22:23:35 +00001100 // PtrOff will be used to store the current argument to the stack if a
1101 // register cannot be found for it.
Dan Gohman8181bd12008-07-27 21:46:04 +00001102 SDValue PtrOff = DAG.getConstant(ArgOffset, StackPtr.getValueType());
Dale Johannesenea996922009-02-04 20:06:27 +00001103 PtrOff = DAG.getNode(ISD::ADD, dl, PtrVT, StackPtr, PtrOff);
Scott Michel8efdca42007-12-04 22:23:35 +00001104
Duncan Sands92c43912008-06-06 12:08:01 +00001105 switch (Arg.getValueType().getSimpleVT()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001106 default: assert(0 && "Unexpected ValueType for argument!");
Scott Michel2ef773a2009-01-06 03:36:14 +00001107 case MVT::i8:
1108 case MVT::i16:
Scott Michel8efdca42007-12-04 22:23:35 +00001109 case MVT::i32:
1110 case MVT::i64:
1111 case MVT::i128:
1112 if (ArgRegIdx != NumArgRegs) {
1113 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1114 } else {
Dale Johannesenea996922009-02-04 20:06:27 +00001115 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel5a6f17b2008-01-30 02:55:46 +00001116 ArgOffset += StackSlotSize;
Scott Michel8efdca42007-12-04 22:23:35 +00001117 }
1118 break;
1119 case MVT::f32:
1120 case MVT::f64:
1121 if (ArgRegIdx != NumArgRegs) {
1122 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1123 } else {
Dale Johannesenea996922009-02-04 20:06:27 +00001124 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel5a6f17b2008-01-30 02:55:46 +00001125 ArgOffset += StackSlotSize;
Scott Michel8efdca42007-12-04 22:23:35 +00001126 }
1127 break;
Scott Michele2641a12008-12-04 21:01:44 +00001128 case MVT::v2i64:
1129 case MVT::v2f64:
Scott Michel8efdca42007-12-04 22:23:35 +00001130 case MVT::v4f32:
1131 case MVT::v4i32:
1132 case MVT::v8i16:
1133 case MVT::v16i8:
1134 if (ArgRegIdx != NumArgRegs) {
1135 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1136 } else {
Dale Johannesenea996922009-02-04 20:06:27 +00001137 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel5a6f17b2008-01-30 02:55:46 +00001138 ArgOffset += StackSlotSize;
Scott Michel8efdca42007-12-04 22:23:35 +00001139 }
1140 break;
1141 }
1142 }
1143
1144 // Update number of stack bytes actually used, insert a call sequence start
1145 NumStackBytes = (ArgOffset - SPUFrameInfo::minStackSize());
Chris Lattnerfe5d4022008-10-11 22:08:30 +00001146 Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumStackBytes,
1147 true));
Scott Michel8efdca42007-12-04 22:23:35 +00001148
1149 if (!MemOpChains.empty()) {
1150 // Adjust the stack pointer for the stack arguments.
Dale Johannesenea996922009-02-04 20:06:27 +00001151 Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
Scott Michel8efdca42007-12-04 22:23:35 +00001152 &MemOpChains[0], MemOpChains.size());
1153 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001154
Scott Michel8efdca42007-12-04 22:23:35 +00001155 // Build a sequence of copy-to-reg nodes chained together with token chain
1156 // and flag operands which copy the outgoing args into the appropriate regs.
Dan Gohman8181bd12008-07-27 21:46:04 +00001157 SDValue InFlag;
Scott Michel8efdca42007-12-04 22:23:35 +00001158 for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i) {
Dale Johannesenea996922009-02-04 20:06:27 +00001159 Chain = DAG.getCopyToReg(Chain, dl, RegsToPass[i].first,
1160 RegsToPass[i].second, InFlag);
Scott Michel8efdca42007-12-04 22:23:35 +00001161 InFlag = Chain.getValue(1);
1162 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001163
Dan Gohman8181bd12008-07-27 21:46:04 +00001164 SmallVector<SDValue, 8> Ops;
Scott Michel8efdca42007-12-04 22:23:35 +00001165 unsigned CallOpc = SPUISD::CALL;
Scott Michel4ec722e2008-07-16 17:17:29 +00001166
Bill Wendlingfef06052008-09-16 21:48:12 +00001167 // If the callee is a GlobalAddress/ExternalSymbol node (quite common, every
1168 // direct call is) turn it into a TargetGlobalAddress/TargetExternalSymbol
1169 // node so that legalize doesn't hack it.
Scott Michel5974f432008-11-11 03:06:06 +00001170 if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee)) {
Scott Michel8efdca42007-12-04 22:23:35 +00001171 GlobalValue *GV = G->getGlobal();
Duncan Sands92c43912008-06-06 12:08:01 +00001172 MVT CalleeVT = Callee.getValueType();
Dan Gohman8181bd12008-07-27 21:46:04 +00001173 SDValue Zero = DAG.getConstant(0, PtrVT);
1174 SDValue GA = DAG.getTargetGlobalAddress(GV, CalleeVT);
Scott Michel8efdca42007-12-04 22:23:35 +00001175
Scott Micheldbac4cf2008-01-11 02:53:15 +00001176 if (!ST->usingLargeMem()) {
1177 // Turn calls to targets that are defined (i.e., have bodies) into BRSL
1178 // style calls, otherwise, external symbols are BRASL calls. This assumes
1179 // that declared/defined symbols are in the same compilation unit and can
1180 // be reached through PC-relative jumps.
1181 //
1182 // NOTE:
1183 // This may be an unsafe assumption for JIT and really large compilation
1184 // units.
1185 if (GV->isDeclaration()) {
Dale Johannesen175fdef2009-02-06 21:50:26 +00001186 Callee = DAG.getNode(SPUISD::AFormAddr, dl, CalleeVT, GA, Zero);
Scott Micheldbac4cf2008-01-11 02:53:15 +00001187 } else {
Dale Johannesen175fdef2009-02-06 21:50:26 +00001188 Callee = DAG.getNode(SPUISD::PCRelAddr, dl, CalleeVT, GA, Zero);
Scott Micheldbac4cf2008-01-11 02:53:15 +00001189 }
Scott Michel8efdca42007-12-04 22:23:35 +00001190 } else {
Scott Micheldbac4cf2008-01-11 02:53:15 +00001191 // "Large memory" mode: Turn all calls into indirect calls with a X-form
1192 // address pairs:
Dale Johannesen175fdef2009-02-06 21:50:26 +00001193 Callee = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, GA, Zero);
Scott Michel8efdca42007-12-04 22:23:35 +00001194 }
Scott Michelae5cbf52008-12-29 03:23:36 +00001195 } else if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(Callee)) {
1196 MVT CalleeVT = Callee.getValueType();
1197 SDValue Zero = DAG.getConstant(0, PtrVT);
1198 SDValue ExtSym = DAG.getTargetExternalSymbol(S->getSymbol(),
1199 Callee.getValueType());
1200
1201 if (!ST->usingLargeMem()) {
Dale Johannesen175fdef2009-02-06 21:50:26 +00001202 Callee = DAG.getNode(SPUISD::AFormAddr, dl, CalleeVT, ExtSym, Zero);
Scott Michelae5cbf52008-12-29 03:23:36 +00001203 } else {
Dale Johannesen175fdef2009-02-06 21:50:26 +00001204 Callee = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, ExtSym, Zero);
Scott Michelae5cbf52008-12-29 03:23:36 +00001205 }
1206 } else if (SDNode *Dest = isLSAAddress(Callee, DAG)) {
Scott Michel8efdca42007-12-04 22:23:35 +00001207 // If this is an absolute destination address that appears to be a legal
1208 // local store address, use the munged value.
Dan Gohman8181bd12008-07-27 21:46:04 +00001209 Callee = SDValue(Dest, 0);
Scott Micheldbac4cf2008-01-11 02:53:15 +00001210 }
Scott Michel8efdca42007-12-04 22:23:35 +00001211
1212 Ops.push_back(Chain);
1213 Ops.push_back(Callee);
Scott Michel4ec722e2008-07-16 17:17:29 +00001214
Scott Michel8efdca42007-12-04 22:23:35 +00001215 // Add argument registers to the end of the list so that they are known live
1216 // into the call.
1217 for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i)
Scott Michel4ec722e2008-07-16 17:17:29 +00001218 Ops.push_back(DAG.getRegister(RegsToPass[i].first,
Scott Michel8efdca42007-12-04 22:23:35 +00001219 RegsToPass[i].second.getValueType()));
Scott Michel4ec722e2008-07-16 17:17:29 +00001220
Gabor Greif1c80d112008-08-28 21:40:38 +00001221 if (InFlag.getNode())
Scott Michel8efdca42007-12-04 22:23:35 +00001222 Ops.push_back(InFlag);
Duncan Sands698842f2008-07-02 17:40:58 +00001223 // Returns a chain and a flag for retval copy to use.
Dale Johannesenea996922009-02-04 20:06:27 +00001224 Chain = DAG.getNode(CallOpc, dl, DAG.getVTList(MVT::Other, MVT::Flag),
Duncan Sands698842f2008-07-02 17:40:58 +00001225 &Ops[0], Ops.size());
Scott Michel8efdca42007-12-04 22:23:35 +00001226 InFlag = Chain.getValue(1);
1227
Chris Lattnerfe5d4022008-10-11 22:08:30 +00001228 Chain = DAG.getCALLSEQ_END(Chain, DAG.getIntPtrConstant(NumStackBytes, true),
1229 DAG.getIntPtrConstant(0, true), InFlag);
Dan Gohman705e3f72008-09-13 01:54:27 +00001230 if (TheCall->getValueType(0) != MVT::Other)
Evan Cheng07322bb2008-02-05 22:44:06 +00001231 InFlag = Chain.getValue(1);
1232
Dan Gohman8181bd12008-07-27 21:46:04 +00001233 SDValue ResultVals[3];
Scott Michel8efdca42007-12-04 22:23:35 +00001234 unsigned NumResults = 0;
Scott Michel4ec722e2008-07-16 17:17:29 +00001235
Scott Michel8efdca42007-12-04 22:23:35 +00001236 // If the call has results, copy the values out of the ret val registers.
Dan Gohman705e3f72008-09-13 01:54:27 +00001237 switch (TheCall->getValueType(0).getSimpleVT()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001238 default: assert(0 && "Unexpected ret value!");
1239 case MVT::Other: break;
1240 case MVT::i32:
Dan Gohman705e3f72008-09-13 01:54:27 +00001241 if (TheCall->getValueType(1) == MVT::i32) {
Dale Johannesenea996922009-02-04 20:06:27 +00001242 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R4,
1243 MVT::i32, InFlag).getValue(1);
Scott Michel8efdca42007-12-04 22:23:35 +00001244 ResultVals[0] = Chain.getValue(0);
Dale Johannesenea996922009-02-04 20:06:27 +00001245 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i32,
Scott Michel8efdca42007-12-04 22:23:35 +00001246 Chain.getValue(2)).getValue(1);
1247 ResultVals[1] = Chain.getValue(0);
1248 NumResults = 2;
Scott Michel8efdca42007-12-04 22:23:35 +00001249 } else {
Dale Johannesenea996922009-02-04 20:06:27 +00001250 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i32,
1251 InFlag).getValue(1);
Scott Michel8efdca42007-12-04 22:23:35 +00001252 ResultVals[0] = Chain.getValue(0);
1253 NumResults = 1;
1254 }
Scott Michel8efdca42007-12-04 22:23:35 +00001255 break;
1256 case MVT::i64:
Dale Johannesenea996922009-02-04 20:06:27 +00001257 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i64,
1258 InFlag).getValue(1);
Scott Michel8efdca42007-12-04 22:23:35 +00001259 ResultVals[0] = Chain.getValue(0);
1260 NumResults = 1;
Scott Michel8efdca42007-12-04 22:23:35 +00001261 break;
Scott Michel2ef773a2009-01-06 03:36:14 +00001262 case MVT::i128:
Dale Johannesenea996922009-02-04 20:06:27 +00001263 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i128,
1264 InFlag).getValue(1);
Scott Michel2ef773a2009-01-06 03:36:14 +00001265 ResultVals[0] = Chain.getValue(0);
1266 NumResults = 1;
1267 break;
Scott Michel8efdca42007-12-04 22:23:35 +00001268 case MVT::f32:
1269 case MVT::f64:
Dale Johannesenea996922009-02-04 20:06:27 +00001270 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, TheCall->getValueType(0),
Scott Michel8efdca42007-12-04 22:23:35 +00001271 InFlag).getValue(1);
1272 ResultVals[0] = Chain.getValue(0);
1273 NumResults = 1;
Scott Michel8efdca42007-12-04 22:23:35 +00001274 break;
1275 case MVT::v2f64:
Scott Michele2641a12008-12-04 21:01:44 +00001276 case MVT::v2i64:
Scott Michel8efdca42007-12-04 22:23:35 +00001277 case MVT::v4f32:
1278 case MVT::v4i32:
1279 case MVT::v8i16:
1280 case MVT::v16i8:
Dale Johannesenea996922009-02-04 20:06:27 +00001281 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, TheCall->getValueType(0),
Scott Michel8efdca42007-12-04 22:23:35 +00001282 InFlag).getValue(1);
1283 ResultVals[0] = Chain.getValue(0);
1284 NumResults = 1;
Scott Michel8efdca42007-12-04 22:23:35 +00001285 break;
1286 }
Duncan Sands698842f2008-07-02 17:40:58 +00001287
Scott Michel8efdca42007-12-04 22:23:35 +00001288 // If the function returns void, just return the chain.
1289 if (NumResults == 0)
1290 return Chain;
Scott Michel4ec722e2008-07-16 17:17:29 +00001291
Scott Michel8efdca42007-12-04 22:23:35 +00001292 // Otherwise, merge everything together with a MERGE_VALUES node.
1293 ResultVals[NumResults++] = Chain;
Dale Johannesenea996922009-02-04 20:06:27 +00001294 SDValue Res = DAG.getMergeValues(ResultVals, NumResults, dl);
Gabor Greif46bf5472008-08-26 22:36:50 +00001295 return Res.getValue(Op.getResNo());
Scott Michel8efdca42007-12-04 22:23:35 +00001296}
1297
Dan Gohman8181bd12008-07-27 21:46:04 +00001298static SDValue
1299LowerRET(SDValue Op, SelectionDAG &DAG, TargetMachine &TM) {
Scott Michel8efdca42007-12-04 22:23:35 +00001300 SmallVector<CCValAssign, 16> RVLocs;
1301 unsigned CC = DAG.getMachineFunction().getFunction()->getCallingConv();
1302 bool isVarArg = DAG.getMachineFunction().getFunction()->isVarArg();
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001303 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00001304 CCState CCInfo(CC, isVarArg, TM, RVLocs);
Gabor Greif1c80d112008-08-28 21:40:38 +00001305 CCInfo.AnalyzeReturn(Op.getNode(), RetCC_SPU);
Scott Michel4ec722e2008-07-16 17:17:29 +00001306
Scott Michel8efdca42007-12-04 22:23:35 +00001307 // If this is the first return lowered for this function, add the regs to the
1308 // liveout set for the function.
Chris Lattner1b989192007-12-31 04:13:23 +00001309 if (DAG.getMachineFunction().getRegInfo().liveout_empty()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001310 for (unsigned i = 0; i != RVLocs.size(); ++i)
Chris Lattner1b989192007-12-31 04:13:23 +00001311 DAG.getMachineFunction().getRegInfo().addLiveOut(RVLocs[i].getLocReg());
Scott Michel8efdca42007-12-04 22:23:35 +00001312 }
1313
Dan Gohman8181bd12008-07-27 21:46:04 +00001314 SDValue Chain = Op.getOperand(0);
1315 SDValue Flag;
Scott Michel4ec722e2008-07-16 17:17:29 +00001316
Scott Michel8efdca42007-12-04 22:23:35 +00001317 // Copy the result values into the output registers.
1318 for (unsigned i = 0; i != RVLocs.size(); ++i) {
1319 CCValAssign &VA = RVLocs[i];
1320 assert(VA.isRegLoc() && "Can only return in registers!");
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001321 Chain = DAG.getCopyToReg(Chain, dl, VA.getLocReg(),
1322 Op.getOperand(i*2+1), Flag);
Scott Michel8efdca42007-12-04 22:23:35 +00001323 Flag = Chain.getValue(1);
1324 }
1325
Gabor Greif1c80d112008-08-28 21:40:38 +00001326 if (Flag.getNode())
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001327 return DAG.getNode(SPUISD::RET_FLAG, dl, MVT::Other, Chain, Flag);
Scott Michel8efdca42007-12-04 22:23:35 +00001328 else
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001329 return DAG.getNode(SPUISD::RET_FLAG, dl, MVT::Other, Chain);
Scott Michel8efdca42007-12-04 22:23:35 +00001330}
1331
1332
1333//===----------------------------------------------------------------------===//
1334// Vector related lowering:
1335//===----------------------------------------------------------------------===//
1336
1337static ConstantSDNode *
1338getVecImm(SDNode *N) {
Dan Gohman8181bd12008-07-27 21:46:04 +00001339 SDValue OpVal(0, 0);
Scott Michel4ec722e2008-07-16 17:17:29 +00001340
Scott Michel8efdca42007-12-04 22:23:35 +00001341 // Check to see if this buildvec has a single non-undef value in its elements.
1342 for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
1343 if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue;
Gabor Greif1c80d112008-08-28 21:40:38 +00001344 if (OpVal.getNode() == 0)
Scott Michel8efdca42007-12-04 22:23:35 +00001345 OpVal = N->getOperand(i);
1346 else if (OpVal != N->getOperand(i))
1347 return 0;
1348 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001349
Gabor Greif1c80d112008-08-28 21:40:38 +00001350 if (OpVal.getNode() != 0) {
Scott Michel5974f432008-11-11 03:06:06 +00001351 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
Scott Michel8efdca42007-12-04 22:23:35 +00001352 return CN;
1353 }
1354 }
1355
1356 return 0; // All UNDEF: use implicit def.; not Constant node
1357}
1358
1359/// get_vec_i18imm - Test if this vector is a vector filled with the same value
1360/// and the value fits into an unsigned 18-bit constant, and if so, return the
1361/// constant
Dan Gohman8181bd12008-07-27 21:46:04 +00001362SDValue SPU::get_vec_u18imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands92c43912008-06-06 12:08:01 +00001363 MVT ValueType) {
Scott Michel8efdca42007-12-04 22:23:35 +00001364 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001365 uint64_t Value = CN->getZExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001366 if (ValueType == MVT::i64) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001367 uint64_t UValue = CN->getZExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001368 uint32_t upper = uint32_t(UValue >> 32);
1369 uint32_t lower = uint32_t(UValue);
1370 if (upper != lower)
Dan Gohman8181bd12008-07-27 21:46:04 +00001371 return SDValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001372 Value = Value >> 32;
1373 }
Scott Michel8efdca42007-12-04 22:23:35 +00001374 if (Value <= 0x3ffff)
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001375 return DAG.getTargetConstant(Value, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001376 }
1377
Dan Gohman8181bd12008-07-27 21:46:04 +00001378 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001379}
1380
1381/// get_vec_i16imm - Test if this vector is a vector filled with the same value
1382/// and the value fits into a signed 16-bit constant, and if so, return the
1383/// constant
Dan Gohman8181bd12008-07-27 21:46:04 +00001384SDValue SPU::get_vec_i16imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands92c43912008-06-06 12:08:01 +00001385 MVT ValueType) {
Scott Michel8efdca42007-12-04 22:23:35 +00001386 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman40686732008-09-26 21:54:37 +00001387 int64_t Value = CN->getSExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001388 if (ValueType == MVT::i64) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001389 uint64_t UValue = CN->getZExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001390 uint32_t upper = uint32_t(UValue >> 32);
1391 uint32_t lower = uint32_t(UValue);
1392 if (upper != lower)
Dan Gohman8181bd12008-07-27 21:46:04 +00001393 return SDValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001394 Value = Value >> 32;
1395 }
Scott Michel6baba072008-03-05 23:02:02 +00001396 if (Value >= -(1 << 15) && Value <= ((1 << 15) - 1)) {
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001397 return DAG.getTargetConstant(Value, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001398 }
1399 }
1400
Dan Gohman8181bd12008-07-27 21:46:04 +00001401 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001402}
1403
1404/// get_vec_i10imm - Test if this vector is a vector filled with the same value
1405/// and the value fits into a signed 10-bit constant, and if so, return the
1406/// constant
Dan Gohman8181bd12008-07-27 21:46:04 +00001407SDValue SPU::get_vec_i10imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands92c43912008-06-06 12:08:01 +00001408 MVT ValueType) {
Scott Michel8efdca42007-12-04 22:23:35 +00001409 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman40686732008-09-26 21:54:37 +00001410 int64_t Value = CN->getSExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001411 if (ValueType == MVT::i64) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001412 uint64_t UValue = CN->getZExtValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001413 uint32_t upper = uint32_t(UValue >> 32);
1414 uint32_t lower = uint32_t(UValue);
1415 if (upper != lower)
Dan Gohman8181bd12008-07-27 21:46:04 +00001416 return SDValue();
Scott Michelbcc7b672008-03-06 04:02:54 +00001417 Value = Value >> 32;
1418 }
Scott Michel6baba072008-03-05 23:02:02 +00001419 if (isS10Constant(Value))
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001420 return DAG.getTargetConstant(Value, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001421 }
1422
Dan Gohman8181bd12008-07-27 21:46:04 +00001423 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001424}
1425
1426/// get_vec_i8imm - Test if this vector is a vector filled with the same value
1427/// and the value fits into a signed 8-bit constant, and if so, return the
1428/// constant.
1429///
1430/// @note: The incoming vector is v16i8 because that's the only way we can load
1431/// constant vectors. Thus, we test to see if the upper and lower bytes are the
1432/// same value.
Dan Gohman8181bd12008-07-27 21:46:04 +00001433SDValue SPU::get_vec_i8imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands92c43912008-06-06 12:08:01 +00001434 MVT ValueType) {
Scott Michel8efdca42007-12-04 22:23:35 +00001435 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001436 int Value = (int) CN->getZExtValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001437 if (ValueType == MVT::i16
Scott Michel5a6f17b2008-01-30 02:55:46 +00001438 && Value <= 0xffff /* truncated from uint64_t */
1439 && ((short) Value >> 8) == ((short) Value & 0xff))
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001440 return DAG.getTargetConstant(Value & 0xff, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001441 else if (ValueType == MVT::i8
Scott Michel5a6f17b2008-01-30 02:55:46 +00001442 && (Value & 0xff) == Value)
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001443 return DAG.getTargetConstant(Value, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001444 }
1445
Dan Gohman8181bd12008-07-27 21:46:04 +00001446 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001447}
1448
1449/// get_ILHUvec_imm - Test if this vector is a vector filled with the same value
1450/// and the value fits into a signed 16-bit constant, and if so, return the
1451/// constant
Dan Gohman8181bd12008-07-27 21:46:04 +00001452SDValue SPU::get_ILHUvec_imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands92c43912008-06-06 12:08:01 +00001453 MVT ValueType) {
Scott Michel8efdca42007-12-04 22:23:35 +00001454 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001455 uint64_t Value = CN->getZExtValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001456 if ((ValueType == MVT::i32
Scott Michel5a6f17b2008-01-30 02:55:46 +00001457 && ((unsigned) Value & 0xffff0000) == (unsigned) Value)
1458 || (ValueType == MVT::i64 && (Value & 0xffff0000) == Value))
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001459 return DAG.getTargetConstant(Value >> 16, ValueType);
Scott Michel8efdca42007-12-04 22:23:35 +00001460 }
1461
Dan Gohman8181bd12008-07-27 21:46:04 +00001462 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001463}
1464
1465/// get_v4i32_imm - Catch-all for general 32-bit constant vectors
Dan Gohman8181bd12008-07-27 21:46:04 +00001466SDValue SPU::get_v4i32_imm(SDNode *N, SelectionDAG &DAG) {
Scott Michel8efdca42007-12-04 22:23:35 +00001467 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001468 return DAG.getTargetConstant((unsigned) CN->getZExtValue(), MVT::i32);
Scott Michel8efdca42007-12-04 22:23:35 +00001469 }
1470
Dan Gohman8181bd12008-07-27 21:46:04 +00001471 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001472}
1473
1474/// get_v4i32_imm - Catch-all for general 64-bit constant vectors
Dan Gohman8181bd12008-07-27 21:46:04 +00001475SDValue SPU::get_v2i64_imm(SDNode *N, SelectionDAG &DAG) {
Scott Michel8efdca42007-12-04 22:23:35 +00001476 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman57d5d5d2008-11-05 02:06:09 +00001477 return DAG.getTargetConstant((unsigned) CN->getZExtValue(), MVT::i64);
Scott Michel8efdca42007-12-04 22:23:35 +00001478 }
1479
Dan Gohman8181bd12008-07-27 21:46:04 +00001480 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001481}
1482
1483// If this is a vector of constants or undefs, get the bits. A bit in
Scott Michel4ec722e2008-07-16 17:17:29 +00001484// UndefBits is set if the corresponding element of the vector is an
Scott Michel8efdca42007-12-04 22:23:35 +00001485// ISD::UNDEF value. For undefs, the corresponding VectorBits values are
1486// zero. Return true if this is not an array of constants, false if it is.
1487//
1488static bool GetConstantBuildVectorBits(SDNode *BV, uint64_t VectorBits[2],
1489 uint64_t UndefBits[2]) {
1490 // Start with zero'd results.
1491 VectorBits[0] = VectorBits[1] = UndefBits[0] = UndefBits[1] = 0;
Scott Michel4ec722e2008-07-16 17:17:29 +00001492
Duncan Sands92c43912008-06-06 12:08:01 +00001493 unsigned EltBitSize = BV->getOperand(0).getValueType().getSizeInBits();
Scott Michel8efdca42007-12-04 22:23:35 +00001494 for (unsigned i = 0, e = BV->getNumOperands(); i != e; ++i) {
Dan Gohman8181bd12008-07-27 21:46:04 +00001495 SDValue OpVal = BV->getOperand(i);
Scott Michel4ec722e2008-07-16 17:17:29 +00001496
Scott Michel8efdca42007-12-04 22:23:35 +00001497 unsigned PartNo = i >= e/2; // In the upper 128 bits?
1498 unsigned SlotNo = e/2 - (i & (e/2-1))-1; // Which subpiece of the uint64_t.
1499
1500 uint64_t EltBits = 0;
1501 if (OpVal.getOpcode() == ISD::UNDEF) {
1502 uint64_t EltUndefBits = ~0ULL >> (64-EltBitSize);
1503 UndefBits[PartNo] |= EltUndefBits << (SlotNo*EltBitSize);
1504 continue;
Scott Michel5974f432008-11-11 03:06:06 +00001505 } else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001506 EltBits = CN->getZExtValue() & (~0ULL >> (64-EltBitSize));
Scott Michel5974f432008-11-11 03:06:06 +00001507 } else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal)) {
Scott Michel8efdca42007-12-04 22:23:35 +00001508 const APFloat &apf = CN->getValueAPF();
1509 EltBits = (CN->getValueType(0) == MVT::f32
Scott Michel5a6f17b2008-01-30 02:55:46 +00001510 ? FloatToBits(apf.convertToFloat())
1511 : DoubleToBits(apf.convertToDouble()));
Scott Michel8efdca42007-12-04 22:23:35 +00001512 } else {
1513 // Nonconstant element.
1514 return true;
1515 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001516
Scott Michel8efdca42007-12-04 22:23:35 +00001517 VectorBits[PartNo] |= EltBits << (SlotNo*EltBitSize);
1518 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001519
1520 //printf("%llx %llx %llx %llx\n",
Scott Michel8efdca42007-12-04 22:23:35 +00001521 // VectorBits[0], VectorBits[1], UndefBits[0], UndefBits[1]);
1522 return false;
1523}
1524
1525/// If this is a splat (repetition) of a value across the whole vector, return
1526/// the smallest size that splats it. For example, "0x01010101010101..." is a
Scott Michel4ec722e2008-07-16 17:17:29 +00001527/// splat of 0x01, 0x0101, and 0x01010101. We return SplatBits = 0x01 and
Scott Michel8efdca42007-12-04 22:23:35 +00001528/// SplatSize = 1 byte.
Scott Michel4ec722e2008-07-16 17:17:29 +00001529static bool isConstantSplat(const uint64_t Bits128[2],
Scott Michel8efdca42007-12-04 22:23:35 +00001530 const uint64_t Undef128[2],
Scott Michel5a6f17b2008-01-30 02:55:46 +00001531 int MinSplatBits,
Scott Michel8efdca42007-12-04 22:23:35 +00001532 uint64_t &SplatBits, uint64_t &SplatUndef,
1533 int &SplatSize) {
1534 // Don't let undefs prevent splats from matching. See if the top 64-bits are
1535 // the same as the lower 64-bits, ignoring undefs.
1536 uint64_t Bits64 = Bits128[0] | Bits128[1];
1537 uint64_t Undef64 = Undef128[0] & Undef128[1];
1538 uint32_t Bits32 = uint32_t(Bits64) | uint32_t(Bits64 >> 32);
1539 uint32_t Undef32 = uint32_t(Undef64) & uint32_t(Undef64 >> 32);
1540 uint16_t Bits16 = uint16_t(Bits32) | uint16_t(Bits32 >> 16);
1541 uint16_t Undef16 = uint16_t(Undef32) & uint16_t(Undef32 >> 16);
1542
1543 if ((Bits128[0] & ~Undef128[1]) == (Bits128[1] & ~Undef128[0])) {
1544 if (MinSplatBits < 64) {
Scott Michel4ec722e2008-07-16 17:17:29 +00001545
Scott Michel8efdca42007-12-04 22:23:35 +00001546 // Check that the top 32-bits are the same as the lower 32-bits, ignoring
1547 // undefs.
1548 if ((Bits64 & (~Undef64 >> 32)) == ((Bits64 >> 32) & ~Undef64)) {
Scott Michel5a6f17b2008-01-30 02:55:46 +00001549 if (MinSplatBits < 32) {
Scott Michel8efdca42007-12-04 22:23:35 +00001550
Scott Michel5a6f17b2008-01-30 02:55:46 +00001551 // If the top 16-bits are different than the lower 16-bits, ignoring
1552 // undefs, we have an i32 splat.
1553 if ((Bits32 & (~Undef32 >> 16)) == ((Bits32 >> 16) & ~Undef32)) {
1554 if (MinSplatBits < 16) {
1555 // If the top 8-bits are different than the lower 8-bits, ignoring
1556 // undefs, we have an i16 splat.
Gabor Greife9f7f582008-08-31 15:37:04 +00001557 if ((Bits16 & (uint16_t(~Undef16) >> 8))
1558 == ((Bits16 >> 8) & ~Undef16)) {
Scott Michel5a6f17b2008-01-30 02:55:46 +00001559 // Otherwise, we have an 8-bit splat.
1560 SplatBits = uint8_t(Bits16) | uint8_t(Bits16 >> 8);
1561 SplatUndef = uint8_t(Undef16) & uint8_t(Undef16 >> 8);
1562 SplatSize = 1;
1563 return true;
1564 }
1565 } else {
1566 SplatBits = Bits16;
1567 SplatUndef = Undef16;
1568 SplatSize = 2;
1569 return true;
1570 }
1571 }
1572 } else {
1573 SplatBits = Bits32;
1574 SplatUndef = Undef32;
1575 SplatSize = 4;
1576 return true;
1577 }
Scott Michel8efdca42007-12-04 22:23:35 +00001578 }
1579 } else {
1580 SplatBits = Bits128[0];
1581 SplatUndef = Undef128[0];
1582 SplatSize = 8;
1583 return true;
1584 }
1585 }
1586
1587 return false; // Can't be a splat if two pieces don't match.
1588}
1589
Scott Michel8c67fa42009-01-21 04:58:48 +00001590//! Lower a BUILD_VECTOR instruction creatively:
1591SDValue
pingbak2f387e82009-01-26 03:31:40 +00001592LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) {
Duncan Sands92c43912008-06-06 12:08:01 +00001593 MVT VT = Op.getValueType();
Dale Johannesen913ba762009-02-06 01:31:28 +00001594 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00001595 // If this is a vector of constants or undefs, get the bits. A bit in
Scott Michel4ec722e2008-07-16 17:17:29 +00001596 // UndefBits is set if the corresponding element of the vector is an
Scott Michel8efdca42007-12-04 22:23:35 +00001597 // ISD::UNDEF value. For undefs, the corresponding VectorBits values are
Scott Michel4ec722e2008-07-16 17:17:29 +00001598 // zero.
Scott Michel8efdca42007-12-04 22:23:35 +00001599 uint64_t VectorBits[2];
1600 uint64_t UndefBits[2];
1601 uint64_t SplatBits, SplatUndef;
1602 int SplatSize;
Gabor Greif1c80d112008-08-28 21:40:38 +00001603 if (GetConstantBuildVectorBits(Op.getNode(), VectorBits, UndefBits)
Scott Michel8efdca42007-12-04 22:23:35 +00001604 || !isConstantSplat(VectorBits, UndefBits,
Duncan Sands92c43912008-06-06 12:08:01 +00001605 VT.getVectorElementType().getSizeInBits(),
Scott Michel8efdca42007-12-04 22:23:35 +00001606 SplatBits, SplatUndef, SplatSize))
Dan Gohman8181bd12008-07-27 21:46:04 +00001607 return SDValue(); // Not a constant vector, not a splat.
Scott Michel4ec722e2008-07-16 17:17:29 +00001608
Duncan Sands92c43912008-06-06 12:08:01 +00001609 switch (VT.getSimpleVT()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001610 default:
Scott Michel8c67fa42009-01-21 04:58:48 +00001611 cerr << "CellSPU: Unhandled VT in LowerBUILD_VECTOR, VT = "
1612 << VT.getMVTString()
1613 << "\n";
1614 abort();
1615 /*NOTREACHED*/
Scott Michel8efdca42007-12-04 22:23:35 +00001616 case MVT::v4f32: {
pingbak2f387e82009-01-26 03:31:40 +00001617 uint32_t Value32 = uint32_t(SplatBits);
Scott Michel8efdca42007-12-04 22:23:35 +00001618 assert(SplatSize == 4
Scott Michel5a6f17b2008-01-30 02:55:46 +00001619 && "LowerBUILD_VECTOR: Unexpected floating point vector element.");
Scott Michel8efdca42007-12-04 22:23:35 +00001620 // NOTE: pretend the constant is an integer. LLVM won't load FP constants
Dan Gohman8181bd12008-07-27 21:46:04 +00001621 SDValue T = DAG.getConstant(Value32, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00001622 return DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v4f32,
Scott Michel78c70a02009-02-22 23:36:09 +00001623 DAG.getBUILD_VECTOR(MVT::v4i32, dl, T, T, T, T));
Scott Michel8efdca42007-12-04 22:23:35 +00001624 break;
1625 }
1626 case MVT::v2f64: {
pingbak2f387e82009-01-26 03:31:40 +00001627 uint64_t f64val = uint64_t(SplatBits);
Scott Michel8efdca42007-12-04 22:23:35 +00001628 assert(SplatSize == 8
Scott Michelc630c412008-11-24 17:11:17 +00001629 && "LowerBUILD_VECTOR: 64-bit float vector size > 8 bytes.");
Scott Michel8efdca42007-12-04 22:23:35 +00001630 // NOTE: pretend the constant is an integer. LLVM won't load FP constants
Dan Gohman8181bd12008-07-27 21:46:04 +00001631 SDValue T = DAG.getConstant(f64val, MVT::i64);
Dale Johannesen913ba762009-02-06 01:31:28 +00001632 return DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v2f64,
Scott Michel78c70a02009-02-22 23:36:09 +00001633 DAG.getBUILD_VECTOR(MVT::v2i64, dl, T, T));
Scott Michel8efdca42007-12-04 22:23:35 +00001634 break;
1635 }
1636 case MVT::v16i8: {
1637 // 8-bit constants have to be expanded to 16-bits
1638 unsigned short Value16 = SplatBits | (SplatBits << 8);
Dan Gohman8181bd12008-07-27 21:46:04 +00001639 SDValue Ops[8];
Scott Michel8efdca42007-12-04 22:23:35 +00001640 for (int i = 0; i < 8; ++i)
1641 Ops[i] = DAG.getConstant(Value16, MVT::i16);
Dale Johannesen913ba762009-02-06 01:31:28 +00001642 return DAG.getNode(ISD::BIT_CONVERT, dl, VT,
Scott Michel78c70a02009-02-22 23:36:09 +00001643 DAG.getBUILD_VECTOR(MVT::v8i16, dl, Ops, 8));
Scott Michel8efdca42007-12-04 22:23:35 +00001644 }
1645 case MVT::v8i16: {
1646 unsigned short Value16;
Scott Michel4ec722e2008-07-16 17:17:29 +00001647 if (SplatSize == 2)
Scott Michel8efdca42007-12-04 22:23:35 +00001648 Value16 = (unsigned short) (SplatBits & 0xffff);
1649 else
1650 Value16 = (unsigned short) (SplatBits | (SplatBits << 8));
Dan Gohman8181bd12008-07-27 21:46:04 +00001651 SDValue T = DAG.getConstant(Value16, VT.getVectorElementType());
1652 SDValue Ops[8];
Scott Michel8efdca42007-12-04 22:23:35 +00001653 for (int i = 0; i < 8; ++i) Ops[i] = T;
Scott Michel78c70a02009-02-22 23:36:09 +00001654 return DAG.getBUILD_VECTOR(VT, dl, Ops, 8);
Scott Michel8efdca42007-12-04 22:23:35 +00001655 }
1656 case MVT::v4i32: {
1657 unsigned int Value = SplatBits;
Dan Gohman8181bd12008-07-27 21:46:04 +00001658 SDValue T = DAG.getConstant(Value, VT.getVectorElementType());
Scott Michel78c70a02009-02-22 23:36:09 +00001659 return DAG.getBUILD_VECTOR(VT, dl, T, T, T, T);
Scott Michel8efdca42007-12-04 22:23:35 +00001660 }
Scott Michel70741542009-01-06 23:10:38 +00001661 case MVT::v2i32: {
1662 unsigned int Value = SplatBits;
1663 SDValue T = DAG.getConstant(Value, VT.getVectorElementType());
Scott Michel78c70a02009-02-22 23:36:09 +00001664 return DAG.getBUILD_VECTOR(VT, dl, T, T);
Scott Michel70741542009-01-06 23:10:38 +00001665 }
Scott Michel8efdca42007-12-04 22:23:35 +00001666 case MVT::v2i64: {
Dale Johannesen913ba762009-02-06 01:31:28 +00001667 return SPU::LowerSplat_v2i64(VT, DAG, SplatBits, dl);
Scott Michel8efdca42007-12-04 22:23:35 +00001668 }
1669 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001670
Dan Gohman8181bd12008-07-27 21:46:04 +00001671 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001672}
1673
pingbak2f387e82009-01-26 03:31:40 +00001674SDValue
Dale Johannesen913ba762009-02-06 01:31:28 +00001675SPU::LowerSplat_v2i64(MVT OpVT, SelectionDAG& DAG, uint64_t SplatVal,
1676 DebugLoc dl) {
pingbak2f387e82009-01-26 03:31:40 +00001677 uint32_t upper = uint32_t(SplatVal >> 32);
1678 uint32_t lower = uint32_t(SplatVal);
1679
1680 if (upper == lower) {
1681 // Magic constant that can be matched by IL, ILA, et. al.
1682 SDValue Val = DAG.getTargetConstant(upper, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00001683 return DAG.getNode(ISD::BIT_CONVERT, dl, OpVT,
Scott Michel78c70a02009-02-22 23:36:09 +00001684 DAG.getBUILD_VECTOR(MVT::v4i32, dl,
1685 Val, Val, Val, Val));
pingbak2f387e82009-01-26 03:31:40 +00001686 } else {
1687 SDValue LO32;
1688 SDValue HI32;
1689 SmallVector<SDValue, 16> ShufBytes;
1690 SDValue Result;
1691 bool upper_special, lower_special;
1692
1693 // NOTE: This code creates common-case shuffle masks that can be easily
1694 // detected as common expressions. It is not attempting to create highly
1695 // specialized masks to replace any and all 0's, 0xff's and 0x80's.
1696
1697 // Detect if the upper or lower half is a special shuffle mask pattern:
1698 upper_special = (upper == 0 || upper == 0xffffffff || upper == 0x80000000);
1699 lower_special = (lower == 0 || lower == 0xffffffff || lower == 0x80000000);
1700
1701 // Create lower vector if not a special pattern
1702 if (!lower_special) {
1703 SDValue LO32C = DAG.getConstant(lower, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00001704 LO32 = DAG.getNode(ISD::BIT_CONVERT, dl, OpVT,
Scott Michel78c70a02009-02-22 23:36:09 +00001705 DAG.getBUILD_VECTOR(MVT::v4i32, dl,
1706 LO32C, LO32C, LO32C, LO32C));
pingbak2f387e82009-01-26 03:31:40 +00001707 }
1708
1709 // Create upper vector if not a special pattern
1710 if (!upper_special) {
1711 SDValue HI32C = DAG.getConstant(upper, MVT::i32);
Dale Johannesen913ba762009-02-06 01:31:28 +00001712 HI32 = DAG.getNode(ISD::BIT_CONVERT, dl, OpVT,
Scott Michel78c70a02009-02-22 23:36:09 +00001713 DAG.getBUILD_VECTOR(MVT::v4i32, dl,
1714 HI32C, HI32C, HI32C, HI32C));
pingbak2f387e82009-01-26 03:31:40 +00001715 }
1716
1717 // If either upper or lower are special, then the two input operands are
1718 // the same (basically, one of them is a "don't care")
1719 if (lower_special)
1720 LO32 = HI32;
1721 if (upper_special)
1722 HI32 = LO32;
1723 if (lower_special && upper_special) {
1724 // Unhappy situation... both upper and lower are special, so punt with
1725 // a target constant:
1726 SDValue Zero = DAG.getConstant(0, MVT::i32);
Scott Michel78c70a02009-02-22 23:36:09 +00001727 HI32 = LO32 = DAG.getBUILD_VECTOR(MVT::v4i32, dl, Zero, Zero,
1728 Zero, Zero);
pingbak2f387e82009-01-26 03:31:40 +00001729 }
1730
1731 for (int i = 0; i < 4; ++i) {
1732 uint64_t val = 0;
1733 for (int j = 0; j < 4; ++j) {
1734 SDValue V;
1735 bool process_upper, process_lower;
1736 val <<= 8;
1737 process_upper = (upper_special && (i & 1) == 0);
1738 process_lower = (lower_special && (i & 1) == 1);
1739
1740 if (process_upper || process_lower) {
1741 if ((process_upper && upper == 0)
1742 || (process_lower && lower == 0))
1743 val |= 0x80;
1744 else if ((process_upper && upper == 0xffffffff)
1745 || (process_lower && lower == 0xffffffff))
1746 val |= 0xc0;
1747 else if ((process_upper && upper == 0x80000000)
1748 || (process_lower && lower == 0x80000000))
1749 val |= (j == 0 ? 0xe0 : 0x80);
1750 } else
1751 val |= i * 4 + j + ((i & 1) * 16);
1752 }
1753
1754 ShufBytes.push_back(DAG.getConstant(val, MVT::i32));
1755 }
1756
Dale Johannesen913ba762009-02-06 01:31:28 +00001757 return DAG.getNode(SPUISD::SHUFB, dl, OpVT, HI32, LO32,
Scott Michel78c70a02009-02-22 23:36:09 +00001758 DAG.getBUILD_VECTOR(MVT::v4i32, dl,
1759 &ShufBytes[0], ShufBytes.size()));
pingbak2f387e82009-01-26 03:31:40 +00001760 }
1761}
1762
Scott Michel8efdca42007-12-04 22:23:35 +00001763/// LowerVECTOR_SHUFFLE - Lower a vector shuffle (V1, V2, V3) to something on
1764/// which the Cell can operate. The code inspects V3 to ascertain whether the
1765/// permutation vector, V3, is monotonically increasing with one "exception"
1766/// element, e.g., (0, 1, _, 3). If this is the case, then generate a
Scott Michel56a125e2008-11-22 23:50:42 +00001767/// SHUFFLE_MASK synthetic instruction. Otherwise, spill V3 to the constant pool.
Scott Michel8efdca42007-12-04 22:23:35 +00001768/// In either case, the net result is going to eventually invoke SHUFB to
1769/// permute/shuffle the bytes from V1 and V2.
1770/// \note
Scott Michel56a125e2008-11-22 23:50:42 +00001771/// SHUFFLE_MASK is eventually selected as one of the C*D instructions, generate
Scott Michel8efdca42007-12-04 22:23:35 +00001772/// control word for byte/halfword/word insertion. This takes care of a single
1773/// element move from V2 into V1.
1774/// \note
1775/// SPUISD::SHUFB is eventually selected as Cell's <i>shufb</i> instructions.
Dan Gohman8181bd12008-07-27 21:46:04 +00001776static SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) {
1777 SDValue V1 = Op.getOperand(0);
1778 SDValue V2 = Op.getOperand(1);
1779 SDValue PermMask = Op.getOperand(2);
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001780 DebugLoc dl = Op.getDebugLoc();
Scott Michel4ec722e2008-07-16 17:17:29 +00001781
Scott Michel8efdca42007-12-04 22:23:35 +00001782 if (V2.getOpcode() == ISD::UNDEF) V2 = V1;
Scott Michel4ec722e2008-07-16 17:17:29 +00001783
Scott Michel8efdca42007-12-04 22:23:35 +00001784 // If we have a single element being moved from V1 to V2, this can be handled
1785 // using the C*[DX] compute mask instructions, but the vector elements have
1786 // to be monotonically increasing with one exception element.
Scott Michele2641a12008-12-04 21:01:44 +00001787 MVT VecVT = V1.getValueType();
1788 MVT EltVT = VecVT.getVectorElementType();
Scott Michel8efdca42007-12-04 22:23:35 +00001789 unsigned EltsFromV2 = 0;
1790 unsigned V2Elt = 0;
1791 unsigned V2EltIdx0 = 0;
1792 unsigned CurrElt = 0;
Scott Michele2641a12008-12-04 21:01:44 +00001793 unsigned MaxElts = VecVT.getVectorNumElements();
1794 unsigned PrevElt = 0;
1795 unsigned V0Elt = 0;
Scott Michel8efdca42007-12-04 22:23:35 +00001796 bool monotonic = true;
Scott Michele2641a12008-12-04 21:01:44 +00001797 bool rotate = true;
1798
1799 if (EltVT == MVT::i8) {
Scott Michel8efdca42007-12-04 22:23:35 +00001800 V2EltIdx0 = 16;
Scott Michele2641a12008-12-04 21:01:44 +00001801 } else if (EltVT == MVT::i16) {
Scott Michel8efdca42007-12-04 22:23:35 +00001802 V2EltIdx0 = 8;
Scott Michele2641a12008-12-04 21:01:44 +00001803 } else if (EltVT == MVT::i32 || EltVT == MVT::f32) {
Scott Michel8efdca42007-12-04 22:23:35 +00001804 V2EltIdx0 = 4;
Scott Michele2641a12008-12-04 21:01:44 +00001805 } else if (EltVT == MVT::i64 || EltVT == MVT::f64) {
1806 V2EltIdx0 = 2;
1807 } else
Scott Michel8efdca42007-12-04 22:23:35 +00001808 assert(0 && "Unhandled vector type in LowerVECTOR_SHUFFLE");
1809
Scott Michele2641a12008-12-04 21:01:44 +00001810 for (unsigned i = 0; i != PermMask.getNumOperands(); ++i) {
1811 if (PermMask.getOperand(i).getOpcode() != ISD::UNDEF) {
1812 unsigned SrcElt = cast<ConstantSDNode > (PermMask.getOperand(i))->getZExtValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001813
Scott Michele2641a12008-12-04 21:01:44 +00001814 if (monotonic) {
1815 if (SrcElt >= V2EltIdx0) {
1816 if (1 >= (++EltsFromV2)) {
1817 V2Elt = (V2EltIdx0 - SrcElt) << 2;
1818 }
1819 } else if (CurrElt != SrcElt) {
1820 monotonic = false;
1821 }
1822
1823 ++CurrElt;
1824 }
1825
1826 if (rotate) {
1827 if (PrevElt > 0 && SrcElt < MaxElts) {
1828 if ((PrevElt == SrcElt - 1)
1829 || (PrevElt == MaxElts - 1 && SrcElt == 0)) {
1830 PrevElt = SrcElt;
1831 if (SrcElt == 0)
1832 V0Elt = i;
1833 } else {
1834 rotate = false;
1835 }
1836 } else if (PrevElt == 0) {
1837 // First time through, need to keep track of previous element
1838 PrevElt = SrcElt;
1839 } else {
1840 // This isn't a rotation, takes elements from vector 2
1841 rotate = false;
1842 }
1843 }
Scott Michel8efdca42007-12-04 22:23:35 +00001844 }
Scott Michel8efdca42007-12-04 22:23:35 +00001845 }
1846
1847 if (EltsFromV2 == 1 && monotonic) {
1848 // Compute mask and shuffle
1849 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner1b989192007-12-31 04:13:23 +00001850 MachineRegisterInfo &RegInfo = MF.getRegInfo();
1851 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
Duncan Sands92c43912008-06-06 12:08:01 +00001852 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel8efdca42007-12-04 22:23:35 +00001853 // Initialize temporary register to 0
Dan Gohman8181bd12008-07-27 21:46:04 +00001854 SDValue InitTempReg =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001855 DAG.getCopyToReg(DAG.getEntryNode(), dl, VReg, DAG.getConstant(0, PtrVT));
Scott Michel56a125e2008-11-22 23:50:42 +00001856 // Copy register's contents as index in SHUFFLE_MASK:
Dan Gohman8181bd12008-07-27 21:46:04 +00001857 SDValue ShufMaskOp =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001858 DAG.getNode(SPUISD::SHUFFLE_MASK, dl, MVT::v4i32,
Scott Michel5a6f17b2008-01-30 02:55:46 +00001859 DAG.getTargetConstant(V2Elt, MVT::i32),
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001860 DAG.getCopyFromReg(InitTempReg, dl, VReg, PtrVT));
Scott Michel8efdca42007-12-04 22:23:35 +00001861 // Use shuffle mask in SHUFB synthetic instruction:
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001862 return DAG.getNode(SPUISD::SHUFB, dl, V1.getValueType(), V2, V1,
1863 ShufMaskOp);
Scott Michele2641a12008-12-04 21:01:44 +00001864 } else if (rotate) {
1865 int rotamt = (MaxElts - V0Elt) * EltVT.getSizeInBits()/8;
Scott Michelae5cbf52008-12-29 03:23:36 +00001866
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001867 return DAG.getNode(SPUISD::ROTBYTES_LEFT, dl, V1.getValueType(),
Scott Michele2641a12008-12-04 21:01:44 +00001868 V1, DAG.getConstant(rotamt, MVT::i16));
Scott Michel8efdca42007-12-04 22:23:35 +00001869 } else {
Gabor Greife9f7f582008-08-31 15:37:04 +00001870 // Convert the SHUFFLE_VECTOR mask's input element units to the
1871 // actual bytes.
Duncan Sands92c43912008-06-06 12:08:01 +00001872 unsigned BytesPerElement = EltVT.getSizeInBits()/8;
Scott Michel4ec722e2008-07-16 17:17:29 +00001873
Dan Gohman8181bd12008-07-27 21:46:04 +00001874 SmallVector<SDValue, 16> ResultMask;
Scott Michel8efdca42007-12-04 22:23:35 +00001875 for (unsigned i = 0, e = PermMask.getNumOperands(); i != e; ++i) {
1876 unsigned SrcElt;
1877 if (PermMask.getOperand(i).getOpcode() == ISD::UNDEF)
Scott Michel5a6f17b2008-01-30 02:55:46 +00001878 SrcElt = 0;
Scott Michel4ec722e2008-07-16 17:17:29 +00001879 else
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001880 SrcElt = cast<ConstantSDNode>(PermMask.getOperand(i))->getZExtValue();
Scott Michel4ec722e2008-07-16 17:17:29 +00001881
Scott Michel97872d32008-02-23 18:41:37 +00001882 for (unsigned j = 0; j < BytesPerElement; ++j) {
Scott Michel5a6f17b2008-01-30 02:55:46 +00001883 ResultMask.push_back(DAG.getConstant(SrcElt*BytesPerElement+j,
1884 MVT::i8));
Scott Michel8efdca42007-12-04 22:23:35 +00001885 }
1886 }
Scott Michel4ec722e2008-07-16 17:17:29 +00001887
Scott Michel78c70a02009-02-22 23:36:09 +00001888 SDValue VPermMask = DAG.getBUILD_VECTOR(MVT::v16i8, dl,
1889 &ResultMask[0], ResultMask.size());
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00001890 return DAG.getNode(SPUISD::SHUFB, dl, V1.getValueType(), V1, V2, VPermMask);
Scott Michel8efdca42007-12-04 22:23:35 +00001891 }
1892}
1893
Dan Gohman8181bd12008-07-27 21:46:04 +00001894static SDValue LowerSCALAR_TO_VECTOR(SDValue Op, SelectionDAG &DAG) {
1895 SDValue Op0 = Op.getOperand(0); // Op0 = the scalar
Dale Johannesen913ba762009-02-06 01:31:28 +00001896 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00001897
Gabor Greif1c80d112008-08-28 21:40:38 +00001898 if (Op0.getNode()->getOpcode() == ISD::Constant) {
Scott Michel8efdca42007-12-04 22:23:35 +00001899 // For a constant, build the appropriate constant vector, which will
1900 // eventually simplify to a vector register load.
1901
Gabor Greif1c80d112008-08-28 21:40:38 +00001902 ConstantSDNode *CN = cast<ConstantSDNode>(Op0.getNode());
Dan Gohman8181bd12008-07-27 21:46:04 +00001903 SmallVector<SDValue, 16> ConstVecValues;
Duncan Sands92c43912008-06-06 12:08:01 +00001904 MVT VT;
Scott Michel8efdca42007-12-04 22:23:35 +00001905 size_t n_copies;
1906
1907 // Create a constant vector:
Duncan Sands92c43912008-06-06 12:08:01 +00001908 switch (Op.getValueType().getSimpleVT()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001909 default: assert(0 && "Unexpected constant value type in "
Scott Michel5a6f17b2008-01-30 02:55:46 +00001910 "LowerSCALAR_TO_VECTOR");
Scott Michel8efdca42007-12-04 22:23:35 +00001911 case MVT::v16i8: n_copies = 16; VT = MVT::i8; break;
1912 case MVT::v8i16: n_copies = 8; VT = MVT::i16; break;
1913 case MVT::v4i32: n_copies = 4; VT = MVT::i32; break;
1914 case MVT::v4f32: n_copies = 4; VT = MVT::f32; break;
1915 case MVT::v2i64: n_copies = 2; VT = MVT::i64; break;
1916 case MVT::v2f64: n_copies = 2; VT = MVT::f64; break;
1917 }
1918
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00001919 SDValue CValue = DAG.getConstant(CN->getZExtValue(), VT);
Scott Michel8efdca42007-12-04 22:23:35 +00001920 for (size_t j = 0; j < n_copies; ++j)
1921 ConstVecValues.push_back(CValue);
1922
Scott Michel78c70a02009-02-22 23:36:09 +00001923 return DAG.getBUILD_VECTOR(Op.getValueType(), dl,
1924 &ConstVecValues[0], ConstVecValues.size());
Scott Michel8efdca42007-12-04 22:23:35 +00001925 } else {
1926 // Otherwise, copy the value from one register to another:
Duncan Sands92c43912008-06-06 12:08:01 +00001927 switch (Op0.getValueType().getSimpleVT()) {
Scott Michel8efdca42007-12-04 22:23:35 +00001928 default: assert(0 && "Unexpected value type in LowerSCALAR_TO_VECTOR");
1929 case MVT::i8:
1930 case MVT::i16:
1931 case MVT::i32:
1932 case MVT::i64:
1933 case MVT::f32:
1934 case MVT::f64:
Dale Johannesen913ba762009-02-06 01:31:28 +00001935 return DAG.getNode(SPUISD::PREFSLOT2VEC, dl, Op.getValueType(), Op0, Op0);
Scott Michel8efdca42007-12-04 22:23:35 +00001936 }
1937 }
1938
Dan Gohman8181bd12008-07-27 21:46:04 +00001939 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001940}
1941
Dan Gohman8181bd12008-07-27 21:46:04 +00001942static SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) {
Duncan Sands92c43912008-06-06 12:08:01 +00001943 MVT VT = Op.getValueType();
Dan Gohman8181bd12008-07-27 21:46:04 +00001944 SDValue N = Op.getOperand(0);
1945 SDValue Elt = Op.getOperand(1);
Dale Johannesen913ba762009-02-06 01:31:28 +00001946 DebugLoc dl = Op.getDebugLoc();
Scott Michel56a125e2008-11-22 23:50:42 +00001947 SDValue retval;
Scott Michel8efdca42007-12-04 22:23:35 +00001948
Scott Michel56a125e2008-11-22 23:50:42 +00001949 if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Elt)) {
1950 // Constant argument:
1951 int EltNo = (int) C->getZExtValue();
Scott Michel8efdca42007-12-04 22:23:35 +00001952
Scott Michel56a125e2008-11-22 23:50:42 +00001953 // sanity checks:
1954 if (VT == MVT::i8 && EltNo >= 16)
1955 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i8 extraction slot > 15");
1956 else if (VT == MVT::i16 && EltNo >= 8)
1957 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i16 extraction slot > 7");
1958 else if (VT == MVT::i32 && EltNo >= 4)
1959 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i32 extraction slot > 4");
1960 else if (VT == MVT::i64 && EltNo >= 2)
1961 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i64 extraction slot > 2");
Scott Michel8efdca42007-12-04 22:23:35 +00001962
Scott Michel56a125e2008-11-22 23:50:42 +00001963 if (EltNo == 0 && (VT == MVT::i32 || VT == MVT::i64)) {
1964 // i32 and i64: Element 0 is the preferred slot
Dale Johannesen913ba762009-02-06 01:31:28 +00001965 return DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT, N);
Scott Michel56a125e2008-11-22 23:50:42 +00001966 }
Scott Michel8efdca42007-12-04 22:23:35 +00001967
Scott Michel56a125e2008-11-22 23:50:42 +00001968 // Need to generate shuffle mask and extract:
1969 int prefslot_begin = -1, prefslot_end = -1;
1970 int elt_byte = EltNo * VT.getSizeInBits() / 8;
1971
1972 switch (VT.getSimpleVT()) {
1973 default:
1974 assert(false && "Invalid value type!");
1975 case MVT::i8: {
1976 prefslot_begin = prefslot_end = 3;
1977 break;
1978 }
1979 case MVT::i16: {
1980 prefslot_begin = 2; prefslot_end = 3;
1981 break;
1982 }
1983 case MVT::i32:
1984 case MVT::f32: {
1985 prefslot_begin = 0; prefslot_end = 3;
1986 break;
1987 }
1988 case MVT::i64:
1989 case MVT::f64: {
1990 prefslot_begin = 0; prefslot_end = 7;
1991 break;
1992 }
1993 }
1994
1995 assert(prefslot_begin != -1 && prefslot_end != -1 &&
1996 "LowerEXTRACT_VECTOR_ELT: preferred slots uninitialized");
1997
1998 unsigned int ShufBytes[16];
1999 for (int i = 0; i < 16; ++i) {
2000 // zero fill uppper part of preferred slot, don't care about the
2001 // other slots:
2002 unsigned int mask_val;
2003 if (i <= prefslot_end) {
2004 mask_val =
2005 ((i < prefslot_begin)
2006 ? 0x80
2007 : elt_byte + (i - prefslot_begin));
2008
2009 ShufBytes[i] = mask_val;
2010 } else
2011 ShufBytes[i] = ShufBytes[i % (prefslot_end + 1)];
2012 }
2013
2014 SDValue ShufMask[4];
2015 for (unsigned i = 0; i < sizeof(ShufMask)/sizeof(ShufMask[0]); ++i) {
Scott Michele2641a12008-12-04 21:01:44 +00002016 unsigned bidx = i * 4;
Scott Michel56a125e2008-11-22 23:50:42 +00002017 unsigned int bits = ((ShufBytes[bidx] << 24) |
2018 (ShufBytes[bidx+1] << 16) |
2019 (ShufBytes[bidx+2] << 8) |
2020 ShufBytes[bidx+3]);
2021 ShufMask[i] = DAG.getConstant(bits, MVT::i32);
2022 }
2023
Scott Michel78c70a02009-02-22 23:36:09 +00002024 SDValue ShufMaskVec =
2025 DAG.getBUILD_VECTOR(MVT::v4i32, dl,
2026 &ShufMask[0], sizeof(ShufMask)/sizeof(ShufMask[0]));
Scott Michel56a125e2008-11-22 23:50:42 +00002027
Dale Johannesen913ba762009-02-06 01:31:28 +00002028 retval = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT,
2029 DAG.getNode(SPUISD::SHUFB, dl, N.getValueType(),
Scott Michel56a125e2008-11-22 23:50:42 +00002030 N, N, ShufMaskVec));
2031 } else {
2032 // Variable index: Rotate the requested element into slot 0, then replicate
2033 // slot 0 across the vector
2034 MVT VecVT = N.getValueType();
2035 if (!VecVT.isSimple() || !VecVT.isVector() || !VecVT.is128BitVector()) {
2036 cerr << "LowerEXTRACT_VECTOR_ELT: Must have a simple, 128-bit vector type!\n";
2037 abort();
2038 }
2039
2040 // Make life easier by making sure the index is zero-extended to i32
2041 if (Elt.getValueType() != MVT::i32)
Dale Johannesen913ba762009-02-06 01:31:28 +00002042 Elt = DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i32, Elt);
Scott Michel56a125e2008-11-22 23:50:42 +00002043
2044 // Scale the index to a bit/byte shift quantity
2045 APInt scaleFactor =
Scott Michelc630c412008-11-24 17:11:17 +00002046 APInt(32, uint64_t(16 / N.getValueType().getVectorNumElements()), false);
2047 unsigned scaleShift = scaleFactor.logBase2();
Scott Michel56a125e2008-11-22 23:50:42 +00002048 SDValue vecShift;
Scott Michel56a125e2008-11-22 23:50:42 +00002049
Scott Michelc630c412008-11-24 17:11:17 +00002050 if (scaleShift > 0) {
2051 // Scale the shift factor:
Dale Johannesen913ba762009-02-06 01:31:28 +00002052 Elt = DAG.getNode(ISD::SHL, dl, MVT::i32, Elt,
Scott Michel0718cd82008-12-01 17:56:02 +00002053 DAG.getConstant(scaleShift, MVT::i32));
Scott Michel56a125e2008-11-22 23:50:42 +00002054 }
2055
Dale Johannesen913ba762009-02-06 01:31:28 +00002056 vecShift = DAG.getNode(SPUISD::SHLQUAD_L_BYTES, dl, VecVT, N, Elt);
Scott Michelc630c412008-11-24 17:11:17 +00002057
2058 // Replicate the bytes starting at byte 0 across the entire vector (for
2059 // consistency with the notion of a unified register set)
Scott Michel56a125e2008-11-22 23:50:42 +00002060 SDValue replicate;
2061
2062 switch (VT.getSimpleVT()) {
2063 default:
2064 cerr << "LowerEXTRACT_VECTOR_ELT(varable): Unhandled vector type\n";
2065 abort();
2066 /*NOTREACHED*/
2067 case MVT::i8: {
Scott Michelc630c412008-11-24 17:11:17 +00002068 SDValue factor = DAG.getConstant(0x00000000, MVT::i32);
Scott Michel78c70a02009-02-22 23:36:09 +00002069 replicate = DAG.getBUILD_VECTOR(MVT::v4i32, dl, factor, factor,
2070 factor, factor);
Scott Michel56a125e2008-11-22 23:50:42 +00002071 break;
2072 }
2073 case MVT::i16: {
Scott Michelc630c412008-11-24 17:11:17 +00002074 SDValue factor = DAG.getConstant(0x00010001, MVT::i32);
Scott Michel78c70a02009-02-22 23:36:09 +00002075 replicate = DAG.getBUILD_VECTOR(MVT::v4i32, dl, factor, factor,
2076 factor, factor);
Scott Michel56a125e2008-11-22 23:50:42 +00002077 break;
2078 }
2079 case MVT::i32:
2080 case MVT::f32: {
2081 SDValue factor = DAG.getConstant(0x00010203, MVT::i32);
Scott Michel78c70a02009-02-22 23:36:09 +00002082 replicate = DAG.getBUILD_VECTOR(MVT::v4i32, dl, factor, factor,
2083 factor, factor);
Scott Michel56a125e2008-11-22 23:50:42 +00002084 break;
2085 }
2086 case MVT::i64:
2087 case MVT::f64: {
2088 SDValue loFactor = DAG.getConstant(0x00010203, MVT::i32);
2089 SDValue hiFactor = DAG.getConstant(0x04050607, MVT::i32);
Scott Michel78c70a02009-02-22 23:36:09 +00002090 replicate = DAG.getBUILD_VECTOR(MVT::v4i32, dl,
2091 loFactor, hiFactor, loFactor, hiFactor);
Scott Michel56a125e2008-11-22 23:50:42 +00002092 break;
2093 }
2094 }
2095
Dale Johannesen913ba762009-02-06 01:31:28 +00002096 retval = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT,
2097 DAG.getNode(SPUISD::SHUFB, dl, VecVT,
Scott Michel0718cd82008-12-01 17:56:02 +00002098 vecShift, vecShift, replicate));
Scott Michel8efdca42007-12-04 22:23:35 +00002099 }
2100
Scott Michel56a125e2008-11-22 23:50:42 +00002101 return retval;
Scott Michel8efdca42007-12-04 22:23:35 +00002102}
2103
Dan Gohman8181bd12008-07-27 21:46:04 +00002104static SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) {
2105 SDValue VecOp = Op.getOperand(0);
2106 SDValue ValOp = Op.getOperand(1);
2107 SDValue IdxOp = Op.getOperand(2);
Dale Johannesen913ba762009-02-06 01:31:28 +00002108 DebugLoc dl = Op.getDebugLoc();
Duncan Sands92c43912008-06-06 12:08:01 +00002109 MVT VT = Op.getValueType();
Scott Michel8efdca42007-12-04 22:23:35 +00002110
2111 ConstantSDNode *CN = cast<ConstantSDNode>(IdxOp);
2112 assert(CN != 0 && "LowerINSERT_VECTOR_ELT: Index is not constant!");
2113
Duncan Sands92c43912008-06-06 12:08:01 +00002114 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel0718cd82008-12-01 17:56:02 +00002115 // Use $sp ($1) because it's always 16-byte aligned and it's available:
Dale Johannesen913ba762009-02-06 01:31:28 +00002116 SDValue Pointer = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michel0718cd82008-12-01 17:56:02 +00002117 DAG.getRegister(SPU::R1, PtrVT),
2118 DAG.getConstant(CN->getSExtValue(), PtrVT));
Dale Johannesen913ba762009-02-06 01:31:28 +00002119 SDValue ShufMask = DAG.getNode(SPUISD::SHUFFLE_MASK, dl, VT, Pointer);
Scott Michel8efdca42007-12-04 22:23:35 +00002120
Dan Gohman8181bd12008-07-27 21:46:04 +00002121 SDValue result =
Dale Johannesen913ba762009-02-06 01:31:28 +00002122 DAG.getNode(SPUISD::SHUFB, dl, VT,
2123 DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, VT, ValOp),
Scott Michelae5cbf52008-12-29 03:23:36 +00002124 VecOp,
Dale Johannesen913ba762009-02-06 01:31:28 +00002125 DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v4i32, ShufMask));
Scott Michel8efdca42007-12-04 22:23:35 +00002126
2127 return result;
2128}
2129
Scott Michel06eabde2008-12-27 04:51:36 +00002130static SDValue LowerI8Math(SDValue Op, SelectionDAG &DAG, unsigned Opc,
2131 const TargetLowering &TLI)
Scott Michel97872d32008-02-23 18:41:37 +00002132{
Dan Gohman8181bd12008-07-27 21:46:04 +00002133 SDValue N0 = Op.getOperand(0); // Everything has at least one operand
Dale Johannesen913ba762009-02-06 01:31:28 +00002134 DebugLoc dl = Op.getDebugLoc();
Scott Michel06eabde2008-12-27 04:51:36 +00002135 MVT ShiftVT = TLI.getShiftAmountTy();
Scott Michel8efdca42007-12-04 22:23:35 +00002136
2137 assert(Op.getValueType() == MVT::i8);
2138 switch (Opc) {
2139 default:
2140 assert(0 && "Unhandled i8 math operator");
2141 /*NOTREACHED*/
2142 break;
Scott Michel4d07fb72008-12-30 23:28:25 +00002143 case ISD::ADD: {
2144 // 8-bit addition: Promote the arguments up to 16-bits and truncate
2145 // the result:
2146 SDValue N1 = Op.getOperand(1);
Dale Johannesen913ba762009-02-06 01:31:28 +00002147 N0 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0);
2148 N1 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N1);
2149 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2150 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel4d07fb72008-12-30 23:28:25 +00002151
2152 }
2153
Scott Michel8efdca42007-12-04 22:23:35 +00002154 case ISD::SUB: {
2155 // 8-bit subtraction: Promote the arguments up to 16-bits and truncate
2156 // the result:
Dan Gohman8181bd12008-07-27 21:46:04 +00002157 SDValue N1 = Op.getOperand(1);
Dale Johannesen913ba762009-02-06 01:31:28 +00002158 N0 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0);
2159 N1 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N1);
2160 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2161 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel4ec722e2008-07-16 17:17:29 +00002162 }
Scott Michel8efdca42007-12-04 22:23:35 +00002163 case ISD::ROTR:
2164 case ISD::ROTL: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002165 SDValue N1 = Op.getOperand(1);
Scott Michel8efdca42007-12-04 22:23:35 +00002166 unsigned N1Opc;
2167 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002168 ? DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i16, N0)
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002169 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
2170 MVT::i16));
Scott Michel06eabde2008-12-27 04:51:36 +00002171 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greife9f7f582008-08-31 15:37:04 +00002172 ? ISD::ZERO_EXTEND
2173 : ISD::TRUNCATE;
Scott Michel8efdca42007-12-04 22:23:35 +00002174 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002175 ? DAG.getNode(N1Opc, dl, ShiftVT, N1)
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002176 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(),
Scott Michel06eabde2008-12-27 04:51:36 +00002177 TLI.getShiftAmountTy()));
Dan Gohman8181bd12008-07-27 21:46:04 +00002178 SDValue ExpandArg =
Dale Johannesen913ba762009-02-06 01:31:28 +00002179 DAG.getNode(ISD::OR, dl, MVT::i16, N0,
2180 DAG.getNode(ISD::SHL, dl, MVT::i16,
Duncan Sands7aef60d2008-10-30 19:24:28 +00002181 N0, DAG.getConstant(8, MVT::i32)));
Dale Johannesen913ba762009-02-06 01:31:28 +00002182 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2183 DAG.getNode(Opc, dl, MVT::i16, ExpandArg, N1));
Scott Michel8efdca42007-12-04 22:23:35 +00002184 }
2185 case ISD::SRL:
2186 case ISD::SHL: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002187 SDValue N1 = Op.getOperand(1);
Scott Michel8efdca42007-12-04 22:23:35 +00002188 unsigned N1Opc;
2189 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002190 ? DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i16, N0)
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002191 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
Scott Michel06eabde2008-12-27 04:51:36 +00002192 MVT::i32));
2193 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greife9f7f582008-08-31 15:37:04 +00002194 ? ISD::ZERO_EXTEND
2195 : ISD::TRUNCATE;
Scott Michel8efdca42007-12-04 22:23:35 +00002196 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002197 ? DAG.getNode(N1Opc, dl, ShiftVT, N1)
Scott Michel06eabde2008-12-27 04:51:36 +00002198 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(), ShiftVT));
Dale Johannesen913ba762009-02-06 01:31:28 +00002199 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2200 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel8efdca42007-12-04 22:23:35 +00002201 }
2202 case ISD::SRA: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002203 SDValue N1 = Op.getOperand(1);
Scott Michel8efdca42007-12-04 22:23:35 +00002204 unsigned N1Opc;
2205 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002206 ? DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0)
Scott Michel06eabde2008-12-27 04:51:36 +00002207 : DAG.getConstant(cast<ConstantSDNode>(N0)->getSExtValue(),
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002208 MVT::i16));
Scott Michel06eabde2008-12-27 04:51:36 +00002209 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greife9f7f582008-08-31 15:37:04 +00002210 ? ISD::SIGN_EXTEND
2211 : ISD::TRUNCATE;
Scott Michel8efdca42007-12-04 22:23:35 +00002212 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002213 ? DAG.getNode(N1Opc, dl, ShiftVT, N1)
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002214 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(),
Scott Michel06eabde2008-12-27 04:51:36 +00002215 ShiftVT));
Dale Johannesen913ba762009-02-06 01:31:28 +00002216 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2217 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel8efdca42007-12-04 22:23:35 +00002218 }
2219 case ISD::MUL: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002220 SDValue N1 = Op.getOperand(1);
Scott Michel8efdca42007-12-04 22:23:35 +00002221 unsigned N1Opc;
2222 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002223 ? DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0)
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002224 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
2225 MVT::i16));
Duncan Sandsec142ee2008-06-08 20:54:56 +00002226 N1Opc = N1.getValueType().bitsLT(MVT::i16) ? ISD::SIGN_EXTEND : ISD::TRUNCATE;
Scott Michel8efdca42007-12-04 22:23:35 +00002227 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesen913ba762009-02-06 01:31:28 +00002228 ? DAG.getNode(N1Opc, dl, MVT::i16, N1)
Scott Michel06eabde2008-12-27 04:51:36 +00002229 : DAG.getConstant(cast<ConstantSDNode>(N1)->getSExtValue(),
Dan Gohmanfaeb4a32008-09-12 16:56:44 +00002230 MVT::i16));
Dale Johannesen913ba762009-02-06 01:31:28 +00002231 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2232 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel8efdca42007-12-04 22:23:35 +00002233 break;
2234 }
2235 }
2236
Dan Gohman8181bd12008-07-27 21:46:04 +00002237 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00002238}
2239
Scott Michel750b93f2009-01-15 04:41:47 +00002240//! Generate the carry-generate shuffle mask.
Dale Johannesen913ba762009-02-06 01:31:28 +00002241SDValue SPU::getCarryGenerateShufMask(SelectionDAG &DAG, DebugLoc dl) {
Scott Michel8c67fa42009-01-21 04:58:48 +00002242 SmallVector<SDValue, 16 > ShufBytes;
Scott Michel97872d32008-02-23 18:41:37 +00002243
Scott Michel8c67fa42009-01-21 04:58:48 +00002244 // Create the shuffle mask for "rotating" the borrow up one register slot
2245 // once the borrow is generated.
2246 ShufBytes.push_back(DAG.getConstant(0x04050607, MVT::i32));
2247 ShufBytes.push_back(DAG.getConstant(0x80808080, MVT::i32));
2248 ShufBytes.push_back(DAG.getConstant(0x0c0d0e0f, MVT::i32));
2249 ShufBytes.push_back(DAG.getConstant(0x80808080, MVT::i32));
Scott Michel97872d32008-02-23 18:41:37 +00002250
Scott Michel78c70a02009-02-22 23:36:09 +00002251 return DAG.getBUILD_VECTOR(MVT::v4i32, dl,
2252 &ShufBytes[0], ShufBytes.size());
Scott Michel750b93f2009-01-15 04:41:47 +00002253}
Scott Michel97872d32008-02-23 18:41:37 +00002254
Scott Michel750b93f2009-01-15 04:41:47 +00002255//! Generate the borrow-generate shuffle mask
Dale Johannesen913ba762009-02-06 01:31:28 +00002256SDValue SPU::getBorrowGenerateShufMask(SelectionDAG &DAG, DebugLoc dl) {
Scott Michel8c67fa42009-01-21 04:58:48 +00002257 SmallVector<SDValue, 16 > ShufBytes;
Scott Michel97872d32008-02-23 18:41:37 +00002258
Scott Michel8c67fa42009-01-21 04:58:48 +00002259 // Create the shuffle mask for "rotating" the borrow up one register slot
2260 // once the borrow is generated.
2261 ShufBytes.push_back(DAG.getConstant(0x04050607, MVT::i32));
2262 ShufBytes.push_back(DAG.getConstant(0xc0c0c0c0, MVT::i32));
2263 ShufBytes.push_back(DAG.getConstant(0x0c0d0e0f, MVT::i32));
2264 ShufBytes.push_back(DAG.getConstant(0xc0c0c0c0, MVT::i32));
Scott Michelf2df6cb2008-11-24 18:20:46 +00002265
Scott Michel78c70a02009-02-22 23:36:09 +00002266 return DAG.getBUILD_VECTOR(MVT::v4i32, dl,
2267 &ShufBytes[0], ShufBytes.size());
Scott Michel97872d32008-02-23 18:41:37 +00002268}
2269
Scott Michel8efdca42007-12-04 22:23:35 +00002270//! Lower byte immediate operations for v16i8 vectors:
Dan Gohman8181bd12008-07-27 21:46:04 +00002271static SDValue
2272LowerByteImmed(SDValue Op, SelectionDAG &DAG) {
2273 SDValue ConstVec;
2274 SDValue Arg;
Duncan Sands92c43912008-06-06 12:08:01 +00002275 MVT VT = Op.getValueType();
Dale Johannesen913ba762009-02-06 01:31:28 +00002276 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00002277
2278 ConstVec = Op.getOperand(0);
2279 Arg = Op.getOperand(1);
Gabor Greif1c80d112008-08-28 21:40:38 +00002280 if (ConstVec.getNode()->getOpcode() != ISD::BUILD_VECTOR) {
2281 if (ConstVec.getNode()->getOpcode() == ISD::BIT_CONVERT) {
Scott Michel8efdca42007-12-04 22:23:35 +00002282 ConstVec = ConstVec.getOperand(0);
2283 } else {
2284 ConstVec = Op.getOperand(1);
2285 Arg = Op.getOperand(0);
Gabor Greif1c80d112008-08-28 21:40:38 +00002286 if (ConstVec.getNode()->getOpcode() == ISD::BIT_CONVERT) {
Scott Michel5a6f17b2008-01-30 02:55:46 +00002287 ConstVec = ConstVec.getOperand(0);
Scott Michel8efdca42007-12-04 22:23:35 +00002288 }
2289 }
2290 }
2291
Gabor Greif1c80d112008-08-28 21:40:38 +00002292 if (ConstVec.getNode()->getOpcode() == ISD::BUILD_VECTOR) {
Scott Michel8efdca42007-12-04 22:23:35 +00002293 uint64_t VectorBits[2];
2294 uint64_t UndefBits[2];
2295 uint64_t SplatBits, SplatUndef;
2296 int SplatSize;
2297
Gabor Greif1c80d112008-08-28 21:40:38 +00002298 if (!GetConstantBuildVectorBits(ConstVec.getNode(), VectorBits, UndefBits)
Scott Michel5a6f17b2008-01-30 02:55:46 +00002299 && isConstantSplat(VectorBits, UndefBits,
Duncan Sands92c43912008-06-06 12:08:01 +00002300 VT.getVectorElementType().getSizeInBits(),
Scott Michel5a6f17b2008-01-30 02:55:46 +00002301 SplatBits, SplatUndef, SplatSize)) {
Dan Gohman8181bd12008-07-27 21:46:04 +00002302 SDValue tcVec[16];
2303 SDValue tc = DAG.getTargetConstant(SplatBits & 0xff, MVT::i8);
Scott Michel8efdca42007-12-04 22:23:35 +00002304 const size_t tcVecSize = sizeof(tcVec) / sizeof(tcVec[0]);
2305
2306 // Turn the BUILD_VECTOR into a set of target constants:
2307 for (size_t i = 0; i < tcVecSize; ++i)
Scott Michel5a6f17b2008-01-30 02:55:46 +00002308 tcVec[i] = tc;
Scott Michel8efdca42007-12-04 22:23:35 +00002309
Dale Johannesen913ba762009-02-06 01:31:28 +00002310 return DAG.getNode(Op.getNode()->getOpcode(), dl, VT, Arg,
Scott Michel78c70a02009-02-22 23:36:09 +00002311 DAG.getBUILD_VECTOR(VT, dl, tcVec, tcVecSize));
Scott Michel8efdca42007-12-04 22:23:35 +00002312 }
2313 }
Scott Michelc899a122009-01-26 22:33:37 +00002314
Nate Begeman7569e762008-07-29 19:07:27 +00002315 // These operations (AND, OR, XOR) are legal, they just couldn't be custom
2316 // lowered. Return the operation, rather than a null SDValue.
2317 return Op;
Scott Michel8efdca42007-12-04 22:23:35 +00002318}
2319
Scott Michel8efdca42007-12-04 22:23:35 +00002320//! Custom lowering for CTPOP (count population)
2321/*!
2322 Custom lowering code that counts the number ones in the input
2323 operand. SPU has such an instruction, but it counts the number of
2324 ones per byte, which then have to be accumulated.
2325*/
Dan Gohman8181bd12008-07-27 21:46:04 +00002326static SDValue LowerCTPOP(SDValue Op, SelectionDAG &DAG) {
Duncan Sands92c43912008-06-06 12:08:01 +00002327 MVT VT = Op.getValueType();
2328 MVT vecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits()));
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002329 DebugLoc dl = Op.getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00002330
Duncan Sands92c43912008-06-06 12:08:01 +00002331 switch (VT.getSimpleVT()) {
2332 default:
2333 assert(false && "Invalid value type!");
Scott Michel8efdca42007-12-04 22:23:35 +00002334 case MVT::i8: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002335 SDValue N = Op.getOperand(0);
2336 SDValue Elt0 = DAG.getConstant(0, MVT::i32);
Scott Michel8efdca42007-12-04 22:23:35 +00002337
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002338 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N);
2339 SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote);
Scott Michel8efdca42007-12-04 22:23:35 +00002340
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002341 return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i8, CNTB, Elt0);
Scott Michel8efdca42007-12-04 22:23:35 +00002342 }
2343
2344 case MVT::i16: {
2345 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner1b989192007-12-31 04:13:23 +00002346 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Michel8efdca42007-12-04 22:23:35 +00002347
Chris Lattner1b989192007-12-31 04:13:23 +00002348 unsigned CNTB_reg = RegInfo.createVirtualRegister(&SPU::R16CRegClass);
Scott Michel8efdca42007-12-04 22:23:35 +00002349
Dan Gohman8181bd12008-07-27 21:46:04 +00002350 SDValue N = Op.getOperand(0);
2351 SDValue Elt0 = DAG.getConstant(0, MVT::i16);
2352 SDValue Mask0 = DAG.getConstant(0x0f, MVT::i16);
Duncan Sands7aef60d2008-10-30 19:24:28 +00002353 SDValue Shift1 = DAG.getConstant(8, MVT::i32);
Scott Michel8efdca42007-12-04 22:23:35 +00002354
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002355 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N);
2356 SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote);
Scott Michel8efdca42007-12-04 22:23:35 +00002357
2358 // CNTB_result becomes the chain to which all of the virtual registers
2359 // CNTB_reg, SUM1_reg become associated:
Dan Gohman8181bd12008-07-27 21:46:04 +00002360 SDValue CNTB_result =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002361 DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i16, CNTB, Elt0);
Scott Michel4ec722e2008-07-16 17:17:29 +00002362
Dan Gohman8181bd12008-07-27 21:46:04 +00002363 SDValue CNTB_rescopy =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002364 DAG.getCopyToReg(CNTB_result, dl, CNTB_reg, CNTB_result);
Scott Michel8efdca42007-12-04 22:23:35 +00002365
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002366 SDValue Tmp1 = DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i16);
Scott Michel8efdca42007-12-04 22:23:35 +00002367
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002368 return DAG.getNode(ISD::AND, dl, MVT::i16,
2369 DAG.getNode(ISD::ADD, dl, MVT::i16,
2370 DAG.getNode(ISD::SRL, dl, MVT::i16,
Scott Michel5a6f17b2008-01-30 02:55:46 +00002371 Tmp1, Shift1),
2372 Tmp1),
2373 Mask0);
Scott Michel8efdca42007-12-04 22:23:35 +00002374 }
2375
2376 case MVT::i32: {
2377 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner1b989192007-12-31 04:13:23 +00002378 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Michel8efdca42007-12-04 22:23:35 +00002379
Chris Lattner1b989192007-12-31 04:13:23 +00002380 unsigned CNTB_reg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
2381 unsigned SUM1_reg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
Scott Michel8efdca42007-12-04 22:23:35 +00002382
Dan Gohman8181bd12008-07-27 21:46:04 +00002383 SDValue N = Op.getOperand(0);
2384 SDValue Elt0 = DAG.getConstant(0, MVT::i32);
2385 SDValue Mask0 = DAG.getConstant(0xff, MVT::i32);
2386 SDValue Shift1 = DAG.getConstant(16, MVT::i32);
2387 SDValue Shift2 = DAG.getConstant(8, MVT::i32);
Scott Michel8efdca42007-12-04 22:23:35 +00002388
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002389 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N);
2390 SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote);
Scott Michel8efdca42007-12-04 22:23:35 +00002391
2392 // CNTB_result becomes the chain to which all of the virtual registers
2393 // CNTB_reg, SUM1_reg become associated:
Dan Gohman8181bd12008-07-27 21:46:04 +00002394 SDValue CNTB_result =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002395 DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i32, CNTB, Elt0);
Scott Michel4ec722e2008-07-16 17:17:29 +00002396
Dan Gohman8181bd12008-07-27 21:46:04 +00002397 SDValue CNTB_rescopy =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002398 DAG.getCopyToReg(CNTB_result, dl, CNTB_reg, CNTB_result);
Scott Michel8efdca42007-12-04 22:23:35 +00002399
Dan Gohman8181bd12008-07-27 21:46:04 +00002400 SDValue Comp1 =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002401 DAG.getNode(ISD::SRL, dl, MVT::i32,
2402 DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i32),
2403 Shift1);
Scott Michel8efdca42007-12-04 22:23:35 +00002404
Dan Gohman8181bd12008-07-27 21:46:04 +00002405 SDValue Sum1 =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002406 DAG.getNode(ISD::ADD, dl, MVT::i32, Comp1,
2407 DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i32));
Scott Michel8efdca42007-12-04 22:23:35 +00002408
Dan Gohman8181bd12008-07-27 21:46:04 +00002409 SDValue Sum1_rescopy =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002410 DAG.getCopyToReg(CNTB_result, dl, SUM1_reg, Sum1);
Scott Michel8efdca42007-12-04 22:23:35 +00002411
Dan Gohman8181bd12008-07-27 21:46:04 +00002412 SDValue Comp2 =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002413 DAG.getNode(ISD::SRL, dl, MVT::i32,
2414 DAG.getCopyFromReg(Sum1_rescopy, dl, SUM1_reg, MVT::i32),
Scott Michel5a6f17b2008-01-30 02:55:46 +00002415 Shift2);
Dan Gohman8181bd12008-07-27 21:46:04 +00002416 SDValue Sum2 =
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002417 DAG.getNode(ISD::ADD, dl, MVT::i32, Comp2,
2418 DAG.getCopyFromReg(Sum1_rescopy, dl, SUM1_reg, MVT::i32));
Scott Michel8efdca42007-12-04 22:23:35 +00002419
Dale Johannesenb03cc3f2009-02-04 23:02:30 +00002420 return DAG.getNode(ISD::AND, dl, MVT::i32, Sum2, Mask0);
Scott Michel8efdca42007-12-04 22:23:35 +00002421 }
2422
2423 case MVT::i64:
2424 break;
2425 }
2426
Dan Gohman8181bd12008-07-27 21:46:04 +00002427 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00002428}
2429
pingbak2f387e82009-01-26 03:31:40 +00002430//! Lower ISD::FP_TO_SINT, ISD::FP_TO_UINT for i32
Scott Michel8c67fa42009-01-21 04:58:48 +00002431/*!
pingbak2f387e82009-01-26 03:31:40 +00002432 f32->i32 passes through unchanged, whereas f64->i32 expands to a libcall.
2433 All conversions to i64 are expanded to a libcall.
Scott Michel8c67fa42009-01-21 04:58:48 +00002434 */
pingbak2f387e82009-01-26 03:31:40 +00002435static SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG,
2436 SPUTargetLowering &TLI) {
Scott Michel8c67fa42009-01-21 04:58:48 +00002437 MVT OpVT = Op.getValueType();
Scott Michel8c67fa42009-01-21 04:58:48 +00002438 SDValue Op0 = Op.getOperand(0);
pingbak2f387e82009-01-26 03:31:40 +00002439 MVT Op0VT = Op0.getValueType();
Scott Michel8c67fa42009-01-21 04:58:48 +00002440
pingbak2f387e82009-01-26 03:31:40 +00002441 if ((OpVT == MVT::i32 && Op0VT == MVT::f64)
2442 || OpVT == MVT::i64) {
2443 // Convert f32 / f64 to i32 / i64 via libcall.
2444 RTLIB::Libcall LC =
2445 (Op.getOpcode() == ISD::FP_TO_SINT)
2446 ? RTLIB::getFPTOSINT(Op0VT, OpVT)
2447 : RTLIB::getFPTOUINT(Op0VT, OpVT);
2448 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unexpectd fp-to-int conversion!");
2449 SDValue Dummy;
2450 return ExpandLibCall(LC, Op, DAG, false, Dummy, TLI);
2451 }
Scott Michel8c67fa42009-01-21 04:58:48 +00002452
Scott Michelc899a122009-01-26 22:33:37 +00002453 return Op; // return unmolested, legalized op
pingbak2f387e82009-01-26 03:31:40 +00002454}
Scott Michel8c67fa42009-01-21 04:58:48 +00002455
pingbak2f387e82009-01-26 03:31:40 +00002456//! Lower ISD::SINT_TO_FP, ISD::UINT_TO_FP for i32
2457/*!
2458 i32->f32 passes through unchanged, whereas i32->f64 is expanded to a libcall.
2459 All conversions from i64 are expanded to a libcall.
2460 */
2461static SDValue LowerINT_TO_FP(SDValue Op, SelectionDAG &DAG,
2462 SPUTargetLowering &TLI) {
2463 MVT OpVT = Op.getValueType();
2464 SDValue Op0 = Op.getOperand(0);
2465 MVT Op0VT = Op0.getValueType();
2466
2467 if ((OpVT == MVT::f64 && Op0VT == MVT::i32)
2468 || Op0VT == MVT::i64) {
2469 // Convert i32, i64 to f64 via libcall:
2470 RTLIB::Libcall LC =
2471 (Op.getOpcode() == ISD::SINT_TO_FP)
2472 ? RTLIB::getSINTTOFP(Op0VT, OpVT)
2473 : RTLIB::getUINTTOFP(Op0VT, OpVT);
2474 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unexpectd int-to-fp conversion!");
2475 SDValue Dummy;
2476 return ExpandLibCall(LC, Op, DAG, false, Dummy, TLI);
2477 }
2478
Scott Michelc899a122009-01-26 22:33:37 +00002479 return Op; // return unmolested, legalized
Scott Michel8c67fa42009-01-21 04:58:48 +00002480}
2481
2482//! Lower ISD::SETCC
2483/*!
2484 This handles MVT::f64 (double floating point) condition lowering
2485 */
Scott Michel8c67fa42009-01-21 04:58:48 +00002486static SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG,
2487 const TargetLowering &TLI) {
pingbak2f387e82009-01-26 03:31:40 +00002488 CondCodeSDNode *CC = dyn_cast<CondCodeSDNode>(Op.getOperand(2));
Dale Johannesen2dbdb0e2009-02-07 19:59:05 +00002489 DebugLoc dl = Op.getDebugLoc();
pingbak2f387e82009-01-26 03:31:40 +00002490 assert(CC != 0 && "LowerSETCC: CondCodeSDNode should not be null here!\n");
2491
Scott Michel8c67fa42009-01-21 04:58:48 +00002492 SDValue lhs = Op.getOperand(0);
2493 SDValue rhs = Op.getOperand(1);
Scott Michel8c67fa42009-01-21 04:58:48 +00002494 MVT lhsVT = lhs.getValueType();
Scott Michel8c67fa42009-01-21 04:58:48 +00002495 assert(lhsVT == MVT::f64 && "LowerSETCC: type other than MVT::64\n");
2496
pingbak2f387e82009-01-26 03:31:40 +00002497 MVT ccResultVT = TLI.getSetCCResultType(lhs.getValueType());
2498 APInt ccResultOnes = APInt::getAllOnesValue(ccResultVT.getSizeInBits());
2499 MVT IntVT(MVT::i64);
2500
2501 // Take advantage of the fact that (truncate (sra arg, 32)) is efficiently
2502 // selected to a NOP:
Dale Johannesen85fc0932009-02-04 01:48:28 +00002503 SDValue i64lhs = DAG.getNode(ISD::BIT_CONVERT, dl, IntVT, lhs);
pingbak2f387e82009-01-26 03:31:40 +00002504 SDValue lhsHi32 =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002505 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32,
2506 DAG.getNode(ISD::SRL, dl, IntVT,
pingbak2f387e82009-01-26 03:31:40 +00002507 i64lhs, DAG.getConstant(32, MVT::i32)));
2508 SDValue lhsHi32abs =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002509 DAG.getNode(ISD::AND, dl, MVT::i32,
pingbak2f387e82009-01-26 03:31:40 +00002510 lhsHi32, DAG.getConstant(0x7fffffff, MVT::i32));
2511 SDValue lhsLo32 =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002512 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, i64lhs);
pingbak2f387e82009-01-26 03:31:40 +00002513
2514 // SETO and SETUO only use the lhs operand:
2515 if (CC->get() == ISD::SETO) {
2516 // Evaluates to true if Op0 is not [SQ]NaN - lowers to the inverse of
2517 // SETUO
2518 APInt ccResultAllOnes = APInt::getAllOnesValue(ccResultVT.getSizeInBits());
Dale Johannesen85fc0932009-02-04 01:48:28 +00002519 return DAG.getNode(ISD::XOR, dl, ccResultVT,
2520 DAG.getSetCC(dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002521 lhs, DAG.getConstantFP(0.0, lhsVT),
2522 ISD::SETUO),
2523 DAG.getConstant(ccResultAllOnes, ccResultVT));
2524 } else if (CC->get() == ISD::SETUO) {
2525 // Evaluates to true if Op0 is [SQ]NaN
Dale Johannesen85fc0932009-02-04 01:48:28 +00002526 return DAG.getNode(ISD::AND, dl, ccResultVT,
2527 DAG.getSetCC(dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002528 lhsHi32abs,
2529 DAG.getConstant(0x7ff00000, MVT::i32),
2530 ISD::SETGE),
Dale Johannesen85fc0932009-02-04 01:48:28 +00002531 DAG.getSetCC(dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002532 lhsLo32,
2533 DAG.getConstant(0, MVT::i32),
2534 ISD::SETGT));
2535 }
2536
Dale Johannesen24dd9a52009-02-07 00:55:49 +00002537 SDValue i64rhs = DAG.getNode(ISD::BIT_CONVERT, dl, IntVT, rhs);
pingbak2f387e82009-01-26 03:31:40 +00002538 SDValue rhsHi32 =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002539 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32,
2540 DAG.getNode(ISD::SRL, dl, IntVT,
pingbak2f387e82009-01-26 03:31:40 +00002541 i64rhs, DAG.getConstant(32, MVT::i32)));
2542
2543 // If a value is negative, subtract from the sign magnitude constant:
2544 SDValue signMag2TC = DAG.getConstant(0x8000000000000000ULL, IntVT);
2545
2546 // Convert the sign-magnitude representation into 2's complement:
Dale Johannesen85fc0932009-02-04 01:48:28 +00002547 SDValue lhsSelectMask = DAG.getNode(ISD::SRA, dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002548 lhsHi32, DAG.getConstant(31, MVT::i32));
Dale Johannesen85fc0932009-02-04 01:48:28 +00002549 SDValue lhsSignMag2TC = DAG.getNode(ISD::SUB, dl, IntVT, signMag2TC, i64lhs);
pingbak2f387e82009-01-26 03:31:40 +00002550 SDValue lhsSelect =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002551 DAG.getNode(ISD::SELECT, dl, IntVT,
pingbak2f387e82009-01-26 03:31:40 +00002552 lhsSelectMask, lhsSignMag2TC, i64lhs);
2553
Dale Johannesen85fc0932009-02-04 01:48:28 +00002554 SDValue rhsSelectMask = DAG.getNode(ISD::SRA, dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002555 rhsHi32, DAG.getConstant(31, MVT::i32));
Dale Johannesen85fc0932009-02-04 01:48:28 +00002556 SDValue rhsSignMag2TC = DAG.getNode(ISD::SUB, dl, IntVT, signMag2TC, i64rhs);
pingbak2f387e82009-01-26 03:31:40 +00002557 SDValue rhsSelect =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002558 DAG.getNode(ISD::SELECT, dl, IntVT,
pingbak2f387e82009-01-26 03:31:40 +00002559 rhsSelectMask, rhsSignMag2TC, i64rhs);
2560
2561 unsigned compareOp;
2562
Scott Michel8c67fa42009-01-21 04:58:48 +00002563 switch (CC->get()) {
2564 case ISD::SETOEQ:
Scott Michel8c67fa42009-01-21 04:58:48 +00002565 case ISD::SETUEQ:
pingbak2f387e82009-01-26 03:31:40 +00002566 compareOp = ISD::SETEQ; break;
2567 case ISD::SETOGT:
Scott Michel8c67fa42009-01-21 04:58:48 +00002568 case ISD::SETUGT:
pingbak2f387e82009-01-26 03:31:40 +00002569 compareOp = ISD::SETGT; break;
2570 case ISD::SETOGE:
Scott Michel8c67fa42009-01-21 04:58:48 +00002571 case ISD::SETUGE:
pingbak2f387e82009-01-26 03:31:40 +00002572 compareOp = ISD::SETGE; break;
2573 case ISD::SETOLT:
Scott Michel8c67fa42009-01-21 04:58:48 +00002574 case ISD::SETULT:
pingbak2f387e82009-01-26 03:31:40 +00002575 compareOp = ISD::SETLT; break;
2576 case ISD::SETOLE:
Scott Michel8c67fa42009-01-21 04:58:48 +00002577 case ISD::SETULE:
pingbak2f387e82009-01-26 03:31:40 +00002578 compareOp = ISD::SETLE; break;
Scott Michel8c67fa42009-01-21 04:58:48 +00002579 case ISD::SETUNE:
pingbak2f387e82009-01-26 03:31:40 +00002580 case ISD::SETONE:
2581 compareOp = ISD::SETNE; break;
Scott Michel8c67fa42009-01-21 04:58:48 +00002582 default:
2583 cerr << "CellSPU ISel Select: unimplemented f64 condition\n";
2584 abort();
2585 break;
2586 }
2587
pingbak2f387e82009-01-26 03:31:40 +00002588 SDValue result =
Dale Johannesen85fc0932009-02-04 01:48:28 +00002589 DAG.getSetCC(dl, ccResultVT, lhsSelect, rhsSelect,
2590 (ISD::CondCode) compareOp);
pingbak2f387e82009-01-26 03:31:40 +00002591
2592 if ((CC->get() & 0x8) == 0) {
2593 // Ordered comparison:
Dale Johannesen85fc0932009-02-04 01:48:28 +00002594 SDValue lhsNaN = DAG.getSetCC(dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002595 lhs, DAG.getConstantFP(0.0, MVT::f64),
2596 ISD::SETO);
Dale Johannesen85fc0932009-02-04 01:48:28 +00002597 SDValue rhsNaN = DAG.getSetCC(dl, ccResultVT,
pingbak2f387e82009-01-26 03:31:40 +00002598 rhs, DAG.getConstantFP(0.0, MVT::f64),
2599 ISD::SETO);
Dale Johannesen85fc0932009-02-04 01:48:28 +00002600 SDValue ordered = DAG.getNode(ISD::AND, dl, ccResultVT, lhsNaN, rhsNaN);
pingbak2f387e82009-01-26 03:31:40 +00002601
Dale Johannesen85fc0932009-02-04 01:48:28 +00002602 result = DAG.getNode(ISD::AND, dl, ccResultVT, ordered, result);
pingbak2f387e82009-01-26 03:31:40 +00002603 }
2604
2605 return result;
Scott Michel8c67fa42009-01-21 04:58:48 +00002606}
2607
Scott Michel56a125e2008-11-22 23:50:42 +00002608//! Lower ISD::SELECT_CC
2609/*!
2610 ISD::SELECT_CC can (generally) be implemented directly on the SPU using the
2611 SELB instruction.
2612
2613 \note Need to revisit this in the future: if the code path through the true
2614 and false value computations is longer than the latency of a branch (6
2615 cycles), then it would be more advantageous to branch and insert a new basic
2616 block and branch on the condition. However, this code does not make that
2617 assumption, given the simplisitc uses so far.
2618 */
2619
Scott Michel06eabde2008-12-27 04:51:36 +00002620static SDValue LowerSELECT_CC(SDValue Op, SelectionDAG &DAG,
2621 const TargetLowering &TLI) {
Scott Michel56a125e2008-11-22 23:50:42 +00002622 MVT VT = Op.getValueType();
2623 SDValue lhs = Op.getOperand(0);
2624 SDValue rhs = Op.getOperand(1);
2625 SDValue trueval = Op.getOperand(2);
2626 SDValue falseval = Op.getOperand(3);
2627 SDValue condition = Op.getOperand(4);
Dale Johannesen175fdef2009-02-06 21:50:26 +00002628 DebugLoc dl = Op.getDebugLoc();
Scott Michel56a125e2008-11-22 23:50:42 +00002629
Scott Michel06eabde2008-12-27 04:51:36 +00002630 // NOTE: SELB's arguments: $rA, $rB, $mask
2631 //
2632 // SELB selects bits from $rA where bits in $mask are 0, bits from $rB
2633 // where bits in $mask are 1. CCond will be inverted, having 1s where the
2634 // condition was true and 0s where the condition was false. Hence, the
2635 // arguments to SELB get reversed.
2636
Scott Michel56a125e2008-11-22 23:50:42 +00002637 // Note: Really should be ISD::SELECT instead of SPUISD::SELB, but LLVM's
2638 // legalizer insists on combining SETCC/SELECT into SELECT_CC, so we end up
2639 // with another "cannot select select_cc" assert:
2640
Dale Johannesen175fdef2009-02-06 21:50:26 +00002641 SDValue compare = DAG.getNode(ISD::SETCC, dl,
Duncan Sands4a361272009-01-01 15:52:00 +00002642 TLI.getSetCCResultType(Op.getValueType()),
Scott Michel06eabde2008-12-27 04:51:36 +00002643 lhs, rhs, condition);
Dale Johannesen175fdef2009-02-06 21:50:26 +00002644 return DAG.getNode(SPUISD::SELB, dl, VT, falseval, trueval, compare);
Scott Michel56a125e2008-11-22 23:50:42 +00002645}
2646
Scott Michelec8c82e2008-12-02 19:53:53 +00002647//! Custom lower ISD::TRUNCATE
2648static SDValue LowerTRUNCATE(SDValue Op, SelectionDAG &DAG)
2649{
2650 MVT VT = Op.getValueType();
2651 MVT::SimpleValueType simpleVT = VT.getSimpleVT();
2652 MVT VecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits()));
Dale Johannesen175fdef2009-02-06 21:50:26 +00002653 DebugLoc dl = Op.getDebugLoc();
Scott Michelec8c82e2008-12-02 19:53:53 +00002654
2655 SDValue Op0 = Op.getOperand(0);
2656 MVT Op0VT = Op0.getValueType();
2657 MVT Op0VecVT = MVT::getVectorVT(Op0VT, (128 / Op0VT.getSizeInBits()));
2658
Scott Michel06eabde2008-12-27 04:51:36 +00002659 if (Op0VT.getSimpleVT() == MVT::i128 && simpleVT == MVT::i64) {
Scott Michelc5a29fe2009-01-03 00:27:53 +00002660 // Create shuffle mask, least significant doubleword of quadword
Scott Michel06eabde2008-12-27 04:51:36 +00002661 unsigned maskHigh = 0x08090a0b;
2662 unsigned maskLow = 0x0c0d0e0f;
2663 // Use a shuffle to perform the truncation
Scott Michel78c70a02009-02-22 23:36:09 +00002664 SDValue shufMask = DAG.getBUILD_VECTOR(MVT::v4i32, dl,
2665 DAG.getConstant(maskHigh, MVT::i32),
2666 DAG.getConstant(maskLow, MVT::i32),
2667 DAG.getConstant(maskHigh, MVT::i32),
2668 DAG.getConstant(maskLow, MVT::i32));
Scott Michel06eabde2008-12-27 04:51:36 +00002669
2670
Dale Johannesen175fdef2009-02-06 21:50:26 +00002671 SDValue PromoteScalar = DAG.getNode(SPUISD::PREFSLOT2VEC, dl,
2672 Op0VecVT, Op0);
Scott Michel06eabde2008-12-27 04:51:36 +00002673
Dale Johannesen175fdef2009-02-06 21:50:26 +00002674 SDValue truncShuffle = DAG.getNode(SPUISD::SHUFB, dl, Op0VecVT,
Scott Michel06eabde2008-12-27 04:51:36 +00002675 PromoteScalar, PromoteScalar, shufMask);
2676
Dale Johannesen175fdef2009-02-06 21:50:26 +00002677 return DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT,
Dale Johannesen24dd9a52009-02-07 00:55:49 +00002678 DAG.getNode(ISD::BIT_CONVERT, dl, VecVT, truncShuffle));
Scott Michelec8c82e2008-12-02 19:53:53 +00002679 }
2680
Scott Michel06eabde2008-12-27 04:51:36 +00002681 return SDValue(); // Leave the truncate unmolested
Scott Michelec8c82e2008-12-02 19:53:53 +00002682}
2683
Scott Michel56a125e2008-11-22 23:50:42 +00002684//! Custom (target-specific) lowering entry point
2685/*!
2686 This is where LLVM's DAG selection process calls to do target-specific
2687 lowering of nodes.
2688 */
Dan Gohman8181bd12008-07-27 21:46:04 +00002689SDValue
2690SPUTargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG)
Scott Michel8efdca42007-12-04 22:23:35 +00002691{
Scott Michel97872d32008-02-23 18:41:37 +00002692 unsigned Opc = (unsigned) Op.getOpcode();
Duncan Sands92c43912008-06-06 12:08:01 +00002693 MVT VT = Op.getValueType();
Scott Michel97872d32008-02-23 18:41:37 +00002694
2695 switch (Opc) {
Scott Michel8efdca42007-12-04 22:23:35 +00002696 default: {
2697 cerr << "SPUTargetLowering::LowerOperation(): need to lower this!\n";
Scott Michel97872d32008-02-23 18:41:37 +00002698 cerr << "Op.getOpcode() = " << Opc << "\n";
Gabor Greif1c80d112008-08-28 21:40:38 +00002699 cerr << "*Op.getNode():\n";
2700 Op.getNode()->dump();
Scott Michel8efdca42007-12-04 22:23:35 +00002701 abort();
2702 }
2703 case ISD::LOAD:
Scott Michelec8c82e2008-12-02 19:53:53 +00002704 case ISD::EXTLOAD:
Scott Michel8efdca42007-12-04 22:23:35 +00002705 case ISD::SEXTLOAD:
2706 case ISD::ZEXTLOAD:
2707 return LowerLOAD(Op, DAG, SPUTM.getSubtargetImpl());
2708 case ISD::STORE:
2709 return LowerSTORE(Op, DAG, SPUTM.getSubtargetImpl());
2710 case ISD::ConstantPool:
2711 return LowerConstantPool(Op, DAG, SPUTM.getSubtargetImpl());
2712 case ISD::GlobalAddress:
2713 return LowerGlobalAddress(Op, DAG, SPUTM.getSubtargetImpl());
2714 case ISD::JumpTable:
2715 return LowerJumpTable(Op, DAG, SPUTM.getSubtargetImpl());
Scott Michel8efdca42007-12-04 22:23:35 +00002716 case ISD::ConstantFP:
2717 return LowerConstantFP(Op, DAG);
2718 case ISD::FORMAL_ARGUMENTS:
Scott Michel394e26d2008-01-17 20:38:41 +00002719 return LowerFORMAL_ARGUMENTS(Op, DAG, VarArgsFrameIndex);
Scott Michel8efdca42007-12-04 22:23:35 +00002720 case ISD::CALL:
Scott Micheldbac4cf2008-01-11 02:53:15 +00002721 return LowerCALL(Op, DAG, SPUTM.getSubtargetImpl());
Scott Michel8efdca42007-12-04 22:23:35 +00002722 case ISD::RET:
2723 return LowerRET(Op, DAG, getTargetMachine());
2724
Scott Michel4d07fb72008-12-30 23:28:25 +00002725 // i8, i64 math ops:
Scott Michel67224b22008-06-02 22:18:03 +00002726 case ISD::ADD:
Scott Michel8efdca42007-12-04 22:23:35 +00002727 case ISD::SUB:
2728 case ISD::ROTR:
2729 case ISD::ROTL:
2730 case ISD::SRL:
2731 case ISD::SHL:
Scott Michel67224b22008-06-02 22:18:03 +00002732 case ISD::SRA: {
Scott Michel97872d32008-02-23 18:41:37 +00002733 if (VT == MVT::i8)
Scott Michel06eabde2008-12-27 04:51:36 +00002734 return LowerI8Math(Op, DAG, Opc, *this);
Scott Michel97872d32008-02-23 18:41:37 +00002735 break;
Scott Michel67224b22008-06-02 22:18:03 +00002736 }
Scott Michel8efdca42007-12-04 22:23:35 +00002737
pingbak2f387e82009-01-26 03:31:40 +00002738 case ISD::FP_TO_SINT:
2739 case ISD::FP_TO_UINT:
2740 return LowerFP_TO_INT(Op, DAG, *this);
2741
2742 case ISD::SINT_TO_FP:
2743 case ISD::UINT_TO_FP:
2744 return LowerINT_TO_FP(Op, DAG, *this);
Scott Michel8c67fa42009-01-21 04:58:48 +00002745
Scott Michel8efdca42007-12-04 22:23:35 +00002746 // Vector-related lowering.
2747 case ISD::BUILD_VECTOR:
pingbak2f387e82009-01-26 03:31:40 +00002748 return LowerBUILD_VECTOR(Op, DAG);
Scott Michel8efdca42007-12-04 22:23:35 +00002749 case ISD::SCALAR_TO_VECTOR:
2750 return LowerSCALAR_TO_VECTOR(Op, DAG);
2751 case ISD::VECTOR_SHUFFLE:
2752 return LowerVECTOR_SHUFFLE(Op, DAG);
2753 case ISD::EXTRACT_VECTOR_ELT:
2754 return LowerEXTRACT_VECTOR_ELT(Op, DAG);
2755 case ISD::INSERT_VECTOR_ELT:
2756 return LowerINSERT_VECTOR_ELT(Op, DAG);
2757
2758 // Look for ANDBI, ORBI and XORBI opportunities and lower appropriately:
2759 case ISD::AND:
2760 case ISD::OR:
2761 case ISD::XOR:
2762 return LowerByteImmed(Op, DAG);
2763
2764 // Vector and i8 multiply:
2765 case ISD::MUL:
Scott Michel4d07fb72008-12-30 23:28:25 +00002766 if (VT == MVT::i8)
Scott Michel06eabde2008-12-27 04:51:36 +00002767 return LowerI8Math(Op, DAG, Opc, *this);
Scott Michel8efdca42007-12-04 22:23:35 +00002768
Scott Michel8efdca42007-12-04 22:23:35 +00002769 case ISD::CTPOP:
2770 return LowerCTPOP(Op, DAG);
Scott Michel56a125e2008-11-22 23:50:42 +00002771
2772 case ISD::SELECT_CC:
Scott Michel06eabde2008-12-27 04:51:36 +00002773 return LowerSELECT_CC(Op, DAG, *this);
Scott Michelec8c82e2008-12-02 19:53:53 +00002774
Scott Michel8c67fa42009-01-21 04:58:48 +00002775 case ISD::SETCC:
2776 return LowerSETCC(Op, DAG, *this);
2777
Scott Michelec8c82e2008-12-02 19:53:53 +00002778 case ISD::TRUNCATE:
2779 return LowerTRUNCATE(Op, DAG);
Scott Michel8efdca42007-12-04 22:23:35 +00002780 }
2781
Dan Gohman8181bd12008-07-27 21:46:04 +00002782 return SDValue();
Scott Michel8efdca42007-12-04 22:23:35 +00002783}
2784
Duncan Sands7d9834b2008-12-01 11:39:25 +00002785void SPUTargetLowering::ReplaceNodeResults(SDNode *N,
2786 SmallVectorImpl<SDValue>&Results,
2787 SelectionDAG &DAG)
Scott Michel6e2d68b2008-11-10 23:43:06 +00002788{
2789#if 0
2790 unsigned Opc = (unsigned) N->getOpcode();
2791 MVT OpVT = N->getValueType(0);
2792
2793 switch (Opc) {
2794 default: {
2795 cerr << "SPUTargetLowering::ReplaceNodeResults(): need to fix this!\n";
2796 cerr << "Op.getOpcode() = " << Opc << "\n";
2797 cerr << "*Op.getNode():\n";
2798 N->dump();
2799 abort();
2800 /*NOTREACHED*/
2801 }
2802 }
2803#endif
2804
2805 /* Otherwise, return unchanged */
Scott Michel6e2d68b2008-11-10 23:43:06 +00002806}
2807
Scott Michel8efdca42007-12-04 22:23:35 +00002808//===----------------------------------------------------------------------===//
Scott Michel8efdca42007-12-04 22:23:35 +00002809// Target Optimization Hooks
2810//===----------------------------------------------------------------------===//
2811
Dan Gohman8181bd12008-07-27 21:46:04 +00002812SDValue
Scott Michel8efdca42007-12-04 22:23:35 +00002813SPUTargetLowering::PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const
2814{
2815#if 0
2816 TargetMachine &TM = getTargetMachine();
Scott Michelf9f42e62008-01-29 02:16:57 +00002817#endif
2818 const SPUSubtarget *ST = SPUTM.getSubtargetImpl();
Scott Michel8efdca42007-12-04 22:23:35 +00002819 SelectionDAG &DAG = DCI.DAG;
Scott Michel0718cd82008-12-01 17:56:02 +00002820 SDValue Op0 = N->getOperand(0); // everything has at least one operand
2821 MVT NodeVT = N->getValueType(0); // The node's value type
Scott Michel06eabde2008-12-27 04:51:36 +00002822 MVT Op0VT = Op0.getValueType(); // The first operand's result
Scott Michel0718cd82008-12-01 17:56:02 +00002823 SDValue Result; // Initially, empty result
Dale Johannesen175fdef2009-02-06 21:50:26 +00002824 DebugLoc dl = N->getDebugLoc();
Scott Michel8efdca42007-12-04 22:23:35 +00002825
2826 switch (N->getOpcode()) {
2827 default: break;
Scott Michelf9f42e62008-01-29 02:16:57 +00002828 case ISD::ADD: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002829 SDValue Op1 = N->getOperand(1);
Scott Michelf9f42e62008-01-29 02:16:57 +00002830
Scott Michel06eabde2008-12-27 04:51:36 +00002831 if (Op0.getOpcode() == SPUISD::IndirectAddr
2832 || Op1.getOpcode() == SPUISD::IndirectAddr) {
2833 // Normalize the operands to reduce repeated code
2834 SDValue IndirectArg = Op0, AddArg = Op1;
Scott Michelae5cbf52008-12-29 03:23:36 +00002835
Scott Michel06eabde2008-12-27 04:51:36 +00002836 if (Op1.getOpcode() == SPUISD::IndirectAddr) {
2837 IndirectArg = Op1;
2838 AddArg = Op0;
2839 }
2840
2841 if (isa<ConstantSDNode>(AddArg)) {
2842 ConstantSDNode *CN0 = cast<ConstantSDNode > (AddArg);
2843 SDValue IndOp1 = IndirectArg.getOperand(1);
2844
2845 if (CN0->isNullValue()) {
2846 // (add (SPUindirect <arg>, <arg>), 0) ->
2847 // (SPUindirect <arg>, <arg>)
Scott Michelf9f42e62008-01-29 02:16:57 +00002848
Scott Michel8c2746e2008-12-04 17:16:59 +00002849#if !defined(NDEBUG)
Scott Michel06eabde2008-12-27 04:51:36 +00002850 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
Scott Michel6ccefab2008-12-04 03:02:42 +00002851 cerr << "\n"
Scott Michel06eabde2008-12-27 04:51:36 +00002852 << "Replace: (add (SPUindirect <arg>, <arg>), 0)\n"
2853 << "With: (SPUindirect <arg>, <arg>)\n";
2854 }
Scott Michel6ccefab2008-12-04 03:02:42 +00002855#endif
2856
Scott Michel06eabde2008-12-27 04:51:36 +00002857 return IndirectArg;
2858 } else if (isa<ConstantSDNode>(IndOp1)) {
2859 // (add (SPUindirect <arg>, <const>), <const>) ->
2860 // (SPUindirect <arg>, <const + const>)
2861 ConstantSDNode *CN1 = cast<ConstantSDNode > (IndOp1);
2862 int64_t combinedConst = CN0->getSExtValue() + CN1->getSExtValue();
2863 SDValue combinedValue = DAG.getConstant(combinedConst, Op0VT);
Scott Michelf9f42e62008-01-29 02:16:57 +00002864
Scott Michel06eabde2008-12-27 04:51:36 +00002865#if !defined(NDEBUG)
2866 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
2867 cerr << "\n"
2868 << "Replace: (add (SPUindirect <arg>, " << CN1->getSExtValue()
2869 << "), " << CN0->getSExtValue() << ")\n"
2870 << "With: (SPUindirect <arg>, "
2871 << combinedConst << ")\n";
2872 }
2873#endif
Scott Michelf9f42e62008-01-29 02:16:57 +00002874
Dale Johannesen175fdef2009-02-06 21:50:26 +00002875 return DAG.getNode(SPUISD::IndirectAddr, dl, Op0VT,
Scott Michel06eabde2008-12-27 04:51:36 +00002876 IndirectArg, combinedValue);
2877 }
Scott Michelf9f42e62008-01-29 02:16:57 +00002878 }
2879 }
Scott Michel97872d32008-02-23 18:41:37 +00002880 break;
2881 }
2882 case ISD::SIGN_EXTEND:
2883 case ISD::ZERO_EXTEND:
2884 case ISD::ANY_EXTEND: {
Scott Michel0718cd82008-12-01 17:56:02 +00002885 if (Op0.getOpcode() == SPUISD::VEC2PREFSLOT && NodeVT == Op0VT) {
Scott Michel97872d32008-02-23 18:41:37 +00002886 // (any_extend (SPUextract_elt0 <arg>)) ->
2887 // (SPUextract_elt0 <arg>)
2888 // Types must match, however...
Scott Michel8c2746e2008-12-04 17:16:59 +00002889#if !defined(NDEBUG)
2890 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
Scott Michel6ccefab2008-12-04 03:02:42 +00002891 cerr << "\nReplace: ";
2892 N->dump(&DAG);
2893 cerr << "\nWith: ";
2894 Op0.getNode()->dump(&DAG);
2895 cerr << "\n";
Scott Michel8c2746e2008-12-04 17:16:59 +00002896 }
Scott Michel6ccefab2008-12-04 03:02:42 +00002897#endif
Scott Michel97872d32008-02-23 18:41:37 +00002898
2899 return Op0;
2900 }
2901 break;
2902 }
2903 case SPUISD::IndirectAddr: {
2904 if (!ST->usingLargeMem() && Op0.getOpcode() == SPUISD::AFormAddr) {
Scott Michel8c67fa42009-01-21 04:58:48 +00002905 ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N->getOperand(1));
2906 if (CN != 0 && CN->getZExtValue() == 0) {
Scott Michel97872d32008-02-23 18:41:37 +00002907 // (SPUindirect (SPUaform <addr>, 0), 0) ->
2908 // (SPUaform <addr>, 0)
2909
2910 DEBUG(cerr << "Replace: ");
2911 DEBUG(N->dump(&DAG));
2912 DEBUG(cerr << "\nWith: ");
Gabor Greif1c80d112008-08-28 21:40:38 +00002913 DEBUG(Op0.getNode()->dump(&DAG));
Scott Michel97872d32008-02-23 18:41:37 +00002914 DEBUG(cerr << "\n");
2915
2916 return Op0;
2917 }
Scott Michel06eabde2008-12-27 04:51:36 +00002918 } else if (Op0.getOpcode() == ISD::ADD) {
2919 SDValue Op1 = N->getOperand(1);
2920 if (ConstantSDNode *CN1 = dyn_cast<ConstantSDNode>(Op1)) {
2921 // (SPUindirect (add <arg>, <arg>), 0) ->
2922 // (SPUindirect <arg>, <arg>)
2923 if (CN1->isNullValue()) {
2924
2925#if !defined(NDEBUG)
2926 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
2927 cerr << "\n"
2928 << "Replace: (SPUindirect (add <arg>, <arg>), 0)\n"
2929 << "With: (SPUindirect <arg>, <arg>)\n";
2930 }
2931#endif
2932
Dale Johannesen175fdef2009-02-06 21:50:26 +00002933 return DAG.getNode(SPUISD::IndirectAddr, dl, Op0VT,
Scott Michel06eabde2008-12-27 04:51:36 +00002934 Op0.getOperand(0), Op0.getOperand(1));
2935 }
2936 }
Scott Michel97872d32008-02-23 18:41:37 +00002937 }
2938 break;
2939 }
2940 case SPUISD::SHLQUAD_L_BITS:
2941 case SPUISD::SHLQUAD_L_BYTES:
2942 case SPUISD::VEC_SHL:
2943 case SPUISD::VEC_SRL:
2944 case SPUISD::VEC_SRA:
Scott Michel06eabde2008-12-27 04:51:36 +00002945 case SPUISD::ROTBYTES_LEFT: {
Dan Gohman8181bd12008-07-27 21:46:04 +00002946 SDValue Op1 = N->getOperand(1);
Scott Michel97872d32008-02-23 18:41:37 +00002947
Scott Michel06eabde2008-12-27 04:51:36 +00002948 // Kill degenerate vector shifts:
2949 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(Op1)) {
2950 if (CN->isNullValue()) {
Scott Michel97872d32008-02-23 18:41:37 +00002951 Result = Op0;
2952 }
2953 }
2954 break;
2955 }
Scott Michel06eabde2008-12-27 04:51:36 +00002956 case SPUISD::PREFSLOT2VEC: {
Scott Michel97872d32008-02-23 18:41:37 +00002957 switch (Op0.getOpcode()) {
2958 default:
2959 break;
2960 case ISD::ANY_EXTEND:
2961 case ISD::ZERO_EXTEND:
2962 case ISD::SIGN_EXTEND: {
Scott Michelae5cbf52008-12-29 03:23:36 +00002963 // (SPUprefslot2vec (any|zero|sign_extend (SPUvec2prefslot <arg>))) ->
Scott Michel97872d32008-02-23 18:41:37 +00002964 // <arg>
Scott Michelae5cbf52008-12-29 03:23:36 +00002965 // but only if the SPUprefslot2vec and <arg> types match.
Dan Gohman8181bd12008-07-27 21:46:04 +00002966 SDValue Op00 = Op0.getOperand(0);
Scott Michelc630c412008-11-24 17:11:17 +00002967 if (Op00.getOpcode() == SPUISD::VEC2PREFSLOT) {
Dan Gohman8181bd12008-07-27 21:46:04 +00002968 SDValue Op000 = Op00.getOperand(0);
Scott Michel0718cd82008-12-01 17:56:02 +00002969 if (Op000.getValueType() == NodeVT) {
Scott Michel97872d32008-02-23 18:41:37 +00002970 Result = Op000;
2971 }
2972 }
2973 break;
2974 }
Scott Michelc630c412008-11-24 17:11:17 +00002975 case SPUISD::VEC2PREFSLOT: {
Scott Michelae5cbf52008-12-29 03:23:36 +00002976 // (SPUprefslot2vec (SPUvec2prefslot <arg>)) ->
Scott Michel97872d32008-02-23 18:41:37 +00002977 // <arg>
2978 Result = Op0.getOperand(0);
2979 break;
Scott Michel4ec722e2008-07-16 17:17:29 +00002980 }
Scott Michel97872d32008-02-23 18:41:37 +00002981 }
2982 break;
Scott Michelf9f42e62008-01-29 02:16:57 +00002983 }
2984 }
Scott Michel8c67fa42009-01-21 04:58:48 +00002985
Scott Michel394e26d2008-01-17 20:38:41 +00002986 // Otherwise, return unchanged.
Scott Michel0718cd82008-12-01 17:56:02 +00002987#ifndef NDEBUG
Gabor Greif1c80d112008-08-28 21:40:38 +00002988 if (Result.getNode()) {
Scott Michel97872d32008-02-23 18:41:37 +00002989 DEBUG(cerr << "\nReplace.SPU: ");
2990 DEBUG(N->dump(&DAG));
2991 DEBUG(cerr << "\nWith: ");
Gabor Greif1c80d112008-08-28 21:40:38 +00002992 DEBUG(Result.getNode()->dump(&DAG));
Scott Michel97872d32008-02-23 18:41:37 +00002993 DEBUG(cerr << "\n");
2994 }
2995#endif
2996
2997 return Result;
Scott Michel8efdca42007-12-04 22:23:35 +00002998}
2999
3000//===----------------------------------------------------------------------===//
3001// Inline Assembly Support
3002//===----------------------------------------------------------------------===//
3003
3004/// getConstraintType - Given a constraint letter, return the type of
3005/// constraint it is for this target.
Scott Michel4ec722e2008-07-16 17:17:29 +00003006SPUTargetLowering::ConstraintType
Scott Michel8efdca42007-12-04 22:23:35 +00003007SPUTargetLowering::getConstraintType(const std::string &ConstraintLetter) const {
3008 if (ConstraintLetter.size() == 1) {
3009 switch (ConstraintLetter[0]) {
3010 default: break;
3011 case 'b':
3012 case 'r':
3013 case 'f':
3014 case 'v':
3015 case 'y':
3016 return C_RegisterClass;
Scott Michel4ec722e2008-07-16 17:17:29 +00003017 }
Scott Michel8efdca42007-12-04 22:23:35 +00003018 }
3019 return TargetLowering::getConstraintType(ConstraintLetter);
3020}
3021
Scott Michel4ec722e2008-07-16 17:17:29 +00003022std::pair<unsigned, const TargetRegisterClass*>
Scott Michel8efdca42007-12-04 22:23:35 +00003023SPUTargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
Duncan Sands92c43912008-06-06 12:08:01 +00003024 MVT VT) const
Scott Michel8efdca42007-12-04 22:23:35 +00003025{
3026 if (Constraint.size() == 1) {
3027 // GCC RS6000 Constraint Letters
3028 switch (Constraint[0]) {
3029 case 'b': // R1-R31
3030 case 'r': // R0-R31
3031 if (VT == MVT::i64)
3032 return std::make_pair(0U, SPU::R64CRegisterClass);
3033 return std::make_pair(0U, SPU::R32CRegisterClass);
3034 case 'f':
3035 if (VT == MVT::f32)
3036 return std::make_pair(0U, SPU::R32FPRegisterClass);
3037 else if (VT == MVT::f64)
3038 return std::make_pair(0U, SPU::R64FPRegisterClass);
3039 break;
Scott Michel4ec722e2008-07-16 17:17:29 +00003040 case 'v':
Scott Michel8efdca42007-12-04 22:23:35 +00003041 return std::make_pair(0U, SPU::GPRCRegisterClass);
3042 }
3043 }
Scott Michel4ec722e2008-07-16 17:17:29 +00003044
Scott Michel8efdca42007-12-04 22:23:35 +00003045 return TargetLowering::getRegForInlineAsmConstraint(Constraint, VT);
3046}
3047
Scott Michel97872d32008-02-23 18:41:37 +00003048//! Compute used/known bits for a SPU operand
Scott Michel8efdca42007-12-04 22:23:35 +00003049void
Dan Gohman8181bd12008-07-27 21:46:04 +00003050SPUTargetLowering::computeMaskedBitsForTargetNode(const SDValue Op,
Dan Gohmand0dfc772008-02-13 22:28:48 +00003051 const APInt &Mask,
Scott Michel4ec722e2008-07-16 17:17:29 +00003052 APInt &KnownZero,
Dan Gohman229fa052008-02-13 00:35:47 +00003053 APInt &KnownOne,
Scott Michel5a6f17b2008-01-30 02:55:46 +00003054 const SelectionDAG &DAG,
3055 unsigned Depth ) const {
Scott Michelbc5fbc12008-04-30 00:30:08 +00003056#if 0
Scott Michel97872d32008-02-23 18:41:37 +00003057 const uint64_t uint64_sizebits = sizeof(uint64_t) * 8;
3058
3059 switch (Op.getOpcode()) {
3060 default:
3061 // KnownZero = KnownOne = APInt(Mask.getBitWidth(), 0);
3062 break;
Scott Michel97872d32008-02-23 18:41:37 +00003063 case CALL:
3064 case SHUFB:
Scott Michel56a125e2008-11-22 23:50:42 +00003065 case SHUFFLE_MASK:
Scott Michel97872d32008-02-23 18:41:37 +00003066 case CNTB:
Scott Michel8c67fa42009-01-21 04:58:48 +00003067 case SPUISD::PREFSLOT2VEC:
Scott Michel97872d32008-02-23 18:41:37 +00003068 case SPUISD::LDRESULT:
Scott Michel8c67fa42009-01-21 04:58:48 +00003069 case SPUISD::VEC2PREFSLOT:
Scott Michelbc5fbc12008-04-30 00:30:08 +00003070 case SPUISD::SHLQUAD_L_BITS:
3071 case SPUISD::SHLQUAD_L_BYTES:
3072 case SPUISD::VEC_SHL:
3073 case SPUISD::VEC_SRL:
3074 case SPUISD::VEC_SRA:
3075 case SPUISD::VEC_ROTL:
3076 case SPUISD::VEC_ROTR:
Scott Michelbc5fbc12008-04-30 00:30:08 +00003077 case SPUISD::ROTBYTES_LEFT:
Scott Michel67224b22008-06-02 22:18:03 +00003078 case SPUISD::SELECT_MASK:
3079 case SPUISD::SELB:
Scott Michel97872d32008-02-23 18:41:37 +00003080 }
Scott Michel8c67fa42009-01-21 04:58:48 +00003081#endif
Scott Michel8efdca42007-12-04 22:23:35 +00003082}
Scott Michel4d07fb72008-12-30 23:28:25 +00003083
Scott Michel06eabde2008-12-27 04:51:36 +00003084unsigned
3085SPUTargetLowering::ComputeNumSignBitsForTargetNode(SDValue Op,
3086 unsigned Depth) const {
3087 switch (Op.getOpcode()) {
3088 default:
3089 return 1;
Scott Michel8efdca42007-12-04 22:23:35 +00003090
Scott Michel06eabde2008-12-27 04:51:36 +00003091 case ISD::SETCC: {
3092 MVT VT = Op.getValueType();
3093
3094 if (VT != MVT::i8 && VT != MVT::i16 && VT != MVT::i32) {
3095 VT = MVT::i32;
3096 }
3097 return VT.getSizeInBits();
3098 }
3099 }
3100}
Scott Michelae5cbf52008-12-29 03:23:36 +00003101
Scott Michelbc5fbc12008-04-30 00:30:08 +00003102// LowerAsmOperandForConstraint
3103void
Dan Gohman8181bd12008-07-27 21:46:04 +00003104SPUTargetLowering::LowerAsmOperandForConstraint(SDValue Op,
Scott Michelbc5fbc12008-04-30 00:30:08 +00003105 char ConstraintLetter,
Evan Cheng7f250d62008-09-24 00:05:32 +00003106 bool hasMemory,
Dan Gohman8181bd12008-07-27 21:46:04 +00003107 std::vector<SDValue> &Ops,
Scott Michelbc5fbc12008-04-30 00:30:08 +00003108 SelectionDAG &DAG) const {
3109 // Default, for the time being, to the base class handler
Evan Cheng7f250d62008-09-24 00:05:32 +00003110 TargetLowering::LowerAsmOperandForConstraint(Op, ConstraintLetter, hasMemory,
3111 Ops, DAG);
Scott Michelbc5fbc12008-04-30 00:30:08 +00003112}
3113
Scott Michel8efdca42007-12-04 22:23:35 +00003114/// isLegalAddressImmediate - Return true if the integer value can be used
3115/// as the offset of the target addressing mode.
Gabor Greife9f7f582008-08-31 15:37:04 +00003116bool SPUTargetLowering::isLegalAddressImmediate(int64_t V,
3117 const Type *Ty) const {
Scott Michel8efdca42007-12-04 22:23:35 +00003118 // SPU's addresses are 256K:
3119 return (V > -(1 << 18) && V < (1 << 18) - 1);
3120}
3121
3122bool SPUTargetLowering::isLegalAddressImmediate(llvm::GlobalValue* GV) const {
Scott Michel4ec722e2008-07-16 17:17:29 +00003123 return false;
Scott Michel8efdca42007-12-04 22:23:35 +00003124}
Dan Gohman36322c72008-10-18 02:06:02 +00003125
3126bool
3127SPUTargetLowering::isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const {
3128 // The SPU target isn't yet aware of offsets.
3129 return false;
3130}