blob: 3a8fb5dcab6d67473d9da20235d12b4d1b0160bd [file] [log] [blame]
Scott Michel266bc8f2007-12-04 22:23:35 +00001//===-- SPUISelLowering.cpp - Cell SPU DAG Lowering Implementation --------===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner4ee451d2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Scott Michel266bc8f2007-12-04 22:23:35 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This file implements the SPUTargetLowering class.
11//
12//===----------------------------------------------------------------------===//
13
14#include "SPURegisterNames.h"
15#include "SPUISelLowering.h"
16#include "SPUTargetMachine.h"
Scott Michel203b2d62008-04-30 00:30:08 +000017#include "SPUFrameInfo.h"
Scott Michelf0569be2008-12-27 04:51:36 +000018#include "llvm/ADT/APInt.h"
Scott Michel266bc8f2007-12-04 22:23:35 +000019#include "llvm/ADT/VectorExtras.h"
Scott Michelc9c8b2a2009-01-26 03:31:40 +000020#include "llvm/CallingConv.h"
Scott Michel266bc8f2007-12-04 22:23:35 +000021#include "llvm/CodeGen/CallingConvLower.h"
22#include "llvm/CodeGen/MachineFrameInfo.h"
23#include "llvm/CodeGen/MachineFunction.h"
24#include "llvm/CodeGen/MachineInstrBuilder.h"
Chris Lattner84bc5422007-12-31 04:13:23 +000025#include "llvm/CodeGen/MachineRegisterInfo.h"
Scott Michel266bc8f2007-12-04 22:23:35 +000026#include "llvm/CodeGen/SelectionDAG.h"
Scott Michel266bc8f2007-12-04 22:23:35 +000027#include "llvm/Constants.h"
28#include "llvm/Function.h"
29#include "llvm/Intrinsics.h"
30#include "llvm/Support/Debug.h"
31#include "llvm/Support/MathExtras.h"
32#include "llvm/Target/TargetOptions.h"
33
34#include <map>
35
36using namespace llvm;
37
38// Used in getTargetNodeName() below
39namespace {
40 std::map<unsigned, const char *> node_names;
41
Duncan Sands83ec4b62008-06-06 12:08:01 +000042 //! MVT mapping to useful data for Cell SPU
Scott Michel266bc8f2007-12-04 22:23:35 +000043 struct valtype_map_s {
Scott Michel7a1c9e92008-11-22 23:50:42 +000044 const MVT valtype;
45 const int prefslot_byte;
Scott Michel266bc8f2007-12-04 22:23:35 +000046 };
Scott Michel5af8f0e2008-07-16 17:17:29 +000047
Scott Michel266bc8f2007-12-04 22:23:35 +000048 const valtype_map_s valtype_map[] = {
49 { MVT::i1, 3 },
50 { MVT::i8, 3 },
51 { MVT::i16, 2 },
52 { MVT::i32, 0 },
53 { MVT::f32, 0 },
54 { MVT::i64, 0 },
55 { MVT::f64, 0 },
56 { MVT::i128, 0 }
57 };
58
59 const size_t n_valtype_map = sizeof(valtype_map) / sizeof(valtype_map[0]);
60
Duncan Sands83ec4b62008-06-06 12:08:01 +000061 const valtype_map_s *getValueTypeMapEntry(MVT VT) {
Scott Michel266bc8f2007-12-04 22:23:35 +000062 const valtype_map_s *retval = 0;
63
64 for (size_t i = 0; i < n_valtype_map; ++i) {
65 if (valtype_map[i].valtype == VT) {
Scott Michel7f9ba9b2008-01-30 02:55:46 +000066 retval = valtype_map + i;
67 break;
Scott Michel266bc8f2007-12-04 22:23:35 +000068 }
69 }
70
71#ifndef NDEBUG
72 if (retval == 0) {
73 cerr << "getValueTypeMapEntry returns NULL for "
Duncan Sands83ec4b62008-06-06 12:08:01 +000074 << VT.getMVTString()
Scott Michel7f9ba9b2008-01-30 02:55:46 +000075 << "\n";
Scott Michel266bc8f2007-12-04 22:23:35 +000076 abort();
77 }
78#endif
79
80 return retval;
81 }
Scott Michel94bd57e2009-01-15 04:41:47 +000082
Scott Michelc9c8b2a2009-01-26 03:31:40 +000083 //! Expand a library call into an actual call DAG node
84 /*!
85 \note
86 This code is taken from SelectionDAGLegalize, since it is not exposed as
87 part of the LLVM SelectionDAG API.
88 */
89
90 SDValue
91 ExpandLibCall(RTLIB::Libcall LC, SDValue Op, SelectionDAG &DAG,
92 bool isSigned, SDValue &Hi, SPUTargetLowering &TLI) {
93 // The input chain to this libcall is the entry node of the function.
94 // Legalizing the call will automatically add the previous call to the
95 // dependence.
96 SDValue InChain = DAG.getEntryNode();
97
98 TargetLowering::ArgListTy Args;
99 TargetLowering::ArgListEntry Entry;
100 for (unsigned i = 0, e = Op.getNumOperands(); i != e; ++i) {
101 MVT ArgVT = Op.getOperand(i).getValueType();
102 const Type *ArgTy = ArgVT.getTypeForMVT();
103 Entry.Node = Op.getOperand(i);
104 Entry.Ty = ArgTy;
105 Entry.isSExt = isSigned;
106 Entry.isZExt = !isSigned;
107 Args.push_back(Entry);
108 }
109 SDValue Callee = DAG.getExternalSymbol(TLI.getLibcallName(LC),
110 TLI.getPointerTy());
111
112 // Splice the libcall in wherever FindInputOutputChains tells us to.
113 const Type *RetTy = Op.getNode()->getValueType(0).getTypeForMVT();
114 std::pair<SDValue, SDValue> CallInfo =
115 TLI.LowerCallTo(InChain, RetTy, isSigned, !isSigned, false, false,
Dale Johannesen7d2ad622009-01-30 23:10:59 +0000116 CallingConv::C, false, Callee, Args, DAG,
Dale Johannesen6f38cb62009-02-07 19:59:05 +0000117 Op.getDebugLoc());
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000118
119 return CallInfo.first;
120 }
Scott Michel266bc8f2007-12-04 22:23:35 +0000121}
122
123SPUTargetLowering::SPUTargetLowering(SPUTargetMachine &TM)
124 : TargetLowering(TM),
125 SPUTM(TM)
126{
127 // Fold away setcc operations if possible.
128 setPow2DivIsCheap();
129
130 // Use _setjmp/_longjmp instead of setjmp/longjmp.
131 setUseUnderscoreSetJmp(true);
132 setUseUnderscoreLongJmp(true);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000133
Scott Micheld1e8d9c2009-01-21 04:58:48 +0000134 // Set RTLIB libcall names as used by SPU:
135 setLibcallName(RTLIB::DIV_F64, "__fast_divdf3");
136
Scott Michel266bc8f2007-12-04 22:23:35 +0000137 // Set up the SPU's register classes:
Scott Michel504c3692007-12-17 22:32:34 +0000138 addRegisterClass(MVT::i8, SPU::R8CRegisterClass);
139 addRegisterClass(MVT::i16, SPU::R16CRegisterClass);
140 addRegisterClass(MVT::i32, SPU::R32CRegisterClass);
141 addRegisterClass(MVT::i64, SPU::R64CRegisterClass);
142 addRegisterClass(MVT::f32, SPU::R32FPRegisterClass);
143 addRegisterClass(MVT::f64, SPU::R64FPRegisterClass);
Scott Michel266bc8f2007-12-04 22:23:35 +0000144 addRegisterClass(MVT::i128, SPU::GPRCRegisterClass);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000145
Scott Michel266bc8f2007-12-04 22:23:35 +0000146 // SPU has no sign or zero extended loads for i1, i8, i16:
Evan Cheng03294662008-10-14 21:26:46 +0000147 setLoadExtAction(ISD::EXTLOAD, MVT::i1, Promote);
148 setLoadExtAction(ISD::SEXTLOAD, MVT::i1, Promote);
149 setLoadExtAction(ISD::ZEXTLOAD, MVT::i1, Promote);
Scott Michel266bc8f2007-12-04 22:23:35 +0000150
Scott Michelf0569be2008-12-27 04:51:36 +0000151 setLoadExtAction(ISD::EXTLOAD, MVT::f32, Expand);
152 setLoadExtAction(ISD::EXTLOAD, MVT::f64, Expand);
Scott Michelb30e8f62008-12-02 19:53:53 +0000153
Scott Michel266bc8f2007-12-04 22:23:35 +0000154 // SPU constant load actions are custom lowered:
Nate Begemanccef5802008-02-14 18:43:04 +0000155 setOperationAction(ISD::ConstantFP, MVT::f32, Legal);
Scott Michel266bc8f2007-12-04 22:23:35 +0000156 setOperationAction(ISD::ConstantFP, MVT::f64, Custom);
157
158 // SPU's loads and stores have to be custom lowered:
Scott Micheldd950092009-01-06 03:36:14 +0000159 for (unsigned sctype = (unsigned) MVT::i8; sctype < (unsigned) MVT::i128;
Scott Michel266bc8f2007-12-04 22:23:35 +0000160 ++sctype) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000161 MVT VT = (MVT::SimpleValueType)sctype;
162
Scott Michelf0569be2008-12-27 04:51:36 +0000163 setOperationAction(ISD::LOAD, VT, Custom);
164 setOperationAction(ISD::STORE, VT, Custom);
165 setLoadExtAction(ISD::EXTLOAD, VT, Custom);
166 setLoadExtAction(ISD::ZEXTLOAD, VT, Custom);
167 setLoadExtAction(ISD::SEXTLOAD, VT, Custom);
168
169 for (unsigned stype = sctype - 1; stype >= (unsigned) MVT::i8; --stype) {
170 MVT StoreVT = (MVT::SimpleValueType) stype;
171 setTruncStoreAction(VT, StoreVT, Expand);
172 }
Scott Michel266bc8f2007-12-04 22:23:35 +0000173 }
174
Scott Michelf0569be2008-12-27 04:51:36 +0000175 for (unsigned sctype = (unsigned) MVT::f32; sctype < (unsigned) MVT::f64;
176 ++sctype) {
177 MVT VT = (MVT::SimpleValueType) sctype;
178
179 setOperationAction(ISD::LOAD, VT, Custom);
180 setOperationAction(ISD::STORE, VT, Custom);
181
182 for (unsigned stype = sctype - 1; stype >= (unsigned) MVT::f32; --stype) {
183 MVT StoreVT = (MVT::SimpleValueType) stype;
184 setTruncStoreAction(VT, StoreVT, Expand);
185 }
186 }
187
Scott Michel266bc8f2007-12-04 22:23:35 +0000188 // Expand the jumptable branches
189 setOperationAction(ISD::BR_JT, MVT::Other, Expand);
190 setOperationAction(ISD::BR_CC, MVT::Other, Expand);
Scott Michel7a1c9e92008-11-22 23:50:42 +0000191
192 // Custom lower SELECT_CC for most cases, but expand by default
Scott Michel5af8f0e2008-07-16 17:17:29 +0000193 setOperationAction(ISD::SELECT_CC, MVT::Other, Expand);
Scott Michel7a1c9e92008-11-22 23:50:42 +0000194 setOperationAction(ISD::SELECT_CC, MVT::i8, Custom);
195 setOperationAction(ISD::SELECT_CC, MVT::i16, Custom);
196 setOperationAction(ISD::SELECT_CC, MVT::i32, Custom);
197 setOperationAction(ISD::SELECT_CC, MVT::i64, Custom);
Scott Michel266bc8f2007-12-04 22:23:35 +0000198
199 // SPU has no intrinsics for these particular operations:
Andrew Lenharthd497d9f2008-02-16 14:46:26 +0000200 setOperationAction(ISD::MEMBARRIER, MVT::Other, Expand);
201
Scott Michelf0569be2008-12-27 04:51:36 +0000202 // SPU has no SREM/UREM instructions
Scott Michel266bc8f2007-12-04 22:23:35 +0000203 setOperationAction(ISD::SREM, MVT::i32, Expand);
204 setOperationAction(ISD::UREM, MVT::i32, Expand);
205 setOperationAction(ISD::SREM, MVT::i64, Expand);
206 setOperationAction(ISD::UREM, MVT::i64, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000207
Scott Michel266bc8f2007-12-04 22:23:35 +0000208 // We don't support sin/cos/sqrt/fmod
209 setOperationAction(ISD::FSIN , MVT::f64, Expand);
210 setOperationAction(ISD::FCOS , MVT::f64, Expand);
211 setOperationAction(ISD::FREM , MVT::f64, Expand);
212 setOperationAction(ISD::FSIN , MVT::f32, Expand);
213 setOperationAction(ISD::FCOS , MVT::f32, Expand);
214 setOperationAction(ISD::FREM , MVT::f32, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000215
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000216 // Expand fsqrt to the appropriate libcall (NOTE: should use h/w fsqrt
217 // for f32!)
Scott Michel266bc8f2007-12-04 22:23:35 +0000218 setOperationAction(ISD::FSQRT, MVT::f64, Expand);
219 setOperationAction(ISD::FSQRT, MVT::f32, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000220
Scott Michel266bc8f2007-12-04 22:23:35 +0000221 setOperationAction(ISD::FCOPYSIGN, MVT::f64, Expand);
222 setOperationAction(ISD::FCOPYSIGN, MVT::f32, Expand);
223
224 // SPU can do rotate right and left, so legalize it... but customize for i8
225 // because instructions don't exist.
Bill Wendling9440e352008-08-31 02:59:23 +0000226
227 // FIXME: Change from "expand" to appropriate type once ROTR is supported in
228 // .td files.
229 setOperationAction(ISD::ROTR, MVT::i32, Expand /*Legal*/);
230 setOperationAction(ISD::ROTR, MVT::i16, Expand /*Legal*/);
231 setOperationAction(ISD::ROTR, MVT::i8, Expand /*Custom*/);
232
Scott Michel266bc8f2007-12-04 22:23:35 +0000233 setOperationAction(ISD::ROTL, MVT::i32, Legal);
234 setOperationAction(ISD::ROTL, MVT::i16, Legal);
235 setOperationAction(ISD::ROTL, MVT::i8, Custom);
Scott Micheldc91bea2008-11-20 16:36:33 +0000236
Scott Michel266bc8f2007-12-04 22:23:35 +0000237 // SPU has no native version of shift left/right for i8
238 setOperationAction(ISD::SHL, MVT::i8, Custom);
239 setOperationAction(ISD::SRL, MVT::i8, Custom);
240 setOperationAction(ISD::SRA, MVT::i8, Custom);
Scott Michel9c0c6b22008-11-21 02:56:16 +0000241
Scott Michel02d711b2008-12-30 23:28:25 +0000242 // Make these operations legal and handle them during instruction selection:
243 setOperationAction(ISD::SHL, MVT::i64, Legal);
244 setOperationAction(ISD::SRL, MVT::i64, Legal);
245 setOperationAction(ISD::SRA, MVT::i64, Legal);
Scott Michel266bc8f2007-12-04 22:23:35 +0000246
Scott Michel5af8f0e2008-07-16 17:17:29 +0000247 // Custom lower i8, i32 and i64 multiplications
248 setOperationAction(ISD::MUL, MVT::i8, Custom);
Scott Michel1df30c42008-12-29 03:23:36 +0000249 setOperationAction(ISD::MUL, MVT::i32, Legal);
Scott Michel94bd57e2009-01-15 04:41:47 +0000250 setOperationAction(ISD::MUL, MVT::i64, Legal);
Scott Michel9c0c6b22008-11-21 02:56:16 +0000251
Scott Michel8bf61e82008-06-02 22:18:03 +0000252 // Need to custom handle (some) common i8, i64 math ops
Scott Michel02d711b2008-12-30 23:28:25 +0000253 setOperationAction(ISD::ADD, MVT::i8, Custom);
Scott Michel94bd57e2009-01-15 04:41:47 +0000254 setOperationAction(ISD::ADD, MVT::i64, Legal);
Scott Michel266bc8f2007-12-04 22:23:35 +0000255 setOperationAction(ISD::SUB, MVT::i8, Custom);
Scott Michel94bd57e2009-01-15 04:41:47 +0000256 setOperationAction(ISD::SUB, MVT::i64, Legal);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000257
Scott Michel266bc8f2007-12-04 22:23:35 +0000258 // SPU does not have BSWAP. It does have i32 support CTLZ.
259 // CTPOP has to be custom lowered.
260 setOperationAction(ISD::BSWAP, MVT::i32, Expand);
261 setOperationAction(ISD::BSWAP, MVT::i64, Expand);
262
263 setOperationAction(ISD::CTPOP, MVT::i8, Custom);
264 setOperationAction(ISD::CTPOP, MVT::i16, Custom);
265 setOperationAction(ISD::CTPOP, MVT::i32, Custom);
266 setOperationAction(ISD::CTPOP, MVT::i64, Custom);
267
268 setOperationAction(ISD::CTTZ , MVT::i32, Expand);
269 setOperationAction(ISD::CTTZ , MVT::i64, Expand);
270
271 setOperationAction(ISD::CTLZ , MVT::i32, Legal);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000272
Scott Michel8bf61e82008-06-02 22:18:03 +0000273 // SPU has a version of select that implements (a&~c)|(b&c), just like
Scott Michel405fba12008-03-10 23:49:09 +0000274 // select ought to work:
Scott Michel78c47fa2008-03-10 16:58:52 +0000275 setOperationAction(ISD::SELECT, MVT::i8, Legal);
Scott Michelad2715e2008-03-05 23:02:02 +0000276 setOperationAction(ISD::SELECT, MVT::i16, Legal);
277 setOperationAction(ISD::SELECT, MVT::i32, Legal);
Scott Michelf0569be2008-12-27 04:51:36 +0000278 setOperationAction(ISD::SELECT, MVT::i64, Legal);
Scott Michel266bc8f2007-12-04 22:23:35 +0000279
Scott Michel78c47fa2008-03-10 16:58:52 +0000280 setOperationAction(ISD::SETCC, MVT::i8, Legal);
281 setOperationAction(ISD::SETCC, MVT::i16, Legal);
Scott Michel1df30c42008-12-29 03:23:36 +0000282 setOperationAction(ISD::SETCC, MVT::i32, Legal);
283 setOperationAction(ISD::SETCC, MVT::i64, Legal);
Scott Micheld1e8d9c2009-01-21 04:58:48 +0000284 setOperationAction(ISD::SETCC, MVT::f64, Custom);
Scott Michelad2715e2008-03-05 23:02:02 +0000285
Scott Michelf0569be2008-12-27 04:51:36 +0000286 // Custom lower i128 -> i64 truncates
Scott Michelb30e8f62008-12-02 19:53:53 +0000287 setOperationAction(ISD::TRUNCATE, MVT::i64, Custom);
288
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000289 // SPU has a legal FP -> signed INT instruction for f32, but for f64, need
290 // to expand to a libcall, hence the custom lowering:
291 setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom);
292 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Custom);
Scott Michel266bc8f2007-12-04 22:23:35 +0000293
294 // FDIV on SPU requires custom lowering
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000295 setOperationAction(ISD::FDIV, MVT::f64, Expand); // to libcall
Scott Michel266bc8f2007-12-04 22:23:35 +0000296
Scott Michel9de57a92009-01-26 22:33:37 +0000297 // SPU has [U|S]INT_TO_FP for f32->i32, but not for f64->i32, f64->i64:
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000298 setOperationAction(ISD::SINT_TO_FP, MVT::i32, Custom);
Scott Michel266bc8f2007-12-04 22:23:35 +0000299 setOperationAction(ISD::SINT_TO_FP, MVT::i16, Promote);
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000300 setOperationAction(ISD::SINT_TO_FP, MVT::i8, Promote);
301 setOperationAction(ISD::UINT_TO_FP, MVT::i32, Custom);
Scott Michel266bc8f2007-12-04 22:23:35 +0000302 setOperationAction(ISD::UINT_TO_FP, MVT::i16, Promote);
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000303 setOperationAction(ISD::UINT_TO_FP, MVT::i8, Promote);
Scott Michel266bc8f2007-12-04 22:23:35 +0000304 setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
305 setOperationAction(ISD::UINT_TO_FP, MVT::i64, Custom);
306
Scott Michel86c041f2007-12-20 00:44:13 +0000307 setOperationAction(ISD::BIT_CONVERT, MVT::i32, Legal);
308 setOperationAction(ISD::BIT_CONVERT, MVT::f32, Legal);
309 setOperationAction(ISD::BIT_CONVERT, MVT::i64, Legal);
310 setOperationAction(ISD::BIT_CONVERT, MVT::f64, Legal);
Scott Michel266bc8f2007-12-04 22:23:35 +0000311
312 // We cannot sextinreg(i1). Expand to shifts.
313 setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000314
Scott Michel266bc8f2007-12-04 22:23:35 +0000315 // Support label based line numbers.
Dan Gohman7f460202008-06-30 20:59:49 +0000316 setOperationAction(ISD::DBG_STOPPOINT, MVT::Other, Expand);
Scott Michel266bc8f2007-12-04 22:23:35 +0000317 setOperationAction(ISD::DEBUG_LOC, MVT::Other, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000318
319 // We want to legalize GlobalAddress and ConstantPool nodes into the
Scott Michel266bc8f2007-12-04 22:23:35 +0000320 // appropriate instructions to materialize the address.
Scott Michel9c0c6b22008-11-21 02:56:16 +0000321 for (unsigned sctype = (unsigned) MVT::i8; sctype < (unsigned) MVT::f128;
Scott Michel053c1da2008-01-29 02:16:57 +0000322 ++sctype) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000323 MVT VT = (MVT::SimpleValueType)sctype;
324
Scott Michel1df30c42008-12-29 03:23:36 +0000325 setOperationAction(ISD::GlobalAddress, VT, Custom);
326 setOperationAction(ISD::ConstantPool, VT, Custom);
327 setOperationAction(ISD::JumpTable, VT, Custom);
Scott Michel053c1da2008-01-29 02:16:57 +0000328 }
Scott Michel266bc8f2007-12-04 22:23:35 +0000329
330 // RET must be custom lowered, to meet ABI requirements
331 setOperationAction(ISD::RET, MVT::Other, Custom);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000332
Scott Michel266bc8f2007-12-04 22:23:35 +0000333 // VASTART needs to be custom lowered to use the VarArgsFrameIndex
334 setOperationAction(ISD::VASTART , MVT::Other, Custom);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000335
Scott Michel266bc8f2007-12-04 22:23:35 +0000336 // Use the default implementation.
337 setOperationAction(ISD::VAARG , MVT::Other, Expand);
338 setOperationAction(ISD::VACOPY , MVT::Other, Expand);
339 setOperationAction(ISD::VAEND , MVT::Other, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000340 setOperationAction(ISD::STACKSAVE , MVT::Other, Expand);
Scott Michel266bc8f2007-12-04 22:23:35 +0000341 setOperationAction(ISD::STACKRESTORE , MVT::Other, Expand);
342 setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i32 , Expand);
343 setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i64 , Expand);
344
345 // Cell SPU has instructions for converting between i64 and fp.
346 setOperationAction(ISD::FP_TO_SINT, MVT::i64, Custom);
347 setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000348
Scott Michel266bc8f2007-12-04 22:23:35 +0000349 // To take advantage of the above i64 FP_TO_SINT, promote i32 FP_TO_UINT
350 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Promote);
351
352 // BUILD_PAIR can't be handled natively, and should be expanded to shl/or
353 setOperationAction(ISD::BUILD_PAIR, MVT::i64, Expand);
354
355 // First set operation action for all vector types to expand. Then we
356 // will selectively turn on ones that can be effectively codegen'd.
357 addRegisterClass(MVT::v16i8, SPU::VECREGRegisterClass);
358 addRegisterClass(MVT::v8i16, SPU::VECREGRegisterClass);
359 addRegisterClass(MVT::v4i32, SPU::VECREGRegisterClass);
360 addRegisterClass(MVT::v2i64, SPU::VECREGRegisterClass);
361 addRegisterClass(MVT::v4f32, SPU::VECREGRegisterClass);
362 addRegisterClass(MVT::v2f64, SPU::VECREGRegisterClass);
363
Scott Michel21213e72009-01-06 23:10:38 +0000364 // "Odd size" vector classes that we're willing to support:
365 addRegisterClass(MVT::v2i32, SPU::VECREGRegisterClass);
366
Duncan Sands83ec4b62008-06-06 12:08:01 +0000367 for (unsigned i = (unsigned)MVT::FIRST_VECTOR_VALUETYPE;
368 i <= (unsigned)MVT::LAST_VECTOR_VALUETYPE; ++i) {
369 MVT VT = (MVT::SimpleValueType)i;
Scott Michel266bc8f2007-12-04 22:23:35 +0000370
Duncan Sands83ec4b62008-06-06 12:08:01 +0000371 // add/sub are legal for all supported vector VT's.
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000372 setOperationAction(ISD::ADD, VT, Legal);
373 setOperationAction(ISD::SUB, VT, Legal);
Duncan Sands83ec4b62008-06-06 12:08:01 +0000374 // mul has to be custom lowered.
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000375 setOperationAction(ISD::MUL, VT, Legal);
Duncan Sands83ec4b62008-06-06 12:08:01 +0000376
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000377 setOperationAction(ISD::AND, VT, Legal);
378 setOperationAction(ISD::OR, VT, Legal);
379 setOperationAction(ISD::XOR, VT, Legal);
380 setOperationAction(ISD::LOAD, VT, Legal);
381 setOperationAction(ISD::SELECT, VT, Legal);
382 setOperationAction(ISD::STORE, VT, Legal);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000383
Scott Michel266bc8f2007-12-04 22:23:35 +0000384 // These operations need to be expanded:
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000385 setOperationAction(ISD::SDIV, VT, Expand);
386 setOperationAction(ISD::SREM, VT, Expand);
387 setOperationAction(ISD::UDIV, VT, Expand);
388 setOperationAction(ISD::UREM, VT, Expand);
Scott Michel266bc8f2007-12-04 22:23:35 +0000389
390 // Custom lower build_vector, constant pool spills, insert and
391 // extract vector elements:
Duncan Sands83ec4b62008-06-06 12:08:01 +0000392 setOperationAction(ISD::BUILD_VECTOR, VT, Custom);
393 setOperationAction(ISD::ConstantPool, VT, Custom);
394 setOperationAction(ISD::SCALAR_TO_VECTOR, VT, Custom);
395 setOperationAction(ISD::EXTRACT_VECTOR_ELT, VT, Custom);
396 setOperationAction(ISD::INSERT_VECTOR_ELT, VT, Custom);
397 setOperationAction(ISD::VECTOR_SHUFFLE, VT, Custom);
Scott Michel266bc8f2007-12-04 22:23:35 +0000398 }
399
Scott Michel266bc8f2007-12-04 22:23:35 +0000400 setOperationAction(ISD::AND, MVT::v16i8, Custom);
401 setOperationAction(ISD::OR, MVT::v16i8, Custom);
402 setOperationAction(ISD::XOR, MVT::v16i8, Custom);
403 setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4f32, Custom);
Scott Michel9de5d0d2008-01-11 02:53:15 +0000404
Scott Michel02d711b2008-12-30 23:28:25 +0000405 setOperationAction(ISD::FDIV, MVT::v4f32, Legal);
Scott Michel1df30c42008-12-29 03:23:36 +0000406
Scott Michel266bc8f2007-12-04 22:23:35 +0000407 setShiftAmountType(MVT::i32);
Scott Michelf0569be2008-12-27 04:51:36 +0000408 setBooleanContents(ZeroOrNegativeOneBooleanContent);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000409
Scott Michel266bc8f2007-12-04 22:23:35 +0000410 setStackPointerRegisterToSaveRestore(SPU::R1);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000411
Scott Michel266bc8f2007-12-04 22:23:35 +0000412 // We have target-specific dag combine patterns for the following nodes:
Scott Michel053c1da2008-01-29 02:16:57 +0000413 setTargetDAGCombine(ISD::ADD);
Scott Michela59d4692008-02-23 18:41:37 +0000414 setTargetDAGCombine(ISD::ZERO_EXTEND);
415 setTargetDAGCombine(ISD::SIGN_EXTEND);
416 setTargetDAGCombine(ISD::ANY_EXTEND);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000417
Scott Michel266bc8f2007-12-04 22:23:35 +0000418 computeRegisterProperties();
Scott Michel7a1c9e92008-11-22 23:50:42 +0000419
Scott Michele07d3de2008-12-09 03:37:19 +0000420 // Set pre-RA register scheduler default to BURR, which produces slightly
421 // better code than the default (could also be TDRR, but TargetLowering.h
422 // needs a mod to support that model):
423 setSchedulingPreference(SchedulingForRegPressure);
Scott Michel266bc8f2007-12-04 22:23:35 +0000424}
425
426const char *
427SPUTargetLowering::getTargetNodeName(unsigned Opcode) const
428{
429 if (node_names.empty()) {
430 node_names[(unsigned) SPUISD::RET_FLAG] = "SPUISD::RET_FLAG";
431 node_names[(unsigned) SPUISD::Hi] = "SPUISD::Hi";
432 node_names[(unsigned) SPUISD::Lo] = "SPUISD::Lo";
433 node_names[(unsigned) SPUISD::PCRelAddr] = "SPUISD::PCRelAddr";
Scott Michel9de5d0d2008-01-11 02:53:15 +0000434 node_names[(unsigned) SPUISD::AFormAddr] = "SPUISD::AFormAddr";
Scott Michel053c1da2008-01-29 02:16:57 +0000435 node_names[(unsigned) SPUISD::IndirectAddr] = "SPUISD::IndirectAddr";
Scott Michel266bc8f2007-12-04 22:23:35 +0000436 node_names[(unsigned) SPUISD::LDRESULT] = "SPUISD::LDRESULT";
437 node_names[(unsigned) SPUISD::CALL] = "SPUISD::CALL";
438 node_names[(unsigned) SPUISD::SHUFB] = "SPUISD::SHUFB";
Scott Michel7a1c9e92008-11-22 23:50:42 +0000439 node_names[(unsigned) SPUISD::SHUFFLE_MASK] = "SPUISD::SHUFFLE_MASK";
Scott Michel266bc8f2007-12-04 22:23:35 +0000440 node_names[(unsigned) SPUISD::CNTB] = "SPUISD::CNTB";
Scott Michel1df30c42008-12-29 03:23:36 +0000441 node_names[(unsigned) SPUISD::PREFSLOT2VEC] = "SPUISD::PREFSLOT2VEC";
Scott Michel104de432008-11-24 17:11:17 +0000442 node_names[(unsigned) SPUISD::VEC2PREFSLOT] = "SPUISD::VEC2PREFSLOT";
Scott Michela59d4692008-02-23 18:41:37 +0000443 node_names[(unsigned) SPUISD::SHLQUAD_L_BITS] = "SPUISD::SHLQUAD_L_BITS";
444 node_names[(unsigned) SPUISD::SHLQUAD_L_BYTES] = "SPUISD::SHLQUAD_L_BYTES";
Scott Michel266bc8f2007-12-04 22:23:35 +0000445 node_names[(unsigned) SPUISD::VEC_SHL] = "SPUISD::VEC_SHL";
446 node_names[(unsigned) SPUISD::VEC_SRL] = "SPUISD::VEC_SRL";
447 node_names[(unsigned) SPUISD::VEC_SRA] = "SPUISD::VEC_SRA";
448 node_names[(unsigned) SPUISD::VEC_ROTL] = "SPUISD::VEC_ROTL";
449 node_names[(unsigned) SPUISD::VEC_ROTR] = "SPUISD::VEC_ROTR";
Scott Micheld1e8d9c2009-01-21 04:58:48 +0000450 node_names[(unsigned) SPUISD::ROTBYTES_LEFT] = "SPUISD::ROTBYTES_LEFT";
451 node_names[(unsigned) SPUISD::ROTBYTES_LEFT_BITS] =
452 "SPUISD::ROTBYTES_LEFT_BITS";
Scott Michel8bf61e82008-06-02 22:18:03 +0000453 node_names[(unsigned) SPUISD::SELECT_MASK] = "SPUISD::SELECT_MASK";
Scott Michel266bc8f2007-12-04 22:23:35 +0000454 node_names[(unsigned) SPUISD::SELB] = "SPUISD::SELB";
Scott Michel94bd57e2009-01-15 04:41:47 +0000455 node_names[(unsigned) SPUISD::ADD64_MARKER] = "SPUISD::ADD64_MARKER";
456 node_names[(unsigned) SPUISD::SUB64_MARKER] = "SPUISD::SUB64_MARKER";
457 node_names[(unsigned) SPUISD::MUL64_MARKER] = "SPUISD::MUL64_MARKER";
Scott Michel266bc8f2007-12-04 22:23:35 +0000458 }
459
460 std::map<unsigned, const char *>::iterator i = node_names.find(Opcode);
461
462 return ((i != node_names.end()) ? i->second : 0);
463}
464
Scott Michelf0569be2008-12-27 04:51:36 +0000465//===----------------------------------------------------------------------===//
466// Return the Cell SPU's SETCC result type
467//===----------------------------------------------------------------------===//
468
Duncan Sands5480c042009-01-01 15:52:00 +0000469MVT SPUTargetLowering::getSetCCResultType(MVT VT) const {
Scott Michelf0569be2008-12-27 04:51:36 +0000470 // i16 and i32 are valid SETCC result types
471 return ((VT == MVT::i8 || VT == MVT::i16 || VT == MVT::i32) ? VT : MVT::i32);
Scott Michel78c47fa2008-03-10 16:58:52 +0000472}
473
Scott Michel266bc8f2007-12-04 22:23:35 +0000474//===----------------------------------------------------------------------===//
475// Calling convention code:
476//===----------------------------------------------------------------------===//
477
478#include "SPUGenCallingConv.inc"
479
480//===----------------------------------------------------------------------===//
481// LowerOperation implementation
482//===----------------------------------------------------------------------===//
483
484/// Custom lower loads for CellSPU
485/*!
486 All CellSPU loads and stores are aligned to 16-byte boundaries, so for elements
487 within a 16-byte block, we have to rotate to extract the requested element.
Scott Michel30ee7df2008-12-04 03:02:42 +0000488
489 For extending loads, we also want to ensure that the following sequence is
490 emitted, e.g. for MVT::f32 extending load to MVT::f64:
491
492\verbatim
Scott Michel1df30c42008-12-29 03:23:36 +0000493%1 v16i8,ch = load
Scott Michel30ee7df2008-12-04 03:02:42 +0000494%2 v16i8,ch = rotate %1
Scott Michel1df30c42008-12-29 03:23:36 +0000495%3 v4f8, ch = bitconvert %2
Scott Michel30ee7df2008-12-04 03:02:42 +0000496%4 f32 = vec2perfslot %3
497%5 f64 = fp_extend %4
498\endverbatim
499*/
Dan Gohman475871a2008-07-27 21:46:04 +0000500static SDValue
501LowerLOAD(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Scott Michel266bc8f2007-12-04 22:23:35 +0000502 LoadSDNode *LN = cast<LoadSDNode>(Op);
Dan Gohman475871a2008-07-27 21:46:04 +0000503 SDValue the_chain = LN->getChain();
Scott Michelf0569be2008-12-27 04:51:36 +0000504 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel30ee7df2008-12-04 03:02:42 +0000505 MVT InVT = LN->getMemoryVT();
506 MVT OutVT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +0000507 ISD::LoadExtType ExtType = LN->getExtensionType();
508 unsigned alignment = LN->getAlignment();
Scott Michelf0569be2008-12-27 04:51:36 +0000509 const valtype_map_s *vtm = getValueTypeMapEntry(InVT);
Dale Johannesen33c960f2009-02-04 20:06:27 +0000510 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +0000511
Scott Michel266bc8f2007-12-04 22:23:35 +0000512 switch (LN->getAddressingMode()) {
513 case ISD::UNINDEXED: {
Scott Michelf0569be2008-12-27 04:51:36 +0000514 SDValue result;
515 SDValue basePtr = LN->getBasePtr();
516 SDValue rotate;
Scott Michel266bc8f2007-12-04 22:23:35 +0000517
Scott Michelf0569be2008-12-27 04:51:36 +0000518 if (alignment == 16) {
519 ConstantSDNode *CN;
Scott Michel9de5d0d2008-01-11 02:53:15 +0000520
Scott Michelf0569be2008-12-27 04:51:36 +0000521 // Special cases for a known aligned load to simplify the base pointer
522 // and the rotation amount:
523 if (basePtr.getOpcode() == ISD::ADD
524 && (CN = dyn_cast<ConstantSDNode > (basePtr.getOperand(1))) != 0) {
525 // Known offset into basePtr
526 int64_t offset = CN->getSExtValue();
527 int64_t rotamt = int64_t((offset & 0xf) - vtm->prefslot_byte);
Scott Michel9de5d0d2008-01-11 02:53:15 +0000528
Scott Michelf0569be2008-12-27 04:51:36 +0000529 if (rotamt < 0)
530 rotamt += 16;
531
532 rotate = DAG.getConstant(rotamt, MVT::i16);
533
534 // Simplify the base pointer for this case:
535 basePtr = basePtr.getOperand(0);
536 if ((offset & ~0xf) > 0) {
Dale Johannesende064702009-02-06 21:50:26 +0000537 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000538 basePtr,
539 DAG.getConstant((offset & ~0xf), PtrVT));
540 }
541 } else if ((basePtr.getOpcode() == SPUISD::AFormAddr)
542 || (basePtr.getOpcode() == SPUISD::IndirectAddr
543 && basePtr.getOperand(0).getOpcode() == SPUISD::Hi
544 && basePtr.getOperand(1).getOpcode() == SPUISD::Lo)) {
545 // Plain aligned a-form address: rotate into preferred slot
546 // Same for (SPUindirect (SPUhi ...), (SPUlo ...))
547 int64_t rotamt = -vtm->prefslot_byte;
548 if (rotamt < 0)
549 rotamt += 16;
550 rotate = DAG.getConstant(rotamt, MVT::i16);
Scott Michel9de5d0d2008-01-11 02:53:15 +0000551 } else {
Scott Michelf0569be2008-12-27 04:51:36 +0000552 // Offset the rotate amount by the basePtr and the preferred slot
553 // byte offset
554 int64_t rotamt = -vtm->prefslot_byte;
555 if (rotamt < 0)
556 rotamt += 16;
Dale Johannesen33c960f2009-02-04 20:06:27 +0000557 rotate = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000558 basePtr,
Scott Michel7f9ba9b2008-01-30 02:55:46 +0000559 DAG.getConstant(rotamt, PtrVT));
Scott Michel9de5d0d2008-01-11 02:53:15 +0000560 }
Scott Michelf0569be2008-12-27 04:51:36 +0000561 } else {
562 // Unaligned load: must be more pessimistic about addressing modes:
563 if (basePtr.getOpcode() == ISD::ADD) {
564 MachineFunction &MF = DAG.getMachineFunction();
565 MachineRegisterInfo &RegInfo = MF.getRegInfo();
566 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
567 SDValue Flag;
Scott Michel9de5d0d2008-01-11 02:53:15 +0000568
Scott Michelf0569be2008-12-27 04:51:36 +0000569 SDValue Op0 = basePtr.getOperand(0);
570 SDValue Op1 = basePtr.getOperand(1);
571
572 if (isa<ConstantSDNode>(Op1)) {
573 // Convert the (add <ptr>, <const>) to an indirect address contained
574 // in a register. Note that this is done because we need to avoid
575 // creating a 0(reg) d-form address due to the SPU's block loads.
Dale Johannesende064702009-02-06 21:50:26 +0000576 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1);
Dale Johannesen33c960f2009-02-04 20:06:27 +0000577 the_chain = DAG.getCopyToReg(the_chain, dl, VReg, basePtr, Flag);
578 basePtr = DAG.getCopyFromReg(the_chain, dl, VReg, PtrVT);
Scott Michelf0569be2008-12-27 04:51:36 +0000579 } else {
580 // Convert the (add <arg1>, <arg2>) to an indirect address, which
581 // will likely be lowered as a reg(reg) x-form address.
Dale Johannesende064702009-02-06 21:50:26 +0000582 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1);
Scott Michelf0569be2008-12-27 04:51:36 +0000583 }
584 } else {
Dale Johannesende064702009-02-06 21:50:26 +0000585 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000586 basePtr,
587 DAG.getConstant(0, PtrVT));
588 }
589
590 // Offset the rotate amount by the basePtr and the preferred slot
591 // byte offset
Dale Johannesen33c960f2009-02-04 20:06:27 +0000592 rotate = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000593 basePtr,
594 DAG.getConstant(-vtm->prefslot_byte, PtrVT));
Scott Michel266bc8f2007-12-04 22:23:35 +0000595 }
Scott Michel9de5d0d2008-01-11 02:53:15 +0000596
Scott Michelf0569be2008-12-27 04:51:36 +0000597 // Re-emit as a v16i8 vector load
Dale Johannesen33c960f2009-02-04 20:06:27 +0000598 result = DAG.getLoad(MVT::v16i8, dl, the_chain, basePtr,
Scott Michelf0569be2008-12-27 04:51:36 +0000599 LN->getSrcValue(), LN->getSrcValueOffset(),
600 LN->isVolatile(), 16);
601
602 // Update the chain
603 the_chain = result.getValue(1);
604
605 // Rotate into the preferred slot:
Dale Johannesen33c960f2009-02-04 20:06:27 +0000606 result = DAG.getNode(SPUISD::ROTBYTES_LEFT, dl, MVT::v16i8,
Scott Michelf0569be2008-12-27 04:51:36 +0000607 result.getValue(0), rotate);
608
Scott Michel30ee7df2008-12-04 03:02:42 +0000609 // Convert the loaded v16i8 vector to the appropriate vector type
610 // specified by the operand:
611 MVT vecVT = MVT::getVectorVT(InVT, (128 / InVT.getSizeInBits()));
Dale Johannesen33c960f2009-02-04 20:06:27 +0000612 result = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, InVT,
613 DAG.getNode(ISD::BIT_CONVERT, dl, vecVT, result));
Scott Michel5af8f0e2008-07-16 17:17:29 +0000614
Scott Michel30ee7df2008-12-04 03:02:42 +0000615 // Handle extending loads by extending the scalar result:
616 if (ExtType == ISD::SEXTLOAD) {
Dale Johannesen33c960f2009-02-04 20:06:27 +0000617 result = DAG.getNode(ISD::SIGN_EXTEND, dl, OutVT, result);
Scott Michel30ee7df2008-12-04 03:02:42 +0000618 } else if (ExtType == ISD::ZEXTLOAD) {
Dale Johannesen33c960f2009-02-04 20:06:27 +0000619 result = DAG.getNode(ISD::ZERO_EXTEND, dl, OutVT, result);
Scott Michel30ee7df2008-12-04 03:02:42 +0000620 } else if (ExtType == ISD::EXTLOAD) {
621 unsigned NewOpc = ISD::ANY_EXTEND;
Scott Michel9de5d0d2008-01-11 02:53:15 +0000622
Scott Michel30ee7df2008-12-04 03:02:42 +0000623 if (OutVT.isFloatingPoint())
Scott Michel19c10e62009-01-26 03:37:41 +0000624 NewOpc = ISD::FP_EXTEND;
Scott Michel9de5d0d2008-01-11 02:53:15 +0000625
Dale Johannesen33c960f2009-02-04 20:06:27 +0000626 result = DAG.getNode(NewOpc, dl, OutVT, result);
Scott Michel9de5d0d2008-01-11 02:53:15 +0000627 }
628
Scott Michel30ee7df2008-12-04 03:02:42 +0000629 SDVTList retvts = DAG.getVTList(OutVT, MVT::Other);
Dan Gohman475871a2008-07-27 21:46:04 +0000630 SDValue retops[2] = {
Scott Michel58c58182008-01-17 20:38:41 +0000631 result,
Scott Michel7f9ba9b2008-01-30 02:55:46 +0000632 the_chain
Scott Michel58c58182008-01-17 20:38:41 +0000633 };
Scott Michel9de5d0d2008-01-11 02:53:15 +0000634
Dale Johannesen33c960f2009-02-04 20:06:27 +0000635 result = DAG.getNode(SPUISD::LDRESULT, dl, retvts,
Scott Michel58c58182008-01-17 20:38:41 +0000636 retops, sizeof(retops) / sizeof(retops[0]));
Scott Michel9de5d0d2008-01-11 02:53:15 +0000637 return result;
Scott Michel266bc8f2007-12-04 22:23:35 +0000638 }
639 case ISD::PRE_INC:
640 case ISD::PRE_DEC:
641 case ISD::POST_INC:
642 case ISD::POST_DEC:
643 case ISD::LAST_INDEXED_MODE:
644 cerr << "LowerLOAD: Got a LoadSDNode with an addr mode other than "
645 "UNINDEXED\n";
646 cerr << (unsigned) LN->getAddressingMode() << "\n";
647 abort();
648 /*NOTREACHED*/
649 }
650
Dan Gohman475871a2008-07-27 21:46:04 +0000651 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000652}
653
654/// Custom lower stores for CellSPU
655/*!
656 All CellSPU stores are aligned to 16-byte boundaries, so for elements
657 within a 16-byte block, we have to generate a shuffle to insert the
658 requested element into its place, then store the resulting block.
659 */
Dan Gohman475871a2008-07-27 21:46:04 +0000660static SDValue
661LowerSTORE(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Scott Michel266bc8f2007-12-04 22:23:35 +0000662 StoreSDNode *SN = cast<StoreSDNode>(Op);
Dan Gohman475871a2008-07-27 21:46:04 +0000663 SDValue Value = SN->getValue();
Duncan Sands83ec4b62008-06-06 12:08:01 +0000664 MVT VT = Value.getValueType();
665 MVT StVT = (!SN->isTruncatingStore() ? VT : SN->getMemoryVT());
666 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Dale Johannesen33c960f2009-02-04 20:06:27 +0000667 DebugLoc dl = Op.getDebugLoc();
Scott Michel9de5d0d2008-01-11 02:53:15 +0000668 unsigned alignment = SN->getAlignment();
Scott Michel266bc8f2007-12-04 22:23:35 +0000669
670 switch (SN->getAddressingMode()) {
671 case ISD::UNINDEXED: {
Scott Michel9c0c6b22008-11-21 02:56:16 +0000672 // The vector type we really want to load from the 16-byte chunk.
Scott Michel719b0e12008-11-19 17:45:08 +0000673 MVT vecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits())),
674 stVecVT = MVT::getVectorVT(StVT, (128 / StVT.getSizeInBits()));
Scott Michel266bc8f2007-12-04 22:23:35 +0000675
Scott Michelf0569be2008-12-27 04:51:36 +0000676 SDValue alignLoadVec;
677 SDValue basePtr = SN->getBasePtr();
678 SDValue the_chain = SN->getChain();
679 SDValue insertEltOffs;
Scott Michel266bc8f2007-12-04 22:23:35 +0000680
Scott Michelf0569be2008-12-27 04:51:36 +0000681 if (alignment == 16) {
682 ConstantSDNode *CN;
683
684 // Special cases for a known aligned load to simplify the base pointer
685 // and insertion byte:
686 if (basePtr.getOpcode() == ISD::ADD
687 && (CN = dyn_cast<ConstantSDNode>(basePtr.getOperand(1))) != 0) {
688 // Known offset into basePtr
689 int64_t offset = CN->getSExtValue();
690
691 // Simplify the base pointer for this case:
692 basePtr = basePtr.getOperand(0);
Dale Johannesende064702009-02-06 21:50:26 +0000693 insertEltOffs = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000694 basePtr,
695 DAG.getConstant((offset & 0xf), PtrVT));
696
697 if ((offset & ~0xf) > 0) {
Dale Johannesende064702009-02-06 21:50:26 +0000698 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000699 basePtr,
700 DAG.getConstant((offset & ~0xf), PtrVT));
701 }
702 } else {
703 // Otherwise, assume it's at byte 0 of basePtr
Dale Johannesende064702009-02-06 21:50:26 +0000704 insertEltOffs = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000705 basePtr,
706 DAG.getConstant(0, PtrVT));
707 }
708 } else {
709 // Unaligned load: must be more pessimistic about addressing modes:
710 if (basePtr.getOpcode() == ISD::ADD) {
711 MachineFunction &MF = DAG.getMachineFunction();
712 MachineRegisterInfo &RegInfo = MF.getRegInfo();
713 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
714 SDValue Flag;
715
716 SDValue Op0 = basePtr.getOperand(0);
717 SDValue Op1 = basePtr.getOperand(1);
718
719 if (isa<ConstantSDNode>(Op1)) {
720 // Convert the (add <ptr>, <const>) to an indirect address contained
721 // in a register. Note that this is done because we need to avoid
722 // creating a 0(reg) d-form address due to the SPU's block loads.
Dale Johannesende064702009-02-06 21:50:26 +0000723 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1);
Dale Johannesen33c960f2009-02-04 20:06:27 +0000724 the_chain = DAG.getCopyToReg(the_chain, dl, VReg, basePtr, Flag);
725 basePtr = DAG.getCopyFromReg(the_chain, dl, VReg, PtrVT);
Scott Michelf0569be2008-12-27 04:51:36 +0000726 } else {
727 // Convert the (add <arg1>, <arg2>) to an indirect address, which
728 // will likely be lowered as a reg(reg) x-form address.
Dale Johannesende064702009-02-06 21:50:26 +0000729 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Op0, Op1);
Scott Michelf0569be2008-12-27 04:51:36 +0000730 }
731 } else {
Dale Johannesende064702009-02-06 21:50:26 +0000732 basePtr = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000733 basePtr,
734 DAG.getConstant(0, PtrVT));
735 }
736
737 // Insertion point is solely determined by basePtr's contents
Dale Johannesen33c960f2009-02-04 20:06:27 +0000738 insertEltOffs = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000739 basePtr,
740 DAG.getConstant(0, PtrVT));
741 }
742
743 // Re-emit as a v16i8 vector load
Dale Johannesen33c960f2009-02-04 20:06:27 +0000744 alignLoadVec = DAG.getLoad(MVT::v16i8, dl, the_chain, basePtr,
Scott Michelf0569be2008-12-27 04:51:36 +0000745 SN->getSrcValue(), SN->getSrcValueOffset(),
746 SN->isVolatile(), 16);
747
748 // Update the chain
749 the_chain = alignLoadVec.getValue(1);
Scott Michel266bc8f2007-12-04 22:23:35 +0000750
Scott Michel9de5d0d2008-01-11 02:53:15 +0000751 LoadSDNode *LN = cast<LoadSDNode>(alignLoadVec);
Dan Gohman475871a2008-07-27 21:46:04 +0000752 SDValue theValue = SN->getValue();
753 SDValue result;
Scott Michel266bc8f2007-12-04 22:23:35 +0000754
755 if (StVT != VT
Scott Michel7f9ba9b2008-01-30 02:55:46 +0000756 && (theValue.getOpcode() == ISD::AssertZext
757 || theValue.getOpcode() == ISD::AssertSext)) {
Scott Michel266bc8f2007-12-04 22:23:35 +0000758 // Drill down and get the value for zero- and sign-extended
759 // quantities
Scott Michel5af8f0e2008-07-16 17:17:29 +0000760 theValue = theValue.getOperand(0);
Scott Michel266bc8f2007-12-04 22:23:35 +0000761 }
762
Scott Michel9de5d0d2008-01-11 02:53:15 +0000763 // If the base pointer is already a D-form address, then just create
764 // a new D-form address with a slot offset and the orignal base pointer.
765 // Otherwise generate a D-form address with the slot offset relative
766 // to the stack pointer, which is always aligned.
Scott Michelf0569be2008-12-27 04:51:36 +0000767#if !defined(NDEBUG)
768 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
769 cerr << "CellSPU LowerSTORE: basePtr = ";
770 basePtr.getNode()->dump(&DAG);
771 cerr << "\n";
772 }
773#endif
Scott Michel9de5d0d2008-01-11 02:53:15 +0000774
Scott Michel430a5552008-11-19 15:24:16 +0000775 SDValue insertEltOp =
Dale Johannesen33c960f2009-02-04 20:06:27 +0000776 DAG.getNode(SPUISD::SHUFFLE_MASK, dl, vecVT, insertEltOffs);
Scott Michel719b0e12008-11-19 17:45:08 +0000777 SDValue vectorizeOp =
Dale Johannesen33c960f2009-02-04 20:06:27 +0000778 DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, vecVT, theValue);
Scott Michel430a5552008-11-19 15:24:16 +0000779
Dale Johannesen33c960f2009-02-04 20:06:27 +0000780 result = DAG.getNode(SPUISD::SHUFB, dl, vecVT,
Scott Michel19c10e62009-01-26 03:37:41 +0000781 vectorizeOp, alignLoadVec,
Dale Johannesen33c960f2009-02-04 20:06:27 +0000782 DAG.getNode(ISD::BIT_CONVERT, dl,
783 MVT::v4i32, insertEltOp));
Scott Michel266bc8f2007-12-04 22:23:35 +0000784
Dale Johannesen33c960f2009-02-04 20:06:27 +0000785 result = DAG.getStore(the_chain, dl, result, basePtr,
Scott Michel266bc8f2007-12-04 22:23:35 +0000786 LN->getSrcValue(), LN->getSrcValueOffset(),
787 LN->isVolatile(), LN->getAlignment());
788
Scott Michel23f2ff72008-12-04 17:16:59 +0000789#if 0 && !defined(NDEBUG)
Scott Michel430a5552008-11-19 15:24:16 +0000790 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
791 const SDValue &currentRoot = DAG.getRoot();
792
793 DAG.setRoot(result);
794 cerr << "------- CellSPU:LowerStore result:\n";
795 DAG.dump();
796 cerr << "-------\n";
797 DAG.setRoot(currentRoot);
798 }
799#endif
Scott Michelb30e8f62008-12-02 19:53:53 +0000800
Scott Michel266bc8f2007-12-04 22:23:35 +0000801 return result;
802 /*UNREACHED*/
803 }
804 case ISD::PRE_INC:
805 case ISD::PRE_DEC:
806 case ISD::POST_INC:
807 case ISD::POST_DEC:
808 case ISD::LAST_INDEXED_MODE:
809 cerr << "LowerLOAD: Got a LoadSDNode with an addr mode other than "
810 "UNINDEXED\n";
811 cerr << (unsigned) SN->getAddressingMode() << "\n";
812 abort();
813 /*NOTREACHED*/
814 }
815
Dan Gohman475871a2008-07-27 21:46:04 +0000816 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000817}
818
Scott Michel94bd57e2009-01-15 04:41:47 +0000819//! Generate the address of a constant pool entry.
820SDValue
Dan Gohman475871a2008-07-27 21:46:04 +0000821LowerConstantPool(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000822 MVT PtrVT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +0000823 ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(Op);
824 Constant *C = CP->getConstVal();
Dan Gohman475871a2008-07-27 21:46:04 +0000825 SDValue CPI = DAG.getTargetConstantPool(C, PtrVT, CP->getAlignment());
826 SDValue Zero = DAG.getConstant(0, PtrVT);
Scott Michel9de5d0d2008-01-11 02:53:15 +0000827 const TargetMachine &TM = DAG.getTarget();
Dale Johannesende064702009-02-06 21:50:26 +0000828 // FIXME there is no actual debug info here
829 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +0000830
831 if (TM.getRelocationModel() == Reloc::Static) {
832 if (!ST->usingLargeMem()) {
Dan Gohman475871a2008-07-27 21:46:04 +0000833 // Just return the SDValue with the constant pool address in it.
Dale Johannesende064702009-02-06 21:50:26 +0000834 return DAG.getNode(SPUISD::AFormAddr, dl, PtrVT, CPI, Zero);
Scott Michel266bc8f2007-12-04 22:23:35 +0000835 } else {
Dale Johannesende064702009-02-06 21:50:26 +0000836 SDValue Hi = DAG.getNode(SPUISD::Hi, dl, PtrVT, CPI, Zero);
837 SDValue Lo = DAG.getNode(SPUISD::Lo, dl, PtrVT, CPI, Zero);
838 return DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Hi, Lo);
Scott Michel266bc8f2007-12-04 22:23:35 +0000839 }
840 }
841
842 assert(0 &&
Gabor Greif93c53e52008-08-31 15:37:04 +0000843 "LowerConstantPool: Relocation model other than static"
844 " not supported.");
Dan Gohman475871a2008-07-27 21:46:04 +0000845 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000846}
847
Scott Michel94bd57e2009-01-15 04:41:47 +0000848//! Alternate entry point for generating the address of a constant pool entry
849SDValue
850SPU::LowerConstantPool(SDValue Op, SelectionDAG &DAG, const SPUTargetMachine &TM) {
851 return ::LowerConstantPool(Op, DAG, TM.getSubtargetImpl());
852}
853
Dan Gohman475871a2008-07-27 21:46:04 +0000854static SDValue
855LowerJumpTable(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000856 MVT PtrVT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +0000857 JumpTableSDNode *JT = cast<JumpTableSDNode>(Op);
Dan Gohman475871a2008-07-27 21:46:04 +0000858 SDValue JTI = DAG.getTargetJumpTable(JT->getIndex(), PtrVT);
859 SDValue Zero = DAG.getConstant(0, PtrVT);
Scott Michel266bc8f2007-12-04 22:23:35 +0000860 const TargetMachine &TM = DAG.getTarget();
Dale Johannesende064702009-02-06 21:50:26 +0000861 // FIXME there is no actual debug info here
862 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +0000863
864 if (TM.getRelocationModel() == Reloc::Static) {
Scott Michela59d4692008-02-23 18:41:37 +0000865 if (!ST->usingLargeMem()) {
Dale Johannesende064702009-02-06 21:50:26 +0000866 return DAG.getNode(SPUISD::AFormAddr, dl, PtrVT, JTI, Zero);
Scott Michela59d4692008-02-23 18:41:37 +0000867 } else {
Dale Johannesende064702009-02-06 21:50:26 +0000868 SDValue Hi = DAG.getNode(SPUISD::Hi, dl, PtrVT, JTI, Zero);
869 SDValue Lo = DAG.getNode(SPUISD::Lo, dl, PtrVT, JTI, Zero);
870 return DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Hi, Lo);
Scott Michela59d4692008-02-23 18:41:37 +0000871 }
Scott Michel266bc8f2007-12-04 22:23:35 +0000872 }
873
874 assert(0 &&
875 "LowerJumpTable: Relocation model other than static not supported.");
Dan Gohman475871a2008-07-27 21:46:04 +0000876 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000877}
878
Dan Gohman475871a2008-07-27 21:46:04 +0000879static SDValue
880LowerGlobalAddress(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000881 MVT PtrVT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +0000882 GlobalAddressSDNode *GSDN = cast<GlobalAddressSDNode>(Op);
883 GlobalValue *GV = GSDN->getGlobal();
Dan Gohman475871a2008-07-27 21:46:04 +0000884 SDValue GA = DAG.getTargetGlobalAddress(GV, PtrVT, GSDN->getOffset());
Scott Michel266bc8f2007-12-04 22:23:35 +0000885 const TargetMachine &TM = DAG.getTarget();
Dan Gohman475871a2008-07-27 21:46:04 +0000886 SDValue Zero = DAG.getConstant(0, PtrVT);
Dale Johannesende064702009-02-06 21:50:26 +0000887 // FIXME there is no actual debug info here
888 DebugLoc dl = Op.getDebugLoc();
Scott Michel5af8f0e2008-07-16 17:17:29 +0000889
Scott Michel266bc8f2007-12-04 22:23:35 +0000890 if (TM.getRelocationModel() == Reloc::Static) {
Scott Michel053c1da2008-01-29 02:16:57 +0000891 if (!ST->usingLargeMem()) {
Dale Johannesende064702009-02-06 21:50:26 +0000892 return DAG.getNode(SPUISD::AFormAddr, dl, PtrVT, GA, Zero);
Scott Michel053c1da2008-01-29 02:16:57 +0000893 } else {
Dale Johannesende064702009-02-06 21:50:26 +0000894 SDValue Hi = DAG.getNode(SPUISD::Hi, dl, PtrVT, GA, Zero);
895 SDValue Lo = DAG.getNode(SPUISD::Lo, dl, PtrVT, GA, Zero);
896 return DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, Hi, Lo);
Scott Michel053c1da2008-01-29 02:16:57 +0000897 }
Scott Michel266bc8f2007-12-04 22:23:35 +0000898 } else {
899 cerr << "LowerGlobalAddress: Relocation model other than static not "
Scott Michel7f9ba9b2008-01-30 02:55:46 +0000900 << "supported.\n";
Scott Michel266bc8f2007-12-04 22:23:35 +0000901 abort();
902 /*NOTREACHED*/
903 }
904
Dan Gohman475871a2008-07-27 21:46:04 +0000905 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000906}
907
Nate Begemanccef5802008-02-14 18:43:04 +0000908//! Custom lower double precision floating point constants
Dan Gohman475871a2008-07-27 21:46:04 +0000909static SDValue
910LowerConstantFP(SDValue Op, SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000911 MVT VT = Op.getValueType();
Dale Johannesende064702009-02-06 21:50:26 +0000912 // FIXME there is no actual debug info here
913 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +0000914
Nate Begemanccef5802008-02-14 18:43:04 +0000915 if (VT == MVT::f64) {
Scott Michel1a6cdb62008-12-01 17:56:02 +0000916 ConstantFPSDNode *FP = cast<ConstantFPSDNode>(Op.getNode());
917
918 assert((FP != 0) &&
919 "LowerConstantFP: Node is not ConstantFPSDNode");
Scott Michel1df30c42008-12-29 03:23:36 +0000920
Scott Michel170783a2007-12-19 20:15:47 +0000921 uint64_t dbits = DoubleToBits(FP->getValueAPF().convertToDouble());
Scott Michel1a6cdb62008-12-01 17:56:02 +0000922 SDValue T = DAG.getConstant(dbits, MVT::i64);
Evan Chenga87008d2009-02-25 22:49:59 +0000923 SDValue Tvec = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v2i64, T, T);
Dale Johannesende064702009-02-06 21:50:26 +0000924 return DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT,
Dale Johannesenb300d2a2009-02-07 00:55:49 +0000925 DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v2f64, Tvec));
Scott Michel266bc8f2007-12-04 22:23:35 +0000926 }
927
Dan Gohman475871a2008-07-27 21:46:04 +0000928 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000929}
930
Dan Gohman475871a2008-07-27 21:46:04 +0000931static SDValue
Dan Gohman475871a2008-07-27 21:46:04 +0000932LowerFORMAL_ARGUMENTS(SDValue Op, SelectionDAG &DAG, int &VarArgsFrameIndex)
Scott Michel266bc8f2007-12-04 22:23:35 +0000933{
934 MachineFunction &MF = DAG.getMachineFunction();
935 MachineFrameInfo *MFI = MF.getFrameInfo();
Chris Lattner84bc5422007-12-31 04:13:23 +0000936 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Micheld976c212008-10-30 01:51:48 +0000937 SmallVector<SDValue, 48> ArgValues;
Dan Gohman475871a2008-07-27 21:46:04 +0000938 SDValue Root = Op.getOperand(0);
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +0000939 bool isVarArg = cast<ConstantSDNode>(Op.getOperand(2))->getZExtValue() != 0;
Dale Johannesen33c960f2009-02-04 20:06:27 +0000940 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +0000941
942 const unsigned *ArgRegs = SPURegisterInfo::getArgRegs();
943 const unsigned NumArgRegs = SPURegisterInfo::getNumArgRegs();
Scott Michel5af8f0e2008-07-16 17:17:29 +0000944
Scott Michel266bc8f2007-12-04 22:23:35 +0000945 unsigned ArgOffset = SPUFrameInfo::minStackSize();
946 unsigned ArgRegIdx = 0;
947 unsigned StackSlotSize = SPUFrameInfo::stackSlotSize();
Scott Michel5af8f0e2008-07-16 17:17:29 +0000948
Duncan Sands83ec4b62008-06-06 12:08:01 +0000949 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel5af8f0e2008-07-16 17:17:29 +0000950
Scott Michel266bc8f2007-12-04 22:23:35 +0000951 // Add DAG nodes to load the arguments or copy them out of registers.
Gabor Greif93c53e52008-08-31 15:37:04 +0000952 for (unsigned ArgNo = 0, e = Op.getNode()->getNumValues() - 1;
953 ArgNo != e; ++ArgNo) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000954 MVT ObjectVT = Op.getValue(ArgNo).getValueType();
955 unsigned ObjSize = ObjectVT.getSizeInBits()/8;
Scott Micheld976c212008-10-30 01:51:48 +0000956 SDValue ArgVal;
Scott Michel266bc8f2007-12-04 22:23:35 +0000957
Scott Micheld976c212008-10-30 01:51:48 +0000958 if (ArgRegIdx < NumArgRegs) {
959 const TargetRegisterClass *ArgRegClass;
Scott Michel5af8f0e2008-07-16 17:17:29 +0000960
Scott Micheld976c212008-10-30 01:51:48 +0000961 switch (ObjectVT.getSimpleVT()) {
962 default: {
Scott Michel9c0c6b22008-11-21 02:56:16 +0000963 cerr << "LowerFORMAL_ARGUMENTS Unhandled argument type: "
964 << ObjectVT.getMVTString()
965 << "\n";
966 abort();
Scott Micheld976c212008-10-30 01:51:48 +0000967 }
968 case MVT::i8:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000969 ArgRegClass = &SPU::R8CRegClass;
970 break;
Scott Micheld976c212008-10-30 01:51:48 +0000971 case MVT::i16:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000972 ArgRegClass = &SPU::R16CRegClass;
973 break;
Scott Micheld976c212008-10-30 01:51:48 +0000974 case MVT::i32:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000975 ArgRegClass = &SPU::R32CRegClass;
976 break;
Scott Micheld976c212008-10-30 01:51:48 +0000977 case MVT::i64:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000978 ArgRegClass = &SPU::R64CRegClass;
979 break;
Scott Micheldd950092009-01-06 03:36:14 +0000980 case MVT::i128:
981 ArgRegClass = &SPU::GPRCRegClass;
982 break;
Scott Micheld976c212008-10-30 01:51:48 +0000983 case MVT::f32:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000984 ArgRegClass = &SPU::R32FPRegClass;
985 break;
Scott Micheld976c212008-10-30 01:51:48 +0000986 case MVT::f64:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000987 ArgRegClass = &SPU::R64FPRegClass;
988 break;
Scott Micheld976c212008-10-30 01:51:48 +0000989 case MVT::v2f64:
990 case MVT::v4f32:
991 case MVT::v2i64:
992 case MVT::v4i32:
993 case MVT::v8i16:
994 case MVT::v16i8:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000995 ArgRegClass = &SPU::VECREGRegClass;
996 break;
Scott Micheld976c212008-10-30 01:51:48 +0000997 }
998
999 unsigned VReg = RegInfo.createVirtualRegister(ArgRegClass);
1000 RegInfo.addLiveIn(ArgRegs[ArgRegIdx], VReg);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001001 ArgVal = DAG.getCopyFromReg(Root, dl, VReg, ObjectVT);
Scott Micheld976c212008-10-30 01:51:48 +00001002 ++ArgRegIdx;
1003 } else {
1004 // We need to load the argument to a virtual register if we determined
1005 // above that we ran out of physical registers of the appropriate type
1006 // or we're forced to do vararg
Chris Lattner9f72d1a2008-02-13 07:35:30 +00001007 int FI = MFI->CreateFixedObject(ObjSize, ArgOffset);
Dan Gohman475871a2008-07-27 21:46:04 +00001008 SDValue FIN = DAG.getFrameIndex(FI, PtrVT);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001009 ArgVal = DAG.getLoad(ObjectVT, dl, Root, FIN, NULL, 0);
Scott Michel266bc8f2007-12-04 22:23:35 +00001010 ArgOffset += StackSlotSize;
1011 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001012
Scott Michel266bc8f2007-12-04 22:23:35 +00001013 ArgValues.push_back(ArgVal);
Scott Micheld976c212008-10-30 01:51:48 +00001014 // Update the chain
1015 Root = ArgVal.getOperand(0);
Scott Michel266bc8f2007-12-04 22:23:35 +00001016 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001017
Scott Micheld976c212008-10-30 01:51:48 +00001018 // vararg handling:
Scott Michel266bc8f2007-12-04 22:23:35 +00001019 if (isVarArg) {
Scott Micheld976c212008-10-30 01:51:48 +00001020 // unsigned int ptr_size = PtrVT.getSizeInBits() / 8;
1021 // We will spill (79-3)+1 registers to the stack
1022 SmallVector<SDValue, 79-3+1> MemOps;
1023
1024 // Create the frame slot
1025
Scott Michel266bc8f2007-12-04 22:23:35 +00001026 for (; ArgRegIdx != NumArgRegs; ++ArgRegIdx) {
Scott Micheld976c212008-10-30 01:51:48 +00001027 VarArgsFrameIndex = MFI->CreateFixedObject(StackSlotSize, ArgOffset);
1028 SDValue FIN = DAG.getFrameIndex(VarArgsFrameIndex, PtrVT);
1029 SDValue ArgVal = DAG.getRegister(ArgRegs[ArgRegIdx], MVT::v16i8);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001030 SDValue Store = DAG.getStore(Root, dl, ArgVal, FIN, NULL, 0);
Scott Micheld976c212008-10-30 01:51:48 +00001031 Root = Store.getOperand(0);
Scott Michel266bc8f2007-12-04 22:23:35 +00001032 MemOps.push_back(Store);
Scott Micheld976c212008-10-30 01:51:48 +00001033
1034 // Increment address by stack slot size for the next stored argument
1035 ArgOffset += StackSlotSize;
Scott Michel266bc8f2007-12-04 22:23:35 +00001036 }
1037 if (!MemOps.empty())
Dale Johannesen33c960f2009-02-04 20:06:27 +00001038 Root = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
1039 &MemOps[0], MemOps.size());
Scott Michel266bc8f2007-12-04 22:23:35 +00001040 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001041
Scott Michel266bc8f2007-12-04 22:23:35 +00001042 ArgValues.push_back(Root);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001043
Scott Michel266bc8f2007-12-04 22:23:35 +00001044 // Return the new list of results.
Dale Johannesen33c960f2009-02-04 20:06:27 +00001045 return DAG.getNode(ISD::MERGE_VALUES, dl, Op.getNode()->getVTList(),
Duncan Sandsaaffa052008-12-01 11:41:29 +00001046 &ArgValues[0], ArgValues.size());
Scott Michel266bc8f2007-12-04 22:23:35 +00001047}
1048
1049/// isLSAAddress - Return the immediate to use if the specified
1050/// value is representable as a LSA address.
Dan Gohman475871a2008-07-27 21:46:04 +00001051static SDNode *isLSAAddress(SDValue Op, SelectionDAG &DAG) {
Scott Michel19fd42a2008-11-11 03:06:06 +00001052 ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op);
Scott Michel266bc8f2007-12-04 22:23:35 +00001053 if (!C) return 0;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001054
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001055 int Addr = C->getZExtValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001056 if ((Addr & 3) != 0 || // Low 2 bits are implicitly zero.
1057 (Addr << 14 >> 14) != Addr)
1058 return 0; // Top 14 bits have to be sext of immediate.
Scott Michel5af8f0e2008-07-16 17:17:29 +00001059
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001060 return DAG.getConstant((int)C->getZExtValue() >> 2, MVT::i32).getNode();
Scott Michel266bc8f2007-12-04 22:23:35 +00001061}
1062
Scott Michel21213e72009-01-06 23:10:38 +00001063static SDValue
Dan Gohman475871a2008-07-27 21:46:04 +00001064LowerCALL(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Dan Gohman095cc292008-09-13 01:54:27 +00001065 CallSDNode *TheCall = cast<CallSDNode>(Op.getNode());
1066 SDValue Chain = TheCall->getChain();
Dan Gohman095cc292008-09-13 01:54:27 +00001067 SDValue Callee = TheCall->getCallee();
1068 unsigned NumOps = TheCall->getNumArgs();
Scott Michel266bc8f2007-12-04 22:23:35 +00001069 unsigned StackSlotSize = SPUFrameInfo::stackSlotSize();
1070 const unsigned *ArgRegs = SPURegisterInfo::getArgRegs();
1071 const unsigned NumArgRegs = SPURegisterInfo::getNumArgRegs();
Dale Johannesen33c960f2009-02-04 20:06:27 +00001072 DebugLoc dl = TheCall->getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +00001073
1074 // Handy pointer type
Duncan Sands83ec4b62008-06-06 12:08:01 +00001075 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel5af8f0e2008-07-16 17:17:29 +00001076
Scott Michel266bc8f2007-12-04 22:23:35 +00001077 // Accumulate how many bytes are to be pushed on the stack, including the
1078 // linkage area, and parameter passing area. According to the SPU ABI,
1079 // we minimally need space for [LR] and [SP]
1080 unsigned NumStackBytes = SPUFrameInfo::minStackSize();
Scott Michel5af8f0e2008-07-16 17:17:29 +00001081
Scott Michel266bc8f2007-12-04 22:23:35 +00001082 // Set up a copy of the stack pointer for use loading and storing any
1083 // arguments that may not fit in the registers available for argument
1084 // passing.
Dan Gohman475871a2008-07-27 21:46:04 +00001085 SDValue StackPtr = DAG.getRegister(SPU::R1, MVT::i32);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001086
Scott Michel266bc8f2007-12-04 22:23:35 +00001087 // Figure out which arguments are going to go in registers, and which in
1088 // memory.
1089 unsigned ArgOffset = SPUFrameInfo::minStackSize(); // Just below [LR]
1090 unsigned ArgRegIdx = 0;
1091
1092 // Keep track of registers passing arguments
Dan Gohman475871a2008-07-27 21:46:04 +00001093 std::vector<std::pair<unsigned, SDValue> > RegsToPass;
Scott Michel266bc8f2007-12-04 22:23:35 +00001094 // And the arguments passed on the stack
Dan Gohman475871a2008-07-27 21:46:04 +00001095 SmallVector<SDValue, 8> MemOpChains;
Scott Michel266bc8f2007-12-04 22:23:35 +00001096
1097 for (unsigned i = 0; i != NumOps; ++i) {
Dan Gohman095cc292008-09-13 01:54:27 +00001098 SDValue Arg = TheCall->getArg(i);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001099
Scott Michel266bc8f2007-12-04 22:23:35 +00001100 // PtrOff will be used to store the current argument to the stack if a
1101 // register cannot be found for it.
Dan Gohman475871a2008-07-27 21:46:04 +00001102 SDValue PtrOff = DAG.getConstant(ArgOffset, StackPtr.getValueType());
Dale Johannesen33c960f2009-02-04 20:06:27 +00001103 PtrOff = DAG.getNode(ISD::ADD, dl, PtrVT, StackPtr, PtrOff);
Scott Michel266bc8f2007-12-04 22:23:35 +00001104
Duncan Sands83ec4b62008-06-06 12:08:01 +00001105 switch (Arg.getValueType().getSimpleVT()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001106 default: assert(0 && "Unexpected ValueType for argument!");
Scott Micheldd950092009-01-06 03:36:14 +00001107 case MVT::i8:
1108 case MVT::i16:
Scott Michel266bc8f2007-12-04 22:23:35 +00001109 case MVT::i32:
1110 case MVT::i64:
1111 case MVT::i128:
1112 if (ArgRegIdx != NumArgRegs) {
1113 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1114 } else {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001115 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001116 ArgOffset += StackSlotSize;
Scott Michel266bc8f2007-12-04 22:23:35 +00001117 }
1118 break;
1119 case MVT::f32:
1120 case MVT::f64:
1121 if (ArgRegIdx != NumArgRegs) {
1122 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1123 } else {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001124 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001125 ArgOffset += StackSlotSize;
Scott Michel266bc8f2007-12-04 22:23:35 +00001126 }
1127 break;
Scott Michelcc188272008-12-04 21:01:44 +00001128 case MVT::v2i64:
1129 case MVT::v2f64:
Scott Michel266bc8f2007-12-04 22:23:35 +00001130 case MVT::v4f32:
1131 case MVT::v4i32:
1132 case MVT::v8i16:
1133 case MVT::v16i8:
1134 if (ArgRegIdx != NumArgRegs) {
1135 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1136 } else {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001137 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001138 ArgOffset += StackSlotSize;
Scott Michel266bc8f2007-12-04 22:23:35 +00001139 }
1140 break;
1141 }
1142 }
1143
1144 // Update number of stack bytes actually used, insert a call sequence start
1145 NumStackBytes = (ArgOffset - SPUFrameInfo::minStackSize());
Chris Lattnere563bbc2008-10-11 22:08:30 +00001146 Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumStackBytes,
1147 true));
Scott Michel266bc8f2007-12-04 22:23:35 +00001148
1149 if (!MemOpChains.empty()) {
1150 // Adjust the stack pointer for the stack arguments.
Dale Johannesen33c960f2009-02-04 20:06:27 +00001151 Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
Scott Michel266bc8f2007-12-04 22:23:35 +00001152 &MemOpChains[0], MemOpChains.size());
1153 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001154
Scott Michel266bc8f2007-12-04 22:23:35 +00001155 // Build a sequence of copy-to-reg nodes chained together with token chain
1156 // and flag operands which copy the outgoing args into the appropriate regs.
Dan Gohman475871a2008-07-27 21:46:04 +00001157 SDValue InFlag;
Scott Michel266bc8f2007-12-04 22:23:35 +00001158 for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i) {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001159 Chain = DAG.getCopyToReg(Chain, dl, RegsToPass[i].first,
1160 RegsToPass[i].second, InFlag);
Scott Michel266bc8f2007-12-04 22:23:35 +00001161 InFlag = Chain.getValue(1);
1162 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001163
Dan Gohman475871a2008-07-27 21:46:04 +00001164 SmallVector<SDValue, 8> Ops;
Scott Michel266bc8f2007-12-04 22:23:35 +00001165 unsigned CallOpc = SPUISD::CALL;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001166
Bill Wendling056292f2008-09-16 21:48:12 +00001167 // If the callee is a GlobalAddress/ExternalSymbol node (quite common, every
1168 // direct call is) turn it into a TargetGlobalAddress/TargetExternalSymbol
1169 // node so that legalize doesn't hack it.
Scott Michel19fd42a2008-11-11 03:06:06 +00001170 if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee)) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001171 GlobalValue *GV = G->getGlobal();
Duncan Sands83ec4b62008-06-06 12:08:01 +00001172 MVT CalleeVT = Callee.getValueType();
Dan Gohman475871a2008-07-27 21:46:04 +00001173 SDValue Zero = DAG.getConstant(0, PtrVT);
1174 SDValue GA = DAG.getTargetGlobalAddress(GV, CalleeVT);
Scott Michel266bc8f2007-12-04 22:23:35 +00001175
Scott Michel9de5d0d2008-01-11 02:53:15 +00001176 if (!ST->usingLargeMem()) {
1177 // Turn calls to targets that are defined (i.e., have bodies) into BRSL
1178 // style calls, otherwise, external symbols are BRASL calls. This assumes
1179 // that declared/defined symbols are in the same compilation unit and can
1180 // be reached through PC-relative jumps.
1181 //
1182 // NOTE:
1183 // This may be an unsafe assumption for JIT and really large compilation
1184 // units.
1185 if (GV->isDeclaration()) {
Dale Johannesende064702009-02-06 21:50:26 +00001186 Callee = DAG.getNode(SPUISD::AFormAddr, dl, CalleeVT, GA, Zero);
Scott Michel9de5d0d2008-01-11 02:53:15 +00001187 } else {
Dale Johannesende064702009-02-06 21:50:26 +00001188 Callee = DAG.getNode(SPUISD::PCRelAddr, dl, CalleeVT, GA, Zero);
Scott Michel9de5d0d2008-01-11 02:53:15 +00001189 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001190 } else {
Scott Michel9de5d0d2008-01-11 02:53:15 +00001191 // "Large memory" mode: Turn all calls into indirect calls with a X-form
1192 // address pairs:
Dale Johannesende064702009-02-06 21:50:26 +00001193 Callee = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, GA, Zero);
Scott Michel266bc8f2007-12-04 22:23:35 +00001194 }
Scott Michel1df30c42008-12-29 03:23:36 +00001195 } else if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(Callee)) {
1196 MVT CalleeVT = Callee.getValueType();
1197 SDValue Zero = DAG.getConstant(0, PtrVT);
1198 SDValue ExtSym = DAG.getTargetExternalSymbol(S->getSymbol(),
1199 Callee.getValueType());
1200
1201 if (!ST->usingLargeMem()) {
Dale Johannesende064702009-02-06 21:50:26 +00001202 Callee = DAG.getNode(SPUISD::AFormAddr, dl, CalleeVT, ExtSym, Zero);
Scott Michel1df30c42008-12-29 03:23:36 +00001203 } else {
Dale Johannesende064702009-02-06 21:50:26 +00001204 Callee = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT, ExtSym, Zero);
Scott Michel1df30c42008-12-29 03:23:36 +00001205 }
1206 } else if (SDNode *Dest = isLSAAddress(Callee, DAG)) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001207 // If this is an absolute destination address that appears to be a legal
1208 // local store address, use the munged value.
Dan Gohman475871a2008-07-27 21:46:04 +00001209 Callee = SDValue(Dest, 0);
Scott Michel9de5d0d2008-01-11 02:53:15 +00001210 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001211
1212 Ops.push_back(Chain);
1213 Ops.push_back(Callee);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001214
Scott Michel266bc8f2007-12-04 22:23:35 +00001215 // Add argument registers to the end of the list so that they are known live
1216 // into the call.
1217 for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i)
Scott Michel5af8f0e2008-07-16 17:17:29 +00001218 Ops.push_back(DAG.getRegister(RegsToPass[i].first,
Scott Michel266bc8f2007-12-04 22:23:35 +00001219 RegsToPass[i].second.getValueType()));
Scott Michel5af8f0e2008-07-16 17:17:29 +00001220
Gabor Greifba36cb52008-08-28 21:40:38 +00001221 if (InFlag.getNode())
Scott Michel266bc8f2007-12-04 22:23:35 +00001222 Ops.push_back(InFlag);
Duncan Sands4bdcb612008-07-02 17:40:58 +00001223 // Returns a chain and a flag for retval copy to use.
Dale Johannesen33c960f2009-02-04 20:06:27 +00001224 Chain = DAG.getNode(CallOpc, dl, DAG.getVTList(MVT::Other, MVT::Flag),
Duncan Sands4bdcb612008-07-02 17:40:58 +00001225 &Ops[0], Ops.size());
Scott Michel266bc8f2007-12-04 22:23:35 +00001226 InFlag = Chain.getValue(1);
1227
Chris Lattnere563bbc2008-10-11 22:08:30 +00001228 Chain = DAG.getCALLSEQ_END(Chain, DAG.getIntPtrConstant(NumStackBytes, true),
1229 DAG.getIntPtrConstant(0, true), InFlag);
Dan Gohman095cc292008-09-13 01:54:27 +00001230 if (TheCall->getValueType(0) != MVT::Other)
Evan Chengebaaa912008-02-05 22:44:06 +00001231 InFlag = Chain.getValue(1);
1232
Dan Gohman475871a2008-07-27 21:46:04 +00001233 SDValue ResultVals[3];
Scott Michel266bc8f2007-12-04 22:23:35 +00001234 unsigned NumResults = 0;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001235
Scott Michel266bc8f2007-12-04 22:23:35 +00001236 // If the call has results, copy the values out of the ret val registers.
Dan Gohman095cc292008-09-13 01:54:27 +00001237 switch (TheCall->getValueType(0).getSimpleVT()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001238 default: assert(0 && "Unexpected ret value!");
1239 case MVT::Other: break;
1240 case MVT::i32:
Dan Gohman095cc292008-09-13 01:54:27 +00001241 if (TheCall->getValueType(1) == MVT::i32) {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001242 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R4,
1243 MVT::i32, InFlag).getValue(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00001244 ResultVals[0] = Chain.getValue(0);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001245 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i32,
Scott Michel266bc8f2007-12-04 22:23:35 +00001246 Chain.getValue(2)).getValue(1);
1247 ResultVals[1] = Chain.getValue(0);
1248 NumResults = 2;
Scott Michel266bc8f2007-12-04 22:23:35 +00001249 } else {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001250 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i32,
1251 InFlag).getValue(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00001252 ResultVals[0] = Chain.getValue(0);
1253 NumResults = 1;
1254 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001255 break;
1256 case MVT::i64:
Dale Johannesen33c960f2009-02-04 20:06:27 +00001257 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i64,
1258 InFlag).getValue(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00001259 ResultVals[0] = Chain.getValue(0);
1260 NumResults = 1;
Scott Michel266bc8f2007-12-04 22:23:35 +00001261 break;
Scott Micheldd950092009-01-06 03:36:14 +00001262 case MVT::i128:
Dale Johannesen33c960f2009-02-04 20:06:27 +00001263 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i128,
1264 InFlag).getValue(1);
Scott Micheldd950092009-01-06 03:36:14 +00001265 ResultVals[0] = Chain.getValue(0);
1266 NumResults = 1;
1267 break;
Scott Michel266bc8f2007-12-04 22:23:35 +00001268 case MVT::f32:
1269 case MVT::f64:
Dale Johannesen33c960f2009-02-04 20:06:27 +00001270 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, TheCall->getValueType(0),
Scott Michel266bc8f2007-12-04 22:23:35 +00001271 InFlag).getValue(1);
1272 ResultVals[0] = Chain.getValue(0);
1273 NumResults = 1;
Scott Michel266bc8f2007-12-04 22:23:35 +00001274 break;
1275 case MVT::v2f64:
Scott Michelcc188272008-12-04 21:01:44 +00001276 case MVT::v2i64:
Scott Michel266bc8f2007-12-04 22:23:35 +00001277 case MVT::v4f32:
1278 case MVT::v4i32:
1279 case MVT::v8i16:
1280 case MVT::v16i8:
Dale Johannesen33c960f2009-02-04 20:06:27 +00001281 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, TheCall->getValueType(0),
Scott Michel266bc8f2007-12-04 22:23:35 +00001282 InFlag).getValue(1);
1283 ResultVals[0] = Chain.getValue(0);
1284 NumResults = 1;
Scott Michel266bc8f2007-12-04 22:23:35 +00001285 break;
1286 }
Duncan Sands4bdcb612008-07-02 17:40:58 +00001287
Scott Michel266bc8f2007-12-04 22:23:35 +00001288 // If the function returns void, just return the chain.
1289 if (NumResults == 0)
1290 return Chain;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001291
Scott Michel266bc8f2007-12-04 22:23:35 +00001292 // Otherwise, merge everything together with a MERGE_VALUES node.
1293 ResultVals[NumResults++] = Chain;
Dale Johannesen33c960f2009-02-04 20:06:27 +00001294 SDValue Res = DAG.getMergeValues(ResultVals, NumResults, dl);
Gabor Greif99a6cb92008-08-26 22:36:50 +00001295 return Res.getValue(Op.getResNo());
Scott Michel266bc8f2007-12-04 22:23:35 +00001296}
1297
Dan Gohman475871a2008-07-27 21:46:04 +00001298static SDValue
1299LowerRET(SDValue Op, SelectionDAG &DAG, TargetMachine &TM) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001300 SmallVector<CCValAssign, 16> RVLocs;
1301 unsigned CC = DAG.getMachineFunction().getFunction()->getCallingConv();
1302 bool isVarArg = DAG.getMachineFunction().getFunction()->isVarArg();
Dale Johannesena05dca42009-02-04 23:02:30 +00001303 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +00001304 CCState CCInfo(CC, isVarArg, TM, RVLocs);
Gabor Greifba36cb52008-08-28 21:40:38 +00001305 CCInfo.AnalyzeReturn(Op.getNode(), RetCC_SPU);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001306
Scott Michel266bc8f2007-12-04 22:23:35 +00001307 // If this is the first return lowered for this function, add the regs to the
1308 // liveout set for the function.
Chris Lattner84bc5422007-12-31 04:13:23 +00001309 if (DAG.getMachineFunction().getRegInfo().liveout_empty()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001310 for (unsigned i = 0; i != RVLocs.size(); ++i)
Chris Lattner84bc5422007-12-31 04:13:23 +00001311 DAG.getMachineFunction().getRegInfo().addLiveOut(RVLocs[i].getLocReg());
Scott Michel266bc8f2007-12-04 22:23:35 +00001312 }
1313
Dan Gohman475871a2008-07-27 21:46:04 +00001314 SDValue Chain = Op.getOperand(0);
1315 SDValue Flag;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001316
Scott Michel266bc8f2007-12-04 22:23:35 +00001317 // Copy the result values into the output registers.
1318 for (unsigned i = 0; i != RVLocs.size(); ++i) {
1319 CCValAssign &VA = RVLocs[i];
1320 assert(VA.isRegLoc() && "Can only return in registers!");
Dale Johannesena05dca42009-02-04 23:02:30 +00001321 Chain = DAG.getCopyToReg(Chain, dl, VA.getLocReg(),
1322 Op.getOperand(i*2+1), Flag);
Scott Michel266bc8f2007-12-04 22:23:35 +00001323 Flag = Chain.getValue(1);
1324 }
1325
Gabor Greifba36cb52008-08-28 21:40:38 +00001326 if (Flag.getNode())
Dale Johannesena05dca42009-02-04 23:02:30 +00001327 return DAG.getNode(SPUISD::RET_FLAG, dl, MVT::Other, Chain, Flag);
Scott Michel266bc8f2007-12-04 22:23:35 +00001328 else
Dale Johannesena05dca42009-02-04 23:02:30 +00001329 return DAG.getNode(SPUISD::RET_FLAG, dl, MVT::Other, Chain);
Scott Michel266bc8f2007-12-04 22:23:35 +00001330}
1331
1332
1333//===----------------------------------------------------------------------===//
1334// Vector related lowering:
1335//===----------------------------------------------------------------------===//
1336
1337static ConstantSDNode *
1338getVecImm(SDNode *N) {
Dan Gohman475871a2008-07-27 21:46:04 +00001339 SDValue OpVal(0, 0);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001340
Scott Michel266bc8f2007-12-04 22:23:35 +00001341 // Check to see if this buildvec has a single non-undef value in its elements.
1342 for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
1343 if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue;
Gabor Greifba36cb52008-08-28 21:40:38 +00001344 if (OpVal.getNode() == 0)
Scott Michel266bc8f2007-12-04 22:23:35 +00001345 OpVal = N->getOperand(i);
1346 else if (OpVal != N->getOperand(i))
1347 return 0;
1348 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001349
Gabor Greifba36cb52008-08-28 21:40:38 +00001350 if (OpVal.getNode() != 0) {
Scott Michel19fd42a2008-11-11 03:06:06 +00001351 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001352 return CN;
1353 }
1354 }
1355
1356 return 0; // All UNDEF: use implicit def.; not Constant node
1357}
1358
1359/// get_vec_i18imm - Test if this vector is a vector filled with the same value
1360/// and the value fits into an unsigned 18-bit constant, and if so, return the
1361/// constant
Dan Gohman475871a2008-07-27 21:46:04 +00001362SDValue SPU::get_vec_u18imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001363 MVT ValueType) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001364 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001365 uint64_t Value = CN->getZExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001366 if (ValueType == MVT::i64) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001367 uint64_t UValue = CN->getZExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001368 uint32_t upper = uint32_t(UValue >> 32);
1369 uint32_t lower = uint32_t(UValue);
1370 if (upper != lower)
Dan Gohman475871a2008-07-27 21:46:04 +00001371 return SDValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001372 Value = Value >> 32;
1373 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001374 if (Value <= 0x3ffff)
Dan Gohmanfa210d82008-11-05 02:06:09 +00001375 return DAG.getTargetConstant(Value, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001376 }
1377
Dan Gohman475871a2008-07-27 21:46:04 +00001378 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001379}
1380
1381/// get_vec_i16imm - Test if this vector is a vector filled with the same value
1382/// and the value fits into a signed 16-bit constant, and if so, return the
1383/// constant
Dan Gohman475871a2008-07-27 21:46:04 +00001384SDValue SPU::get_vec_i16imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001385 MVT ValueType) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001386 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman7810bfe2008-09-26 21:54:37 +00001387 int64_t Value = CN->getSExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001388 if (ValueType == MVT::i64) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001389 uint64_t UValue = CN->getZExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001390 uint32_t upper = uint32_t(UValue >> 32);
1391 uint32_t lower = uint32_t(UValue);
1392 if (upper != lower)
Dan Gohman475871a2008-07-27 21:46:04 +00001393 return SDValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001394 Value = Value >> 32;
1395 }
Scott Michelad2715e2008-03-05 23:02:02 +00001396 if (Value >= -(1 << 15) && Value <= ((1 << 15) - 1)) {
Dan Gohmanfa210d82008-11-05 02:06:09 +00001397 return DAG.getTargetConstant(Value, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001398 }
1399 }
1400
Dan Gohman475871a2008-07-27 21:46:04 +00001401 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001402}
1403
1404/// get_vec_i10imm - Test if this vector is a vector filled with the same value
1405/// and the value fits into a signed 10-bit constant, and if so, return the
1406/// constant
Dan Gohman475871a2008-07-27 21:46:04 +00001407SDValue SPU::get_vec_i10imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001408 MVT ValueType) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001409 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman7810bfe2008-09-26 21:54:37 +00001410 int64_t Value = CN->getSExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001411 if (ValueType == MVT::i64) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001412 uint64_t UValue = CN->getZExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001413 uint32_t upper = uint32_t(UValue >> 32);
1414 uint32_t lower = uint32_t(UValue);
1415 if (upper != lower)
Dan Gohman475871a2008-07-27 21:46:04 +00001416 return SDValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001417 Value = Value >> 32;
1418 }
Scott Michelad2715e2008-03-05 23:02:02 +00001419 if (isS10Constant(Value))
Dan Gohmanfa210d82008-11-05 02:06:09 +00001420 return DAG.getTargetConstant(Value, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001421 }
1422
Dan Gohman475871a2008-07-27 21:46:04 +00001423 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001424}
1425
1426/// get_vec_i8imm - Test if this vector is a vector filled with the same value
1427/// and the value fits into a signed 8-bit constant, and if so, return the
1428/// constant.
1429///
1430/// @note: The incoming vector is v16i8 because that's the only way we can load
1431/// constant vectors. Thus, we test to see if the upper and lower bytes are the
1432/// same value.
Dan Gohman475871a2008-07-27 21:46:04 +00001433SDValue SPU::get_vec_i8imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001434 MVT ValueType) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001435 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001436 int Value = (int) CN->getZExtValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001437 if (ValueType == MVT::i16
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001438 && Value <= 0xffff /* truncated from uint64_t */
1439 && ((short) Value >> 8) == ((short) Value & 0xff))
Dan Gohmanfa210d82008-11-05 02:06:09 +00001440 return DAG.getTargetConstant(Value & 0xff, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001441 else if (ValueType == MVT::i8
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001442 && (Value & 0xff) == Value)
Dan Gohmanfa210d82008-11-05 02:06:09 +00001443 return DAG.getTargetConstant(Value, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001444 }
1445
Dan Gohman475871a2008-07-27 21:46:04 +00001446 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001447}
1448
1449/// get_ILHUvec_imm - Test if this vector is a vector filled with the same value
1450/// and the value fits into a signed 16-bit constant, and if so, return the
1451/// constant
Dan Gohman475871a2008-07-27 21:46:04 +00001452SDValue SPU::get_ILHUvec_imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001453 MVT ValueType) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001454 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001455 uint64_t Value = CN->getZExtValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001456 if ((ValueType == MVT::i32
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001457 && ((unsigned) Value & 0xffff0000) == (unsigned) Value)
1458 || (ValueType == MVT::i64 && (Value & 0xffff0000) == Value))
Dan Gohmanfa210d82008-11-05 02:06:09 +00001459 return DAG.getTargetConstant(Value >> 16, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001460 }
1461
Dan Gohman475871a2008-07-27 21:46:04 +00001462 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001463}
1464
1465/// get_v4i32_imm - Catch-all for general 32-bit constant vectors
Dan Gohman475871a2008-07-27 21:46:04 +00001466SDValue SPU::get_v4i32_imm(SDNode *N, SelectionDAG &DAG) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001467 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanfa210d82008-11-05 02:06:09 +00001468 return DAG.getTargetConstant((unsigned) CN->getZExtValue(), MVT::i32);
Scott Michel266bc8f2007-12-04 22:23:35 +00001469 }
1470
Dan Gohman475871a2008-07-27 21:46:04 +00001471 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001472}
1473
1474/// get_v4i32_imm - Catch-all for general 64-bit constant vectors
Dan Gohman475871a2008-07-27 21:46:04 +00001475SDValue SPU::get_v2i64_imm(SDNode *N, SelectionDAG &DAG) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001476 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanfa210d82008-11-05 02:06:09 +00001477 return DAG.getTargetConstant((unsigned) CN->getZExtValue(), MVT::i64);
Scott Michel266bc8f2007-12-04 22:23:35 +00001478 }
1479
Dan Gohman475871a2008-07-27 21:46:04 +00001480 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001481}
1482
1483// If this is a vector of constants or undefs, get the bits. A bit in
Scott Michel5af8f0e2008-07-16 17:17:29 +00001484// UndefBits is set if the corresponding element of the vector is an
Scott Michel266bc8f2007-12-04 22:23:35 +00001485// ISD::UNDEF value. For undefs, the corresponding VectorBits values are
1486// zero. Return true if this is not an array of constants, false if it is.
1487//
1488static bool GetConstantBuildVectorBits(SDNode *BV, uint64_t VectorBits[2],
1489 uint64_t UndefBits[2]) {
1490 // Start with zero'd results.
1491 VectorBits[0] = VectorBits[1] = UndefBits[0] = UndefBits[1] = 0;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001492
Duncan Sands83ec4b62008-06-06 12:08:01 +00001493 unsigned EltBitSize = BV->getOperand(0).getValueType().getSizeInBits();
Scott Michel266bc8f2007-12-04 22:23:35 +00001494 for (unsigned i = 0, e = BV->getNumOperands(); i != e; ++i) {
Dan Gohman475871a2008-07-27 21:46:04 +00001495 SDValue OpVal = BV->getOperand(i);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001496
Scott Michel266bc8f2007-12-04 22:23:35 +00001497 unsigned PartNo = i >= e/2; // In the upper 128 bits?
1498 unsigned SlotNo = e/2 - (i & (e/2-1))-1; // Which subpiece of the uint64_t.
1499
1500 uint64_t EltBits = 0;
1501 if (OpVal.getOpcode() == ISD::UNDEF) {
1502 uint64_t EltUndefBits = ~0ULL >> (64-EltBitSize);
1503 UndefBits[PartNo] |= EltUndefBits << (SlotNo*EltBitSize);
1504 continue;
Scott Michel19fd42a2008-11-11 03:06:06 +00001505 } else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001506 EltBits = CN->getZExtValue() & (~0ULL >> (64-EltBitSize));
Scott Michel19fd42a2008-11-11 03:06:06 +00001507 } else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal)) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001508 const APFloat &apf = CN->getValueAPF();
1509 EltBits = (CN->getValueType(0) == MVT::f32
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001510 ? FloatToBits(apf.convertToFloat())
1511 : DoubleToBits(apf.convertToDouble()));
Scott Michel266bc8f2007-12-04 22:23:35 +00001512 } else {
1513 // Nonconstant element.
1514 return true;
1515 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001516
Scott Michel266bc8f2007-12-04 22:23:35 +00001517 VectorBits[PartNo] |= EltBits << (SlotNo*EltBitSize);
1518 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001519
1520 //printf("%llx %llx %llx %llx\n",
Scott Michel266bc8f2007-12-04 22:23:35 +00001521 // VectorBits[0], VectorBits[1], UndefBits[0], UndefBits[1]);
1522 return false;
1523}
1524
1525/// If this is a splat (repetition) of a value across the whole vector, return
1526/// the smallest size that splats it. For example, "0x01010101010101..." is a
Scott Michel5af8f0e2008-07-16 17:17:29 +00001527/// splat of 0x01, 0x0101, and 0x01010101. We return SplatBits = 0x01 and
Scott Michel266bc8f2007-12-04 22:23:35 +00001528/// SplatSize = 1 byte.
Scott Michel5af8f0e2008-07-16 17:17:29 +00001529static bool isConstantSplat(const uint64_t Bits128[2],
Scott Michel266bc8f2007-12-04 22:23:35 +00001530 const uint64_t Undef128[2],
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001531 int MinSplatBits,
Scott Michel266bc8f2007-12-04 22:23:35 +00001532 uint64_t &SplatBits, uint64_t &SplatUndef,
1533 int &SplatSize) {
1534 // Don't let undefs prevent splats from matching. See if the top 64-bits are
1535 // the same as the lower 64-bits, ignoring undefs.
1536 uint64_t Bits64 = Bits128[0] | Bits128[1];
1537 uint64_t Undef64 = Undef128[0] & Undef128[1];
1538 uint32_t Bits32 = uint32_t(Bits64) | uint32_t(Bits64 >> 32);
1539 uint32_t Undef32 = uint32_t(Undef64) & uint32_t(Undef64 >> 32);
1540 uint16_t Bits16 = uint16_t(Bits32) | uint16_t(Bits32 >> 16);
1541 uint16_t Undef16 = uint16_t(Undef32) & uint16_t(Undef32 >> 16);
1542
1543 if ((Bits128[0] & ~Undef128[1]) == (Bits128[1] & ~Undef128[0])) {
1544 if (MinSplatBits < 64) {
Scott Michel5af8f0e2008-07-16 17:17:29 +00001545
Scott Michel266bc8f2007-12-04 22:23:35 +00001546 // Check that the top 32-bits are the same as the lower 32-bits, ignoring
1547 // undefs.
1548 if ((Bits64 & (~Undef64 >> 32)) == ((Bits64 >> 32) & ~Undef64)) {
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001549 if (MinSplatBits < 32) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001550
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001551 // If the top 16-bits are different than the lower 16-bits, ignoring
1552 // undefs, we have an i32 splat.
1553 if ((Bits32 & (~Undef32 >> 16)) == ((Bits32 >> 16) & ~Undef32)) {
1554 if (MinSplatBits < 16) {
1555 // If the top 8-bits are different than the lower 8-bits, ignoring
1556 // undefs, we have an i16 splat.
Gabor Greif93c53e52008-08-31 15:37:04 +00001557 if ((Bits16 & (uint16_t(~Undef16) >> 8))
1558 == ((Bits16 >> 8) & ~Undef16)) {
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001559 // Otherwise, we have an 8-bit splat.
1560 SplatBits = uint8_t(Bits16) | uint8_t(Bits16 >> 8);
1561 SplatUndef = uint8_t(Undef16) & uint8_t(Undef16 >> 8);
1562 SplatSize = 1;
1563 return true;
1564 }
1565 } else {
1566 SplatBits = Bits16;
1567 SplatUndef = Undef16;
1568 SplatSize = 2;
1569 return true;
1570 }
1571 }
1572 } else {
1573 SplatBits = Bits32;
1574 SplatUndef = Undef32;
1575 SplatSize = 4;
1576 return true;
1577 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001578 }
1579 } else {
1580 SplatBits = Bits128[0];
1581 SplatUndef = Undef128[0];
1582 SplatSize = 8;
1583 return true;
1584 }
1585 }
1586
1587 return false; // Can't be a splat if two pieces don't match.
1588}
1589
Scott Micheld1e8d9c2009-01-21 04:58:48 +00001590//! Lower a BUILD_VECTOR instruction creatively:
1591SDValue
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001592LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00001593 MVT VT = Op.getValueType();
Dale Johannesened2eee62009-02-06 01:31:28 +00001594 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +00001595 // If this is a vector of constants or undefs, get the bits. A bit in
Scott Michel5af8f0e2008-07-16 17:17:29 +00001596 // UndefBits is set if the corresponding element of the vector is an
Scott Michel266bc8f2007-12-04 22:23:35 +00001597 // ISD::UNDEF value. For undefs, the corresponding VectorBits values are
Scott Michel5af8f0e2008-07-16 17:17:29 +00001598 // zero.
Scott Michel266bc8f2007-12-04 22:23:35 +00001599 uint64_t VectorBits[2];
1600 uint64_t UndefBits[2];
1601 uint64_t SplatBits, SplatUndef;
1602 int SplatSize;
Gabor Greifba36cb52008-08-28 21:40:38 +00001603 if (GetConstantBuildVectorBits(Op.getNode(), VectorBits, UndefBits)
Scott Michel266bc8f2007-12-04 22:23:35 +00001604 || !isConstantSplat(VectorBits, UndefBits,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001605 VT.getVectorElementType().getSizeInBits(),
Scott Michel266bc8f2007-12-04 22:23:35 +00001606 SplatBits, SplatUndef, SplatSize))
Dan Gohman475871a2008-07-27 21:46:04 +00001607 return SDValue(); // Not a constant vector, not a splat.
Scott Michel5af8f0e2008-07-16 17:17:29 +00001608
Duncan Sands83ec4b62008-06-06 12:08:01 +00001609 switch (VT.getSimpleVT()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001610 default:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00001611 cerr << "CellSPU: Unhandled VT in LowerBUILD_VECTOR, VT = "
1612 << VT.getMVTString()
1613 << "\n";
1614 abort();
1615 /*NOTREACHED*/
Scott Michel266bc8f2007-12-04 22:23:35 +00001616 case MVT::v4f32: {
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001617 uint32_t Value32 = uint32_t(SplatBits);
Scott Michel266bc8f2007-12-04 22:23:35 +00001618 assert(SplatSize == 4
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001619 && "LowerBUILD_VECTOR: Unexpected floating point vector element.");
Scott Michel266bc8f2007-12-04 22:23:35 +00001620 // NOTE: pretend the constant is an integer. LLVM won't load FP constants
Dan Gohman475871a2008-07-27 21:46:04 +00001621 SDValue T = DAG.getConstant(Value32, MVT::i32);
Dale Johannesened2eee62009-02-06 01:31:28 +00001622 return DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v4f32,
Evan Chenga87008d2009-02-25 22:49:59 +00001623 DAG.getNode(ISD::BUILD_VECTOR, dl,
1624 MVT::v4i32, T, T, T, T));
Scott Michel266bc8f2007-12-04 22:23:35 +00001625 break;
1626 }
1627 case MVT::v2f64: {
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001628 uint64_t f64val = uint64_t(SplatBits);
Scott Michel266bc8f2007-12-04 22:23:35 +00001629 assert(SplatSize == 8
Scott Michel104de432008-11-24 17:11:17 +00001630 && "LowerBUILD_VECTOR: 64-bit float vector size > 8 bytes.");
Scott Michel266bc8f2007-12-04 22:23:35 +00001631 // NOTE: pretend the constant is an integer. LLVM won't load FP constants
Dan Gohman475871a2008-07-27 21:46:04 +00001632 SDValue T = DAG.getConstant(f64val, MVT::i64);
Dale Johannesened2eee62009-02-06 01:31:28 +00001633 return DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v2f64,
Evan Chenga87008d2009-02-25 22:49:59 +00001634 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v2i64, T, T));
Scott Michel266bc8f2007-12-04 22:23:35 +00001635 break;
1636 }
1637 case MVT::v16i8: {
1638 // 8-bit constants have to be expanded to 16-bits
1639 unsigned short Value16 = SplatBits | (SplatBits << 8);
Dan Gohman475871a2008-07-27 21:46:04 +00001640 SDValue Ops[8];
Scott Michel266bc8f2007-12-04 22:23:35 +00001641 for (int i = 0; i < 8; ++i)
1642 Ops[i] = DAG.getConstant(Value16, MVT::i16);
Dale Johannesened2eee62009-02-06 01:31:28 +00001643 return DAG.getNode(ISD::BIT_CONVERT, dl, VT,
Evan Chenga87008d2009-02-25 22:49:59 +00001644 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v8i16, Ops, 8));
Scott Michel266bc8f2007-12-04 22:23:35 +00001645 }
1646 case MVT::v8i16: {
1647 unsigned short Value16;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001648 if (SplatSize == 2)
Scott Michel266bc8f2007-12-04 22:23:35 +00001649 Value16 = (unsigned short) (SplatBits & 0xffff);
1650 else
1651 Value16 = (unsigned short) (SplatBits | (SplatBits << 8));
Dan Gohman475871a2008-07-27 21:46:04 +00001652 SDValue T = DAG.getConstant(Value16, VT.getVectorElementType());
1653 SDValue Ops[8];
Scott Michel266bc8f2007-12-04 22:23:35 +00001654 for (int i = 0; i < 8; ++i) Ops[i] = T;
Evan Chenga87008d2009-02-25 22:49:59 +00001655 return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, Ops, 8);
Scott Michel266bc8f2007-12-04 22:23:35 +00001656 }
1657 case MVT::v4i32: {
1658 unsigned int Value = SplatBits;
Dan Gohman475871a2008-07-27 21:46:04 +00001659 SDValue T = DAG.getConstant(Value, VT.getVectorElementType());
Evan Chenga87008d2009-02-25 22:49:59 +00001660 return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, T, T, T, T);
Scott Michel266bc8f2007-12-04 22:23:35 +00001661 }
Scott Michel21213e72009-01-06 23:10:38 +00001662 case MVT::v2i32: {
1663 unsigned int Value = SplatBits;
1664 SDValue T = DAG.getConstant(Value, VT.getVectorElementType());
Evan Chenga87008d2009-02-25 22:49:59 +00001665 return DAG.getNode(ISD::BUILD_VECTOR, dl, VT, T, T);
Scott Michel21213e72009-01-06 23:10:38 +00001666 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001667 case MVT::v2i64: {
Dale Johannesened2eee62009-02-06 01:31:28 +00001668 return SPU::LowerSplat_v2i64(VT, DAG, SplatBits, dl);
Scott Michel266bc8f2007-12-04 22:23:35 +00001669 }
1670 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001671
Dan Gohman475871a2008-07-27 21:46:04 +00001672 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001673}
1674
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001675SDValue
Dale Johannesened2eee62009-02-06 01:31:28 +00001676SPU::LowerSplat_v2i64(MVT OpVT, SelectionDAG& DAG, uint64_t SplatVal,
1677 DebugLoc dl) {
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001678 uint32_t upper = uint32_t(SplatVal >> 32);
1679 uint32_t lower = uint32_t(SplatVal);
1680
1681 if (upper == lower) {
1682 // Magic constant that can be matched by IL, ILA, et. al.
1683 SDValue Val = DAG.getTargetConstant(upper, MVT::i32);
Dale Johannesened2eee62009-02-06 01:31:28 +00001684 return DAG.getNode(ISD::BIT_CONVERT, dl, OpVT,
Evan Chenga87008d2009-02-25 22:49:59 +00001685 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
1686 Val, Val, Val, Val));
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001687 } else {
1688 SDValue LO32;
1689 SDValue HI32;
1690 SmallVector<SDValue, 16> ShufBytes;
1691 SDValue Result;
1692 bool upper_special, lower_special;
1693
1694 // NOTE: This code creates common-case shuffle masks that can be easily
1695 // detected as common expressions. It is not attempting to create highly
1696 // specialized masks to replace any and all 0's, 0xff's and 0x80's.
1697
1698 // Detect if the upper or lower half is a special shuffle mask pattern:
1699 upper_special = (upper == 0 || upper == 0xffffffff || upper == 0x80000000);
1700 lower_special = (lower == 0 || lower == 0xffffffff || lower == 0x80000000);
1701
1702 // Create lower vector if not a special pattern
1703 if (!lower_special) {
1704 SDValue LO32C = DAG.getConstant(lower, MVT::i32);
Dale Johannesened2eee62009-02-06 01:31:28 +00001705 LO32 = DAG.getNode(ISD::BIT_CONVERT, dl, OpVT,
Evan Chenga87008d2009-02-25 22:49:59 +00001706 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
1707 LO32C, LO32C, LO32C, LO32C));
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001708 }
1709
1710 // Create upper vector if not a special pattern
1711 if (!upper_special) {
1712 SDValue HI32C = DAG.getConstant(upper, MVT::i32);
Dale Johannesened2eee62009-02-06 01:31:28 +00001713 HI32 = DAG.getNode(ISD::BIT_CONVERT, dl, OpVT,
Evan Chenga87008d2009-02-25 22:49:59 +00001714 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
1715 HI32C, HI32C, HI32C, HI32C));
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001716 }
1717
1718 // If either upper or lower are special, then the two input operands are
1719 // the same (basically, one of them is a "don't care")
1720 if (lower_special)
1721 LO32 = HI32;
1722 if (upper_special)
1723 HI32 = LO32;
1724 if (lower_special && upper_special) {
1725 // Unhappy situation... both upper and lower are special, so punt with
1726 // a target constant:
1727 SDValue Zero = DAG.getConstant(0, MVT::i32);
Evan Chenga87008d2009-02-25 22:49:59 +00001728 HI32 = LO32 = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, Zero, Zero,
1729 Zero, Zero);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001730 }
1731
1732 for (int i = 0; i < 4; ++i) {
1733 uint64_t val = 0;
1734 for (int j = 0; j < 4; ++j) {
1735 SDValue V;
1736 bool process_upper, process_lower;
1737 val <<= 8;
1738 process_upper = (upper_special && (i & 1) == 0);
1739 process_lower = (lower_special && (i & 1) == 1);
1740
1741 if (process_upper || process_lower) {
1742 if ((process_upper && upper == 0)
1743 || (process_lower && lower == 0))
1744 val |= 0x80;
1745 else if ((process_upper && upper == 0xffffffff)
1746 || (process_lower && lower == 0xffffffff))
1747 val |= 0xc0;
1748 else if ((process_upper && upper == 0x80000000)
1749 || (process_lower && lower == 0x80000000))
1750 val |= (j == 0 ? 0xe0 : 0x80);
1751 } else
1752 val |= i * 4 + j + ((i & 1) * 16);
1753 }
1754
1755 ShufBytes.push_back(DAG.getConstant(val, MVT::i32));
1756 }
1757
Dale Johannesened2eee62009-02-06 01:31:28 +00001758 return DAG.getNode(SPUISD::SHUFB, dl, OpVT, HI32, LO32,
Evan Chenga87008d2009-02-25 22:49:59 +00001759 DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
1760 &ShufBytes[0], ShufBytes.size()));
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001761 }
1762}
1763
Scott Michel266bc8f2007-12-04 22:23:35 +00001764/// LowerVECTOR_SHUFFLE - Lower a vector shuffle (V1, V2, V3) to something on
1765/// which the Cell can operate. The code inspects V3 to ascertain whether the
1766/// permutation vector, V3, is monotonically increasing with one "exception"
1767/// element, e.g., (0, 1, _, 3). If this is the case, then generate a
Scott Michel7a1c9e92008-11-22 23:50:42 +00001768/// SHUFFLE_MASK synthetic instruction. Otherwise, spill V3 to the constant pool.
Scott Michel266bc8f2007-12-04 22:23:35 +00001769/// In either case, the net result is going to eventually invoke SHUFB to
1770/// permute/shuffle the bytes from V1 and V2.
1771/// \note
Scott Michel7a1c9e92008-11-22 23:50:42 +00001772/// SHUFFLE_MASK is eventually selected as one of the C*D instructions, generate
Scott Michel266bc8f2007-12-04 22:23:35 +00001773/// control word for byte/halfword/word insertion. This takes care of a single
1774/// element move from V2 into V1.
1775/// \note
1776/// SPUISD::SHUFB is eventually selected as Cell's <i>shufb</i> instructions.
Dan Gohman475871a2008-07-27 21:46:04 +00001777static SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) {
1778 SDValue V1 = Op.getOperand(0);
1779 SDValue V2 = Op.getOperand(1);
1780 SDValue PermMask = Op.getOperand(2);
Dale Johannesena05dca42009-02-04 23:02:30 +00001781 DebugLoc dl = Op.getDebugLoc();
Scott Michel5af8f0e2008-07-16 17:17:29 +00001782
Scott Michel266bc8f2007-12-04 22:23:35 +00001783 if (V2.getOpcode() == ISD::UNDEF) V2 = V1;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001784
Scott Michel266bc8f2007-12-04 22:23:35 +00001785 // If we have a single element being moved from V1 to V2, this can be handled
1786 // using the C*[DX] compute mask instructions, but the vector elements have
1787 // to be monotonically increasing with one exception element.
Scott Michelcc188272008-12-04 21:01:44 +00001788 MVT VecVT = V1.getValueType();
1789 MVT EltVT = VecVT.getVectorElementType();
Scott Michel266bc8f2007-12-04 22:23:35 +00001790 unsigned EltsFromV2 = 0;
1791 unsigned V2Elt = 0;
1792 unsigned V2EltIdx0 = 0;
1793 unsigned CurrElt = 0;
Scott Michelcc188272008-12-04 21:01:44 +00001794 unsigned MaxElts = VecVT.getVectorNumElements();
1795 unsigned PrevElt = 0;
1796 unsigned V0Elt = 0;
Scott Michel266bc8f2007-12-04 22:23:35 +00001797 bool monotonic = true;
Scott Michelcc188272008-12-04 21:01:44 +00001798 bool rotate = true;
1799
1800 if (EltVT == MVT::i8) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001801 V2EltIdx0 = 16;
Scott Michelcc188272008-12-04 21:01:44 +00001802 } else if (EltVT == MVT::i16) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001803 V2EltIdx0 = 8;
Scott Michelcc188272008-12-04 21:01:44 +00001804 } else if (EltVT == MVT::i32 || EltVT == MVT::f32) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001805 V2EltIdx0 = 4;
Scott Michelcc188272008-12-04 21:01:44 +00001806 } else if (EltVT == MVT::i64 || EltVT == MVT::f64) {
1807 V2EltIdx0 = 2;
1808 } else
Scott Michel266bc8f2007-12-04 22:23:35 +00001809 assert(0 && "Unhandled vector type in LowerVECTOR_SHUFFLE");
1810
Scott Michelcc188272008-12-04 21:01:44 +00001811 for (unsigned i = 0; i != PermMask.getNumOperands(); ++i) {
1812 if (PermMask.getOperand(i).getOpcode() != ISD::UNDEF) {
1813 unsigned SrcElt = cast<ConstantSDNode > (PermMask.getOperand(i))->getZExtValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001814
Scott Michelcc188272008-12-04 21:01:44 +00001815 if (monotonic) {
1816 if (SrcElt >= V2EltIdx0) {
1817 if (1 >= (++EltsFromV2)) {
1818 V2Elt = (V2EltIdx0 - SrcElt) << 2;
1819 }
1820 } else if (CurrElt != SrcElt) {
1821 monotonic = false;
1822 }
1823
1824 ++CurrElt;
1825 }
1826
1827 if (rotate) {
1828 if (PrevElt > 0 && SrcElt < MaxElts) {
1829 if ((PrevElt == SrcElt - 1)
1830 || (PrevElt == MaxElts - 1 && SrcElt == 0)) {
1831 PrevElt = SrcElt;
1832 if (SrcElt == 0)
1833 V0Elt = i;
1834 } else {
1835 rotate = false;
1836 }
1837 } else if (PrevElt == 0) {
1838 // First time through, need to keep track of previous element
1839 PrevElt = SrcElt;
1840 } else {
1841 // This isn't a rotation, takes elements from vector 2
1842 rotate = false;
1843 }
1844 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001845 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001846 }
1847
1848 if (EltsFromV2 == 1 && monotonic) {
1849 // Compute mask and shuffle
1850 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner84bc5422007-12-31 04:13:23 +00001851 MachineRegisterInfo &RegInfo = MF.getRegInfo();
1852 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
Duncan Sands83ec4b62008-06-06 12:08:01 +00001853 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel266bc8f2007-12-04 22:23:35 +00001854 // Initialize temporary register to 0
Dan Gohman475871a2008-07-27 21:46:04 +00001855 SDValue InitTempReg =
Dale Johannesena05dca42009-02-04 23:02:30 +00001856 DAG.getCopyToReg(DAG.getEntryNode(), dl, VReg, DAG.getConstant(0, PtrVT));
Scott Michel7a1c9e92008-11-22 23:50:42 +00001857 // Copy register's contents as index in SHUFFLE_MASK:
Dan Gohman475871a2008-07-27 21:46:04 +00001858 SDValue ShufMaskOp =
Dale Johannesena05dca42009-02-04 23:02:30 +00001859 DAG.getNode(SPUISD::SHUFFLE_MASK, dl, MVT::v4i32,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001860 DAG.getTargetConstant(V2Elt, MVT::i32),
Dale Johannesena05dca42009-02-04 23:02:30 +00001861 DAG.getCopyFromReg(InitTempReg, dl, VReg, PtrVT));
Scott Michel266bc8f2007-12-04 22:23:35 +00001862 // Use shuffle mask in SHUFB synthetic instruction:
Dale Johannesena05dca42009-02-04 23:02:30 +00001863 return DAG.getNode(SPUISD::SHUFB, dl, V1.getValueType(), V2, V1,
1864 ShufMaskOp);
Scott Michelcc188272008-12-04 21:01:44 +00001865 } else if (rotate) {
1866 int rotamt = (MaxElts - V0Elt) * EltVT.getSizeInBits()/8;
Scott Michel1df30c42008-12-29 03:23:36 +00001867
Dale Johannesena05dca42009-02-04 23:02:30 +00001868 return DAG.getNode(SPUISD::ROTBYTES_LEFT, dl, V1.getValueType(),
Scott Michelcc188272008-12-04 21:01:44 +00001869 V1, DAG.getConstant(rotamt, MVT::i16));
Scott Michel266bc8f2007-12-04 22:23:35 +00001870 } else {
Gabor Greif93c53e52008-08-31 15:37:04 +00001871 // Convert the SHUFFLE_VECTOR mask's input element units to the
1872 // actual bytes.
Duncan Sands83ec4b62008-06-06 12:08:01 +00001873 unsigned BytesPerElement = EltVT.getSizeInBits()/8;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001874
Dan Gohman475871a2008-07-27 21:46:04 +00001875 SmallVector<SDValue, 16> ResultMask;
Scott Michel266bc8f2007-12-04 22:23:35 +00001876 for (unsigned i = 0, e = PermMask.getNumOperands(); i != e; ++i) {
1877 unsigned SrcElt;
1878 if (PermMask.getOperand(i).getOpcode() == ISD::UNDEF)
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001879 SrcElt = 0;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001880 else
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001881 SrcElt = cast<ConstantSDNode>(PermMask.getOperand(i))->getZExtValue();
Scott Michel5af8f0e2008-07-16 17:17:29 +00001882
Scott Michela59d4692008-02-23 18:41:37 +00001883 for (unsigned j = 0; j < BytesPerElement; ++j) {
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001884 ResultMask.push_back(DAG.getConstant(SrcElt*BytesPerElement+j,
1885 MVT::i8));
Scott Michel266bc8f2007-12-04 22:23:35 +00001886 }
1887 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001888
Evan Chenga87008d2009-02-25 22:49:59 +00001889 SDValue VPermMask = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v16i8,
1890 &ResultMask[0], ResultMask.size());
Dale Johannesena05dca42009-02-04 23:02:30 +00001891 return DAG.getNode(SPUISD::SHUFB, dl, V1.getValueType(), V1, V2, VPermMask);
Scott Michel266bc8f2007-12-04 22:23:35 +00001892 }
1893}
1894
Dan Gohman475871a2008-07-27 21:46:04 +00001895static SDValue LowerSCALAR_TO_VECTOR(SDValue Op, SelectionDAG &DAG) {
1896 SDValue Op0 = Op.getOperand(0); // Op0 = the scalar
Dale Johannesened2eee62009-02-06 01:31:28 +00001897 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +00001898
Gabor Greifba36cb52008-08-28 21:40:38 +00001899 if (Op0.getNode()->getOpcode() == ISD::Constant) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001900 // For a constant, build the appropriate constant vector, which will
1901 // eventually simplify to a vector register load.
1902
Gabor Greifba36cb52008-08-28 21:40:38 +00001903 ConstantSDNode *CN = cast<ConstantSDNode>(Op0.getNode());
Dan Gohman475871a2008-07-27 21:46:04 +00001904 SmallVector<SDValue, 16> ConstVecValues;
Duncan Sands83ec4b62008-06-06 12:08:01 +00001905 MVT VT;
Scott Michel266bc8f2007-12-04 22:23:35 +00001906 size_t n_copies;
1907
1908 // Create a constant vector:
Duncan Sands83ec4b62008-06-06 12:08:01 +00001909 switch (Op.getValueType().getSimpleVT()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001910 default: assert(0 && "Unexpected constant value type in "
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001911 "LowerSCALAR_TO_VECTOR");
Scott Michel266bc8f2007-12-04 22:23:35 +00001912 case MVT::v16i8: n_copies = 16; VT = MVT::i8; break;
1913 case MVT::v8i16: n_copies = 8; VT = MVT::i16; break;
1914 case MVT::v4i32: n_copies = 4; VT = MVT::i32; break;
1915 case MVT::v4f32: n_copies = 4; VT = MVT::f32; break;
1916 case MVT::v2i64: n_copies = 2; VT = MVT::i64; break;
1917 case MVT::v2f64: n_copies = 2; VT = MVT::f64; break;
1918 }
1919
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001920 SDValue CValue = DAG.getConstant(CN->getZExtValue(), VT);
Scott Michel266bc8f2007-12-04 22:23:35 +00001921 for (size_t j = 0; j < n_copies; ++j)
1922 ConstVecValues.push_back(CValue);
1923
Evan Chenga87008d2009-02-25 22:49:59 +00001924 return DAG.getNode(ISD::BUILD_VECTOR, dl, Op.getValueType(),
1925 &ConstVecValues[0], ConstVecValues.size());
Scott Michel266bc8f2007-12-04 22:23:35 +00001926 } else {
1927 // Otherwise, copy the value from one register to another:
Duncan Sands83ec4b62008-06-06 12:08:01 +00001928 switch (Op0.getValueType().getSimpleVT()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001929 default: assert(0 && "Unexpected value type in LowerSCALAR_TO_VECTOR");
1930 case MVT::i8:
1931 case MVT::i16:
1932 case MVT::i32:
1933 case MVT::i64:
1934 case MVT::f32:
1935 case MVT::f64:
Dale Johannesened2eee62009-02-06 01:31:28 +00001936 return DAG.getNode(SPUISD::PREFSLOT2VEC, dl, Op.getValueType(), Op0, Op0);
Scott Michel266bc8f2007-12-04 22:23:35 +00001937 }
1938 }
1939
Dan Gohman475871a2008-07-27 21:46:04 +00001940 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001941}
1942
Dan Gohman475871a2008-07-27 21:46:04 +00001943static SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00001944 MVT VT = Op.getValueType();
Dan Gohman475871a2008-07-27 21:46:04 +00001945 SDValue N = Op.getOperand(0);
1946 SDValue Elt = Op.getOperand(1);
Dale Johannesened2eee62009-02-06 01:31:28 +00001947 DebugLoc dl = Op.getDebugLoc();
Scott Michel7a1c9e92008-11-22 23:50:42 +00001948 SDValue retval;
Scott Michel266bc8f2007-12-04 22:23:35 +00001949
Scott Michel7a1c9e92008-11-22 23:50:42 +00001950 if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Elt)) {
1951 // Constant argument:
1952 int EltNo = (int) C->getZExtValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001953
Scott Michel7a1c9e92008-11-22 23:50:42 +00001954 // sanity checks:
1955 if (VT == MVT::i8 && EltNo >= 16)
1956 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i8 extraction slot > 15");
1957 else if (VT == MVT::i16 && EltNo >= 8)
1958 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i16 extraction slot > 7");
1959 else if (VT == MVT::i32 && EltNo >= 4)
1960 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i32 extraction slot > 4");
1961 else if (VT == MVT::i64 && EltNo >= 2)
1962 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i64 extraction slot > 2");
Scott Michel266bc8f2007-12-04 22:23:35 +00001963
Scott Michel7a1c9e92008-11-22 23:50:42 +00001964 if (EltNo == 0 && (VT == MVT::i32 || VT == MVT::i64)) {
1965 // i32 and i64: Element 0 is the preferred slot
Dale Johannesened2eee62009-02-06 01:31:28 +00001966 return DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT, N);
Scott Michel7a1c9e92008-11-22 23:50:42 +00001967 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001968
Scott Michel7a1c9e92008-11-22 23:50:42 +00001969 // Need to generate shuffle mask and extract:
1970 int prefslot_begin = -1, prefslot_end = -1;
1971 int elt_byte = EltNo * VT.getSizeInBits() / 8;
1972
1973 switch (VT.getSimpleVT()) {
1974 default:
1975 assert(false && "Invalid value type!");
1976 case MVT::i8: {
1977 prefslot_begin = prefslot_end = 3;
1978 break;
1979 }
1980 case MVT::i16: {
1981 prefslot_begin = 2; prefslot_end = 3;
1982 break;
1983 }
1984 case MVT::i32:
1985 case MVT::f32: {
1986 prefslot_begin = 0; prefslot_end = 3;
1987 break;
1988 }
1989 case MVT::i64:
1990 case MVT::f64: {
1991 prefslot_begin = 0; prefslot_end = 7;
1992 break;
1993 }
1994 }
1995
1996 assert(prefslot_begin != -1 && prefslot_end != -1 &&
1997 "LowerEXTRACT_VECTOR_ELT: preferred slots uninitialized");
1998
1999 unsigned int ShufBytes[16];
2000 for (int i = 0; i < 16; ++i) {
2001 // zero fill uppper part of preferred slot, don't care about the
2002 // other slots:
2003 unsigned int mask_val;
2004 if (i <= prefslot_end) {
2005 mask_val =
2006 ((i < prefslot_begin)
2007 ? 0x80
2008 : elt_byte + (i - prefslot_begin));
2009
2010 ShufBytes[i] = mask_val;
2011 } else
2012 ShufBytes[i] = ShufBytes[i % (prefslot_end + 1)];
2013 }
2014
2015 SDValue ShufMask[4];
2016 for (unsigned i = 0; i < sizeof(ShufMask)/sizeof(ShufMask[0]); ++i) {
Scott Michelcc188272008-12-04 21:01:44 +00002017 unsigned bidx = i * 4;
Scott Michel7a1c9e92008-11-22 23:50:42 +00002018 unsigned int bits = ((ShufBytes[bidx] << 24) |
2019 (ShufBytes[bidx+1] << 16) |
2020 (ShufBytes[bidx+2] << 8) |
2021 ShufBytes[bidx+3]);
2022 ShufMask[i] = DAG.getConstant(bits, MVT::i32);
2023 }
2024
Evan Chenga87008d2009-02-25 22:49:59 +00002025 SDValue ShufMaskVec = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
2026 &ShufMask[0],
2027 sizeof(ShufMask) / sizeof(ShufMask[0]));
Scott Michel7a1c9e92008-11-22 23:50:42 +00002028
Dale Johannesened2eee62009-02-06 01:31:28 +00002029 retval = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT,
2030 DAG.getNode(SPUISD::SHUFB, dl, N.getValueType(),
Scott Michel7a1c9e92008-11-22 23:50:42 +00002031 N, N, ShufMaskVec));
2032 } else {
2033 // Variable index: Rotate the requested element into slot 0, then replicate
2034 // slot 0 across the vector
2035 MVT VecVT = N.getValueType();
2036 if (!VecVT.isSimple() || !VecVT.isVector() || !VecVT.is128BitVector()) {
2037 cerr << "LowerEXTRACT_VECTOR_ELT: Must have a simple, 128-bit vector type!\n";
2038 abort();
2039 }
2040
2041 // Make life easier by making sure the index is zero-extended to i32
2042 if (Elt.getValueType() != MVT::i32)
Dale Johannesened2eee62009-02-06 01:31:28 +00002043 Elt = DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i32, Elt);
Scott Michel7a1c9e92008-11-22 23:50:42 +00002044
2045 // Scale the index to a bit/byte shift quantity
2046 APInt scaleFactor =
Scott Michel104de432008-11-24 17:11:17 +00002047 APInt(32, uint64_t(16 / N.getValueType().getVectorNumElements()), false);
2048 unsigned scaleShift = scaleFactor.logBase2();
Scott Michel7a1c9e92008-11-22 23:50:42 +00002049 SDValue vecShift;
Scott Michel7a1c9e92008-11-22 23:50:42 +00002050
Scott Michel104de432008-11-24 17:11:17 +00002051 if (scaleShift > 0) {
2052 // Scale the shift factor:
Dale Johannesened2eee62009-02-06 01:31:28 +00002053 Elt = DAG.getNode(ISD::SHL, dl, MVT::i32, Elt,
Scott Michel1a6cdb62008-12-01 17:56:02 +00002054 DAG.getConstant(scaleShift, MVT::i32));
Scott Michel7a1c9e92008-11-22 23:50:42 +00002055 }
2056
Dale Johannesened2eee62009-02-06 01:31:28 +00002057 vecShift = DAG.getNode(SPUISD::SHLQUAD_L_BYTES, dl, VecVT, N, Elt);
Scott Michel104de432008-11-24 17:11:17 +00002058
2059 // Replicate the bytes starting at byte 0 across the entire vector (for
2060 // consistency with the notion of a unified register set)
Scott Michel7a1c9e92008-11-22 23:50:42 +00002061 SDValue replicate;
2062
2063 switch (VT.getSimpleVT()) {
2064 default:
2065 cerr << "LowerEXTRACT_VECTOR_ELT(varable): Unhandled vector type\n";
2066 abort();
2067 /*NOTREACHED*/
2068 case MVT::i8: {
Scott Michel104de432008-11-24 17:11:17 +00002069 SDValue factor = DAG.getConstant(0x00000000, MVT::i32);
Evan Chenga87008d2009-02-25 22:49:59 +00002070 replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, factor, factor,
2071 factor, factor);
Scott Michel7a1c9e92008-11-22 23:50:42 +00002072 break;
2073 }
2074 case MVT::i16: {
Scott Michel104de432008-11-24 17:11:17 +00002075 SDValue factor = DAG.getConstant(0x00010001, MVT::i32);
Evan Chenga87008d2009-02-25 22:49:59 +00002076 replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, factor, factor,
2077 factor, factor);
Scott Michel7a1c9e92008-11-22 23:50:42 +00002078 break;
2079 }
2080 case MVT::i32:
2081 case MVT::f32: {
2082 SDValue factor = DAG.getConstant(0x00010203, MVT::i32);
Evan Chenga87008d2009-02-25 22:49:59 +00002083 replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, factor, factor,
2084 factor, factor);
Scott Michel7a1c9e92008-11-22 23:50:42 +00002085 break;
2086 }
2087 case MVT::i64:
2088 case MVT::f64: {
2089 SDValue loFactor = DAG.getConstant(0x00010203, MVT::i32);
2090 SDValue hiFactor = DAG.getConstant(0x04050607, MVT::i32);
Evan Chenga87008d2009-02-25 22:49:59 +00002091 replicate = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
2092 loFactor, hiFactor, loFactor, hiFactor);
Scott Michel7a1c9e92008-11-22 23:50:42 +00002093 break;
2094 }
2095 }
2096
Dale Johannesened2eee62009-02-06 01:31:28 +00002097 retval = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT,
2098 DAG.getNode(SPUISD::SHUFB, dl, VecVT,
Scott Michel1a6cdb62008-12-01 17:56:02 +00002099 vecShift, vecShift, replicate));
Scott Michel266bc8f2007-12-04 22:23:35 +00002100 }
2101
Scott Michel7a1c9e92008-11-22 23:50:42 +00002102 return retval;
Scott Michel266bc8f2007-12-04 22:23:35 +00002103}
2104
Dan Gohman475871a2008-07-27 21:46:04 +00002105static SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) {
2106 SDValue VecOp = Op.getOperand(0);
2107 SDValue ValOp = Op.getOperand(1);
2108 SDValue IdxOp = Op.getOperand(2);
Dale Johannesened2eee62009-02-06 01:31:28 +00002109 DebugLoc dl = Op.getDebugLoc();
Duncan Sands83ec4b62008-06-06 12:08:01 +00002110 MVT VT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +00002111
2112 ConstantSDNode *CN = cast<ConstantSDNode>(IdxOp);
2113 assert(CN != 0 && "LowerINSERT_VECTOR_ELT: Index is not constant!");
2114
Duncan Sands83ec4b62008-06-06 12:08:01 +00002115 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel1a6cdb62008-12-01 17:56:02 +00002116 // Use $sp ($1) because it's always 16-byte aligned and it's available:
Dale Johannesened2eee62009-02-06 01:31:28 +00002117 SDValue Pointer = DAG.getNode(SPUISD::IndirectAddr, dl, PtrVT,
Scott Michel1a6cdb62008-12-01 17:56:02 +00002118 DAG.getRegister(SPU::R1, PtrVT),
2119 DAG.getConstant(CN->getSExtValue(), PtrVT));
Dale Johannesened2eee62009-02-06 01:31:28 +00002120 SDValue ShufMask = DAG.getNode(SPUISD::SHUFFLE_MASK, dl, VT, Pointer);
Scott Michel266bc8f2007-12-04 22:23:35 +00002121
Dan Gohman475871a2008-07-27 21:46:04 +00002122 SDValue result =
Dale Johannesened2eee62009-02-06 01:31:28 +00002123 DAG.getNode(SPUISD::SHUFB, dl, VT,
2124 DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, VT, ValOp),
Scott Michel1df30c42008-12-29 03:23:36 +00002125 VecOp,
Dale Johannesened2eee62009-02-06 01:31:28 +00002126 DAG.getNode(ISD::BIT_CONVERT, dl, MVT::v4i32, ShufMask));
Scott Michel266bc8f2007-12-04 22:23:35 +00002127
2128 return result;
2129}
2130
Scott Michelf0569be2008-12-27 04:51:36 +00002131static SDValue LowerI8Math(SDValue Op, SelectionDAG &DAG, unsigned Opc,
2132 const TargetLowering &TLI)
Scott Michela59d4692008-02-23 18:41:37 +00002133{
Dan Gohman475871a2008-07-27 21:46:04 +00002134 SDValue N0 = Op.getOperand(0); // Everything has at least one operand
Dale Johannesened2eee62009-02-06 01:31:28 +00002135 DebugLoc dl = Op.getDebugLoc();
Scott Michelf0569be2008-12-27 04:51:36 +00002136 MVT ShiftVT = TLI.getShiftAmountTy();
Scott Michel266bc8f2007-12-04 22:23:35 +00002137
2138 assert(Op.getValueType() == MVT::i8);
2139 switch (Opc) {
2140 default:
2141 assert(0 && "Unhandled i8 math operator");
2142 /*NOTREACHED*/
2143 break;
Scott Michel02d711b2008-12-30 23:28:25 +00002144 case ISD::ADD: {
2145 // 8-bit addition: Promote the arguments up to 16-bits and truncate
2146 // the result:
2147 SDValue N1 = Op.getOperand(1);
Dale Johannesened2eee62009-02-06 01:31:28 +00002148 N0 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0);
2149 N1 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N1);
2150 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2151 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel02d711b2008-12-30 23:28:25 +00002152
2153 }
2154
Scott Michel266bc8f2007-12-04 22:23:35 +00002155 case ISD::SUB: {
2156 // 8-bit subtraction: Promote the arguments up to 16-bits and truncate
2157 // the result:
Dan Gohman475871a2008-07-27 21:46:04 +00002158 SDValue N1 = Op.getOperand(1);
Dale Johannesened2eee62009-02-06 01:31:28 +00002159 N0 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0);
2160 N1 = DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N1);
2161 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2162 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel5af8f0e2008-07-16 17:17:29 +00002163 }
Scott Michel266bc8f2007-12-04 22:23:35 +00002164 case ISD::ROTR:
2165 case ISD::ROTL: {
Dan Gohman475871a2008-07-27 21:46:04 +00002166 SDValue N1 = Op.getOperand(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00002167 unsigned N1Opc;
2168 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesened2eee62009-02-06 01:31:28 +00002169 ? DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i16, N0)
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002170 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
2171 MVT::i16));
Scott Michelf0569be2008-12-27 04:51:36 +00002172 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greif93c53e52008-08-31 15:37:04 +00002173 ? ISD::ZERO_EXTEND
2174 : ISD::TRUNCATE;
Scott Michel266bc8f2007-12-04 22:23:35 +00002175 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesened2eee62009-02-06 01:31:28 +00002176 ? DAG.getNode(N1Opc, dl, ShiftVT, N1)
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002177 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(),
Scott Michelf0569be2008-12-27 04:51:36 +00002178 TLI.getShiftAmountTy()));
Dan Gohman475871a2008-07-27 21:46:04 +00002179 SDValue ExpandArg =
Dale Johannesened2eee62009-02-06 01:31:28 +00002180 DAG.getNode(ISD::OR, dl, MVT::i16, N0,
2181 DAG.getNode(ISD::SHL, dl, MVT::i16,
Duncan Sandsfa7935f2008-10-30 19:24:28 +00002182 N0, DAG.getConstant(8, MVT::i32)));
Dale Johannesened2eee62009-02-06 01:31:28 +00002183 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2184 DAG.getNode(Opc, dl, MVT::i16, ExpandArg, N1));
Scott Michel266bc8f2007-12-04 22:23:35 +00002185 }
2186 case ISD::SRL:
2187 case ISD::SHL: {
Dan Gohman475871a2008-07-27 21:46:04 +00002188 SDValue N1 = Op.getOperand(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00002189 unsigned N1Opc;
2190 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesened2eee62009-02-06 01:31:28 +00002191 ? DAG.getNode(ISD::ZERO_EXTEND, dl, MVT::i16, N0)
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002192 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
Scott Michelf0569be2008-12-27 04:51:36 +00002193 MVT::i32));
2194 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greif93c53e52008-08-31 15:37:04 +00002195 ? ISD::ZERO_EXTEND
2196 : ISD::TRUNCATE;
Scott Michel266bc8f2007-12-04 22:23:35 +00002197 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesened2eee62009-02-06 01:31:28 +00002198 ? DAG.getNode(N1Opc, dl, ShiftVT, N1)
Scott Michelf0569be2008-12-27 04:51:36 +00002199 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(), ShiftVT));
Dale Johannesened2eee62009-02-06 01:31:28 +00002200 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2201 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel266bc8f2007-12-04 22:23:35 +00002202 }
2203 case ISD::SRA: {
Dan Gohman475871a2008-07-27 21:46:04 +00002204 SDValue N1 = Op.getOperand(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00002205 unsigned N1Opc;
2206 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesened2eee62009-02-06 01:31:28 +00002207 ? DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0)
Scott Michelf0569be2008-12-27 04:51:36 +00002208 : DAG.getConstant(cast<ConstantSDNode>(N0)->getSExtValue(),
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002209 MVT::i16));
Scott Michelf0569be2008-12-27 04:51:36 +00002210 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greif93c53e52008-08-31 15:37:04 +00002211 ? ISD::SIGN_EXTEND
2212 : ISD::TRUNCATE;
Scott Michel266bc8f2007-12-04 22:23:35 +00002213 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesened2eee62009-02-06 01:31:28 +00002214 ? DAG.getNode(N1Opc, dl, ShiftVT, N1)
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002215 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(),
Scott Michelf0569be2008-12-27 04:51:36 +00002216 ShiftVT));
Dale Johannesened2eee62009-02-06 01:31:28 +00002217 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2218 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel266bc8f2007-12-04 22:23:35 +00002219 }
2220 case ISD::MUL: {
Dan Gohman475871a2008-07-27 21:46:04 +00002221 SDValue N1 = Op.getOperand(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00002222 unsigned N1Opc;
2223 N0 = (N0.getOpcode() != ISD::Constant
Dale Johannesened2eee62009-02-06 01:31:28 +00002224 ? DAG.getNode(ISD::SIGN_EXTEND, dl, MVT::i16, N0)
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002225 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
2226 MVT::i16));
Duncan Sands8e4eb092008-06-08 20:54:56 +00002227 N1Opc = N1.getValueType().bitsLT(MVT::i16) ? ISD::SIGN_EXTEND : ISD::TRUNCATE;
Scott Michel266bc8f2007-12-04 22:23:35 +00002228 N1 = (N1.getOpcode() != ISD::Constant
Dale Johannesened2eee62009-02-06 01:31:28 +00002229 ? DAG.getNode(N1Opc, dl, MVT::i16, N1)
Scott Michelf0569be2008-12-27 04:51:36 +00002230 : DAG.getConstant(cast<ConstantSDNode>(N1)->getSExtValue(),
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002231 MVT::i16));
Dale Johannesened2eee62009-02-06 01:31:28 +00002232 return DAG.getNode(ISD::TRUNCATE, dl, MVT::i8,
2233 DAG.getNode(Opc, dl, MVT::i16, N0, N1));
Scott Michel266bc8f2007-12-04 22:23:35 +00002234 break;
2235 }
2236 }
2237
Dan Gohman475871a2008-07-27 21:46:04 +00002238 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00002239}
2240
Scott Michel94bd57e2009-01-15 04:41:47 +00002241//! Generate the carry-generate shuffle mask.
Dale Johannesened2eee62009-02-06 01:31:28 +00002242SDValue SPU::getCarryGenerateShufMask(SelectionDAG &DAG, DebugLoc dl) {
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002243 SmallVector<SDValue, 16 > ShufBytes;
Scott Michela59d4692008-02-23 18:41:37 +00002244
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002245 // Create the shuffle mask for "rotating" the borrow up one register slot
2246 // once the borrow is generated.
2247 ShufBytes.push_back(DAG.getConstant(0x04050607, MVT::i32));
2248 ShufBytes.push_back(DAG.getConstant(0x80808080, MVT::i32));
2249 ShufBytes.push_back(DAG.getConstant(0x0c0d0e0f, MVT::i32));
2250 ShufBytes.push_back(DAG.getConstant(0x80808080, MVT::i32));
Scott Michela59d4692008-02-23 18:41:37 +00002251
Evan Chenga87008d2009-02-25 22:49:59 +00002252 return DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
2253 &ShufBytes[0], ShufBytes.size());
Scott Michel94bd57e2009-01-15 04:41:47 +00002254}
Scott Michela59d4692008-02-23 18:41:37 +00002255
Scott Michel94bd57e2009-01-15 04:41:47 +00002256//! Generate the borrow-generate shuffle mask
Dale Johannesened2eee62009-02-06 01:31:28 +00002257SDValue SPU::getBorrowGenerateShufMask(SelectionDAG &DAG, DebugLoc dl) {
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002258 SmallVector<SDValue, 16 > ShufBytes;
Scott Michela59d4692008-02-23 18:41:37 +00002259
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002260 // Create the shuffle mask for "rotating" the borrow up one register slot
2261 // once the borrow is generated.
2262 ShufBytes.push_back(DAG.getConstant(0x04050607, MVT::i32));
2263 ShufBytes.push_back(DAG.getConstant(0xc0c0c0c0, MVT::i32));
2264 ShufBytes.push_back(DAG.getConstant(0x0c0d0e0f, MVT::i32));
2265 ShufBytes.push_back(DAG.getConstant(0xc0c0c0c0, MVT::i32));
Scott Michel045a1452008-11-24 18:20:46 +00002266
Evan Chenga87008d2009-02-25 22:49:59 +00002267 return DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
2268 &ShufBytes[0], ShufBytes.size());
Scott Michela59d4692008-02-23 18:41:37 +00002269}
2270
Scott Michel266bc8f2007-12-04 22:23:35 +00002271//! Lower byte immediate operations for v16i8 vectors:
Dan Gohman475871a2008-07-27 21:46:04 +00002272static SDValue
2273LowerByteImmed(SDValue Op, SelectionDAG &DAG) {
2274 SDValue ConstVec;
2275 SDValue Arg;
Duncan Sands83ec4b62008-06-06 12:08:01 +00002276 MVT VT = Op.getValueType();
Dale Johannesened2eee62009-02-06 01:31:28 +00002277 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +00002278
2279 ConstVec = Op.getOperand(0);
2280 Arg = Op.getOperand(1);
Gabor Greifba36cb52008-08-28 21:40:38 +00002281 if (ConstVec.getNode()->getOpcode() != ISD::BUILD_VECTOR) {
2282 if (ConstVec.getNode()->getOpcode() == ISD::BIT_CONVERT) {
Scott Michel266bc8f2007-12-04 22:23:35 +00002283 ConstVec = ConstVec.getOperand(0);
2284 } else {
2285 ConstVec = Op.getOperand(1);
2286 Arg = Op.getOperand(0);
Gabor Greifba36cb52008-08-28 21:40:38 +00002287 if (ConstVec.getNode()->getOpcode() == ISD::BIT_CONVERT) {
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002288 ConstVec = ConstVec.getOperand(0);
Scott Michel266bc8f2007-12-04 22:23:35 +00002289 }
2290 }
2291 }
2292
Gabor Greifba36cb52008-08-28 21:40:38 +00002293 if (ConstVec.getNode()->getOpcode() == ISD::BUILD_VECTOR) {
Scott Michel266bc8f2007-12-04 22:23:35 +00002294 uint64_t VectorBits[2];
2295 uint64_t UndefBits[2];
2296 uint64_t SplatBits, SplatUndef;
2297 int SplatSize;
2298
Gabor Greifba36cb52008-08-28 21:40:38 +00002299 if (!GetConstantBuildVectorBits(ConstVec.getNode(), VectorBits, UndefBits)
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002300 && isConstantSplat(VectorBits, UndefBits,
Duncan Sands83ec4b62008-06-06 12:08:01 +00002301 VT.getVectorElementType().getSizeInBits(),
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002302 SplatBits, SplatUndef, SplatSize)) {
Dan Gohman475871a2008-07-27 21:46:04 +00002303 SDValue tcVec[16];
2304 SDValue tc = DAG.getTargetConstant(SplatBits & 0xff, MVT::i8);
Scott Michel266bc8f2007-12-04 22:23:35 +00002305 const size_t tcVecSize = sizeof(tcVec) / sizeof(tcVec[0]);
2306
2307 // Turn the BUILD_VECTOR into a set of target constants:
2308 for (size_t i = 0; i < tcVecSize; ++i)
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002309 tcVec[i] = tc;
Scott Michel266bc8f2007-12-04 22:23:35 +00002310
Dale Johannesened2eee62009-02-06 01:31:28 +00002311 return DAG.getNode(Op.getNode()->getOpcode(), dl, VT, Arg,
Evan Chenga87008d2009-02-25 22:49:59 +00002312 DAG.getNode(ISD::BUILD_VECTOR, dl, VT,
2313 tcVec, tcVecSize));
Scott Michel266bc8f2007-12-04 22:23:35 +00002314 }
2315 }
Scott Michel9de57a92009-01-26 22:33:37 +00002316
Nate Begeman24dc3462008-07-29 19:07:27 +00002317 // These operations (AND, OR, XOR) are legal, they just couldn't be custom
2318 // lowered. Return the operation, rather than a null SDValue.
2319 return Op;
Scott Michel266bc8f2007-12-04 22:23:35 +00002320}
2321
Scott Michel266bc8f2007-12-04 22:23:35 +00002322//! Custom lowering for CTPOP (count population)
2323/*!
2324 Custom lowering code that counts the number ones in the input
2325 operand. SPU has such an instruction, but it counts the number of
2326 ones per byte, which then have to be accumulated.
2327*/
Dan Gohman475871a2008-07-27 21:46:04 +00002328static SDValue LowerCTPOP(SDValue Op, SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00002329 MVT VT = Op.getValueType();
2330 MVT vecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits()));
Dale Johannesena05dca42009-02-04 23:02:30 +00002331 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +00002332
Duncan Sands83ec4b62008-06-06 12:08:01 +00002333 switch (VT.getSimpleVT()) {
2334 default:
2335 assert(false && "Invalid value type!");
Scott Michel266bc8f2007-12-04 22:23:35 +00002336 case MVT::i8: {
Dan Gohman475871a2008-07-27 21:46:04 +00002337 SDValue N = Op.getOperand(0);
2338 SDValue Elt0 = DAG.getConstant(0, MVT::i32);
Scott Michel266bc8f2007-12-04 22:23:35 +00002339
Dale Johannesena05dca42009-02-04 23:02:30 +00002340 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N);
2341 SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote);
Scott Michel266bc8f2007-12-04 22:23:35 +00002342
Dale Johannesena05dca42009-02-04 23:02:30 +00002343 return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i8, CNTB, Elt0);
Scott Michel266bc8f2007-12-04 22:23:35 +00002344 }
2345
2346 case MVT::i16: {
2347 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner84bc5422007-12-31 04:13:23 +00002348 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Michel266bc8f2007-12-04 22:23:35 +00002349
Chris Lattner84bc5422007-12-31 04:13:23 +00002350 unsigned CNTB_reg = RegInfo.createVirtualRegister(&SPU::R16CRegClass);
Scott Michel266bc8f2007-12-04 22:23:35 +00002351
Dan Gohman475871a2008-07-27 21:46:04 +00002352 SDValue N = Op.getOperand(0);
2353 SDValue Elt0 = DAG.getConstant(0, MVT::i16);
2354 SDValue Mask0 = DAG.getConstant(0x0f, MVT::i16);
Duncan Sandsfa7935f2008-10-30 19:24:28 +00002355 SDValue Shift1 = DAG.getConstant(8, MVT::i32);
Scott Michel266bc8f2007-12-04 22:23:35 +00002356
Dale Johannesena05dca42009-02-04 23:02:30 +00002357 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N);
2358 SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote);
Scott Michel266bc8f2007-12-04 22:23:35 +00002359
2360 // CNTB_result becomes the chain to which all of the virtual registers
2361 // CNTB_reg, SUM1_reg become associated:
Dan Gohman475871a2008-07-27 21:46:04 +00002362 SDValue CNTB_result =
Dale Johannesena05dca42009-02-04 23:02:30 +00002363 DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i16, CNTB, Elt0);
Scott Michel5af8f0e2008-07-16 17:17:29 +00002364
Dan Gohman475871a2008-07-27 21:46:04 +00002365 SDValue CNTB_rescopy =
Dale Johannesena05dca42009-02-04 23:02:30 +00002366 DAG.getCopyToReg(CNTB_result, dl, CNTB_reg, CNTB_result);
Scott Michel266bc8f2007-12-04 22:23:35 +00002367
Dale Johannesena05dca42009-02-04 23:02:30 +00002368 SDValue Tmp1 = DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i16);
Scott Michel266bc8f2007-12-04 22:23:35 +00002369
Dale Johannesena05dca42009-02-04 23:02:30 +00002370 return DAG.getNode(ISD::AND, dl, MVT::i16,
2371 DAG.getNode(ISD::ADD, dl, MVT::i16,
2372 DAG.getNode(ISD::SRL, dl, MVT::i16,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002373 Tmp1, Shift1),
2374 Tmp1),
2375 Mask0);
Scott Michel266bc8f2007-12-04 22:23:35 +00002376 }
2377
2378 case MVT::i32: {
2379 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner84bc5422007-12-31 04:13:23 +00002380 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Michel266bc8f2007-12-04 22:23:35 +00002381
Chris Lattner84bc5422007-12-31 04:13:23 +00002382 unsigned CNTB_reg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
2383 unsigned SUM1_reg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
Scott Michel266bc8f2007-12-04 22:23:35 +00002384
Dan Gohman475871a2008-07-27 21:46:04 +00002385 SDValue N = Op.getOperand(0);
2386 SDValue Elt0 = DAG.getConstant(0, MVT::i32);
2387 SDValue Mask0 = DAG.getConstant(0xff, MVT::i32);
2388 SDValue Shift1 = DAG.getConstant(16, MVT::i32);
2389 SDValue Shift2 = DAG.getConstant(8, MVT::i32);
Scott Michel266bc8f2007-12-04 22:23:35 +00002390
Dale Johannesena05dca42009-02-04 23:02:30 +00002391 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, dl, vecVT, N, N);
2392 SDValue CNTB = DAG.getNode(SPUISD::CNTB, dl, vecVT, Promote);
Scott Michel266bc8f2007-12-04 22:23:35 +00002393
2394 // CNTB_result becomes the chain to which all of the virtual registers
2395 // CNTB_reg, SUM1_reg become associated:
Dan Gohman475871a2008-07-27 21:46:04 +00002396 SDValue CNTB_result =
Dale Johannesena05dca42009-02-04 23:02:30 +00002397 DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::i32, CNTB, Elt0);
Scott Michel5af8f0e2008-07-16 17:17:29 +00002398
Dan Gohman475871a2008-07-27 21:46:04 +00002399 SDValue CNTB_rescopy =
Dale Johannesena05dca42009-02-04 23:02:30 +00002400 DAG.getCopyToReg(CNTB_result, dl, CNTB_reg, CNTB_result);
Scott Michel266bc8f2007-12-04 22:23:35 +00002401
Dan Gohman475871a2008-07-27 21:46:04 +00002402 SDValue Comp1 =
Dale Johannesena05dca42009-02-04 23:02:30 +00002403 DAG.getNode(ISD::SRL, dl, MVT::i32,
2404 DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i32),
2405 Shift1);
Scott Michel266bc8f2007-12-04 22:23:35 +00002406
Dan Gohman475871a2008-07-27 21:46:04 +00002407 SDValue Sum1 =
Dale Johannesena05dca42009-02-04 23:02:30 +00002408 DAG.getNode(ISD::ADD, dl, MVT::i32, Comp1,
2409 DAG.getCopyFromReg(CNTB_rescopy, dl, CNTB_reg, MVT::i32));
Scott Michel266bc8f2007-12-04 22:23:35 +00002410
Dan Gohman475871a2008-07-27 21:46:04 +00002411 SDValue Sum1_rescopy =
Dale Johannesena05dca42009-02-04 23:02:30 +00002412 DAG.getCopyToReg(CNTB_result, dl, SUM1_reg, Sum1);
Scott Michel266bc8f2007-12-04 22:23:35 +00002413
Dan Gohman475871a2008-07-27 21:46:04 +00002414 SDValue Comp2 =
Dale Johannesena05dca42009-02-04 23:02:30 +00002415 DAG.getNode(ISD::SRL, dl, MVT::i32,
2416 DAG.getCopyFromReg(Sum1_rescopy, dl, SUM1_reg, MVT::i32),
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002417 Shift2);
Dan Gohman475871a2008-07-27 21:46:04 +00002418 SDValue Sum2 =
Dale Johannesena05dca42009-02-04 23:02:30 +00002419 DAG.getNode(ISD::ADD, dl, MVT::i32, Comp2,
2420 DAG.getCopyFromReg(Sum1_rescopy, dl, SUM1_reg, MVT::i32));
Scott Michel266bc8f2007-12-04 22:23:35 +00002421
Dale Johannesena05dca42009-02-04 23:02:30 +00002422 return DAG.getNode(ISD::AND, dl, MVT::i32, Sum2, Mask0);
Scott Michel266bc8f2007-12-04 22:23:35 +00002423 }
2424
2425 case MVT::i64:
2426 break;
2427 }
2428
Dan Gohman475871a2008-07-27 21:46:04 +00002429 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00002430}
2431
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002432//! Lower ISD::FP_TO_SINT, ISD::FP_TO_UINT for i32
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002433/*!
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002434 f32->i32 passes through unchanged, whereas f64->i32 expands to a libcall.
2435 All conversions to i64 are expanded to a libcall.
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002436 */
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002437static SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG,
2438 SPUTargetLowering &TLI) {
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002439 MVT OpVT = Op.getValueType();
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002440 SDValue Op0 = Op.getOperand(0);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002441 MVT Op0VT = Op0.getValueType();
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002442
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002443 if ((OpVT == MVT::i32 && Op0VT == MVT::f64)
2444 || OpVT == MVT::i64) {
2445 // Convert f32 / f64 to i32 / i64 via libcall.
2446 RTLIB::Libcall LC =
2447 (Op.getOpcode() == ISD::FP_TO_SINT)
2448 ? RTLIB::getFPTOSINT(Op0VT, OpVT)
2449 : RTLIB::getFPTOUINT(Op0VT, OpVT);
2450 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unexpectd fp-to-int conversion!");
2451 SDValue Dummy;
2452 return ExpandLibCall(LC, Op, DAG, false, Dummy, TLI);
2453 }
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002454
Scott Michel9de57a92009-01-26 22:33:37 +00002455 return Op; // return unmolested, legalized op
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002456}
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002457
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002458//! Lower ISD::SINT_TO_FP, ISD::UINT_TO_FP for i32
2459/*!
2460 i32->f32 passes through unchanged, whereas i32->f64 is expanded to a libcall.
2461 All conversions from i64 are expanded to a libcall.
2462 */
2463static SDValue LowerINT_TO_FP(SDValue Op, SelectionDAG &DAG,
2464 SPUTargetLowering &TLI) {
2465 MVT OpVT = Op.getValueType();
2466 SDValue Op0 = Op.getOperand(0);
2467 MVT Op0VT = Op0.getValueType();
2468
2469 if ((OpVT == MVT::f64 && Op0VT == MVT::i32)
2470 || Op0VT == MVT::i64) {
2471 // Convert i32, i64 to f64 via libcall:
2472 RTLIB::Libcall LC =
2473 (Op.getOpcode() == ISD::SINT_TO_FP)
2474 ? RTLIB::getSINTTOFP(Op0VT, OpVT)
2475 : RTLIB::getUINTTOFP(Op0VT, OpVT);
2476 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unexpectd int-to-fp conversion!");
2477 SDValue Dummy;
2478 return ExpandLibCall(LC, Op, DAG, false, Dummy, TLI);
2479 }
2480
Scott Michel9de57a92009-01-26 22:33:37 +00002481 return Op; // return unmolested, legalized
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002482}
2483
2484//! Lower ISD::SETCC
2485/*!
2486 This handles MVT::f64 (double floating point) condition lowering
2487 */
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002488static SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG,
2489 const TargetLowering &TLI) {
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002490 CondCodeSDNode *CC = dyn_cast<CondCodeSDNode>(Op.getOperand(2));
Dale Johannesen6f38cb62009-02-07 19:59:05 +00002491 DebugLoc dl = Op.getDebugLoc();
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002492 assert(CC != 0 && "LowerSETCC: CondCodeSDNode should not be null here!\n");
2493
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002494 SDValue lhs = Op.getOperand(0);
2495 SDValue rhs = Op.getOperand(1);
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002496 MVT lhsVT = lhs.getValueType();
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002497 assert(lhsVT == MVT::f64 && "LowerSETCC: type other than MVT::64\n");
2498
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002499 MVT ccResultVT = TLI.getSetCCResultType(lhs.getValueType());
2500 APInt ccResultOnes = APInt::getAllOnesValue(ccResultVT.getSizeInBits());
2501 MVT IntVT(MVT::i64);
2502
2503 // Take advantage of the fact that (truncate (sra arg, 32)) is efficiently
2504 // selected to a NOP:
Dale Johannesenf5d97892009-02-04 01:48:28 +00002505 SDValue i64lhs = DAG.getNode(ISD::BIT_CONVERT, dl, IntVT, lhs);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002506 SDValue lhsHi32 =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002507 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32,
2508 DAG.getNode(ISD::SRL, dl, IntVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002509 i64lhs, DAG.getConstant(32, MVT::i32)));
2510 SDValue lhsHi32abs =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002511 DAG.getNode(ISD::AND, dl, MVT::i32,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002512 lhsHi32, DAG.getConstant(0x7fffffff, MVT::i32));
2513 SDValue lhsLo32 =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002514 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, i64lhs);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002515
2516 // SETO and SETUO only use the lhs operand:
2517 if (CC->get() == ISD::SETO) {
2518 // Evaluates to true if Op0 is not [SQ]NaN - lowers to the inverse of
2519 // SETUO
2520 APInt ccResultAllOnes = APInt::getAllOnesValue(ccResultVT.getSizeInBits());
Dale Johannesenf5d97892009-02-04 01:48:28 +00002521 return DAG.getNode(ISD::XOR, dl, ccResultVT,
2522 DAG.getSetCC(dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002523 lhs, DAG.getConstantFP(0.0, lhsVT),
2524 ISD::SETUO),
2525 DAG.getConstant(ccResultAllOnes, ccResultVT));
2526 } else if (CC->get() == ISD::SETUO) {
2527 // Evaluates to true if Op0 is [SQ]NaN
Dale Johannesenf5d97892009-02-04 01:48:28 +00002528 return DAG.getNode(ISD::AND, dl, ccResultVT,
2529 DAG.getSetCC(dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002530 lhsHi32abs,
2531 DAG.getConstant(0x7ff00000, MVT::i32),
2532 ISD::SETGE),
Dale Johannesenf5d97892009-02-04 01:48:28 +00002533 DAG.getSetCC(dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002534 lhsLo32,
2535 DAG.getConstant(0, MVT::i32),
2536 ISD::SETGT));
2537 }
2538
Dale Johannesenb300d2a2009-02-07 00:55:49 +00002539 SDValue i64rhs = DAG.getNode(ISD::BIT_CONVERT, dl, IntVT, rhs);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002540 SDValue rhsHi32 =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002541 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32,
2542 DAG.getNode(ISD::SRL, dl, IntVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002543 i64rhs, DAG.getConstant(32, MVT::i32)));
2544
2545 // If a value is negative, subtract from the sign magnitude constant:
2546 SDValue signMag2TC = DAG.getConstant(0x8000000000000000ULL, IntVT);
2547
2548 // Convert the sign-magnitude representation into 2's complement:
Dale Johannesenf5d97892009-02-04 01:48:28 +00002549 SDValue lhsSelectMask = DAG.getNode(ISD::SRA, dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002550 lhsHi32, DAG.getConstant(31, MVT::i32));
Dale Johannesenf5d97892009-02-04 01:48:28 +00002551 SDValue lhsSignMag2TC = DAG.getNode(ISD::SUB, dl, IntVT, signMag2TC, i64lhs);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002552 SDValue lhsSelect =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002553 DAG.getNode(ISD::SELECT, dl, IntVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002554 lhsSelectMask, lhsSignMag2TC, i64lhs);
2555
Dale Johannesenf5d97892009-02-04 01:48:28 +00002556 SDValue rhsSelectMask = DAG.getNode(ISD::SRA, dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002557 rhsHi32, DAG.getConstant(31, MVT::i32));
Dale Johannesenf5d97892009-02-04 01:48:28 +00002558 SDValue rhsSignMag2TC = DAG.getNode(ISD::SUB, dl, IntVT, signMag2TC, i64rhs);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002559 SDValue rhsSelect =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002560 DAG.getNode(ISD::SELECT, dl, IntVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002561 rhsSelectMask, rhsSignMag2TC, i64rhs);
2562
2563 unsigned compareOp;
2564
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002565 switch (CC->get()) {
2566 case ISD::SETOEQ:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002567 case ISD::SETUEQ:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002568 compareOp = ISD::SETEQ; break;
2569 case ISD::SETOGT:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002570 case ISD::SETUGT:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002571 compareOp = ISD::SETGT; break;
2572 case ISD::SETOGE:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002573 case ISD::SETUGE:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002574 compareOp = ISD::SETGE; break;
2575 case ISD::SETOLT:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002576 case ISD::SETULT:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002577 compareOp = ISD::SETLT; break;
2578 case ISD::SETOLE:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002579 case ISD::SETULE:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002580 compareOp = ISD::SETLE; break;
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002581 case ISD::SETUNE:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002582 case ISD::SETONE:
2583 compareOp = ISD::SETNE; break;
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002584 default:
2585 cerr << "CellSPU ISel Select: unimplemented f64 condition\n";
2586 abort();
2587 break;
2588 }
2589
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002590 SDValue result =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002591 DAG.getSetCC(dl, ccResultVT, lhsSelect, rhsSelect,
2592 (ISD::CondCode) compareOp);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002593
2594 if ((CC->get() & 0x8) == 0) {
2595 // Ordered comparison:
Dale Johannesenf5d97892009-02-04 01:48:28 +00002596 SDValue lhsNaN = DAG.getSetCC(dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002597 lhs, DAG.getConstantFP(0.0, MVT::f64),
2598 ISD::SETO);
Dale Johannesenf5d97892009-02-04 01:48:28 +00002599 SDValue rhsNaN = DAG.getSetCC(dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002600 rhs, DAG.getConstantFP(0.0, MVT::f64),
2601 ISD::SETO);
Dale Johannesenf5d97892009-02-04 01:48:28 +00002602 SDValue ordered = DAG.getNode(ISD::AND, dl, ccResultVT, lhsNaN, rhsNaN);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002603
Dale Johannesenf5d97892009-02-04 01:48:28 +00002604 result = DAG.getNode(ISD::AND, dl, ccResultVT, ordered, result);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002605 }
2606
2607 return result;
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002608}
2609
Scott Michel7a1c9e92008-11-22 23:50:42 +00002610//! Lower ISD::SELECT_CC
2611/*!
2612 ISD::SELECT_CC can (generally) be implemented directly on the SPU using the
2613 SELB instruction.
2614
2615 \note Need to revisit this in the future: if the code path through the true
2616 and false value computations is longer than the latency of a branch (6
2617 cycles), then it would be more advantageous to branch and insert a new basic
2618 block and branch on the condition. However, this code does not make that
2619 assumption, given the simplisitc uses so far.
2620 */
2621
Scott Michelf0569be2008-12-27 04:51:36 +00002622static SDValue LowerSELECT_CC(SDValue Op, SelectionDAG &DAG,
2623 const TargetLowering &TLI) {
Scott Michel7a1c9e92008-11-22 23:50:42 +00002624 MVT VT = Op.getValueType();
2625 SDValue lhs = Op.getOperand(0);
2626 SDValue rhs = Op.getOperand(1);
2627 SDValue trueval = Op.getOperand(2);
2628 SDValue falseval = Op.getOperand(3);
2629 SDValue condition = Op.getOperand(4);
Dale Johannesende064702009-02-06 21:50:26 +00002630 DebugLoc dl = Op.getDebugLoc();
Scott Michel7a1c9e92008-11-22 23:50:42 +00002631
Scott Michelf0569be2008-12-27 04:51:36 +00002632 // NOTE: SELB's arguments: $rA, $rB, $mask
2633 //
2634 // SELB selects bits from $rA where bits in $mask are 0, bits from $rB
2635 // where bits in $mask are 1. CCond will be inverted, having 1s where the
2636 // condition was true and 0s where the condition was false. Hence, the
2637 // arguments to SELB get reversed.
2638
Scott Michel7a1c9e92008-11-22 23:50:42 +00002639 // Note: Really should be ISD::SELECT instead of SPUISD::SELB, but LLVM's
2640 // legalizer insists on combining SETCC/SELECT into SELECT_CC, so we end up
2641 // with another "cannot select select_cc" assert:
2642
Dale Johannesende064702009-02-06 21:50:26 +00002643 SDValue compare = DAG.getNode(ISD::SETCC, dl,
Duncan Sands5480c042009-01-01 15:52:00 +00002644 TLI.getSetCCResultType(Op.getValueType()),
Scott Michelf0569be2008-12-27 04:51:36 +00002645 lhs, rhs, condition);
Dale Johannesende064702009-02-06 21:50:26 +00002646 return DAG.getNode(SPUISD::SELB, dl, VT, falseval, trueval, compare);
Scott Michel7a1c9e92008-11-22 23:50:42 +00002647}
2648
Scott Michelb30e8f62008-12-02 19:53:53 +00002649//! Custom lower ISD::TRUNCATE
2650static SDValue LowerTRUNCATE(SDValue Op, SelectionDAG &DAG)
2651{
2652 MVT VT = Op.getValueType();
2653 MVT::SimpleValueType simpleVT = VT.getSimpleVT();
2654 MVT VecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits()));
Dale Johannesende064702009-02-06 21:50:26 +00002655 DebugLoc dl = Op.getDebugLoc();
Scott Michelb30e8f62008-12-02 19:53:53 +00002656
2657 SDValue Op0 = Op.getOperand(0);
2658 MVT Op0VT = Op0.getValueType();
2659 MVT Op0VecVT = MVT::getVectorVT(Op0VT, (128 / Op0VT.getSizeInBits()));
2660
Scott Michelf0569be2008-12-27 04:51:36 +00002661 if (Op0VT.getSimpleVT() == MVT::i128 && simpleVT == MVT::i64) {
Scott Michel52d00012009-01-03 00:27:53 +00002662 // Create shuffle mask, least significant doubleword of quadword
Scott Michelf0569be2008-12-27 04:51:36 +00002663 unsigned maskHigh = 0x08090a0b;
2664 unsigned maskLow = 0x0c0d0e0f;
2665 // Use a shuffle to perform the truncation
Evan Chenga87008d2009-02-25 22:49:59 +00002666 SDValue shufMask = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32,
2667 DAG.getConstant(maskHigh, MVT::i32),
2668 DAG.getConstant(maskLow, MVT::i32),
2669 DAG.getConstant(maskHigh, MVT::i32),
2670 DAG.getConstant(maskLow, MVT::i32));
Scott Michelf0569be2008-12-27 04:51:36 +00002671
2672
Dale Johannesende064702009-02-06 21:50:26 +00002673 SDValue PromoteScalar = DAG.getNode(SPUISD::PREFSLOT2VEC, dl,
2674 Op0VecVT, Op0);
Scott Michelf0569be2008-12-27 04:51:36 +00002675
Dale Johannesende064702009-02-06 21:50:26 +00002676 SDValue truncShuffle = DAG.getNode(SPUISD::SHUFB, dl, Op0VecVT,
Scott Michelf0569be2008-12-27 04:51:36 +00002677 PromoteScalar, PromoteScalar, shufMask);
2678
Dale Johannesende064702009-02-06 21:50:26 +00002679 return DAG.getNode(SPUISD::VEC2PREFSLOT, dl, VT,
Dale Johannesenb300d2a2009-02-07 00:55:49 +00002680 DAG.getNode(ISD::BIT_CONVERT, dl, VecVT, truncShuffle));
Scott Michelb30e8f62008-12-02 19:53:53 +00002681 }
2682
Scott Michelf0569be2008-12-27 04:51:36 +00002683 return SDValue(); // Leave the truncate unmolested
Scott Michelb30e8f62008-12-02 19:53:53 +00002684}
2685
Scott Michel7a1c9e92008-11-22 23:50:42 +00002686//! Custom (target-specific) lowering entry point
2687/*!
2688 This is where LLVM's DAG selection process calls to do target-specific
2689 lowering of nodes.
2690 */
Dan Gohman475871a2008-07-27 21:46:04 +00002691SDValue
2692SPUTargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG)
Scott Michel266bc8f2007-12-04 22:23:35 +00002693{
Scott Michela59d4692008-02-23 18:41:37 +00002694 unsigned Opc = (unsigned) Op.getOpcode();
Duncan Sands83ec4b62008-06-06 12:08:01 +00002695 MVT VT = Op.getValueType();
Scott Michela59d4692008-02-23 18:41:37 +00002696
2697 switch (Opc) {
Scott Michel266bc8f2007-12-04 22:23:35 +00002698 default: {
2699 cerr << "SPUTargetLowering::LowerOperation(): need to lower this!\n";
Scott Michela59d4692008-02-23 18:41:37 +00002700 cerr << "Op.getOpcode() = " << Opc << "\n";
Gabor Greifba36cb52008-08-28 21:40:38 +00002701 cerr << "*Op.getNode():\n";
2702 Op.getNode()->dump();
Scott Michel266bc8f2007-12-04 22:23:35 +00002703 abort();
2704 }
2705 case ISD::LOAD:
Scott Michelb30e8f62008-12-02 19:53:53 +00002706 case ISD::EXTLOAD:
Scott Michel266bc8f2007-12-04 22:23:35 +00002707 case ISD::SEXTLOAD:
2708 case ISD::ZEXTLOAD:
2709 return LowerLOAD(Op, DAG, SPUTM.getSubtargetImpl());
2710 case ISD::STORE:
2711 return LowerSTORE(Op, DAG, SPUTM.getSubtargetImpl());
2712 case ISD::ConstantPool:
2713 return LowerConstantPool(Op, DAG, SPUTM.getSubtargetImpl());
2714 case ISD::GlobalAddress:
2715 return LowerGlobalAddress(Op, DAG, SPUTM.getSubtargetImpl());
2716 case ISD::JumpTable:
2717 return LowerJumpTable(Op, DAG, SPUTM.getSubtargetImpl());
Scott Michel266bc8f2007-12-04 22:23:35 +00002718 case ISD::ConstantFP:
2719 return LowerConstantFP(Op, DAG);
2720 case ISD::FORMAL_ARGUMENTS:
Scott Michel58c58182008-01-17 20:38:41 +00002721 return LowerFORMAL_ARGUMENTS(Op, DAG, VarArgsFrameIndex);
Scott Michel266bc8f2007-12-04 22:23:35 +00002722 case ISD::CALL:
Scott Michel9de5d0d2008-01-11 02:53:15 +00002723 return LowerCALL(Op, DAG, SPUTM.getSubtargetImpl());
Scott Michel266bc8f2007-12-04 22:23:35 +00002724 case ISD::RET:
2725 return LowerRET(Op, DAG, getTargetMachine());
2726
Scott Michel02d711b2008-12-30 23:28:25 +00002727 // i8, i64 math ops:
Scott Michel8bf61e82008-06-02 22:18:03 +00002728 case ISD::ADD:
Scott Michel266bc8f2007-12-04 22:23:35 +00002729 case ISD::SUB:
2730 case ISD::ROTR:
2731 case ISD::ROTL:
2732 case ISD::SRL:
2733 case ISD::SHL:
Scott Michel8bf61e82008-06-02 22:18:03 +00002734 case ISD::SRA: {
Scott Michela59d4692008-02-23 18:41:37 +00002735 if (VT == MVT::i8)
Scott Michelf0569be2008-12-27 04:51:36 +00002736 return LowerI8Math(Op, DAG, Opc, *this);
Scott Michela59d4692008-02-23 18:41:37 +00002737 break;
Scott Michel8bf61e82008-06-02 22:18:03 +00002738 }
Scott Michel266bc8f2007-12-04 22:23:35 +00002739
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002740 case ISD::FP_TO_SINT:
2741 case ISD::FP_TO_UINT:
2742 return LowerFP_TO_INT(Op, DAG, *this);
2743
2744 case ISD::SINT_TO_FP:
2745 case ISD::UINT_TO_FP:
2746 return LowerINT_TO_FP(Op, DAG, *this);
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002747
Scott Michel266bc8f2007-12-04 22:23:35 +00002748 // Vector-related lowering.
2749 case ISD::BUILD_VECTOR:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002750 return LowerBUILD_VECTOR(Op, DAG);
Scott Michel266bc8f2007-12-04 22:23:35 +00002751 case ISD::SCALAR_TO_VECTOR:
2752 return LowerSCALAR_TO_VECTOR(Op, DAG);
2753 case ISD::VECTOR_SHUFFLE:
2754 return LowerVECTOR_SHUFFLE(Op, DAG);
2755 case ISD::EXTRACT_VECTOR_ELT:
2756 return LowerEXTRACT_VECTOR_ELT(Op, DAG);
2757 case ISD::INSERT_VECTOR_ELT:
2758 return LowerINSERT_VECTOR_ELT(Op, DAG);
2759
2760 // Look for ANDBI, ORBI and XORBI opportunities and lower appropriately:
2761 case ISD::AND:
2762 case ISD::OR:
2763 case ISD::XOR:
2764 return LowerByteImmed(Op, DAG);
2765
2766 // Vector and i8 multiply:
2767 case ISD::MUL:
Scott Michel02d711b2008-12-30 23:28:25 +00002768 if (VT == MVT::i8)
Scott Michelf0569be2008-12-27 04:51:36 +00002769 return LowerI8Math(Op, DAG, Opc, *this);
Scott Michel266bc8f2007-12-04 22:23:35 +00002770
Scott Michel266bc8f2007-12-04 22:23:35 +00002771 case ISD::CTPOP:
2772 return LowerCTPOP(Op, DAG);
Scott Michel7a1c9e92008-11-22 23:50:42 +00002773
2774 case ISD::SELECT_CC:
Scott Michelf0569be2008-12-27 04:51:36 +00002775 return LowerSELECT_CC(Op, DAG, *this);
Scott Michelb30e8f62008-12-02 19:53:53 +00002776
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002777 case ISD::SETCC:
2778 return LowerSETCC(Op, DAG, *this);
2779
Scott Michelb30e8f62008-12-02 19:53:53 +00002780 case ISD::TRUNCATE:
2781 return LowerTRUNCATE(Op, DAG);
Scott Michel266bc8f2007-12-04 22:23:35 +00002782 }
2783
Dan Gohman475871a2008-07-27 21:46:04 +00002784 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00002785}
2786
Duncan Sands1607f052008-12-01 11:39:25 +00002787void SPUTargetLowering::ReplaceNodeResults(SDNode *N,
2788 SmallVectorImpl<SDValue>&Results,
2789 SelectionDAG &DAG)
Scott Michel73ce1c52008-11-10 23:43:06 +00002790{
2791#if 0
2792 unsigned Opc = (unsigned) N->getOpcode();
2793 MVT OpVT = N->getValueType(0);
2794
2795 switch (Opc) {
2796 default: {
2797 cerr << "SPUTargetLowering::ReplaceNodeResults(): need to fix this!\n";
2798 cerr << "Op.getOpcode() = " << Opc << "\n";
2799 cerr << "*Op.getNode():\n";
2800 N->dump();
2801 abort();
2802 /*NOTREACHED*/
2803 }
2804 }
2805#endif
2806
2807 /* Otherwise, return unchanged */
Scott Michel73ce1c52008-11-10 23:43:06 +00002808}
2809
Scott Michel266bc8f2007-12-04 22:23:35 +00002810//===----------------------------------------------------------------------===//
Scott Michel266bc8f2007-12-04 22:23:35 +00002811// Target Optimization Hooks
2812//===----------------------------------------------------------------------===//
2813
Dan Gohman475871a2008-07-27 21:46:04 +00002814SDValue
Scott Michel266bc8f2007-12-04 22:23:35 +00002815SPUTargetLowering::PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const
2816{
2817#if 0
2818 TargetMachine &TM = getTargetMachine();
Scott Michel053c1da2008-01-29 02:16:57 +00002819#endif
2820 const SPUSubtarget *ST = SPUTM.getSubtargetImpl();
Scott Michel266bc8f2007-12-04 22:23:35 +00002821 SelectionDAG &DAG = DCI.DAG;
Scott Michel1a6cdb62008-12-01 17:56:02 +00002822 SDValue Op0 = N->getOperand(0); // everything has at least one operand
2823 MVT NodeVT = N->getValueType(0); // The node's value type
Scott Michelf0569be2008-12-27 04:51:36 +00002824 MVT Op0VT = Op0.getValueType(); // The first operand's result
Scott Michel1a6cdb62008-12-01 17:56:02 +00002825 SDValue Result; // Initially, empty result
Dale Johannesende064702009-02-06 21:50:26 +00002826 DebugLoc dl = N->getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +00002827
2828 switch (N->getOpcode()) {
2829 default: break;
Scott Michel053c1da2008-01-29 02:16:57 +00002830 case ISD::ADD: {
Dan Gohman475871a2008-07-27 21:46:04 +00002831 SDValue Op1 = N->getOperand(1);
Scott Michel053c1da2008-01-29 02:16:57 +00002832
Scott Michelf0569be2008-12-27 04:51:36 +00002833 if (Op0.getOpcode() == SPUISD::IndirectAddr
2834 || Op1.getOpcode() == SPUISD::IndirectAddr) {
2835 // Normalize the operands to reduce repeated code
2836 SDValue IndirectArg = Op0, AddArg = Op1;
Scott Michel1df30c42008-12-29 03:23:36 +00002837
Scott Michelf0569be2008-12-27 04:51:36 +00002838 if (Op1.getOpcode() == SPUISD::IndirectAddr) {
2839 IndirectArg = Op1;
2840 AddArg = Op0;
2841 }
2842
2843 if (isa<ConstantSDNode>(AddArg)) {
2844 ConstantSDNode *CN0 = cast<ConstantSDNode > (AddArg);
2845 SDValue IndOp1 = IndirectArg.getOperand(1);
2846
2847 if (CN0->isNullValue()) {
2848 // (add (SPUindirect <arg>, <arg>), 0) ->
2849 // (SPUindirect <arg>, <arg>)
Scott Michel053c1da2008-01-29 02:16:57 +00002850
Scott Michel23f2ff72008-12-04 17:16:59 +00002851#if !defined(NDEBUG)
Scott Michelf0569be2008-12-27 04:51:36 +00002852 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
Scott Michel30ee7df2008-12-04 03:02:42 +00002853 cerr << "\n"
Scott Michelf0569be2008-12-27 04:51:36 +00002854 << "Replace: (add (SPUindirect <arg>, <arg>), 0)\n"
2855 << "With: (SPUindirect <arg>, <arg>)\n";
2856 }
Scott Michel30ee7df2008-12-04 03:02:42 +00002857#endif
2858
Scott Michelf0569be2008-12-27 04:51:36 +00002859 return IndirectArg;
2860 } else if (isa<ConstantSDNode>(IndOp1)) {
2861 // (add (SPUindirect <arg>, <const>), <const>) ->
2862 // (SPUindirect <arg>, <const + const>)
2863 ConstantSDNode *CN1 = cast<ConstantSDNode > (IndOp1);
2864 int64_t combinedConst = CN0->getSExtValue() + CN1->getSExtValue();
2865 SDValue combinedValue = DAG.getConstant(combinedConst, Op0VT);
Scott Michel053c1da2008-01-29 02:16:57 +00002866
Scott Michelf0569be2008-12-27 04:51:36 +00002867#if !defined(NDEBUG)
2868 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
2869 cerr << "\n"
2870 << "Replace: (add (SPUindirect <arg>, " << CN1->getSExtValue()
2871 << "), " << CN0->getSExtValue() << ")\n"
2872 << "With: (SPUindirect <arg>, "
2873 << combinedConst << ")\n";
2874 }
2875#endif
Scott Michel053c1da2008-01-29 02:16:57 +00002876
Dale Johannesende064702009-02-06 21:50:26 +00002877 return DAG.getNode(SPUISD::IndirectAddr, dl, Op0VT,
Scott Michelf0569be2008-12-27 04:51:36 +00002878 IndirectArg, combinedValue);
2879 }
Scott Michel053c1da2008-01-29 02:16:57 +00002880 }
2881 }
Scott Michela59d4692008-02-23 18:41:37 +00002882 break;
2883 }
2884 case ISD::SIGN_EXTEND:
2885 case ISD::ZERO_EXTEND:
2886 case ISD::ANY_EXTEND: {
Scott Michel1a6cdb62008-12-01 17:56:02 +00002887 if (Op0.getOpcode() == SPUISD::VEC2PREFSLOT && NodeVT == Op0VT) {
Scott Michela59d4692008-02-23 18:41:37 +00002888 // (any_extend (SPUextract_elt0 <arg>)) ->
2889 // (SPUextract_elt0 <arg>)
2890 // Types must match, however...
Scott Michel23f2ff72008-12-04 17:16:59 +00002891#if !defined(NDEBUG)
2892 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
Scott Michel30ee7df2008-12-04 03:02:42 +00002893 cerr << "\nReplace: ";
2894 N->dump(&DAG);
2895 cerr << "\nWith: ";
2896 Op0.getNode()->dump(&DAG);
2897 cerr << "\n";
Scott Michel23f2ff72008-12-04 17:16:59 +00002898 }
Scott Michel30ee7df2008-12-04 03:02:42 +00002899#endif
Scott Michela59d4692008-02-23 18:41:37 +00002900
2901 return Op0;
2902 }
2903 break;
2904 }
2905 case SPUISD::IndirectAddr: {
2906 if (!ST->usingLargeMem() && Op0.getOpcode() == SPUISD::AFormAddr) {
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002907 ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N->getOperand(1));
2908 if (CN != 0 && CN->getZExtValue() == 0) {
Scott Michela59d4692008-02-23 18:41:37 +00002909 // (SPUindirect (SPUaform <addr>, 0), 0) ->
2910 // (SPUaform <addr>, 0)
2911
2912 DEBUG(cerr << "Replace: ");
2913 DEBUG(N->dump(&DAG));
2914 DEBUG(cerr << "\nWith: ");
Gabor Greifba36cb52008-08-28 21:40:38 +00002915 DEBUG(Op0.getNode()->dump(&DAG));
Scott Michela59d4692008-02-23 18:41:37 +00002916 DEBUG(cerr << "\n");
2917
2918 return Op0;
2919 }
Scott Michelf0569be2008-12-27 04:51:36 +00002920 } else if (Op0.getOpcode() == ISD::ADD) {
2921 SDValue Op1 = N->getOperand(1);
2922 if (ConstantSDNode *CN1 = dyn_cast<ConstantSDNode>(Op1)) {
2923 // (SPUindirect (add <arg>, <arg>), 0) ->
2924 // (SPUindirect <arg>, <arg>)
2925 if (CN1->isNullValue()) {
2926
2927#if !defined(NDEBUG)
2928 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
2929 cerr << "\n"
2930 << "Replace: (SPUindirect (add <arg>, <arg>), 0)\n"
2931 << "With: (SPUindirect <arg>, <arg>)\n";
2932 }
2933#endif
2934
Dale Johannesende064702009-02-06 21:50:26 +00002935 return DAG.getNode(SPUISD::IndirectAddr, dl, Op0VT,
Scott Michelf0569be2008-12-27 04:51:36 +00002936 Op0.getOperand(0), Op0.getOperand(1));
2937 }
2938 }
Scott Michela59d4692008-02-23 18:41:37 +00002939 }
2940 break;
2941 }
2942 case SPUISD::SHLQUAD_L_BITS:
2943 case SPUISD::SHLQUAD_L_BYTES:
2944 case SPUISD::VEC_SHL:
2945 case SPUISD::VEC_SRL:
2946 case SPUISD::VEC_SRA:
Scott Michelf0569be2008-12-27 04:51:36 +00002947 case SPUISD::ROTBYTES_LEFT: {
Dan Gohman475871a2008-07-27 21:46:04 +00002948 SDValue Op1 = N->getOperand(1);
Scott Michela59d4692008-02-23 18:41:37 +00002949
Scott Michelf0569be2008-12-27 04:51:36 +00002950 // Kill degenerate vector shifts:
2951 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(Op1)) {
2952 if (CN->isNullValue()) {
Scott Michela59d4692008-02-23 18:41:37 +00002953 Result = Op0;
2954 }
2955 }
2956 break;
2957 }
Scott Michelf0569be2008-12-27 04:51:36 +00002958 case SPUISD::PREFSLOT2VEC: {
Scott Michela59d4692008-02-23 18:41:37 +00002959 switch (Op0.getOpcode()) {
2960 default:
2961 break;
2962 case ISD::ANY_EXTEND:
2963 case ISD::ZERO_EXTEND:
2964 case ISD::SIGN_EXTEND: {
Scott Michel1df30c42008-12-29 03:23:36 +00002965 // (SPUprefslot2vec (any|zero|sign_extend (SPUvec2prefslot <arg>))) ->
Scott Michela59d4692008-02-23 18:41:37 +00002966 // <arg>
Scott Michel1df30c42008-12-29 03:23:36 +00002967 // but only if the SPUprefslot2vec and <arg> types match.
Dan Gohman475871a2008-07-27 21:46:04 +00002968 SDValue Op00 = Op0.getOperand(0);
Scott Michel104de432008-11-24 17:11:17 +00002969 if (Op00.getOpcode() == SPUISD::VEC2PREFSLOT) {
Dan Gohman475871a2008-07-27 21:46:04 +00002970 SDValue Op000 = Op00.getOperand(0);
Scott Michel1a6cdb62008-12-01 17:56:02 +00002971 if (Op000.getValueType() == NodeVT) {
Scott Michela59d4692008-02-23 18:41:37 +00002972 Result = Op000;
2973 }
2974 }
2975 break;
2976 }
Scott Michel104de432008-11-24 17:11:17 +00002977 case SPUISD::VEC2PREFSLOT: {
Scott Michel1df30c42008-12-29 03:23:36 +00002978 // (SPUprefslot2vec (SPUvec2prefslot <arg>)) ->
Scott Michela59d4692008-02-23 18:41:37 +00002979 // <arg>
2980 Result = Op0.getOperand(0);
2981 break;
Scott Michel5af8f0e2008-07-16 17:17:29 +00002982 }
Scott Michela59d4692008-02-23 18:41:37 +00002983 }
2984 break;
Scott Michel053c1da2008-01-29 02:16:57 +00002985 }
2986 }
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002987
Scott Michel58c58182008-01-17 20:38:41 +00002988 // Otherwise, return unchanged.
Scott Michel1a6cdb62008-12-01 17:56:02 +00002989#ifndef NDEBUG
Gabor Greifba36cb52008-08-28 21:40:38 +00002990 if (Result.getNode()) {
Scott Michela59d4692008-02-23 18:41:37 +00002991 DEBUG(cerr << "\nReplace.SPU: ");
2992 DEBUG(N->dump(&DAG));
2993 DEBUG(cerr << "\nWith: ");
Gabor Greifba36cb52008-08-28 21:40:38 +00002994 DEBUG(Result.getNode()->dump(&DAG));
Scott Michela59d4692008-02-23 18:41:37 +00002995 DEBUG(cerr << "\n");
2996 }
2997#endif
2998
2999 return Result;
Scott Michel266bc8f2007-12-04 22:23:35 +00003000}
3001
3002//===----------------------------------------------------------------------===//
3003// Inline Assembly Support
3004//===----------------------------------------------------------------------===//
3005
3006/// getConstraintType - Given a constraint letter, return the type of
3007/// constraint it is for this target.
Scott Michel5af8f0e2008-07-16 17:17:29 +00003008SPUTargetLowering::ConstraintType
Scott Michel266bc8f2007-12-04 22:23:35 +00003009SPUTargetLowering::getConstraintType(const std::string &ConstraintLetter) const {
3010 if (ConstraintLetter.size() == 1) {
3011 switch (ConstraintLetter[0]) {
3012 default: break;
3013 case 'b':
3014 case 'r':
3015 case 'f':
3016 case 'v':
3017 case 'y':
3018 return C_RegisterClass;
Scott Michel5af8f0e2008-07-16 17:17:29 +00003019 }
Scott Michel266bc8f2007-12-04 22:23:35 +00003020 }
3021 return TargetLowering::getConstraintType(ConstraintLetter);
3022}
3023
Scott Michel5af8f0e2008-07-16 17:17:29 +00003024std::pair<unsigned, const TargetRegisterClass*>
Scott Michel266bc8f2007-12-04 22:23:35 +00003025SPUTargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
Duncan Sands83ec4b62008-06-06 12:08:01 +00003026 MVT VT) const
Scott Michel266bc8f2007-12-04 22:23:35 +00003027{
3028 if (Constraint.size() == 1) {
3029 // GCC RS6000 Constraint Letters
3030 switch (Constraint[0]) {
3031 case 'b': // R1-R31
3032 case 'r': // R0-R31
3033 if (VT == MVT::i64)
3034 return std::make_pair(0U, SPU::R64CRegisterClass);
3035 return std::make_pair(0U, SPU::R32CRegisterClass);
3036 case 'f':
3037 if (VT == MVT::f32)
3038 return std::make_pair(0U, SPU::R32FPRegisterClass);
3039 else if (VT == MVT::f64)
3040 return std::make_pair(0U, SPU::R64FPRegisterClass);
3041 break;
Scott Michel5af8f0e2008-07-16 17:17:29 +00003042 case 'v':
Scott Michel266bc8f2007-12-04 22:23:35 +00003043 return std::make_pair(0U, SPU::GPRCRegisterClass);
3044 }
3045 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00003046
Scott Michel266bc8f2007-12-04 22:23:35 +00003047 return TargetLowering::getRegForInlineAsmConstraint(Constraint, VT);
3048}
3049
Scott Michela59d4692008-02-23 18:41:37 +00003050//! Compute used/known bits for a SPU operand
Scott Michel266bc8f2007-12-04 22:23:35 +00003051void
Dan Gohman475871a2008-07-27 21:46:04 +00003052SPUTargetLowering::computeMaskedBitsForTargetNode(const SDValue Op,
Dan Gohman977a76f2008-02-13 22:28:48 +00003053 const APInt &Mask,
Scott Michel5af8f0e2008-07-16 17:17:29 +00003054 APInt &KnownZero,
Dan Gohmanfd29e0e2008-02-13 00:35:47 +00003055 APInt &KnownOne,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00003056 const SelectionDAG &DAG,
3057 unsigned Depth ) const {
Scott Michel203b2d62008-04-30 00:30:08 +00003058#if 0
Scott Michela59d4692008-02-23 18:41:37 +00003059 const uint64_t uint64_sizebits = sizeof(uint64_t) * 8;
3060
3061 switch (Op.getOpcode()) {
3062 default:
3063 // KnownZero = KnownOne = APInt(Mask.getBitWidth(), 0);
3064 break;
Scott Michela59d4692008-02-23 18:41:37 +00003065 case CALL:
3066 case SHUFB:
Scott Michel7a1c9e92008-11-22 23:50:42 +00003067 case SHUFFLE_MASK:
Scott Michela59d4692008-02-23 18:41:37 +00003068 case CNTB:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00003069 case SPUISD::PREFSLOT2VEC:
Scott Michela59d4692008-02-23 18:41:37 +00003070 case SPUISD::LDRESULT:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00003071 case SPUISD::VEC2PREFSLOT:
Scott Michel203b2d62008-04-30 00:30:08 +00003072 case SPUISD::SHLQUAD_L_BITS:
3073 case SPUISD::SHLQUAD_L_BYTES:
3074 case SPUISD::VEC_SHL:
3075 case SPUISD::VEC_SRL:
3076 case SPUISD::VEC_SRA:
3077 case SPUISD::VEC_ROTL:
3078 case SPUISD::VEC_ROTR:
Scott Michel203b2d62008-04-30 00:30:08 +00003079 case SPUISD::ROTBYTES_LEFT:
Scott Michel8bf61e82008-06-02 22:18:03 +00003080 case SPUISD::SELECT_MASK:
3081 case SPUISD::SELB:
Scott Michela59d4692008-02-23 18:41:37 +00003082 }
Scott Micheld1e8d9c2009-01-21 04:58:48 +00003083#endif
Scott Michel266bc8f2007-12-04 22:23:35 +00003084}
Scott Michel02d711b2008-12-30 23:28:25 +00003085
Scott Michelf0569be2008-12-27 04:51:36 +00003086unsigned
3087SPUTargetLowering::ComputeNumSignBitsForTargetNode(SDValue Op,
3088 unsigned Depth) const {
3089 switch (Op.getOpcode()) {
3090 default:
3091 return 1;
Scott Michel266bc8f2007-12-04 22:23:35 +00003092
Scott Michelf0569be2008-12-27 04:51:36 +00003093 case ISD::SETCC: {
3094 MVT VT = Op.getValueType();
3095
3096 if (VT != MVT::i8 && VT != MVT::i16 && VT != MVT::i32) {
3097 VT = MVT::i32;
3098 }
3099 return VT.getSizeInBits();
3100 }
3101 }
3102}
Scott Michel1df30c42008-12-29 03:23:36 +00003103
Scott Michel203b2d62008-04-30 00:30:08 +00003104// LowerAsmOperandForConstraint
3105void
Dan Gohman475871a2008-07-27 21:46:04 +00003106SPUTargetLowering::LowerAsmOperandForConstraint(SDValue Op,
Scott Michel203b2d62008-04-30 00:30:08 +00003107 char ConstraintLetter,
Evan Chengda43bcf2008-09-24 00:05:32 +00003108 bool hasMemory,
Dan Gohman475871a2008-07-27 21:46:04 +00003109 std::vector<SDValue> &Ops,
Scott Michel203b2d62008-04-30 00:30:08 +00003110 SelectionDAG &DAG) const {
3111 // Default, for the time being, to the base class handler
Evan Chengda43bcf2008-09-24 00:05:32 +00003112 TargetLowering::LowerAsmOperandForConstraint(Op, ConstraintLetter, hasMemory,
3113 Ops, DAG);
Scott Michel203b2d62008-04-30 00:30:08 +00003114}
3115
Scott Michel266bc8f2007-12-04 22:23:35 +00003116/// isLegalAddressImmediate - Return true if the integer value can be used
3117/// as the offset of the target addressing mode.
Gabor Greif93c53e52008-08-31 15:37:04 +00003118bool SPUTargetLowering::isLegalAddressImmediate(int64_t V,
3119 const Type *Ty) const {
Scott Michel266bc8f2007-12-04 22:23:35 +00003120 // SPU's addresses are 256K:
3121 return (V > -(1 << 18) && V < (1 << 18) - 1);
3122}
3123
3124bool SPUTargetLowering::isLegalAddressImmediate(llvm::GlobalValue* GV) const {
Scott Michel5af8f0e2008-07-16 17:17:29 +00003125 return false;
Scott Michel266bc8f2007-12-04 22:23:35 +00003126}
Dan Gohman6520e202008-10-18 02:06:02 +00003127
3128bool
3129SPUTargetLowering::isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const {
3130 // The SPU target isn't yet aware of offsets.
3131 return false;
3132}