blob: 0596a59015231d5fd63ac9fa5ae6d52e5930d674 [file] [log] [blame]
Scott Michel266bc8f2007-12-04 22:23:35 +00001//===-- SPUISelLowering.cpp - Cell SPU DAG Lowering Implementation --------===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner4ee451d2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Scott Michel266bc8f2007-12-04 22:23:35 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This file implements the SPUTargetLowering class.
11//
12//===----------------------------------------------------------------------===//
13
14#include "SPURegisterNames.h"
15#include "SPUISelLowering.h"
16#include "SPUTargetMachine.h"
Scott Michel203b2d62008-04-30 00:30:08 +000017#include "SPUFrameInfo.h"
Scott Michelf0569be2008-12-27 04:51:36 +000018#include "llvm/ADT/APInt.h"
Scott Michel266bc8f2007-12-04 22:23:35 +000019#include "llvm/ADT/VectorExtras.h"
Scott Michelc9c8b2a2009-01-26 03:31:40 +000020#include "llvm/CallingConv.h"
Scott Michel266bc8f2007-12-04 22:23:35 +000021#include "llvm/CodeGen/CallingConvLower.h"
22#include "llvm/CodeGen/MachineFrameInfo.h"
23#include "llvm/CodeGen/MachineFunction.h"
24#include "llvm/CodeGen/MachineInstrBuilder.h"
Chris Lattner84bc5422007-12-31 04:13:23 +000025#include "llvm/CodeGen/MachineRegisterInfo.h"
Scott Michel266bc8f2007-12-04 22:23:35 +000026#include "llvm/CodeGen/SelectionDAG.h"
Scott Michel266bc8f2007-12-04 22:23:35 +000027#include "llvm/Constants.h"
28#include "llvm/Function.h"
29#include "llvm/Intrinsics.h"
30#include "llvm/Support/Debug.h"
31#include "llvm/Support/MathExtras.h"
32#include "llvm/Target/TargetOptions.h"
33
34#include <map>
35
36using namespace llvm;
37
38// Used in getTargetNodeName() below
39namespace {
40 std::map<unsigned, const char *> node_names;
41
Duncan Sands83ec4b62008-06-06 12:08:01 +000042 //! MVT mapping to useful data for Cell SPU
Scott Michel266bc8f2007-12-04 22:23:35 +000043 struct valtype_map_s {
Scott Michel7a1c9e92008-11-22 23:50:42 +000044 const MVT valtype;
45 const int prefslot_byte;
Scott Michel266bc8f2007-12-04 22:23:35 +000046 };
Scott Michel5af8f0e2008-07-16 17:17:29 +000047
Scott Michel266bc8f2007-12-04 22:23:35 +000048 const valtype_map_s valtype_map[] = {
49 { MVT::i1, 3 },
50 { MVT::i8, 3 },
51 { MVT::i16, 2 },
52 { MVT::i32, 0 },
53 { MVT::f32, 0 },
54 { MVT::i64, 0 },
55 { MVT::f64, 0 },
56 { MVT::i128, 0 }
57 };
58
59 const size_t n_valtype_map = sizeof(valtype_map) / sizeof(valtype_map[0]);
60
Duncan Sands83ec4b62008-06-06 12:08:01 +000061 const valtype_map_s *getValueTypeMapEntry(MVT VT) {
Scott Michel266bc8f2007-12-04 22:23:35 +000062 const valtype_map_s *retval = 0;
63
64 for (size_t i = 0; i < n_valtype_map; ++i) {
65 if (valtype_map[i].valtype == VT) {
Scott Michel7f9ba9b2008-01-30 02:55:46 +000066 retval = valtype_map + i;
67 break;
Scott Michel266bc8f2007-12-04 22:23:35 +000068 }
69 }
70
71#ifndef NDEBUG
72 if (retval == 0) {
73 cerr << "getValueTypeMapEntry returns NULL for "
Duncan Sands83ec4b62008-06-06 12:08:01 +000074 << VT.getMVTString()
Scott Michel7f9ba9b2008-01-30 02:55:46 +000075 << "\n";
Scott Michel266bc8f2007-12-04 22:23:35 +000076 abort();
77 }
78#endif
79
80 return retval;
81 }
Scott Michel94bd57e2009-01-15 04:41:47 +000082
Scott Michelc9c8b2a2009-01-26 03:31:40 +000083 //! Expand a library call into an actual call DAG node
84 /*!
85 \note
86 This code is taken from SelectionDAGLegalize, since it is not exposed as
87 part of the LLVM SelectionDAG API.
88 */
89
90 SDValue
91 ExpandLibCall(RTLIB::Libcall LC, SDValue Op, SelectionDAG &DAG,
92 bool isSigned, SDValue &Hi, SPUTargetLowering &TLI) {
93 // The input chain to this libcall is the entry node of the function.
94 // Legalizing the call will automatically add the previous call to the
95 // dependence.
96 SDValue InChain = DAG.getEntryNode();
97
98 TargetLowering::ArgListTy Args;
99 TargetLowering::ArgListEntry Entry;
100 for (unsigned i = 0, e = Op.getNumOperands(); i != e; ++i) {
101 MVT ArgVT = Op.getOperand(i).getValueType();
102 const Type *ArgTy = ArgVT.getTypeForMVT();
103 Entry.Node = Op.getOperand(i);
104 Entry.Ty = ArgTy;
105 Entry.isSExt = isSigned;
106 Entry.isZExt = !isSigned;
107 Args.push_back(Entry);
108 }
109 SDValue Callee = DAG.getExternalSymbol(TLI.getLibcallName(LC),
110 TLI.getPointerTy());
111
112 // Splice the libcall in wherever FindInputOutputChains tells us to.
113 const Type *RetTy = Op.getNode()->getValueType(0).getTypeForMVT();
114 std::pair<SDValue, SDValue> CallInfo =
115 TLI.LowerCallTo(InChain, RetTy, isSigned, !isSigned, false, false,
Dale Johannesen7d2ad622009-01-30 23:10:59 +0000116 CallingConv::C, false, Callee, Args, DAG,
117 Op.getNode()->getDebugLoc());
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000118
119 return CallInfo.first;
120 }
Scott Michel266bc8f2007-12-04 22:23:35 +0000121}
122
123SPUTargetLowering::SPUTargetLowering(SPUTargetMachine &TM)
124 : TargetLowering(TM),
125 SPUTM(TM)
126{
127 // Fold away setcc operations if possible.
128 setPow2DivIsCheap();
129
130 // Use _setjmp/_longjmp instead of setjmp/longjmp.
131 setUseUnderscoreSetJmp(true);
132 setUseUnderscoreLongJmp(true);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000133
Scott Micheld1e8d9c2009-01-21 04:58:48 +0000134 // Set RTLIB libcall names as used by SPU:
135 setLibcallName(RTLIB::DIV_F64, "__fast_divdf3");
136
Scott Michel266bc8f2007-12-04 22:23:35 +0000137 // Set up the SPU's register classes:
Scott Michel504c3692007-12-17 22:32:34 +0000138 addRegisterClass(MVT::i8, SPU::R8CRegisterClass);
139 addRegisterClass(MVT::i16, SPU::R16CRegisterClass);
140 addRegisterClass(MVT::i32, SPU::R32CRegisterClass);
141 addRegisterClass(MVT::i64, SPU::R64CRegisterClass);
142 addRegisterClass(MVT::f32, SPU::R32FPRegisterClass);
143 addRegisterClass(MVT::f64, SPU::R64FPRegisterClass);
Scott Michel266bc8f2007-12-04 22:23:35 +0000144 addRegisterClass(MVT::i128, SPU::GPRCRegisterClass);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000145
Scott Michel266bc8f2007-12-04 22:23:35 +0000146 // SPU has no sign or zero extended loads for i1, i8, i16:
Evan Cheng03294662008-10-14 21:26:46 +0000147 setLoadExtAction(ISD::EXTLOAD, MVT::i1, Promote);
148 setLoadExtAction(ISD::SEXTLOAD, MVT::i1, Promote);
149 setLoadExtAction(ISD::ZEXTLOAD, MVT::i1, Promote);
Scott Michel266bc8f2007-12-04 22:23:35 +0000150
Scott Michelf0569be2008-12-27 04:51:36 +0000151 setLoadExtAction(ISD::EXTLOAD, MVT::f32, Expand);
152 setLoadExtAction(ISD::EXTLOAD, MVT::f64, Expand);
Scott Michelb30e8f62008-12-02 19:53:53 +0000153
Scott Michel266bc8f2007-12-04 22:23:35 +0000154 // SPU constant load actions are custom lowered:
Nate Begemanccef5802008-02-14 18:43:04 +0000155 setOperationAction(ISD::ConstantFP, MVT::f32, Legal);
Scott Michel266bc8f2007-12-04 22:23:35 +0000156 setOperationAction(ISD::ConstantFP, MVT::f64, Custom);
157
158 // SPU's loads and stores have to be custom lowered:
Scott Micheldd950092009-01-06 03:36:14 +0000159 for (unsigned sctype = (unsigned) MVT::i8; sctype < (unsigned) MVT::i128;
Scott Michel266bc8f2007-12-04 22:23:35 +0000160 ++sctype) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000161 MVT VT = (MVT::SimpleValueType)sctype;
162
Scott Michelf0569be2008-12-27 04:51:36 +0000163 setOperationAction(ISD::LOAD, VT, Custom);
164 setOperationAction(ISD::STORE, VT, Custom);
165 setLoadExtAction(ISD::EXTLOAD, VT, Custom);
166 setLoadExtAction(ISD::ZEXTLOAD, VT, Custom);
167 setLoadExtAction(ISD::SEXTLOAD, VT, Custom);
168
169 for (unsigned stype = sctype - 1; stype >= (unsigned) MVT::i8; --stype) {
170 MVT StoreVT = (MVT::SimpleValueType) stype;
171 setTruncStoreAction(VT, StoreVT, Expand);
172 }
Scott Michel266bc8f2007-12-04 22:23:35 +0000173 }
174
Scott Michelf0569be2008-12-27 04:51:36 +0000175 for (unsigned sctype = (unsigned) MVT::f32; sctype < (unsigned) MVT::f64;
176 ++sctype) {
177 MVT VT = (MVT::SimpleValueType) sctype;
178
179 setOperationAction(ISD::LOAD, VT, Custom);
180 setOperationAction(ISD::STORE, VT, Custom);
181
182 for (unsigned stype = sctype - 1; stype >= (unsigned) MVT::f32; --stype) {
183 MVT StoreVT = (MVT::SimpleValueType) stype;
184 setTruncStoreAction(VT, StoreVT, Expand);
185 }
186 }
187
Scott Michel266bc8f2007-12-04 22:23:35 +0000188 // Expand the jumptable branches
189 setOperationAction(ISD::BR_JT, MVT::Other, Expand);
190 setOperationAction(ISD::BR_CC, MVT::Other, Expand);
Scott Michel7a1c9e92008-11-22 23:50:42 +0000191
192 // Custom lower SELECT_CC for most cases, but expand by default
Scott Michel5af8f0e2008-07-16 17:17:29 +0000193 setOperationAction(ISD::SELECT_CC, MVT::Other, Expand);
Scott Michel7a1c9e92008-11-22 23:50:42 +0000194 setOperationAction(ISD::SELECT_CC, MVT::i8, Custom);
195 setOperationAction(ISD::SELECT_CC, MVT::i16, Custom);
196 setOperationAction(ISD::SELECT_CC, MVT::i32, Custom);
197 setOperationAction(ISD::SELECT_CC, MVT::i64, Custom);
Scott Michel266bc8f2007-12-04 22:23:35 +0000198
199 // SPU has no intrinsics for these particular operations:
Andrew Lenharthd497d9f2008-02-16 14:46:26 +0000200 setOperationAction(ISD::MEMBARRIER, MVT::Other, Expand);
201
Scott Michelf0569be2008-12-27 04:51:36 +0000202 // SPU has no SREM/UREM instructions
Scott Michel266bc8f2007-12-04 22:23:35 +0000203 setOperationAction(ISD::SREM, MVT::i32, Expand);
204 setOperationAction(ISD::UREM, MVT::i32, Expand);
205 setOperationAction(ISD::SREM, MVT::i64, Expand);
206 setOperationAction(ISD::UREM, MVT::i64, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000207
Scott Michel266bc8f2007-12-04 22:23:35 +0000208 // We don't support sin/cos/sqrt/fmod
209 setOperationAction(ISD::FSIN , MVT::f64, Expand);
210 setOperationAction(ISD::FCOS , MVT::f64, Expand);
211 setOperationAction(ISD::FREM , MVT::f64, Expand);
212 setOperationAction(ISD::FSIN , MVT::f32, Expand);
213 setOperationAction(ISD::FCOS , MVT::f32, Expand);
214 setOperationAction(ISD::FREM , MVT::f32, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000215
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000216 // Expand fsqrt to the appropriate libcall (NOTE: should use h/w fsqrt
217 // for f32!)
Scott Michel266bc8f2007-12-04 22:23:35 +0000218 setOperationAction(ISD::FSQRT, MVT::f64, Expand);
219 setOperationAction(ISD::FSQRT, MVT::f32, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000220
Scott Michel266bc8f2007-12-04 22:23:35 +0000221 setOperationAction(ISD::FCOPYSIGN, MVT::f64, Expand);
222 setOperationAction(ISD::FCOPYSIGN, MVT::f32, Expand);
223
224 // SPU can do rotate right and left, so legalize it... but customize for i8
225 // because instructions don't exist.
Bill Wendling9440e352008-08-31 02:59:23 +0000226
227 // FIXME: Change from "expand" to appropriate type once ROTR is supported in
228 // .td files.
229 setOperationAction(ISD::ROTR, MVT::i32, Expand /*Legal*/);
230 setOperationAction(ISD::ROTR, MVT::i16, Expand /*Legal*/);
231 setOperationAction(ISD::ROTR, MVT::i8, Expand /*Custom*/);
232
Scott Michel266bc8f2007-12-04 22:23:35 +0000233 setOperationAction(ISD::ROTL, MVT::i32, Legal);
234 setOperationAction(ISD::ROTL, MVT::i16, Legal);
235 setOperationAction(ISD::ROTL, MVT::i8, Custom);
Scott Micheldc91bea2008-11-20 16:36:33 +0000236
Scott Michel266bc8f2007-12-04 22:23:35 +0000237 // SPU has no native version of shift left/right for i8
238 setOperationAction(ISD::SHL, MVT::i8, Custom);
239 setOperationAction(ISD::SRL, MVT::i8, Custom);
240 setOperationAction(ISD::SRA, MVT::i8, Custom);
Scott Michel9c0c6b22008-11-21 02:56:16 +0000241
Scott Michel02d711b2008-12-30 23:28:25 +0000242 // Make these operations legal and handle them during instruction selection:
243 setOperationAction(ISD::SHL, MVT::i64, Legal);
244 setOperationAction(ISD::SRL, MVT::i64, Legal);
245 setOperationAction(ISD::SRA, MVT::i64, Legal);
Scott Michel266bc8f2007-12-04 22:23:35 +0000246
Scott Michel5af8f0e2008-07-16 17:17:29 +0000247 // Custom lower i8, i32 and i64 multiplications
248 setOperationAction(ISD::MUL, MVT::i8, Custom);
Scott Michel1df30c42008-12-29 03:23:36 +0000249 setOperationAction(ISD::MUL, MVT::i32, Legal);
Scott Michel94bd57e2009-01-15 04:41:47 +0000250 setOperationAction(ISD::MUL, MVT::i64, Legal);
Scott Michel9c0c6b22008-11-21 02:56:16 +0000251
Scott Michel8bf61e82008-06-02 22:18:03 +0000252 // Need to custom handle (some) common i8, i64 math ops
Scott Michel02d711b2008-12-30 23:28:25 +0000253 setOperationAction(ISD::ADD, MVT::i8, Custom);
Scott Michel94bd57e2009-01-15 04:41:47 +0000254 setOperationAction(ISD::ADD, MVT::i64, Legal);
Scott Michel266bc8f2007-12-04 22:23:35 +0000255 setOperationAction(ISD::SUB, MVT::i8, Custom);
Scott Michel94bd57e2009-01-15 04:41:47 +0000256 setOperationAction(ISD::SUB, MVT::i64, Legal);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000257
Scott Michel266bc8f2007-12-04 22:23:35 +0000258 // SPU does not have BSWAP. It does have i32 support CTLZ.
259 // CTPOP has to be custom lowered.
260 setOperationAction(ISD::BSWAP, MVT::i32, Expand);
261 setOperationAction(ISD::BSWAP, MVT::i64, Expand);
262
263 setOperationAction(ISD::CTPOP, MVT::i8, Custom);
264 setOperationAction(ISD::CTPOP, MVT::i16, Custom);
265 setOperationAction(ISD::CTPOP, MVT::i32, Custom);
266 setOperationAction(ISD::CTPOP, MVT::i64, Custom);
267
268 setOperationAction(ISD::CTTZ , MVT::i32, Expand);
269 setOperationAction(ISD::CTTZ , MVT::i64, Expand);
270
271 setOperationAction(ISD::CTLZ , MVT::i32, Legal);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000272
Scott Michel8bf61e82008-06-02 22:18:03 +0000273 // SPU has a version of select that implements (a&~c)|(b&c), just like
Scott Michel405fba12008-03-10 23:49:09 +0000274 // select ought to work:
Scott Michel78c47fa2008-03-10 16:58:52 +0000275 setOperationAction(ISD::SELECT, MVT::i8, Legal);
Scott Michelad2715e2008-03-05 23:02:02 +0000276 setOperationAction(ISD::SELECT, MVT::i16, Legal);
277 setOperationAction(ISD::SELECT, MVT::i32, Legal);
Scott Michelf0569be2008-12-27 04:51:36 +0000278 setOperationAction(ISD::SELECT, MVT::i64, Legal);
Scott Michel266bc8f2007-12-04 22:23:35 +0000279
Scott Michel78c47fa2008-03-10 16:58:52 +0000280 setOperationAction(ISD::SETCC, MVT::i8, Legal);
281 setOperationAction(ISD::SETCC, MVT::i16, Legal);
Scott Michel1df30c42008-12-29 03:23:36 +0000282 setOperationAction(ISD::SETCC, MVT::i32, Legal);
283 setOperationAction(ISD::SETCC, MVT::i64, Legal);
Scott Micheld1e8d9c2009-01-21 04:58:48 +0000284 setOperationAction(ISD::SETCC, MVT::f64, Custom);
Scott Michelad2715e2008-03-05 23:02:02 +0000285
Scott Michelf0569be2008-12-27 04:51:36 +0000286 // Custom lower i128 -> i64 truncates
Scott Michelb30e8f62008-12-02 19:53:53 +0000287 setOperationAction(ISD::TRUNCATE, MVT::i64, Custom);
288
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000289 // SPU has a legal FP -> signed INT instruction for f32, but for f64, need
290 // to expand to a libcall, hence the custom lowering:
291 setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom);
292 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Custom);
Scott Michel266bc8f2007-12-04 22:23:35 +0000293
294 // FDIV on SPU requires custom lowering
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000295 setOperationAction(ISD::FDIV, MVT::f64, Expand); // to libcall
Scott Michel266bc8f2007-12-04 22:23:35 +0000296
Scott Michel9de57a92009-01-26 22:33:37 +0000297 // SPU has [U|S]INT_TO_FP for f32->i32, but not for f64->i32, f64->i64:
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000298 setOperationAction(ISD::SINT_TO_FP, MVT::i32, Custom);
Scott Michel266bc8f2007-12-04 22:23:35 +0000299 setOperationAction(ISD::SINT_TO_FP, MVT::i16, Promote);
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000300 setOperationAction(ISD::SINT_TO_FP, MVT::i8, Promote);
301 setOperationAction(ISD::UINT_TO_FP, MVT::i32, Custom);
Scott Michel266bc8f2007-12-04 22:23:35 +0000302 setOperationAction(ISD::UINT_TO_FP, MVT::i16, Promote);
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000303 setOperationAction(ISD::UINT_TO_FP, MVT::i8, Promote);
Scott Michel266bc8f2007-12-04 22:23:35 +0000304 setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
305 setOperationAction(ISD::UINT_TO_FP, MVT::i64, Custom);
306
Scott Michel86c041f2007-12-20 00:44:13 +0000307 setOperationAction(ISD::BIT_CONVERT, MVT::i32, Legal);
308 setOperationAction(ISD::BIT_CONVERT, MVT::f32, Legal);
309 setOperationAction(ISD::BIT_CONVERT, MVT::i64, Legal);
310 setOperationAction(ISD::BIT_CONVERT, MVT::f64, Legal);
Scott Michel266bc8f2007-12-04 22:23:35 +0000311
312 // We cannot sextinreg(i1). Expand to shifts.
313 setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000314
Scott Michel266bc8f2007-12-04 22:23:35 +0000315 // Support label based line numbers.
Dan Gohman7f460202008-06-30 20:59:49 +0000316 setOperationAction(ISD::DBG_STOPPOINT, MVT::Other, Expand);
Scott Michel266bc8f2007-12-04 22:23:35 +0000317 setOperationAction(ISD::DEBUG_LOC, MVT::Other, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000318
319 // We want to legalize GlobalAddress and ConstantPool nodes into the
Scott Michel266bc8f2007-12-04 22:23:35 +0000320 // appropriate instructions to materialize the address.
Scott Michel9c0c6b22008-11-21 02:56:16 +0000321 for (unsigned sctype = (unsigned) MVT::i8; sctype < (unsigned) MVT::f128;
Scott Michel053c1da2008-01-29 02:16:57 +0000322 ++sctype) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000323 MVT VT = (MVT::SimpleValueType)sctype;
324
Scott Michel1df30c42008-12-29 03:23:36 +0000325 setOperationAction(ISD::GlobalAddress, VT, Custom);
326 setOperationAction(ISD::ConstantPool, VT, Custom);
327 setOperationAction(ISD::JumpTable, VT, Custom);
Scott Michel053c1da2008-01-29 02:16:57 +0000328 }
Scott Michel266bc8f2007-12-04 22:23:35 +0000329
330 // RET must be custom lowered, to meet ABI requirements
331 setOperationAction(ISD::RET, MVT::Other, Custom);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000332
Scott Michel266bc8f2007-12-04 22:23:35 +0000333 // VASTART needs to be custom lowered to use the VarArgsFrameIndex
334 setOperationAction(ISD::VASTART , MVT::Other, Custom);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000335
Scott Michel266bc8f2007-12-04 22:23:35 +0000336 // Use the default implementation.
337 setOperationAction(ISD::VAARG , MVT::Other, Expand);
338 setOperationAction(ISD::VACOPY , MVT::Other, Expand);
339 setOperationAction(ISD::VAEND , MVT::Other, Expand);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000340 setOperationAction(ISD::STACKSAVE , MVT::Other, Expand);
Scott Michel266bc8f2007-12-04 22:23:35 +0000341 setOperationAction(ISD::STACKRESTORE , MVT::Other, Expand);
342 setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i32 , Expand);
343 setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i64 , Expand);
344
345 // Cell SPU has instructions for converting between i64 and fp.
346 setOperationAction(ISD::FP_TO_SINT, MVT::i64, Custom);
347 setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000348
Scott Michel266bc8f2007-12-04 22:23:35 +0000349 // To take advantage of the above i64 FP_TO_SINT, promote i32 FP_TO_UINT
350 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Promote);
351
352 // BUILD_PAIR can't be handled natively, and should be expanded to shl/or
353 setOperationAction(ISD::BUILD_PAIR, MVT::i64, Expand);
354
355 // First set operation action for all vector types to expand. Then we
356 // will selectively turn on ones that can be effectively codegen'd.
357 addRegisterClass(MVT::v16i8, SPU::VECREGRegisterClass);
358 addRegisterClass(MVT::v8i16, SPU::VECREGRegisterClass);
359 addRegisterClass(MVT::v4i32, SPU::VECREGRegisterClass);
360 addRegisterClass(MVT::v2i64, SPU::VECREGRegisterClass);
361 addRegisterClass(MVT::v4f32, SPU::VECREGRegisterClass);
362 addRegisterClass(MVT::v2f64, SPU::VECREGRegisterClass);
363
Scott Michel21213e72009-01-06 23:10:38 +0000364 // "Odd size" vector classes that we're willing to support:
365 addRegisterClass(MVT::v2i32, SPU::VECREGRegisterClass);
366
Duncan Sands83ec4b62008-06-06 12:08:01 +0000367 for (unsigned i = (unsigned)MVT::FIRST_VECTOR_VALUETYPE;
368 i <= (unsigned)MVT::LAST_VECTOR_VALUETYPE; ++i) {
369 MVT VT = (MVT::SimpleValueType)i;
Scott Michel266bc8f2007-12-04 22:23:35 +0000370
Duncan Sands83ec4b62008-06-06 12:08:01 +0000371 // add/sub are legal for all supported vector VT's.
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000372 setOperationAction(ISD::ADD, VT, Legal);
373 setOperationAction(ISD::SUB, VT, Legal);
Duncan Sands83ec4b62008-06-06 12:08:01 +0000374 // mul has to be custom lowered.
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000375 setOperationAction(ISD::MUL, VT, Legal);
Duncan Sands83ec4b62008-06-06 12:08:01 +0000376
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000377 setOperationAction(ISD::AND, VT, Legal);
378 setOperationAction(ISD::OR, VT, Legal);
379 setOperationAction(ISD::XOR, VT, Legal);
380 setOperationAction(ISD::LOAD, VT, Legal);
381 setOperationAction(ISD::SELECT, VT, Legal);
382 setOperationAction(ISD::STORE, VT, Legal);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000383
Scott Michel266bc8f2007-12-04 22:23:35 +0000384 // These operations need to be expanded:
Scott Michelc9c8b2a2009-01-26 03:31:40 +0000385 setOperationAction(ISD::SDIV, VT, Expand);
386 setOperationAction(ISD::SREM, VT, Expand);
387 setOperationAction(ISD::UDIV, VT, Expand);
388 setOperationAction(ISD::UREM, VT, Expand);
Scott Michel266bc8f2007-12-04 22:23:35 +0000389
390 // Custom lower build_vector, constant pool spills, insert and
391 // extract vector elements:
Duncan Sands83ec4b62008-06-06 12:08:01 +0000392 setOperationAction(ISD::BUILD_VECTOR, VT, Custom);
393 setOperationAction(ISD::ConstantPool, VT, Custom);
394 setOperationAction(ISD::SCALAR_TO_VECTOR, VT, Custom);
395 setOperationAction(ISD::EXTRACT_VECTOR_ELT, VT, Custom);
396 setOperationAction(ISD::INSERT_VECTOR_ELT, VT, Custom);
397 setOperationAction(ISD::VECTOR_SHUFFLE, VT, Custom);
Scott Michel266bc8f2007-12-04 22:23:35 +0000398 }
399
Scott Michel266bc8f2007-12-04 22:23:35 +0000400 setOperationAction(ISD::AND, MVT::v16i8, Custom);
401 setOperationAction(ISD::OR, MVT::v16i8, Custom);
402 setOperationAction(ISD::XOR, MVT::v16i8, Custom);
403 setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4f32, Custom);
Scott Michel9de5d0d2008-01-11 02:53:15 +0000404
Scott Michel02d711b2008-12-30 23:28:25 +0000405 setOperationAction(ISD::FDIV, MVT::v4f32, Legal);
Scott Michel1df30c42008-12-29 03:23:36 +0000406
Scott Michel266bc8f2007-12-04 22:23:35 +0000407 setShiftAmountType(MVT::i32);
Scott Michelf0569be2008-12-27 04:51:36 +0000408 setBooleanContents(ZeroOrNegativeOneBooleanContent);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000409
Scott Michel266bc8f2007-12-04 22:23:35 +0000410 setStackPointerRegisterToSaveRestore(SPU::R1);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000411
Scott Michel266bc8f2007-12-04 22:23:35 +0000412 // We have target-specific dag combine patterns for the following nodes:
Scott Michel053c1da2008-01-29 02:16:57 +0000413 setTargetDAGCombine(ISD::ADD);
Scott Michela59d4692008-02-23 18:41:37 +0000414 setTargetDAGCombine(ISD::ZERO_EXTEND);
415 setTargetDAGCombine(ISD::SIGN_EXTEND);
416 setTargetDAGCombine(ISD::ANY_EXTEND);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000417
Scott Michel266bc8f2007-12-04 22:23:35 +0000418 computeRegisterProperties();
Scott Michel7a1c9e92008-11-22 23:50:42 +0000419
Scott Michele07d3de2008-12-09 03:37:19 +0000420 // Set pre-RA register scheduler default to BURR, which produces slightly
421 // better code than the default (could also be TDRR, but TargetLowering.h
422 // needs a mod to support that model):
423 setSchedulingPreference(SchedulingForRegPressure);
Scott Michel266bc8f2007-12-04 22:23:35 +0000424}
425
426const char *
427SPUTargetLowering::getTargetNodeName(unsigned Opcode) const
428{
429 if (node_names.empty()) {
430 node_names[(unsigned) SPUISD::RET_FLAG] = "SPUISD::RET_FLAG";
431 node_names[(unsigned) SPUISD::Hi] = "SPUISD::Hi";
432 node_names[(unsigned) SPUISD::Lo] = "SPUISD::Lo";
433 node_names[(unsigned) SPUISD::PCRelAddr] = "SPUISD::PCRelAddr";
Scott Michel9de5d0d2008-01-11 02:53:15 +0000434 node_names[(unsigned) SPUISD::AFormAddr] = "SPUISD::AFormAddr";
Scott Michel053c1da2008-01-29 02:16:57 +0000435 node_names[(unsigned) SPUISD::IndirectAddr] = "SPUISD::IndirectAddr";
Scott Michel266bc8f2007-12-04 22:23:35 +0000436 node_names[(unsigned) SPUISD::LDRESULT] = "SPUISD::LDRESULT";
437 node_names[(unsigned) SPUISD::CALL] = "SPUISD::CALL";
438 node_names[(unsigned) SPUISD::SHUFB] = "SPUISD::SHUFB";
Scott Michel7a1c9e92008-11-22 23:50:42 +0000439 node_names[(unsigned) SPUISD::SHUFFLE_MASK] = "SPUISD::SHUFFLE_MASK";
Scott Michel266bc8f2007-12-04 22:23:35 +0000440 node_names[(unsigned) SPUISD::CNTB] = "SPUISD::CNTB";
Scott Michel1df30c42008-12-29 03:23:36 +0000441 node_names[(unsigned) SPUISD::PREFSLOT2VEC] = "SPUISD::PREFSLOT2VEC";
Scott Michel104de432008-11-24 17:11:17 +0000442 node_names[(unsigned) SPUISD::VEC2PREFSLOT] = "SPUISD::VEC2PREFSLOT";
Scott Michela59d4692008-02-23 18:41:37 +0000443 node_names[(unsigned) SPUISD::SHLQUAD_L_BITS] = "SPUISD::SHLQUAD_L_BITS";
444 node_names[(unsigned) SPUISD::SHLQUAD_L_BYTES] = "SPUISD::SHLQUAD_L_BYTES";
Scott Michel266bc8f2007-12-04 22:23:35 +0000445 node_names[(unsigned) SPUISD::VEC_SHL] = "SPUISD::VEC_SHL";
446 node_names[(unsigned) SPUISD::VEC_SRL] = "SPUISD::VEC_SRL";
447 node_names[(unsigned) SPUISD::VEC_SRA] = "SPUISD::VEC_SRA";
448 node_names[(unsigned) SPUISD::VEC_ROTL] = "SPUISD::VEC_ROTL";
449 node_names[(unsigned) SPUISD::VEC_ROTR] = "SPUISD::VEC_ROTR";
Scott Micheld1e8d9c2009-01-21 04:58:48 +0000450 node_names[(unsigned) SPUISD::ROTBYTES_LEFT] = "SPUISD::ROTBYTES_LEFT";
451 node_names[(unsigned) SPUISD::ROTBYTES_LEFT_BITS] =
452 "SPUISD::ROTBYTES_LEFT_BITS";
Scott Michel8bf61e82008-06-02 22:18:03 +0000453 node_names[(unsigned) SPUISD::SELECT_MASK] = "SPUISD::SELECT_MASK";
Scott Michel266bc8f2007-12-04 22:23:35 +0000454 node_names[(unsigned) SPUISD::SELB] = "SPUISD::SELB";
Scott Michel94bd57e2009-01-15 04:41:47 +0000455 node_names[(unsigned) SPUISD::ADD64_MARKER] = "SPUISD::ADD64_MARKER";
456 node_names[(unsigned) SPUISD::SUB64_MARKER] = "SPUISD::SUB64_MARKER";
457 node_names[(unsigned) SPUISD::MUL64_MARKER] = "SPUISD::MUL64_MARKER";
Scott Michel266bc8f2007-12-04 22:23:35 +0000458 }
459
460 std::map<unsigned, const char *>::iterator i = node_names.find(Opcode);
461
462 return ((i != node_names.end()) ? i->second : 0);
463}
464
Scott Michelf0569be2008-12-27 04:51:36 +0000465//===----------------------------------------------------------------------===//
466// Return the Cell SPU's SETCC result type
467//===----------------------------------------------------------------------===//
468
Duncan Sands5480c042009-01-01 15:52:00 +0000469MVT SPUTargetLowering::getSetCCResultType(MVT VT) const {
Scott Michelf0569be2008-12-27 04:51:36 +0000470 // i16 and i32 are valid SETCC result types
471 return ((VT == MVT::i8 || VT == MVT::i16 || VT == MVT::i32) ? VT : MVT::i32);
Scott Michel78c47fa2008-03-10 16:58:52 +0000472}
473
Scott Michel266bc8f2007-12-04 22:23:35 +0000474//===----------------------------------------------------------------------===//
475// Calling convention code:
476//===----------------------------------------------------------------------===//
477
478#include "SPUGenCallingConv.inc"
479
480//===----------------------------------------------------------------------===//
481// LowerOperation implementation
482//===----------------------------------------------------------------------===//
483
484/// Custom lower loads for CellSPU
485/*!
486 All CellSPU loads and stores are aligned to 16-byte boundaries, so for elements
487 within a 16-byte block, we have to rotate to extract the requested element.
Scott Michel30ee7df2008-12-04 03:02:42 +0000488
489 For extending loads, we also want to ensure that the following sequence is
490 emitted, e.g. for MVT::f32 extending load to MVT::f64:
491
492\verbatim
Scott Michel1df30c42008-12-29 03:23:36 +0000493%1 v16i8,ch = load
Scott Michel30ee7df2008-12-04 03:02:42 +0000494%2 v16i8,ch = rotate %1
%3 v4f32,ch = bitconvert %2
%4 f32      = vec2prefslot %3
497%5 f64 = fp_extend %4
498\endverbatim
499*/
Dan Gohman475871a2008-07-27 21:46:04 +0000500static SDValue
501LowerLOAD(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Scott Michel266bc8f2007-12-04 22:23:35 +0000502 LoadSDNode *LN = cast<LoadSDNode>(Op);
Dan Gohman475871a2008-07-27 21:46:04 +0000503 SDValue the_chain = LN->getChain();
Scott Michelf0569be2008-12-27 04:51:36 +0000504 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel30ee7df2008-12-04 03:02:42 +0000505 MVT InVT = LN->getMemoryVT();
506 MVT OutVT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +0000507 ISD::LoadExtType ExtType = LN->getExtensionType();
508 unsigned alignment = LN->getAlignment();
Scott Michelf0569be2008-12-27 04:51:36 +0000509 const valtype_map_s *vtm = getValueTypeMapEntry(InVT);
Dale Johannesen33c960f2009-02-04 20:06:27 +0000510 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +0000511
Scott Michel266bc8f2007-12-04 22:23:35 +0000512 switch (LN->getAddressingMode()) {
513 case ISD::UNINDEXED: {
Scott Michelf0569be2008-12-27 04:51:36 +0000514 SDValue result;
515 SDValue basePtr = LN->getBasePtr();
516 SDValue rotate;
Scott Michel266bc8f2007-12-04 22:23:35 +0000517
Scott Michelf0569be2008-12-27 04:51:36 +0000518 if (alignment == 16) {
519 ConstantSDNode *CN;
Scott Michel9de5d0d2008-01-11 02:53:15 +0000520
Scott Michelf0569be2008-12-27 04:51:36 +0000521 // Special cases for a known aligned load to simplify the base pointer
522 // and the rotation amount:
523 if (basePtr.getOpcode() == ISD::ADD
524 && (CN = dyn_cast<ConstantSDNode > (basePtr.getOperand(1))) != 0) {
525 // Known offset into basePtr
526 int64_t offset = CN->getSExtValue();
527 int64_t rotamt = int64_t((offset & 0xf) - vtm->prefslot_byte);
Scott Michel9de5d0d2008-01-11 02:53:15 +0000528
Scott Michelf0569be2008-12-27 04:51:36 +0000529 if (rotamt < 0)
530 rotamt += 16;
531
532 rotate = DAG.getConstant(rotamt, MVT::i16);
533
534 // Simplify the base pointer for this case:
535 basePtr = basePtr.getOperand(0);
536 if ((offset & ~0xf) > 0) {
537 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
538 basePtr,
539 DAG.getConstant((offset & ~0xf), PtrVT));
540 }
541 } else if ((basePtr.getOpcode() == SPUISD::AFormAddr)
542 || (basePtr.getOpcode() == SPUISD::IndirectAddr
543 && basePtr.getOperand(0).getOpcode() == SPUISD::Hi
544 && basePtr.getOperand(1).getOpcode() == SPUISD::Lo)) {
545 // Plain aligned a-form address: rotate into preferred slot
546 // Same for (SPUindirect (SPUhi ...), (SPUlo ...))
547 int64_t rotamt = -vtm->prefslot_byte;
548 if (rotamt < 0)
549 rotamt += 16;
550 rotate = DAG.getConstant(rotamt, MVT::i16);
Scott Michel9de5d0d2008-01-11 02:53:15 +0000551 } else {
Scott Michelf0569be2008-12-27 04:51:36 +0000552 // Offset the rotate amount by the basePtr and the preferred slot
553 // byte offset
554 int64_t rotamt = -vtm->prefslot_byte;
555 if (rotamt < 0)
556 rotamt += 16;
Dale Johannesen33c960f2009-02-04 20:06:27 +0000557 rotate = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000558 basePtr,
Scott Michel7f9ba9b2008-01-30 02:55:46 +0000559 DAG.getConstant(rotamt, PtrVT));
Scott Michel9de5d0d2008-01-11 02:53:15 +0000560 }
Scott Michelf0569be2008-12-27 04:51:36 +0000561 } else {
562 // Unaligned load: must be more pessimistic about addressing modes:
563 if (basePtr.getOpcode() == ISD::ADD) {
564 MachineFunction &MF = DAG.getMachineFunction();
565 MachineRegisterInfo &RegInfo = MF.getRegInfo();
566 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
567 SDValue Flag;
Scott Michel9de5d0d2008-01-11 02:53:15 +0000568
Scott Michelf0569be2008-12-27 04:51:36 +0000569 SDValue Op0 = basePtr.getOperand(0);
570 SDValue Op1 = basePtr.getOperand(1);
571
572 if (isa<ConstantSDNode>(Op1)) {
573 // Convert the (add <ptr>, <const>) to an indirect address contained
574 // in a register. Note that this is done because we need to avoid
575 // creating a 0(reg) d-form address due to the SPU's block loads.
576 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT, Op0, Op1);
Dale Johannesen33c960f2009-02-04 20:06:27 +0000577 the_chain = DAG.getCopyToReg(the_chain, dl, VReg, basePtr, Flag);
578 basePtr = DAG.getCopyFromReg(the_chain, dl, VReg, PtrVT);
Scott Michelf0569be2008-12-27 04:51:36 +0000579 } else {
580 // Convert the (add <arg1>, <arg2>) to an indirect address, which
581 // will likely be lowered as a reg(reg) x-form address.
582 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT, Op0, Op1);
583 }
584 } else {
585 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
586 basePtr,
587 DAG.getConstant(0, PtrVT));
588 }
589
590 // Offset the rotate amount by the basePtr and the preferred slot
591 // byte offset
Dale Johannesen33c960f2009-02-04 20:06:27 +0000592 rotate = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000593 basePtr,
594 DAG.getConstant(-vtm->prefslot_byte, PtrVT));
Scott Michel266bc8f2007-12-04 22:23:35 +0000595 }
Scott Michel9de5d0d2008-01-11 02:53:15 +0000596
Scott Michelf0569be2008-12-27 04:51:36 +0000597 // Re-emit as a v16i8 vector load
Dale Johannesen33c960f2009-02-04 20:06:27 +0000598 result = DAG.getLoad(MVT::v16i8, dl, the_chain, basePtr,
Scott Michelf0569be2008-12-27 04:51:36 +0000599 LN->getSrcValue(), LN->getSrcValueOffset(),
600 LN->isVolatile(), 16);
601
602 // Update the chain
603 the_chain = result.getValue(1);
604
605 // Rotate into the preferred slot:
Dale Johannesen33c960f2009-02-04 20:06:27 +0000606 result = DAG.getNode(SPUISD::ROTBYTES_LEFT, dl, MVT::v16i8,
Scott Michelf0569be2008-12-27 04:51:36 +0000607 result.getValue(0), rotate);
608
Scott Michel30ee7df2008-12-04 03:02:42 +0000609 // Convert the loaded v16i8 vector to the appropriate vector type
610 // specified by the operand:
611 MVT vecVT = MVT::getVectorVT(InVT, (128 / InVT.getSizeInBits()));
Dale Johannesen33c960f2009-02-04 20:06:27 +0000612 result = DAG.getNode(SPUISD::VEC2PREFSLOT, dl, InVT,
613 DAG.getNode(ISD::BIT_CONVERT, dl, vecVT, result));
Scott Michel5af8f0e2008-07-16 17:17:29 +0000614
Scott Michel30ee7df2008-12-04 03:02:42 +0000615 // Handle extending loads by extending the scalar result:
616 if (ExtType == ISD::SEXTLOAD) {
Dale Johannesen33c960f2009-02-04 20:06:27 +0000617 result = DAG.getNode(ISD::SIGN_EXTEND, dl, OutVT, result);
Scott Michel30ee7df2008-12-04 03:02:42 +0000618 } else if (ExtType == ISD::ZEXTLOAD) {
Dale Johannesen33c960f2009-02-04 20:06:27 +0000619 result = DAG.getNode(ISD::ZERO_EXTEND, dl, OutVT, result);
Scott Michel30ee7df2008-12-04 03:02:42 +0000620 } else if (ExtType == ISD::EXTLOAD) {
621 unsigned NewOpc = ISD::ANY_EXTEND;
Scott Michel9de5d0d2008-01-11 02:53:15 +0000622
Scott Michel30ee7df2008-12-04 03:02:42 +0000623 if (OutVT.isFloatingPoint())
Scott Michel19c10e62009-01-26 03:37:41 +0000624 NewOpc = ISD::FP_EXTEND;
Scott Michel9de5d0d2008-01-11 02:53:15 +0000625
Dale Johannesen33c960f2009-02-04 20:06:27 +0000626 result = DAG.getNode(NewOpc, dl, OutVT, result);
Scott Michel9de5d0d2008-01-11 02:53:15 +0000627 }
628
Scott Michel30ee7df2008-12-04 03:02:42 +0000629 SDVTList retvts = DAG.getVTList(OutVT, MVT::Other);
Dan Gohman475871a2008-07-27 21:46:04 +0000630 SDValue retops[2] = {
Scott Michel58c58182008-01-17 20:38:41 +0000631 result,
Scott Michel7f9ba9b2008-01-30 02:55:46 +0000632 the_chain
Scott Michel58c58182008-01-17 20:38:41 +0000633 };
Scott Michel9de5d0d2008-01-11 02:53:15 +0000634
Dale Johannesen33c960f2009-02-04 20:06:27 +0000635 result = DAG.getNode(SPUISD::LDRESULT, dl, retvts,
Scott Michel58c58182008-01-17 20:38:41 +0000636 retops, sizeof(retops) / sizeof(retops[0]));
Scott Michel9de5d0d2008-01-11 02:53:15 +0000637 return result;
Scott Michel266bc8f2007-12-04 22:23:35 +0000638 }
639 case ISD::PRE_INC:
640 case ISD::PRE_DEC:
641 case ISD::POST_INC:
642 case ISD::POST_DEC:
643 case ISD::LAST_INDEXED_MODE:
644 cerr << "LowerLOAD: Got a LoadSDNode with an addr mode other than "
645 "UNINDEXED\n";
646 cerr << (unsigned) LN->getAddressingMode() << "\n";
647 abort();
648 /*NOTREACHED*/
649 }
650
Dan Gohman475871a2008-07-27 21:46:04 +0000651 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000652}
653
654/// Custom lower stores for CellSPU
655/*!
656 All CellSPU stores are aligned to 16-byte boundaries, so for elements
657 within a 16-byte block, we have to generate a shuffle to insert the
658 requested element into its place, then store the resulting block.
659 */
Dan Gohman475871a2008-07-27 21:46:04 +0000660static SDValue
661LowerSTORE(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Scott Michel266bc8f2007-12-04 22:23:35 +0000662 StoreSDNode *SN = cast<StoreSDNode>(Op);
Dan Gohman475871a2008-07-27 21:46:04 +0000663 SDValue Value = SN->getValue();
Duncan Sands83ec4b62008-06-06 12:08:01 +0000664 MVT VT = Value.getValueType();
665 MVT StVT = (!SN->isTruncatingStore() ? VT : SN->getMemoryVT());
666 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Dale Johannesen33c960f2009-02-04 20:06:27 +0000667 DebugLoc dl = Op.getDebugLoc();
Scott Michel9de5d0d2008-01-11 02:53:15 +0000668 unsigned alignment = SN->getAlignment();
Scott Michel266bc8f2007-12-04 22:23:35 +0000669
670 switch (SN->getAddressingMode()) {
671 case ISD::UNINDEXED: {
Scott Michel9c0c6b22008-11-21 02:56:16 +0000672 // The vector type we really want to load from the 16-byte chunk.
Scott Michel719b0e12008-11-19 17:45:08 +0000673 MVT vecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits())),
674 stVecVT = MVT::getVectorVT(StVT, (128 / StVT.getSizeInBits()));
Scott Michel266bc8f2007-12-04 22:23:35 +0000675
Scott Michelf0569be2008-12-27 04:51:36 +0000676 SDValue alignLoadVec;
677 SDValue basePtr = SN->getBasePtr();
678 SDValue the_chain = SN->getChain();
679 SDValue insertEltOffs;
Scott Michel266bc8f2007-12-04 22:23:35 +0000680
Scott Michelf0569be2008-12-27 04:51:36 +0000681 if (alignment == 16) {
682 ConstantSDNode *CN;
683
684 // Special cases for a known aligned load to simplify the base pointer
685 // and insertion byte:
686 if (basePtr.getOpcode() == ISD::ADD
687 && (CN = dyn_cast<ConstantSDNode>(basePtr.getOperand(1))) != 0) {
688 // Known offset into basePtr
689 int64_t offset = CN->getSExtValue();
690
691 // Simplify the base pointer for this case:
692 basePtr = basePtr.getOperand(0);
693 insertEltOffs = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
694 basePtr,
695 DAG.getConstant((offset & 0xf), PtrVT));
696
697 if ((offset & ~0xf) > 0) {
698 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
699 basePtr,
700 DAG.getConstant((offset & ~0xf), PtrVT));
701 }
702 } else {
703 // Otherwise, assume it's at byte 0 of basePtr
704 insertEltOffs = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
705 basePtr,
706 DAG.getConstant(0, PtrVT));
707 }
708 } else {
709 // Unaligned load: must be more pessimistic about addressing modes:
710 if (basePtr.getOpcode() == ISD::ADD) {
711 MachineFunction &MF = DAG.getMachineFunction();
712 MachineRegisterInfo &RegInfo = MF.getRegInfo();
713 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
714 SDValue Flag;
715
716 SDValue Op0 = basePtr.getOperand(0);
717 SDValue Op1 = basePtr.getOperand(1);
718
719 if (isa<ConstantSDNode>(Op1)) {
720 // Convert the (add <ptr>, <const>) to an indirect address contained
721 // in a register. Note that this is done because we need to avoid
722 // creating a 0(reg) d-form address due to the SPU's block loads.
723 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT, Op0, Op1);
Dale Johannesen33c960f2009-02-04 20:06:27 +0000724 the_chain = DAG.getCopyToReg(the_chain, dl, VReg, basePtr, Flag);
725 basePtr = DAG.getCopyFromReg(the_chain, dl, VReg, PtrVT);
Scott Michelf0569be2008-12-27 04:51:36 +0000726 } else {
727 // Convert the (add <arg1>, <arg2>) to an indirect address, which
728 // will likely be lowered as a reg(reg) x-form address.
729 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT, Op0, Op1);
730 }
731 } else {
732 basePtr = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
733 basePtr,
734 DAG.getConstant(0, PtrVT));
735 }
736
737 // Insertion point is solely determined by basePtr's contents
Dale Johannesen33c960f2009-02-04 20:06:27 +0000738 insertEltOffs = DAG.getNode(ISD::ADD, dl, PtrVT,
Scott Michelf0569be2008-12-27 04:51:36 +0000739 basePtr,
740 DAG.getConstant(0, PtrVT));
741 }
742
743 // Re-emit as a v16i8 vector load
Dale Johannesen33c960f2009-02-04 20:06:27 +0000744 alignLoadVec = DAG.getLoad(MVT::v16i8, dl, the_chain, basePtr,
Scott Michelf0569be2008-12-27 04:51:36 +0000745 SN->getSrcValue(), SN->getSrcValueOffset(),
746 SN->isVolatile(), 16);
747
748 // Update the chain
749 the_chain = alignLoadVec.getValue(1);
Scott Michel266bc8f2007-12-04 22:23:35 +0000750
Scott Michel9de5d0d2008-01-11 02:53:15 +0000751 LoadSDNode *LN = cast<LoadSDNode>(alignLoadVec);
Dan Gohman475871a2008-07-27 21:46:04 +0000752 SDValue theValue = SN->getValue();
753 SDValue result;
Scott Michel266bc8f2007-12-04 22:23:35 +0000754
755 if (StVT != VT
Scott Michel7f9ba9b2008-01-30 02:55:46 +0000756 && (theValue.getOpcode() == ISD::AssertZext
757 || theValue.getOpcode() == ISD::AssertSext)) {
Scott Michel266bc8f2007-12-04 22:23:35 +0000758 // Drill down and get the value for zero- and sign-extended
759 // quantities
Scott Michel5af8f0e2008-07-16 17:17:29 +0000760 theValue = theValue.getOperand(0);
Scott Michel266bc8f2007-12-04 22:23:35 +0000761 }
762
Scott Michel9de5d0d2008-01-11 02:53:15 +0000763 // If the base pointer is already a D-form address, then just create
764 // a new D-form address with a slot offset and the orignal base pointer.
765 // Otherwise generate a D-form address with the slot offset relative
766 // to the stack pointer, which is always aligned.
Scott Michelf0569be2008-12-27 04:51:36 +0000767#if !defined(NDEBUG)
768 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
769 cerr << "CellSPU LowerSTORE: basePtr = ";
770 basePtr.getNode()->dump(&DAG);
771 cerr << "\n";
772 }
773#endif
Scott Michel9de5d0d2008-01-11 02:53:15 +0000774
Scott Michel430a5552008-11-19 15:24:16 +0000775 SDValue insertEltOp =
Dale Johannesen33c960f2009-02-04 20:06:27 +0000776 DAG.getNode(SPUISD::SHUFFLE_MASK, dl, vecVT, insertEltOffs);
Scott Michel719b0e12008-11-19 17:45:08 +0000777 SDValue vectorizeOp =
Dale Johannesen33c960f2009-02-04 20:06:27 +0000778 DAG.getNode(ISD::SCALAR_TO_VECTOR, dl, vecVT, theValue);
Scott Michel430a5552008-11-19 15:24:16 +0000779
Dale Johannesen33c960f2009-02-04 20:06:27 +0000780 result = DAG.getNode(SPUISD::SHUFB, dl, vecVT,
Scott Michel19c10e62009-01-26 03:37:41 +0000781 vectorizeOp, alignLoadVec,
Dale Johannesen33c960f2009-02-04 20:06:27 +0000782 DAG.getNode(ISD::BIT_CONVERT, dl,
783 MVT::v4i32, insertEltOp));
Scott Michel266bc8f2007-12-04 22:23:35 +0000784
Dale Johannesen33c960f2009-02-04 20:06:27 +0000785 result = DAG.getStore(the_chain, dl, result, basePtr,
Scott Michel266bc8f2007-12-04 22:23:35 +0000786 LN->getSrcValue(), LN->getSrcValueOffset(),
787 LN->isVolatile(), LN->getAlignment());
788
Scott Michel23f2ff72008-12-04 17:16:59 +0000789#if 0 && !defined(NDEBUG)
Scott Michel430a5552008-11-19 15:24:16 +0000790 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
791 const SDValue &currentRoot = DAG.getRoot();
792
793 DAG.setRoot(result);
794 cerr << "------- CellSPU:LowerStore result:\n";
795 DAG.dump();
796 cerr << "-------\n";
797 DAG.setRoot(currentRoot);
798 }
799#endif
Scott Michelb30e8f62008-12-02 19:53:53 +0000800
Scott Michel266bc8f2007-12-04 22:23:35 +0000801 return result;
802 /*UNREACHED*/
803 }
804 case ISD::PRE_INC:
805 case ISD::PRE_DEC:
806 case ISD::POST_INC:
807 case ISD::POST_DEC:
808 case ISD::LAST_INDEXED_MODE:
809 cerr << "LowerLOAD: Got a LoadSDNode with an addr mode other than "
810 "UNINDEXED\n";
811 cerr << (unsigned) SN->getAddressingMode() << "\n";
812 abort();
813 /*NOTREACHED*/
814 }
815
Dan Gohman475871a2008-07-27 21:46:04 +0000816 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000817}
818
Scott Michel94bd57e2009-01-15 04:41:47 +0000819//! Generate the address of a constant pool entry.
820SDValue
Dan Gohman475871a2008-07-27 21:46:04 +0000821LowerConstantPool(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000822 MVT PtrVT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +0000823 ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(Op);
824 Constant *C = CP->getConstVal();
Dan Gohman475871a2008-07-27 21:46:04 +0000825 SDValue CPI = DAG.getTargetConstantPool(C, PtrVT, CP->getAlignment());
826 SDValue Zero = DAG.getConstant(0, PtrVT);
Scott Michel9de5d0d2008-01-11 02:53:15 +0000827 const TargetMachine &TM = DAG.getTarget();
Scott Michel266bc8f2007-12-04 22:23:35 +0000828
829 if (TM.getRelocationModel() == Reloc::Static) {
830 if (!ST->usingLargeMem()) {
Dan Gohman475871a2008-07-27 21:46:04 +0000831 // Just return the SDValue with the constant pool address in it.
Scott Michel58c58182008-01-17 20:38:41 +0000832 return DAG.getNode(SPUISD::AFormAddr, PtrVT, CPI, Zero);
Scott Michel266bc8f2007-12-04 22:23:35 +0000833 } else {
Dan Gohman475871a2008-07-27 21:46:04 +0000834 SDValue Hi = DAG.getNode(SPUISD::Hi, PtrVT, CPI, Zero);
835 SDValue Lo = DAG.getNode(SPUISD::Lo, PtrVT, CPI, Zero);
Scott Michela59d4692008-02-23 18:41:37 +0000836 return DAG.getNode(SPUISD::IndirectAddr, PtrVT, Hi, Lo);
Scott Michel266bc8f2007-12-04 22:23:35 +0000837 }
838 }
839
840 assert(0 &&
Gabor Greif93c53e52008-08-31 15:37:04 +0000841 "LowerConstantPool: Relocation model other than static"
842 " not supported.");
Dan Gohman475871a2008-07-27 21:46:04 +0000843 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000844}
845
Scott Michel94bd57e2009-01-15 04:41:47 +0000846//! Alternate entry point for generating the address of a constant pool entry
847SDValue
848SPU::LowerConstantPool(SDValue Op, SelectionDAG &DAG, const SPUTargetMachine &TM) {
849 return ::LowerConstantPool(Op, DAG, TM.getSubtargetImpl());
850}
851
Dan Gohman475871a2008-07-27 21:46:04 +0000852static SDValue
853LowerJumpTable(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000854 MVT PtrVT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +0000855 JumpTableSDNode *JT = cast<JumpTableSDNode>(Op);
Dan Gohman475871a2008-07-27 21:46:04 +0000856 SDValue JTI = DAG.getTargetJumpTable(JT->getIndex(), PtrVT);
857 SDValue Zero = DAG.getConstant(0, PtrVT);
Scott Michel266bc8f2007-12-04 22:23:35 +0000858 const TargetMachine &TM = DAG.getTarget();
859
860 if (TM.getRelocationModel() == Reloc::Static) {
Scott Michela59d4692008-02-23 18:41:37 +0000861 if (!ST->usingLargeMem()) {
862 return DAG.getNode(SPUISD::AFormAddr, PtrVT, JTI, Zero);
863 } else {
Dan Gohman475871a2008-07-27 21:46:04 +0000864 SDValue Hi = DAG.getNode(SPUISD::Hi, PtrVT, JTI, Zero);
865 SDValue Lo = DAG.getNode(SPUISD::Lo, PtrVT, JTI, Zero);
Scott Michela59d4692008-02-23 18:41:37 +0000866 return DAG.getNode(SPUISD::IndirectAddr, PtrVT, Hi, Lo);
867 }
Scott Michel266bc8f2007-12-04 22:23:35 +0000868 }
869
870 assert(0 &&
871 "LowerJumpTable: Relocation model other than static not supported.");
Dan Gohman475871a2008-07-27 21:46:04 +0000872 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000873}
874
Dan Gohman475871a2008-07-27 21:46:04 +0000875static SDValue
876LowerGlobalAddress(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000877 MVT PtrVT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +0000878 GlobalAddressSDNode *GSDN = cast<GlobalAddressSDNode>(Op);
879 GlobalValue *GV = GSDN->getGlobal();
Dan Gohman475871a2008-07-27 21:46:04 +0000880 SDValue GA = DAG.getTargetGlobalAddress(GV, PtrVT, GSDN->getOffset());
Scott Michel266bc8f2007-12-04 22:23:35 +0000881 const TargetMachine &TM = DAG.getTarget();
Dan Gohman475871a2008-07-27 21:46:04 +0000882 SDValue Zero = DAG.getConstant(0, PtrVT);
Scott Michel5af8f0e2008-07-16 17:17:29 +0000883
Scott Michel266bc8f2007-12-04 22:23:35 +0000884 if (TM.getRelocationModel() == Reloc::Static) {
Scott Michel053c1da2008-01-29 02:16:57 +0000885 if (!ST->usingLargeMem()) {
886 return DAG.getNode(SPUISD::AFormAddr, PtrVT, GA, Zero);
887 } else {
Dan Gohman475871a2008-07-27 21:46:04 +0000888 SDValue Hi = DAG.getNode(SPUISD::Hi, PtrVT, GA, Zero);
889 SDValue Lo = DAG.getNode(SPUISD::Lo, PtrVT, GA, Zero);
Scott Michel053c1da2008-01-29 02:16:57 +0000890 return DAG.getNode(SPUISD::IndirectAddr, PtrVT, Hi, Lo);
891 }
Scott Michel266bc8f2007-12-04 22:23:35 +0000892 } else {
893 cerr << "LowerGlobalAddress: Relocation model other than static not "
Scott Michel7f9ba9b2008-01-30 02:55:46 +0000894 << "supported.\n";
Scott Michel266bc8f2007-12-04 22:23:35 +0000895 abort();
896 /*NOTREACHED*/
897 }
898
Dan Gohman475871a2008-07-27 21:46:04 +0000899 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000900}
901
Nate Begemanccef5802008-02-14 18:43:04 +0000902//! Custom lower double precision floating point constants
Dan Gohman475871a2008-07-27 21:46:04 +0000903static SDValue
904LowerConstantFP(SDValue Op, SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000905 MVT VT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +0000906
Nate Begemanccef5802008-02-14 18:43:04 +0000907 if (VT == MVT::f64) {
Scott Michel1a6cdb62008-12-01 17:56:02 +0000908 ConstantFPSDNode *FP = cast<ConstantFPSDNode>(Op.getNode());
909
910 assert((FP != 0) &&
911 "LowerConstantFP: Node is not ConstantFPSDNode");
Scott Michel1df30c42008-12-29 03:23:36 +0000912
Scott Michel170783a2007-12-19 20:15:47 +0000913 uint64_t dbits = DoubleToBits(FP->getValueAPF().convertToDouble());
Scott Michel1a6cdb62008-12-01 17:56:02 +0000914 SDValue T = DAG.getConstant(dbits, MVT::i64);
915 SDValue Tvec = DAG.getNode(ISD::BUILD_VECTOR, MVT::v2i64, T, T);
916 return DAG.getNode(SPUISD::VEC2PREFSLOT, VT,
917 DAG.getNode(ISD::BIT_CONVERT, MVT::v2f64, Tvec));
Scott Michel266bc8f2007-12-04 22:23:35 +0000918 }
919
Dan Gohman475871a2008-07-27 21:46:04 +0000920 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +0000921}
922
Dan Gohman475871a2008-07-27 21:46:04 +0000923static SDValue
Dan Gohman475871a2008-07-27 21:46:04 +0000924LowerFORMAL_ARGUMENTS(SDValue Op, SelectionDAG &DAG, int &VarArgsFrameIndex)
Scott Michel266bc8f2007-12-04 22:23:35 +0000925{
926 MachineFunction &MF = DAG.getMachineFunction();
927 MachineFrameInfo *MFI = MF.getFrameInfo();
Chris Lattner84bc5422007-12-31 04:13:23 +0000928 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Micheld976c212008-10-30 01:51:48 +0000929 SmallVector<SDValue, 48> ArgValues;
Dan Gohman475871a2008-07-27 21:46:04 +0000930 SDValue Root = Op.getOperand(0);
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +0000931 bool isVarArg = cast<ConstantSDNode>(Op.getOperand(2))->getZExtValue() != 0;
Dale Johannesen33c960f2009-02-04 20:06:27 +0000932 DebugLoc dl = Op.getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +0000933
934 const unsigned *ArgRegs = SPURegisterInfo::getArgRegs();
935 const unsigned NumArgRegs = SPURegisterInfo::getNumArgRegs();
Scott Michel5af8f0e2008-07-16 17:17:29 +0000936
Scott Michel266bc8f2007-12-04 22:23:35 +0000937 unsigned ArgOffset = SPUFrameInfo::minStackSize();
938 unsigned ArgRegIdx = 0;
939 unsigned StackSlotSize = SPUFrameInfo::stackSlotSize();
Scott Michel5af8f0e2008-07-16 17:17:29 +0000940
Duncan Sands83ec4b62008-06-06 12:08:01 +0000941 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel5af8f0e2008-07-16 17:17:29 +0000942
Scott Michel266bc8f2007-12-04 22:23:35 +0000943 // Add DAG nodes to load the arguments or copy them out of registers.
Gabor Greif93c53e52008-08-31 15:37:04 +0000944 for (unsigned ArgNo = 0, e = Op.getNode()->getNumValues() - 1;
945 ArgNo != e; ++ArgNo) {
Duncan Sands83ec4b62008-06-06 12:08:01 +0000946 MVT ObjectVT = Op.getValue(ArgNo).getValueType();
947 unsigned ObjSize = ObjectVT.getSizeInBits()/8;
Scott Micheld976c212008-10-30 01:51:48 +0000948 SDValue ArgVal;
Scott Michel266bc8f2007-12-04 22:23:35 +0000949
Scott Micheld976c212008-10-30 01:51:48 +0000950 if (ArgRegIdx < NumArgRegs) {
951 const TargetRegisterClass *ArgRegClass;
Scott Michel5af8f0e2008-07-16 17:17:29 +0000952
Scott Micheld976c212008-10-30 01:51:48 +0000953 switch (ObjectVT.getSimpleVT()) {
954 default: {
Scott Michel9c0c6b22008-11-21 02:56:16 +0000955 cerr << "LowerFORMAL_ARGUMENTS Unhandled argument type: "
956 << ObjectVT.getMVTString()
957 << "\n";
958 abort();
Scott Micheld976c212008-10-30 01:51:48 +0000959 }
960 case MVT::i8:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000961 ArgRegClass = &SPU::R8CRegClass;
962 break;
Scott Micheld976c212008-10-30 01:51:48 +0000963 case MVT::i16:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000964 ArgRegClass = &SPU::R16CRegClass;
965 break;
Scott Micheld976c212008-10-30 01:51:48 +0000966 case MVT::i32:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000967 ArgRegClass = &SPU::R32CRegClass;
968 break;
Scott Micheld976c212008-10-30 01:51:48 +0000969 case MVT::i64:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000970 ArgRegClass = &SPU::R64CRegClass;
971 break;
Scott Micheldd950092009-01-06 03:36:14 +0000972 case MVT::i128:
973 ArgRegClass = &SPU::GPRCRegClass;
974 break;
Scott Micheld976c212008-10-30 01:51:48 +0000975 case MVT::f32:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000976 ArgRegClass = &SPU::R32FPRegClass;
977 break;
Scott Micheld976c212008-10-30 01:51:48 +0000978 case MVT::f64:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000979 ArgRegClass = &SPU::R64FPRegClass;
980 break;
Scott Micheld976c212008-10-30 01:51:48 +0000981 case MVT::v2f64:
982 case MVT::v4f32:
983 case MVT::v2i64:
984 case MVT::v4i32:
985 case MVT::v8i16:
986 case MVT::v16i8:
Scott Michel9c0c6b22008-11-21 02:56:16 +0000987 ArgRegClass = &SPU::VECREGRegClass;
988 break;
Scott Micheld976c212008-10-30 01:51:48 +0000989 }
990
991 unsigned VReg = RegInfo.createVirtualRegister(ArgRegClass);
992 RegInfo.addLiveIn(ArgRegs[ArgRegIdx], VReg);
Dale Johannesen33c960f2009-02-04 20:06:27 +0000993 ArgVal = DAG.getCopyFromReg(Root, dl, VReg, ObjectVT);
Scott Micheld976c212008-10-30 01:51:48 +0000994 ++ArgRegIdx;
995 } else {
996 // We need to load the argument to a virtual register if we determined
997 // above that we ran out of physical registers of the appropriate type
998 // or we're forced to do vararg
Chris Lattner9f72d1a2008-02-13 07:35:30 +0000999 int FI = MFI->CreateFixedObject(ObjSize, ArgOffset);
Dan Gohman475871a2008-07-27 21:46:04 +00001000 SDValue FIN = DAG.getFrameIndex(FI, PtrVT);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001001 ArgVal = DAG.getLoad(ObjectVT, dl, Root, FIN, NULL, 0);
Scott Michel266bc8f2007-12-04 22:23:35 +00001002 ArgOffset += StackSlotSize;
1003 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001004
Scott Michel266bc8f2007-12-04 22:23:35 +00001005 ArgValues.push_back(ArgVal);
Scott Micheld976c212008-10-30 01:51:48 +00001006 // Update the chain
1007 Root = ArgVal.getOperand(0);
Scott Michel266bc8f2007-12-04 22:23:35 +00001008 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001009
Scott Micheld976c212008-10-30 01:51:48 +00001010 // vararg handling:
Scott Michel266bc8f2007-12-04 22:23:35 +00001011 if (isVarArg) {
Scott Micheld976c212008-10-30 01:51:48 +00001012 // unsigned int ptr_size = PtrVT.getSizeInBits() / 8;
1013 // We will spill (79-3)+1 registers to the stack
1014 SmallVector<SDValue, 79-3+1> MemOps;
1015
1016 // Create the frame slot
1017
Scott Michel266bc8f2007-12-04 22:23:35 +00001018 for (; ArgRegIdx != NumArgRegs; ++ArgRegIdx) {
Scott Micheld976c212008-10-30 01:51:48 +00001019 VarArgsFrameIndex = MFI->CreateFixedObject(StackSlotSize, ArgOffset);
1020 SDValue FIN = DAG.getFrameIndex(VarArgsFrameIndex, PtrVT);
1021 SDValue ArgVal = DAG.getRegister(ArgRegs[ArgRegIdx], MVT::v16i8);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001022 SDValue Store = DAG.getStore(Root, dl, ArgVal, FIN, NULL, 0);
Scott Micheld976c212008-10-30 01:51:48 +00001023 Root = Store.getOperand(0);
Scott Michel266bc8f2007-12-04 22:23:35 +00001024 MemOps.push_back(Store);
Scott Micheld976c212008-10-30 01:51:48 +00001025
1026 // Increment address by stack slot size for the next stored argument
1027 ArgOffset += StackSlotSize;
Scott Michel266bc8f2007-12-04 22:23:35 +00001028 }
1029 if (!MemOps.empty())
Dale Johannesen33c960f2009-02-04 20:06:27 +00001030 Root = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
1031 &MemOps[0], MemOps.size());
Scott Michel266bc8f2007-12-04 22:23:35 +00001032 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001033
Scott Michel266bc8f2007-12-04 22:23:35 +00001034 ArgValues.push_back(Root);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001035
Scott Michel266bc8f2007-12-04 22:23:35 +00001036 // Return the new list of results.
Dale Johannesen33c960f2009-02-04 20:06:27 +00001037 return DAG.getNode(ISD::MERGE_VALUES, dl, Op.getNode()->getVTList(),
Duncan Sandsaaffa052008-12-01 11:41:29 +00001038 &ArgValues[0], ArgValues.size());
Scott Michel266bc8f2007-12-04 22:23:35 +00001039}
1040
1041/// isLSAAddress - Return the immediate to use if the specified
1042/// value is representable as a LSA address.
Dan Gohman475871a2008-07-27 21:46:04 +00001043static SDNode *isLSAAddress(SDValue Op, SelectionDAG &DAG) {
Scott Michel19fd42a2008-11-11 03:06:06 +00001044 ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op);
Scott Michel266bc8f2007-12-04 22:23:35 +00001045 if (!C) return 0;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001046
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001047 int Addr = C->getZExtValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001048 if ((Addr & 3) != 0 || // Low 2 bits are implicitly zero.
1049 (Addr << 14 >> 14) != Addr)
1050 return 0; // Top 14 bits have to be sext of immediate.
Scott Michel5af8f0e2008-07-16 17:17:29 +00001051
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001052 return DAG.getConstant((int)C->getZExtValue() >> 2, MVT::i32).getNode();
Scott Michel266bc8f2007-12-04 22:23:35 +00001053}
1054
Scott Michel21213e72009-01-06 23:10:38 +00001055static SDValue
Dan Gohman475871a2008-07-27 21:46:04 +00001056LowerCALL(SDValue Op, SelectionDAG &DAG, const SPUSubtarget *ST) {
Dan Gohman095cc292008-09-13 01:54:27 +00001057 CallSDNode *TheCall = cast<CallSDNode>(Op.getNode());
1058 SDValue Chain = TheCall->getChain();
Dan Gohman095cc292008-09-13 01:54:27 +00001059 SDValue Callee = TheCall->getCallee();
1060 unsigned NumOps = TheCall->getNumArgs();
Scott Michel266bc8f2007-12-04 22:23:35 +00001061 unsigned StackSlotSize = SPUFrameInfo::stackSlotSize();
1062 const unsigned *ArgRegs = SPURegisterInfo::getArgRegs();
1063 const unsigned NumArgRegs = SPURegisterInfo::getNumArgRegs();
Dale Johannesen33c960f2009-02-04 20:06:27 +00001064 DebugLoc dl = TheCall->getDebugLoc();
Scott Michel266bc8f2007-12-04 22:23:35 +00001065
1066 // Handy pointer type
Duncan Sands83ec4b62008-06-06 12:08:01 +00001067 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel5af8f0e2008-07-16 17:17:29 +00001068
Scott Michel266bc8f2007-12-04 22:23:35 +00001069 // Accumulate how many bytes are to be pushed on the stack, including the
1070 // linkage area, and parameter passing area. According to the SPU ABI,
1071 // we minimally need space for [LR] and [SP]
1072 unsigned NumStackBytes = SPUFrameInfo::minStackSize();
Scott Michel5af8f0e2008-07-16 17:17:29 +00001073
Scott Michel266bc8f2007-12-04 22:23:35 +00001074 // Set up a copy of the stack pointer for use loading and storing any
1075 // arguments that may not fit in the registers available for argument
1076 // passing.
Dan Gohman475871a2008-07-27 21:46:04 +00001077 SDValue StackPtr = DAG.getRegister(SPU::R1, MVT::i32);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001078
Scott Michel266bc8f2007-12-04 22:23:35 +00001079 // Figure out which arguments are going to go in registers, and which in
1080 // memory.
1081 unsigned ArgOffset = SPUFrameInfo::minStackSize(); // Just below [LR]
1082 unsigned ArgRegIdx = 0;
1083
1084 // Keep track of registers passing arguments
Dan Gohman475871a2008-07-27 21:46:04 +00001085 std::vector<std::pair<unsigned, SDValue> > RegsToPass;
Scott Michel266bc8f2007-12-04 22:23:35 +00001086 // And the arguments passed on the stack
Dan Gohman475871a2008-07-27 21:46:04 +00001087 SmallVector<SDValue, 8> MemOpChains;
Scott Michel266bc8f2007-12-04 22:23:35 +00001088
1089 for (unsigned i = 0; i != NumOps; ++i) {
Dan Gohman095cc292008-09-13 01:54:27 +00001090 SDValue Arg = TheCall->getArg(i);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001091
Scott Michel266bc8f2007-12-04 22:23:35 +00001092 // PtrOff will be used to store the current argument to the stack if a
1093 // register cannot be found for it.
Dan Gohman475871a2008-07-27 21:46:04 +00001094 SDValue PtrOff = DAG.getConstant(ArgOffset, StackPtr.getValueType());
Dale Johannesen33c960f2009-02-04 20:06:27 +00001095 PtrOff = DAG.getNode(ISD::ADD, dl, PtrVT, StackPtr, PtrOff);
Scott Michel266bc8f2007-12-04 22:23:35 +00001096
Duncan Sands83ec4b62008-06-06 12:08:01 +00001097 switch (Arg.getValueType().getSimpleVT()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001098 default: assert(0 && "Unexpected ValueType for argument!");
Scott Micheldd950092009-01-06 03:36:14 +00001099 case MVT::i8:
1100 case MVT::i16:
Scott Michel266bc8f2007-12-04 22:23:35 +00001101 case MVT::i32:
1102 case MVT::i64:
1103 case MVT::i128:
1104 if (ArgRegIdx != NumArgRegs) {
1105 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1106 } else {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001107 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001108 ArgOffset += StackSlotSize;
Scott Michel266bc8f2007-12-04 22:23:35 +00001109 }
1110 break;
1111 case MVT::f32:
1112 case MVT::f64:
1113 if (ArgRegIdx != NumArgRegs) {
1114 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1115 } else {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001116 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001117 ArgOffset += StackSlotSize;
Scott Michel266bc8f2007-12-04 22:23:35 +00001118 }
1119 break;
Scott Michelcc188272008-12-04 21:01:44 +00001120 case MVT::v2i64:
1121 case MVT::v2f64:
Scott Michel266bc8f2007-12-04 22:23:35 +00001122 case MVT::v4f32:
1123 case MVT::v4i32:
1124 case MVT::v8i16:
1125 case MVT::v16i8:
1126 if (ArgRegIdx != NumArgRegs) {
1127 RegsToPass.push_back(std::make_pair(ArgRegs[ArgRegIdx++], Arg));
1128 } else {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001129 MemOpChains.push_back(DAG.getStore(Chain, dl, Arg, PtrOff, NULL, 0));
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001130 ArgOffset += StackSlotSize;
Scott Michel266bc8f2007-12-04 22:23:35 +00001131 }
1132 break;
1133 }
1134 }
1135
1136 // Update number of stack bytes actually used, insert a call sequence start
1137 NumStackBytes = (ArgOffset - SPUFrameInfo::minStackSize());
Chris Lattnere563bbc2008-10-11 22:08:30 +00001138 Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumStackBytes,
1139 true));
Scott Michel266bc8f2007-12-04 22:23:35 +00001140
1141 if (!MemOpChains.empty()) {
1142 // Adjust the stack pointer for the stack arguments.
Dale Johannesen33c960f2009-02-04 20:06:27 +00001143 Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
Scott Michel266bc8f2007-12-04 22:23:35 +00001144 &MemOpChains[0], MemOpChains.size());
1145 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001146
Scott Michel266bc8f2007-12-04 22:23:35 +00001147 // Build a sequence of copy-to-reg nodes chained together with token chain
1148 // and flag operands which copy the outgoing args into the appropriate regs.
Dan Gohman475871a2008-07-27 21:46:04 +00001149 SDValue InFlag;
Scott Michel266bc8f2007-12-04 22:23:35 +00001150 for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i) {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001151 Chain = DAG.getCopyToReg(Chain, dl, RegsToPass[i].first,
1152 RegsToPass[i].second, InFlag);
Scott Michel266bc8f2007-12-04 22:23:35 +00001153 InFlag = Chain.getValue(1);
1154 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001155
Dan Gohman475871a2008-07-27 21:46:04 +00001156 SmallVector<SDValue, 8> Ops;
Scott Michel266bc8f2007-12-04 22:23:35 +00001157 unsigned CallOpc = SPUISD::CALL;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001158
Bill Wendling056292f2008-09-16 21:48:12 +00001159 // If the callee is a GlobalAddress/ExternalSymbol node (quite common, every
1160 // direct call is) turn it into a TargetGlobalAddress/TargetExternalSymbol
1161 // node so that legalize doesn't hack it.
Scott Michel19fd42a2008-11-11 03:06:06 +00001162 if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee)) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001163 GlobalValue *GV = G->getGlobal();
Duncan Sands83ec4b62008-06-06 12:08:01 +00001164 MVT CalleeVT = Callee.getValueType();
Dan Gohman475871a2008-07-27 21:46:04 +00001165 SDValue Zero = DAG.getConstant(0, PtrVT);
1166 SDValue GA = DAG.getTargetGlobalAddress(GV, CalleeVT);
Scott Michel266bc8f2007-12-04 22:23:35 +00001167
Scott Michel9de5d0d2008-01-11 02:53:15 +00001168 if (!ST->usingLargeMem()) {
1169 // Turn calls to targets that are defined (i.e., have bodies) into BRSL
1170 // style calls, otherwise, external symbols are BRASL calls. This assumes
1171 // that declared/defined symbols are in the same compilation unit and can
1172 // be reached through PC-relative jumps.
1173 //
1174 // NOTE:
1175 // This may be an unsafe assumption for JIT and really large compilation
1176 // units.
1177 if (GV->isDeclaration()) {
1178 Callee = DAG.getNode(SPUISD::AFormAddr, CalleeVT, GA, Zero);
1179 } else {
1180 Callee = DAG.getNode(SPUISD::PCRelAddr, CalleeVT, GA, Zero);
1181 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001182 } else {
Scott Michel9de5d0d2008-01-11 02:53:15 +00001183 // "Large memory" mode: Turn all calls into indirect calls with a X-form
1184 // address pairs:
Scott Michel053c1da2008-01-29 02:16:57 +00001185 Callee = DAG.getNode(SPUISD::IndirectAddr, PtrVT, GA, Zero);
Scott Michel266bc8f2007-12-04 22:23:35 +00001186 }
Scott Michel1df30c42008-12-29 03:23:36 +00001187 } else if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(Callee)) {
1188 MVT CalleeVT = Callee.getValueType();
1189 SDValue Zero = DAG.getConstant(0, PtrVT);
1190 SDValue ExtSym = DAG.getTargetExternalSymbol(S->getSymbol(),
1191 Callee.getValueType());
1192
1193 if (!ST->usingLargeMem()) {
1194 Callee = DAG.getNode(SPUISD::AFormAddr, CalleeVT, ExtSym, Zero);
1195 } else {
1196 Callee = DAG.getNode(SPUISD::IndirectAddr, PtrVT, ExtSym, Zero);
1197 }
1198 } else if (SDNode *Dest = isLSAAddress(Callee, DAG)) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001199 // If this is an absolute destination address that appears to be a legal
1200 // local store address, use the munged value.
Dan Gohman475871a2008-07-27 21:46:04 +00001201 Callee = SDValue(Dest, 0);
Scott Michel9de5d0d2008-01-11 02:53:15 +00001202 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001203
1204 Ops.push_back(Chain);
1205 Ops.push_back(Callee);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001206
Scott Michel266bc8f2007-12-04 22:23:35 +00001207 // Add argument registers to the end of the list so that they are known live
1208 // into the call.
1209 for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i)
Scott Michel5af8f0e2008-07-16 17:17:29 +00001210 Ops.push_back(DAG.getRegister(RegsToPass[i].first,
Scott Michel266bc8f2007-12-04 22:23:35 +00001211 RegsToPass[i].second.getValueType()));
Scott Michel5af8f0e2008-07-16 17:17:29 +00001212
Gabor Greifba36cb52008-08-28 21:40:38 +00001213 if (InFlag.getNode())
Scott Michel266bc8f2007-12-04 22:23:35 +00001214 Ops.push_back(InFlag);
Duncan Sands4bdcb612008-07-02 17:40:58 +00001215 // Returns a chain and a flag for retval copy to use.
Dale Johannesen33c960f2009-02-04 20:06:27 +00001216 Chain = DAG.getNode(CallOpc, dl, DAG.getVTList(MVT::Other, MVT::Flag),
Duncan Sands4bdcb612008-07-02 17:40:58 +00001217 &Ops[0], Ops.size());
Scott Michel266bc8f2007-12-04 22:23:35 +00001218 InFlag = Chain.getValue(1);
1219
Chris Lattnere563bbc2008-10-11 22:08:30 +00001220 Chain = DAG.getCALLSEQ_END(Chain, DAG.getIntPtrConstant(NumStackBytes, true),
1221 DAG.getIntPtrConstant(0, true), InFlag);
Dan Gohman095cc292008-09-13 01:54:27 +00001222 if (TheCall->getValueType(0) != MVT::Other)
Evan Chengebaaa912008-02-05 22:44:06 +00001223 InFlag = Chain.getValue(1);
1224
Dan Gohman475871a2008-07-27 21:46:04 +00001225 SDValue ResultVals[3];
Scott Michel266bc8f2007-12-04 22:23:35 +00001226 unsigned NumResults = 0;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001227
Scott Michel266bc8f2007-12-04 22:23:35 +00001228 // If the call has results, copy the values out of the ret val registers.
Dan Gohman095cc292008-09-13 01:54:27 +00001229 switch (TheCall->getValueType(0).getSimpleVT()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001230 default: assert(0 && "Unexpected ret value!");
1231 case MVT::Other: break;
1232 case MVT::i32:
Dan Gohman095cc292008-09-13 01:54:27 +00001233 if (TheCall->getValueType(1) == MVT::i32) {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001234 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R4,
1235 MVT::i32, InFlag).getValue(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00001236 ResultVals[0] = Chain.getValue(0);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001237 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i32,
Scott Michel266bc8f2007-12-04 22:23:35 +00001238 Chain.getValue(2)).getValue(1);
1239 ResultVals[1] = Chain.getValue(0);
1240 NumResults = 2;
Scott Michel266bc8f2007-12-04 22:23:35 +00001241 } else {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001242 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i32,
1243 InFlag).getValue(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00001244 ResultVals[0] = Chain.getValue(0);
1245 NumResults = 1;
1246 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001247 break;
1248 case MVT::i64:
Dale Johannesen33c960f2009-02-04 20:06:27 +00001249 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i64,
1250 InFlag).getValue(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00001251 ResultVals[0] = Chain.getValue(0);
1252 NumResults = 1;
Scott Michel266bc8f2007-12-04 22:23:35 +00001253 break;
Scott Micheldd950092009-01-06 03:36:14 +00001254 case MVT::i128:
Dale Johannesen33c960f2009-02-04 20:06:27 +00001255 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, MVT::i128,
1256 InFlag).getValue(1);
Scott Micheldd950092009-01-06 03:36:14 +00001257 ResultVals[0] = Chain.getValue(0);
1258 NumResults = 1;
1259 break;
Scott Michel266bc8f2007-12-04 22:23:35 +00001260 case MVT::f32:
1261 case MVT::f64:
Dale Johannesen33c960f2009-02-04 20:06:27 +00001262 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, TheCall->getValueType(0),
Scott Michel266bc8f2007-12-04 22:23:35 +00001263 InFlag).getValue(1);
1264 ResultVals[0] = Chain.getValue(0);
1265 NumResults = 1;
Scott Michel266bc8f2007-12-04 22:23:35 +00001266 break;
1267 case MVT::v2f64:
Scott Michelcc188272008-12-04 21:01:44 +00001268 case MVT::v2i64:
Scott Michel266bc8f2007-12-04 22:23:35 +00001269 case MVT::v4f32:
1270 case MVT::v4i32:
1271 case MVT::v8i16:
1272 case MVT::v16i8:
Dale Johannesen33c960f2009-02-04 20:06:27 +00001273 Chain = DAG.getCopyFromReg(Chain, dl, SPU::R3, TheCall->getValueType(0),
Scott Michel266bc8f2007-12-04 22:23:35 +00001274 InFlag).getValue(1);
1275 ResultVals[0] = Chain.getValue(0);
1276 NumResults = 1;
Scott Michel266bc8f2007-12-04 22:23:35 +00001277 break;
1278 }
Duncan Sands4bdcb612008-07-02 17:40:58 +00001279
Scott Michel266bc8f2007-12-04 22:23:35 +00001280 // If the function returns void, just return the chain.
1281 if (NumResults == 0)
1282 return Chain;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001283
Scott Michel266bc8f2007-12-04 22:23:35 +00001284 // Otherwise, merge everything together with a MERGE_VALUES node.
1285 ResultVals[NumResults++] = Chain;
Dale Johannesen33c960f2009-02-04 20:06:27 +00001286 SDValue Res = DAG.getMergeValues(ResultVals, NumResults, dl);
Gabor Greif99a6cb92008-08-26 22:36:50 +00001287 return Res.getValue(Op.getResNo());
Scott Michel266bc8f2007-12-04 22:23:35 +00001288}
1289
Dan Gohman475871a2008-07-27 21:46:04 +00001290static SDValue
1291LowerRET(SDValue Op, SelectionDAG &DAG, TargetMachine &TM) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001292 SmallVector<CCValAssign, 16> RVLocs;
1293 unsigned CC = DAG.getMachineFunction().getFunction()->getCallingConv();
1294 bool isVarArg = DAG.getMachineFunction().getFunction()->isVarArg();
1295 CCState CCInfo(CC, isVarArg, TM, RVLocs);
Gabor Greifba36cb52008-08-28 21:40:38 +00001296 CCInfo.AnalyzeReturn(Op.getNode(), RetCC_SPU);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001297
Scott Michel266bc8f2007-12-04 22:23:35 +00001298 // If this is the first return lowered for this function, add the regs to the
1299 // liveout set for the function.
Chris Lattner84bc5422007-12-31 04:13:23 +00001300 if (DAG.getMachineFunction().getRegInfo().liveout_empty()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001301 for (unsigned i = 0; i != RVLocs.size(); ++i)
Chris Lattner84bc5422007-12-31 04:13:23 +00001302 DAG.getMachineFunction().getRegInfo().addLiveOut(RVLocs[i].getLocReg());
Scott Michel266bc8f2007-12-04 22:23:35 +00001303 }
1304
Dan Gohman475871a2008-07-27 21:46:04 +00001305 SDValue Chain = Op.getOperand(0);
1306 SDValue Flag;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001307
Scott Michel266bc8f2007-12-04 22:23:35 +00001308 // Copy the result values into the output registers.
1309 for (unsigned i = 0; i != RVLocs.size(); ++i) {
1310 CCValAssign &VA = RVLocs[i];
1311 assert(VA.isRegLoc() && "Can only return in registers!");
1312 Chain = DAG.getCopyToReg(Chain, VA.getLocReg(), Op.getOperand(i*2+1), Flag);
1313 Flag = Chain.getValue(1);
1314 }
1315
Gabor Greifba36cb52008-08-28 21:40:38 +00001316 if (Flag.getNode())
Scott Michel266bc8f2007-12-04 22:23:35 +00001317 return DAG.getNode(SPUISD::RET_FLAG, MVT::Other, Chain, Flag);
1318 else
1319 return DAG.getNode(SPUISD::RET_FLAG, MVT::Other, Chain);
1320}
1321
1322
1323//===----------------------------------------------------------------------===//
1324// Vector related lowering:
1325//===----------------------------------------------------------------------===//
1326
1327static ConstantSDNode *
1328getVecImm(SDNode *N) {
Dan Gohman475871a2008-07-27 21:46:04 +00001329 SDValue OpVal(0, 0);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001330
Scott Michel266bc8f2007-12-04 22:23:35 +00001331 // Check to see if this buildvec has a single non-undef value in its elements.
1332 for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
1333 if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue;
Gabor Greifba36cb52008-08-28 21:40:38 +00001334 if (OpVal.getNode() == 0)
Scott Michel266bc8f2007-12-04 22:23:35 +00001335 OpVal = N->getOperand(i);
1336 else if (OpVal != N->getOperand(i))
1337 return 0;
1338 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001339
Gabor Greifba36cb52008-08-28 21:40:38 +00001340 if (OpVal.getNode() != 0) {
Scott Michel19fd42a2008-11-11 03:06:06 +00001341 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001342 return CN;
1343 }
1344 }
1345
1346 return 0; // All UNDEF: use implicit def.; not Constant node
1347}
1348
1349/// get_vec_i18imm - Test if this vector is a vector filled with the same value
1350/// and the value fits into an unsigned 18-bit constant, and if so, return the
1351/// constant
Dan Gohman475871a2008-07-27 21:46:04 +00001352SDValue SPU::get_vec_u18imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001353 MVT ValueType) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001354 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001355 uint64_t Value = CN->getZExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001356 if (ValueType == MVT::i64) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001357 uint64_t UValue = CN->getZExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001358 uint32_t upper = uint32_t(UValue >> 32);
1359 uint32_t lower = uint32_t(UValue);
1360 if (upper != lower)
Dan Gohman475871a2008-07-27 21:46:04 +00001361 return SDValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001362 Value = Value >> 32;
1363 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001364 if (Value <= 0x3ffff)
Dan Gohmanfa210d82008-11-05 02:06:09 +00001365 return DAG.getTargetConstant(Value, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001366 }
1367
Dan Gohman475871a2008-07-27 21:46:04 +00001368 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001369}
1370
1371/// get_vec_i16imm - Test if this vector is a vector filled with the same value
1372/// and the value fits into a signed 16-bit constant, and if so, return the
1373/// constant
Dan Gohman475871a2008-07-27 21:46:04 +00001374SDValue SPU::get_vec_i16imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001375 MVT ValueType) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001376 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman7810bfe2008-09-26 21:54:37 +00001377 int64_t Value = CN->getSExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001378 if (ValueType == MVT::i64) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001379 uint64_t UValue = CN->getZExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001380 uint32_t upper = uint32_t(UValue >> 32);
1381 uint32_t lower = uint32_t(UValue);
1382 if (upper != lower)
Dan Gohman475871a2008-07-27 21:46:04 +00001383 return SDValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001384 Value = Value >> 32;
1385 }
Scott Michelad2715e2008-03-05 23:02:02 +00001386 if (Value >= -(1 << 15) && Value <= ((1 << 15) - 1)) {
Dan Gohmanfa210d82008-11-05 02:06:09 +00001387 return DAG.getTargetConstant(Value, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001388 }
1389 }
1390
Dan Gohman475871a2008-07-27 21:46:04 +00001391 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001392}
1393
1394/// get_vec_i10imm - Test if this vector is a vector filled with the same value
1395/// and the value fits into a signed 10-bit constant, and if so, return the
1396/// constant
Dan Gohman475871a2008-07-27 21:46:04 +00001397SDValue SPU::get_vec_i10imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001398 MVT ValueType) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001399 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohman7810bfe2008-09-26 21:54:37 +00001400 int64_t Value = CN->getSExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001401 if (ValueType == MVT::i64) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001402 uint64_t UValue = CN->getZExtValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001403 uint32_t upper = uint32_t(UValue >> 32);
1404 uint32_t lower = uint32_t(UValue);
1405 if (upper != lower)
Dan Gohman475871a2008-07-27 21:46:04 +00001406 return SDValue();
Scott Michel4cb8bd82008-03-06 04:02:54 +00001407 Value = Value >> 32;
1408 }
Scott Michelad2715e2008-03-05 23:02:02 +00001409 if (isS10Constant(Value))
Dan Gohmanfa210d82008-11-05 02:06:09 +00001410 return DAG.getTargetConstant(Value, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001411 }
1412
Dan Gohman475871a2008-07-27 21:46:04 +00001413 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001414}
1415
1416/// get_vec_i8imm - Test if this vector is a vector filled with the same value
1417/// and the value fits into a signed 8-bit constant, and if so, return the
1418/// constant.
1419///
1420/// @note: The incoming vector is v16i8 because that's the only way we can load
1421/// constant vectors. Thus, we test to see if the upper and lower bytes are the
1422/// same value.
Dan Gohman475871a2008-07-27 21:46:04 +00001423SDValue SPU::get_vec_i8imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001424 MVT ValueType) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001425 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001426 int Value = (int) CN->getZExtValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001427 if (ValueType == MVT::i16
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001428 && Value <= 0xffff /* truncated from uint64_t */
1429 && ((short) Value >> 8) == ((short) Value & 0xff))
Dan Gohmanfa210d82008-11-05 02:06:09 +00001430 return DAG.getTargetConstant(Value & 0xff, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001431 else if (ValueType == MVT::i8
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001432 && (Value & 0xff) == Value)
Dan Gohmanfa210d82008-11-05 02:06:09 +00001433 return DAG.getTargetConstant(Value, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001434 }
1435
Dan Gohman475871a2008-07-27 21:46:04 +00001436 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001437}
1438
1439/// get_ILHUvec_imm - Test if this vector is a vector filled with the same value
1440/// and the value fits into a signed 16-bit constant, and if so, return the
1441/// constant
Dan Gohman475871a2008-07-27 21:46:04 +00001442SDValue SPU::get_ILHUvec_imm(SDNode *N, SelectionDAG &DAG,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001443 MVT ValueType) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001444 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001445 uint64_t Value = CN->getZExtValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001446 if ((ValueType == MVT::i32
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001447 && ((unsigned) Value & 0xffff0000) == (unsigned) Value)
1448 || (ValueType == MVT::i64 && (Value & 0xffff0000) == Value))
Dan Gohmanfa210d82008-11-05 02:06:09 +00001449 return DAG.getTargetConstant(Value >> 16, ValueType);
Scott Michel266bc8f2007-12-04 22:23:35 +00001450 }
1451
Dan Gohman475871a2008-07-27 21:46:04 +00001452 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001453}
1454
1455/// get_v4i32_imm - Catch-all for general 32-bit constant vectors
Dan Gohman475871a2008-07-27 21:46:04 +00001456SDValue SPU::get_v4i32_imm(SDNode *N, SelectionDAG &DAG) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001457 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanfa210d82008-11-05 02:06:09 +00001458 return DAG.getTargetConstant((unsigned) CN->getZExtValue(), MVT::i32);
Scott Michel266bc8f2007-12-04 22:23:35 +00001459 }
1460
Dan Gohman475871a2008-07-27 21:46:04 +00001461 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001462}
1463
1464/// get_v4i32_imm - Catch-all for general 64-bit constant vectors
Dan Gohman475871a2008-07-27 21:46:04 +00001465SDValue SPU::get_v2i64_imm(SDNode *N, SelectionDAG &DAG) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001466 if (ConstantSDNode *CN = getVecImm(N)) {
Dan Gohmanfa210d82008-11-05 02:06:09 +00001467 return DAG.getTargetConstant((unsigned) CN->getZExtValue(), MVT::i64);
Scott Michel266bc8f2007-12-04 22:23:35 +00001468 }
1469
Dan Gohman475871a2008-07-27 21:46:04 +00001470 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001471}
1472
1473// If this is a vector of constants or undefs, get the bits. A bit in
Scott Michel5af8f0e2008-07-16 17:17:29 +00001474// UndefBits is set if the corresponding element of the vector is an
Scott Michel266bc8f2007-12-04 22:23:35 +00001475// ISD::UNDEF value. For undefs, the corresponding VectorBits values are
1476// zero. Return true if this is not an array of constants, false if it is.
1477//
1478static bool GetConstantBuildVectorBits(SDNode *BV, uint64_t VectorBits[2],
1479 uint64_t UndefBits[2]) {
1480 // Start with zero'd results.
1481 VectorBits[0] = VectorBits[1] = UndefBits[0] = UndefBits[1] = 0;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001482
Duncan Sands83ec4b62008-06-06 12:08:01 +00001483 unsigned EltBitSize = BV->getOperand(0).getValueType().getSizeInBits();
Scott Michel266bc8f2007-12-04 22:23:35 +00001484 for (unsigned i = 0, e = BV->getNumOperands(); i != e; ++i) {
Dan Gohman475871a2008-07-27 21:46:04 +00001485 SDValue OpVal = BV->getOperand(i);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001486
Scott Michel266bc8f2007-12-04 22:23:35 +00001487 unsigned PartNo = i >= e/2; // In the upper 128 bits?
1488 unsigned SlotNo = e/2 - (i & (e/2-1))-1; // Which subpiece of the uint64_t.
1489
1490 uint64_t EltBits = 0;
1491 if (OpVal.getOpcode() == ISD::UNDEF) {
1492 uint64_t EltUndefBits = ~0ULL >> (64-EltBitSize);
1493 UndefBits[PartNo] |= EltUndefBits << (SlotNo*EltBitSize);
1494 continue;
Scott Michel19fd42a2008-11-11 03:06:06 +00001495 } else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001496 EltBits = CN->getZExtValue() & (~0ULL >> (64-EltBitSize));
Scott Michel19fd42a2008-11-11 03:06:06 +00001497 } else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal)) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001498 const APFloat &apf = CN->getValueAPF();
1499 EltBits = (CN->getValueType(0) == MVT::f32
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001500 ? FloatToBits(apf.convertToFloat())
1501 : DoubleToBits(apf.convertToDouble()));
Scott Michel266bc8f2007-12-04 22:23:35 +00001502 } else {
1503 // Nonconstant element.
1504 return true;
1505 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001506
Scott Michel266bc8f2007-12-04 22:23:35 +00001507 VectorBits[PartNo] |= EltBits << (SlotNo*EltBitSize);
1508 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001509
1510 //printf("%llx %llx %llx %llx\n",
Scott Michel266bc8f2007-12-04 22:23:35 +00001511 // VectorBits[0], VectorBits[1], UndefBits[0], UndefBits[1]);
1512 return false;
1513}
1514
/// isConstantSplat - Test whether a 128-bit constant is a splat (repetition)
/// of a value that is at most \p MinSplatBits wide, ignoring undefined bits.
///
/// The vector is halved repeatedly (128 -> 64 -> 32 -> 16 -> 8 bits). At each
/// step the two halves must agree on every bit that is defined in both. The
/// halving stops once the piece is no wider than \p MinSplatBits (rounded up
/// to 8, 16, 32 or 64); that piece is reported. For example,
/// "0x01010101010101..." with MinSplatBits = 8 yields SplatBits = 0x01 and
/// SplatSize = 1 byte, while with MinSplatBits = 32 it yields
/// SplatBits = 0x01010101 and SplatSize = 4.
///
/// \param Bits128      Constant bits of the two 64-bit halves; bits of
///                     undefined elements are expected to be zero.
/// \param Undef128     Mask of undefined bits for the two 64-bit halves.
/// \param MinSplatBits Smallest splat width, in bits, the caller accepts.
/// \param SplatBits    [out] The splatted value, merged from all pieces.
/// \param SplatUndef   [out] Bits of the splat value that are undefined in
///                     every piece.
/// \param SplatSize    [out] Size of the splat value in bytes (1, 2, 4 or 8).
/// \return true if the constant is a splat at the requested width; the output
///         parameters are only written in that case.
///
/// \note The 64-bit case reports the value merged from both halves. It used
/// to report Bits128[0]/Undef128[0] verbatim, which produced SplatBits == 0
/// for a vector such as <undef, X> whose first half is entirely undefined.
static bool isConstantSplat(const uint64_t Bits128[2],
                            const uint64_t Undef128[2],
                            int MinSplatBits,
                            uint64_t &SplatBits, uint64_t &SplatUndef,
                            int &SplatSize) {
  // Fold the vector in half at each width. Constant bits are OR-ed together
  // (undefined bits are zero), undef masks are AND-ed so that a bit stays
  // undefined only if it is undefined in every piece.
  const uint64_t Bits64 = Bits128[0] | Bits128[1];
  const uint64_t Undef64 = Undef128[0] & Undef128[1];
  const uint32_t Bits32 = uint32_t(Bits64) | uint32_t(Bits64 >> 32);
  const uint32_t Undef32 = uint32_t(Undef64) & uint32_t(Undef64 >> 32);
  const uint16_t Bits16 = uint16_t(Bits32) | uint16_t(Bits32 >> 16);
  const uint16_t Undef16 = uint16_t(Undef32) & uint16_t(Undef32 >> 16);

  // The top 64 bits must match the lower 64 bits, ignoring undefs.
  if ((Bits128[0] & ~Undef128[1]) != (Bits128[1] & ~Undef128[0]))
    return false;

  if (MinSplatBits >= 64) {
    SplatBits = Bits64;
    SplatUndef = Undef64;
    SplatSize = 8;
    return true;
  }

  // The top 32 bits must match the lower 32 bits, ignoring undefs.
  if ((Bits64 & (~Undef64 >> 32)) != ((Bits64 >> 32) & ~Undef64))
    return false;

  if (MinSplatBits >= 32) {
    SplatBits = Bits32;
    SplatUndef = Undef32;
    SplatSize = 4;
    return true;
  }

  // The top 16 bits must match the lower 16 bits, ignoring undefs.
  if ((Bits32 & (~Undef32 >> 16)) != ((Bits32 >> 16) & ~Undef32))
    return false;

  if (MinSplatBits >= 16) {
    SplatBits = Bits16;
    SplatUndef = Undef16;
    SplatSize = 2;
    return true;
  }

  // The top 8 bits must match the lower 8 bits, ignoring undefs.
  if ((Bits16 & (uint16_t(~Undef16) >> 8)) != ((Bits16 >> 8) & ~Undef16))
    return false;

  SplatBits = uint8_t(Bits16) | uint8_t(Bits16 >> 8);
  SplatUndef = uint8_t(Undef16) & uint8_t(Undef16 >> 8);
  SplatSize = 1;
  return true;
}
1579
Scott Micheld1e8d9c2009-01-21 04:58:48 +00001580//! Lower a BUILD_VECTOR instruction creatively:
1581SDValue
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001582LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00001583 MVT VT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +00001584 // If this is a vector of constants or undefs, get the bits. A bit in
Scott Michel5af8f0e2008-07-16 17:17:29 +00001585 // UndefBits is set if the corresponding element of the vector is an
Scott Michel266bc8f2007-12-04 22:23:35 +00001586 // ISD::UNDEF value. For undefs, the corresponding VectorBits values are
Scott Michel5af8f0e2008-07-16 17:17:29 +00001587 // zero.
Scott Michel266bc8f2007-12-04 22:23:35 +00001588 uint64_t VectorBits[2];
1589 uint64_t UndefBits[2];
1590 uint64_t SplatBits, SplatUndef;
1591 int SplatSize;
Gabor Greifba36cb52008-08-28 21:40:38 +00001592 if (GetConstantBuildVectorBits(Op.getNode(), VectorBits, UndefBits)
Scott Michel266bc8f2007-12-04 22:23:35 +00001593 || !isConstantSplat(VectorBits, UndefBits,
Duncan Sands83ec4b62008-06-06 12:08:01 +00001594 VT.getVectorElementType().getSizeInBits(),
Scott Michel266bc8f2007-12-04 22:23:35 +00001595 SplatBits, SplatUndef, SplatSize))
Dan Gohman475871a2008-07-27 21:46:04 +00001596 return SDValue(); // Not a constant vector, not a splat.
Scott Michel5af8f0e2008-07-16 17:17:29 +00001597
Duncan Sands83ec4b62008-06-06 12:08:01 +00001598 switch (VT.getSimpleVT()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001599 default:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00001600 cerr << "CellSPU: Unhandled VT in LowerBUILD_VECTOR, VT = "
1601 << VT.getMVTString()
1602 << "\n";
1603 abort();
1604 /*NOTREACHED*/
Scott Michel266bc8f2007-12-04 22:23:35 +00001605 case MVT::v4f32: {
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001606 uint32_t Value32 = uint32_t(SplatBits);
Scott Michel266bc8f2007-12-04 22:23:35 +00001607 assert(SplatSize == 4
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001608 && "LowerBUILD_VECTOR: Unexpected floating point vector element.");
Scott Michel266bc8f2007-12-04 22:23:35 +00001609 // NOTE: pretend the constant is an integer. LLVM won't load FP constants
Dan Gohman475871a2008-07-27 21:46:04 +00001610 SDValue T = DAG.getConstant(Value32, MVT::i32);
Scott Michel266bc8f2007-12-04 22:23:35 +00001611 return DAG.getNode(ISD::BIT_CONVERT, MVT::v4f32,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001612 DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32, T, T, T, T));
Scott Michel266bc8f2007-12-04 22:23:35 +00001613 break;
1614 }
1615 case MVT::v2f64: {
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001616 uint64_t f64val = uint64_t(SplatBits);
Scott Michel266bc8f2007-12-04 22:23:35 +00001617 assert(SplatSize == 8
Scott Michel104de432008-11-24 17:11:17 +00001618 && "LowerBUILD_VECTOR: 64-bit float vector size > 8 bytes.");
Scott Michel266bc8f2007-12-04 22:23:35 +00001619 // NOTE: pretend the constant is an integer. LLVM won't load FP constants
Dan Gohman475871a2008-07-27 21:46:04 +00001620 SDValue T = DAG.getConstant(f64val, MVT::i64);
Scott Michel266bc8f2007-12-04 22:23:35 +00001621 return DAG.getNode(ISD::BIT_CONVERT, MVT::v2f64,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001622 DAG.getNode(ISD::BUILD_VECTOR, MVT::v2i64, T, T));
Scott Michel266bc8f2007-12-04 22:23:35 +00001623 break;
1624 }
1625 case MVT::v16i8: {
1626 // 8-bit constants have to be expanded to 16-bits
1627 unsigned short Value16 = SplatBits | (SplatBits << 8);
Dan Gohman475871a2008-07-27 21:46:04 +00001628 SDValue Ops[8];
Scott Michel266bc8f2007-12-04 22:23:35 +00001629 for (int i = 0; i < 8; ++i)
1630 Ops[i] = DAG.getConstant(Value16, MVT::i16);
1631 return DAG.getNode(ISD::BIT_CONVERT, VT,
1632 DAG.getNode(ISD::BUILD_VECTOR, MVT::v8i16, Ops, 8));
1633 }
1634 case MVT::v8i16: {
1635 unsigned short Value16;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001636 if (SplatSize == 2)
Scott Michel266bc8f2007-12-04 22:23:35 +00001637 Value16 = (unsigned short) (SplatBits & 0xffff);
1638 else
1639 Value16 = (unsigned short) (SplatBits | (SplatBits << 8));
Dan Gohman475871a2008-07-27 21:46:04 +00001640 SDValue T = DAG.getConstant(Value16, VT.getVectorElementType());
1641 SDValue Ops[8];
Scott Michel266bc8f2007-12-04 22:23:35 +00001642 for (int i = 0; i < 8; ++i) Ops[i] = T;
1643 return DAG.getNode(ISD::BUILD_VECTOR, VT, Ops, 8);
1644 }
1645 case MVT::v4i32: {
1646 unsigned int Value = SplatBits;
Dan Gohman475871a2008-07-27 21:46:04 +00001647 SDValue T = DAG.getConstant(Value, VT.getVectorElementType());
Scott Michel266bc8f2007-12-04 22:23:35 +00001648 return DAG.getNode(ISD::BUILD_VECTOR, VT, T, T, T, T);
1649 }
Scott Michel21213e72009-01-06 23:10:38 +00001650 case MVT::v2i32: {
1651 unsigned int Value = SplatBits;
1652 SDValue T = DAG.getConstant(Value, VT.getVectorElementType());
1653 return DAG.getNode(ISD::BUILD_VECTOR, VT, T, T);
1654 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001655 case MVT::v2i64: {
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001656 return SPU::LowerSplat_v2i64(VT, DAG, SplatBits);
Scott Michel266bc8f2007-12-04 22:23:35 +00001657 }
1658 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001659
Dan Gohman475871a2008-07-27 21:46:04 +00001660 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001661}
1662
Scott Michelc9c8b2a2009-01-26 03:31:40 +00001663SDValue
1664SPU::LowerSplat_v2i64(MVT OpVT, SelectionDAG& DAG, uint64_t SplatVal) {
1665 uint32_t upper = uint32_t(SplatVal >> 32);
1666 uint32_t lower = uint32_t(SplatVal);
1667
1668 if (upper == lower) {
1669 // Magic constant that can be matched by IL, ILA, et. al.
1670 SDValue Val = DAG.getTargetConstant(upper, MVT::i32);
1671 return DAG.getNode(ISD::BIT_CONVERT, OpVT,
1672 DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32,
1673 Val, Val, Val, Val));
1674 } else {
1675 SDValue LO32;
1676 SDValue HI32;
1677 SmallVector<SDValue, 16> ShufBytes;
1678 SDValue Result;
1679 bool upper_special, lower_special;
1680
1681 // NOTE: This code creates common-case shuffle masks that can be easily
1682 // detected as common expressions. It is not attempting to create highly
1683 // specialized masks to replace any and all 0's, 0xff's and 0x80's.
1684
1685 // Detect if the upper or lower half is a special shuffle mask pattern:
1686 upper_special = (upper == 0 || upper == 0xffffffff || upper == 0x80000000);
1687 lower_special = (lower == 0 || lower == 0xffffffff || lower == 0x80000000);
1688
1689 // Create lower vector if not a special pattern
1690 if (!lower_special) {
1691 SDValue LO32C = DAG.getConstant(lower, MVT::i32);
1692 LO32 = DAG.getNode(ISD::BIT_CONVERT, OpVT,
1693 DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32,
1694 LO32C, LO32C, LO32C, LO32C));
1695 }
1696
1697 // Create upper vector if not a special pattern
1698 if (!upper_special) {
1699 SDValue HI32C = DAG.getConstant(upper, MVT::i32);
1700 HI32 = DAG.getNode(ISD::BIT_CONVERT, OpVT,
1701 DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32,
1702 HI32C, HI32C, HI32C, HI32C));
1703 }
1704
1705 // If either upper or lower are special, then the two input operands are
1706 // the same (basically, one of them is a "don't care")
1707 if (lower_special)
1708 LO32 = HI32;
1709 if (upper_special)
1710 HI32 = LO32;
1711 if (lower_special && upper_special) {
1712 // Unhappy situation... both upper and lower are special, so punt with
1713 // a target constant:
1714 SDValue Zero = DAG.getConstant(0, MVT::i32);
1715 HI32 = LO32 = DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32, Zero, Zero,
1716 Zero, Zero);
1717 }
1718
1719 for (int i = 0; i < 4; ++i) {
1720 uint64_t val = 0;
1721 for (int j = 0; j < 4; ++j) {
1722 SDValue V;
1723 bool process_upper, process_lower;
1724 val <<= 8;
1725 process_upper = (upper_special && (i & 1) == 0);
1726 process_lower = (lower_special && (i & 1) == 1);
1727
1728 if (process_upper || process_lower) {
1729 if ((process_upper && upper == 0)
1730 || (process_lower && lower == 0))
1731 val |= 0x80;
1732 else if ((process_upper && upper == 0xffffffff)
1733 || (process_lower && lower == 0xffffffff))
1734 val |= 0xc0;
1735 else if ((process_upper && upper == 0x80000000)
1736 || (process_lower && lower == 0x80000000))
1737 val |= (j == 0 ? 0xe0 : 0x80);
1738 } else
1739 val |= i * 4 + j + ((i & 1) * 16);
1740 }
1741
1742 ShufBytes.push_back(DAG.getConstant(val, MVT::i32));
1743 }
1744
1745 return DAG.getNode(SPUISD::SHUFB, OpVT, HI32, LO32,
1746 DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32,
1747 &ShufBytes[0], ShufBytes.size()));
1748 }
1749}
1750
Scott Michel266bc8f2007-12-04 22:23:35 +00001751/// LowerVECTOR_SHUFFLE - Lower a vector shuffle (V1, V2, V3) to something on
1752/// which the Cell can operate. The code inspects V3 to ascertain whether the
1753/// permutation vector, V3, is monotonically increasing with one "exception"
1754/// element, e.g., (0, 1, _, 3). If this is the case, then generate a
Scott Michel7a1c9e92008-11-22 23:50:42 +00001755/// SHUFFLE_MASK synthetic instruction. Otherwise, spill V3 to the constant pool.
Scott Michel266bc8f2007-12-04 22:23:35 +00001756/// In either case, the net result is going to eventually invoke SHUFB to
1757/// permute/shuffle the bytes from V1 and V2.
1758/// \note
Scott Michel7a1c9e92008-11-22 23:50:42 +00001759/// SHUFFLE_MASK is eventually selected as one of the C*D instructions, generate
Scott Michel266bc8f2007-12-04 22:23:35 +00001760/// control word for byte/halfword/word insertion. This takes care of a single
1761/// element move from V2 into V1.
1762/// \note
1763/// SPUISD::SHUFB is eventually selected as Cell's <i>shufb</i> instructions.
Dan Gohman475871a2008-07-27 21:46:04 +00001764static SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) {
1765 SDValue V1 = Op.getOperand(0);
1766 SDValue V2 = Op.getOperand(1);
1767 SDValue PermMask = Op.getOperand(2);
Scott Michel5af8f0e2008-07-16 17:17:29 +00001768
Scott Michel266bc8f2007-12-04 22:23:35 +00001769 if (V2.getOpcode() == ISD::UNDEF) V2 = V1;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001770
Scott Michel266bc8f2007-12-04 22:23:35 +00001771 // If we have a single element being moved from V1 to V2, this can be handled
1772 // using the C*[DX] compute mask instructions, but the vector elements have
1773 // to be monotonically increasing with one exception element.
Scott Michelcc188272008-12-04 21:01:44 +00001774 MVT VecVT = V1.getValueType();
1775 MVT EltVT = VecVT.getVectorElementType();
Scott Michel266bc8f2007-12-04 22:23:35 +00001776 unsigned EltsFromV2 = 0;
1777 unsigned V2Elt = 0;
1778 unsigned V2EltIdx0 = 0;
1779 unsigned CurrElt = 0;
Scott Michelcc188272008-12-04 21:01:44 +00001780 unsigned MaxElts = VecVT.getVectorNumElements();
1781 unsigned PrevElt = 0;
1782 unsigned V0Elt = 0;
Scott Michel266bc8f2007-12-04 22:23:35 +00001783 bool monotonic = true;
Scott Michelcc188272008-12-04 21:01:44 +00001784 bool rotate = true;
1785
1786 if (EltVT == MVT::i8) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001787 V2EltIdx0 = 16;
Scott Michelcc188272008-12-04 21:01:44 +00001788 } else if (EltVT == MVT::i16) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001789 V2EltIdx0 = 8;
Scott Michelcc188272008-12-04 21:01:44 +00001790 } else if (EltVT == MVT::i32 || EltVT == MVT::f32) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001791 V2EltIdx0 = 4;
Scott Michelcc188272008-12-04 21:01:44 +00001792 } else if (EltVT == MVT::i64 || EltVT == MVT::f64) {
1793 V2EltIdx0 = 2;
1794 } else
Scott Michel266bc8f2007-12-04 22:23:35 +00001795 assert(0 && "Unhandled vector type in LowerVECTOR_SHUFFLE");
1796
Scott Michelcc188272008-12-04 21:01:44 +00001797 for (unsigned i = 0; i != PermMask.getNumOperands(); ++i) {
1798 if (PermMask.getOperand(i).getOpcode() != ISD::UNDEF) {
1799 unsigned SrcElt = cast<ConstantSDNode > (PermMask.getOperand(i))->getZExtValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001800
Scott Michelcc188272008-12-04 21:01:44 +00001801 if (monotonic) {
1802 if (SrcElt >= V2EltIdx0) {
1803 if (1 >= (++EltsFromV2)) {
1804 V2Elt = (V2EltIdx0 - SrcElt) << 2;
1805 }
1806 } else if (CurrElt != SrcElt) {
1807 monotonic = false;
1808 }
1809
1810 ++CurrElt;
1811 }
1812
1813 if (rotate) {
1814 if (PrevElt > 0 && SrcElt < MaxElts) {
1815 if ((PrevElt == SrcElt - 1)
1816 || (PrevElt == MaxElts - 1 && SrcElt == 0)) {
1817 PrevElt = SrcElt;
1818 if (SrcElt == 0)
1819 V0Elt = i;
1820 } else {
1821 rotate = false;
1822 }
1823 } else if (PrevElt == 0) {
1824 // First time through, need to keep track of previous element
1825 PrevElt = SrcElt;
1826 } else {
1827 // This isn't a rotation, takes elements from vector 2
1828 rotate = false;
1829 }
1830 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001831 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001832 }
1833
1834 if (EltsFromV2 == 1 && monotonic) {
1835 // Compute mask and shuffle
1836 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner84bc5422007-12-31 04:13:23 +00001837 MachineRegisterInfo &RegInfo = MF.getRegInfo();
1838 unsigned VReg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
Duncan Sands83ec4b62008-06-06 12:08:01 +00001839 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel266bc8f2007-12-04 22:23:35 +00001840 // Initialize temporary register to 0
Dan Gohman475871a2008-07-27 21:46:04 +00001841 SDValue InitTempReg =
Scott Michel266bc8f2007-12-04 22:23:35 +00001842 DAG.getCopyToReg(DAG.getEntryNode(), VReg, DAG.getConstant(0, PtrVT));
Scott Michel7a1c9e92008-11-22 23:50:42 +00001843 // Copy register's contents as index in SHUFFLE_MASK:
Dan Gohman475871a2008-07-27 21:46:04 +00001844 SDValue ShufMaskOp =
Scott Michel1a6cdb62008-12-01 17:56:02 +00001845 DAG.getNode(SPUISD::SHUFFLE_MASK, MVT::v4i32,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001846 DAG.getTargetConstant(V2Elt, MVT::i32),
1847 DAG.getCopyFromReg(InitTempReg, VReg, PtrVT));
Scott Michel266bc8f2007-12-04 22:23:35 +00001848 // Use shuffle mask in SHUFB synthetic instruction:
1849 return DAG.getNode(SPUISD::SHUFB, V1.getValueType(), V2, V1, ShufMaskOp);
Scott Michelcc188272008-12-04 21:01:44 +00001850 } else if (rotate) {
1851 int rotamt = (MaxElts - V0Elt) * EltVT.getSizeInBits()/8;
Scott Michel1df30c42008-12-29 03:23:36 +00001852
Scott Michelcc188272008-12-04 21:01:44 +00001853 return DAG.getNode(SPUISD::ROTBYTES_LEFT, V1.getValueType(),
1854 V1, DAG.getConstant(rotamt, MVT::i16));
Scott Michel266bc8f2007-12-04 22:23:35 +00001855 } else {
Gabor Greif93c53e52008-08-31 15:37:04 +00001856 // Convert the SHUFFLE_VECTOR mask's input element units to the
1857 // actual bytes.
Duncan Sands83ec4b62008-06-06 12:08:01 +00001858 unsigned BytesPerElement = EltVT.getSizeInBits()/8;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001859
Dan Gohman475871a2008-07-27 21:46:04 +00001860 SmallVector<SDValue, 16> ResultMask;
Scott Michel266bc8f2007-12-04 22:23:35 +00001861 for (unsigned i = 0, e = PermMask.getNumOperands(); i != e; ++i) {
1862 unsigned SrcElt;
1863 if (PermMask.getOperand(i).getOpcode() == ISD::UNDEF)
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001864 SrcElt = 0;
Scott Michel5af8f0e2008-07-16 17:17:29 +00001865 else
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001866 SrcElt = cast<ConstantSDNode>(PermMask.getOperand(i))->getZExtValue();
Scott Michel5af8f0e2008-07-16 17:17:29 +00001867
Scott Michela59d4692008-02-23 18:41:37 +00001868 for (unsigned j = 0; j < BytesPerElement; ++j) {
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001869 ResultMask.push_back(DAG.getConstant(SrcElt*BytesPerElement+j,
1870 MVT::i8));
Scott Michel266bc8f2007-12-04 22:23:35 +00001871 }
1872 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00001873
Dan Gohman475871a2008-07-27 21:46:04 +00001874 SDValue VPermMask = DAG.getNode(ISD::BUILD_VECTOR, MVT::v16i8,
Scott Michel1a6cdb62008-12-01 17:56:02 +00001875 &ResultMask[0], ResultMask.size());
Scott Michel266bc8f2007-12-04 22:23:35 +00001876 return DAG.getNode(SPUISD::SHUFB, V1.getValueType(), V1, V2, VPermMask);
1877 }
1878}
1879
Dan Gohman475871a2008-07-27 21:46:04 +00001880static SDValue LowerSCALAR_TO_VECTOR(SDValue Op, SelectionDAG &DAG) {
1881 SDValue Op0 = Op.getOperand(0); // Op0 = the scalar
Scott Michel266bc8f2007-12-04 22:23:35 +00001882
Gabor Greifba36cb52008-08-28 21:40:38 +00001883 if (Op0.getNode()->getOpcode() == ISD::Constant) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001884 // For a constant, build the appropriate constant vector, which will
1885 // eventually simplify to a vector register load.
1886
Gabor Greifba36cb52008-08-28 21:40:38 +00001887 ConstantSDNode *CN = cast<ConstantSDNode>(Op0.getNode());
Dan Gohman475871a2008-07-27 21:46:04 +00001888 SmallVector<SDValue, 16> ConstVecValues;
Duncan Sands83ec4b62008-06-06 12:08:01 +00001889 MVT VT;
Scott Michel266bc8f2007-12-04 22:23:35 +00001890 size_t n_copies;
1891
1892 // Create a constant vector:
Duncan Sands83ec4b62008-06-06 12:08:01 +00001893 switch (Op.getValueType().getSimpleVT()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001894 default: assert(0 && "Unexpected constant value type in "
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001895 "LowerSCALAR_TO_VECTOR");
Scott Michel266bc8f2007-12-04 22:23:35 +00001896 case MVT::v16i8: n_copies = 16; VT = MVT::i8; break;
1897 case MVT::v8i16: n_copies = 8; VT = MVT::i16; break;
1898 case MVT::v4i32: n_copies = 4; VT = MVT::i32; break;
1899 case MVT::v4f32: n_copies = 4; VT = MVT::f32; break;
1900 case MVT::v2i64: n_copies = 2; VT = MVT::i64; break;
1901 case MVT::v2f64: n_copies = 2; VT = MVT::f64; break;
1902 }
1903
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001904 SDValue CValue = DAG.getConstant(CN->getZExtValue(), VT);
Scott Michel266bc8f2007-12-04 22:23:35 +00001905 for (size_t j = 0; j < n_copies; ++j)
1906 ConstVecValues.push_back(CValue);
1907
1908 return DAG.getNode(ISD::BUILD_VECTOR, Op.getValueType(),
Scott Michel7f9ba9b2008-01-30 02:55:46 +00001909 &ConstVecValues[0], ConstVecValues.size());
Scott Michel266bc8f2007-12-04 22:23:35 +00001910 } else {
1911 // Otherwise, copy the value from one register to another:
Duncan Sands83ec4b62008-06-06 12:08:01 +00001912 switch (Op0.getValueType().getSimpleVT()) {
Scott Michel266bc8f2007-12-04 22:23:35 +00001913 default: assert(0 && "Unexpected value type in LowerSCALAR_TO_VECTOR");
1914 case MVT::i8:
1915 case MVT::i16:
1916 case MVT::i32:
1917 case MVT::i64:
1918 case MVT::f32:
1919 case MVT::f64:
Scott Michelf0569be2008-12-27 04:51:36 +00001920 return DAG.getNode(SPUISD::PREFSLOT2VEC, Op.getValueType(), Op0, Op0);
Scott Michel266bc8f2007-12-04 22:23:35 +00001921 }
1922 }
1923
Dan Gohman475871a2008-07-27 21:46:04 +00001924 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001925}
1926
Dan Gohman475871a2008-07-27 21:46:04 +00001927static SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00001928 MVT VT = Op.getValueType();
Dan Gohman475871a2008-07-27 21:46:04 +00001929 SDValue N = Op.getOperand(0);
1930 SDValue Elt = Op.getOperand(1);
Scott Michel7a1c9e92008-11-22 23:50:42 +00001931 SDValue retval;
Scott Michel266bc8f2007-12-04 22:23:35 +00001932
Scott Michel7a1c9e92008-11-22 23:50:42 +00001933 if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Elt)) {
1934 // Constant argument:
1935 int EltNo = (int) C->getZExtValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00001936
Scott Michel7a1c9e92008-11-22 23:50:42 +00001937 // sanity checks:
1938 if (VT == MVT::i8 && EltNo >= 16)
1939 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i8 extraction slot > 15");
1940 else if (VT == MVT::i16 && EltNo >= 8)
1941 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i16 extraction slot > 7");
1942 else if (VT == MVT::i32 && EltNo >= 4)
1943 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i32 extraction slot > 4");
1944 else if (VT == MVT::i64 && EltNo >= 2)
1945 assert(0 && "SPU LowerEXTRACT_VECTOR_ELT: i64 extraction slot > 2");
Scott Michel266bc8f2007-12-04 22:23:35 +00001946
Scott Michel7a1c9e92008-11-22 23:50:42 +00001947 if (EltNo == 0 && (VT == MVT::i32 || VT == MVT::i64)) {
1948 // i32 and i64: Element 0 is the preferred slot
Scott Michel104de432008-11-24 17:11:17 +00001949 return DAG.getNode(SPUISD::VEC2PREFSLOT, VT, N);
Scott Michel7a1c9e92008-11-22 23:50:42 +00001950 }
Scott Michel266bc8f2007-12-04 22:23:35 +00001951
Scott Michel7a1c9e92008-11-22 23:50:42 +00001952 // Need to generate shuffle mask and extract:
1953 int prefslot_begin = -1, prefslot_end = -1;
1954 int elt_byte = EltNo * VT.getSizeInBits() / 8;
1955
1956 switch (VT.getSimpleVT()) {
1957 default:
1958 assert(false && "Invalid value type!");
1959 case MVT::i8: {
1960 prefslot_begin = prefslot_end = 3;
1961 break;
1962 }
1963 case MVT::i16: {
1964 prefslot_begin = 2; prefslot_end = 3;
1965 break;
1966 }
1967 case MVT::i32:
1968 case MVT::f32: {
1969 prefslot_begin = 0; prefslot_end = 3;
1970 break;
1971 }
1972 case MVT::i64:
1973 case MVT::f64: {
1974 prefslot_begin = 0; prefslot_end = 7;
1975 break;
1976 }
1977 }
1978
1979 assert(prefslot_begin != -1 && prefslot_end != -1 &&
1980 "LowerEXTRACT_VECTOR_ELT: preferred slots uninitialized");
1981
1982 unsigned int ShufBytes[16];
1983 for (int i = 0; i < 16; ++i) {
1984 // zero fill uppper part of preferred slot, don't care about the
1985 // other slots:
1986 unsigned int mask_val;
1987 if (i <= prefslot_end) {
1988 mask_val =
1989 ((i < prefslot_begin)
1990 ? 0x80
1991 : elt_byte + (i - prefslot_begin));
1992
1993 ShufBytes[i] = mask_val;
1994 } else
1995 ShufBytes[i] = ShufBytes[i % (prefslot_end + 1)];
1996 }
1997
1998 SDValue ShufMask[4];
1999 for (unsigned i = 0; i < sizeof(ShufMask)/sizeof(ShufMask[0]); ++i) {
Scott Michelcc188272008-12-04 21:01:44 +00002000 unsigned bidx = i * 4;
Scott Michel7a1c9e92008-11-22 23:50:42 +00002001 unsigned int bits = ((ShufBytes[bidx] << 24) |
2002 (ShufBytes[bidx+1] << 16) |
2003 (ShufBytes[bidx+2] << 8) |
2004 ShufBytes[bidx+3]);
2005 ShufMask[i] = DAG.getConstant(bits, MVT::i32);
2006 }
2007
2008 SDValue ShufMaskVec = DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32,
2009 &ShufMask[0],
2010 sizeof(ShufMask) / sizeof(ShufMask[0]));
2011
Scott Michel104de432008-11-24 17:11:17 +00002012 retval = DAG.getNode(SPUISD::VEC2PREFSLOT, VT,
Scott Michel7a1c9e92008-11-22 23:50:42 +00002013 DAG.getNode(SPUISD::SHUFB, N.getValueType(),
2014 N, N, ShufMaskVec));
2015 } else {
2016 // Variable index: Rotate the requested element into slot 0, then replicate
2017 // slot 0 across the vector
2018 MVT VecVT = N.getValueType();
2019 if (!VecVT.isSimple() || !VecVT.isVector() || !VecVT.is128BitVector()) {
2020 cerr << "LowerEXTRACT_VECTOR_ELT: Must have a simple, 128-bit vector type!\n";
2021 abort();
2022 }
2023
2024 // Make life easier by making sure the index is zero-extended to i32
2025 if (Elt.getValueType() != MVT::i32)
2026 Elt = DAG.getNode(ISD::ZERO_EXTEND, MVT::i32, Elt);
2027
2028 // Scale the index to a bit/byte shift quantity
2029 APInt scaleFactor =
Scott Michel104de432008-11-24 17:11:17 +00002030 APInt(32, uint64_t(16 / N.getValueType().getVectorNumElements()), false);
2031 unsigned scaleShift = scaleFactor.logBase2();
Scott Michel7a1c9e92008-11-22 23:50:42 +00002032 SDValue vecShift;
Scott Michel7a1c9e92008-11-22 23:50:42 +00002033
Scott Michel104de432008-11-24 17:11:17 +00002034 if (scaleShift > 0) {
2035 // Scale the shift factor:
Scott Michel7a1c9e92008-11-22 23:50:42 +00002036 Elt = DAG.getNode(ISD::SHL, MVT::i32, Elt,
Scott Michel1a6cdb62008-12-01 17:56:02 +00002037 DAG.getConstant(scaleShift, MVT::i32));
Scott Michel7a1c9e92008-11-22 23:50:42 +00002038 }
2039
Scott Michel104de432008-11-24 17:11:17 +00002040 vecShift = DAG.getNode(SPUISD::SHLQUAD_L_BYTES, VecVT, N, Elt);
2041
2042 // Replicate the bytes starting at byte 0 across the entire vector (for
2043 // consistency with the notion of a unified register set)
Scott Michel7a1c9e92008-11-22 23:50:42 +00002044 SDValue replicate;
2045
2046 switch (VT.getSimpleVT()) {
2047 default:
2048 cerr << "LowerEXTRACT_VECTOR_ELT(varable): Unhandled vector type\n";
2049 abort();
2050 /*NOTREACHED*/
2051 case MVT::i8: {
Scott Michel104de432008-11-24 17:11:17 +00002052 SDValue factor = DAG.getConstant(0x00000000, MVT::i32);
Scott Michel7a1c9e92008-11-22 23:50:42 +00002053 replicate = DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32, factor, factor,
2054 factor, factor);
2055 break;
2056 }
2057 case MVT::i16: {
Scott Michel104de432008-11-24 17:11:17 +00002058 SDValue factor = DAG.getConstant(0x00010001, MVT::i32);
Scott Michel7a1c9e92008-11-22 23:50:42 +00002059 replicate = DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32, factor, factor,
2060 factor, factor);
2061 break;
2062 }
2063 case MVT::i32:
2064 case MVT::f32: {
2065 SDValue factor = DAG.getConstant(0x00010203, MVT::i32);
2066 replicate = DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32, factor, factor,
2067 factor, factor);
2068 break;
2069 }
2070 case MVT::i64:
2071 case MVT::f64: {
2072 SDValue loFactor = DAG.getConstant(0x00010203, MVT::i32);
2073 SDValue hiFactor = DAG.getConstant(0x04050607, MVT::i32);
2074 replicate = DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32, loFactor, hiFactor,
2075 loFactor, hiFactor);
2076 break;
2077 }
2078 }
2079
Scott Michel104de432008-11-24 17:11:17 +00002080 retval = DAG.getNode(SPUISD::VEC2PREFSLOT, VT,
Scott Michel1a6cdb62008-12-01 17:56:02 +00002081 DAG.getNode(SPUISD::SHUFB, VecVT,
2082 vecShift, vecShift, replicate));
Scott Michel266bc8f2007-12-04 22:23:35 +00002083 }
2084
Scott Michel7a1c9e92008-11-22 23:50:42 +00002085 return retval;
Scott Michel266bc8f2007-12-04 22:23:35 +00002086}
2087
Dan Gohman475871a2008-07-27 21:46:04 +00002088static SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) {
2089 SDValue VecOp = Op.getOperand(0);
2090 SDValue ValOp = Op.getOperand(1);
2091 SDValue IdxOp = Op.getOperand(2);
Duncan Sands83ec4b62008-06-06 12:08:01 +00002092 MVT VT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +00002093
2094 ConstantSDNode *CN = cast<ConstantSDNode>(IdxOp);
2095 assert(CN != 0 && "LowerINSERT_VECTOR_ELT: Index is not constant!");
2096
Duncan Sands83ec4b62008-06-06 12:08:01 +00002097 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Scott Michel1a6cdb62008-12-01 17:56:02 +00002098 // Use $sp ($1) because it's always 16-byte aligned and it's available:
2099 SDValue Pointer = DAG.getNode(SPUISD::IndirectAddr, PtrVT,
2100 DAG.getRegister(SPU::R1, PtrVT),
2101 DAG.getConstant(CN->getSExtValue(), PtrVT));
2102 SDValue ShufMask = DAG.getNode(SPUISD::SHUFFLE_MASK, VT, Pointer);
Scott Michel266bc8f2007-12-04 22:23:35 +00002103
Dan Gohman475871a2008-07-27 21:46:04 +00002104 SDValue result =
Scott Michel266bc8f2007-12-04 22:23:35 +00002105 DAG.getNode(SPUISD::SHUFB, VT,
2106 DAG.getNode(ISD::SCALAR_TO_VECTOR, VT, ValOp),
Scott Michel1df30c42008-12-29 03:23:36 +00002107 VecOp,
Scott Michel19c10e62009-01-26 03:37:41 +00002108 DAG.getNode(ISD::BIT_CONVERT, MVT::v4i32, ShufMask));
Scott Michel266bc8f2007-12-04 22:23:35 +00002109
2110 return result;
2111}
2112
Scott Michelf0569be2008-12-27 04:51:36 +00002113static SDValue LowerI8Math(SDValue Op, SelectionDAG &DAG, unsigned Opc,
2114 const TargetLowering &TLI)
Scott Michela59d4692008-02-23 18:41:37 +00002115{
Dan Gohman475871a2008-07-27 21:46:04 +00002116 SDValue N0 = Op.getOperand(0); // Everything has at least one operand
Scott Michelf0569be2008-12-27 04:51:36 +00002117 MVT ShiftVT = TLI.getShiftAmountTy();
Scott Michel266bc8f2007-12-04 22:23:35 +00002118
2119 assert(Op.getValueType() == MVT::i8);
2120 switch (Opc) {
2121 default:
2122 assert(0 && "Unhandled i8 math operator");
2123 /*NOTREACHED*/
2124 break;
Scott Michel02d711b2008-12-30 23:28:25 +00002125 case ISD::ADD: {
2126 // 8-bit addition: Promote the arguments up to 16-bits and truncate
2127 // the result:
2128 SDValue N1 = Op.getOperand(1);
2129 N0 = DAG.getNode(ISD::SIGN_EXTEND, MVT::i16, N0);
2130 N1 = DAG.getNode(ISD::SIGN_EXTEND, MVT::i16, N1);
2131 return DAG.getNode(ISD::TRUNCATE, MVT::i8,
2132 DAG.getNode(Opc, MVT::i16, N0, N1));
2133
2134 }
2135
Scott Michel266bc8f2007-12-04 22:23:35 +00002136 case ISD::SUB: {
2137 // 8-bit subtraction: Promote the arguments up to 16-bits and truncate
2138 // the result:
Dan Gohman475871a2008-07-27 21:46:04 +00002139 SDValue N1 = Op.getOperand(1);
Scott Michel02d711b2008-12-30 23:28:25 +00002140 N0 = DAG.getNode(ISD::SIGN_EXTEND, MVT::i16, N0);
2141 N1 = DAG.getNode(ISD::SIGN_EXTEND, MVT::i16, N1);
Scott Michel5af8f0e2008-07-16 17:17:29 +00002142 return DAG.getNode(ISD::TRUNCATE, MVT::i8,
Scott Michel266bc8f2007-12-04 22:23:35 +00002143 DAG.getNode(Opc, MVT::i16, N0, N1));
Scott Michel5af8f0e2008-07-16 17:17:29 +00002144 }
Scott Michel266bc8f2007-12-04 22:23:35 +00002145 case ISD::ROTR:
2146 case ISD::ROTL: {
Dan Gohman475871a2008-07-27 21:46:04 +00002147 SDValue N1 = Op.getOperand(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00002148 unsigned N1Opc;
2149 N0 = (N0.getOpcode() != ISD::Constant
2150 ? DAG.getNode(ISD::ZERO_EXTEND, MVT::i16, N0)
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002151 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
2152 MVT::i16));
Scott Michelf0569be2008-12-27 04:51:36 +00002153 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greif93c53e52008-08-31 15:37:04 +00002154 ? ISD::ZERO_EXTEND
2155 : ISD::TRUNCATE;
Scott Michel266bc8f2007-12-04 22:23:35 +00002156 N1 = (N1.getOpcode() != ISD::Constant
Scott Michelf0569be2008-12-27 04:51:36 +00002157 ? DAG.getNode(N1Opc, ShiftVT, N1)
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002158 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(),
Scott Michelf0569be2008-12-27 04:51:36 +00002159 TLI.getShiftAmountTy()));
Dan Gohman475871a2008-07-27 21:46:04 +00002160 SDValue ExpandArg =
Scott Michel266bc8f2007-12-04 22:23:35 +00002161 DAG.getNode(ISD::OR, MVT::i16, N0,
2162 DAG.getNode(ISD::SHL, MVT::i16,
Duncan Sandsfa7935f2008-10-30 19:24:28 +00002163 N0, DAG.getConstant(8, MVT::i32)));
Scott Michel5af8f0e2008-07-16 17:17:29 +00002164 return DAG.getNode(ISD::TRUNCATE, MVT::i8,
Scott Michel266bc8f2007-12-04 22:23:35 +00002165 DAG.getNode(Opc, MVT::i16, ExpandArg, N1));
2166 }
2167 case ISD::SRL:
2168 case ISD::SHL: {
Dan Gohman475871a2008-07-27 21:46:04 +00002169 SDValue N1 = Op.getOperand(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00002170 unsigned N1Opc;
2171 N0 = (N0.getOpcode() != ISD::Constant
2172 ? DAG.getNode(ISD::ZERO_EXTEND, MVT::i16, N0)
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002173 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
Scott Michelf0569be2008-12-27 04:51:36 +00002174 MVT::i32));
2175 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greif93c53e52008-08-31 15:37:04 +00002176 ? ISD::ZERO_EXTEND
2177 : ISD::TRUNCATE;
Scott Michel266bc8f2007-12-04 22:23:35 +00002178 N1 = (N1.getOpcode() != ISD::Constant
Scott Michelf0569be2008-12-27 04:51:36 +00002179 ? DAG.getNode(N1Opc, ShiftVT, N1)
2180 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(), ShiftVT));
Scott Michel5af8f0e2008-07-16 17:17:29 +00002181 return DAG.getNode(ISD::TRUNCATE, MVT::i8,
Scott Michel266bc8f2007-12-04 22:23:35 +00002182 DAG.getNode(Opc, MVT::i16, N0, N1));
2183 }
2184 case ISD::SRA: {
Dan Gohman475871a2008-07-27 21:46:04 +00002185 SDValue N1 = Op.getOperand(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00002186 unsigned N1Opc;
2187 N0 = (N0.getOpcode() != ISD::Constant
2188 ? DAG.getNode(ISD::SIGN_EXTEND, MVT::i16, N0)
Scott Michelf0569be2008-12-27 04:51:36 +00002189 : DAG.getConstant(cast<ConstantSDNode>(N0)->getSExtValue(),
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002190 MVT::i16));
Scott Michelf0569be2008-12-27 04:51:36 +00002191 N1Opc = N1.getValueType().bitsLT(ShiftVT)
Gabor Greif93c53e52008-08-31 15:37:04 +00002192 ? ISD::SIGN_EXTEND
2193 : ISD::TRUNCATE;
Scott Michel266bc8f2007-12-04 22:23:35 +00002194 N1 = (N1.getOpcode() != ISD::Constant
Scott Michelf0569be2008-12-27 04:51:36 +00002195 ? DAG.getNode(N1Opc, ShiftVT, N1)
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002196 : DAG.getConstant(cast<ConstantSDNode>(N1)->getZExtValue(),
Scott Michelf0569be2008-12-27 04:51:36 +00002197 ShiftVT));
Scott Michel5af8f0e2008-07-16 17:17:29 +00002198 return DAG.getNode(ISD::TRUNCATE, MVT::i8,
Scott Michel266bc8f2007-12-04 22:23:35 +00002199 DAG.getNode(Opc, MVT::i16, N0, N1));
2200 }
2201 case ISD::MUL: {
Dan Gohman475871a2008-07-27 21:46:04 +00002202 SDValue N1 = Op.getOperand(1);
Scott Michel266bc8f2007-12-04 22:23:35 +00002203 unsigned N1Opc;
2204 N0 = (N0.getOpcode() != ISD::Constant
2205 ? DAG.getNode(ISD::SIGN_EXTEND, MVT::i16, N0)
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002206 : DAG.getConstant(cast<ConstantSDNode>(N0)->getZExtValue(),
2207 MVT::i16));
Duncan Sands8e4eb092008-06-08 20:54:56 +00002208 N1Opc = N1.getValueType().bitsLT(MVT::i16) ? ISD::SIGN_EXTEND : ISD::TRUNCATE;
Scott Michel266bc8f2007-12-04 22:23:35 +00002209 N1 = (N1.getOpcode() != ISD::Constant
2210 ? DAG.getNode(N1Opc, MVT::i16, N1)
Scott Michelf0569be2008-12-27 04:51:36 +00002211 : DAG.getConstant(cast<ConstantSDNode>(N1)->getSExtValue(),
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002212 MVT::i16));
Scott Michel5af8f0e2008-07-16 17:17:29 +00002213 return DAG.getNode(ISD::TRUNCATE, MVT::i8,
Scott Michel266bc8f2007-12-04 22:23:35 +00002214 DAG.getNode(Opc, MVT::i16, N0, N1));
2215 break;
2216 }
2217 }
2218
Dan Gohman475871a2008-07-27 21:46:04 +00002219 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00002220}
2221
Scott Michel94bd57e2009-01-15 04:41:47 +00002222//! Generate the carry-generate shuffle mask.
2223SDValue SPU::getCarryGenerateShufMask(SelectionDAG &DAG) {
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002224 SmallVector<SDValue, 16 > ShufBytes;
Scott Michela59d4692008-02-23 18:41:37 +00002225
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002226 // Create the shuffle mask for "rotating" the borrow up one register slot
2227 // once the borrow is generated.
2228 ShufBytes.push_back(DAG.getConstant(0x04050607, MVT::i32));
2229 ShufBytes.push_back(DAG.getConstant(0x80808080, MVT::i32));
2230 ShufBytes.push_back(DAG.getConstant(0x0c0d0e0f, MVT::i32));
2231 ShufBytes.push_back(DAG.getConstant(0x80808080, MVT::i32));
Scott Michela59d4692008-02-23 18:41:37 +00002232
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002233 return DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32,
2234 &ShufBytes[0], ShufBytes.size());
Scott Michel94bd57e2009-01-15 04:41:47 +00002235}
Scott Michela59d4692008-02-23 18:41:37 +00002236
Scott Michel94bd57e2009-01-15 04:41:47 +00002237//! Generate the borrow-generate shuffle mask
2238SDValue SPU::getBorrowGenerateShufMask(SelectionDAG &DAG) {
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002239 SmallVector<SDValue, 16 > ShufBytes;
Scott Michela59d4692008-02-23 18:41:37 +00002240
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002241 // Create the shuffle mask for "rotating" the borrow up one register slot
2242 // once the borrow is generated.
2243 ShufBytes.push_back(DAG.getConstant(0x04050607, MVT::i32));
2244 ShufBytes.push_back(DAG.getConstant(0xc0c0c0c0, MVT::i32));
2245 ShufBytes.push_back(DAG.getConstant(0x0c0d0e0f, MVT::i32));
2246 ShufBytes.push_back(DAG.getConstant(0xc0c0c0c0, MVT::i32));
Scott Michel045a1452008-11-24 18:20:46 +00002247
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002248 return DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32,
2249 &ShufBytes[0], ShufBytes.size());
Scott Michela59d4692008-02-23 18:41:37 +00002250}
2251
Scott Michel266bc8f2007-12-04 22:23:35 +00002252//! Lower byte immediate operations for v16i8 vectors:
Dan Gohman475871a2008-07-27 21:46:04 +00002253static SDValue
2254LowerByteImmed(SDValue Op, SelectionDAG &DAG) {
2255 SDValue ConstVec;
2256 SDValue Arg;
Duncan Sands83ec4b62008-06-06 12:08:01 +00002257 MVT VT = Op.getValueType();
Scott Michel266bc8f2007-12-04 22:23:35 +00002258
2259 ConstVec = Op.getOperand(0);
2260 Arg = Op.getOperand(1);
Gabor Greifba36cb52008-08-28 21:40:38 +00002261 if (ConstVec.getNode()->getOpcode() != ISD::BUILD_VECTOR) {
2262 if (ConstVec.getNode()->getOpcode() == ISD::BIT_CONVERT) {
Scott Michel266bc8f2007-12-04 22:23:35 +00002263 ConstVec = ConstVec.getOperand(0);
2264 } else {
2265 ConstVec = Op.getOperand(1);
2266 Arg = Op.getOperand(0);
Gabor Greifba36cb52008-08-28 21:40:38 +00002267 if (ConstVec.getNode()->getOpcode() == ISD::BIT_CONVERT) {
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002268 ConstVec = ConstVec.getOperand(0);
Scott Michel266bc8f2007-12-04 22:23:35 +00002269 }
2270 }
2271 }
2272
Gabor Greifba36cb52008-08-28 21:40:38 +00002273 if (ConstVec.getNode()->getOpcode() == ISD::BUILD_VECTOR) {
Scott Michel266bc8f2007-12-04 22:23:35 +00002274 uint64_t VectorBits[2];
2275 uint64_t UndefBits[2];
2276 uint64_t SplatBits, SplatUndef;
2277 int SplatSize;
2278
Gabor Greifba36cb52008-08-28 21:40:38 +00002279 if (!GetConstantBuildVectorBits(ConstVec.getNode(), VectorBits, UndefBits)
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002280 && isConstantSplat(VectorBits, UndefBits,
Duncan Sands83ec4b62008-06-06 12:08:01 +00002281 VT.getVectorElementType().getSizeInBits(),
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002282 SplatBits, SplatUndef, SplatSize)) {
Dan Gohman475871a2008-07-27 21:46:04 +00002283 SDValue tcVec[16];
2284 SDValue tc = DAG.getTargetConstant(SplatBits & 0xff, MVT::i8);
Scott Michel266bc8f2007-12-04 22:23:35 +00002285 const size_t tcVecSize = sizeof(tcVec) / sizeof(tcVec[0]);
2286
2287 // Turn the BUILD_VECTOR into a set of target constants:
2288 for (size_t i = 0; i < tcVecSize; ++i)
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002289 tcVec[i] = tc;
Scott Michel266bc8f2007-12-04 22:23:35 +00002290
Gabor Greifba36cb52008-08-28 21:40:38 +00002291 return DAG.getNode(Op.getNode()->getOpcode(), VT, Arg,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002292 DAG.getNode(ISD::BUILD_VECTOR, VT, tcVec, tcVecSize));
Scott Michel266bc8f2007-12-04 22:23:35 +00002293 }
2294 }
Scott Michel9de57a92009-01-26 22:33:37 +00002295
Nate Begeman24dc3462008-07-29 19:07:27 +00002296 // These operations (AND, OR, XOR) are legal, they just couldn't be custom
2297 // lowered. Return the operation, rather than a null SDValue.
2298 return Op;
Scott Michel266bc8f2007-12-04 22:23:35 +00002299}
2300
Scott Michel266bc8f2007-12-04 22:23:35 +00002301//! Custom lowering for CTPOP (count population)
2302/*!
 Custom lowering code that counts the number of ones in the input
2304 operand. SPU has such an instruction, but it counts the number of
2305 ones per byte, which then have to be accumulated.
2306*/
Dan Gohman475871a2008-07-27 21:46:04 +00002307static SDValue LowerCTPOP(SDValue Op, SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00002308 MVT VT = Op.getValueType();
2309 MVT vecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits()));
Scott Michel266bc8f2007-12-04 22:23:35 +00002310
Duncan Sands83ec4b62008-06-06 12:08:01 +00002311 switch (VT.getSimpleVT()) {
2312 default:
2313 assert(false && "Invalid value type!");
Scott Michel266bc8f2007-12-04 22:23:35 +00002314 case MVT::i8: {
Dan Gohman475871a2008-07-27 21:46:04 +00002315 SDValue N = Op.getOperand(0);
2316 SDValue Elt0 = DAG.getConstant(0, MVT::i32);
Scott Michel266bc8f2007-12-04 22:23:35 +00002317
Scott Michelf0569be2008-12-27 04:51:36 +00002318 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, vecVT, N, N);
Dan Gohman475871a2008-07-27 21:46:04 +00002319 SDValue CNTB = DAG.getNode(SPUISD::CNTB, vecVT, Promote);
Scott Michel266bc8f2007-12-04 22:23:35 +00002320
2321 return DAG.getNode(ISD::EXTRACT_VECTOR_ELT, MVT::i8, CNTB, Elt0);
2322 }
2323
2324 case MVT::i16: {
2325 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner84bc5422007-12-31 04:13:23 +00002326 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Michel266bc8f2007-12-04 22:23:35 +00002327
Chris Lattner84bc5422007-12-31 04:13:23 +00002328 unsigned CNTB_reg = RegInfo.createVirtualRegister(&SPU::R16CRegClass);
Scott Michel266bc8f2007-12-04 22:23:35 +00002329
Dan Gohman475871a2008-07-27 21:46:04 +00002330 SDValue N = Op.getOperand(0);
2331 SDValue Elt0 = DAG.getConstant(0, MVT::i16);
2332 SDValue Mask0 = DAG.getConstant(0x0f, MVT::i16);
Duncan Sandsfa7935f2008-10-30 19:24:28 +00002333 SDValue Shift1 = DAG.getConstant(8, MVT::i32);
Scott Michel266bc8f2007-12-04 22:23:35 +00002334
Scott Michelf0569be2008-12-27 04:51:36 +00002335 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, vecVT, N, N);
Dan Gohman475871a2008-07-27 21:46:04 +00002336 SDValue CNTB = DAG.getNode(SPUISD::CNTB, vecVT, Promote);
Scott Michel266bc8f2007-12-04 22:23:35 +00002337
2338 // CNTB_result becomes the chain to which all of the virtual registers
2339 // CNTB_reg, SUM1_reg become associated:
Dan Gohman475871a2008-07-27 21:46:04 +00002340 SDValue CNTB_result =
Scott Michel266bc8f2007-12-04 22:23:35 +00002341 DAG.getNode(ISD::EXTRACT_VECTOR_ELT, MVT::i16, CNTB, Elt0);
Scott Michel5af8f0e2008-07-16 17:17:29 +00002342
Dan Gohman475871a2008-07-27 21:46:04 +00002343 SDValue CNTB_rescopy =
Scott Michel266bc8f2007-12-04 22:23:35 +00002344 DAG.getCopyToReg(CNTB_result, CNTB_reg, CNTB_result);
2345
Dan Gohman475871a2008-07-27 21:46:04 +00002346 SDValue Tmp1 = DAG.getCopyFromReg(CNTB_rescopy, CNTB_reg, MVT::i16);
Scott Michel266bc8f2007-12-04 22:23:35 +00002347
2348 return DAG.getNode(ISD::AND, MVT::i16,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002349 DAG.getNode(ISD::ADD, MVT::i16,
2350 DAG.getNode(ISD::SRL, MVT::i16,
2351 Tmp1, Shift1),
2352 Tmp1),
2353 Mask0);
Scott Michel266bc8f2007-12-04 22:23:35 +00002354 }
2355
2356 case MVT::i32: {
2357 MachineFunction &MF = DAG.getMachineFunction();
Chris Lattner84bc5422007-12-31 04:13:23 +00002358 MachineRegisterInfo &RegInfo = MF.getRegInfo();
Scott Michel266bc8f2007-12-04 22:23:35 +00002359
Chris Lattner84bc5422007-12-31 04:13:23 +00002360 unsigned CNTB_reg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
2361 unsigned SUM1_reg = RegInfo.createVirtualRegister(&SPU::R32CRegClass);
Scott Michel266bc8f2007-12-04 22:23:35 +00002362
Dan Gohman475871a2008-07-27 21:46:04 +00002363 SDValue N = Op.getOperand(0);
2364 SDValue Elt0 = DAG.getConstant(0, MVT::i32);
2365 SDValue Mask0 = DAG.getConstant(0xff, MVT::i32);
2366 SDValue Shift1 = DAG.getConstant(16, MVT::i32);
2367 SDValue Shift2 = DAG.getConstant(8, MVT::i32);
Scott Michel266bc8f2007-12-04 22:23:35 +00002368
Scott Michelf0569be2008-12-27 04:51:36 +00002369 SDValue Promote = DAG.getNode(SPUISD::PREFSLOT2VEC, vecVT, N, N);
Dan Gohman475871a2008-07-27 21:46:04 +00002370 SDValue CNTB = DAG.getNode(SPUISD::CNTB, vecVT, Promote);
Scott Michel266bc8f2007-12-04 22:23:35 +00002371
2372 // CNTB_result becomes the chain to which all of the virtual registers
2373 // CNTB_reg, SUM1_reg become associated:
Dan Gohman475871a2008-07-27 21:46:04 +00002374 SDValue CNTB_result =
Scott Michel266bc8f2007-12-04 22:23:35 +00002375 DAG.getNode(ISD::EXTRACT_VECTOR_ELT, MVT::i32, CNTB, Elt0);
Scott Michel5af8f0e2008-07-16 17:17:29 +00002376
Dan Gohman475871a2008-07-27 21:46:04 +00002377 SDValue CNTB_rescopy =
Scott Michel266bc8f2007-12-04 22:23:35 +00002378 DAG.getCopyToReg(CNTB_result, CNTB_reg, CNTB_result);
2379
Dan Gohman475871a2008-07-27 21:46:04 +00002380 SDValue Comp1 =
Scott Michel266bc8f2007-12-04 22:23:35 +00002381 DAG.getNode(ISD::SRL, MVT::i32,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002382 DAG.getCopyFromReg(CNTB_rescopy, CNTB_reg, MVT::i32), Shift1);
Scott Michel266bc8f2007-12-04 22:23:35 +00002383
Dan Gohman475871a2008-07-27 21:46:04 +00002384 SDValue Sum1 =
Scott Michel266bc8f2007-12-04 22:23:35 +00002385 DAG.getNode(ISD::ADD, MVT::i32,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002386 Comp1, DAG.getCopyFromReg(CNTB_rescopy, CNTB_reg, MVT::i32));
Scott Michel266bc8f2007-12-04 22:23:35 +00002387
Dan Gohman475871a2008-07-27 21:46:04 +00002388 SDValue Sum1_rescopy =
Scott Michel266bc8f2007-12-04 22:23:35 +00002389 DAG.getCopyToReg(CNTB_result, SUM1_reg, Sum1);
2390
Dan Gohman475871a2008-07-27 21:46:04 +00002391 SDValue Comp2 =
Scott Michel266bc8f2007-12-04 22:23:35 +00002392 DAG.getNode(ISD::SRL, MVT::i32,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002393 DAG.getCopyFromReg(Sum1_rescopy, SUM1_reg, MVT::i32),
2394 Shift2);
Dan Gohman475871a2008-07-27 21:46:04 +00002395 SDValue Sum2 =
Scott Michel266bc8f2007-12-04 22:23:35 +00002396 DAG.getNode(ISD::ADD, MVT::i32, Comp2,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00002397 DAG.getCopyFromReg(Sum1_rescopy, SUM1_reg, MVT::i32));
Scott Michel266bc8f2007-12-04 22:23:35 +00002398
2399 return DAG.getNode(ISD::AND, MVT::i32, Sum2, Mask0);
2400 }
2401
2402 case MVT::i64:
2403 break;
2404 }
2405
Dan Gohman475871a2008-07-27 21:46:04 +00002406 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00002407}
2408
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002409//! Lower ISD::FP_TO_SINT, ISD::FP_TO_UINT for i32
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002410/*!
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002411 f32->i32 passes through unchanged, whereas f64->i32 expands to a libcall.
2412 All conversions to i64 are expanded to a libcall.
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002413 */
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002414static SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG,
2415 SPUTargetLowering &TLI) {
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002416 MVT OpVT = Op.getValueType();
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002417 SDValue Op0 = Op.getOperand(0);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002418 MVT Op0VT = Op0.getValueType();
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002419
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002420 if ((OpVT == MVT::i32 && Op0VT == MVT::f64)
2421 || OpVT == MVT::i64) {
2422 // Convert f32 / f64 to i32 / i64 via libcall.
2423 RTLIB::Libcall LC =
2424 (Op.getOpcode() == ISD::FP_TO_SINT)
2425 ? RTLIB::getFPTOSINT(Op0VT, OpVT)
2426 : RTLIB::getFPTOUINT(Op0VT, OpVT);
2427 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unexpectd fp-to-int conversion!");
2428 SDValue Dummy;
2429 return ExpandLibCall(LC, Op, DAG, false, Dummy, TLI);
2430 }
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002431
Scott Michel9de57a92009-01-26 22:33:37 +00002432 return Op; // return unmolested, legalized op
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002433}
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002434
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002435//! Lower ISD::SINT_TO_FP, ISD::UINT_TO_FP for i32
2436/*!
2437 i32->f32 passes through unchanged, whereas i32->f64 is expanded to a libcall.
2438 All conversions from i64 are expanded to a libcall.
2439 */
2440static SDValue LowerINT_TO_FP(SDValue Op, SelectionDAG &DAG,
2441 SPUTargetLowering &TLI) {
2442 MVT OpVT = Op.getValueType();
2443 SDValue Op0 = Op.getOperand(0);
2444 MVT Op0VT = Op0.getValueType();
2445
2446 if ((OpVT == MVT::f64 && Op0VT == MVT::i32)
2447 || Op0VT == MVT::i64) {
2448 // Convert i32, i64 to f64 via libcall:
2449 RTLIB::Libcall LC =
2450 (Op.getOpcode() == ISD::SINT_TO_FP)
2451 ? RTLIB::getSINTTOFP(Op0VT, OpVT)
2452 : RTLIB::getUINTTOFP(Op0VT, OpVT);
2453 assert(LC != RTLIB::UNKNOWN_LIBCALL && "Unexpectd int-to-fp conversion!");
2454 SDValue Dummy;
2455 return ExpandLibCall(LC, Op, DAG, false, Dummy, TLI);
2456 }
2457
Scott Michel9de57a92009-01-26 22:33:37 +00002458 return Op; // return unmolested, legalized
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002459}
2460
2461//! Lower ISD::SETCC
2462/*!
2463 This handles MVT::f64 (double floating point) condition lowering
2464 */
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002465static SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG,
2466 const TargetLowering &TLI) {
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002467 CondCodeSDNode *CC = dyn_cast<CondCodeSDNode>(Op.getOperand(2));
Dale Johannesenf5d97892009-02-04 01:48:28 +00002468 DebugLoc dl = Op.getNode()->getDebugLoc();
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002469 assert(CC != 0 && "LowerSETCC: CondCodeSDNode should not be null here!\n");
2470
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002471 SDValue lhs = Op.getOperand(0);
2472 SDValue rhs = Op.getOperand(1);
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002473 MVT lhsVT = lhs.getValueType();
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002474 assert(lhsVT == MVT::f64 && "LowerSETCC: type other than MVT::64\n");
2475
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002476 MVT ccResultVT = TLI.getSetCCResultType(lhs.getValueType());
2477 APInt ccResultOnes = APInt::getAllOnesValue(ccResultVT.getSizeInBits());
2478 MVT IntVT(MVT::i64);
2479
2480 // Take advantage of the fact that (truncate (sra arg, 32)) is efficiently
2481 // selected to a NOP:
Dale Johannesenf5d97892009-02-04 01:48:28 +00002482 SDValue i64lhs = DAG.getNode(ISD::BIT_CONVERT, dl, IntVT, lhs);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002483 SDValue lhsHi32 =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002484 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32,
2485 DAG.getNode(ISD::SRL, dl, IntVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002486 i64lhs, DAG.getConstant(32, MVT::i32)));
2487 SDValue lhsHi32abs =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002488 DAG.getNode(ISD::AND, dl, MVT::i32,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002489 lhsHi32, DAG.getConstant(0x7fffffff, MVT::i32));
2490 SDValue lhsLo32 =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002491 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32, i64lhs);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002492
2493 // SETO and SETUO only use the lhs operand:
2494 if (CC->get() == ISD::SETO) {
2495 // Evaluates to true if Op0 is not [SQ]NaN - lowers to the inverse of
2496 // SETUO
2497 APInt ccResultAllOnes = APInt::getAllOnesValue(ccResultVT.getSizeInBits());
Dale Johannesenf5d97892009-02-04 01:48:28 +00002498 return DAG.getNode(ISD::XOR, dl, ccResultVT,
2499 DAG.getSetCC(dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002500 lhs, DAG.getConstantFP(0.0, lhsVT),
2501 ISD::SETUO),
2502 DAG.getConstant(ccResultAllOnes, ccResultVT));
2503 } else if (CC->get() == ISD::SETUO) {
2504 // Evaluates to true if Op0 is [SQ]NaN
Dale Johannesenf5d97892009-02-04 01:48:28 +00002505 return DAG.getNode(ISD::AND, dl, ccResultVT,
2506 DAG.getSetCC(dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002507 lhsHi32abs,
2508 DAG.getConstant(0x7ff00000, MVT::i32),
2509 ISD::SETGE),
Dale Johannesenf5d97892009-02-04 01:48:28 +00002510 DAG.getSetCC(dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002511 lhsLo32,
2512 DAG.getConstant(0, MVT::i32),
2513 ISD::SETGT));
2514 }
2515
2516 SDValue i64rhs = DAG.getNode(ISD::BIT_CONVERT, IntVT, rhs);
2517 SDValue rhsHi32 =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002518 DAG.getNode(ISD::TRUNCATE, dl, MVT::i32,
2519 DAG.getNode(ISD::SRL, dl, IntVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002520 i64rhs, DAG.getConstant(32, MVT::i32)));
2521
2522 // If a value is negative, subtract from the sign magnitude constant:
2523 SDValue signMag2TC = DAG.getConstant(0x8000000000000000ULL, IntVT);
2524
2525 // Convert the sign-magnitude representation into 2's complement:
Dale Johannesenf5d97892009-02-04 01:48:28 +00002526 SDValue lhsSelectMask = DAG.getNode(ISD::SRA, dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002527 lhsHi32, DAG.getConstant(31, MVT::i32));
Dale Johannesenf5d97892009-02-04 01:48:28 +00002528 SDValue lhsSignMag2TC = DAG.getNode(ISD::SUB, dl, IntVT, signMag2TC, i64lhs);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002529 SDValue lhsSelect =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002530 DAG.getNode(ISD::SELECT, dl, IntVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002531 lhsSelectMask, lhsSignMag2TC, i64lhs);
2532
Dale Johannesenf5d97892009-02-04 01:48:28 +00002533 SDValue rhsSelectMask = DAG.getNode(ISD::SRA, dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002534 rhsHi32, DAG.getConstant(31, MVT::i32));
Dale Johannesenf5d97892009-02-04 01:48:28 +00002535 SDValue rhsSignMag2TC = DAG.getNode(ISD::SUB, dl, IntVT, signMag2TC, i64rhs);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002536 SDValue rhsSelect =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002537 DAG.getNode(ISD::SELECT, dl, IntVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002538 rhsSelectMask, rhsSignMag2TC, i64rhs);
2539
2540 unsigned compareOp;
2541
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002542 switch (CC->get()) {
2543 case ISD::SETOEQ:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002544 case ISD::SETUEQ:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002545 compareOp = ISD::SETEQ; break;
2546 case ISD::SETOGT:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002547 case ISD::SETUGT:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002548 compareOp = ISD::SETGT; break;
2549 case ISD::SETOGE:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002550 case ISD::SETUGE:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002551 compareOp = ISD::SETGE; break;
2552 case ISD::SETOLT:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002553 case ISD::SETULT:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002554 compareOp = ISD::SETLT; break;
2555 case ISD::SETOLE:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002556 case ISD::SETULE:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002557 compareOp = ISD::SETLE; break;
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002558 case ISD::SETUNE:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002559 case ISD::SETONE:
2560 compareOp = ISD::SETNE; break;
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002561 default:
2562 cerr << "CellSPU ISel Select: unimplemented f64 condition\n";
2563 abort();
2564 break;
2565 }
2566
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002567 SDValue result =
Dale Johannesenf5d97892009-02-04 01:48:28 +00002568 DAG.getSetCC(dl, ccResultVT, lhsSelect, rhsSelect,
2569 (ISD::CondCode) compareOp);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002570
2571 if ((CC->get() & 0x8) == 0) {
2572 // Ordered comparison:
Dale Johannesenf5d97892009-02-04 01:48:28 +00002573 SDValue lhsNaN = DAG.getSetCC(dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002574 lhs, DAG.getConstantFP(0.0, MVT::f64),
2575 ISD::SETO);
Dale Johannesenf5d97892009-02-04 01:48:28 +00002576 SDValue rhsNaN = DAG.getSetCC(dl, ccResultVT,
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002577 rhs, DAG.getConstantFP(0.0, MVT::f64),
2578 ISD::SETO);
Dale Johannesenf5d97892009-02-04 01:48:28 +00002579 SDValue ordered = DAG.getNode(ISD::AND, dl, ccResultVT, lhsNaN, rhsNaN);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002580
Dale Johannesenf5d97892009-02-04 01:48:28 +00002581 result = DAG.getNode(ISD::AND, dl, ccResultVT, ordered, result);
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002582 }
2583
2584 return result;
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002585}
2586
Scott Michel7a1c9e92008-11-22 23:50:42 +00002587//! Lower ISD::SELECT_CC
2588/*!
2589 ISD::SELECT_CC can (generally) be implemented directly on the SPU using the
2590 SELB instruction.
2591
2592 \note Need to revisit this in the future: if the code path through the true
2593 and false value computations is longer than the latency of a branch (6
2594 cycles), then it would be more advantageous to branch and insert a new basic
2595 block and branch on the condition. However, this code does not make that
2596 assumption, given the simplisitc uses so far.
2597 */
2598
Scott Michelf0569be2008-12-27 04:51:36 +00002599static SDValue LowerSELECT_CC(SDValue Op, SelectionDAG &DAG,
2600 const TargetLowering &TLI) {
Scott Michel7a1c9e92008-11-22 23:50:42 +00002601 MVT VT = Op.getValueType();
2602 SDValue lhs = Op.getOperand(0);
2603 SDValue rhs = Op.getOperand(1);
2604 SDValue trueval = Op.getOperand(2);
2605 SDValue falseval = Op.getOperand(3);
2606 SDValue condition = Op.getOperand(4);
2607
Scott Michelf0569be2008-12-27 04:51:36 +00002608 // NOTE: SELB's arguments: $rA, $rB, $mask
2609 //
2610 // SELB selects bits from $rA where bits in $mask are 0, bits from $rB
2611 // where bits in $mask are 1. CCond will be inverted, having 1s where the
2612 // condition was true and 0s where the condition was false. Hence, the
2613 // arguments to SELB get reversed.
2614
Scott Michel7a1c9e92008-11-22 23:50:42 +00002615 // Note: Really should be ISD::SELECT instead of SPUISD::SELB, but LLVM's
2616 // legalizer insists on combining SETCC/SELECT into SELECT_CC, so we end up
2617 // with another "cannot select select_cc" assert:
2618
Duncan Sands5480c042009-01-01 15:52:00 +00002619 SDValue compare = DAG.getNode(ISD::SETCC,
2620 TLI.getSetCCResultType(Op.getValueType()),
Scott Michelf0569be2008-12-27 04:51:36 +00002621 lhs, rhs, condition);
2622 return DAG.getNode(SPUISD::SELB, VT, falseval, trueval, compare);
Scott Michel7a1c9e92008-11-22 23:50:42 +00002623}
2624
Scott Michelb30e8f62008-12-02 19:53:53 +00002625//! Custom lower ISD::TRUNCATE
2626static SDValue LowerTRUNCATE(SDValue Op, SelectionDAG &DAG)
2627{
2628 MVT VT = Op.getValueType();
2629 MVT::SimpleValueType simpleVT = VT.getSimpleVT();
2630 MVT VecVT = MVT::getVectorVT(VT, (128 / VT.getSizeInBits()));
2631
2632 SDValue Op0 = Op.getOperand(0);
2633 MVT Op0VT = Op0.getValueType();
2634 MVT Op0VecVT = MVT::getVectorVT(Op0VT, (128 / Op0VT.getSizeInBits()));
2635
Scott Michelf0569be2008-12-27 04:51:36 +00002636 if (Op0VT.getSimpleVT() == MVT::i128 && simpleVT == MVT::i64) {
Scott Michel52d00012009-01-03 00:27:53 +00002637 // Create shuffle mask, least significant doubleword of quadword
Scott Michelf0569be2008-12-27 04:51:36 +00002638 unsigned maskHigh = 0x08090a0b;
2639 unsigned maskLow = 0x0c0d0e0f;
2640 // Use a shuffle to perform the truncation
2641 SDValue shufMask = DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32,
2642 DAG.getConstant(maskHigh, MVT::i32),
2643 DAG.getConstant(maskLow, MVT::i32),
2644 DAG.getConstant(maskHigh, MVT::i32),
2645 DAG.getConstant(maskLow, MVT::i32));
2646
2647
2648 SDValue PromoteScalar = DAG.getNode(SPUISD::PREFSLOT2VEC, Op0VecVT, Op0);
2649
2650 SDValue truncShuffle = DAG.getNode(SPUISD::SHUFB, Op0VecVT,
2651 PromoteScalar, PromoteScalar, shufMask);
2652
2653 return DAG.getNode(SPUISD::VEC2PREFSLOT, VT,
2654 DAG.getNode(ISD::BIT_CONVERT, VecVT, truncShuffle));
Scott Michelb30e8f62008-12-02 19:53:53 +00002655 }
2656
Scott Michelf0569be2008-12-27 04:51:36 +00002657 return SDValue(); // Leave the truncate unmolested
Scott Michelb30e8f62008-12-02 19:53:53 +00002658}
2659
Scott Michel7a1c9e92008-11-22 23:50:42 +00002660//! Custom (target-specific) lowering entry point
2661/*!
2662 This is where LLVM's DAG selection process calls to do target-specific
2663 lowering of nodes.
2664 */
Dan Gohman475871a2008-07-27 21:46:04 +00002665SDValue
2666SPUTargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG)
Scott Michel266bc8f2007-12-04 22:23:35 +00002667{
Scott Michela59d4692008-02-23 18:41:37 +00002668 unsigned Opc = (unsigned) Op.getOpcode();
Duncan Sands83ec4b62008-06-06 12:08:01 +00002669 MVT VT = Op.getValueType();
Scott Michela59d4692008-02-23 18:41:37 +00002670
2671 switch (Opc) {
Scott Michel266bc8f2007-12-04 22:23:35 +00002672 default: {
2673 cerr << "SPUTargetLowering::LowerOperation(): need to lower this!\n";
Scott Michela59d4692008-02-23 18:41:37 +00002674 cerr << "Op.getOpcode() = " << Opc << "\n";
Gabor Greifba36cb52008-08-28 21:40:38 +00002675 cerr << "*Op.getNode():\n";
2676 Op.getNode()->dump();
Scott Michel266bc8f2007-12-04 22:23:35 +00002677 abort();
2678 }
2679 case ISD::LOAD:
Scott Michelb30e8f62008-12-02 19:53:53 +00002680 case ISD::EXTLOAD:
Scott Michel266bc8f2007-12-04 22:23:35 +00002681 case ISD::SEXTLOAD:
2682 case ISD::ZEXTLOAD:
2683 return LowerLOAD(Op, DAG, SPUTM.getSubtargetImpl());
2684 case ISD::STORE:
2685 return LowerSTORE(Op, DAG, SPUTM.getSubtargetImpl());
2686 case ISD::ConstantPool:
2687 return LowerConstantPool(Op, DAG, SPUTM.getSubtargetImpl());
2688 case ISD::GlobalAddress:
2689 return LowerGlobalAddress(Op, DAG, SPUTM.getSubtargetImpl());
2690 case ISD::JumpTable:
2691 return LowerJumpTable(Op, DAG, SPUTM.getSubtargetImpl());
Scott Michel266bc8f2007-12-04 22:23:35 +00002692 case ISD::ConstantFP:
2693 return LowerConstantFP(Op, DAG);
2694 case ISD::FORMAL_ARGUMENTS:
Scott Michel58c58182008-01-17 20:38:41 +00002695 return LowerFORMAL_ARGUMENTS(Op, DAG, VarArgsFrameIndex);
Scott Michel266bc8f2007-12-04 22:23:35 +00002696 case ISD::CALL:
Scott Michel9de5d0d2008-01-11 02:53:15 +00002697 return LowerCALL(Op, DAG, SPUTM.getSubtargetImpl());
Scott Michel266bc8f2007-12-04 22:23:35 +00002698 case ISD::RET:
2699 return LowerRET(Op, DAG, getTargetMachine());
2700
Scott Michel02d711b2008-12-30 23:28:25 +00002701 // i8, i64 math ops:
Scott Michel8bf61e82008-06-02 22:18:03 +00002702 case ISD::ADD:
Scott Michel266bc8f2007-12-04 22:23:35 +00002703 case ISD::SUB:
2704 case ISD::ROTR:
2705 case ISD::ROTL:
2706 case ISD::SRL:
2707 case ISD::SHL:
Scott Michel8bf61e82008-06-02 22:18:03 +00002708 case ISD::SRA: {
Scott Michela59d4692008-02-23 18:41:37 +00002709 if (VT == MVT::i8)
Scott Michelf0569be2008-12-27 04:51:36 +00002710 return LowerI8Math(Op, DAG, Opc, *this);
Scott Michela59d4692008-02-23 18:41:37 +00002711 break;
Scott Michel8bf61e82008-06-02 22:18:03 +00002712 }
Scott Michel266bc8f2007-12-04 22:23:35 +00002713
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002714 case ISD::FP_TO_SINT:
2715 case ISD::FP_TO_UINT:
2716 return LowerFP_TO_INT(Op, DAG, *this);
2717
2718 case ISD::SINT_TO_FP:
2719 case ISD::UINT_TO_FP:
2720 return LowerINT_TO_FP(Op, DAG, *this);
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002721
Scott Michel266bc8f2007-12-04 22:23:35 +00002722 // Vector-related lowering.
2723 case ISD::BUILD_VECTOR:
Scott Michelc9c8b2a2009-01-26 03:31:40 +00002724 return LowerBUILD_VECTOR(Op, DAG);
Scott Michel266bc8f2007-12-04 22:23:35 +00002725 case ISD::SCALAR_TO_VECTOR:
2726 return LowerSCALAR_TO_VECTOR(Op, DAG);
2727 case ISD::VECTOR_SHUFFLE:
2728 return LowerVECTOR_SHUFFLE(Op, DAG);
2729 case ISD::EXTRACT_VECTOR_ELT:
2730 return LowerEXTRACT_VECTOR_ELT(Op, DAG);
2731 case ISD::INSERT_VECTOR_ELT:
2732 return LowerINSERT_VECTOR_ELT(Op, DAG);
2733
2734 // Look for ANDBI, ORBI and XORBI opportunities and lower appropriately:
2735 case ISD::AND:
2736 case ISD::OR:
2737 case ISD::XOR:
2738 return LowerByteImmed(Op, DAG);
2739
2740 // Vector and i8 multiply:
2741 case ISD::MUL:
Scott Michel02d711b2008-12-30 23:28:25 +00002742 if (VT == MVT::i8)
Scott Michelf0569be2008-12-27 04:51:36 +00002743 return LowerI8Math(Op, DAG, Opc, *this);
Scott Michel266bc8f2007-12-04 22:23:35 +00002744
Scott Michel266bc8f2007-12-04 22:23:35 +00002745 case ISD::CTPOP:
2746 return LowerCTPOP(Op, DAG);
Scott Michel7a1c9e92008-11-22 23:50:42 +00002747
2748 case ISD::SELECT_CC:
Scott Michelf0569be2008-12-27 04:51:36 +00002749 return LowerSELECT_CC(Op, DAG, *this);
Scott Michelb30e8f62008-12-02 19:53:53 +00002750
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002751 case ISD::SETCC:
2752 return LowerSETCC(Op, DAG, *this);
2753
Scott Michelb30e8f62008-12-02 19:53:53 +00002754 case ISD::TRUNCATE:
2755 return LowerTRUNCATE(Op, DAG);
Scott Michel266bc8f2007-12-04 22:23:35 +00002756 }
2757
Dan Gohman475871a2008-07-27 21:46:04 +00002758 return SDValue();
Scott Michel266bc8f2007-12-04 22:23:35 +00002759}
2760
Duncan Sands1607f052008-12-01 11:39:25 +00002761void SPUTargetLowering::ReplaceNodeResults(SDNode *N,
2762 SmallVectorImpl<SDValue>&Results,
2763 SelectionDAG &DAG)
Scott Michel73ce1c52008-11-10 23:43:06 +00002764{
2765#if 0
2766 unsigned Opc = (unsigned) N->getOpcode();
2767 MVT OpVT = N->getValueType(0);
2768
2769 switch (Opc) {
2770 default: {
2771 cerr << "SPUTargetLowering::ReplaceNodeResults(): need to fix this!\n";
2772 cerr << "Op.getOpcode() = " << Opc << "\n";
2773 cerr << "*Op.getNode():\n";
2774 N->dump();
2775 abort();
2776 /*NOTREACHED*/
2777 }
2778 }
2779#endif
2780
2781 /* Otherwise, return unchanged */
Scott Michel73ce1c52008-11-10 23:43:06 +00002782}
2783
Scott Michel266bc8f2007-12-04 22:23:35 +00002784//===----------------------------------------------------------------------===//
Scott Michel266bc8f2007-12-04 22:23:35 +00002785// Target Optimization Hooks
2786//===----------------------------------------------------------------------===//
2787
Dan Gohman475871a2008-07-27 21:46:04 +00002788SDValue
Scott Michel266bc8f2007-12-04 22:23:35 +00002789SPUTargetLowering::PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const
2790{
2791#if 0
2792 TargetMachine &TM = getTargetMachine();
Scott Michel053c1da2008-01-29 02:16:57 +00002793#endif
2794 const SPUSubtarget *ST = SPUTM.getSubtargetImpl();
Scott Michel266bc8f2007-12-04 22:23:35 +00002795 SelectionDAG &DAG = DCI.DAG;
Scott Michel1a6cdb62008-12-01 17:56:02 +00002796 SDValue Op0 = N->getOperand(0); // everything has at least one operand
2797 MVT NodeVT = N->getValueType(0); // The node's value type
Scott Michelf0569be2008-12-27 04:51:36 +00002798 MVT Op0VT = Op0.getValueType(); // The first operand's result
Scott Michel1a6cdb62008-12-01 17:56:02 +00002799 SDValue Result; // Initially, empty result
Scott Michel266bc8f2007-12-04 22:23:35 +00002800
2801 switch (N->getOpcode()) {
2802 default: break;
Scott Michel053c1da2008-01-29 02:16:57 +00002803 case ISD::ADD: {
Dan Gohman475871a2008-07-27 21:46:04 +00002804 SDValue Op1 = N->getOperand(1);
Scott Michel053c1da2008-01-29 02:16:57 +00002805
Scott Michelf0569be2008-12-27 04:51:36 +00002806 if (Op0.getOpcode() == SPUISD::IndirectAddr
2807 || Op1.getOpcode() == SPUISD::IndirectAddr) {
2808 // Normalize the operands to reduce repeated code
2809 SDValue IndirectArg = Op0, AddArg = Op1;
Scott Michel1df30c42008-12-29 03:23:36 +00002810
Scott Michelf0569be2008-12-27 04:51:36 +00002811 if (Op1.getOpcode() == SPUISD::IndirectAddr) {
2812 IndirectArg = Op1;
2813 AddArg = Op0;
2814 }
2815
2816 if (isa<ConstantSDNode>(AddArg)) {
2817 ConstantSDNode *CN0 = cast<ConstantSDNode > (AddArg);
2818 SDValue IndOp1 = IndirectArg.getOperand(1);
2819
2820 if (CN0->isNullValue()) {
2821 // (add (SPUindirect <arg>, <arg>), 0) ->
2822 // (SPUindirect <arg>, <arg>)
Scott Michel053c1da2008-01-29 02:16:57 +00002823
Scott Michel23f2ff72008-12-04 17:16:59 +00002824#if !defined(NDEBUG)
Scott Michelf0569be2008-12-27 04:51:36 +00002825 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
Scott Michel30ee7df2008-12-04 03:02:42 +00002826 cerr << "\n"
Scott Michelf0569be2008-12-27 04:51:36 +00002827 << "Replace: (add (SPUindirect <arg>, <arg>), 0)\n"
2828 << "With: (SPUindirect <arg>, <arg>)\n";
2829 }
Scott Michel30ee7df2008-12-04 03:02:42 +00002830#endif
2831
Scott Michelf0569be2008-12-27 04:51:36 +00002832 return IndirectArg;
2833 } else if (isa<ConstantSDNode>(IndOp1)) {
2834 // (add (SPUindirect <arg>, <const>), <const>) ->
2835 // (SPUindirect <arg>, <const + const>)
2836 ConstantSDNode *CN1 = cast<ConstantSDNode > (IndOp1);
2837 int64_t combinedConst = CN0->getSExtValue() + CN1->getSExtValue();
2838 SDValue combinedValue = DAG.getConstant(combinedConst, Op0VT);
Scott Michel053c1da2008-01-29 02:16:57 +00002839
Scott Michelf0569be2008-12-27 04:51:36 +00002840#if !defined(NDEBUG)
2841 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
2842 cerr << "\n"
2843 << "Replace: (add (SPUindirect <arg>, " << CN1->getSExtValue()
2844 << "), " << CN0->getSExtValue() << ")\n"
2845 << "With: (SPUindirect <arg>, "
2846 << combinedConst << ")\n";
2847 }
2848#endif
Scott Michel053c1da2008-01-29 02:16:57 +00002849
Scott Michelf0569be2008-12-27 04:51:36 +00002850 return DAG.getNode(SPUISD::IndirectAddr, Op0VT,
2851 IndirectArg, combinedValue);
2852 }
Scott Michel053c1da2008-01-29 02:16:57 +00002853 }
2854 }
Scott Michela59d4692008-02-23 18:41:37 +00002855 break;
2856 }
2857 case ISD::SIGN_EXTEND:
2858 case ISD::ZERO_EXTEND:
2859 case ISD::ANY_EXTEND: {
Scott Michel1a6cdb62008-12-01 17:56:02 +00002860 if (Op0.getOpcode() == SPUISD::VEC2PREFSLOT && NodeVT == Op0VT) {
Scott Michela59d4692008-02-23 18:41:37 +00002861 // (any_extend (SPUextract_elt0 <arg>)) ->
2862 // (SPUextract_elt0 <arg>)
2863 // Types must match, however...
Scott Michel23f2ff72008-12-04 17:16:59 +00002864#if !defined(NDEBUG)
2865 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
Scott Michel30ee7df2008-12-04 03:02:42 +00002866 cerr << "\nReplace: ";
2867 N->dump(&DAG);
2868 cerr << "\nWith: ";
2869 Op0.getNode()->dump(&DAG);
2870 cerr << "\n";
Scott Michel23f2ff72008-12-04 17:16:59 +00002871 }
Scott Michel30ee7df2008-12-04 03:02:42 +00002872#endif
Scott Michela59d4692008-02-23 18:41:37 +00002873
2874 return Op0;
2875 }
2876 break;
2877 }
2878 case SPUISD::IndirectAddr: {
2879 if (!ST->usingLargeMem() && Op0.getOpcode() == SPUISD::AFormAddr) {
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002880 ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N->getOperand(1));
2881 if (CN != 0 && CN->getZExtValue() == 0) {
Scott Michela59d4692008-02-23 18:41:37 +00002882 // (SPUindirect (SPUaform <addr>, 0), 0) ->
2883 // (SPUaform <addr>, 0)
2884
2885 DEBUG(cerr << "Replace: ");
2886 DEBUG(N->dump(&DAG));
2887 DEBUG(cerr << "\nWith: ");
Gabor Greifba36cb52008-08-28 21:40:38 +00002888 DEBUG(Op0.getNode()->dump(&DAG));
Scott Michela59d4692008-02-23 18:41:37 +00002889 DEBUG(cerr << "\n");
2890
2891 return Op0;
2892 }
Scott Michelf0569be2008-12-27 04:51:36 +00002893 } else if (Op0.getOpcode() == ISD::ADD) {
2894 SDValue Op1 = N->getOperand(1);
2895 if (ConstantSDNode *CN1 = dyn_cast<ConstantSDNode>(Op1)) {
2896 // (SPUindirect (add <arg>, <arg>), 0) ->
2897 // (SPUindirect <arg>, <arg>)
2898 if (CN1->isNullValue()) {
2899
2900#if !defined(NDEBUG)
2901 if (DebugFlag && isCurrentDebugType(DEBUG_TYPE)) {
2902 cerr << "\n"
2903 << "Replace: (SPUindirect (add <arg>, <arg>), 0)\n"
2904 << "With: (SPUindirect <arg>, <arg>)\n";
2905 }
2906#endif
2907
2908 return DAG.getNode(SPUISD::IndirectAddr, Op0VT,
2909 Op0.getOperand(0), Op0.getOperand(1));
2910 }
2911 }
Scott Michela59d4692008-02-23 18:41:37 +00002912 }
2913 break;
2914 }
2915 case SPUISD::SHLQUAD_L_BITS:
2916 case SPUISD::SHLQUAD_L_BYTES:
2917 case SPUISD::VEC_SHL:
2918 case SPUISD::VEC_SRL:
2919 case SPUISD::VEC_SRA:
Scott Michelf0569be2008-12-27 04:51:36 +00002920 case SPUISD::ROTBYTES_LEFT: {
Dan Gohman475871a2008-07-27 21:46:04 +00002921 SDValue Op1 = N->getOperand(1);
Scott Michela59d4692008-02-23 18:41:37 +00002922
Scott Michelf0569be2008-12-27 04:51:36 +00002923 // Kill degenerate vector shifts:
2924 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(Op1)) {
2925 if (CN->isNullValue()) {
Scott Michela59d4692008-02-23 18:41:37 +00002926 Result = Op0;
2927 }
2928 }
2929 break;
2930 }
Scott Michelf0569be2008-12-27 04:51:36 +00002931 case SPUISD::PREFSLOT2VEC: {
Scott Michela59d4692008-02-23 18:41:37 +00002932 switch (Op0.getOpcode()) {
2933 default:
2934 break;
2935 case ISD::ANY_EXTEND:
2936 case ISD::ZERO_EXTEND:
2937 case ISD::SIGN_EXTEND: {
Scott Michel1df30c42008-12-29 03:23:36 +00002938 // (SPUprefslot2vec (any|zero|sign_extend (SPUvec2prefslot <arg>))) ->
Scott Michela59d4692008-02-23 18:41:37 +00002939 // <arg>
Scott Michel1df30c42008-12-29 03:23:36 +00002940 // but only if the SPUprefslot2vec and <arg> types match.
Dan Gohman475871a2008-07-27 21:46:04 +00002941 SDValue Op00 = Op0.getOperand(0);
Scott Michel104de432008-11-24 17:11:17 +00002942 if (Op00.getOpcode() == SPUISD::VEC2PREFSLOT) {
Dan Gohman475871a2008-07-27 21:46:04 +00002943 SDValue Op000 = Op00.getOperand(0);
Scott Michel1a6cdb62008-12-01 17:56:02 +00002944 if (Op000.getValueType() == NodeVT) {
Scott Michela59d4692008-02-23 18:41:37 +00002945 Result = Op000;
2946 }
2947 }
2948 break;
2949 }
Scott Michel104de432008-11-24 17:11:17 +00002950 case SPUISD::VEC2PREFSLOT: {
Scott Michel1df30c42008-12-29 03:23:36 +00002951 // (SPUprefslot2vec (SPUvec2prefslot <arg>)) ->
Scott Michela59d4692008-02-23 18:41:37 +00002952 // <arg>
2953 Result = Op0.getOperand(0);
2954 break;
Scott Michel5af8f0e2008-07-16 17:17:29 +00002955 }
Scott Michela59d4692008-02-23 18:41:37 +00002956 }
2957 break;
Scott Michel053c1da2008-01-29 02:16:57 +00002958 }
2959 }
Scott Micheld1e8d9c2009-01-21 04:58:48 +00002960
Scott Michel58c58182008-01-17 20:38:41 +00002961 // Otherwise, return unchanged.
Scott Michel1a6cdb62008-12-01 17:56:02 +00002962#ifndef NDEBUG
Gabor Greifba36cb52008-08-28 21:40:38 +00002963 if (Result.getNode()) {
Scott Michela59d4692008-02-23 18:41:37 +00002964 DEBUG(cerr << "\nReplace.SPU: ");
2965 DEBUG(N->dump(&DAG));
2966 DEBUG(cerr << "\nWith: ");
Gabor Greifba36cb52008-08-28 21:40:38 +00002967 DEBUG(Result.getNode()->dump(&DAG));
Scott Michela59d4692008-02-23 18:41:37 +00002968 DEBUG(cerr << "\n");
2969 }
2970#endif
2971
2972 return Result;
Scott Michel266bc8f2007-12-04 22:23:35 +00002973}
2974
2975//===----------------------------------------------------------------------===//
2976// Inline Assembly Support
2977//===----------------------------------------------------------------------===//
2978
2979/// getConstraintType - Given a constraint letter, return the type of
2980/// constraint it is for this target.
Scott Michel5af8f0e2008-07-16 17:17:29 +00002981SPUTargetLowering::ConstraintType
Scott Michel266bc8f2007-12-04 22:23:35 +00002982SPUTargetLowering::getConstraintType(const std::string &ConstraintLetter) const {
2983 if (ConstraintLetter.size() == 1) {
2984 switch (ConstraintLetter[0]) {
2985 default: break;
2986 case 'b':
2987 case 'r':
2988 case 'f':
2989 case 'v':
2990 case 'y':
2991 return C_RegisterClass;
Scott Michel5af8f0e2008-07-16 17:17:29 +00002992 }
Scott Michel266bc8f2007-12-04 22:23:35 +00002993 }
2994 return TargetLowering::getConstraintType(ConstraintLetter);
2995}
2996
Scott Michel5af8f0e2008-07-16 17:17:29 +00002997std::pair<unsigned, const TargetRegisterClass*>
Scott Michel266bc8f2007-12-04 22:23:35 +00002998SPUTargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
Duncan Sands83ec4b62008-06-06 12:08:01 +00002999 MVT VT) const
Scott Michel266bc8f2007-12-04 22:23:35 +00003000{
3001 if (Constraint.size() == 1) {
3002 // GCC RS6000 Constraint Letters
3003 switch (Constraint[0]) {
3004 case 'b': // R1-R31
3005 case 'r': // R0-R31
3006 if (VT == MVT::i64)
3007 return std::make_pair(0U, SPU::R64CRegisterClass);
3008 return std::make_pair(0U, SPU::R32CRegisterClass);
3009 case 'f':
3010 if (VT == MVT::f32)
3011 return std::make_pair(0U, SPU::R32FPRegisterClass);
3012 else if (VT == MVT::f64)
3013 return std::make_pair(0U, SPU::R64FPRegisterClass);
3014 break;
Scott Michel5af8f0e2008-07-16 17:17:29 +00003015 case 'v':
Scott Michel266bc8f2007-12-04 22:23:35 +00003016 return std::make_pair(0U, SPU::GPRCRegisterClass);
3017 }
3018 }
Scott Michel5af8f0e2008-07-16 17:17:29 +00003019
Scott Michel266bc8f2007-12-04 22:23:35 +00003020 return TargetLowering::getRegForInlineAsmConstraint(Constraint, VT);
3021}
3022
Scott Michela59d4692008-02-23 18:41:37 +00003023//! Compute used/known bits for a SPU operand
Scott Michel266bc8f2007-12-04 22:23:35 +00003024void
Dan Gohman475871a2008-07-27 21:46:04 +00003025SPUTargetLowering::computeMaskedBitsForTargetNode(const SDValue Op,
Dan Gohman977a76f2008-02-13 22:28:48 +00003026 const APInt &Mask,
Scott Michel5af8f0e2008-07-16 17:17:29 +00003027 APInt &KnownZero,
Dan Gohmanfd29e0e2008-02-13 00:35:47 +00003028 APInt &KnownOne,
Scott Michel7f9ba9b2008-01-30 02:55:46 +00003029 const SelectionDAG &DAG,
3030 unsigned Depth ) const {
Scott Michel203b2d62008-04-30 00:30:08 +00003031#if 0
Scott Michela59d4692008-02-23 18:41:37 +00003032 const uint64_t uint64_sizebits = sizeof(uint64_t) * 8;
3033
3034 switch (Op.getOpcode()) {
3035 default:
3036 // KnownZero = KnownOne = APInt(Mask.getBitWidth(), 0);
3037 break;
Scott Michela59d4692008-02-23 18:41:37 +00003038 case CALL:
3039 case SHUFB:
Scott Michel7a1c9e92008-11-22 23:50:42 +00003040 case SHUFFLE_MASK:
Scott Michela59d4692008-02-23 18:41:37 +00003041 case CNTB:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00003042 case SPUISD::PREFSLOT2VEC:
Scott Michela59d4692008-02-23 18:41:37 +00003043 case SPUISD::LDRESULT:
Scott Micheld1e8d9c2009-01-21 04:58:48 +00003044 case SPUISD::VEC2PREFSLOT:
Scott Michel203b2d62008-04-30 00:30:08 +00003045 case SPUISD::SHLQUAD_L_BITS:
3046 case SPUISD::SHLQUAD_L_BYTES:
3047 case SPUISD::VEC_SHL:
3048 case SPUISD::VEC_SRL:
3049 case SPUISD::VEC_SRA:
3050 case SPUISD::VEC_ROTL:
3051 case SPUISD::VEC_ROTR:
Scott Michel203b2d62008-04-30 00:30:08 +00003052 case SPUISD::ROTBYTES_LEFT:
Scott Michel8bf61e82008-06-02 22:18:03 +00003053 case SPUISD::SELECT_MASK:
3054 case SPUISD::SELB:
Scott Michela59d4692008-02-23 18:41:37 +00003055 }
Scott Micheld1e8d9c2009-01-21 04:58:48 +00003056#endif
Scott Michel266bc8f2007-12-04 22:23:35 +00003057}
Scott Michel02d711b2008-12-30 23:28:25 +00003058
Scott Michelf0569be2008-12-27 04:51:36 +00003059unsigned
3060SPUTargetLowering::ComputeNumSignBitsForTargetNode(SDValue Op,
3061 unsigned Depth) const {
3062 switch (Op.getOpcode()) {
3063 default:
3064 return 1;
Scott Michel266bc8f2007-12-04 22:23:35 +00003065
Scott Michelf0569be2008-12-27 04:51:36 +00003066 case ISD::SETCC: {
3067 MVT VT = Op.getValueType();
3068
3069 if (VT != MVT::i8 && VT != MVT::i16 && VT != MVT::i32) {
3070 VT = MVT::i32;
3071 }
3072 return VT.getSizeInBits();
3073 }
3074 }
3075}
Scott Michel1df30c42008-12-29 03:23:36 +00003076
Scott Michel203b2d62008-04-30 00:30:08 +00003077// LowerAsmOperandForConstraint
3078void
Dan Gohman475871a2008-07-27 21:46:04 +00003079SPUTargetLowering::LowerAsmOperandForConstraint(SDValue Op,
Scott Michel203b2d62008-04-30 00:30:08 +00003080 char ConstraintLetter,
Evan Chengda43bcf2008-09-24 00:05:32 +00003081 bool hasMemory,
Dan Gohman475871a2008-07-27 21:46:04 +00003082 std::vector<SDValue> &Ops,
Scott Michel203b2d62008-04-30 00:30:08 +00003083 SelectionDAG &DAG) const {
3084 // Default, for the time being, to the base class handler
Evan Chengda43bcf2008-09-24 00:05:32 +00003085 TargetLowering::LowerAsmOperandForConstraint(Op, ConstraintLetter, hasMemory,
3086 Ops, DAG);
Scott Michel203b2d62008-04-30 00:30:08 +00003087}
3088
Scott Michel266bc8f2007-12-04 22:23:35 +00003089/// isLegalAddressImmediate - Return true if the integer value can be used
3090/// as the offset of the target addressing mode.
Gabor Greif93c53e52008-08-31 15:37:04 +00003091bool SPUTargetLowering::isLegalAddressImmediate(int64_t V,
3092 const Type *Ty) const {
Scott Michel266bc8f2007-12-04 22:23:35 +00003093 // SPU's addresses are 256K:
3094 return (V > -(1 << 18) && V < (1 << 18) - 1);
3095}
3096
3097bool SPUTargetLowering::isLegalAddressImmediate(llvm::GlobalValue* GV) const {
Scott Michel5af8f0e2008-07-16 17:17:29 +00003098 return false;
Scott Michel266bc8f2007-12-04 22:23:35 +00003099}
Dan Gohman6520e202008-10-18 02:06:02 +00003100
3101bool
3102SPUTargetLowering::isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const {
3103 // The SPU target isn't yet aware of offsets.
3104 return false;
3105}