blob: eeed0dfe742ae017c50183f826fe91f7448098f4 [file] [log] [blame]
Nate Begeman1d9d7422005-10-18 00:28:58 +00001//===-- PPCISelLowering.cpp - PPC DAG Lowering Implementation -------------===//
Chris Lattner7c5a3d32005-08-16 17:14:42 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file was developed by Chris Lattner and is distributed under
6// the University of Illinois Open Source License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Nate Begeman21e463b2005-10-16 05:39:50 +000010// This file implements the PPCISelLowering class.
Chris Lattner7c5a3d32005-08-16 17:14:42 +000011//
12//===----------------------------------------------------------------------===//
13
Chris Lattner16e71f22005-10-14 23:59:06 +000014#include "PPCISelLowering.h"
15#include "PPCTargetMachine.h"
Nate Begeman750ac1b2006-02-01 07:19:44 +000016#include "llvm/ADT/VectorExtras.h"
Evan Chengc4c62572006-03-13 23:20:37 +000017#include "llvm/Analysis/ScalarEvolutionExpressions.h"
Chris Lattner7c5a3d32005-08-16 17:14:42 +000018#include "llvm/CodeGen/MachineFrameInfo.h"
19#include "llvm/CodeGen/MachineFunction.h"
Chris Lattner8a2d3ca2005-08-26 21:23:58 +000020#include "llvm/CodeGen/MachineInstrBuilder.h"
Chris Lattner7c5a3d32005-08-16 17:14:42 +000021#include "llvm/CodeGen/SelectionDAG.h"
Chris Lattner7b738342005-09-13 19:33:40 +000022#include "llvm/CodeGen/SSARegMap.h"
Chris Lattner0b1e4e52005-08-26 17:36:52 +000023#include "llvm/Constants.h"
Chris Lattner7c5a3d32005-08-16 17:14:42 +000024#include "llvm/Function.h"
Nate Begeman750ac1b2006-02-01 07:19:44 +000025#include "llvm/Support/MathExtras.h"
Evan Chengd2ee2182006-02-18 00:08:58 +000026#include "llvm/Target/TargetOptions.h"
Chris Lattner7c5a3d32005-08-16 17:14:42 +000027using namespace llvm;
28
Nate Begeman21e463b2005-10-16 05:39:50 +000029PPCTargetLowering::PPCTargetLowering(TargetMachine &TM)
Chris Lattner7c5a3d32005-08-16 17:14:42 +000030 : TargetLowering(TM) {
31
32 // Fold away setcc operations if possible.
33 setSetCCIsExpensive();
Nate Begeman405e3ec2005-10-21 00:02:42 +000034 setPow2DivIsCheap();
Chris Lattner7c5a3d32005-08-16 17:14:42 +000035
Chris Lattnerd145a612005-09-27 22:18:25 +000036 // Use _setjmp/_longjmp instead of setjmp/longjmp.
37 setUseUnderscoreSetJmpLongJmp(true);
38
Chris Lattner7c5a3d32005-08-16 17:14:42 +000039 // Set up the register classes.
Nate Begeman1d9d7422005-10-18 00:28:58 +000040 addRegisterClass(MVT::i32, PPC::GPRCRegisterClass);
41 addRegisterClass(MVT::f32, PPC::F4RCRegisterClass);
42 addRegisterClass(MVT::f64, PPC::F8RCRegisterClass);
Chris Lattner7c5a3d32005-08-16 17:14:42 +000043
Chris Lattnera54aa942006-01-29 06:26:08 +000044 setOperationAction(ISD::ConstantFP, MVT::f64, Expand);
45 setOperationAction(ISD::ConstantFP, MVT::f32, Expand);
46
Chris Lattner7c5a3d32005-08-16 17:14:42 +000047 // PowerPC has no intrinsics for these particular operations
48 setOperationAction(ISD::MEMMOVE, MVT::Other, Expand);
49 setOperationAction(ISD::MEMSET, MVT::Other, Expand);
50 setOperationAction(ISD::MEMCPY, MVT::Other, Expand);
51
52 // PowerPC has an i16 but no i8 (or i1) SEXTLOAD
53 setOperationAction(ISD::SEXTLOAD, MVT::i1, Expand);
54 setOperationAction(ISD::SEXTLOAD, MVT::i8, Expand);
55
56 // PowerPC has no SREM/UREM instructions
57 setOperationAction(ISD::SREM, MVT::i32, Expand);
58 setOperationAction(ISD::UREM, MVT::i32, Expand);
59
60 // We don't support sin/cos/sqrt/fmod
61 setOperationAction(ISD::FSIN , MVT::f64, Expand);
62 setOperationAction(ISD::FCOS , MVT::f64, Expand);
Chris Lattner615c2d02005-09-28 22:29:58 +000063 setOperationAction(ISD::FREM , MVT::f64, Expand);
Chris Lattner7c5a3d32005-08-16 17:14:42 +000064 setOperationAction(ISD::FSIN , MVT::f32, Expand);
65 setOperationAction(ISD::FCOS , MVT::f32, Expand);
Chris Lattner615c2d02005-09-28 22:29:58 +000066 setOperationAction(ISD::FREM , MVT::f32, Expand);
Chris Lattner7c5a3d32005-08-16 17:14:42 +000067
68 // If we're enabling GP optimizations, use hardware square root
Chris Lattner1e9de3e2005-09-02 18:33:05 +000069 if (!TM.getSubtarget<PPCSubtarget>().hasFSQRT()) {
Chris Lattner7c5a3d32005-08-16 17:14:42 +000070 setOperationAction(ISD::FSQRT, MVT::f64, Expand);
71 setOperationAction(ISD::FSQRT, MVT::f32, Expand);
72 }
73
Chris Lattner9601a862006-03-05 05:08:37 +000074 setOperationAction(ISD::FCOPYSIGN, MVT::f64, Expand);
75 setOperationAction(ISD::FCOPYSIGN, MVT::f32, Expand);
76
Nate Begemand88fc032006-01-14 03:14:10 +000077 // PowerPC does not have BSWAP, CTPOP or CTTZ
78 setOperationAction(ISD::BSWAP, MVT::i32 , Expand);
Chris Lattner7c5a3d32005-08-16 17:14:42 +000079 setOperationAction(ISD::CTPOP, MVT::i32 , Expand);
80 setOperationAction(ISD::CTTZ , MVT::i32 , Expand);
81
Nate Begeman35ef9132006-01-11 21:21:00 +000082 // PowerPC does not have ROTR
83 setOperationAction(ISD::ROTR, MVT::i32 , Expand);
84
Chris Lattner7c5a3d32005-08-16 17:14:42 +000085 // PowerPC does not have Select
86 setOperationAction(ISD::SELECT, MVT::i32, Expand);
87 setOperationAction(ISD::SELECT, MVT::f32, Expand);
88 setOperationAction(ISD::SELECT, MVT::f64, Expand);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +000089
Chris Lattner0b1e4e52005-08-26 17:36:52 +000090 // PowerPC wants to turn select_cc of FP into fsel when possible.
91 setOperationAction(ISD::SELECT_CC, MVT::f32, Custom);
92 setOperationAction(ISD::SELECT_CC, MVT::f64, Custom);
Nate Begeman44775902006-01-31 08:17:29 +000093
Nate Begeman750ac1b2006-02-01 07:19:44 +000094 // PowerPC wants to optimize integer setcc a bit
Nate Begeman44775902006-01-31 08:17:29 +000095 setOperationAction(ISD::SETCC, MVT::i32, Custom);
Chris Lattnereb9b62e2005-08-31 19:09:57 +000096
Nate Begeman81e80972006-03-17 01:40:33 +000097 // PowerPC does not have BRCOND which requires SetCC
98 setOperationAction(ISD::BRCOND, MVT::Other, Expand);
Chris Lattner7c5a3d32005-08-16 17:14:42 +000099
Chris Lattnerf7605322005-08-31 21:09:52 +0000100 // PowerPC turns FP_TO_SINT into FCTIWZ and some load/stores.
101 setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom);
Nate Begemanc09eeec2005-09-06 22:03:27 +0000102
Jim Laskeyad23c9d2005-08-17 00:40:22 +0000103 // PowerPC does not have [U|S]INT_TO_FP
104 setOperationAction(ISD::SINT_TO_FP, MVT::i32, Expand);
105 setOperationAction(ISD::UINT_TO_FP, MVT::i32, Expand);
106
Chris Lattner53e88452005-12-23 05:13:35 +0000107 setOperationAction(ISD::BIT_CONVERT, MVT::f32, Expand);
108 setOperationAction(ISD::BIT_CONVERT, MVT::i32, Expand);
109
Chris Lattnere6ec9f22005-09-10 00:21:06 +0000110 // PowerPC does not have truncstore for i1.
111 setOperationAction(ISD::TRUNCSTORE, MVT::i1, Promote);
Chris Lattnerf73bae12005-11-29 06:16:21 +0000112
Jim Laskeyabf6d172006-01-05 01:25:28 +0000113 // Support label based line numbers.
Chris Lattnerf73bae12005-11-29 06:16:21 +0000114 setOperationAction(ISD::LOCATION, MVT::Other, Expand);
Jim Laskeye0bce712006-01-05 01:47:43 +0000115 setOperationAction(ISD::DEBUG_LOC, MVT::Other, Expand);
Jim Laskeyabf6d172006-01-05 01:25:28 +0000116 // FIXME - use subtarget debug flags
Jim Laskeye0bce712006-01-05 01:47:43 +0000117 if (!TM.getSubtarget<PPCSubtarget>().isDarwin())
Jim Laskeyabf6d172006-01-05 01:25:28 +0000118 setOperationAction(ISD::DEBUG_LABEL, MVT::Other, Expand);
Chris Lattnere6ec9f22005-09-10 00:21:06 +0000119
Nate Begeman28a6b022005-12-10 02:36:00 +0000120 // We want to legalize GlobalAddress and ConstantPool nodes into the
121 // appropriate instructions to materialize the address.
Chris Lattner3eef4e32005-11-17 18:26:56 +0000122 setOperationAction(ISD::GlobalAddress, MVT::i32, Custom);
Nate Begeman28a6b022005-12-10 02:36:00 +0000123 setOperationAction(ISD::ConstantPool, MVT::i32, Custom);
Chris Lattnerb99329e2006-01-13 02:42:53 +0000124
Nate Begemanee625572006-01-27 21:09:22 +0000125 // RET must be custom lowered, to meet ABI requirements
126 setOperationAction(ISD::RET , MVT::Other, Custom);
127
Nate Begemanacc398c2006-01-25 18:21:52 +0000128 // VASTART needs to be custom lowered to use the VarArgsFrameIndex
129 setOperationAction(ISD::VASTART , MVT::Other, Custom);
130
Chris Lattnerb22c08b2006-01-15 09:02:48 +0000131 // Use the default implementation.
Nate Begemanacc398c2006-01-25 18:21:52 +0000132 setOperationAction(ISD::VAARG , MVT::Other, Expand);
133 setOperationAction(ISD::VACOPY , MVT::Other, Expand);
134 setOperationAction(ISD::VAEND , MVT::Other, Expand);
Chris Lattnerb22c08b2006-01-15 09:02:48 +0000135 setOperationAction(ISD::STACKSAVE , MVT::Other, Expand);
136 setOperationAction(ISD::STACKRESTORE , MVT::Other, Expand);
137 setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i32 , Expand);
Chris Lattner860e8862005-11-17 07:30:41 +0000138
Nate Begemanc09eeec2005-09-06 22:03:27 +0000139 if (TM.getSubtarget<PPCSubtarget>().is64Bit()) {
Nate Begeman1d9d7422005-10-18 00:28:58 +0000140 // They also have instructions for converting between i64 and fp.
Nate Begemanc09eeec2005-09-06 22:03:27 +0000141 setOperationAction(ISD::FP_TO_SINT, MVT::i64, Custom);
142 setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
Nate Begemanae749a92005-10-25 23:48:36 +0000143 // To take advantage of the above i64 FP_TO_SINT, promote i32 FP_TO_UINT
144 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Promote);
145 } else {
Chris Lattner860e8862005-11-17 07:30:41 +0000146 // PowerPC does not have FP_TO_UINT on 32-bit implementations.
Nate Begemanae749a92005-10-25 23:48:36 +0000147 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Expand);
Nate Begeman9d2b8172005-10-18 00:56:42 +0000148 }
149
150 if (TM.getSubtarget<PPCSubtarget>().has64BitRegs()) {
151 // 64 bit PowerPC implementations can support i64 types directly
152 addRegisterClass(MVT::i64, PPC::G8RCRegisterClass);
Nate Begeman1d9d7422005-10-18 00:28:58 +0000153 // BUILD_PAIR can't be handled natively, and should be expanded to shl/or
154 setOperationAction(ISD::BUILD_PAIR, MVT::i64, Expand);
Nate Begeman1d9d7422005-10-18 00:28:58 +0000155 } else {
156 // 32 bit PowerPC wants to expand i64 shifts itself.
157 setOperationAction(ISD::SHL, MVT::i64, Custom);
158 setOperationAction(ISD::SRL, MVT::i64, Custom);
159 setOperationAction(ISD::SRA, MVT::i64, Custom);
Nate Begemanc09eeec2005-09-06 22:03:27 +0000160 }
161
Evan Chengd30bf012006-03-01 01:11:20 +0000162 // First set operation action for all vector types to expand. Then we
163 // will selectively turn on ones that can be effectively codegen'd.
164 for (unsigned VT = (unsigned)MVT::Vector + 1;
165 VT != (unsigned)MVT::LAST_VALUETYPE; VT++) {
166 setOperationAction(ISD::ADD , (MVT::ValueType)VT, Expand);
167 setOperationAction(ISD::SUB , (MVT::ValueType)VT, Expand);
168 setOperationAction(ISD::MUL , (MVT::ValueType)VT, Expand);
169 setOperationAction(ISD::LOAD, (MVT::ValueType)VT, Expand);
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000170 setOperationAction(ISD::VECTOR_SHUFFLE, (MVT::ValueType)VT, Expand);
171
172 // FIXME: We don't support any BUILD_VECTOR's yet. We should custom expand
173 // the ones we do, like splat(0.0) and splat(-0.0).
174 setOperationAction(ISD::BUILD_VECTOR, (MVT::ValueType)VT, Expand);
Evan Chengd30bf012006-03-01 01:11:20 +0000175 }
176
Nate Begeman425a9692005-11-29 08:17:20 +0000177 if (TM.getSubtarget<PPCSubtarget>().hasAltivec()) {
Nate Begeman425a9692005-11-29 08:17:20 +0000178 addRegisterClass(MVT::v4f32, PPC::VRRCRegisterClass);
Nate Begeman7fd1edd2005-12-19 23:25:09 +0000179 addRegisterClass(MVT::v4i32, PPC::VRRCRegisterClass);
Chris Lattnerec4a0c72006-01-29 06:32:58 +0000180
Evan Chengd30bf012006-03-01 01:11:20 +0000181 setOperationAction(ISD::ADD , MVT::v4f32, Legal);
182 setOperationAction(ISD::SUB , MVT::v4f32, Legal);
183 setOperationAction(ISD::MUL , MVT::v4f32, Legal);
184 setOperationAction(ISD::LOAD , MVT::v4f32, Legal);
185 setOperationAction(ISD::ADD , MVT::v4i32, Legal);
186 setOperationAction(ISD::LOAD , MVT::v4i32, Legal);
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000187 setOperationAction(ISD::LOAD , MVT::v16i8, Legal);
188
189 setOperationAction(ISD::VECTOR_SHUFFLE, MVT::v4i32, Custom);
190 setOperationAction(ISD::VECTOR_SHUFFLE, MVT::v4f32, Custom);
191
Chris Lattnerb2177b92006-03-19 06:55:52 +0000192 setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4f32, Custom);
193 setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4i32, Custom);
Nate Begeman425a9692005-11-29 08:17:20 +0000194 }
195
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000196 setSetCCResultContents(ZeroOrOneSetCCResult);
Chris Lattnercadd7422006-01-13 17:52:03 +0000197 setStackPointerRegisterToSaveRestore(PPC::R1);
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000198
Chris Lattner8c13d0a2006-03-01 04:57:39 +0000199 // We have target-specific dag combine patterns for the following nodes:
200 setTargetDAGCombine(ISD::SINT_TO_FP);
Chris Lattner51269842006-03-01 05:50:56 +0000201 setTargetDAGCombine(ISD::STORE);
Chris Lattner8c13d0a2006-03-01 04:57:39 +0000202
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000203 computeRegisterProperties();
204}
205
Chris Lattnerda6d20f2006-01-09 23:52:17 +0000206const char *PPCTargetLowering::getTargetNodeName(unsigned Opcode) const {
207 switch (Opcode) {
208 default: return 0;
209 case PPCISD::FSEL: return "PPCISD::FSEL";
210 case PPCISD::FCFID: return "PPCISD::FCFID";
211 case PPCISD::FCTIDZ: return "PPCISD::FCTIDZ";
212 case PPCISD::FCTIWZ: return "PPCISD::FCTIWZ";
Chris Lattner51269842006-03-01 05:50:56 +0000213 case PPCISD::STFIWX: return "PPCISD::STFIWX";
Chris Lattnerda6d20f2006-01-09 23:52:17 +0000214 case PPCISD::VMADDFP: return "PPCISD::VMADDFP";
215 case PPCISD::VNMSUBFP: return "PPCISD::VNMSUBFP";
Chris Lattnerb2177b92006-03-19 06:55:52 +0000216 case PPCISD::LVE_X: return "PPCISD::LVE_X";
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000217 case PPCISD::VPERM: return "PPCISD::VPERM";
Chris Lattnerda6d20f2006-01-09 23:52:17 +0000218 case PPCISD::Hi: return "PPCISD::Hi";
219 case PPCISD::Lo: return "PPCISD::Lo";
220 case PPCISD::GlobalBaseReg: return "PPCISD::GlobalBaseReg";
221 case PPCISD::SRL: return "PPCISD::SRL";
222 case PPCISD::SRA: return "PPCISD::SRA";
223 case PPCISD::SHL: return "PPCISD::SHL";
Chris Lattnere00ebf02006-01-28 07:33:03 +0000224 case PPCISD::CALL: return "PPCISD::CALL";
Chris Lattnerda6d20f2006-01-09 23:52:17 +0000225 case PPCISD::RET_FLAG: return "PPCISD::RET_FLAG";
226 }
227}
228
Chris Lattner0b1e4e52005-08-26 17:36:52 +0000229/// isFloatingPointZero - Return true if this is 0.0 or -0.0.
230static bool isFloatingPointZero(SDOperand Op) {
231 if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(Op))
232 return CFP->isExactlyValue(-0.0) || CFP->isExactlyValue(0.0);
233 else if (Op.getOpcode() == ISD::EXTLOAD || Op.getOpcode() == ISD::LOAD) {
234 // Maybe this has already been legalized into the constant pool?
235 if (ConstantPoolSDNode *CP = dyn_cast<ConstantPoolSDNode>(Op.getOperand(1)))
236 if (ConstantFP *CFP = dyn_cast<ConstantFP>(CP->get()))
237 return CFP->isExactlyValue(-0.0) || CFP->isExactlyValue(0.0);
238 }
239 return false;
240}
241
Chris Lattneref819f82006-03-20 06:33:01 +0000242
243/// isSplatShuffleMask - Return true if the specified VECTOR_SHUFFLE operand
244/// specifies a splat of a single element that is suitable for input to
245/// VSPLTB/VSPLTH/VSPLTW.
246bool PPC::isSplatShuffleMask(SDNode *N) {
247 assert(N->getOpcode() == ISD::BUILD_VECTOR);
Chris Lattner88a99ef2006-03-20 06:37:44 +0000248 // This is a splat operation if each element of the permute is the same, and
249 // if the value doesn't reference the second vector.
250 SDOperand Elt = N->getOperand(0);
251 assert(isa<ConstantSDNode>(Elt) && "Invalid VECTOR_SHUFFLE mask!");
252 for (unsigned i = 1, e = N->getNumOperands(); i != e; ++i) {
253 assert(isa<ConstantSDNode>(N->getOperand(i)) &&
254 "Invalid VECTOR_SHUFFLE mask!");
255 if (N->getOperand(i) != Elt) return false;
256 }
257
258 // Make sure it is a splat of the first vector operand.
259 return cast<ConstantSDNode>(Elt)->getValue() < N->getNumOperands();
Chris Lattneref819f82006-03-20 06:33:01 +0000260}
261
262/// getVSPLTImmediate - Return the appropriate VSPLT* immediate to splat the
263/// specified isSplatShuffleMask VECTOR_SHUFFLE mask.
264unsigned PPC::getVSPLTImmediate(SDNode *N) {
265 assert(isSplatShuffleMask(N));
Chris Lattner88a99ef2006-03-20 06:37:44 +0000266 return cast<ConstantSDNode>(N)->getValue();
Chris Lattneref819f82006-03-20 06:33:01 +0000267}
268
269
270
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000271/// LowerOperation - Provide custom lowering hooks for some operations.
272///
Nate Begeman21e463b2005-10-16 05:39:50 +0000273SDOperand PPCTargetLowering::LowerOperation(SDOperand Op, SelectionDAG &DAG) {
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000274 switch (Op.getOpcode()) {
275 default: assert(0 && "Wasn't expecting to be able to lower this!");
Chris Lattnerf7605322005-08-31 21:09:52 +0000276 case ISD::FP_TO_SINT: {
Nate Begemanc09eeec2005-09-06 22:03:27 +0000277 assert(MVT::isFloatingPoint(Op.getOperand(0).getValueType()));
Chris Lattner7c0d6642005-10-02 06:37:13 +0000278 SDOperand Src = Op.getOperand(0);
279 if (Src.getValueType() == MVT::f32)
280 Src = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Src);
281
Chris Lattner1b95e0b2005-12-23 00:59:59 +0000282 SDOperand Tmp;
Nate Begemanc09eeec2005-09-06 22:03:27 +0000283 switch (Op.getValueType()) {
284 default: assert(0 && "Unhandled FP_TO_SINT type in custom expander!");
285 case MVT::i32:
Chris Lattner1b95e0b2005-12-23 00:59:59 +0000286 Tmp = DAG.getNode(PPCISD::FCTIWZ, MVT::f64, Src);
Nate Begemanc09eeec2005-09-06 22:03:27 +0000287 break;
288 case MVT::i64:
Chris Lattner1b95e0b2005-12-23 00:59:59 +0000289 Tmp = DAG.getNode(PPCISD::FCTIDZ, MVT::f64, Src);
Nate Begemanc09eeec2005-09-06 22:03:27 +0000290 break;
291 }
Chris Lattnerf7605322005-08-31 21:09:52 +0000292
Chris Lattner1b95e0b2005-12-23 00:59:59 +0000293 // Convert the FP value to an int value through memory.
294 SDOperand Bits = DAG.getNode(ISD::BIT_CONVERT, MVT::i64, Tmp);
295 if (Op.getValueType() == MVT::i32)
296 Bits = DAG.getNode(ISD::TRUNCATE, MVT::i32, Bits);
297 return Bits;
Nate Begemanc09eeec2005-09-06 22:03:27 +0000298 }
299 case ISD::SINT_TO_FP: {
300 assert(MVT::i64 == Op.getOperand(0).getValueType() &&
301 "Unhandled SINT_TO_FP type in custom expander!");
Chris Lattner1b95e0b2005-12-23 00:59:59 +0000302 SDOperand Bits = DAG.getNode(ISD::BIT_CONVERT, MVT::f64, Op.getOperand(0));
303 SDOperand FP = DAG.getNode(PPCISD::FCFID, MVT::f64, Bits);
Nate Begemanc09eeec2005-09-06 22:03:27 +0000304 if (MVT::f32 == Op.getValueType())
305 FP = DAG.getNode(ISD::FP_ROUND, MVT::f32, FP);
306 return FP;
Chris Lattnerf7605322005-08-31 21:09:52 +0000307 }
308 case ISD::SELECT_CC: {
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000309 // Turn FP only select_cc's into fsel instructions.
Chris Lattnerf7605322005-08-31 21:09:52 +0000310 if (!MVT::isFloatingPoint(Op.getOperand(0).getValueType()) ||
311 !MVT::isFloatingPoint(Op.getOperand(2).getValueType()))
312 break;
313
314 ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(4))->get();
315
316 // Cannot handle SETEQ/SETNE.
317 if (CC == ISD::SETEQ || CC == ISD::SETNE) break;
318
319 MVT::ValueType ResVT = Op.getValueType();
320 MVT::ValueType CmpVT = Op.getOperand(0).getValueType();
321 SDOperand LHS = Op.getOperand(0), RHS = Op.getOperand(1);
322 SDOperand TV = Op.getOperand(2), FV = Op.getOperand(3);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000323
Chris Lattnerf7605322005-08-31 21:09:52 +0000324 // If the RHS of the comparison is a 0.0, we don't need to do the
325 // subtraction at all.
326 if (isFloatingPointZero(RHS))
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000327 switch (CC) {
Chris Lattnerbc38dbf2006-01-18 19:42:35 +0000328 default: break; // SETUO etc aren't handled by fsel.
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000329 case ISD::SETULT:
330 case ISD::SETLT:
Chris Lattnerf7605322005-08-31 21:09:52 +0000331 std::swap(TV, FV); // fsel is natively setge, swap operands for setlt
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000332 case ISD::SETUGE:
333 case ISD::SETGE:
Chris Lattnereb255f22005-10-25 20:54:57 +0000334 if (LHS.getValueType() == MVT::f32) // Comparison is always 64-bits
335 LHS = DAG.getNode(ISD::FP_EXTEND, MVT::f64, LHS);
Chris Lattnerf7605322005-08-31 21:09:52 +0000336 return DAG.getNode(PPCISD::FSEL, ResVT, LHS, TV, FV);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000337 case ISD::SETUGT:
338 case ISD::SETGT:
Chris Lattnerf7605322005-08-31 21:09:52 +0000339 std::swap(TV, FV); // fsel is natively setge, swap operands for setlt
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000340 case ISD::SETULE:
341 case ISD::SETLE:
Chris Lattnereb255f22005-10-25 20:54:57 +0000342 if (LHS.getValueType() == MVT::f32) // Comparison is always 64-bits
343 LHS = DAG.getNode(ISD::FP_EXTEND, MVT::f64, LHS);
Chris Lattner0bbea952005-08-26 20:25:03 +0000344 return DAG.getNode(PPCISD::FSEL, ResVT,
Chris Lattner85fd97d2005-10-26 18:01:11 +0000345 DAG.getNode(ISD::FNEG, MVT::f64, LHS), TV, FV);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000346 }
Chris Lattnerf7605322005-08-31 21:09:52 +0000347
Chris Lattnereb255f22005-10-25 20:54:57 +0000348 SDOperand Cmp;
Chris Lattnerf7605322005-08-31 21:09:52 +0000349 switch (CC) {
Chris Lattnerbc38dbf2006-01-18 19:42:35 +0000350 default: break; // SETUO etc aren't handled by fsel.
Chris Lattnerf7605322005-08-31 21:09:52 +0000351 case ISD::SETULT:
352 case ISD::SETLT:
Chris Lattnereb255f22005-10-25 20:54:57 +0000353 Cmp = DAG.getNode(ISD::FSUB, CmpVT, LHS, RHS);
354 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
355 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
356 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, FV, TV);
Chris Lattnerf7605322005-08-31 21:09:52 +0000357 case ISD::SETUGE:
358 case ISD::SETGE:
Chris Lattnereb255f22005-10-25 20:54:57 +0000359 Cmp = DAG.getNode(ISD::FSUB, CmpVT, LHS, RHS);
360 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
361 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
362 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, TV, FV);
Chris Lattnerf7605322005-08-31 21:09:52 +0000363 case ISD::SETUGT:
364 case ISD::SETGT:
Chris Lattnereb255f22005-10-25 20:54:57 +0000365 Cmp = DAG.getNode(ISD::FSUB, CmpVT, RHS, LHS);
366 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
367 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
368 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, FV, TV);
Chris Lattnerf7605322005-08-31 21:09:52 +0000369 case ISD::SETULE:
370 case ISD::SETLE:
Chris Lattnereb255f22005-10-25 20:54:57 +0000371 Cmp = DAG.getNode(ISD::FSUB, CmpVT, RHS, LHS);
372 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
373 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
374 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, TV, FV);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000375 }
Chris Lattnerf7605322005-08-31 21:09:52 +0000376 break;
377 }
Chris Lattnerbc11c342005-08-31 20:23:54 +0000378 case ISD::SHL: {
379 assert(Op.getValueType() == MVT::i64 &&
380 Op.getOperand(1).getValueType() == MVT::i32 && "Unexpected SHL!");
381 // The generic code does a fine job expanding shift by a constant.
382 if (isa<ConstantSDNode>(Op.getOperand(1))) break;
383
384 // Otherwise, expand into a bunch of logical ops. Note that these ops
385 // depend on the PPC behavior for oversized shift amounts.
386 SDOperand Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
387 DAG.getConstant(0, MVT::i32));
388 SDOperand Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
389 DAG.getConstant(1, MVT::i32));
390 SDOperand Amt = Op.getOperand(1);
391
392 SDOperand Tmp1 = DAG.getNode(ISD::SUB, MVT::i32,
393 DAG.getConstant(32, MVT::i32), Amt);
Chris Lattner4172b102005-12-06 02:10:38 +0000394 SDOperand Tmp2 = DAG.getNode(PPCISD::SHL, MVT::i32, Hi, Amt);
395 SDOperand Tmp3 = DAG.getNode(PPCISD::SRL, MVT::i32, Lo, Tmp1);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000396 SDOperand Tmp4 = DAG.getNode(ISD::OR , MVT::i32, Tmp2, Tmp3);
397 SDOperand Tmp5 = DAG.getNode(ISD::ADD, MVT::i32, Amt,
398 DAG.getConstant(-32U, MVT::i32));
Chris Lattner4172b102005-12-06 02:10:38 +0000399 SDOperand Tmp6 = DAG.getNode(PPCISD::SHL, MVT::i32, Lo, Tmp5);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000400 SDOperand OutHi = DAG.getNode(ISD::OR, MVT::i32, Tmp4, Tmp6);
Chris Lattner4172b102005-12-06 02:10:38 +0000401 SDOperand OutLo = DAG.getNode(PPCISD::SHL, MVT::i32, Lo, Amt);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000402 return DAG.getNode(ISD::BUILD_PAIR, MVT::i64, OutLo, OutHi);
403 }
404 case ISD::SRL: {
405 assert(Op.getValueType() == MVT::i64 &&
406 Op.getOperand(1).getValueType() == MVT::i32 && "Unexpected SHL!");
407 // The generic code does a fine job expanding shift by a constant.
408 if (isa<ConstantSDNode>(Op.getOperand(1))) break;
409
410 // Otherwise, expand into a bunch of logical ops. Note that these ops
411 // depend on the PPC behavior for oversized shift amounts.
412 SDOperand Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
413 DAG.getConstant(0, MVT::i32));
414 SDOperand Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
415 DAG.getConstant(1, MVT::i32));
416 SDOperand Amt = Op.getOperand(1);
417
418 SDOperand Tmp1 = DAG.getNode(ISD::SUB, MVT::i32,
419 DAG.getConstant(32, MVT::i32), Amt);
Chris Lattner4172b102005-12-06 02:10:38 +0000420 SDOperand Tmp2 = DAG.getNode(PPCISD::SRL, MVT::i32, Lo, Amt);
421 SDOperand Tmp3 = DAG.getNode(PPCISD::SHL, MVT::i32, Hi, Tmp1);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000422 SDOperand Tmp4 = DAG.getNode(ISD::OR , MVT::i32, Tmp2, Tmp3);
423 SDOperand Tmp5 = DAG.getNode(ISD::ADD, MVT::i32, Amt,
424 DAG.getConstant(-32U, MVT::i32));
Chris Lattner4172b102005-12-06 02:10:38 +0000425 SDOperand Tmp6 = DAG.getNode(PPCISD::SRL, MVT::i32, Hi, Tmp5);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000426 SDOperand OutLo = DAG.getNode(ISD::OR, MVT::i32, Tmp4, Tmp6);
Chris Lattner4172b102005-12-06 02:10:38 +0000427 SDOperand OutHi = DAG.getNode(PPCISD::SRL, MVT::i32, Hi, Amt);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000428 return DAG.getNode(ISD::BUILD_PAIR, MVT::i64, OutLo, OutHi);
429 }
430 case ISD::SRA: {
Chris Lattnereb9b62e2005-08-31 19:09:57 +0000431 assert(Op.getValueType() == MVT::i64 &&
432 Op.getOperand(1).getValueType() == MVT::i32 && "Unexpected SRA!");
433 // The generic code does a fine job expanding shift by a constant.
434 if (isa<ConstantSDNode>(Op.getOperand(1))) break;
435
436 // Otherwise, expand into a bunch of logical ops, followed by a select_cc.
437 SDOperand Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
438 DAG.getConstant(0, MVT::i32));
439 SDOperand Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
440 DAG.getConstant(1, MVT::i32));
441 SDOperand Amt = Op.getOperand(1);
442
443 SDOperand Tmp1 = DAG.getNode(ISD::SUB, MVT::i32,
444 DAG.getConstant(32, MVT::i32), Amt);
Chris Lattner4172b102005-12-06 02:10:38 +0000445 SDOperand Tmp2 = DAG.getNode(PPCISD::SRL, MVT::i32, Lo, Amt);
446 SDOperand Tmp3 = DAG.getNode(PPCISD::SHL, MVT::i32, Hi, Tmp1);
Chris Lattnereb9b62e2005-08-31 19:09:57 +0000447 SDOperand Tmp4 = DAG.getNode(ISD::OR , MVT::i32, Tmp2, Tmp3);
448 SDOperand Tmp5 = DAG.getNode(ISD::ADD, MVT::i32, Amt,
449 DAG.getConstant(-32U, MVT::i32));
Chris Lattner4172b102005-12-06 02:10:38 +0000450 SDOperand Tmp6 = DAG.getNode(PPCISD::SRA, MVT::i32, Hi, Tmp5);
451 SDOperand OutHi = DAG.getNode(PPCISD::SRA, MVT::i32, Hi, Amt);
Chris Lattnereb9b62e2005-08-31 19:09:57 +0000452 SDOperand OutLo = DAG.getSelectCC(Tmp5, DAG.getConstant(0, MVT::i32),
453 Tmp4, Tmp6, ISD::SETLE);
454 return DAG.getNode(ISD::BUILD_PAIR, MVT::i64, OutLo, OutHi);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000455 }
Nate Begeman28a6b022005-12-10 02:36:00 +0000456 case ISD::ConstantPool: {
Evan Chengb8973bd2006-01-31 22:23:14 +0000457 ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(Op);
458 Constant *C = CP->get();
459 SDOperand CPI = DAG.getTargetConstantPool(C, MVT::i32, CP->getAlignment());
Nate Begeman28a6b022005-12-10 02:36:00 +0000460 SDOperand Zero = DAG.getConstant(0, MVT::i32);
461
Evan Cheng4c1aa862006-02-22 20:19:42 +0000462 if (getTargetMachine().getRelocationModel() == Reloc::Static) {
Nate Begeman28a6b022005-12-10 02:36:00 +0000463 // Generate non-pic code that has direct accesses to the constant pool.
464 // The address of the global is just (hi(&g)+lo(&g)).
465 SDOperand Hi = DAG.getNode(PPCISD::Hi, MVT::i32, CPI, Zero);
466 SDOperand Lo = DAG.getNode(PPCISD::Lo, MVT::i32, CPI, Zero);
467 return DAG.getNode(ISD::ADD, MVT::i32, Hi, Lo);
468 }
469
470 // Only lower ConstantPool on Darwin.
471 if (!getTargetMachine().getSubtarget<PPCSubtarget>().isDarwin()) break;
472 SDOperand Hi = DAG.getNode(PPCISD::Hi, MVT::i32, CPI, Zero);
Evan Cheng4c1aa862006-02-22 20:19:42 +0000473 if (getTargetMachine().getRelocationModel() == Reloc::PIC) {
Nate Begeman28a6b022005-12-10 02:36:00 +0000474 // With PIC, the first instruction is actually "GR+hi(&G)".
475 Hi = DAG.getNode(ISD::ADD, MVT::i32,
476 DAG.getNode(PPCISD::GlobalBaseReg, MVT::i32), Hi);
477 }
478
479 SDOperand Lo = DAG.getNode(PPCISD::Lo, MVT::i32, CPI, Zero);
480 Lo = DAG.getNode(ISD::ADD, MVT::i32, Hi, Lo);
481 return Lo;
482 }
Chris Lattner860e8862005-11-17 07:30:41 +0000483 case ISD::GlobalAddress: {
Nate Begeman50fb3c42005-12-24 01:00:15 +0000484 GlobalAddressSDNode *GSDN = cast<GlobalAddressSDNode>(Op);
485 GlobalValue *GV = GSDN->getGlobal();
486 SDOperand GA = DAG.getTargetGlobalAddress(GV, MVT::i32, GSDN->getOffset());
Chris Lattner860e8862005-11-17 07:30:41 +0000487 SDOperand Zero = DAG.getConstant(0, MVT::i32);
Chris Lattner1d05cb42005-11-17 18:55:48 +0000488
Evan Cheng4c1aa862006-02-22 20:19:42 +0000489 if (getTargetMachine().getRelocationModel() == Reloc::Static) {
Nate Begeman28a6b022005-12-10 02:36:00 +0000490 // Generate non-pic code that has direct accesses to globals.
491 // The address of the global is just (hi(&g)+lo(&g)).
Chris Lattner1d05cb42005-11-17 18:55:48 +0000492 SDOperand Hi = DAG.getNode(PPCISD::Hi, MVT::i32, GA, Zero);
493 SDOperand Lo = DAG.getNode(PPCISD::Lo, MVT::i32, GA, Zero);
494 return DAG.getNode(ISD::ADD, MVT::i32, Hi, Lo);
495 }
Chris Lattner860e8862005-11-17 07:30:41 +0000496
Chris Lattner1d05cb42005-11-17 18:55:48 +0000497 // Only lower GlobalAddress on Darwin.
498 if (!getTargetMachine().getSubtarget<PPCSubtarget>().isDarwin()) break;
Chris Lattnera35ef632006-01-06 01:04:03 +0000499
Chris Lattner860e8862005-11-17 07:30:41 +0000500 SDOperand Hi = DAG.getNode(PPCISD::Hi, MVT::i32, GA, Zero);
Evan Cheng4c1aa862006-02-22 20:19:42 +0000501 if (getTargetMachine().getRelocationModel() == Reloc::PIC) {
Chris Lattner860e8862005-11-17 07:30:41 +0000502 // With PIC, the first instruction is actually "GR+hi(&G)".
503 Hi = DAG.getNode(ISD::ADD, MVT::i32,
Chris Lattner15666132005-11-17 17:51:38 +0000504 DAG.getNode(PPCISD::GlobalBaseReg, MVT::i32), Hi);
Chris Lattner860e8862005-11-17 07:30:41 +0000505 }
506
507 SDOperand Lo = DAG.getNode(PPCISD::Lo, MVT::i32, GA, Zero);
508 Lo = DAG.getNode(ISD::ADD, MVT::i32, Hi, Lo);
509
Chris Lattner37dd6f12006-01-29 20:49:17 +0000510 if (!GV->hasWeakLinkage() && !GV->hasLinkOnceLinkage() &&
511 (!GV->isExternal() || GV->hasNotBeenReadFromBytecode()))
Chris Lattner860e8862005-11-17 07:30:41 +0000512 return Lo;
513
514 // If the global is weak or external, we have to go through the lazy
515 // resolution stub.
516 return DAG.getLoad(MVT::i32, DAG.getEntryNode(), Lo, DAG.getSrcValue(0));
517 }
Nate Begeman44775902006-01-31 08:17:29 +0000518 case ISD::SETCC: {
519 ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(2))->get();
Nate Begeman750ac1b2006-02-01 07:19:44 +0000520
521 // If we're comparing for equality to zero, expose the fact that this is
522 // implemented as a ctlz/srl pair on ppc, so that the dag combiner can
523 // fold the new nodes.
524 if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
525 if (C->isNullValue() && CC == ISD::SETEQ) {
526 MVT::ValueType VT = Op.getOperand(0).getValueType();
527 SDOperand Zext = Op.getOperand(0);
528 if (VT < MVT::i32) {
529 VT = MVT::i32;
530 Zext = DAG.getNode(ISD::ZERO_EXTEND, VT, Op.getOperand(0));
531 }
532 unsigned Log2b = Log2_32(MVT::getSizeInBits(VT));
533 SDOperand Clz = DAG.getNode(ISD::CTLZ, VT, Zext);
534 SDOperand Scc = DAG.getNode(ISD::SRL, VT, Clz,
535 DAG.getConstant(Log2b, getShiftAmountTy()));
536 return DAG.getNode(ISD::TRUNCATE, getSetCCResultTy(), Scc);
537 }
538 // Leave comparisons against 0 and -1 alone for now, since they're usually
539 // optimized. FIXME: revisit this when we can custom lower all setcc
540 // optimizations.
541 if (C->isAllOnesValue() || C->isNullValue())
542 break;
543 }
544
545 // If we have an integer seteq/setne, turn it into a compare against zero
546 // by subtracting the rhs from the lhs, which is faster than setting a
547 // condition register, reading it back out, and masking the correct bit.
548 MVT::ValueType LHSVT = Op.getOperand(0).getValueType();
549 if (MVT::isInteger(LHSVT) && (CC == ISD::SETEQ || CC == ISD::SETNE)) {
550 MVT::ValueType VT = Op.getValueType();
551 SDOperand Sub = DAG.getNode(ISD::SUB, LHSVT, Op.getOperand(0),
552 Op.getOperand(1));
553 return DAG.getSetCC(VT, Sub, DAG.getConstant(0, LHSVT), CC);
554 }
Nate Begeman44775902006-01-31 08:17:29 +0000555 break;
556 }
Nate Begemanacc398c2006-01-25 18:21:52 +0000557 case ISD::VASTART: {
558 // vastart just stores the address of the VarArgsFrameIndex slot into the
559 // memory location argument.
560 // FIXME: Replace MVT::i32 with PointerTy
561 SDOperand FR = DAG.getFrameIndex(VarArgsFrameIndex, MVT::i32);
562 return DAG.getNode(ISD::STORE, MVT::Other, Op.getOperand(0), FR,
563 Op.getOperand(1), Op.getOperand(2));
564 }
Nate Begemanee625572006-01-27 21:09:22 +0000565 case ISD::RET: {
566 SDOperand Copy;
567
568 switch(Op.getNumOperands()) {
569 default:
570 assert(0 && "Do not know how to return this many arguments!");
571 abort();
572 case 1:
573 return SDOperand(); // ret void is legal
574 case 2: {
575 MVT::ValueType ArgVT = Op.getOperand(1).getValueType();
576 unsigned ArgReg = MVT::isInteger(ArgVT) ? PPC::R3 : PPC::F1;
577 Copy = DAG.getCopyToReg(Op.getOperand(0), ArgReg, Op.getOperand(1),
578 SDOperand());
579 break;
580 }
581 case 3:
582 Copy = DAG.getCopyToReg(Op.getOperand(0), PPC::R3, Op.getOperand(2),
583 SDOperand());
584 Copy = DAG.getCopyToReg(Copy, PPC::R4, Op.getOperand(1),Copy.getValue(1));
585 break;
586 }
587 return DAG.getNode(PPCISD::RET_FLAG, MVT::Other, Copy, Copy.getValue(1));
588 }
Chris Lattnerb2177b92006-03-19 06:55:52 +0000589 case ISD::SCALAR_TO_VECTOR: {
590 // Create a stack slot that is 16-byte aligned.
591 MachineFrameInfo *FrameInfo = DAG.getMachineFunction().getFrameInfo();
592 int FrameIdx = FrameInfo->CreateStackObject(16, 16);
593 SDOperand FIdx = DAG.getFrameIndex(FrameIdx, MVT::i32);
594
595 // Store the input value into Value#0 of the stack slot.
596 unsigned InSize = MVT::getSizeInBits(Op.getOperand(0).getValueType())/8;
597 FIdx = DAG.getNode(ISD::ADD, MVT::i32, FIdx,
598 DAG.getConstant(16-InSize, MVT::i32));
599 SDOperand Store = DAG.getNode(ISD::STORE, MVT::Other, DAG.getEntryNode(),
600 Op.getOperand(0), FIdx,DAG.getSrcValue(NULL));
601 return DAG.getNode(PPCISD::LVE_X, Op.getValueType(), Store, FIdx,
602 DAG.getSrcValue(NULL));
603 }
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000604 case ISD::VECTOR_SHUFFLE: {
605 // FIXME: Cases that are handled by instructions that take permute
606 // immediates (such as vsplt*) shouldn't be lowered here! Also handle cases
607 // that are cheaper to do as multiple such instructions than as a constant
608 // pool load/vperm pair.
609
610 // Lower this to a VPERM(V1, V2, V3) expression, where V3 is a constant
611 // vector that will get spilled to the constant pool.
612 SDOperand V1 = Op.getOperand(0);
613 SDOperand V2 = Op.getOperand(1);
614 if (V2.getOpcode() == ISD::UNDEF) V2 = V1;
615 SDOperand PermMask = Op.getOperand(2);
616
617 // The SHUFFLE_VECTOR mask is almost exactly what we want for vperm, except
618 // that it is in input element units, not in bytes. Convert now.
619 MVT::ValueType EltVT = MVT::getVectorBaseType(V1.getValueType());
620 unsigned BytesPerElement = MVT::getSizeInBits(EltVT)/8;
621
622 std::vector<SDOperand> ResultMask;
623 for (unsigned i = 0, e = PermMask.getNumOperands(); i != e; ++i) {
624 unsigned SrcElt =cast<ConstantSDNode>(PermMask.getOperand(i))->getValue();
625
626 for (unsigned j = 0; j != BytesPerElement; ++j)
627 ResultMask.push_back(DAG.getConstant(SrcElt*BytesPerElement+j,
628 MVT::i8));
629 }
630
631 SDOperand VPermMask =DAG.getNode(ISD::BUILD_VECTOR, MVT::v16i8, ResultMask);
632 return DAG.getNode(PPCISD::VPERM, V1.getValueType(), V1, V2, VPermMask);
633 }
Chris Lattnerbc11c342005-08-31 20:23:54 +0000634 }
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000635 return SDOperand();
636}
637
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000638std::vector<SDOperand>
Nate Begeman21e463b2005-10-16 05:39:50 +0000639PPCTargetLowering::LowerArguments(Function &F, SelectionDAG &DAG) {
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000640 //
641 // add beautiful description of PPC stack frame format, or at least some docs
642 //
643 MachineFunction &MF = DAG.getMachineFunction();
644 MachineFrameInfo *MFI = MF.getFrameInfo();
645 MachineBasicBlock& BB = MF.front();
Chris Lattner7b738342005-09-13 19:33:40 +0000646 SSARegMap *RegMap = MF.getSSARegMap();
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000647 std::vector<SDOperand> ArgValues;
648
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000649 unsigned ArgOffset = 24;
650 unsigned GPR_remaining = 8;
651 unsigned FPR_remaining = 13;
652 unsigned GPR_idx = 0, FPR_idx = 0;
653 static const unsigned GPR[] = {
654 PPC::R3, PPC::R4, PPC::R5, PPC::R6,
655 PPC::R7, PPC::R8, PPC::R9, PPC::R10,
656 };
657 static const unsigned FPR[] = {
658 PPC::F1, PPC::F2, PPC::F3, PPC::F4, PPC::F5, PPC::F6, PPC::F7,
659 PPC::F8, PPC::F9, PPC::F10, PPC::F11, PPC::F12, PPC::F13
660 };
661
662 // Add DAG nodes to load the arguments... On entry to a function on PPC,
663 // the arguments start at offset 24, although they are likely to be passed
664 // in registers.
665 for (Function::arg_iterator I = F.arg_begin(), E = F.arg_end(); I != E; ++I) {
666 SDOperand newroot, argt;
667 unsigned ObjSize;
668 bool needsLoad = false;
669 bool ArgLive = !I->use_empty();
670 MVT::ValueType ObjectVT = getValueType(I->getType());
671
672 switch (ObjectVT) {
Chris Lattner915fb302005-08-30 00:19:00 +0000673 default: assert(0 && "Unhandled argument type!");
674 case MVT::i1:
675 case MVT::i8:
676 case MVT::i16:
677 case MVT::i32:
678 ObjSize = 4;
679 if (!ArgLive) break;
680 if (GPR_remaining > 0) {
Nate Begeman1d9d7422005-10-18 00:28:58 +0000681 unsigned VReg = RegMap->createVirtualRegister(&PPC::GPRCRegClass);
Chris Lattner7b738342005-09-13 19:33:40 +0000682 MF.addLiveIn(GPR[GPR_idx], VReg);
683 argt = newroot = DAG.getCopyFromReg(DAG.getRoot(), VReg, MVT::i32);
Nate Begeman49296f12005-08-31 01:58:39 +0000684 if (ObjectVT != MVT::i32) {
685 unsigned AssertOp = I->getType()->isSigned() ? ISD::AssertSext
686 : ISD::AssertZext;
687 argt = DAG.getNode(AssertOp, MVT::i32, argt,
688 DAG.getValueType(ObjectVT));
689 argt = DAG.getNode(ISD::TRUNCATE, ObjectVT, argt);
690 }
Chris Lattner915fb302005-08-30 00:19:00 +0000691 } else {
692 needsLoad = true;
693 }
694 break;
Chris Lattner80720a92005-11-30 20:40:54 +0000695 case MVT::i64:
696 ObjSize = 8;
Chris Lattner915fb302005-08-30 00:19:00 +0000697 if (!ArgLive) break;
698 if (GPR_remaining > 0) {
699 SDOperand argHi, argLo;
Nate Begeman1d9d7422005-10-18 00:28:58 +0000700 unsigned VReg = RegMap->createVirtualRegister(&PPC::GPRCRegClass);
Chris Lattner7b738342005-09-13 19:33:40 +0000701 MF.addLiveIn(GPR[GPR_idx], VReg);
702 argHi = DAG.getCopyFromReg(DAG.getRoot(), VReg, MVT::i32);
Chris Lattner915fb302005-08-30 00:19:00 +0000703 // If we have two or more remaining argument registers, then both halves
704 // of the i64 can be sourced from there. Otherwise, the lower half will
705 // have to come off the stack. This can happen when an i64 is preceded
706 // by 28 bytes of arguments.
707 if (GPR_remaining > 1) {
Nate Begeman1d9d7422005-10-18 00:28:58 +0000708 unsigned VReg = RegMap->createVirtualRegister(&PPC::GPRCRegClass);
Chris Lattner7b738342005-09-13 19:33:40 +0000709 MF.addLiveIn(GPR[GPR_idx+1], VReg);
710 argLo = DAG.getCopyFromReg(argHi, VReg, MVT::i32);
Chris Lattner915fb302005-08-30 00:19:00 +0000711 } else {
712 int FI = MFI->CreateFixedObject(4, ArgOffset+4);
713 SDOperand FIN = DAG.getFrameIndex(FI, MVT::i32);
714 argLo = DAG.getLoad(MVT::i32, DAG.getEntryNode(), FIN,
715 DAG.getSrcValue(NULL));
716 }
717 // Build the outgoing arg thingy
718 argt = DAG.getNode(ISD::BUILD_PAIR, MVT::i64, argLo, argHi);
719 newroot = argLo;
720 } else {
721 needsLoad = true;
722 }
723 break;
724 case MVT::f32:
725 case MVT::f64:
726 ObjSize = (ObjectVT == MVT::f64) ? 8 : 4;
Chris Lattner413b9792006-01-11 18:21:25 +0000727 if (!ArgLive) {
728 if (FPR_remaining > 0) {
729 --FPR_remaining;
730 ++FPR_idx;
731 }
732 break;
733 }
Chris Lattner915fb302005-08-30 00:19:00 +0000734 if (FPR_remaining > 0) {
Chris Lattner919c0322005-10-01 01:35:02 +0000735 unsigned VReg;
736 if (ObjectVT == MVT::f32)
Nate Begeman1d9d7422005-10-18 00:28:58 +0000737 VReg = RegMap->createVirtualRegister(&PPC::F4RCRegClass);
Chris Lattner919c0322005-10-01 01:35:02 +0000738 else
Nate Begeman1d9d7422005-10-18 00:28:58 +0000739 VReg = RegMap->createVirtualRegister(&PPC::F8RCRegClass);
Chris Lattner7b738342005-09-13 19:33:40 +0000740 MF.addLiveIn(FPR[FPR_idx], VReg);
741 argt = newroot = DAG.getCopyFromReg(DAG.getRoot(), VReg, ObjectVT);
Chris Lattner915fb302005-08-30 00:19:00 +0000742 --FPR_remaining;
743 ++FPR_idx;
744 } else {
745 needsLoad = true;
746 }
747 break;
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000748 }
749
750 // We need to load the argument to a virtual register if we determined above
751 // that we ran out of physical registers of the appropriate type
752 if (needsLoad) {
753 unsigned SubregOffset = 0;
754 if (ObjectVT == MVT::i8 || ObjectVT == MVT::i1) SubregOffset = 3;
755 if (ObjectVT == MVT::i16) SubregOffset = 2;
756 int FI = MFI->CreateFixedObject(ObjSize, ArgOffset);
757 SDOperand FIN = DAG.getFrameIndex(FI, MVT::i32);
758 FIN = DAG.getNode(ISD::ADD, MVT::i32, FIN,
759 DAG.getConstant(SubregOffset, MVT::i32));
760 argt = newroot = DAG.getLoad(ObjectVT, DAG.getEntryNode(), FIN,
761 DAG.getSrcValue(NULL));
762 }
763
764 // Every 4 bytes of argument space consumes one of the GPRs available for
765 // argument passing.
766 if (GPR_remaining > 0) {
767 unsigned delta = (GPR_remaining > 1 && ObjSize == 8) ? 2 : 1;
768 GPR_remaining -= delta;
769 GPR_idx += delta;
770 }
771 ArgOffset += ObjSize;
772 if (newroot.Val)
773 DAG.setRoot(newroot.getValue(1));
774
775 ArgValues.push_back(argt);
776 }
777
778 // If the function takes variable number of arguments, make a frame index for
779 // the start of the first vararg value... for expansion of llvm.va_start.
780 if (F.isVarArg()) {
781 VarArgsFrameIndex = MFI->CreateFixedObject(4, ArgOffset);
782 SDOperand FIN = DAG.getFrameIndex(VarArgsFrameIndex, MVT::i32);
783 // If this function is vararg, store any remaining integer argument regs
784 // to their spots on the stack so that they may be loaded by deferencing the
785 // result of va_next.
786 std::vector<SDOperand> MemOps;
787 for (; GPR_remaining > 0; --GPR_remaining, ++GPR_idx) {
Nate Begeman1d9d7422005-10-18 00:28:58 +0000788 unsigned VReg = RegMap->createVirtualRegister(&PPC::GPRCRegClass);
Chris Lattner7b738342005-09-13 19:33:40 +0000789 MF.addLiveIn(GPR[GPR_idx], VReg);
790 SDOperand Val = DAG.getCopyFromReg(DAG.getRoot(), VReg, MVT::i32);
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000791 SDOperand Store = DAG.getNode(ISD::STORE, MVT::Other, Val.getValue(1),
792 Val, FIN, DAG.getSrcValue(NULL));
793 MemOps.push_back(Store);
794 // Increment the address by four for the next argument to store
795 SDOperand PtrOff = DAG.getConstant(4, getPointerTy());
796 FIN = DAG.getNode(ISD::ADD, MVT::i32, FIN, PtrOff);
797 }
Chris Lattner80720a92005-11-30 20:40:54 +0000798 if (!MemOps.empty()) {
799 MemOps.push_back(DAG.getRoot());
800 DAG.setRoot(DAG.getNode(ISD::TokenFactor, MVT::Other, MemOps));
801 }
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000802 }
803
804 // Finally, inform the code generator which regs we return values in.
805 switch (getValueType(F.getReturnType())) {
806 default: assert(0 && "Unknown type!");
807 case MVT::isVoid: break;
808 case MVT::i1:
809 case MVT::i8:
810 case MVT::i16:
811 case MVT::i32:
812 MF.addLiveOut(PPC::R3);
813 break;
814 case MVT::i64:
815 MF.addLiveOut(PPC::R3);
816 MF.addLiveOut(PPC::R4);
817 break;
818 case MVT::f32:
819 case MVT::f64:
820 MF.addLiveOut(PPC::F1);
821 break;
822 }
823
824 return ArgValues;
825}
826
827std::pair<SDOperand, SDOperand>
Nate Begeman21e463b2005-10-16 05:39:50 +0000828PPCTargetLowering::LowerCallTo(SDOperand Chain,
829 const Type *RetTy, bool isVarArg,
830 unsigned CallingConv, bool isTailCall,
831 SDOperand Callee, ArgListTy &Args,
832 SelectionDAG &DAG) {
Chris Lattner281b55e2006-01-27 23:34:02 +0000833 // args_to_use will accumulate outgoing args for the PPCISD::CALL case in
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000834 // SelectExpr to use to put the arguments in the appropriate registers.
835 std::vector<SDOperand> args_to_use;
836
837 // Count how many bytes are to be pushed on the stack, including the linkage
838 // area, and parameter passing area.
839 unsigned NumBytes = 24;
840
841 if (Args.empty()) {
Chris Lattner45b39762006-02-13 08:55:29 +0000842 Chain = DAG.getCALLSEQ_START(Chain,
843 DAG.getConstant(NumBytes, getPointerTy()));
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000844 } else {
Chris Lattner915fb302005-08-30 00:19:00 +0000845 for (unsigned i = 0, e = Args.size(); i != e; ++i) {
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000846 switch (getValueType(Args[i].second)) {
Chris Lattner915fb302005-08-30 00:19:00 +0000847 default: assert(0 && "Unknown value type!");
848 case MVT::i1:
849 case MVT::i8:
850 case MVT::i16:
851 case MVT::i32:
852 case MVT::f32:
853 NumBytes += 4;
854 break;
855 case MVT::i64:
856 case MVT::f64:
857 NumBytes += 8;
858 break;
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000859 }
Chris Lattner915fb302005-08-30 00:19:00 +0000860 }
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000861
Chris Lattner915fb302005-08-30 00:19:00 +0000862 // Just to be safe, we'll always reserve the full 24 bytes of linkage area
863 // plus 32 bytes of argument space in case any called code gets funky on us.
864 // (Required by ABI to support var arg)
865 if (NumBytes < 56) NumBytes = 56;
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000866
867 // Adjust the stack pointer for the new arguments...
868 // These operations are automatically eliminated by the prolog/epilog pass
Chris Lattner45b39762006-02-13 08:55:29 +0000869 Chain = DAG.getCALLSEQ_START(Chain,
870 DAG.getConstant(NumBytes, getPointerTy()));
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000871
872 // Set up a copy of the stack pointer for use loading and storing any
873 // arguments that may not fit in the registers available for argument
874 // passing.
Chris Lattnera243db82006-01-11 19:55:07 +0000875 SDOperand StackPtr = DAG.getRegister(PPC::R1, MVT::i32);
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000876
877 // Figure out which arguments are going to go in registers, and which in
878 // memory. Also, if this is a vararg function, floating point operations
879 // must be stored to our stack, and loaded into integer regs as well, if
880 // any integer regs are available for argument passing.
881 unsigned ArgOffset = 24;
882 unsigned GPR_remaining = 8;
883 unsigned FPR_remaining = 13;
884
885 std::vector<SDOperand> MemOps;
886 for (unsigned i = 0, e = Args.size(); i != e; ++i) {
887 // PtrOff will be used to store the current argument to the stack if a
888 // register cannot be found for it.
889 SDOperand PtrOff = DAG.getConstant(ArgOffset, getPointerTy());
890 PtrOff = DAG.getNode(ISD::ADD, MVT::i32, StackPtr, PtrOff);
891 MVT::ValueType ArgVT = getValueType(Args[i].second);
892
893 switch (ArgVT) {
Chris Lattner915fb302005-08-30 00:19:00 +0000894 default: assert(0 && "Unexpected ValueType for argument!");
895 case MVT::i1:
896 case MVT::i8:
897 case MVT::i16:
898 // Promote the integer to 32 bits. If the input type is signed use a
899 // sign extend, otherwise use a zero extend.
900 if (Args[i].second->isSigned())
901 Args[i].first =DAG.getNode(ISD::SIGN_EXTEND, MVT::i32, Args[i].first);
902 else
903 Args[i].first =DAG.getNode(ISD::ZERO_EXTEND, MVT::i32, Args[i].first);
904 // FALL THROUGH
905 case MVT::i32:
906 if (GPR_remaining > 0) {
907 args_to_use.push_back(Args[i].first);
908 --GPR_remaining;
909 } else {
910 MemOps.push_back(DAG.getNode(ISD::STORE, MVT::Other, Chain,
911 Args[i].first, PtrOff,
912 DAG.getSrcValue(NULL)));
913 }
914 ArgOffset += 4;
915 break;
916 case MVT::i64:
917 // If we have one free GPR left, we can place the upper half of the i64
918 // in it, and store the other half to the stack. If we have two or more
919 // free GPRs, then we can pass both halves of the i64 in registers.
920 if (GPR_remaining > 0) {
921 SDOperand Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32,
922 Args[i].first, DAG.getConstant(1, MVT::i32));
923 SDOperand Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32,
924 Args[i].first, DAG.getConstant(0, MVT::i32));
925 args_to_use.push_back(Hi);
926 --GPR_remaining;
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000927 if (GPR_remaining > 0) {
Chris Lattner915fb302005-08-30 00:19:00 +0000928 args_to_use.push_back(Lo);
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000929 --GPR_remaining;
930 } else {
Chris Lattner915fb302005-08-30 00:19:00 +0000931 SDOperand ConstFour = DAG.getConstant(4, getPointerTy());
932 PtrOff = DAG.getNode(ISD::ADD, MVT::i32, PtrOff, ConstFour);
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000933 MemOps.push_back(DAG.getNode(ISD::STORE, MVT::Other, Chain,
Chris Lattner915fb302005-08-30 00:19:00 +0000934 Lo, PtrOff, DAG.getSrcValue(NULL)));
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000935 }
Chris Lattner915fb302005-08-30 00:19:00 +0000936 } else {
937 MemOps.push_back(DAG.getNode(ISD::STORE, MVT::Other, Chain,
938 Args[i].first, PtrOff,
939 DAG.getSrcValue(NULL)));
940 }
941 ArgOffset += 8;
942 break;
943 case MVT::f32:
944 case MVT::f64:
945 if (FPR_remaining > 0) {
946 args_to_use.push_back(Args[i].first);
947 --FPR_remaining;
948 if (isVarArg) {
949 SDOperand Store = DAG.getNode(ISD::STORE, MVT::Other, Chain,
950 Args[i].first, PtrOff,
951 DAG.getSrcValue(NULL));
952 MemOps.push_back(Store);
953 // Float varargs are always shadowed in available integer registers
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000954 if (GPR_remaining > 0) {
Chris Lattner915fb302005-08-30 00:19:00 +0000955 SDOperand Load = DAG.getLoad(MVT::i32, Store, PtrOff,
956 DAG.getSrcValue(NULL));
Chris Lattner1df74782005-11-17 18:30:17 +0000957 MemOps.push_back(Load.getValue(1));
Chris Lattner915fb302005-08-30 00:19:00 +0000958 args_to_use.push_back(Load);
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000959 --GPR_remaining;
Chris Lattner915fb302005-08-30 00:19:00 +0000960 }
961 if (GPR_remaining > 0 && MVT::f64 == ArgVT) {
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000962 SDOperand ConstFour = DAG.getConstant(4, getPointerTy());
963 PtrOff = DAG.getNode(ISD::ADD, MVT::i32, PtrOff, ConstFour);
Chris Lattner915fb302005-08-30 00:19:00 +0000964 SDOperand Load = DAG.getLoad(MVT::i32, Store, PtrOff,
965 DAG.getSrcValue(NULL));
Chris Lattner1df74782005-11-17 18:30:17 +0000966 MemOps.push_back(Load.getValue(1));
Chris Lattner915fb302005-08-30 00:19:00 +0000967 args_to_use.push_back(Load);
968 --GPR_remaining;
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000969 }
970 } else {
Chris Lattner915fb302005-08-30 00:19:00 +0000971 // If we have any FPRs remaining, we may also have GPRs remaining.
972 // Args passed in FPRs consume either 1 (f32) or 2 (f64) available
973 // GPRs.
974 if (GPR_remaining > 0) {
975 args_to_use.push_back(DAG.getNode(ISD::UNDEF, MVT::i32));
976 --GPR_remaining;
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000977 }
Chris Lattner915fb302005-08-30 00:19:00 +0000978 if (GPR_remaining > 0 && MVT::f64 == ArgVT) {
979 args_to_use.push_back(DAG.getNode(ISD::UNDEF, MVT::i32));
980 --GPR_remaining;
981 }
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000982 }
Chris Lattner915fb302005-08-30 00:19:00 +0000983 } else {
984 MemOps.push_back(DAG.getNode(ISD::STORE, MVT::Other, Chain,
985 Args[i].first, PtrOff,
986 DAG.getSrcValue(NULL)));
987 }
988 ArgOffset += (ArgVT == MVT::f32) ? 4 : 8;
989 break;
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000990 }
991 }
992 if (!MemOps.empty())
993 Chain = DAG.getNode(ISD::TokenFactor, MVT::Other, MemOps);
994 }
995
996 std::vector<MVT::ValueType> RetVals;
997 MVT::ValueType RetTyVT = getValueType(RetTy);
Chris Lattnerf5059492005-09-02 01:24:55 +0000998 MVT::ValueType ActualRetTyVT = RetTyVT;
999 if (RetTyVT >= MVT::i1 && RetTyVT <= MVT::i16)
1000 ActualRetTyVT = MVT::i32; // Promote result to i32.
1001
Chris Lattnere00ebf02006-01-28 07:33:03 +00001002 if (RetTyVT == MVT::i64) {
1003 RetVals.push_back(MVT::i32);
1004 RetVals.push_back(MVT::i32);
1005 } else if (RetTyVT != MVT::isVoid) {
Chris Lattnerf5059492005-09-02 01:24:55 +00001006 RetVals.push_back(ActualRetTyVT);
Chris Lattnere00ebf02006-01-28 07:33:03 +00001007 }
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001008 RetVals.push_back(MVT::Other);
1009
Chris Lattner2823b3e2005-11-17 05:56:14 +00001010 // If the callee is a GlobalAddress node (quite common, every direct call is)
1011 // turn it into a TargetGlobalAddress node so that legalize doesn't hack it.
1012 if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee))
1013 Callee = DAG.getTargetGlobalAddress(G->getGlobal(), MVT::i32);
1014
Chris Lattner281b55e2006-01-27 23:34:02 +00001015 std::vector<SDOperand> Ops;
1016 Ops.push_back(Chain);
1017 Ops.push_back(Callee);
1018 Ops.insert(Ops.end(), args_to_use.begin(), args_to_use.end());
1019 SDOperand TheCall = DAG.getNode(PPCISD::CALL, RetVals, Ops);
Chris Lattnere00ebf02006-01-28 07:33:03 +00001020 Chain = TheCall.getValue(TheCall.Val->getNumValues()-1);
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001021 Chain = DAG.getNode(ISD::CALLSEQ_END, MVT::Other, Chain,
1022 DAG.getConstant(NumBytes, getPointerTy()));
Chris Lattnerf5059492005-09-02 01:24:55 +00001023 SDOperand RetVal = TheCall;
1024
1025 // If the result is a small value, add a note so that we keep track of the
1026 // information about whether it is sign or zero extended.
1027 if (RetTyVT != ActualRetTyVT) {
1028 RetVal = DAG.getNode(RetTy->isSigned() ? ISD::AssertSext : ISD::AssertZext,
1029 MVT::i32, RetVal, DAG.getValueType(RetTyVT));
1030 RetVal = DAG.getNode(ISD::TRUNCATE, RetTyVT, RetVal);
Chris Lattnere00ebf02006-01-28 07:33:03 +00001031 } else if (RetTyVT == MVT::i64) {
1032 RetVal = DAG.getNode(ISD::BUILD_PAIR, MVT::i64, RetVal, RetVal.getValue(1));
Chris Lattnerf5059492005-09-02 01:24:55 +00001033 }
1034
1035 return std::make_pair(RetVal, Chain);
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001036}
1037
Chris Lattner8a2d3ca2005-08-26 21:23:58 +00001038MachineBasicBlock *
Nate Begeman21e463b2005-10-16 05:39:50 +00001039PPCTargetLowering::InsertAtEndOfBasicBlock(MachineInstr *MI,
1040 MachineBasicBlock *BB) {
Chris Lattner8a2d3ca2005-08-26 21:23:58 +00001041 assert((MI->getOpcode() == PPC::SELECT_CC_Int ||
Chris Lattner919c0322005-10-01 01:35:02 +00001042 MI->getOpcode() == PPC::SELECT_CC_F4 ||
1043 MI->getOpcode() == PPC::SELECT_CC_F8) &&
Chris Lattner8a2d3ca2005-08-26 21:23:58 +00001044 "Unexpected instr type to insert");
1045
1046 // To "insert" a SELECT_CC instruction, we actually have to insert the diamond
1047 // control-flow pattern. The incoming instruction knows the destination vreg
1048 // to set, the condition code register to branch on, the true/false values to
1049 // select between, and a branch opcode to use.
1050 const BasicBlock *LLVM_BB = BB->getBasicBlock();
1051 ilist<MachineBasicBlock>::iterator It = BB;
1052 ++It;
1053
1054 // thisMBB:
1055 // ...
1056 // TrueVal = ...
1057 // cmpTY ccX, r1, r2
1058 // bCC copy1MBB
1059 // fallthrough --> copy0MBB
1060 MachineBasicBlock *thisMBB = BB;
1061 MachineBasicBlock *copy0MBB = new MachineBasicBlock(LLVM_BB);
1062 MachineBasicBlock *sinkMBB = new MachineBasicBlock(LLVM_BB);
1063 BuildMI(BB, MI->getOperand(4).getImmedValue(), 2)
1064 .addReg(MI->getOperand(1).getReg()).addMBB(sinkMBB);
1065 MachineFunction *F = BB->getParent();
1066 F->getBasicBlockList().insert(It, copy0MBB);
1067 F->getBasicBlockList().insert(It, sinkMBB);
1068 // Update machine-CFG edges
1069 BB->addSuccessor(copy0MBB);
1070 BB->addSuccessor(sinkMBB);
1071
1072 // copy0MBB:
1073 // %FalseValue = ...
1074 // # fallthrough to sinkMBB
1075 BB = copy0MBB;
1076
1077 // Update machine-CFG edges
1078 BB->addSuccessor(sinkMBB);
1079
1080 // sinkMBB:
1081 // %Result = phi [ %FalseValue, copy0MBB ], [ %TrueValue, thisMBB ]
1082 // ...
1083 BB = sinkMBB;
1084 BuildMI(BB, PPC::PHI, 4, MI->getOperand(0).getReg())
1085 .addReg(MI->getOperand(3).getReg()).addMBB(copy0MBB)
1086 .addReg(MI->getOperand(2).getReg()).addMBB(thisMBB);
1087
1088 delete MI; // The pseudo instruction is gone now.
1089 return BB;
1090}
1091
Chris Lattner8c13d0a2006-03-01 04:57:39 +00001092SDOperand PPCTargetLowering::PerformDAGCombine(SDNode *N,
1093 DAGCombinerInfo &DCI) const {
1094 TargetMachine &TM = getTargetMachine();
1095 SelectionDAG &DAG = DCI.DAG;
1096 switch (N->getOpcode()) {
1097 default: break;
1098 case ISD::SINT_TO_FP:
1099 if (TM.getSubtarget<PPCSubtarget>().is64Bit()) {
1100 // Turn (sint_to_fp (fp_to_sint X)) -> fctidz/fcfid without load/stores.
1101 // We allow the src/dst to be either f32/f64, but force the intermediate
1102 // type to be i64.
1103 if (N->getOperand(0).getOpcode() == ISD::FP_TO_SINT &&
1104 N->getOperand(0).getValueType() == MVT::i64) {
1105
1106 SDOperand Val = N->getOperand(0).getOperand(0);
1107 if (Val.getValueType() == MVT::f32) {
1108 Val = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Val);
1109 DCI.AddToWorklist(Val.Val);
1110 }
1111
1112 Val = DAG.getNode(PPCISD::FCTIDZ, MVT::f64, Val);
1113 DCI.AddToWorklist(Val.Val);
1114 Val = DAG.getNode(PPCISD::FCFID, MVT::f64, Val);
1115 DCI.AddToWorklist(Val.Val);
1116 if (N->getValueType(0) == MVT::f32) {
1117 Val = DAG.getNode(ISD::FP_ROUND, MVT::f32, Val);
1118 DCI.AddToWorklist(Val.Val);
1119 }
1120 return Val;
1121 }
1122 }
1123 break;
Chris Lattner51269842006-03-01 05:50:56 +00001124 case ISD::STORE:
1125 // Turn STORE (FP_TO_SINT F) -> STFIWX(FCTIWZ(F)).
1126 if (TM.getSubtarget<PPCSubtarget>().hasSTFIWX() &&
1127 N->getOperand(1).getOpcode() == ISD::FP_TO_SINT &&
1128 N->getOperand(1).getValueType() == MVT::i32) {
1129 SDOperand Val = N->getOperand(1).getOperand(0);
1130 if (Val.getValueType() == MVT::f32) {
1131 Val = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Val);
1132 DCI.AddToWorklist(Val.Val);
1133 }
1134 Val = DAG.getNode(PPCISD::FCTIWZ, MVT::f64, Val);
1135 DCI.AddToWorklist(Val.Val);
1136
1137 Val = DAG.getNode(PPCISD::STFIWX, MVT::Other, N->getOperand(0), Val,
1138 N->getOperand(2), N->getOperand(3));
1139 DCI.AddToWorklist(Val.Val);
1140 return Val;
1141 }
1142 break;
Chris Lattner8c13d0a2006-03-01 04:57:39 +00001143 }
1144
1145 return SDOperand();
1146}
1147
Chris Lattnerad3bc8d2006-02-07 20:16:30 +00001148/// getConstraintType - Given a constraint letter, return the type of
1149/// constraint it is for this target.
1150PPCTargetLowering::ConstraintType
1151PPCTargetLowering::getConstraintType(char ConstraintLetter) const {
1152 switch (ConstraintLetter) {
1153 default: break;
1154 case 'b':
1155 case 'r':
1156 case 'f':
1157 case 'v':
1158 case 'y':
1159 return C_RegisterClass;
1160 }
1161 return TargetLowering::getConstraintType(ConstraintLetter);
1162}
1163
1164
Chris Lattnerddc787d2006-01-31 19:20:21 +00001165std::vector<unsigned> PPCTargetLowering::
Chris Lattner1efa40f2006-02-22 00:56:39 +00001166getRegClassForInlineAsmConstraint(const std::string &Constraint,
1167 MVT::ValueType VT) const {
Chris Lattnerddc787d2006-01-31 19:20:21 +00001168 if (Constraint.size() == 1) {
1169 switch (Constraint[0]) { // GCC RS6000 Constraint Letters
1170 default: break; // Unknown constriant letter
1171 case 'b':
1172 return make_vector<unsigned>(/*no R0*/ PPC::R1 , PPC::R2 , PPC::R3 ,
1173 PPC::R4 , PPC::R5 , PPC::R6 , PPC::R7 ,
1174 PPC::R8 , PPC::R9 , PPC::R10, PPC::R11,
1175 PPC::R12, PPC::R13, PPC::R14, PPC::R15,
1176 PPC::R16, PPC::R17, PPC::R18, PPC::R19,
1177 PPC::R20, PPC::R21, PPC::R22, PPC::R23,
1178 PPC::R24, PPC::R25, PPC::R26, PPC::R27,
1179 PPC::R28, PPC::R29, PPC::R30, PPC::R31,
1180 0);
1181 case 'r':
1182 return make_vector<unsigned>(PPC::R0 , PPC::R1 , PPC::R2 , PPC::R3 ,
1183 PPC::R4 , PPC::R5 , PPC::R6 , PPC::R7 ,
1184 PPC::R8 , PPC::R9 , PPC::R10, PPC::R11,
1185 PPC::R12, PPC::R13, PPC::R14, PPC::R15,
1186 PPC::R16, PPC::R17, PPC::R18, PPC::R19,
1187 PPC::R20, PPC::R21, PPC::R22, PPC::R23,
1188 PPC::R24, PPC::R25, PPC::R26, PPC::R27,
1189 PPC::R28, PPC::R29, PPC::R30, PPC::R31,
1190 0);
1191 case 'f':
1192 return make_vector<unsigned>(PPC::F0 , PPC::F1 , PPC::F2 , PPC::F3 ,
1193 PPC::F4 , PPC::F5 , PPC::F6 , PPC::F7 ,
1194 PPC::F8 , PPC::F9 , PPC::F10, PPC::F11,
1195 PPC::F12, PPC::F13, PPC::F14, PPC::F15,
1196 PPC::F16, PPC::F17, PPC::F18, PPC::F19,
1197 PPC::F20, PPC::F21, PPC::F22, PPC::F23,
1198 PPC::F24, PPC::F25, PPC::F26, PPC::F27,
1199 PPC::F28, PPC::F29, PPC::F30, PPC::F31,
1200 0);
1201 case 'v':
1202 return make_vector<unsigned>(PPC::V0 , PPC::V1 , PPC::V2 , PPC::V3 ,
1203 PPC::V4 , PPC::V5 , PPC::V6 , PPC::V7 ,
1204 PPC::V8 , PPC::V9 , PPC::V10, PPC::V11,
1205 PPC::V12, PPC::V13, PPC::V14, PPC::V15,
1206 PPC::V16, PPC::V17, PPC::V18, PPC::V19,
1207 PPC::V20, PPC::V21, PPC::V22, PPC::V23,
1208 PPC::V24, PPC::V25, PPC::V26, PPC::V27,
1209 PPC::V28, PPC::V29, PPC::V30, PPC::V31,
1210 0);
1211 case 'y':
1212 return make_vector<unsigned>(PPC::CR0, PPC::CR1, PPC::CR2, PPC::CR3,
1213 PPC::CR4, PPC::CR5, PPC::CR6, PPC::CR7,
1214 0);
1215 }
1216 }
1217
Chris Lattner1efa40f2006-02-22 00:56:39 +00001218 return std::vector<unsigned>();
Chris Lattnerddc787d2006-01-31 19:20:21 +00001219}
Chris Lattner763317d2006-02-07 00:47:13 +00001220
1221// isOperandValidForConstraint
1222bool PPCTargetLowering::
1223isOperandValidForConstraint(SDOperand Op, char Letter) {
1224 switch (Letter) {
1225 default: break;
1226 case 'I':
1227 case 'J':
1228 case 'K':
1229 case 'L':
1230 case 'M':
1231 case 'N':
1232 case 'O':
1233 case 'P': {
1234 if (!isa<ConstantSDNode>(Op)) return false; // Must be an immediate.
1235 unsigned Value = cast<ConstantSDNode>(Op)->getValue();
1236 switch (Letter) {
1237 default: assert(0 && "Unknown constraint letter!");
1238 case 'I': // "I" is a signed 16-bit constant.
1239 return (short)Value == (int)Value;
1240 case 'J': // "J" is a constant with only the high-order 16 bits nonzero.
1241 case 'L': // "L" is a signed 16-bit constant shifted left 16 bits.
1242 return (short)Value == 0;
1243 case 'K': // "K" is a constant with only the low-order 16 bits nonzero.
1244 return (Value >> 16) == 0;
1245 case 'M': // "M" is a constant that is greater than 31.
1246 return Value > 31;
1247 case 'N': // "N" is a positive constant that is an exact power of two.
1248 return (int)Value > 0 && isPowerOf2_32(Value);
1249 case 'O': // "O" is the constant zero.
1250 return Value == 0;
1251 case 'P': // "P" is a constant whose negation is a signed 16-bit constant.
1252 return (short)-Value == (int)-Value;
1253 }
1254 break;
1255 }
1256 }
1257
1258 // Handle standard constraint letters.
1259 return TargetLowering::isOperandValidForConstraint(Op, Letter);
1260}
Evan Chengc4c62572006-03-13 23:20:37 +00001261
1262/// isLegalAddressImmediate - Return true if the integer value can be used
1263/// as the offset of the target addressing mode.
1264bool PPCTargetLowering::isLegalAddressImmediate(int64_t V) const {
1265 // PPC allows a sign-extended 16-bit immediate field.
1266 return (V > -(1 << 16) && V < (1 << 16)-1);
1267}