blob: 76fcde65b8df7bac05f785577b94d3f9669608cb [file] [log] [blame]
Nate Begeman1d9d7422005-10-18 00:28:58 +00001//===-- PPCISelLowering.cpp - PPC DAG Lowering Implementation -------------===//
Chris Lattner7c5a3d32005-08-16 17:14:42 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file was developed by Chris Lattner and is distributed under
6// the University of Illinois Open Source License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Nate Begeman21e463b2005-10-16 05:39:50 +000010// This file implements the PPCISelLowering class.
Chris Lattner7c5a3d32005-08-16 17:14:42 +000011//
12//===----------------------------------------------------------------------===//
13
Chris Lattner16e71f22005-10-14 23:59:06 +000014#include "PPCISelLowering.h"
15#include "PPCTargetMachine.h"
Nate Begeman750ac1b2006-02-01 07:19:44 +000016#include "llvm/ADT/VectorExtras.h"
Evan Chengc4c62572006-03-13 23:20:37 +000017#include "llvm/Analysis/ScalarEvolutionExpressions.h"
Chris Lattner7c5a3d32005-08-16 17:14:42 +000018#include "llvm/CodeGen/MachineFrameInfo.h"
19#include "llvm/CodeGen/MachineFunction.h"
Chris Lattner8a2d3ca2005-08-26 21:23:58 +000020#include "llvm/CodeGen/MachineInstrBuilder.h"
Chris Lattner7c5a3d32005-08-16 17:14:42 +000021#include "llvm/CodeGen/SelectionDAG.h"
Chris Lattner7b738342005-09-13 19:33:40 +000022#include "llvm/CodeGen/SSARegMap.h"
Chris Lattner0b1e4e52005-08-26 17:36:52 +000023#include "llvm/Constants.h"
Chris Lattner7c5a3d32005-08-16 17:14:42 +000024#include "llvm/Function.h"
Chris Lattner6d92cad2006-03-26 10:06:40 +000025#include "llvm/Intrinsics.h"
Nate Begeman750ac1b2006-02-01 07:19:44 +000026#include "llvm/Support/MathExtras.h"
Evan Chengd2ee2182006-02-18 00:08:58 +000027#include "llvm/Target/TargetOptions.h"
Chris Lattner7c5a3d32005-08-16 17:14:42 +000028using namespace llvm;
29
Nate Begeman21e463b2005-10-16 05:39:50 +000030PPCTargetLowering::PPCTargetLowering(TargetMachine &TM)
Chris Lattner7c5a3d32005-08-16 17:14:42 +000031 : TargetLowering(TM) {
32
33 // Fold away setcc operations if possible.
34 setSetCCIsExpensive();
Nate Begeman405e3ec2005-10-21 00:02:42 +000035 setPow2DivIsCheap();
Chris Lattner7c5a3d32005-08-16 17:14:42 +000036
Chris Lattnerd145a612005-09-27 22:18:25 +000037 // Use _setjmp/_longjmp instead of setjmp/longjmp.
38 setUseUnderscoreSetJmpLongJmp(true);
39
Chris Lattner7c5a3d32005-08-16 17:14:42 +000040 // Set up the register classes.
Nate Begeman1d9d7422005-10-18 00:28:58 +000041 addRegisterClass(MVT::i32, PPC::GPRCRegisterClass);
42 addRegisterClass(MVT::f32, PPC::F4RCRegisterClass);
43 addRegisterClass(MVT::f64, PPC::F8RCRegisterClass);
Chris Lattner7c5a3d32005-08-16 17:14:42 +000044
Chris Lattnera54aa942006-01-29 06:26:08 +000045 setOperationAction(ISD::ConstantFP, MVT::f64, Expand);
46 setOperationAction(ISD::ConstantFP, MVT::f32, Expand);
47
Chris Lattner7c5a3d32005-08-16 17:14:42 +000048 // PowerPC has no intrinsics for these particular operations
49 setOperationAction(ISD::MEMMOVE, MVT::Other, Expand);
50 setOperationAction(ISD::MEMSET, MVT::Other, Expand);
51 setOperationAction(ISD::MEMCPY, MVT::Other, Expand);
52
53 // PowerPC has an i16 but no i8 (or i1) SEXTLOAD
54 setOperationAction(ISD::SEXTLOAD, MVT::i1, Expand);
55 setOperationAction(ISD::SEXTLOAD, MVT::i8, Expand);
56
57 // PowerPC has no SREM/UREM instructions
58 setOperationAction(ISD::SREM, MVT::i32, Expand);
59 setOperationAction(ISD::UREM, MVT::i32, Expand);
60
61 // We don't support sin/cos/sqrt/fmod
62 setOperationAction(ISD::FSIN , MVT::f64, Expand);
63 setOperationAction(ISD::FCOS , MVT::f64, Expand);
Chris Lattner615c2d02005-09-28 22:29:58 +000064 setOperationAction(ISD::FREM , MVT::f64, Expand);
Chris Lattner7c5a3d32005-08-16 17:14:42 +000065 setOperationAction(ISD::FSIN , MVT::f32, Expand);
66 setOperationAction(ISD::FCOS , MVT::f32, Expand);
Chris Lattner615c2d02005-09-28 22:29:58 +000067 setOperationAction(ISD::FREM , MVT::f32, Expand);
Chris Lattner7c5a3d32005-08-16 17:14:42 +000068
69 // If we're enabling GP optimizations, use hardware square root
Chris Lattner1e9de3e2005-09-02 18:33:05 +000070 if (!TM.getSubtarget<PPCSubtarget>().hasFSQRT()) {
Chris Lattner7c5a3d32005-08-16 17:14:42 +000071 setOperationAction(ISD::FSQRT, MVT::f64, Expand);
72 setOperationAction(ISD::FSQRT, MVT::f32, Expand);
73 }
74
Chris Lattner9601a862006-03-05 05:08:37 +000075 setOperationAction(ISD::FCOPYSIGN, MVT::f64, Expand);
76 setOperationAction(ISD::FCOPYSIGN, MVT::f32, Expand);
77
Nate Begemand88fc032006-01-14 03:14:10 +000078 // PowerPC does not have BSWAP, CTPOP or CTTZ
79 setOperationAction(ISD::BSWAP, MVT::i32 , Expand);
Chris Lattner7c5a3d32005-08-16 17:14:42 +000080 setOperationAction(ISD::CTPOP, MVT::i32 , Expand);
81 setOperationAction(ISD::CTTZ , MVT::i32 , Expand);
82
Nate Begeman35ef9132006-01-11 21:21:00 +000083 // PowerPC does not have ROTR
84 setOperationAction(ISD::ROTR, MVT::i32 , Expand);
85
Chris Lattner7c5a3d32005-08-16 17:14:42 +000086 // PowerPC does not have Select
87 setOperationAction(ISD::SELECT, MVT::i32, Expand);
88 setOperationAction(ISD::SELECT, MVT::f32, Expand);
89 setOperationAction(ISD::SELECT, MVT::f64, Expand);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +000090
Chris Lattner0b1e4e52005-08-26 17:36:52 +000091 // PowerPC wants to turn select_cc of FP into fsel when possible.
92 setOperationAction(ISD::SELECT_CC, MVT::f32, Custom);
93 setOperationAction(ISD::SELECT_CC, MVT::f64, Custom);
Nate Begeman44775902006-01-31 08:17:29 +000094
Nate Begeman750ac1b2006-02-01 07:19:44 +000095 // PowerPC wants to optimize integer setcc a bit
Nate Begeman44775902006-01-31 08:17:29 +000096 setOperationAction(ISD::SETCC, MVT::i32, Custom);
Chris Lattnereb9b62e2005-08-31 19:09:57 +000097
Nate Begeman81e80972006-03-17 01:40:33 +000098 // PowerPC does not have BRCOND which requires SetCC
99 setOperationAction(ISD::BRCOND, MVT::Other, Expand);
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000100
Chris Lattnerf7605322005-08-31 21:09:52 +0000101 // PowerPC turns FP_TO_SINT into FCTIWZ and some load/stores.
102 setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom);
Nate Begemanc09eeec2005-09-06 22:03:27 +0000103
Jim Laskeyad23c9d2005-08-17 00:40:22 +0000104 // PowerPC does not have [U|S]INT_TO_FP
105 setOperationAction(ISD::SINT_TO_FP, MVT::i32, Expand);
106 setOperationAction(ISD::UINT_TO_FP, MVT::i32, Expand);
107
Chris Lattner53e88452005-12-23 05:13:35 +0000108 setOperationAction(ISD::BIT_CONVERT, MVT::f32, Expand);
109 setOperationAction(ISD::BIT_CONVERT, MVT::i32, Expand);
110
Chris Lattnere6ec9f22005-09-10 00:21:06 +0000111 // PowerPC does not have truncstore for i1.
112 setOperationAction(ISD::TRUNCSTORE, MVT::i1, Promote);
Chris Lattnerf73bae12005-11-29 06:16:21 +0000113
Jim Laskeyabf6d172006-01-05 01:25:28 +0000114 // Support label based line numbers.
Chris Lattnerf73bae12005-11-29 06:16:21 +0000115 setOperationAction(ISD::LOCATION, MVT::Other, Expand);
Jim Laskeye0bce712006-01-05 01:47:43 +0000116 setOperationAction(ISD::DEBUG_LOC, MVT::Other, Expand);
Jim Laskeyabf6d172006-01-05 01:25:28 +0000117 // FIXME - use subtarget debug flags
Jim Laskeye0bce712006-01-05 01:47:43 +0000118 if (!TM.getSubtarget<PPCSubtarget>().isDarwin())
Jim Laskeyabf6d172006-01-05 01:25:28 +0000119 setOperationAction(ISD::DEBUG_LABEL, MVT::Other, Expand);
Chris Lattnere6ec9f22005-09-10 00:21:06 +0000120
Nate Begeman28a6b022005-12-10 02:36:00 +0000121 // We want to legalize GlobalAddress and ConstantPool nodes into the
122 // appropriate instructions to materialize the address.
Chris Lattner3eef4e32005-11-17 18:26:56 +0000123 setOperationAction(ISD::GlobalAddress, MVT::i32, Custom);
Nate Begeman28a6b022005-12-10 02:36:00 +0000124 setOperationAction(ISD::ConstantPool, MVT::i32, Custom);
Chris Lattnerb99329e2006-01-13 02:42:53 +0000125
Nate Begemanee625572006-01-27 21:09:22 +0000126 // RET must be custom lowered, to meet ABI requirements
127 setOperationAction(ISD::RET , MVT::Other, Custom);
128
Nate Begemanacc398c2006-01-25 18:21:52 +0000129 // VASTART needs to be custom lowered to use the VarArgsFrameIndex
130 setOperationAction(ISD::VASTART , MVT::Other, Custom);
131
Chris Lattnerb22c08b2006-01-15 09:02:48 +0000132 // Use the default implementation.
Nate Begemanacc398c2006-01-25 18:21:52 +0000133 setOperationAction(ISD::VAARG , MVT::Other, Expand);
134 setOperationAction(ISD::VACOPY , MVT::Other, Expand);
135 setOperationAction(ISD::VAEND , MVT::Other, Expand);
Chris Lattnerb22c08b2006-01-15 09:02:48 +0000136 setOperationAction(ISD::STACKSAVE , MVT::Other, Expand);
137 setOperationAction(ISD::STACKRESTORE , MVT::Other, Expand);
138 setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i32 , Expand);
Chris Lattner860e8862005-11-17 07:30:41 +0000139
Chris Lattner6d92cad2006-03-26 10:06:40 +0000140 // We want to custom lower some of our intrinsics.
Chris Lattner48b61a72006-03-28 00:40:33 +0000141 setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::Other, Custom);
Chris Lattner6d92cad2006-03-26 10:06:40 +0000142
Nate Begemanc09eeec2005-09-06 22:03:27 +0000143 if (TM.getSubtarget<PPCSubtarget>().is64Bit()) {
Nate Begeman1d9d7422005-10-18 00:28:58 +0000144 // They also have instructions for converting between i64 and fp.
Nate Begemanc09eeec2005-09-06 22:03:27 +0000145 setOperationAction(ISD::FP_TO_SINT, MVT::i64, Custom);
146 setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
Chris Lattner7fbcef72006-03-24 07:53:47 +0000147
148 // FIXME: disable this lowered code. This generates 64-bit register values,
149 // and we don't model the fact that the top part is clobbered by calls. We
150 // need to flag these together so that the value isn't live across a call.
151 //setOperationAction(ISD::SINT_TO_FP, MVT::i32, Custom);
152
Nate Begemanae749a92005-10-25 23:48:36 +0000153 // To take advantage of the above i64 FP_TO_SINT, promote i32 FP_TO_UINT
154 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Promote);
155 } else {
Chris Lattner860e8862005-11-17 07:30:41 +0000156 // PowerPC does not have FP_TO_UINT on 32-bit implementations.
Nate Begemanae749a92005-10-25 23:48:36 +0000157 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Expand);
Nate Begeman9d2b8172005-10-18 00:56:42 +0000158 }
159
160 if (TM.getSubtarget<PPCSubtarget>().has64BitRegs()) {
161 // 64 bit PowerPC implementations can support i64 types directly
162 addRegisterClass(MVT::i64, PPC::G8RCRegisterClass);
Nate Begeman1d9d7422005-10-18 00:28:58 +0000163 // BUILD_PAIR can't be handled natively, and should be expanded to shl/or
164 setOperationAction(ISD::BUILD_PAIR, MVT::i64, Expand);
Nate Begeman1d9d7422005-10-18 00:28:58 +0000165 } else {
166 // 32 bit PowerPC wants to expand i64 shifts itself.
167 setOperationAction(ISD::SHL, MVT::i64, Custom);
168 setOperationAction(ISD::SRL, MVT::i64, Custom);
169 setOperationAction(ISD::SRA, MVT::i64, Custom);
Nate Begemanc09eeec2005-09-06 22:03:27 +0000170 }
171
Evan Chengd30bf012006-03-01 01:11:20 +0000172 // First set operation action for all vector types to expand. Then we
173 // will selectively turn on ones that can be effectively codegen'd.
174 for (unsigned VT = (unsigned)MVT::Vector + 1;
175 VT != (unsigned)MVT::LAST_VALUETYPE; VT++) {
176 setOperationAction(ISD::ADD , (MVT::ValueType)VT, Expand);
177 setOperationAction(ISD::SUB , (MVT::ValueType)VT, Expand);
178 setOperationAction(ISD::MUL , (MVT::ValueType)VT, Expand);
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000179 setOperationAction(ISD::VECTOR_SHUFFLE, (MVT::ValueType)VT, Expand);
Chris Lattner9b3bd462006-03-21 20:51:05 +0000180 setOperationAction(ISD::EXTRACT_VECTOR_ELT, (MVT::ValueType)VT, Expand);
Chris Lattner36f4b0d2006-03-31 01:48:55 +0000181 setOperationAction(ISD::INSERT_VECTOR_ELT, (MVT::ValueType)VT, Expand);
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000182 setOperationAction(ISD::BUILD_VECTOR, (MVT::ValueType)VT, Expand);
Evan Chengd30bf012006-03-01 01:11:20 +0000183 }
184
Nate Begeman425a9692005-11-29 08:17:20 +0000185 if (TM.getSubtarget<PPCSubtarget>().hasAltivec()) {
Nate Begeman425a9692005-11-29 08:17:20 +0000186 addRegisterClass(MVT::v4f32, PPC::VRRCRegisterClass);
Nate Begeman7fd1edd2005-12-19 23:25:09 +0000187 addRegisterClass(MVT::v4i32, PPC::VRRCRegisterClass);
Chris Lattner8d052bc2006-03-25 07:39:07 +0000188 addRegisterClass(MVT::v8i16, PPC::VRRCRegisterClass);
189 addRegisterClass(MVT::v16i8, PPC::VRRCRegisterClass);
Chris Lattnerec4a0c72006-01-29 06:32:58 +0000190
Evan Chengd30bf012006-03-01 01:11:20 +0000191 setOperationAction(ISD::ADD , MVT::v4f32, Legal);
192 setOperationAction(ISD::SUB , MVT::v4f32, Legal);
193 setOperationAction(ISD::MUL , MVT::v4f32, Legal);
Evan Chengd30bf012006-03-01 01:11:20 +0000194 setOperationAction(ISD::ADD , MVT::v4i32, Legal);
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000195
196 setOperationAction(ISD::VECTOR_SHUFFLE, MVT::v4i32, Custom);
197 setOperationAction(ISD::VECTOR_SHUFFLE, MVT::v4f32, Custom);
198
Chris Lattnerb2177b92006-03-19 06:55:52 +0000199 setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4f32, Custom);
200 setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4i32, Custom);
Chris Lattner64b3a082006-03-24 07:48:08 +0000201
202 setOperationAction(ISD::BUILD_VECTOR, MVT::v4i32, Custom);
203 setOperationAction(ISD::BUILD_VECTOR, MVT::v4f32, Custom);
Nate Begeman425a9692005-11-29 08:17:20 +0000204 }
205
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000206 setSetCCResultContents(ZeroOrOneSetCCResult);
Chris Lattnercadd7422006-01-13 17:52:03 +0000207 setStackPointerRegisterToSaveRestore(PPC::R1);
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000208
Chris Lattner8c13d0a2006-03-01 04:57:39 +0000209 // We have target-specific dag combine patterns for the following nodes:
210 setTargetDAGCombine(ISD::SINT_TO_FP);
Chris Lattner51269842006-03-01 05:50:56 +0000211 setTargetDAGCombine(ISD::STORE);
Chris Lattner8c13d0a2006-03-01 04:57:39 +0000212
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000213 computeRegisterProperties();
214}
215
Chris Lattnerda6d20f2006-01-09 23:52:17 +0000216const char *PPCTargetLowering::getTargetNodeName(unsigned Opcode) const {
217 switch (Opcode) {
218 default: return 0;
219 case PPCISD::FSEL: return "PPCISD::FSEL";
220 case PPCISD::FCFID: return "PPCISD::FCFID";
221 case PPCISD::FCTIDZ: return "PPCISD::FCTIDZ";
222 case PPCISD::FCTIWZ: return "PPCISD::FCTIWZ";
Chris Lattner51269842006-03-01 05:50:56 +0000223 case PPCISD::STFIWX: return "PPCISD::STFIWX";
Chris Lattnerda6d20f2006-01-09 23:52:17 +0000224 case PPCISD::VMADDFP: return "PPCISD::VMADDFP";
225 case PPCISD::VNMSUBFP: return "PPCISD::VNMSUBFP";
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000226 case PPCISD::VPERM: return "PPCISD::VPERM";
Chris Lattnerda6d20f2006-01-09 23:52:17 +0000227 case PPCISD::Hi: return "PPCISD::Hi";
228 case PPCISD::Lo: return "PPCISD::Lo";
229 case PPCISD::GlobalBaseReg: return "PPCISD::GlobalBaseReg";
230 case PPCISD::SRL: return "PPCISD::SRL";
231 case PPCISD::SRA: return "PPCISD::SRA";
232 case PPCISD::SHL: return "PPCISD::SHL";
Chris Lattnerecfe55e2006-03-22 05:30:33 +0000233 case PPCISD::EXTSW_32: return "PPCISD::EXTSW_32";
234 case PPCISD::STD_32: return "PPCISD::STD_32";
Chris Lattnere00ebf02006-01-28 07:33:03 +0000235 case PPCISD::CALL: return "PPCISD::CALL";
Chris Lattnerda6d20f2006-01-09 23:52:17 +0000236 case PPCISD::RET_FLAG: return "PPCISD::RET_FLAG";
Chris Lattner6d92cad2006-03-26 10:06:40 +0000237 case PPCISD::MFCR: return "PPCISD::MFCR";
Chris Lattnera17b1552006-03-31 05:13:27 +0000238 case PPCISD::VCMP: return "PPCISD::VCMP";
Chris Lattner6d92cad2006-03-26 10:06:40 +0000239 case PPCISD::VCMPo: return "PPCISD::VCMPo";
Chris Lattnerda6d20f2006-01-09 23:52:17 +0000240 }
241}
242
Chris Lattner0b1e4e52005-08-26 17:36:52 +0000243/// isFloatingPointZero - Return true if this is 0.0 or -0.0.
244static bool isFloatingPointZero(SDOperand Op) {
245 if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(Op))
246 return CFP->isExactlyValue(-0.0) || CFP->isExactlyValue(0.0);
247 else if (Op.getOpcode() == ISD::EXTLOAD || Op.getOpcode() == ISD::LOAD) {
248 // Maybe this has already been legalized into the constant pool?
249 if (ConstantPoolSDNode *CP = dyn_cast<ConstantPoolSDNode>(Op.getOperand(1)))
250 if (ConstantFP *CFP = dyn_cast<ConstantFP>(CP->get()))
251 return CFP->isExactlyValue(-0.0) || CFP->isExactlyValue(0.0);
252 }
253 return false;
254}
255
Chris Lattneref819f82006-03-20 06:33:01 +0000256
257/// isSplatShuffleMask - Return true if the specified VECTOR_SHUFFLE operand
258/// specifies a splat of a single element that is suitable for input to
259/// VSPLTB/VSPLTH/VSPLTW.
260bool PPC::isSplatShuffleMask(SDNode *N) {
261 assert(N->getOpcode() == ISD::BUILD_VECTOR);
Chris Lattnerdd4d2d02006-03-20 06:51:10 +0000262
263 // We can only splat 8-bit, 16-bit, and 32-bit quantities.
264 if (N->getNumOperands() != 4 && N->getNumOperands() != 8 &&
265 N->getNumOperands() != 16)
266 return false;
267
Chris Lattner88a99ef2006-03-20 06:37:44 +0000268 // This is a splat operation if each element of the permute is the same, and
269 // if the value doesn't reference the second vector.
270 SDOperand Elt = N->getOperand(0);
271 assert(isa<ConstantSDNode>(Elt) && "Invalid VECTOR_SHUFFLE mask!");
272 for (unsigned i = 1, e = N->getNumOperands(); i != e; ++i) {
273 assert(isa<ConstantSDNode>(N->getOperand(i)) &&
274 "Invalid VECTOR_SHUFFLE mask!");
275 if (N->getOperand(i) != Elt) return false;
276 }
277
278 // Make sure it is a splat of the first vector operand.
279 return cast<ConstantSDNode>(Elt)->getValue() < N->getNumOperands();
Chris Lattneref819f82006-03-20 06:33:01 +0000280}
281
282/// getVSPLTImmediate - Return the appropriate VSPLT* immediate to splat the
283/// specified isSplatShuffleMask VECTOR_SHUFFLE mask.
284unsigned PPC::getVSPLTImmediate(SDNode *N) {
285 assert(isSplatShuffleMask(N));
Chris Lattnerdd4d2d02006-03-20 06:51:10 +0000286 return cast<ConstantSDNode>(N->getOperand(0))->getValue();
Chris Lattneref819f82006-03-20 06:33:01 +0000287}
288
Chris Lattner9c61dcf2006-03-25 06:12:06 +0000289/// isVecSplatImm - Return true if this is a build_vector of constants which
290/// can be formed by using a vspltis[bhw] instruction. The ByteSize field
291/// indicates the number of bytes of each element [124] -> [bhw].
292bool PPC::isVecSplatImm(SDNode *N, unsigned ByteSize, char *Val) {
293 SDOperand OpVal(0, 0);
294 // Check to see if this buildvec has a single non-undef value in its elements.
295 for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
296 if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue;
297 if (OpVal.Val == 0)
298 OpVal = N->getOperand(i);
299 else if (OpVal != N->getOperand(i))
300 return false;
301 }
302
303 if (OpVal.Val == 0) return false; // All UNDEF: use implicit def.
304
Nate Begeman98e70cc2006-03-28 04:15:58 +0000305 unsigned ValSizeInBytes = 0;
306 uint64_t Value = 0;
Chris Lattner9c61dcf2006-03-25 06:12:06 +0000307 if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
308 Value = CN->getValue();
309 ValSizeInBytes = MVT::getSizeInBits(CN->getValueType(0))/8;
310 } else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal)) {
311 assert(CN->getValueType(0) == MVT::f32 && "Only one legal FP vector type!");
312 Value = FloatToBits(CN->getValue());
313 ValSizeInBytes = 4;
314 }
315
316 // If the splat value is larger than the element value, then we can never do
317 // this splat. The only case that we could fit the replicated bits into our
318 // immediate field for would be zero, and we prefer to use vxor for it.
319 if (ValSizeInBytes < ByteSize) return false;
320
321 // If the element value is larger than the splat value, cut it in half and
322 // check to see if the two halves are equal. Continue doing this until we
323 // get to ByteSize. This allows us to handle 0x01010101 as 0x01.
324 while (ValSizeInBytes > ByteSize) {
325 ValSizeInBytes >>= 1;
326
327 // If the top half equals the bottom half, we're still ok.
328 if (((Value >> (ValSizeInBytes*8)) & ((8 << ValSizeInBytes)-1)) !=
329 (Value & ((8 << ValSizeInBytes)-1)))
330 return false;
331 }
332
333 // Properly sign extend the value.
334 int ShAmt = (4-ByteSize)*8;
335 int MaskVal = ((int)Value << ShAmt) >> ShAmt;
336
Evan Cheng5b6a01b2006-03-26 09:52:32 +0000337 // If this is zero, don't match, zero matches ISD::isBuildVectorAllZeros.
Chris Lattner9c61dcf2006-03-25 06:12:06 +0000338 if (MaskVal == 0) return false;
339
340 if (Val) *Val = MaskVal;
341
342 // Finally, if this value fits in a 5 bit sext field, return true.
343 return ((MaskVal << (32-5)) >> (32-5)) == MaskVal;
344}
345
Chris Lattneref819f82006-03-20 06:33:01 +0000346
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000347/// LowerOperation - Provide custom lowering hooks for some operations.
348///
Nate Begeman21e463b2005-10-16 05:39:50 +0000349SDOperand PPCTargetLowering::LowerOperation(SDOperand Op, SelectionDAG &DAG) {
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000350 switch (Op.getOpcode()) {
351 default: assert(0 && "Wasn't expecting to be able to lower this!");
Chris Lattnerf7605322005-08-31 21:09:52 +0000352 case ISD::FP_TO_SINT: {
Nate Begemanc09eeec2005-09-06 22:03:27 +0000353 assert(MVT::isFloatingPoint(Op.getOperand(0).getValueType()));
Chris Lattner7c0d6642005-10-02 06:37:13 +0000354 SDOperand Src = Op.getOperand(0);
355 if (Src.getValueType() == MVT::f32)
356 Src = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Src);
357
Chris Lattner1b95e0b2005-12-23 00:59:59 +0000358 SDOperand Tmp;
Nate Begemanc09eeec2005-09-06 22:03:27 +0000359 switch (Op.getValueType()) {
360 default: assert(0 && "Unhandled FP_TO_SINT type in custom expander!");
361 case MVT::i32:
Chris Lattner1b95e0b2005-12-23 00:59:59 +0000362 Tmp = DAG.getNode(PPCISD::FCTIWZ, MVT::f64, Src);
Nate Begemanc09eeec2005-09-06 22:03:27 +0000363 break;
364 case MVT::i64:
Chris Lattner1b95e0b2005-12-23 00:59:59 +0000365 Tmp = DAG.getNode(PPCISD::FCTIDZ, MVT::f64, Src);
Nate Begemanc09eeec2005-09-06 22:03:27 +0000366 break;
367 }
Chris Lattnerf7605322005-08-31 21:09:52 +0000368
Chris Lattner1b95e0b2005-12-23 00:59:59 +0000369 // Convert the FP value to an int value through memory.
370 SDOperand Bits = DAG.getNode(ISD::BIT_CONVERT, MVT::i64, Tmp);
371 if (Op.getValueType() == MVT::i32)
372 Bits = DAG.getNode(ISD::TRUNCATE, MVT::i32, Bits);
373 return Bits;
Nate Begemanc09eeec2005-09-06 22:03:27 +0000374 }
Chris Lattnerecfe55e2006-03-22 05:30:33 +0000375 case ISD::SINT_TO_FP:
376 if (Op.getOperand(0).getValueType() == MVT::i64) {
377 SDOperand Bits = DAG.getNode(ISD::BIT_CONVERT, MVT::f64, Op.getOperand(0));
378 SDOperand FP = DAG.getNode(PPCISD::FCFID, MVT::f64, Bits);
379 if (Op.getValueType() == MVT::f32)
380 FP = DAG.getNode(ISD::FP_ROUND, MVT::f32, FP);
381 return FP;
382 } else {
383 assert(Op.getOperand(0).getValueType() == MVT::i32 &&
384 "Unhandled SINT_TO_FP type in custom expander!");
385 // Since we only generate this in 64-bit mode, we can take advantage of
386 // 64-bit registers. In particular, sign extend the input value into the
387 // 64-bit register with extsw, store the WHOLE 64-bit value into the stack
388 // then lfd it and fcfid it.
389 MachineFrameInfo *FrameInfo = DAG.getMachineFunction().getFrameInfo();
390 int FrameIdx = FrameInfo->CreateStackObject(8, 8);
391 SDOperand FIdx = DAG.getFrameIndex(FrameIdx, MVT::i32);
392
393 SDOperand Ext64 = DAG.getNode(PPCISD::EXTSW_32, MVT::i32,
394 Op.getOperand(0));
395
396 // STD the extended value into the stack slot.
397 SDOperand Store = DAG.getNode(PPCISD::STD_32, MVT::Other,
398 DAG.getEntryNode(), Ext64, FIdx,
399 DAG.getSrcValue(NULL));
400 // Load the value as a double.
401 SDOperand Ld = DAG.getLoad(MVT::f64, Store, FIdx, DAG.getSrcValue(NULL));
402
403 // FCFID it and return it.
404 SDOperand FP = DAG.getNode(PPCISD::FCFID, MVT::f64, Ld);
405 if (Op.getValueType() == MVT::f32)
406 FP = DAG.getNode(ISD::FP_ROUND, MVT::f32, FP);
407 return FP;
408 }
Chris Lattner7fbcef72006-03-24 07:53:47 +0000409 break;
Chris Lattnerecfe55e2006-03-22 05:30:33 +0000410
Chris Lattnerf7605322005-08-31 21:09:52 +0000411 case ISD::SELECT_CC: {
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000412 // Turn FP only select_cc's into fsel instructions.
Chris Lattnerf7605322005-08-31 21:09:52 +0000413 if (!MVT::isFloatingPoint(Op.getOperand(0).getValueType()) ||
414 !MVT::isFloatingPoint(Op.getOperand(2).getValueType()))
415 break;
416
417 ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(4))->get();
418
419 // Cannot handle SETEQ/SETNE.
420 if (CC == ISD::SETEQ || CC == ISD::SETNE) break;
421
422 MVT::ValueType ResVT = Op.getValueType();
423 MVT::ValueType CmpVT = Op.getOperand(0).getValueType();
424 SDOperand LHS = Op.getOperand(0), RHS = Op.getOperand(1);
425 SDOperand TV = Op.getOperand(2), FV = Op.getOperand(3);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000426
Chris Lattnerf7605322005-08-31 21:09:52 +0000427 // If the RHS of the comparison is a 0.0, we don't need to do the
428 // subtraction at all.
429 if (isFloatingPointZero(RHS))
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000430 switch (CC) {
Chris Lattnerbc38dbf2006-01-18 19:42:35 +0000431 default: break; // SETUO etc aren't handled by fsel.
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000432 case ISD::SETULT:
433 case ISD::SETLT:
Chris Lattnerf7605322005-08-31 21:09:52 +0000434 std::swap(TV, FV); // fsel is natively setge, swap operands for setlt
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000435 case ISD::SETUGE:
436 case ISD::SETGE:
Chris Lattnereb255f22005-10-25 20:54:57 +0000437 if (LHS.getValueType() == MVT::f32) // Comparison is always 64-bits
438 LHS = DAG.getNode(ISD::FP_EXTEND, MVT::f64, LHS);
Chris Lattnerf7605322005-08-31 21:09:52 +0000439 return DAG.getNode(PPCISD::FSEL, ResVT, LHS, TV, FV);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000440 case ISD::SETUGT:
441 case ISD::SETGT:
Chris Lattnerf7605322005-08-31 21:09:52 +0000442 std::swap(TV, FV); // fsel is natively setge, swap operands for setlt
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000443 case ISD::SETULE:
444 case ISD::SETLE:
Chris Lattnereb255f22005-10-25 20:54:57 +0000445 if (LHS.getValueType() == MVT::f32) // Comparison is always 64-bits
446 LHS = DAG.getNode(ISD::FP_EXTEND, MVT::f64, LHS);
Chris Lattner0bbea952005-08-26 20:25:03 +0000447 return DAG.getNode(PPCISD::FSEL, ResVT,
Chris Lattner85fd97d2005-10-26 18:01:11 +0000448 DAG.getNode(ISD::FNEG, MVT::f64, LHS), TV, FV);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000449 }
Chris Lattnerf7605322005-08-31 21:09:52 +0000450
Chris Lattnereb255f22005-10-25 20:54:57 +0000451 SDOperand Cmp;
Chris Lattnerf7605322005-08-31 21:09:52 +0000452 switch (CC) {
Chris Lattnerbc38dbf2006-01-18 19:42:35 +0000453 default: break; // SETUO etc aren't handled by fsel.
Chris Lattnerf7605322005-08-31 21:09:52 +0000454 case ISD::SETULT:
455 case ISD::SETLT:
Chris Lattnereb255f22005-10-25 20:54:57 +0000456 Cmp = DAG.getNode(ISD::FSUB, CmpVT, LHS, RHS);
457 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
458 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
459 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, FV, TV);
Chris Lattnerf7605322005-08-31 21:09:52 +0000460 case ISD::SETUGE:
461 case ISD::SETGE:
Chris Lattnereb255f22005-10-25 20:54:57 +0000462 Cmp = DAG.getNode(ISD::FSUB, CmpVT, LHS, RHS);
463 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
464 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
465 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, TV, FV);
Chris Lattnerf7605322005-08-31 21:09:52 +0000466 case ISD::SETUGT:
467 case ISD::SETGT:
Chris Lattnereb255f22005-10-25 20:54:57 +0000468 Cmp = DAG.getNode(ISD::FSUB, CmpVT, RHS, LHS);
469 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
470 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
471 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, FV, TV);
Chris Lattnerf7605322005-08-31 21:09:52 +0000472 case ISD::SETULE:
473 case ISD::SETLE:
Chris Lattnereb255f22005-10-25 20:54:57 +0000474 Cmp = DAG.getNode(ISD::FSUB, CmpVT, RHS, LHS);
475 if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
476 Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
477 return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, TV, FV);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000478 }
Chris Lattnerf7605322005-08-31 21:09:52 +0000479 break;
480 }
Chris Lattnerbc11c342005-08-31 20:23:54 +0000481 case ISD::SHL: {
482 assert(Op.getValueType() == MVT::i64 &&
483 Op.getOperand(1).getValueType() == MVT::i32 && "Unexpected SHL!");
484 // The generic code does a fine job expanding shift by a constant.
485 if (isa<ConstantSDNode>(Op.getOperand(1))) break;
486
487 // Otherwise, expand into a bunch of logical ops. Note that these ops
488 // depend on the PPC behavior for oversized shift amounts.
489 SDOperand Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
490 DAG.getConstant(0, MVT::i32));
491 SDOperand Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
492 DAG.getConstant(1, MVT::i32));
493 SDOperand Amt = Op.getOperand(1);
494
495 SDOperand Tmp1 = DAG.getNode(ISD::SUB, MVT::i32,
496 DAG.getConstant(32, MVT::i32), Amt);
Chris Lattner4172b102005-12-06 02:10:38 +0000497 SDOperand Tmp2 = DAG.getNode(PPCISD::SHL, MVT::i32, Hi, Amt);
498 SDOperand Tmp3 = DAG.getNode(PPCISD::SRL, MVT::i32, Lo, Tmp1);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000499 SDOperand Tmp4 = DAG.getNode(ISD::OR , MVT::i32, Tmp2, Tmp3);
500 SDOperand Tmp5 = DAG.getNode(ISD::ADD, MVT::i32, Amt,
501 DAG.getConstant(-32U, MVT::i32));
Chris Lattner4172b102005-12-06 02:10:38 +0000502 SDOperand Tmp6 = DAG.getNode(PPCISD::SHL, MVT::i32, Lo, Tmp5);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000503 SDOperand OutHi = DAG.getNode(ISD::OR, MVT::i32, Tmp4, Tmp6);
Chris Lattner4172b102005-12-06 02:10:38 +0000504 SDOperand OutLo = DAG.getNode(PPCISD::SHL, MVT::i32, Lo, Amt);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000505 return DAG.getNode(ISD::BUILD_PAIR, MVT::i64, OutLo, OutHi);
506 }
507 case ISD::SRL: {
508 assert(Op.getValueType() == MVT::i64 &&
509 Op.getOperand(1).getValueType() == MVT::i32 && "Unexpected SHL!");
510 // The generic code does a fine job expanding shift by a constant.
511 if (isa<ConstantSDNode>(Op.getOperand(1))) break;
512
513 // Otherwise, expand into a bunch of logical ops. Note that these ops
514 // depend on the PPC behavior for oversized shift amounts.
515 SDOperand Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
516 DAG.getConstant(0, MVT::i32));
517 SDOperand Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
518 DAG.getConstant(1, MVT::i32));
519 SDOperand Amt = Op.getOperand(1);
520
521 SDOperand Tmp1 = DAG.getNode(ISD::SUB, MVT::i32,
522 DAG.getConstant(32, MVT::i32), Amt);
Chris Lattner4172b102005-12-06 02:10:38 +0000523 SDOperand Tmp2 = DAG.getNode(PPCISD::SRL, MVT::i32, Lo, Amt);
524 SDOperand Tmp3 = DAG.getNode(PPCISD::SHL, MVT::i32, Hi, Tmp1);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000525 SDOperand Tmp4 = DAG.getNode(ISD::OR , MVT::i32, Tmp2, Tmp3);
526 SDOperand Tmp5 = DAG.getNode(ISD::ADD, MVT::i32, Amt,
527 DAG.getConstant(-32U, MVT::i32));
Chris Lattner4172b102005-12-06 02:10:38 +0000528 SDOperand Tmp6 = DAG.getNode(PPCISD::SRL, MVT::i32, Hi, Tmp5);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000529 SDOperand OutLo = DAG.getNode(ISD::OR, MVT::i32, Tmp4, Tmp6);
Chris Lattner4172b102005-12-06 02:10:38 +0000530 SDOperand OutHi = DAG.getNode(PPCISD::SRL, MVT::i32, Hi, Amt);
Chris Lattnerbc11c342005-08-31 20:23:54 +0000531 return DAG.getNode(ISD::BUILD_PAIR, MVT::i64, OutLo, OutHi);
532 }
533 case ISD::SRA: {
Chris Lattnereb9b62e2005-08-31 19:09:57 +0000534 assert(Op.getValueType() == MVT::i64 &&
535 Op.getOperand(1).getValueType() == MVT::i32 && "Unexpected SRA!");
536 // The generic code does a fine job expanding shift by a constant.
537 if (isa<ConstantSDNode>(Op.getOperand(1))) break;
538
539 // Otherwise, expand into a bunch of logical ops, followed by a select_cc.
540 SDOperand Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
541 DAG.getConstant(0, MVT::i32));
542 SDOperand Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32, Op.getOperand(0),
543 DAG.getConstant(1, MVT::i32));
544 SDOperand Amt = Op.getOperand(1);
545
546 SDOperand Tmp1 = DAG.getNode(ISD::SUB, MVT::i32,
547 DAG.getConstant(32, MVT::i32), Amt);
Chris Lattner4172b102005-12-06 02:10:38 +0000548 SDOperand Tmp2 = DAG.getNode(PPCISD::SRL, MVT::i32, Lo, Amt);
549 SDOperand Tmp3 = DAG.getNode(PPCISD::SHL, MVT::i32, Hi, Tmp1);
Chris Lattnereb9b62e2005-08-31 19:09:57 +0000550 SDOperand Tmp4 = DAG.getNode(ISD::OR , MVT::i32, Tmp2, Tmp3);
551 SDOperand Tmp5 = DAG.getNode(ISD::ADD, MVT::i32, Amt,
552 DAG.getConstant(-32U, MVT::i32));
Chris Lattner4172b102005-12-06 02:10:38 +0000553 SDOperand Tmp6 = DAG.getNode(PPCISD::SRA, MVT::i32, Hi, Tmp5);
554 SDOperand OutHi = DAG.getNode(PPCISD::SRA, MVT::i32, Hi, Amt);
Chris Lattnereb9b62e2005-08-31 19:09:57 +0000555 SDOperand OutLo = DAG.getSelectCC(Tmp5, DAG.getConstant(0, MVT::i32),
556 Tmp4, Tmp6, ISD::SETLE);
557 return DAG.getNode(ISD::BUILD_PAIR, MVT::i64, OutLo, OutHi);
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000558 }
Nate Begeman28a6b022005-12-10 02:36:00 +0000559 case ISD::ConstantPool: {
Evan Chengb8973bd2006-01-31 22:23:14 +0000560 ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(Op);
561 Constant *C = CP->get();
562 SDOperand CPI = DAG.getTargetConstantPool(C, MVT::i32, CP->getAlignment());
Nate Begeman28a6b022005-12-10 02:36:00 +0000563 SDOperand Zero = DAG.getConstant(0, MVT::i32);
564
Evan Cheng4c1aa862006-02-22 20:19:42 +0000565 if (getTargetMachine().getRelocationModel() == Reloc::Static) {
Nate Begeman28a6b022005-12-10 02:36:00 +0000566 // Generate non-pic code that has direct accesses to the constant pool.
567 // The address of the global is just (hi(&g)+lo(&g)).
568 SDOperand Hi = DAG.getNode(PPCISD::Hi, MVT::i32, CPI, Zero);
569 SDOperand Lo = DAG.getNode(PPCISD::Lo, MVT::i32, CPI, Zero);
570 return DAG.getNode(ISD::ADD, MVT::i32, Hi, Lo);
571 }
572
573 // Only lower ConstantPool on Darwin.
574 if (!getTargetMachine().getSubtarget<PPCSubtarget>().isDarwin()) break;
575 SDOperand Hi = DAG.getNode(PPCISD::Hi, MVT::i32, CPI, Zero);
Evan Cheng4c1aa862006-02-22 20:19:42 +0000576 if (getTargetMachine().getRelocationModel() == Reloc::PIC) {
Nate Begeman28a6b022005-12-10 02:36:00 +0000577 // With PIC, the first instruction is actually "GR+hi(&G)".
578 Hi = DAG.getNode(ISD::ADD, MVT::i32,
579 DAG.getNode(PPCISD::GlobalBaseReg, MVT::i32), Hi);
580 }
581
582 SDOperand Lo = DAG.getNode(PPCISD::Lo, MVT::i32, CPI, Zero);
583 Lo = DAG.getNode(ISD::ADD, MVT::i32, Hi, Lo);
584 return Lo;
585 }
Chris Lattner860e8862005-11-17 07:30:41 +0000586 case ISD::GlobalAddress: {
Nate Begeman50fb3c42005-12-24 01:00:15 +0000587 GlobalAddressSDNode *GSDN = cast<GlobalAddressSDNode>(Op);
588 GlobalValue *GV = GSDN->getGlobal();
589 SDOperand GA = DAG.getTargetGlobalAddress(GV, MVT::i32, GSDN->getOffset());
Chris Lattner860e8862005-11-17 07:30:41 +0000590 SDOperand Zero = DAG.getConstant(0, MVT::i32);
Chris Lattner1d05cb42005-11-17 18:55:48 +0000591
Evan Cheng4c1aa862006-02-22 20:19:42 +0000592 if (getTargetMachine().getRelocationModel() == Reloc::Static) {
Nate Begeman28a6b022005-12-10 02:36:00 +0000593 // Generate non-pic code that has direct accesses to globals.
594 // The address of the global is just (hi(&g)+lo(&g)).
Chris Lattner1d05cb42005-11-17 18:55:48 +0000595 SDOperand Hi = DAG.getNode(PPCISD::Hi, MVT::i32, GA, Zero);
596 SDOperand Lo = DAG.getNode(PPCISD::Lo, MVT::i32, GA, Zero);
597 return DAG.getNode(ISD::ADD, MVT::i32, Hi, Lo);
598 }
Chris Lattner860e8862005-11-17 07:30:41 +0000599
Chris Lattner1d05cb42005-11-17 18:55:48 +0000600 // Only lower GlobalAddress on Darwin.
601 if (!getTargetMachine().getSubtarget<PPCSubtarget>().isDarwin()) break;
Chris Lattnera35ef632006-01-06 01:04:03 +0000602
Chris Lattner860e8862005-11-17 07:30:41 +0000603 SDOperand Hi = DAG.getNode(PPCISD::Hi, MVT::i32, GA, Zero);
Evan Cheng4c1aa862006-02-22 20:19:42 +0000604 if (getTargetMachine().getRelocationModel() == Reloc::PIC) {
Chris Lattner860e8862005-11-17 07:30:41 +0000605 // With PIC, the first instruction is actually "GR+hi(&G)".
606 Hi = DAG.getNode(ISD::ADD, MVT::i32,
Chris Lattner15666132005-11-17 17:51:38 +0000607 DAG.getNode(PPCISD::GlobalBaseReg, MVT::i32), Hi);
Chris Lattner860e8862005-11-17 07:30:41 +0000608 }
609
610 SDOperand Lo = DAG.getNode(PPCISD::Lo, MVT::i32, GA, Zero);
611 Lo = DAG.getNode(ISD::ADD, MVT::i32, Hi, Lo);
612
Chris Lattner37dd6f12006-01-29 20:49:17 +0000613 if (!GV->hasWeakLinkage() && !GV->hasLinkOnceLinkage() &&
614 (!GV->isExternal() || GV->hasNotBeenReadFromBytecode()))
Chris Lattner860e8862005-11-17 07:30:41 +0000615 return Lo;
616
617 // If the global is weak or external, we have to go through the lazy
618 // resolution stub.
619 return DAG.getLoad(MVT::i32, DAG.getEntryNode(), Lo, DAG.getSrcValue(0));
620 }
Nate Begeman44775902006-01-31 08:17:29 +0000621 case ISD::SETCC: {
622 ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(2))->get();
Nate Begeman750ac1b2006-02-01 07:19:44 +0000623
624 // If we're comparing for equality to zero, expose the fact that this is
625 // implented as a ctlz/srl pair on ppc, so that the dag combiner can
626 // fold the new nodes.
627 if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
628 if (C->isNullValue() && CC == ISD::SETEQ) {
629 MVT::ValueType VT = Op.getOperand(0).getValueType();
630 SDOperand Zext = Op.getOperand(0);
631 if (VT < MVT::i32) {
632 VT = MVT::i32;
633 Zext = DAG.getNode(ISD::ZERO_EXTEND, VT, Op.getOperand(0));
634 }
635 unsigned Log2b = Log2_32(MVT::getSizeInBits(VT));
636 SDOperand Clz = DAG.getNode(ISD::CTLZ, VT, Zext);
637 SDOperand Scc = DAG.getNode(ISD::SRL, VT, Clz,
638 DAG.getConstant(Log2b, getShiftAmountTy()));
639 return DAG.getNode(ISD::TRUNCATE, getSetCCResultTy(), Scc);
640 }
641 // Leave comparisons against 0 and -1 alone for now, since they're usually
642 // optimized. FIXME: revisit this when we can custom lower all setcc
643 // optimizations.
644 if (C->isAllOnesValue() || C->isNullValue())
645 break;
646 }
647
648 // If we have an integer seteq/setne, turn it into a compare against zero
649 // by subtracting the rhs from the lhs, which is faster than setting a
650 // condition register, reading it back out, and masking the correct bit.
651 MVT::ValueType LHSVT = Op.getOperand(0).getValueType();
652 if (MVT::isInteger(LHSVT) && (CC == ISD::SETEQ || CC == ISD::SETNE)) {
653 MVT::ValueType VT = Op.getValueType();
654 SDOperand Sub = DAG.getNode(ISD::SUB, LHSVT, Op.getOperand(0),
655 Op.getOperand(1));
656 return DAG.getSetCC(VT, Sub, DAG.getConstant(0, LHSVT), CC);
657 }
Nate Begeman44775902006-01-31 08:17:29 +0000658 break;
659 }
Nate Begemanacc398c2006-01-25 18:21:52 +0000660 case ISD::VASTART: {
661 // vastart just stores the address of the VarArgsFrameIndex slot into the
662 // memory location argument.
663 // FIXME: Replace MVT::i32 with PointerTy
664 SDOperand FR = DAG.getFrameIndex(VarArgsFrameIndex, MVT::i32);
665 return DAG.getNode(ISD::STORE, MVT::Other, Op.getOperand(0), FR,
666 Op.getOperand(1), Op.getOperand(2));
667 }
Nate Begemanee625572006-01-27 21:09:22 +0000668 case ISD::RET: {
669 SDOperand Copy;
670
671 switch(Op.getNumOperands()) {
672 default:
673 assert(0 && "Do not know how to return this many arguments!");
674 abort();
675 case 1:
676 return SDOperand(); // ret void is legal
677 case 2: {
678 MVT::ValueType ArgVT = Op.getOperand(1).getValueType();
679 unsigned ArgReg = MVT::isInteger(ArgVT) ? PPC::R3 : PPC::F1;
680 Copy = DAG.getCopyToReg(Op.getOperand(0), ArgReg, Op.getOperand(1),
681 SDOperand());
682 break;
683 }
684 case 3:
685 Copy = DAG.getCopyToReg(Op.getOperand(0), PPC::R3, Op.getOperand(2),
686 SDOperand());
687 Copy = DAG.getCopyToReg(Copy, PPC::R4, Op.getOperand(1),Copy.getValue(1));
688 break;
689 }
690 return DAG.getNode(PPCISD::RET_FLAG, MVT::Other, Copy, Copy.getValue(1));
691 }
Chris Lattnerb2177b92006-03-19 06:55:52 +0000692 case ISD::SCALAR_TO_VECTOR: {
693 // Create a stack slot that is 16-byte aligned.
694 MachineFrameInfo *FrameInfo = DAG.getMachineFunction().getFrameInfo();
695 int FrameIdx = FrameInfo->CreateStackObject(16, 16);
696 SDOperand FIdx = DAG.getFrameIndex(FrameIdx, MVT::i32);
697
698 // Store the input value into Value#0 of the stack slot.
Chris Lattnerb2177b92006-03-19 06:55:52 +0000699 SDOperand Store = DAG.getNode(ISD::STORE, MVT::Other, DAG.getEntryNode(),
700 Op.getOperand(0), FIdx,DAG.getSrcValue(NULL));
Chris Lattner7f20b132006-03-28 01:43:22 +0000701 // Load it out.
702 return DAG.getLoad(Op.getValueType(), Store, FIdx, DAG.getSrcValue(NULL));
Chris Lattnerb2177b92006-03-19 06:55:52 +0000703 }
Chris Lattner64b3a082006-03-24 07:48:08 +0000704 case ISD::BUILD_VECTOR:
705 // If this is a case we can't handle, return null and let the default
706 // expansion code take care of it. If we CAN select this case, return Op.
707
708 // See if this is all zeros.
709 // FIXME: We should handle splat(-0.0), and other cases here.
Evan Cheng5b6a01b2006-03-26 09:52:32 +0000710 if (ISD::isBuildVectorAllZeros(Op.Val))
Chris Lattner64b3a082006-03-24 07:48:08 +0000711 return Op;
Chris Lattner9c61dcf2006-03-25 06:12:06 +0000712
713 if (PPC::isVecSplatImm(Op.Val, 1) || // vspltisb
714 PPC::isVecSplatImm(Op.Val, 2) || // vspltish
715 PPC::isVecSplatImm(Op.Val, 4)) // vspltisw
716 return Op;
717
Chris Lattner64b3a082006-03-24 07:48:08 +0000718 return SDOperand();
719
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000720 case ISD::VECTOR_SHUFFLE: {
Chris Lattnerdd4d2d02006-03-20 06:51:10 +0000721 SDOperand V1 = Op.getOperand(0);
722 SDOperand V2 = Op.getOperand(1);
723 SDOperand PermMask = Op.getOperand(2);
724
725 // Cases that are handled by instructions that take permute immediates
726 // (such as vsplt*) should be left as VECTOR_SHUFFLE nodes so they can be
727 // selected by the instruction selector.
728 if (PPC::isSplatShuffleMask(PermMask.Val) && V2.getOpcode() == ISD::UNDEF)
729 break;
730
731 // TODO: Handle more cases, and also handle cases that are cheaper to do as
732 // multiple such instructions than as a constant pool load/vperm pair.
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000733
734 // Lower this to a VPERM(V1, V2, V3) expression, where V3 is a constant
735 // vector that will get spilled to the constant pool.
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000736 if (V2.getOpcode() == ISD::UNDEF) V2 = V1;
Chris Lattnerf1d0b2b2006-03-20 01:53:53 +0000737
738 // The SHUFFLE_VECTOR mask is almost exactly what we want for vperm, except
739 // that it is in input element units, not in bytes. Convert now.
740 MVT::ValueType EltVT = MVT::getVectorBaseType(V1.getValueType());
741 unsigned BytesPerElement = MVT::getSizeInBits(EltVT)/8;
742
743 std::vector<SDOperand> ResultMask;
744 for (unsigned i = 0, e = PermMask.getNumOperands(); i != e; ++i) {
745 unsigned SrcElt =cast<ConstantSDNode>(PermMask.getOperand(i))->getValue();
746
747 for (unsigned j = 0; j != BytesPerElement; ++j)
748 ResultMask.push_back(DAG.getConstant(SrcElt*BytesPerElement+j,
749 MVT::i8));
750 }
751
752 SDOperand VPermMask =DAG.getNode(ISD::BUILD_VECTOR, MVT::v16i8, ResultMask);
753 return DAG.getNode(PPCISD::VPERM, V1.getValueType(), V1, V2, VPermMask);
754 }
Chris Lattner48b61a72006-03-28 00:40:33 +0000755 case ISD::INTRINSIC_WO_CHAIN: {
Chris Lattnera17b1552006-03-31 05:13:27 +0000756 unsigned IntNo=cast<ConstantSDNode>(Op.getOperand(0))->getValue();
Chris Lattner6d92cad2006-03-26 10:06:40 +0000757
758 // If this is a lowered altivec predicate compare, CompareOpc is set to the
759 // opcode number of the comparison.
760 int CompareOpc = -1;
Chris Lattnera17b1552006-03-31 05:13:27 +0000761 bool isDot = false;
Chris Lattner6d92cad2006-03-26 10:06:40 +0000762 switch (IntNo) {
763 default: return SDOperand(); // Don't custom lower most intrinsics.
Chris Lattnera17b1552006-03-31 05:13:27 +0000764 // Comparison predicates.
765 case Intrinsic::ppc_altivec_vcmpbfp_p: CompareOpc = 966; isDot = 1; break;
766 case Intrinsic::ppc_altivec_vcmpeqfp_p: CompareOpc = 198; isDot = 1; break;
767 case Intrinsic::ppc_altivec_vcmpequb_p: CompareOpc = 6; isDot = 1; break;
768 case Intrinsic::ppc_altivec_vcmpequh_p: CompareOpc = 70; isDot = 1; break;
769 case Intrinsic::ppc_altivec_vcmpequw_p: CompareOpc = 134; isDot = 1; break;
770 case Intrinsic::ppc_altivec_vcmpgefp_p: CompareOpc = 454; isDot = 1; break;
771 case Intrinsic::ppc_altivec_vcmpgtfp_p: CompareOpc = 710; isDot = 1; break;
772 case Intrinsic::ppc_altivec_vcmpgtsb_p: CompareOpc = 774; isDot = 1; break;
773 case Intrinsic::ppc_altivec_vcmpgtsh_p: CompareOpc = 838; isDot = 1; break;
774 case Intrinsic::ppc_altivec_vcmpgtsw_p: CompareOpc = 902; isDot = 1; break;
775 case Intrinsic::ppc_altivec_vcmpgtub_p: CompareOpc = 518; isDot = 1; break;
776 case Intrinsic::ppc_altivec_vcmpgtuh_p: CompareOpc = 582; isDot = 1; break;
777 case Intrinsic::ppc_altivec_vcmpgtuw_p: CompareOpc = 646; isDot = 1; break;
778
779 // Normal Comparisons.
780 case Intrinsic::ppc_altivec_vcmpbfp: CompareOpc = 966; isDot = 0; break;
781 case Intrinsic::ppc_altivec_vcmpeqfp: CompareOpc = 198; isDot = 0; break;
782 case Intrinsic::ppc_altivec_vcmpequb: CompareOpc = 6; isDot = 0; break;
783 case Intrinsic::ppc_altivec_vcmpequh: CompareOpc = 70; isDot = 0; break;
784 case Intrinsic::ppc_altivec_vcmpequw: CompareOpc = 134; isDot = 0; break;
785 case Intrinsic::ppc_altivec_vcmpgefp: CompareOpc = 454; isDot = 0; break;
786 case Intrinsic::ppc_altivec_vcmpgtfp: CompareOpc = 710; isDot = 0; break;
787 case Intrinsic::ppc_altivec_vcmpgtsb: CompareOpc = 774; isDot = 0; break;
788 case Intrinsic::ppc_altivec_vcmpgtsh: CompareOpc = 838; isDot = 0; break;
789 case Intrinsic::ppc_altivec_vcmpgtsw: CompareOpc = 902; isDot = 0; break;
790 case Intrinsic::ppc_altivec_vcmpgtub: CompareOpc = 518; isDot = 0; break;
791 case Intrinsic::ppc_altivec_vcmpgtuh: CompareOpc = 582; isDot = 0; break;
792 case Intrinsic::ppc_altivec_vcmpgtuw: CompareOpc = 646; isDot = 0; break;
Chris Lattner6d92cad2006-03-26 10:06:40 +0000793 }
794
795 assert(CompareOpc>0 && "We only lower altivec predicate compares so far!");
796
Chris Lattnera17b1552006-03-31 05:13:27 +0000797 // If this is a non-dot comparison, make the VCMP node.
798 if (!isDot)
799 return DAG.getNode(PPCISD::VCMP, Op.getOperand(2).getValueType(),
800 Op.getOperand(1), Op.getOperand(2),
801 DAG.getConstant(CompareOpc, MVT::i32));
802
Chris Lattner6d92cad2006-03-26 10:06:40 +0000803 // Create the PPCISD altivec 'dot' comparison node.
804 std::vector<SDOperand> Ops;
805 std::vector<MVT::ValueType> VTs;
806 Ops.push_back(Op.getOperand(2)); // LHS
807 Ops.push_back(Op.getOperand(3)); // RHS
808 Ops.push_back(DAG.getConstant(CompareOpc, MVT::i32));
809 VTs.push_back(Op.getOperand(2).getValueType());
810 VTs.push_back(MVT::Flag);
811 SDOperand CompNode = DAG.getNode(PPCISD::VCMPo, VTs, Ops);
812
813 // Now that we have the comparison, emit a copy from the CR to a GPR.
814 // This is flagged to the above dot comparison.
815 SDOperand Flags = DAG.getNode(PPCISD::MFCR, MVT::i32,
816 DAG.getRegister(PPC::CR6, MVT::i32),
817 CompNode.getValue(1));
818
819 // Unpack the result based on how the target uses it.
820 unsigned BitNo; // Bit # of CR6.
821 bool InvertBit; // Invert result?
822 switch (cast<ConstantSDNode>(Op.getOperand(1))->getValue()) {
823 default: // Can't happen, don't crash on invalid number though.
824 case 0: // Return the value of the EQ bit of CR6.
825 BitNo = 0; InvertBit = false;
826 break;
827 case 1: // Return the inverted value of the EQ bit of CR6.
828 BitNo = 0; InvertBit = true;
829 break;
830 case 2: // Return the value of the LT bit of CR6.
831 BitNo = 2; InvertBit = false;
832 break;
833 case 3: // Return the inverted value of the LT bit of CR6.
834 BitNo = 2; InvertBit = true;
835 break;
836 }
837
838 // Shift the bit into the low position.
839 Flags = DAG.getNode(ISD::SRL, MVT::i32, Flags,
840 DAG.getConstant(8-(3-BitNo), MVT::i32));
841 // Isolate the bit.
842 Flags = DAG.getNode(ISD::AND, MVT::i32, Flags,
843 DAG.getConstant(1, MVT::i32));
844
845 // If we are supposed to, toggle the bit.
846 if (InvertBit)
847 Flags = DAG.getNode(ISD::XOR, MVT::i32, Flags,
848 DAG.getConstant(1, MVT::i32));
849 return Flags;
850 }
Chris Lattnerbc11c342005-08-31 20:23:54 +0000851 }
Chris Lattnere4bc9ea2005-08-26 00:52:45 +0000852 return SDOperand();
853}
854
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000855std::vector<SDOperand>
Nate Begeman21e463b2005-10-16 05:39:50 +0000856PPCTargetLowering::LowerArguments(Function &F, SelectionDAG &DAG) {
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000857 //
858 // add beautiful description of PPC stack frame format, or at least some docs
859 //
860 MachineFunction &MF = DAG.getMachineFunction();
861 MachineFrameInfo *MFI = MF.getFrameInfo();
862 MachineBasicBlock& BB = MF.front();
Chris Lattner7b738342005-09-13 19:33:40 +0000863 SSARegMap *RegMap = MF.getSSARegMap();
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000864 std::vector<SDOperand> ArgValues;
865
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000866 unsigned ArgOffset = 24;
867 unsigned GPR_remaining = 8;
868 unsigned FPR_remaining = 13;
869 unsigned GPR_idx = 0, FPR_idx = 0;
870 static const unsigned GPR[] = {
871 PPC::R3, PPC::R4, PPC::R5, PPC::R6,
872 PPC::R7, PPC::R8, PPC::R9, PPC::R10,
873 };
874 static const unsigned FPR[] = {
875 PPC::F1, PPC::F2, PPC::F3, PPC::F4, PPC::F5, PPC::F6, PPC::F7,
876 PPC::F8, PPC::F9, PPC::F10, PPC::F11, PPC::F12, PPC::F13
877 };
878
879 // Add DAG nodes to load the arguments... On entry to a function on PPC,
880 // the arguments start at offset 24, although they are likely to be passed
881 // in registers.
882 for (Function::arg_iterator I = F.arg_begin(), E = F.arg_end(); I != E; ++I) {
883 SDOperand newroot, argt;
884 unsigned ObjSize;
885 bool needsLoad = false;
886 bool ArgLive = !I->use_empty();
887 MVT::ValueType ObjectVT = getValueType(I->getType());
888
889 switch (ObjectVT) {
Chris Lattner915fb302005-08-30 00:19:00 +0000890 default: assert(0 && "Unhandled argument type!");
891 case MVT::i1:
892 case MVT::i8:
893 case MVT::i16:
894 case MVT::i32:
895 ObjSize = 4;
896 if (!ArgLive) break;
897 if (GPR_remaining > 0) {
Nate Begeman1d9d7422005-10-18 00:28:58 +0000898 unsigned VReg = RegMap->createVirtualRegister(&PPC::GPRCRegClass);
Chris Lattner7b738342005-09-13 19:33:40 +0000899 MF.addLiveIn(GPR[GPR_idx], VReg);
900 argt = newroot = DAG.getCopyFromReg(DAG.getRoot(), VReg, MVT::i32);
Nate Begeman49296f12005-08-31 01:58:39 +0000901 if (ObjectVT != MVT::i32) {
902 unsigned AssertOp = I->getType()->isSigned() ? ISD::AssertSext
903 : ISD::AssertZext;
904 argt = DAG.getNode(AssertOp, MVT::i32, argt,
905 DAG.getValueType(ObjectVT));
906 argt = DAG.getNode(ISD::TRUNCATE, ObjectVT, argt);
907 }
Chris Lattner915fb302005-08-30 00:19:00 +0000908 } else {
909 needsLoad = true;
910 }
911 break;
Chris Lattner80720a92005-11-30 20:40:54 +0000912 case MVT::i64:
913 ObjSize = 8;
Chris Lattner915fb302005-08-30 00:19:00 +0000914 if (!ArgLive) break;
915 if (GPR_remaining > 0) {
916 SDOperand argHi, argLo;
Nate Begeman1d9d7422005-10-18 00:28:58 +0000917 unsigned VReg = RegMap->createVirtualRegister(&PPC::GPRCRegClass);
Chris Lattner7b738342005-09-13 19:33:40 +0000918 MF.addLiveIn(GPR[GPR_idx], VReg);
919 argHi = DAG.getCopyFromReg(DAG.getRoot(), VReg, MVT::i32);
Chris Lattner915fb302005-08-30 00:19:00 +0000920 // If we have two or more remaining argument registers, then both halves
921 // of the i64 can be sourced from there. Otherwise, the lower half will
922 // have to come off the stack. This can happen when an i64 is preceded
923 // by 28 bytes of arguments.
924 if (GPR_remaining > 1) {
Nate Begeman1d9d7422005-10-18 00:28:58 +0000925 unsigned VReg = RegMap->createVirtualRegister(&PPC::GPRCRegClass);
Chris Lattner7b738342005-09-13 19:33:40 +0000926 MF.addLiveIn(GPR[GPR_idx+1], VReg);
927 argLo = DAG.getCopyFromReg(argHi, VReg, MVT::i32);
Chris Lattner915fb302005-08-30 00:19:00 +0000928 } else {
929 int FI = MFI->CreateFixedObject(4, ArgOffset+4);
930 SDOperand FIN = DAG.getFrameIndex(FI, MVT::i32);
931 argLo = DAG.getLoad(MVT::i32, DAG.getEntryNode(), FIN,
932 DAG.getSrcValue(NULL));
933 }
934 // Build the outgoing arg thingy
935 argt = DAG.getNode(ISD::BUILD_PAIR, MVT::i64, argLo, argHi);
936 newroot = argLo;
937 } else {
938 needsLoad = true;
939 }
940 break;
941 case MVT::f32:
942 case MVT::f64:
943 ObjSize = (ObjectVT == MVT::f64) ? 8 : 4;
Chris Lattner413b9792006-01-11 18:21:25 +0000944 if (!ArgLive) {
945 if (FPR_remaining > 0) {
946 --FPR_remaining;
947 ++FPR_idx;
948 }
949 break;
950 }
Chris Lattner915fb302005-08-30 00:19:00 +0000951 if (FPR_remaining > 0) {
Chris Lattner919c0322005-10-01 01:35:02 +0000952 unsigned VReg;
953 if (ObjectVT == MVT::f32)
Nate Begeman1d9d7422005-10-18 00:28:58 +0000954 VReg = RegMap->createVirtualRegister(&PPC::F4RCRegClass);
Chris Lattner919c0322005-10-01 01:35:02 +0000955 else
Nate Begeman1d9d7422005-10-18 00:28:58 +0000956 VReg = RegMap->createVirtualRegister(&PPC::F8RCRegClass);
Chris Lattner7b738342005-09-13 19:33:40 +0000957 MF.addLiveIn(FPR[FPR_idx], VReg);
958 argt = newroot = DAG.getCopyFromReg(DAG.getRoot(), VReg, ObjectVT);
Chris Lattner915fb302005-08-30 00:19:00 +0000959 --FPR_remaining;
960 ++FPR_idx;
961 } else {
962 needsLoad = true;
963 }
964 break;
Chris Lattner7c5a3d32005-08-16 17:14:42 +0000965 }
966
967 // We need to load the argument to a virtual register if we determined above
968 // that we ran out of physical registers of the appropriate type
969 if (needsLoad) {
970 unsigned SubregOffset = 0;
971 if (ObjectVT == MVT::i8 || ObjectVT == MVT::i1) SubregOffset = 3;
972 if (ObjectVT == MVT::i16) SubregOffset = 2;
973 int FI = MFI->CreateFixedObject(ObjSize, ArgOffset);
974 SDOperand FIN = DAG.getFrameIndex(FI, MVT::i32);
975 FIN = DAG.getNode(ISD::ADD, MVT::i32, FIN,
976 DAG.getConstant(SubregOffset, MVT::i32));
977 argt = newroot = DAG.getLoad(ObjectVT, DAG.getEntryNode(), FIN,
978 DAG.getSrcValue(NULL));
979 }
980
981 // Every 4 bytes of argument space consumes one of the GPRs available for
982 // argument passing.
983 if (GPR_remaining > 0) {
984 unsigned delta = (GPR_remaining > 1 && ObjSize == 8) ? 2 : 1;
985 GPR_remaining -= delta;
986 GPR_idx += delta;
987 }
988 ArgOffset += ObjSize;
989 if (newroot.Val)
990 DAG.setRoot(newroot.getValue(1));
991
992 ArgValues.push_back(argt);
993 }
994
995 // If the function takes variable number of arguments, make a frame index for
996 // the start of the first vararg value... for expansion of llvm.va_start.
997 if (F.isVarArg()) {
998 VarArgsFrameIndex = MFI->CreateFixedObject(4, ArgOffset);
999 SDOperand FIN = DAG.getFrameIndex(VarArgsFrameIndex, MVT::i32);
1000 // If this function is vararg, store any remaining integer argument regs
1001 // to their spots on the stack so that they may be loaded by deferencing the
1002 // result of va_next.
1003 std::vector<SDOperand> MemOps;
1004 for (; GPR_remaining > 0; --GPR_remaining, ++GPR_idx) {
Nate Begeman1d9d7422005-10-18 00:28:58 +00001005 unsigned VReg = RegMap->createVirtualRegister(&PPC::GPRCRegClass);
Chris Lattner7b738342005-09-13 19:33:40 +00001006 MF.addLiveIn(GPR[GPR_idx], VReg);
1007 SDOperand Val = DAG.getCopyFromReg(DAG.getRoot(), VReg, MVT::i32);
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001008 SDOperand Store = DAG.getNode(ISD::STORE, MVT::Other, Val.getValue(1),
1009 Val, FIN, DAG.getSrcValue(NULL));
1010 MemOps.push_back(Store);
1011 // Increment the address by four for the next argument to store
1012 SDOperand PtrOff = DAG.getConstant(4, getPointerTy());
1013 FIN = DAG.getNode(ISD::ADD, MVT::i32, FIN, PtrOff);
1014 }
Chris Lattner80720a92005-11-30 20:40:54 +00001015 if (!MemOps.empty()) {
1016 MemOps.push_back(DAG.getRoot());
1017 DAG.setRoot(DAG.getNode(ISD::TokenFactor, MVT::Other, MemOps));
1018 }
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001019 }
1020
1021 // Finally, inform the code generator which regs we return values in.
1022 switch (getValueType(F.getReturnType())) {
1023 default: assert(0 && "Unknown type!");
1024 case MVT::isVoid: break;
1025 case MVT::i1:
1026 case MVT::i8:
1027 case MVT::i16:
1028 case MVT::i32:
1029 MF.addLiveOut(PPC::R3);
1030 break;
1031 case MVT::i64:
1032 MF.addLiveOut(PPC::R3);
1033 MF.addLiveOut(PPC::R4);
1034 break;
1035 case MVT::f32:
1036 case MVT::f64:
1037 MF.addLiveOut(PPC::F1);
1038 break;
1039 }
1040
1041 return ArgValues;
1042}
1043
1044std::pair<SDOperand, SDOperand>
Nate Begeman21e463b2005-10-16 05:39:50 +00001045PPCTargetLowering::LowerCallTo(SDOperand Chain,
1046 const Type *RetTy, bool isVarArg,
1047 unsigned CallingConv, bool isTailCall,
1048 SDOperand Callee, ArgListTy &Args,
1049 SelectionDAG &DAG) {
Chris Lattner281b55e2006-01-27 23:34:02 +00001050 // args_to_use will accumulate outgoing args for the PPCISD::CALL case in
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001051 // SelectExpr to use to put the arguments in the appropriate registers.
1052 std::vector<SDOperand> args_to_use;
1053
1054 // Count how many bytes are to be pushed on the stack, including the linkage
1055 // area, and parameter passing area.
1056 unsigned NumBytes = 24;
1057
1058 if (Args.empty()) {
Chris Lattner45b39762006-02-13 08:55:29 +00001059 Chain = DAG.getCALLSEQ_START(Chain,
1060 DAG.getConstant(NumBytes, getPointerTy()));
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001061 } else {
Chris Lattner915fb302005-08-30 00:19:00 +00001062 for (unsigned i = 0, e = Args.size(); i != e; ++i) {
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001063 switch (getValueType(Args[i].second)) {
Chris Lattner915fb302005-08-30 00:19:00 +00001064 default: assert(0 && "Unknown value type!");
1065 case MVT::i1:
1066 case MVT::i8:
1067 case MVT::i16:
1068 case MVT::i32:
1069 case MVT::f32:
1070 NumBytes += 4;
1071 break;
1072 case MVT::i64:
1073 case MVT::f64:
1074 NumBytes += 8;
1075 break;
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001076 }
Chris Lattner915fb302005-08-30 00:19:00 +00001077 }
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001078
Chris Lattner915fb302005-08-30 00:19:00 +00001079 // Just to be safe, we'll always reserve the full 24 bytes of linkage area
1080 // plus 32 bytes of argument space in case any called code gets funky on us.
1081 // (Required by ABI to support var arg)
1082 if (NumBytes < 56) NumBytes = 56;
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001083
1084 // Adjust the stack pointer for the new arguments...
1085 // These operations are automatically eliminated by the prolog/epilog pass
Chris Lattner45b39762006-02-13 08:55:29 +00001086 Chain = DAG.getCALLSEQ_START(Chain,
1087 DAG.getConstant(NumBytes, getPointerTy()));
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001088
1089 // Set up a copy of the stack pointer for use loading and storing any
1090 // arguments that may not fit in the registers available for argument
1091 // passing.
Chris Lattnera243db82006-01-11 19:55:07 +00001092 SDOperand StackPtr = DAG.getRegister(PPC::R1, MVT::i32);
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001093
1094 // Figure out which arguments are going to go in registers, and which in
1095 // memory. Also, if this is a vararg function, floating point operations
1096 // must be stored to our stack, and loaded into integer regs as well, if
1097 // any integer regs are available for argument passing.
1098 unsigned ArgOffset = 24;
1099 unsigned GPR_remaining = 8;
1100 unsigned FPR_remaining = 13;
1101
1102 std::vector<SDOperand> MemOps;
1103 for (unsigned i = 0, e = Args.size(); i != e; ++i) {
1104 // PtrOff will be used to store the current argument to the stack if a
1105 // register cannot be found for it.
1106 SDOperand PtrOff = DAG.getConstant(ArgOffset, getPointerTy());
1107 PtrOff = DAG.getNode(ISD::ADD, MVT::i32, StackPtr, PtrOff);
1108 MVT::ValueType ArgVT = getValueType(Args[i].second);
1109
1110 switch (ArgVT) {
Chris Lattner915fb302005-08-30 00:19:00 +00001111 default: assert(0 && "Unexpected ValueType for argument!");
1112 case MVT::i1:
1113 case MVT::i8:
1114 case MVT::i16:
1115 // Promote the integer to 32 bits. If the input type is signed use a
1116 // sign extend, otherwise use a zero extend.
1117 if (Args[i].second->isSigned())
1118 Args[i].first =DAG.getNode(ISD::SIGN_EXTEND, MVT::i32, Args[i].first);
1119 else
1120 Args[i].first =DAG.getNode(ISD::ZERO_EXTEND, MVT::i32, Args[i].first);
1121 // FALL THROUGH
1122 case MVT::i32:
1123 if (GPR_remaining > 0) {
1124 args_to_use.push_back(Args[i].first);
1125 --GPR_remaining;
1126 } else {
1127 MemOps.push_back(DAG.getNode(ISD::STORE, MVT::Other, Chain,
1128 Args[i].first, PtrOff,
1129 DAG.getSrcValue(NULL)));
1130 }
1131 ArgOffset += 4;
1132 break;
1133 case MVT::i64:
1134 // If we have one free GPR left, we can place the upper half of the i64
1135 // in it, and store the other half to the stack. If we have two or more
1136 // free GPRs, then we can pass both halves of the i64 in registers.
1137 if (GPR_remaining > 0) {
1138 SDOperand Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32,
1139 Args[i].first, DAG.getConstant(1, MVT::i32));
1140 SDOperand Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, MVT::i32,
1141 Args[i].first, DAG.getConstant(0, MVT::i32));
1142 args_to_use.push_back(Hi);
1143 --GPR_remaining;
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001144 if (GPR_remaining > 0) {
Chris Lattner915fb302005-08-30 00:19:00 +00001145 args_to_use.push_back(Lo);
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001146 --GPR_remaining;
1147 } else {
Chris Lattner915fb302005-08-30 00:19:00 +00001148 SDOperand ConstFour = DAG.getConstant(4, getPointerTy());
1149 PtrOff = DAG.getNode(ISD::ADD, MVT::i32, PtrOff, ConstFour);
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001150 MemOps.push_back(DAG.getNode(ISD::STORE, MVT::Other, Chain,
Chris Lattner915fb302005-08-30 00:19:00 +00001151 Lo, PtrOff, DAG.getSrcValue(NULL)));
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001152 }
Chris Lattner915fb302005-08-30 00:19:00 +00001153 } else {
1154 MemOps.push_back(DAG.getNode(ISD::STORE, MVT::Other, Chain,
1155 Args[i].first, PtrOff,
1156 DAG.getSrcValue(NULL)));
1157 }
1158 ArgOffset += 8;
1159 break;
1160 case MVT::f32:
1161 case MVT::f64:
1162 if (FPR_remaining > 0) {
1163 args_to_use.push_back(Args[i].first);
1164 --FPR_remaining;
1165 if (isVarArg) {
1166 SDOperand Store = DAG.getNode(ISD::STORE, MVT::Other, Chain,
1167 Args[i].first, PtrOff,
1168 DAG.getSrcValue(NULL));
1169 MemOps.push_back(Store);
1170 // Float varargs are always shadowed in available integer registers
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001171 if (GPR_remaining > 0) {
Chris Lattner915fb302005-08-30 00:19:00 +00001172 SDOperand Load = DAG.getLoad(MVT::i32, Store, PtrOff,
1173 DAG.getSrcValue(NULL));
Chris Lattner1df74782005-11-17 18:30:17 +00001174 MemOps.push_back(Load.getValue(1));
Chris Lattner915fb302005-08-30 00:19:00 +00001175 args_to_use.push_back(Load);
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001176 --GPR_remaining;
Chris Lattner915fb302005-08-30 00:19:00 +00001177 }
1178 if (GPR_remaining > 0 && MVT::f64 == ArgVT) {
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001179 SDOperand ConstFour = DAG.getConstant(4, getPointerTy());
1180 PtrOff = DAG.getNode(ISD::ADD, MVT::i32, PtrOff, ConstFour);
Chris Lattner915fb302005-08-30 00:19:00 +00001181 SDOperand Load = DAG.getLoad(MVT::i32, Store, PtrOff,
1182 DAG.getSrcValue(NULL));
Chris Lattner1df74782005-11-17 18:30:17 +00001183 MemOps.push_back(Load.getValue(1));
Chris Lattner915fb302005-08-30 00:19:00 +00001184 args_to_use.push_back(Load);
1185 --GPR_remaining;
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001186 }
1187 } else {
Chris Lattner915fb302005-08-30 00:19:00 +00001188 // If we have any FPRs remaining, we may also have GPRs remaining.
1189 // Args passed in FPRs consume either 1 (f32) or 2 (f64) available
1190 // GPRs.
1191 if (GPR_remaining > 0) {
1192 args_to_use.push_back(DAG.getNode(ISD::UNDEF, MVT::i32));
1193 --GPR_remaining;
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001194 }
Chris Lattner915fb302005-08-30 00:19:00 +00001195 if (GPR_remaining > 0 && MVT::f64 == ArgVT) {
1196 args_to_use.push_back(DAG.getNode(ISD::UNDEF, MVT::i32));
1197 --GPR_remaining;
1198 }
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001199 }
Chris Lattner915fb302005-08-30 00:19:00 +00001200 } else {
1201 MemOps.push_back(DAG.getNode(ISD::STORE, MVT::Other, Chain,
1202 Args[i].first, PtrOff,
1203 DAG.getSrcValue(NULL)));
1204 }
1205 ArgOffset += (ArgVT == MVT::f32) ? 4 : 8;
1206 break;
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001207 }
1208 }
1209 if (!MemOps.empty())
1210 Chain = DAG.getNode(ISD::TokenFactor, MVT::Other, MemOps);
1211 }
1212
1213 std::vector<MVT::ValueType> RetVals;
1214 MVT::ValueType RetTyVT = getValueType(RetTy);
Chris Lattnerf5059492005-09-02 01:24:55 +00001215 MVT::ValueType ActualRetTyVT = RetTyVT;
1216 if (RetTyVT >= MVT::i1 && RetTyVT <= MVT::i16)
1217 ActualRetTyVT = MVT::i32; // Promote result to i32.
1218
Chris Lattnere00ebf02006-01-28 07:33:03 +00001219 if (RetTyVT == MVT::i64) {
1220 RetVals.push_back(MVT::i32);
1221 RetVals.push_back(MVT::i32);
1222 } else if (RetTyVT != MVT::isVoid) {
Chris Lattnerf5059492005-09-02 01:24:55 +00001223 RetVals.push_back(ActualRetTyVT);
Chris Lattnere00ebf02006-01-28 07:33:03 +00001224 }
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001225 RetVals.push_back(MVT::Other);
1226
Chris Lattner2823b3e2005-11-17 05:56:14 +00001227 // If the callee is a GlobalAddress node (quite common, every direct call is)
1228 // turn it into a TargetGlobalAddress node so that legalize doesn't hack it.
1229 if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee))
1230 Callee = DAG.getTargetGlobalAddress(G->getGlobal(), MVT::i32);
1231
Chris Lattner281b55e2006-01-27 23:34:02 +00001232 std::vector<SDOperand> Ops;
1233 Ops.push_back(Chain);
1234 Ops.push_back(Callee);
1235 Ops.insert(Ops.end(), args_to_use.begin(), args_to_use.end());
1236 SDOperand TheCall = DAG.getNode(PPCISD::CALL, RetVals, Ops);
Chris Lattnere00ebf02006-01-28 07:33:03 +00001237 Chain = TheCall.getValue(TheCall.Val->getNumValues()-1);
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001238 Chain = DAG.getNode(ISD::CALLSEQ_END, MVT::Other, Chain,
1239 DAG.getConstant(NumBytes, getPointerTy()));
Chris Lattnerf5059492005-09-02 01:24:55 +00001240 SDOperand RetVal = TheCall;
1241
1242 // If the result is a small value, add a note so that we keep track of the
1243 // information about whether it is sign or zero extended.
1244 if (RetTyVT != ActualRetTyVT) {
1245 RetVal = DAG.getNode(RetTy->isSigned() ? ISD::AssertSext : ISD::AssertZext,
1246 MVT::i32, RetVal, DAG.getValueType(RetTyVT));
1247 RetVal = DAG.getNode(ISD::TRUNCATE, RetTyVT, RetVal);
Chris Lattnere00ebf02006-01-28 07:33:03 +00001248 } else if (RetTyVT == MVT::i64) {
1249 RetVal = DAG.getNode(ISD::BUILD_PAIR, MVT::i64, RetVal, RetVal.getValue(1));
Chris Lattnerf5059492005-09-02 01:24:55 +00001250 }
1251
1252 return std::make_pair(RetVal, Chain);
Chris Lattner7c5a3d32005-08-16 17:14:42 +00001253}
1254
Chris Lattner8a2d3ca2005-08-26 21:23:58 +00001255MachineBasicBlock *
Nate Begeman21e463b2005-10-16 05:39:50 +00001256PPCTargetLowering::InsertAtEndOfBasicBlock(MachineInstr *MI,
1257 MachineBasicBlock *BB) {
Chris Lattner8a2d3ca2005-08-26 21:23:58 +00001258 assert((MI->getOpcode() == PPC::SELECT_CC_Int ||
Chris Lattner919c0322005-10-01 01:35:02 +00001259 MI->getOpcode() == PPC::SELECT_CC_F4 ||
1260 MI->getOpcode() == PPC::SELECT_CC_F8) &&
Chris Lattner8a2d3ca2005-08-26 21:23:58 +00001261 "Unexpected instr type to insert");
1262
1263 // To "insert" a SELECT_CC instruction, we actually have to insert the diamond
1264 // control-flow pattern. The incoming instruction knows the destination vreg
1265 // to set, the condition code register to branch on, the true/false values to
1266 // select between, and a branch opcode to use.
1267 const BasicBlock *LLVM_BB = BB->getBasicBlock();
1268 ilist<MachineBasicBlock>::iterator It = BB;
1269 ++It;
1270
1271 // thisMBB:
1272 // ...
1273 // TrueVal = ...
1274 // cmpTY ccX, r1, r2
1275 // bCC copy1MBB
1276 // fallthrough --> copy0MBB
1277 MachineBasicBlock *thisMBB = BB;
1278 MachineBasicBlock *copy0MBB = new MachineBasicBlock(LLVM_BB);
1279 MachineBasicBlock *sinkMBB = new MachineBasicBlock(LLVM_BB);
1280 BuildMI(BB, MI->getOperand(4).getImmedValue(), 2)
1281 .addReg(MI->getOperand(1).getReg()).addMBB(sinkMBB);
1282 MachineFunction *F = BB->getParent();
1283 F->getBasicBlockList().insert(It, copy0MBB);
1284 F->getBasicBlockList().insert(It, sinkMBB);
Nate Begemanf15485a2006-03-27 01:32:24 +00001285 // Update machine-CFG edges by first adding all successors of the current
1286 // block to the new block which will contain the Phi node for the select.
1287 for(MachineBasicBlock::succ_iterator i = BB->succ_begin(),
1288 e = BB->succ_end(); i != e; ++i)
1289 sinkMBB->addSuccessor(*i);
1290 // Next, remove all successors of the current block, and add the true
1291 // and fallthrough blocks as its successors.
1292 while(!BB->succ_empty())
1293 BB->removeSuccessor(BB->succ_begin());
Chris Lattner8a2d3ca2005-08-26 21:23:58 +00001294 BB->addSuccessor(copy0MBB);
1295 BB->addSuccessor(sinkMBB);
1296
1297 // copy0MBB:
1298 // %FalseValue = ...
1299 // # fallthrough to sinkMBB
1300 BB = copy0MBB;
1301
1302 // Update machine-CFG edges
1303 BB->addSuccessor(sinkMBB);
1304
1305 // sinkMBB:
1306 // %Result = phi [ %FalseValue, copy0MBB ], [ %TrueValue, thisMBB ]
1307 // ...
1308 BB = sinkMBB;
1309 BuildMI(BB, PPC::PHI, 4, MI->getOperand(0).getReg())
1310 .addReg(MI->getOperand(3).getReg()).addMBB(copy0MBB)
1311 .addReg(MI->getOperand(2).getReg()).addMBB(thisMBB);
1312
1313 delete MI; // The pseudo instruction is gone now.
1314 return BB;
1315}
1316
Chris Lattner8c13d0a2006-03-01 04:57:39 +00001317SDOperand PPCTargetLowering::PerformDAGCombine(SDNode *N,
1318 DAGCombinerInfo &DCI) const {
1319 TargetMachine &TM = getTargetMachine();
1320 SelectionDAG &DAG = DCI.DAG;
1321 switch (N->getOpcode()) {
1322 default: break;
1323 case ISD::SINT_TO_FP:
1324 if (TM.getSubtarget<PPCSubtarget>().is64Bit()) {
Chris Lattnerecfe55e2006-03-22 05:30:33 +00001325 if (N->getOperand(0).getOpcode() == ISD::FP_TO_SINT) {
1326 // Turn (sint_to_fp (fp_to_sint X)) -> fctidz/fcfid without load/stores.
1327 // We allow the src/dst to be either f32/f64, but the intermediate
1328 // type must be i64.
1329 if (N->getOperand(0).getValueType() == MVT::i64) {
1330 SDOperand Val = N->getOperand(0).getOperand(0);
1331 if (Val.getValueType() == MVT::f32) {
1332 Val = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Val);
1333 DCI.AddToWorklist(Val.Val);
1334 }
1335
1336 Val = DAG.getNode(PPCISD::FCTIDZ, MVT::f64, Val);
Chris Lattner8c13d0a2006-03-01 04:57:39 +00001337 DCI.AddToWorklist(Val.Val);
Chris Lattnerecfe55e2006-03-22 05:30:33 +00001338 Val = DAG.getNode(PPCISD::FCFID, MVT::f64, Val);
Chris Lattner8c13d0a2006-03-01 04:57:39 +00001339 DCI.AddToWorklist(Val.Val);
Chris Lattnerecfe55e2006-03-22 05:30:33 +00001340 if (N->getValueType(0) == MVT::f32) {
1341 Val = DAG.getNode(ISD::FP_ROUND, MVT::f32, Val);
1342 DCI.AddToWorklist(Val.Val);
1343 }
1344 return Val;
1345 } else if (N->getOperand(0).getValueType() == MVT::i32) {
1346 // If the intermediate type is i32, we can avoid the load/store here
1347 // too.
Chris Lattner8c13d0a2006-03-01 04:57:39 +00001348 }
Chris Lattner8c13d0a2006-03-01 04:57:39 +00001349 }
1350 }
1351 break;
Chris Lattner51269842006-03-01 05:50:56 +00001352 case ISD::STORE:
1353 // Turn STORE (FP_TO_SINT F) -> STFIWX(FCTIWZ(F)).
1354 if (TM.getSubtarget<PPCSubtarget>().hasSTFIWX() &&
1355 N->getOperand(1).getOpcode() == ISD::FP_TO_SINT &&
1356 N->getOperand(1).getValueType() == MVT::i32) {
1357 SDOperand Val = N->getOperand(1).getOperand(0);
1358 if (Val.getValueType() == MVT::f32) {
1359 Val = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Val);
1360 DCI.AddToWorklist(Val.Val);
1361 }
1362 Val = DAG.getNode(PPCISD::FCTIWZ, MVT::f64, Val);
1363 DCI.AddToWorklist(Val.Val);
1364
1365 Val = DAG.getNode(PPCISD::STFIWX, MVT::Other, N->getOperand(0), Val,
1366 N->getOperand(2), N->getOperand(3));
1367 DCI.AddToWorklist(Val.Val);
1368 return Val;
1369 }
1370 break;
Chris Lattner4468c222006-03-31 06:02:07 +00001371 case PPCISD::VCMP: {
1372 // If a VCMPo node already exists with exactly the same operands as this
1373 // node, use its result instead of this node (VCMPo computes both a CR6 and
1374 // a normal output).
1375 //
1376 if (!N->getOperand(0).hasOneUse() &&
1377 !N->getOperand(1).hasOneUse() &&
1378 !N->getOperand(2).hasOneUse()) {
1379
1380 // Scan all of the users of the LHS, looking for VCMPo's that match.
1381 SDNode *VCMPoNode = 0;
1382
1383 SDNode *LHSN = N->getOperand(0).Val;
1384 for (SDNode::use_iterator UI = LHSN->use_begin(), E = LHSN->use_end();
1385 UI != E; ++UI)
1386 if ((*UI)->getOpcode() == PPCISD::VCMPo &&
1387 (*UI)->getOperand(1) == N->getOperand(1) &&
1388 (*UI)->getOperand(2) == N->getOperand(2) &&
1389 (*UI)->getOperand(0) == N->getOperand(0)) {
1390 VCMPoNode = *UI;
1391 break;
1392 }
1393
1394 // If there are non-zero uses of the flag value, use the VCMPo node!
1395 if (!VCMPoNode->hasNUsesOfValue(0, 1))
1396 return SDOperand(VCMPoNode, 0);
1397 }
1398 break;
1399 }
Chris Lattner8c13d0a2006-03-01 04:57:39 +00001400 }
1401
1402 return SDOperand();
1403}
1404
Chris Lattnerad3bc8d2006-02-07 20:16:30 +00001405/// getConstraintType - Given a constraint letter, return the type of
1406/// constraint it is for this target.
1407PPCTargetLowering::ConstraintType
1408PPCTargetLowering::getConstraintType(char ConstraintLetter) const {
1409 switch (ConstraintLetter) {
1410 default: break;
1411 case 'b':
1412 case 'r':
1413 case 'f':
1414 case 'v':
1415 case 'y':
1416 return C_RegisterClass;
1417 }
1418 return TargetLowering::getConstraintType(ConstraintLetter);
1419}
1420
1421
Chris Lattnerddc787d2006-01-31 19:20:21 +00001422std::vector<unsigned> PPCTargetLowering::
Chris Lattner1efa40f2006-02-22 00:56:39 +00001423getRegClassForInlineAsmConstraint(const std::string &Constraint,
1424 MVT::ValueType VT) const {
Chris Lattnerddc787d2006-01-31 19:20:21 +00001425 if (Constraint.size() == 1) {
1426 switch (Constraint[0]) { // GCC RS6000 Constraint Letters
1427 default: break; // Unknown constriant letter
1428 case 'b':
1429 return make_vector<unsigned>(/*no R0*/ PPC::R1 , PPC::R2 , PPC::R3 ,
1430 PPC::R4 , PPC::R5 , PPC::R6 , PPC::R7 ,
1431 PPC::R8 , PPC::R9 , PPC::R10, PPC::R11,
1432 PPC::R12, PPC::R13, PPC::R14, PPC::R15,
1433 PPC::R16, PPC::R17, PPC::R18, PPC::R19,
1434 PPC::R20, PPC::R21, PPC::R22, PPC::R23,
1435 PPC::R24, PPC::R25, PPC::R26, PPC::R27,
1436 PPC::R28, PPC::R29, PPC::R30, PPC::R31,
1437 0);
1438 case 'r':
1439 return make_vector<unsigned>(PPC::R0 , PPC::R1 , PPC::R2 , PPC::R3 ,
1440 PPC::R4 , PPC::R5 , PPC::R6 , PPC::R7 ,
1441 PPC::R8 , PPC::R9 , PPC::R10, PPC::R11,
1442 PPC::R12, PPC::R13, PPC::R14, PPC::R15,
1443 PPC::R16, PPC::R17, PPC::R18, PPC::R19,
1444 PPC::R20, PPC::R21, PPC::R22, PPC::R23,
1445 PPC::R24, PPC::R25, PPC::R26, PPC::R27,
1446 PPC::R28, PPC::R29, PPC::R30, PPC::R31,
1447 0);
1448 case 'f':
1449 return make_vector<unsigned>(PPC::F0 , PPC::F1 , PPC::F2 , PPC::F3 ,
1450 PPC::F4 , PPC::F5 , PPC::F6 , PPC::F7 ,
1451 PPC::F8 , PPC::F9 , PPC::F10, PPC::F11,
1452 PPC::F12, PPC::F13, PPC::F14, PPC::F15,
1453 PPC::F16, PPC::F17, PPC::F18, PPC::F19,
1454 PPC::F20, PPC::F21, PPC::F22, PPC::F23,
1455 PPC::F24, PPC::F25, PPC::F26, PPC::F27,
1456 PPC::F28, PPC::F29, PPC::F30, PPC::F31,
1457 0);
1458 case 'v':
1459 return make_vector<unsigned>(PPC::V0 , PPC::V1 , PPC::V2 , PPC::V3 ,
1460 PPC::V4 , PPC::V5 , PPC::V6 , PPC::V7 ,
1461 PPC::V8 , PPC::V9 , PPC::V10, PPC::V11,
1462 PPC::V12, PPC::V13, PPC::V14, PPC::V15,
1463 PPC::V16, PPC::V17, PPC::V18, PPC::V19,
1464 PPC::V20, PPC::V21, PPC::V22, PPC::V23,
1465 PPC::V24, PPC::V25, PPC::V26, PPC::V27,
1466 PPC::V28, PPC::V29, PPC::V30, PPC::V31,
1467 0);
1468 case 'y':
1469 return make_vector<unsigned>(PPC::CR0, PPC::CR1, PPC::CR2, PPC::CR3,
1470 PPC::CR4, PPC::CR5, PPC::CR6, PPC::CR7,
1471 0);
1472 }
1473 }
1474
Chris Lattner1efa40f2006-02-22 00:56:39 +00001475 return std::vector<unsigned>();
Chris Lattnerddc787d2006-01-31 19:20:21 +00001476}
Chris Lattner763317d2006-02-07 00:47:13 +00001477
1478// isOperandValidForConstraint
1479bool PPCTargetLowering::
1480isOperandValidForConstraint(SDOperand Op, char Letter) {
1481 switch (Letter) {
1482 default: break;
1483 case 'I':
1484 case 'J':
1485 case 'K':
1486 case 'L':
1487 case 'M':
1488 case 'N':
1489 case 'O':
1490 case 'P': {
1491 if (!isa<ConstantSDNode>(Op)) return false; // Must be an immediate.
1492 unsigned Value = cast<ConstantSDNode>(Op)->getValue();
1493 switch (Letter) {
1494 default: assert(0 && "Unknown constraint letter!");
1495 case 'I': // "I" is a signed 16-bit constant.
1496 return (short)Value == (int)Value;
1497 case 'J': // "J" is a constant with only the high-order 16 bits nonzero.
1498 case 'L': // "L" is a signed 16-bit constant shifted left 16 bits.
1499 return (short)Value == 0;
1500 case 'K': // "K" is a constant with only the low-order 16 bits nonzero.
1501 return (Value >> 16) == 0;
1502 case 'M': // "M" is a constant that is greater than 31.
1503 return Value > 31;
1504 case 'N': // "N" is a positive constant that is an exact power of two.
1505 return (int)Value > 0 && isPowerOf2_32(Value);
1506 case 'O': // "O" is the constant zero.
1507 return Value == 0;
1508 case 'P': // "P" is a constant whose negation is a signed 16-bit constant.
1509 return (short)-Value == (int)-Value;
1510 }
1511 break;
1512 }
1513 }
1514
1515 // Handle standard constraint letters.
1516 return TargetLowering::isOperandValidForConstraint(Op, Letter);
1517}
Evan Chengc4c62572006-03-13 23:20:37 +00001518
1519/// isLegalAddressImmediate - Return true if the integer value can be used
1520/// as the offset of the target addressing mode.
1521bool PPCTargetLowering::isLegalAddressImmediate(int64_t V) const {
1522 // PPC allows a sign-extended 16-bit immediate field.
1523 return (V > -(1 << 16) && V < (1 << 16)-1);
1524}